diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" --- "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.498, "train/learning_rate": 2.6438836104513065e-05, "train/epoch": 3.36, "train/global_step": 3000, "_runtime": 19379, "_timestamp": 1646680618, "_step": 3001, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 124.0, 12.0, 12.0, 7.0, 5.0, 28645.0, 1553.0, 70.0, 27.0, 12.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.125, -217.333984375, -209.54296875, -201.751953125, -193.9609375, -186.169921875, -178.37890625, -170.587890625, -162.796875, -155.005859375, -147.21484375, -139.423828125, -131.6328125, -123.841796875, -116.05078125, -108.259765625, -100.46875, -92.677734375, -84.88671875, -77.095703125, -69.3046875, -61.513671875, -53.72265625, -45.931640625, -38.140625, -30.349609375, -22.55859375, -14.767578125, -6.9765625, 0.814453125, 8.60546875, 16.396484375, 24.1875, 31.978515625, 39.76953125, 47.560546875, 55.3515625, 63.142578125, 70.93359375, 78.724609375, 86.515625, 94.306640625, 102.09765625, 109.888671875, 117.6796875, 125.470703125, 133.26171875, 141.052734375, 148.84375, 156.634765625, 164.42578125, 172.216796875, 180.0078125, 187.798828125, 195.58984375, 203.380859375, 211.171875, 218.962890625, 226.75390625, 234.544921875, 242.3359375, 250.126953125, 257.91796875, 265.708984375, 273.5]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 11.0, 9.0, 1.0, 9.0, 4.0, 12.0, 24.0, 17.0, 13.0, 32.0, 24.0, 29.0, 40.0, 42.0, 47.0, 50.0, 56.0, 40.0, 50.0, 46.0, 44.0, 45.0, 26.0, 52.0, 44.0, 32.0, 34.0, 22.0, 32.0, 16.0, 16.0, 12.0, 16.0, 9.0, 8.0, 7.0, 9.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-74.72195434570312, -72.6103286743164, -70.49870300292969, -68.38707733154297, -66.27545166015625, -64.16383361816406, -62.052207946777344, -59.940582275390625, -57.828956604003906, -55.71733093261719, -53.60570526123047, -51.494083404541016, -49.3824577331543, -47.27083206176758, -45.159210205078125, -43.047584533691406, -40.93595886230469, -38.82433319091797, -36.71270751953125, -34.6010856628418, -32.48945999145508, -30.37783432006836, -28.266210556030273, -26.154586791992188, -24.04296112060547, -21.93133544921875, -19.819711685180664, -17.708087921142578, -15.59646224975586, -13.484837532043457, -11.373212814331055, -9.261588096618652, -7.14996337890625, -5.038338661193848, -2.9267139434814453, -0.815089225769043, 1.2965354919433594, 3.4081602096557617, 5.519784927368164, 7.631409645080566, 9.743034362792969, 11.854659080505371, 13.966283798217773, 16.07790756225586, 18.189533233642578, 20.301158905029297, 22.412782669067383, 24.52440643310547, 26.636032104492188, 28.747657775878906, 30.859281539916992, 32.97090530395508, 35.0825309753418, 37.194156646728516, 39.30577850341797, 41.41740417480469, 43.529029846191406, 45.640655517578125, 47.752281188964844, 49.8639030456543, 51.975528717041016, 54.087154388427734, 56.19877624511719, 58.310401916503906, 60.422027587890625]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 4.0, 8.0, 14.0, 14.0, 17.0, 13.0, 20.0, 21.0, 25.0, 28.0, 35.0, 37.0, 35.0, 33.0, 39.0, 33.0, 36.0, 60.0, 42.0, 47.0, 54.0, 44.0, 41.0, 38.0, 34.0, 24.0, 29.0, 28.0, 27.0, 23.0, 14.0, 17.0, 17.0, 11.0, 7.0, 6.0, 2.0, 10.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-61.42485427856445, -59.36589431762695, -57.30693054199219, -55.24797058105469, -53.18901062011719, -51.13005065917969, -49.07108688354492, -47.01212692260742, -44.953163146972656, -42.894203186035156, -40.83523941040039, -38.77627944946289, -36.71731948852539, -34.658355712890625, -32.599395751953125, -30.540435791015625, -28.481475830078125, -26.422513961791992, -24.363554000854492, -22.30459213256836, -20.24563217163086, -18.186670303344727, -16.127708435058594, -14.068747520446777, -12.009786605834961, -9.950825691223145, -7.89186429977417, -5.832902908325195, -3.773941993713379, -1.7149810791015625, 0.3439807891845703, 2.4029417037963867, 4.461906433105469, 6.520867347717285, 8.579828262329102, 10.638790130615234, 12.69775104522705, 14.756711959838867, 16.815673828125, 18.8746337890625, 20.933595657348633, 22.992557525634766, 25.051517486572266, 27.1104793548584, 29.16944122314453, 31.22840118408203, 33.28736114501953, 35.3463249206543, 37.4052848815918, 39.4642448425293, 41.52320861816406, 43.58216857910156, 45.64112854003906, 47.70008850097656, 49.75905227661133, 51.81801223754883, 53.876976013183594, 55.935935974121094, 57.99489974975586, 60.05385971069336, 62.11281967163086, 64.17178344726562, 66.23074340820312, 68.28970336914062, 70.34866333007812]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 7.0, 12.0, 23.0, 31.0, 39.0, 61.0, 100.0, 186.0, 268.0, 417.0, 702.0, 1103.0, 1823.0, 2903.0, 4755.0, 7737.0, 12414.0, 19372.0, 29772.0, 45294.0, 66337.0, 94783.0, 138869.0, 200950.0, 136304.0, 94272.0, 65514.0, 44389.0, 29154.0, 18957.0, 12150.0, 7644.0, 4765.0, 2831.0, 1848.0, 1074.0, 649.0, 400.0, 246.0, 148.0, 98.0, 61.0, 35.0, 27.0, 11.0, 12.0, 2.0, 7.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-185.25, -179.716796875, -174.18359375, -168.650390625, -163.1171875, -157.583984375, -152.05078125, -146.517578125, -140.984375, -135.451171875, -129.91796875, -124.384765625, -118.8515625, -113.318359375, -107.78515625, -102.251953125, -96.71875, -91.185546875, -85.65234375, -80.119140625, -74.5859375, -69.052734375, -63.51953125, -57.986328125, -52.453125, -46.919921875, -41.38671875, -35.853515625, -30.3203125, -24.787109375, -19.25390625, -13.720703125, -8.1875, -2.654296875, 2.87890625, 8.412109375, 13.9453125, 19.478515625, 25.01171875, 30.544921875, 36.078125, 41.611328125, 47.14453125, 52.677734375, 58.2109375, 63.744140625, 69.27734375, 74.810546875, 80.34375, 85.876953125, 91.41015625, 96.943359375, 102.4765625, 108.009765625, 113.54296875, 119.076171875, 124.609375, 130.142578125, 135.67578125, 141.208984375, 146.7421875, 152.275390625, 157.80859375, 163.341796875, 168.875]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 8.0, 4.0, 10.0, 8.0, 8.0, 12.0, 20.0, 24.0, 36.0, 25.0, 27.0, 47.0, 45.0, 49.0, 50.0, 71.0, 84.0, 80.0, 55.0, 46.0, 41.0, 37.0, 30.0, 34.0, 20.0, 26.0, 13.0, 13.0, 10.0, 13.0, 15.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-70.875, -68.412109375, -65.94921875, -63.486328125, -61.0234375, -58.560546875, -56.09765625, -53.634765625, -51.171875, -48.708984375, -46.24609375, -43.783203125, -41.3203125, -38.857421875, -36.39453125, -33.931640625, -31.46875, -29.005859375, -26.54296875, -24.080078125, -21.6171875, -19.154296875, -16.69140625, -14.228515625, -11.765625, -9.302734375, -6.83984375, -4.376953125, -1.9140625, 0.548828125, 3.01171875, 5.474609375, 7.9375, 10.400390625, 12.86328125, 15.326171875, 17.7890625, 20.251953125, 22.71484375, 25.177734375, 27.640625, 30.103515625, 32.56640625, 35.029296875, 37.4921875, 39.955078125, 42.41796875, 44.880859375, 47.34375, 49.806640625, 52.26953125, 54.732421875, 57.1953125, 59.658203125, 62.12109375, 64.583984375, 67.046875, 69.509765625, 71.97265625, 74.435546875, 76.8984375, 79.361328125, 81.82421875, 84.287109375, 86.75]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 8.0, 6.0, 7.0, 10.0, 12.0, 14.0, 18.0, 22.0, 23.0, 29.0, 37.0, 42.0, 47.0, 47.0, 54.0, 46.0, 43.0, 35.0, 55.0, 41.0, 46.0, 30.0, 47.0, 47.0, 39.0, 22.0, 36.0, 27.0, 19.0, 14.0, 10.0, 11.0, 11.0, 10.0, 7.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-44.54986572265625, -43.15780258178711, -41.76573944091797, -40.37367630004883, -38.98161315917969, -37.58955001831055, -36.197486877441406, -34.805419921875, -33.413360595703125, -32.021297454833984, -30.629234313964844, -29.237171173095703, -27.845108032226562, -26.453044891357422, -25.06097984313965, -23.668916702270508, -22.276851654052734, -20.884788513183594, -19.492725372314453, -18.100662231445312, -16.708599090576172, -15.316534996032715, -13.924470901489258, -12.532407760620117, -11.140344619750977, -9.748281478881836, -8.356218338012695, -6.964154243469238, -5.572091102600098, -4.180027961730957, -2.7879638671875, -1.3959007263183594, -0.003841400146484375, 1.3882219791412354, 2.780285358428955, 4.172348976135254, 5.5644121170043945, 6.956475257873535, 8.348539352416992, 9.740602493286133, 11.132665634155273, 12.524728775024414, 13.916791915893555, 15.308856010437012, 16.70092010498047, 18.09298324584961, 19.48504638671875, 20.87710952758789, 22.26917266845703, 23.661235809326172, 25.053298950195312, 26.445362091064453, 27.837425231933594, 29.229488372802734, 30.621553421020508, 32.01361846923828, 33.405677795410156, 34.7977409362793, 36.18980407714844, 37.58186721801758, 38.97393035888672, 40.36599349975586, 41.758056640625, 43.150123596191406, 44.54218673706055]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 5.0, 7.0, 9.0, 12.0, 11.0, 15.0, 8.0, 17.0, 23.0, 16.0, 29.0, 28.0, 26.0, 34.0, 38.0, 28.0, 51.0, 37.0, 45.0, 50.0, 37.0, 40.0, 41.0, 28.0, 37.0, 40.0, 41.0, 35.0, 24.0, 25.0, 17.0, 14.0, 24.0, 34.0, 12.0, 11.0, 13.0, 11.0, 6.0, 6.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-43.415096282958984, -42.046897888183594, -40.67869567871094, -39.31049728393555, -37.942298889160156, -36.574100494384766, -35.20589828491211, -33.83769989013672, -32.46950149536133, -31.101301193237305, -29.733102798461914, -28.36490249633789, -26.9967041015625, -25.628503799438477, -24.260303497314453, -22.892105102539062, -21.52390480041504, -20.155704498291016, -18.787506103515625, -17.4193058013916, -16.05110740661621, -14.682907104492188, -13.31470775604248, -11.946508407592773, -10.578309059143066, -9.21010971069336, -7.841910362243652, -6.473710536956787, -5.10551118850708, -3.737311840057373, -2.369112014770508, -1.0009126663208008, 0.36728668212890625, 1.7354861497879028, 3.1036856174468994, 4.4718852043151855, 5.840084552764893, 7.2082839012146, 8.576483726501465, 9.944683074951172, 11.312882423400879, 12.681081771850586, 14.049281120300293, 15.41748046875, 16.785680770874023, 18.153879165649414, 19.522079467773438, 20.890277862548828, 22.25847816467285, 23.626678466796875, 24.994876861572266, 26.36307716369629, 27.73127555847168, 29.099475860595703, 30.467674255371094, 31.835874557495117, 33.20407485961914, 34.57227325439453, 35.94047546386719, 37.30867385864258, 38.67687225341797, 40.04507064819336, 41.413272857666016, 42.781471252441406, 44.1496696472168]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 17.0, 25.0, 31.0, 51.0, 112.0, 142.0, 267.0, 413.0, 753.0, 1419.0, 2574.0, 4965.0, 9317.0, 18299.0, 36227.0, 75341.0, 161111.0, 349709.0, 684125.0, 987716.0, 879756.0, 511220.0, 244412.0, 113880.0, 54964.0, 27328.0, 14056.0, 7163.0, 3895.0, 2155.0, 1201.0, 686.0, 366.0, 227.0, 144.0, 77.0, 44.0, 41.0, 15.0, 13.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.125, -41.7236328125, -40.322265625, -38.9208984375, -37.51953125, -36.1181640625, -34.716796875, -33.3154296875, -31.9140625, -30.5126953125, -29.111328125, -27.7099609375, -26.30859375, -24.9072265625, -23.505859375, -22.1044921875, -20.703125, -19.3017578125, -17.900390625, -16.4990234375, -15.09765625, -13.6962890625, -12.294921875, -10.8935546875, -9.4921875, -8.0908203125, -6.689453125, -5.2880859375, -3.88671875, -2.4853515625, -1.083984375, 0.3173828125, 1.71875, 3.1201171875, 4.521484375, 5.9228515625, 7.32421875, 8.7255859375, 10.126953125, 11.5283203125, 12.9296875, 14.3310546875, 15.732421875, 17.1337890625, 18.53515625, 19.9365234375, 21.337890625, 22.7392578125, 24.140625, 25.5419921875, 26.943359375, 28.3447265625, 29.74609375, 31.1474609375, 32.548828125, 33.9501953125, 35.3515625, 36.7529296875, 38.154296875, 39.5556640625, 40.95703125, 42.3583984375, 43.759765625, 45.1611328125, 46.5625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 5.0, 9.0, 6.0, 12.0, 7.0, 12.0, 18.0, 18.0, 16.0, 21.0, 20.0, 35.0, 36.0, 36.0, 37.0, 57.0, 41.0, 38.0, 43.0, 29.0, 42.0, 37.0, 38.0, 42.0, 36.0, 32.0, 30.0, 32.0, 18.0, 23.0, 27.0, 27.0, 26.0, 14.0, 11.0, 11.0, 12.0, 11.0, 4.0, 8.0, 7.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.359375, -29.343505859375, -28.32763671875, -27.311767578125, -26.2958984375, -25.280029296875, -24.26416015625, -23.248291015625, -22.232421875, -21.216552734375, -20.20068359375, -19.184814453125, -18.1689453125, -17.153076171875, -16.13720703125, -15.121337890625, -14.10546875, -13.089599609375, -12.07373046875, -11.057861328125, -10.0419921875, -9.026123046875, -8.01025390625, -6.994384765625, -5.978515625, -4.962646484375, -3.94677734375, -2.930908203125, -1.9150390625, -0.899169921875, 0.11669921875, 1.132568359375, 2.1484375, 3.164306640625, 4.18017578125, 5.196044921875, 6.2119140625, 7.227783203125, 8.24365234375, 9.259521484375, 10.275390625, 11.291259765625, 12.30712890625, 13.322998046875, 14.3388671875, 15.354736328125, 16.37060546875, 17.386474609375, 18.40234375, 19.418212890625, 20.43408203125, 21.449951171875, 22.4658203125, 23.481689453125, 24.49755859375, 25.513427734375, 26.529296875, 27.545166015625, 28.56103515625, 29.576904296875, 30.5927734375, 31.608642578125, 32.62451171875, 33.640380859375, 34.65625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 15.0, 27.0, 42.0, 58.0, 90.0, 145.0, 250.0, 365.0, 541.0, 839.0, 1339.0, 1925.0, 3059.0, 4894.0, 7612.0, 12396.0, 19727.0, 31819.0, 51473.0, 82860.0, 134808.0, 212573.0, 327342.0, 476793.0, 621866.0, 648228.0, 526715.0, 370826.0, 245139.0, 155888.0, 96832.0, 60241.0, 36699.0, 22775.0, 14032.0, 8736.0, 5455.0, 3538.0, 2200.0, 1399.0, 942.0, 617.0, 413.0, 256.0, 187.0, 113.0, 75.0, 48.0, 33.0, 11.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-30.75, -29.793701171875, -28.83740234375, -27.881103515625, -26.9248046875, -25.968505859375, -25.01220703125, -24.055908203125, -23.099609375, -22.143310546875, -21.18701171875, -20.230712890625, -19.2744140625, -18.318115234375, -17.36181640625, -16.405517578125, -15.44921875, -14.492919921875, -13.53662109375, -12.580322265625, -11.6240234375, -10.667724609375, -9.71142578125, -8.755126953125, -7.798828125, -6.842529296875, -5.88623046875, -4.929931640625, -3.9736328125, -3.017333984375, -2.06103515625, -1.104736328125, -0.1484375, 0.807861328125, 1.76416015625, 2.720458984375, 3.6767578125, 4.633056640625, 5.58935546875, 6.545654296875, 7.501953125, 8.458251953125, 9.41455078125, 10.370849609375, 11.3271484375, 12.283447265625, 13.23974609375, 14.196044921875, 15.15234375, 16.108642578125, 17.06494140625, 18.021240234375, 18.9775390625, 19.933837890625, 20.89013671875, 21.846435546875, 22.802734375, 23.759033203125, 24.71533203125, 25.671630859375, 26.6279296875, 27.584228515625, 28.54052734375, 29.496826171875, 30.453125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 10.0, 7.0, 14.0, 14.0, 16.0, 22.0, 37.0, 57.0, 72.0, 72.0, 90.0, 127.0, 154.0, 202.0, 226.0, 257.0, 278.0, 295.0, 286.0, 294.0, 279.0, 241.0, 191.0, 165.0, 120.0, 128.0, 92.0, 64.0, 47.0, 44.0, 40.0, 16.0, 30.0, 26.0, 10.0, 11.0, 8.0, 8.0, 11.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.36474609375, -13.8544921875, -13.34423828125, -12.833984375, -12.32373046875, -11.8134765625, -11.30322265625, -10.79296875, -10.28271484375, -9.7724609375, -9.26220703125, -8.751953125, -8.24169921875, -7.7314453125, -7.22119140625, -6.7109375, -6.20068359375, -5.6904296875, -5.18017578125, -4.669921875, -4.15966796875, -3.6494140625, -3.13916015625, -2.62890625, -2.11865234375, -1.6083984375, -1.09814453125, -0.587890625, -0.07763671875, 0.4326171875, 0.94287109375, 1.453125, 1.96337890625, 2.4736328125, 2.98388671875, 3.494140625, 4.00439453125, 4.5146484375, 5.02490234375, 5.53515625, 6.04541015625, 6.5556640625, 7.06591796875, 7.576171875, 8.08642578125, 8.5966796875, 9.10693359375, 9.6171875, 10.12744140625, 10.6376953125, 11.14794921875, 11.658203125, 12.16845703125, 12.6787109375, 13.18896484375, 13.69921875, 14.20947265625, 14.7197265625, 15.22998046875, 15.740234375, 16.25048828125, 16.7607421875, 17.27099609375, 17.78125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 4.0, 9.0, 3.0, 7.0, 16.0, 14.0, 13.0, 22.0, 16.0, 24.0, 38.0, 40.0, 37.0, 52.0, 51.0, 51.0, 63.0, 45.0, 44.0, 40.0, 51.0, 56.0, 40.0, 33.0, 37.0, 29.0, 25.0, 25.0, 18.0, 17.0, 12.0, 10.0, 7.0, 7.0, 6.0, 5.0, 4.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.79423522949219, -33.62215805053711, -32.4500846862793, -31.27800941467285, -30.105934143066406, -28.933856964111328, -27.761781692504883, -26.589706420898438, -25.417631149291992, -24.245555877685547, -23.0734806060791, -21.901405334472656, -20.729328155517578, -19.557254791259766, -18.385177612304688, -17.213102340698242, -16.041027069091797, -14.868951797485352, -13.696876525878906, -12.524800300598145, -11.3527250289917, -10.180649757385254, -9.008573532104492, -7.836498260498047, -6.664422988891602, -5.492347717285156, -4.320271968841553, -3.1481964588165283, -1.976120948791504, -0.8040456771850586, 0.3680300712585449, 1.5401058197021484, 2.7121810913085938, 3.884256601333618, 5.056332111358643, 6.228407859802246, 7.400483131408691, 8.572558403015137, 9.744634628295898, 10.916709899902344, 12.088785171508789, 13.260860443115234, 14.43293571472168, 15.605011940002441, 16.777088165283203, 17.949161529541016, 19.121238708496094, 20.29331398010254, 21.465389251708984, 22.63746452331543, 23.809539794921875, 24.98161506652832, 26.153690338134766, 27.325767517089844, 28.49784278869629, 29.669918060302734, 30.84199333190918, 32.014068603515625, 33.1861457824707, 34.358219146728516, 35.530296325683594, 36.702369689941406, 37.874446868896484, 39.04652404785156, 40.218597412109375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 9.0, 11.0, 8.0, 16.0, 20.0, 21.0, 24.0, 13.0, 28.0, 27.0, 30.0, 34.0, 35.0, 37.0, 39.0, 34.0, 34.0, 40.0, 33.0, 51.0, 38.0, 44.0, 31.0, 34.0, 24.0, 33.0, 25.0, 33.0, 23.0, 25.0, 19.0, 15.0, 12.0, 12.0, 18.0, 10.0, 8.0, 7.0, 8.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-39.64094161987305, -38.548095703125, -37.45524978637695, -36.362403869628906, -35.269561767578125, -34.17671585083008, -33.08386993408203, -31.991024017333984, -30.898178100585938, -29.80533218383789, -28.712486267089844, -27.61964225769043, -26.526796340942383, -25.433950424194336, -24.341106414794922, -23.248260498046875, -22.155414581298828, -21.06256866455078, -19.969722747802734, -18.87687873840332, -17.784032821655273, -16.691186904907227, -15.598341941833496, -14.505496978759766, -13.412651062011719, -12.319805145263672, -11.226960182189941, -10.134115219116211, -9.041269302368164, -7.948423862457275, -6.855578422546387, -5.762732982635498, -4.669885635375977, -3.577040195465088, -2.484194755554199, -1.3913493156433105, -0.2985038757324219, 0.7943415641784668, 1.8871870040893555, 2.980032444000244, 4.072877883911133, 5.1657233238220215, 6.25856876373291, 7.351414203643799, 8.444259643554688, 9.537105560302734, 10.629950523376465, 11.722795486450195, 12.815641403198242, 13.908487319946289, 15.00133228302002, 16.09417724609375, 17.187023162841797, 18.279869079589844, 19.37271499633789, 20.465559005737305, 21.55840492248535, 22.6512508392334, 23.744094848632812, 24.83694076538086, 25.929786682128906, 27.022632598876953, 28.115478515625, 29.208322525024414, 30.30116844177246]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 1.0, 3.0, 6.0, 7.0, 12.0, 13.0, 13.0, 19.0, 33.0, 47.0, 63.0, 92.0, 122.0, 165.0, 264.0, 360.0, 563.0, 857.0, 1458.0, 2246.0, 4020.0, 6803.0, 12902.0, 25905.0, 53552.0, 114514.0, 227500.0, 277057.0, 164118.0, 78238.0, 37121.0, 18122.0, 9441.0, 4997.0, 2880.0, 1683.0, 1136.0, 711.0, 497.0, 290.0, 226.0, 139.0, 115.0, 67.0, 56.0, 44.0, 21.0, 17.0, 10.0, 7.0, 12.0, 10.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-38.875, -37.630859375, -36.38671875, -35.142578125, -33.8984375, -32.654296875, -31.41015625, -30.166015625, -28.921875, -27.677734375, -26.43359375, -25.189453125, -23.9453125, -22.701171875, -21.45703125, -20.212890625, -18.96875, -17.724609375, -16.48046875, -15.236328125, -13.9921875, -12.748046875, -11.50390625, -10.259765625, -9.015625, -7.771484375, -6.52734375, -5.283203125, -4.0390625, -2.794921875, -1.55078125, -0.306640625, 0.9375, 2.181640625, 3.42578125, 4.669921875, 5.9140625, 7.158203125, 8.40234375, 9.646484375, 10.890625, 12.134765625, 13.37890625, 14.623046875, 15.8671875, 17.111328125, 18.35546875, 19.599609375, 20.84375, 22.087890625, 23.33203125, 24.576171875, 25.8203125, 27.064453125, 28.30859375, 29.552734375, 30.796875, 32.041015625, 33.28515625, 34.529296875, 35.7734375, 37.017578125, 38.26171875, 39.505859375, 40.75]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 7.0, 6.0, 4.0, 9.0, 10.0, 6.0, 13.0, 21.0, 8.0, 25.0, 11.0, 24.0, 23.0, 35.0, 32.0, 35.0, 32.0, 31.0, 31.0, 35.0, 33.0, 34.0, 49.0, 49.0, 29.0, 32.0, 27.0, 42.0, 33.0, 36.0, 28.0, 34.0, 22.0, 24.0, 19.0, 13.0, 10.0, 14.0, 12.0, 15.0, 19.0, 4.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0], "bins": [-36.75, -35.7392578125, -34.728515625, -33.7177734375, -32.70703125, -31.6962890625, -30.685546875, -29.6748046875, -28.6640625, -27.6533203125, -26.642578125, -25.6318359375, -24.62109375, -23.6103515625, -22.599609375, -21.5888671875, -20.578125, -19.5673828125, -18.556640625, -17.5458984375, -16.53515625, -15.5244140625, -14.513671875, -13.5029296875, -12.4921875, -11.4814453125, -10.470703125, -9.4599609375, -8.44921875, -7.4384765625, -6.427734375, -5.4169921875, -4.40625, -3.3955078125, -2.384765625, -1.3740234375, -0.36328125, 0.6474609375, 1.658203125, 2.6689453125, 3.6796875, 4.6904296875, 5.701171875, 6.7119140625, 7.72265625, 8.7333984375, 9.744140625, 10.7548828125, 11.765625, 12.7763671875, 13.787109375, 14.7978515625, 15.80859375, 16.8193359375, 17.830078125, 18.8408203125, 19.8515625, 20.8623046875, 21.873046875, 22.8837890625, 23.89453125, 24.9052734375, 25.916015625, 26.9267578125, 27.9375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 15.0, 24.0, 39.0, 45.0, 54.0, 78.0, 146.0, 226.0, 429.0, 685.0, 1519.0, 3379.0, 8466.0, 24909.0, 87692.0, 338566.0, 416545.0, 115519.0, 31894.0, 10490.0, 3934.0, 1772.0, 910.0, 451.0, 247.0, 160.0, 135.0, 65.0, 47.0, 25.0, 16.0, 10.0, 10.0, 12.0, 10.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.4375, -39.09423828125, -37.7509765625, -36.40771484375, -35.064453125, -33.72119140625, -32.3779296875, -31.03466796875, -29.69140625, -28.34814453125, -27.0048828125, -25.66162109375, -24.318359375, -22.97509765625, -21.6318359375, -20.28857421875, -18.9453125, -17.60205078125, -16.2587890625, -14.91552734375, -13.572265625, -12.22900390625, -10.8857421875, -9.54248046875, -8.19921875, -6.85595703125, -5.5126953125, -4.16943359375, -2.826171875, -1.48291015625, -0.1396484375, 1.20361328125, 2.546875, 3.89013671875, 5.2333984375, 6.57666015625, 7.919921875, 9.26318359375, 10.6064453125, 11.94970703125, 13.29296875, 14.63623046875, 15.9794921875, 17.32275390625, 18.666015625, 20.00927734375, 21.3525390625, 22.69580078125, 24.0390625, 25.38232421875, 26.7255859375, 28.06884765625, 29.412109375, 30.75537109375, 32.0986328125, 33.44189453125, 34.78515625, 36.12841796875, 37.4716796875, 38.81494140625, 40.158203125, 41.50146484375, 42.8447265625, 44.18798828125, 45.53125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 6.0, 10.0, 12.0, 10.0, 11.0, 11.0, 12.0, 19.0, 24.0, 23.0, 34.0, 31.0, 24.0, 31.0, 38.0, 43.0, 37.0, 54.0, 52.0, 36.0, 31.0, 41.0, 43.0, 42.0, 37.0, 40.0, 30.0, 22.0, 26.0, 30.0, 22.0, 23.0, 18.0, 10.0, 12.0, 10.0, 6.0, 8.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.328125, -23.532958984375, -22.73779296875, -21.942626953125, -21.1474609375, -20.352294921875, -19.55712890625, -18.761962890625, -17.966796875, -17.171630859375, -16.37646484375, -15.581298828125, -14.7861328125, -13.990966796875, -13.19580078125, -12.400634765625, -11.60546875, -10.810302734375, -10.01513671875, -9.219970703125, -8.4248046875, -7.629638671875, -6.83447265625, -6.039306640625, -5.244140625, -4.448974609375, -3.65380859375, -2.858642578125, -2.0634765625, -1.268310546875, -0.47314453125, 0.322021484375, 1.1171875, 1.912353515625, 2.70751953125, 3.502685546875, 4.2978515625, 5.093017578125, 5.88818359375, 6.683349609375, 7.478515625, 8.273681640625, 9.06884765625, 9.864013671875, 10.6591796875, 11.454345703125, 12.24951171875, 13.044677734375, 13.83984375, 14.635009765625, 15.43017578125, 16.225341796875, 17.0205078125, 17.815673828125, 18.61083984375, 19.406005859375, 20.201171875, 20.996337890625, 21.79150390625, 22.586669921875, 23.3818359375, 24.177001953125, 24.97216796875, 25.767333984375, 26.5625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 2.0, 6.0, 10.0, 16.0, 15.0, 28.0, 34.0, 52.0, 67.0, 122.0, 165.0, 282.0, 507.0, 1102.0, 2738.0, 9405.0, 114056.0, 889558.0, 22260.0, 4865.0, 1593.0, 708.0, 357.0, 207.0, 135.0, 73.0, 60.0, 32.0, 25.0, 26.0, 12.0, 7.0, 5.0, 14.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-93.8125, -90.8095703125, -87.806640625, -84.8037109375, -81.80078125, -78.7978515625, -75.794921875, -72.7919921875, -69.7890625, -66.7861328125, -63.783203125, -60.7802734375, -57.77734375, -54.7744140625, -51.771484375, -48.7685546875, -45.765625, -42.7626953125, -39.759765625, -36.7568359375, -33.75390625, -30.7509765625, -27.748046875, -24.7451171875, -21.7421875, -18.7392578125, -15.736328125, -12.7333984375, -9.73046875, -6.7275390625, -3.724609375, -0.7216796875, 2.28125, 5.2841796875, 8.287109375, 11.2900390625, 14.29296875, 17.2958984375, 20.298828125, 23.3017578125, 26.3046875, 29.3076171875, 32.310546875, 35.3134765625, 38.31640625, 41.3193359375, 44.322265625, 47.3251953125, 50.328125, 53.3310546875, 56.333984375, 59.3369140625, 62.33984375, 65.3427734375, 68.345703125, 71.3486328125, 74.3515625, 77.3544921875, 80.357421875, 83.3603515625, 86.36328125, 89.3662109375, 92.369140625, 95.3720703125, 98.375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 7.0, 7.0, 10.0, 9.0, 14.0, 18.0, 42.0, 97.0, 225.0, 242.0, 140.0, 70.0, 32.0, 19.0, 11.0, 4.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003589630126953125, -0.0034744441509246826, -0.0033592581748962402, -0.003244072198867798, -0.0031288862228393555, -0.003013700246810913, -0.0028985142707824707, -0.0027833282947540283, -0.002668142318725586, -0.0025529563426971436, -0.002437770366668701, -0.002322584390640259, -0.0022073984146118164, -0.002092212438583374, -0.0019770264625549316, -0.0018618404865264893, -0.0017466545104980469, -0.0016314685344696045, -0.0015162825584411621, -0.0014010965824127197, -0.0012859106063842773, -0.001170724630355835, -0.0010555386543273926, -0.0009403526782989502, -0.0008251667022705078, -0.0007099807262420654, -0.000594794750213623, -0.00047960877418518066, -0.0003644227981567383, -0.0002492368221282959, -0.00013405084609985352, -1.8864870071411133e-05, 9.632110595703125e-05, 0.00021150708198547363, 0.000326693058013916, 0.0004418790340423584, 0.0005570650100708008, 0.0006722509860992432, 0.0007874369621276855, 0.0009026229381561279, 0.0010178089141845703, 0.0011329948902130127, 0.001248180866241455, 0.0013633668422698975, 0.0014785528182983398, 0.0015937387943267822, 0.0017089247703552246, 0.001824110746383667, 0.0019392967224121094, 0.0020544826984405518, 0.002169668674468994, 0.0022848546504974365, 0.002400040626525879, 0.0025152266025543213, 0.0026304125785827637, 0.002745598554611206, 0.0028607845306396484, 0.002975970506668091, 0.003091156482696533, 0.0032063424587249756, 0.003321528434753418, 0.0034367144107818604, 0.0035519003868103027, 0.003667086362838745, 0.0037822723388671875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 3.0, 10.0, 12.0, 22.0, 21.0, 27.0, 34.0, 52.0, 68.0, 97.0, 97.0, 122.0, 172.0, 245.0, 332.0, 428.0, 637.0, 878.0, 1294.0, 2066.0, 3243.0, 5726.0, 12143.0, 42005.0, 266668.0, 577087.0, 94520.0, 20499.0, 7846.0, 4163.0, 2509.0, 1702.0, 1094.0, 755.0, 484.0, 395.0, 262.0, 200.0, 162.0, 110.0, 78.0, 68.0, 51.0, 49.0, 28.0, 23.0, 19.0, 11.0, 16.0, 8.0, 4.0, 6.0, 2.0, 6.0, 1.0, 2.0], "bins": [-47.78125, -46.34375, -44.90625, -43.46875, -42.03125, -40.59375, -39.15625, -37.71875, -36.28125, -34.84375, -33.40625, -31.96875, -30.53125, -29.09375, -27.65625, -26.21875, -24.78125, -23.34375, -21.90625, -20.46875, -19.03125, -17.59375, -16.15625, -14.71875, -13.28125, -11.84375, -10.40625, -8.96875, -7.53125, -6.09375, -4.65625, -3.21875, -1.78125, -0.34375, 1.09375, 2.53125, 3.96875, 5.40625, 6.84375, 8.28125, 9.71875, 11.15625, 12.59375, 14.03125, 15.46875, 16.90625, 18.34375, 19.78125, 21.21875, 22.65625, 24.09375, 25.53125, 26.96875, 28.40625, 29.84375, 31.28125, 32.71875, 34.15625, 35.59375, 37.03125, 38.46875, 39.90625, 41.34375, 42.78125, 44.21875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 7.0, 5.0, 6.0, 15.0, 18.0, 32.0, 50.0, 107.0, 215.0, 258.0, 125.0, 51.0, 53.0, 22.0, 13.0, 7.0, 2.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.953125, -17.3955078125, -16.837890625, -16.2802734375, -15.72265625, -15.1650390625, -14.607421875, -14.0498046875, -13.4921875, -12.9345703125, -12.376953125, -11.8193359375, -11.26171875, -10.7041015625, -10.146484375, -9.5888671875, -9.03125, -8.4736328125, -7.916015625, -7.3583984375, -6.80078125, -6.2431640625, -5.685546875, -5.1279296875, -4.5703125, -4.0126953125, -3.455078125, -2.8974609375, -2.33984375, -1.7822265625, -1.224609375, -0.6669921875, -0.109375, 0.4482421875, 1.005859375, 1.5634765625, 2.12109375, 2.6787109375, 3.236328125, 3.7939453125, 4.3515625, 4.9091796875, 5.466796875, 6.0244140625, 6.58203125, 7.1396484375, 7.697265625, 8.2548828125, 8.8125, 9.3701171875, 9.927734375, 10.4853515625, 11.04296875, 11.6005859375, 12.158203125, 12.7158203125, 13.2734375, 13.8310546875, 14.388671875, 14.9462890625, 15.50390625, 16.0615234375, 16.619140625, 17.1767578125, 17.734375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 3.0, 4.0, 8.0, 7.0, 10.0, 11.0, 15.0, 15.0, 23.0, 34.0, 30.0, 53.0, 42.0, 51.0, 55.0, 53.0, 54.0, 45.0, 56.0, 58.0, 36.0, 53.0, 43.0, 33.0, 41.0, 27.0, 18.0, 20.0, 15.0, 14.0, 12.0, 15.0, 9.0, 6.0, 7.0, 4.0, 2.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.55209732055664, -36.39091110229492, -35.2297248840332, -34.068538665771484, -32.907352447509766, -31.746166229248047, -30.584980010986328, -29.42379379272461, -28.26260757446289, -27.101421356201172, -25.940235137939453, -24.779048919677734, -23.617862701416016, -22.456676483154297, -21.295490264892578, -20.13430404663086, -18.973115921020508, -17.81192970275879, -16.65074348449707, -15.489557266235352, -14.328371047973633, -13.167184829711914, -12.005997657775879, -10.84481143951416, -9.683625221252441, -8.522439002990723, -7.361252784729004, -6.200066089630127, -5.038879871368408, -3.8776936531066895, -2.7165069580078125, -1.5553207397460938, -0.394134521484375, 0.7670518159866333, 1.9282381534576416, 3.0894246101379395, 4.250610828399658, 5.411797046661377, 6.572983741760254, 7.734169960021973, 8.895356178283691, 10.05654239654541, 11.217728614807129, 12.378915786743164, 13.540102005004883, 14.701288223266602, 15.86247444152832, 17.02366065979004, 18.184846878051758, 19.346033096313477, 20.507219314575195, 21.668405532836914, 22.829591751098633, 23.99077796936035, 25.151966094970703, 26.313152313232422, 27.47433853149414, 28.63552474975586, 29.796710968017578, 30.957897186279297, 32.119083404541016, 33.280269622802734, 34.44145584106445, 35.60264205932617, 36.76382827758789]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 5.0, 4.0, 3.0, 8.0, 11.0, 6.0, 21.0, 11.0, 13.0, 20.0, 17.0, 16.0, 25.0, 29.0, 23.0, 36.0, 42.0, 28.0, 40.0, 28.0, 44.0, 37.0, 37.0, 37.0, 31.0, 43.0, 35.0, 27.0, 38.0, 32.0, 26.0, 31.0, 23.0, 24.0, 24.0, 20.0, 13.0, 15.0, 12.0, 8.0, 18.0, 14.0, 6.0, 3.0, 6.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-34.88758850097656, -33.88644790649414, -32.88530731201172, -31.88416862487793, -30.88302993774414, -29.88188934326172, -28.880748748779297, -27.879608154296875, -26.878469467163086, -25.877328872680664, -24.876190185546875, -23.875049591064453, -22.87390899658203, -21.872770309448242, -20.87162971496582, -19.87049102783203, -18.86935043334961, -17.868209838867188, -16.8670711517334, -15.865930557250977, -14.864790916442871, -13.863651275634766, -12.862510681152344, -11.861371040344238, -10.860231399536133, -9.859091758728027, -8.857952117919922, -7.8568115234375, -6.8556718826293945, -5.854532241821289, -4.853392124176025, -3.8522520065307617, -2.8511085510253906, -1.849968671798706, -0.8488287925720215, 0.15231108665466309, 1.1534509658813477, 2.154590606689453, 3.155730724334717, 4.1568708419799805, 5.158010482788086, 6.159150123596191, 7.160290241241455, 8.161430358886719, 9.162569999694824, 10.16370964050293, 11.164850234985352, 12.165989875793457, 13.167129516601562, 14.168269157409668, 15.169408798217773, 16.170549392700195, 17.171688079833984, 18.172828674316406, 19.173969268798828, 20.17510986328125, 21.17624855041504, 22.17738914489746, 23.17852783203125, 24.179668426513672, 25.180809020996094, 26.181947708129883, 27.183088302612305, 28.184226989746094, 29.185367584228516]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 10.0, 10.0, 14.0, 21.0, 35.0, 40.0, 55.0, 65.0, 106.0, 158.0, 230.0, 365.0, 595.0, 929.0, 1571.0, 2556.0, 4399.0, 7117.0, 12190.0, 20353.0, 33281.0, 52838.0, 79783.0, 109089.0, 133730.0, 143180.0, 131736.0, 106757.0, 76301.0, 51125.0, 31706.0, 19391.0, 11509.0, 6788.0, 3969.0, 2465.0, 1483.0, 924.0, 570.0, 391.0, 241.0, 157.0, 102.0, 78.0, 43.0, 37.0, 25.0, 19.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.1875, -32.02099609375, -30.8544921875, -29.68798828125, -28.521484375, -27.35498046875, -26.1884765625, -25.02197265625, -23.85546875, -22.68896484375, -21.5224609375, -20.35595703125, -19.189453125, -18.02294921875, -16.8564453125, -15.68994140625, -14.5234375, -13.35693359375, -12.1904296875, -11.02392578125, -9.857421875, -8.69091796875, -7.5244140625, -6.35791015625, -5.19140625, -4.02490234375, -2.8583984375, -1.69189453125, -0.525390625, 0.64111328125, 1.8076171875, 2.97412109375, 4.140625, 5.30712890625, 6.4736328125, 7.64013671875, 8.806640625, 9.97314453125, 11.1396484375, 12.30615234375, 13.47265625, 14.63916015625, 15.8056640625, 16.97216796875, 18.138671875, 19.30517578125, 20.4716796875, 21.63818359375, 22.8046875, 23.97119140625, 25.1376953125, 26.30419921875, 27.470703125, 28.63720703125, 29.8037109375, 30.97021484375, 32.13671875, 33.30322265625, 34.4697265625, 35.63623046875, 36.802734375, 37.96923828125, 39.1357421875, 40.30224609375, 41.46875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 1.0, 7.0, 7.0, 5.0, 8.0, 12.0, 17.0, 19.0, 19.0, 18.0, 24.0, 20.0, 37.0, 37.0, 36.0, 43.0, 34.0, 36.0, 31.0, 42.0, 34.0, 31.0, 47.0, 33.0, 37.0, 38.0, 35.0, 30.0, 35.0, 22.0, 19.0, 33.0, 16.0, 21.0, 24.0, 16.0, 13.0, 14.0, 11.0, 8.0, 5.0, 6.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-34.5, -33.527587890625, -32.55517578125, -31.582763671875, -30.6103515625, -29.637939453125, -28.66552734375, -27.693115234375, -26.720703125, -25.748291015625, -24.77587890625, -23.803466796875, -22.8310546875, -21.858642578125, -20.88623046875, -19.913818359375, -18.94140625, -17.968994140625, -16.99658203125, -16.024169921875, -15.0517578125, -14.079345703125, -13.10693359375, -12.134521484375, -11.162109375, -10.189697265625, -9.21728515625, -8.244873046875, -7.2724609375, -6.300048828125, -5.32763671875, -4.355224609375, -3.3828125, -2.410400390625, -1.43798828125, -0.465576171875, 0.5068359375, 1.479248046875, 2.45166015625, 3.424072265625, 4.396484375, 5.368896484375, 6.34130859375, 7.313720703125, 8.2861328125, 9.258544921875, 10.23095703125, 11.203369140625, 12.17578125, 13.148193359375, 14.12060546875, 15.093017578125, 16.0654296875, 17.037841796875, 18.01025390625, 18.982666015625, 19.955078125, 20.927490234375, 21.89990234375, 22.872314453125, 23.8447265625, 24.817138671875, 25.78955078125, 26.761962890625, 27.734375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 4.0, 10.0, 12.0, 14.0, 18.0, 28.0, 57.0, 76.0, 122.0, 168.0, 282.0, 423.0, 716.0, 1063.0, 1708.0, 2741.0, 4398.0, 7294.0, 12027.0, 19454.0, 31320.0, 49800.0, 74200.0, 102963.0, 129044.0, 140711.0, 132103.0, 109764.0, 80790.0, 54911.0, 35508.0, 21971.0, 13389.0, 8199.0, 4898.0, 3066.0, 1912.0, 1213.0, 760.0, 517.0, 317.0, 200.0, 122.0, 91.0, 44.0, 45.0, 31.0, 24.0, 7.0, 8.0, 7.0, 6.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.53125, -31.39453125, -30.2578125, -29.12109375, -27.984375, -26.84765625, -25.7109375, -24.57421875, -23.4375, -22.30078125, -21.1640625, -20.02734375, -18.890625, -17.75390625, -16.6171875, -15.48046875, -14.34375, -13.20703125, -12.0703125, -10.93359375, -9.796875, -8.66015625, -7.5234375, -6.38671875, -5.25, -4.11328125, -2.9765625, -1.83984375, -0.703125, 0.43359375, 1.5703125, 2.70703125, 3.84375, 4.98046875, 6.1171875, 7.25390625, 8.390625, 9.52734375, 10.6640625, 11.80078125, 12.9375, 14.07421875, 15.2109375, 16.34765625, 17.484375, 18.62109375, 19.7578125, 20.89453125, 22.03125, 23.16796875, 24.3046875, 25.44140625, 26.578125, 27.71484375, 28.8515625, 29.98828125, 31.125, 32.26171875, 33.3984375, 34.53515625, 35.671875, 36.80859375, 37.9453125, 39.08203125, 40.21875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 8.0, 4.0, 11.0, 8.0, 14.0, 9.0, 19.0, 17.0, 23.0, 26.0, 22.0, 18.0, 52.0, 36.0, 33.0, 38.0, 43.0, 38.0, 62.0, 40.0, 43.0, 36.0, 32.0, 37.0, 33.0, 39.0, 40.0, 34.0, 33.0, 22.0, 21.0, 16.0, 14.0, 9.0, 9.0, 16.0, 9.0, 9.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.65625, -20.97265625, -20.2890625, -19.60546875, -18.921875, -18.23828125, -17.5546875, -16.87109375, -16.1875, -15.50390625, -14.8203125, -14.13671875, -13.453125, -12.76953125, -12.0859375, -11.40234375, -10.71875, -10.03515625, -9.3515625, -8.66796875, -7.984375, -7.30078125, -6.6171875, -5.93359375, -5.25, -4.56640625, -3.8828125, -3.19921875, -2.515625, -1.83203125, -1.1484375, -0.46484375, 0.21875, 0.90234375, 1.5859375, 2.26953125, 2.953125, 3.63671875, 4.3203125, 5.00390625, 5.6875, 6.37109375, 7.0546875, 7.73828125, 8.421875, 9.10546875, 9.7890625, 10.47265625, 11.15625, 11.83984375, 12.5234375, 13.20703125, 13.890625, 14.57421875, 15.2578125, 15.94140625, 16.625, 17.30859375, 17.9921875, 18.67578125, 19.359375, 20.04296875, 20.7265625, 21.41015625, 22.09375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 8.0, 11.0, 15.0, 26.0, 36.0, 66.0, 79.0, 142.0, 162.0, 256.0, 374.0, 557.0, 838.0, 1244.0, 1914.0, 2905.0, 4481.0, 7342.0, 12399.0, 21219.0, 37018.0, 63319.0, 103836.0, 150441.0, 177081.0, 162121.0, 118324.0, 74558.0, 44004.0, 25356.0, 14583.0, 8786.0, 5319.0, 3332.0, 2084.0, 1387.0, 1001.0, 627.0, 402.0, 312.0, 193.0, 119.0, 87.0, 62.0, 33.0, 27.0, 24.0, 14.0, 10.0, 12.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.6640625, -13.232421875, -12.80078125, -12.369140625, -11.9375, -11.505859375, -11.07421875, -10.642578125, -10.2109375, -9.779296875, -9.34765625, -8.916015625, -8.484375, -8.052734375, -7.62109375, -7.189453125, -6.7578125, -6.326171875, -5.89453125, -5.462890625, -5.03125, -4.599609375, -4.16796875, -3.736328125, -3.3046875, -2.873046875, -2.44140625, -2.009765625, -1.578125, -1.146484375, -0.71484375, -0.283203125, 0.1484375, 0.580078125, 1.01171875, 1.443359375, 1.875, 2.306640625, 2.73828125, 3.169921875, 3.6015625, 4.033203125, 4.46484375, 4.896484375, 5.328125, 5.759765625, 6.19140625, 6.623046875, 7.0546875, 7.486328125, 7.91796875, 8.349609375, 8.78125, 9.212890625, 9.64453125, 10.076171875, 10.5078125, 10.939453125, 11.37109375, 11.802734375, 12.234375, 12.666015625, 13.09765625, 13.529296875, 13.9609375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 8.0, 11.0, 16.0, 23.0, 26.0, 23.0, 32.0, 40.0, 49.0, 63.0, 60.0, 72.0, 76.0, 78.0, 56.0, 50.0, 69.0, 38.0, 59.0, 28.0, 19.0, 20.0, 16.0, 10.0, 11.0, 11.0, 4.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001445770263671875, -0.0013970434665679932, -0.0013483166694641113, -0.0012995898723602295, -0.0012508630752563477, -0.0012021362781524658, -0.001153409481048584, -0.0011046826839447021, -0.0010559558868408203, -0.0010072290897369385, -0.0009585022926330566, -0.0009097754955291748, -0.000861048698425293, -0.0008123219013214111, -0.0007635951042175293, -0.0007148683071136475, -0.0006661415100097656, -0.0006174147129058838, -0.000568687915802002, -0.0005199611186981201, -0.0004712343215942383, -0.00042250752449035645, -0.0003737807273864746, -0.0003250539302825928, -0.00027632713317871094, -0.0002276003360748291, -0.00017887353897094727, -0.00013014674186706543, -8.14199447631836e-05, -3.269314765930176e-05, 1.6033649444580078e-05, 6.476044654846191e-05, 0.00011348724365234375, 0.00016221404075622559, 0.00021094083786010742, 0.00025966763496398926, 0.0003083944320678711, 0.00035712122917175293, 0.00040584802627563477, 0.0004545748233795166, 0.0005033016204833984, 0.0005520284175872803, 0.0006007552146911621, 0.0006494820117950439, 0.0006982088088989258, 0.0007469356060028076, 0.0007956624031066895, 0.0008443892002105713, 0.0008931159973144531, 0.000941842794418335, 0.0009905695915222168, 0.0010392963886260986, 0.0010880231857299805, 0.0011367499828338623, 0.0011854767799377441, 0.001234203577041626, 0.0012829303741455078, 0.0013316571712493896, 0.0013803839683532715, 0.0014291107654571533, 0.0014778375625610352, 0.001526564359664917, 0.0015752911567687988, 0.0016240179538726807, 0.0016727447509765625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 17.0, 24.0, 31.0, 45.0, 75.0, 98.0, 134.0, 224.0, 338.0, 563.0, 902.0, 1390.0, 2295.0, 3834.0, 6542.0, 10962.0, 18185.0, 29896.0, 48837.0, 74977.0, 106953.0, 136546.0, 149928.0, 138168.0, 110075.0, 77774.0, 50564.0, 31429.0, 19129.0, 11385.0, 6708.0, 4153.0, 2459.0, 1460.0, 877.0, 564.0, 340.0, 236.0, 159.0, 91.0, 56.0, 48.0, 27.0, 24.0, 13.0, 11.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.6484375, -10.2998046875, -9.951171875, -9.6025390625, -9.25390625, -8.9052734375, -8.556640625, -8.2080078125, -7.859375, -7.5107421875, -7.162109375, -6.8134765625, -6.46484375, -6.1162109375, -5.767578125, -5.4189453125, -5.0703125, -4.7216796875, -4.373046875, -4.0244140625, -3.67578125, -3.3271484375, -2.978515625, -2.6298828125, -2.28125, -1.9326171875, -1.583984375, -1.2353515625, -0.88671875, -0.5380859375, -0.189453125, 0.1591796875, 0.5078125, 0.8564453125, 1.205078125, 1.5537109375, 1.90234375, 2.2509765625, 2.599609375, 2.9482421875, 3.296875, 3.6455078125, 3.994140625, 4.3427734375, 4.69140625, 5.0400390625, 5.388671875, 5.7373046875, 6.0859375, 6.4345703125, 6.783203125, 7.1318359375, 7.48046875, 7.8291015625, 8.177734375, 8.5263671875, 8.875, 9.2236328125, 9.572265625, 9.9208984375, 10.26953125, 10.6181640625, 10.966796875, 11.3154296875, 11.6640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 13.0, 9.0, 6.0, 11.0, 19.0, 14.0, 12.0, 18.0, 21.0, 29.0, 31.0, 43.0, 51.0, 53.0, 51.0, 56.0, 62.0, 52.0, 46.0, 45.0, 57.0, 53.0, 46.0, 32.0, 21.0, 33.0, 17.0, 12.0, 15.0, 12.0, 17.0, 9.0, 10.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-6.22265625, -6.05877685546875, -5.8948974609375, -5.73101806640625, -5.567138671875, -5.40325927734375, -5.2393798828125, -5.07550048828125, -4.91162109375, -4.74774169921875, -4.5838623046875, -4.41998291015625, -4.256103515625, -4.09222412109375, -3.9283447265625, -3.76446533203125, -3.6005859375, -3.43670654296875, -3.2728271484375, -3.10894775390625, -2.945068359375, -2.78118896484375, -2.6173095703125, -2.45343017578125, -2.28955078125, -2.12567138671875, -1.9617919921875, -1.79791259765625, -1.634033203125, -1.47015380859375, -1.3062744140625, -1.14239501953125, -0.978515625, -0.81463623046875, -0.6507568359375, -0.48687744140625, -0.322998046875, -0.15911865234375, 0.0047607421875, 0.16864013671875, 0.33251953125, 0.49639892578125, 0.6602783203125, 0.82415771484375, 0.988037109375, 1.15191650390625, 1.3157958984375, 1.47967529296875, 1.6435546875, 1.80743408203125, 1.9713134765625, 2.13519287109375, 2.299072265625, 2.46295166015625, 2.6268310546875, 2.79071044921875, 2.95458984375, 3.11846923828125, 3.2823486328125, 3.44622802734375, 3.610107421875, 3.77398681640625, 3.9378662109375, 4.10174560546875, 4.265625]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 11.0, 4.0, 9.0, 12.0, 12.0, 12.0, 25.0, 14.0, 27.0, 35.0, 42.0, 38.0, 35.0, 57.0, 45.0, 57.0, 58.0, 55.0, 56.0, 48.0, 63.0, 46.0, 39.0, 25.0, 31.0, 29.0, 17.0, 17.0, 22.0, 17.0, 13.0, 5.0, 8.0, 5.0, 2.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.06857681274414, -36.91872024536133, -35.76885986328125, -34.61900329589844, -33.469146728515625, -32.31928634643555, -31.169429779052734, -30.01957130432129, -28.869712829589844, -27.7198543548584, -26.569997787475586, -25.42013931274414, -24.270280838012695, -23.12042236328125, -21.970565795898438, -20.820707321166992, -19.67085075378418, -18.520992279052734, -17.371135711669922, -16.221277236938477, -15.071418762207031, -13.921561241149902, -12.771703720092773, -11.621845245361328, -10.4719877243042, -9.32213020324707, -8.172271728515625, -7.022414207458496, -5.872556209564209, -4.722698211669922, -3.572840690612793, -2.4229822158813477, -1.2731246948242188, -0.12326681613922119, 1.0265910625457764, 2.1764488220214844, 3.3263068199157715, 4.476164817810059, 5.6260223388671875, 6.775880813598633, 7.925738334655762, 9.07559585571289, 10.225454330444336, 11.375311851501465, 12.525169372558594, 13.675027847290039, 14.824885368347168, 15.974743843078613, 17.124601364135742, 18.274459838867188, 19.42431640625, 20.574174880981445, 21.72403335571289, 22.873889923095703, 24.02374839782715, 25.173606872558594, 26.323463439941406, 27.47332191467285, 28.623178482055664, 29.77303695678711, 30.922895431518555, 32.07275390625, 33.22261047363281, 34.372467041015625, 35.5223274230957]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 5.0, 5.0, 10.0, 6.0, 8.0, 2.0, 11.0, 13.0, 17.0, 12.0, 18.0, 22.0, 22.0, 25.0, 25.0, 26.0, 28.0, 33.0, 34.0, 28.0, 48.0, 40.0, 26.0, 38.0, 32.0, 32.0, 22.0, 36.0, 25.0, 31.0, 26.0, 28.0, 26.0, 22.0, 25.0, 23.0, 23.0, 21.0, 14.0, 12.0, 9.0, 12.0, 13.0, 15.0, 8.0, 7.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0], "bins": [-30.306537628173828, -29.422033309936523, -28.53752899169922, -27.653026580810547, -26.768522262573242, -25.884017944335938, -24.999515533447266, -24.11501121520996, -23.230506896972656, -22.34600257873535, -21.461498260498047, -20.576995849609375, -19.69249153137207, -18.807987213134766, -17.923484802246094, -17.03898048400879, -16.154476165771484, -15.26997184753418, -14.385468482971191, -13.500965118408203, -12.616460800170898, -11.731956481933594, -10.847453117370605, -9.962949752807617, -9.078445434570312, -8.193941116333008, -7.3094377517700195, -6.424933910369873, -5.540430068969727, -4.65592622756958, -3.7714223861694336, -2.886918544769287, -2.0024166107177734, -1.117912769317627, -0.23340892791748047, 0.651094913482666, 1.5355987548828125, 2.420102596282959, 3.3046064376831055, 4.189110279083252, 5.073614120483398, 5.958117961883545, 6.842621803283691, 7.727125644683838, 8.611629486083984, 9.496133804321289, 10.380637168884277, 11.265140533447266, 12.14964485168457, 13.034149169921875, 13.918652534484863, 14.803155899047852, 15.687660217285156, 16.57216453552246, 17.456668853759766, 18.341171264648438, 19.225675582885742, 20.110179901123047, 20.99468231201172, 21.879186630249023, 22.763690948486328, 23.648195266723633, 24.532699584960938, 25.41720199584961, 26.301706314086914]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 13.0, 18.0, 27.0, 28.0, 39.0, 81.0, 134.0, 209.0, 315.0, 552.0, 792.0, 1351.0, 2121.0, 3513.0, 6138.0, 10226.0, 17545.0, 30253.0, 53437.0, 92746.0, 162304.0, 272818.0, 430047.0, 593847.0, 677186.0, 621004.0, 469297.0, 305518.0, 184992.0, 108221.0, 62568.0, 36078.0, 20843.0, 12083.0, 7214.0, 4221.0, 2610.0, 1554.0, 891.0, 532.0, 356.0, 216.0, 138.0, 84.0, 47.0, 25.0, 17.0, 13.0, 8.0, 9.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.84375, -24.032470703125, -23.22119140625, -22.409912109375, -21.5986328125, -20.787353515625, -19.97607421875, -19.164794921875, -18.353515625, -17.542236328125, -16.73095703125, -15.919677734375, -15.1083984375, -14.297119140625, -13.48583984375, -12.674560546875, -11.86328125, -11.052001953125, -10.24072265625, -9.429443359375, -8.6181640625, -7.806884765625, -6.99560546875, -6.184326171875, -5.373046875, -4.561767578125, -3.75048828125, -2.939208984375, -2.1279296875, -1.316650390625, -0.50537109375, 0.305908203125, 1.1171875, 1.928466796875, 2.73974609375, 3.551025390625, 4.3623046875, 5.173583984375, 5.98486328125, 6.796142578125, 7.607421875, 8.418701171875, 9.22998046875, 10.041259765625, 10.8525390625, 11.663818359375, 12.47509765625, 13.286376953125, 14.09765625, 14.908935546875, 15.72021484375, 16.531494140625, 17.3427734375, 18.154052734375, 18.96533203125, 19.776611328125, 20.587890625, 21.399169921875, 22.21044921875, 23.021728515625, 23.8330078125, 24.644287109375, 25.45556640625, 26.266845703125, 27.078125]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 10.0, 4.0, 12.0, 7.0, 9.0, 14.0, 16.0, 16.0, 17.0, 21.0, 29.0, 24.0, 21.0, 31.0, 43.0, 36.0, 37.0, 36.0, 37.0, 49.0, 33.0, 39.0, 34.0, 37.0, 34.0, 33.0, 33.0, 37.0, 29.0, 24.0, 24.0, 31.0, 16.0, 19.0, 19.0, 11.0, 11.0, 19.0, 10.0, 5.0, 10.0, 4.0, 8.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.875, -24.135498046875, -23.39599609375, -22.656494140625, -21.9169921875, -21.177490234375, -20.43798828125, -19.698486328125, -18.958984375, -18.219482421875, -17.47998046875, -16.740478515625, -16.0009765625, -15.261474609375, -14.52197265625, -13.782470703125, -13.04296875, -12.303466796875, -11.56396484375, -10.824462890625, -10.0849609375, -9.345458984375, -8.60595703125, -7.866455078125, -7.126953125, -6.387451171875, -5.64794921875, -4.908447265625, -4.1689453125, -3.429443359375, -2.68994140625, -1.950439453125, -1.2109375, -0.471435546875, 0.26806640625, 1.007568359375, 1.7470703125, 2.486572265625, 3.22607421875, 3.965576171875, 4.705078125, 5.444580078125, 6.18408203125, 6.923583984375, 7.6630859375, 8.402587890625, 9.14208984375, 9.881591796875, 10.62109375, 11.360595703125, 12.10009765625, 12.839599609375, 13.5791015625, 14.318603515625, 15.05810546875, 15.797607421875, 16.537109375, 17.276611328125, 18.01611328125, 18.755615234375, 19.4951171875, 20.234619140625, 20.97412109375, 21.713623046875, 22.453125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 19.0, 16.0, 21.0, 32.0, 56.0, 77.0, 139.0, 195.0, 305.0, 479.0, 718.0, 1157.0, 1779.0, 2809.0, 4444.0, 7199.0, 11263.0, 18252.0, 29437.0, 45773.0, 72213.0, 110511.0, 164832.0, 239372.0, 327690.0, 421793.0, 492607.0, 508945.0, 465378.0, 381014.0, 287765.0, 205118.0, 139248.0, 92206.0, 59808.0, 37614.0, 23837.0, 14968.0, 9381.0, 5726.0, 3694.0, 2287.0, 1490.0, 976.0, 615.0, 354.0, 242.0, 163.0, 105.0, 63.0, 40.0, 20.0, 17.0, 7.0, 7.0, 2.0, 3.0, 3.0], "bins": [-21.28125, -20.641845703125, -20.00244140625, -19.363037109375, -18.7236328125, -18.084228515625, -17.44482421875, -16.805419921875, -16.166015625, -15.526611328125, -14.88720703125, -14.247802734375, -13.6083984375, -12.968994140625, -12.32958984375, -11.690185546875, -11.05078125, -10.411376953125, -9.77197265625, -9.132568359375, -8.4931640625, -7.853759765625, -7.21435546875, -6.574951171875, -5.935546875, -5.296142578125, -4.65673828125, -4.017333984375, -3.3779296875, -2.738525390625, -2.09912109375, -1.459716796875, -0.8203125, -0.180908203125, 0.45849609375, 1.097900390625, 1.7373046875, 2.376708984375, 3.01611328125, 3.655517578125, 4.294921875, 4.934326171875, 5.57373046875, 6.213134765625, 6.8525390625, 7.491943359375, 8.13134765625, 8.770751953125, 9.41015625, 10.049560546875, 10.68896484375, 11.328369140625, 11.9677734375, 12.607177734375, 13.24658203125, 13.885986328125, 14.525390625, 15.164794921875, 15.80419921875, 16.443603515625, 17.0830078125, 17.722412109375, 18.36181640625, 19.001220703125, 19.640625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 9.0, 3.0, 8.0, 13.0, 22.0, 25.0, 27.0, 27.0, 57.0, 57.0, 67.0, 62.0, 104.0, 119.0, 122.0, 156.0, 168.0, 200.0, 193.0, 209.0, 215.0, 226.0, 209.0, 229.0, 191.0, 190.0, 192.0, 150.0, 135.0, 112.0, 104.0, 82.0, 57.0, 55.0, 56.0, 47.0, 41.0, 23.0, 27.0, 13.0, 17.0, 11.0, 10.0, 13.0, 7.0, 7.0, 5.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.484375, -9.158935546875, -8.83349609375, -8.508056640625, -8.1826171875, -7.857177734375, -7.53173828125, -7.206298828125, -6.880859375, -6.555419921875, -6.22998046875, -5.904541015625, -5.5791015625, -5.253662109375, -4.92822265625, -4.602783203125, -4.27734375, -3.951904296875, -3.62646484375, -3.301025390625, -2.9755859375, -2.650146484375, -2.32470703125, -1.999267578125, -1.673828125, -1.348388671875, -1.02294921875, -0.697509765625, -0.3720703125, -0.046630859375, 0.27880859375, 0.604248046875, 0.9296875, 1.255126953125, 1.58056640625, 1.906005859375, 2.2314453125, 2.556884765625, 2.88232421875, 3.207763671875, 3.533203125, 3.858642578125, 4.18408203125, 4.509521484375, 4.8349609375, 5.160400390625, 5.48583984375, 5.811279296875, 6.13671875, 6.462158203125, 6.78759765625, 7.113037109375, 7.4384765625, 7.763916015625, 8.08935546875, 8.414794921875, 8.740234375, 9.065673828125, 9.39111328125, 9.716552734375, 10.0419921875, 10.367431640625, 10.69287109375, 11.018310546875, 11.34375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 10.0, 11.0, 16.0, 17.0, 23.0, 31.0, 37.0, 42.0, 50.0, 46.0, 50.0, 50.0, 46.0, 56.0, 66.0, 56.0, 57.0, 65.0, 40.0, 30.0, 26.0, 33.0, 32.0, 21.0, 25.0, 13.0, 11.0, 10.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.06985092163086, -34.99314498901367, -33.91644287109375, -32.83973693847656, -31.763032913208008, -30.686328887939453, -29.609622955322266, -28.53291893005371, -27.456214904785156, -26.3795108795166, -25.302806854248047, -24.22610092163086, -23.149396896362305, -22.07269287109375, -20.995986938476562, -19.919282913208008, -18.842578887939453, -17.7658748626709, -16.689170837402344, -15.612464904785156, -14.535760879516602, -13.459056854248047, -12.382351875305176, -11.305646896362305, -10.22894287109375, -9.152238845825195, -8.075533866882324, -6.998829364776611, -5.922124862670898, -4.8454203605651855, -3.7687158584594727, -2.6920113563537598, -1.6153106689453125, -0.5386061668395996, 0.5380983352661133, 1.6148028373718262, 2.691507339477539, 3.768211841583252, 4.844916343688965, 5.921620845794678, 6.998325347900391, 8.075029373168945, 9.151734352111816, 10.228439331054688, 11.305143356323242, 12.381847381591797, 13.458552360534668, 14.535257339477539, 15.611961364746094, 16.68866539001465, 17.765369415283203, 18.84207534790039, 19.918779373168945, 20.9954833984375, 22.072189331054688, 23.148893356323242, 24.225597381591797, 25.30230140686035, 26.379005432128906, 27.455711364746094, 28.53241539001465, 29.609119415283203, 30.68582534790039, 31.762529373168945, 32.8392333984375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 9.0, 8.0, 7.0, 11.0, 23.0, 18.0, 16.0, 18.0, 27.0, 27.0, 22.0, 31.0, 38.0, 33.0, 31.0, 41.0, 39.0, 35.0, 38.0, 50.0, 32.0, 28.0, 39.0, 33.0, 39.0, 38.0, 30.0, 31.0, 26.0, 19.0, 23.0, 22.0, 18.0, 16.0, 13.0, 14.0, 12.0, 7.0, 11.0, 3.0, 1.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.962976455688477, -28.074247360229492, -27.18552017211914, -26.296791076660156, -25.408061981201172, -24.51933479309082, -23.630605697631836, -22.741878509521484, -21.8531494140625, -20.964420318603516, -20.075693130493164, -19.18696403503418, -18.298236846923828, -17.409507751464844, -16.52077865600586, -15.632050514221191, -14.743322372436523, -13.854594230651855, -12.965866088867188, -12.077136993408203, -11.188408851623535, -10.299680709838867, -9.410951614379883, -8.522223472595215, -7.633495330810547, -6.744767189025879, -5.856038570404053, -4.967309951782227, -4.078581809997559, -3.1898536682128906, -2.3011250495910645, -1.4123964309692383, -0.5236701965332031, 0.36505818367004395, 1.253786563873291, 2.142514944076538, 3.031243324279785, 3.919971466064453, 4.808700084686279, 5.6974287033081055, 6.586156845092773, 7.474884986877441, 8.36361312866211, 9.252342224121094, 10.141070365905762, 11.02979850769043, 11.918527603149414, 12.807255744934082, 13.69598388671875, 14.584712028503418, 15.473440170288086, 16.36216926574707, 17.250896453857422, 18.139625549316406, 19.02835464477539, 19.917083740234375, 20.805810928344727, 21.69454002380371, 22.583267211914062, 23.471996307373047, 24.36072540283203, 25.249452590942383, 26.138181686401367, 27.02690887451172, 27.915637969970703]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 8.0, 4.0, 4.0, 13.0, 21.0, 16.0, 22.0, 38.0, 46.0, 73.0, 113.0, 157.0, 244.0, 393.0, 566.0, 981.0, 1527.0, 2561.0, 4349.0, 7669.0, 13849.0, 25351.0, 46015.0, 83679.0, 143445.0, 211334.0, 202736.0, 132925.0, 75968.0, 41562.0, 22800.0, 12565.0, 6996.0, 4122.0, 2468.0, 1394.0, 905.0, 538.0, 372.0, 227.0, 158.0, 90.0, 93.0, 45.0, 40.0, 18.0, 20.0, 13.0, 6.0, 14.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-31.609375, -30.649169921875, -29.68896484375, -28.728759765625, -27.7685546875, -26.808349609375, -25.84814453125, -24.887939453125, -23.927734375, -22.967529296875, -22.00732421875, -21.047119140625, -20.0869140625, -19.126708984375, -18.16650390625, -17.206298828125, -16.24609375, -15.285888671875, -14.32568359375, -13.365478515625, -12.4052734375, -11.445068359375, -10.48486328125, -9.524658203125, -8.564453125, -7.604248046875, -6.64404296875, -5.683837890625, -4.7236328125, -3.763427734375, -2.80322265625, -1.843017578125, -0.8828125, 0.077392578125, 1.03759765625, 1.997802734375, 2.9580078125, 3.918212890625, 4.87841796875, 5.838623046875, 6.798828125, 7.759033203125, 8.71923828125, 9.679443359375, 10.6396484375, 11.599853515625, 12.56005859375, 13.520263671875, 14.48046875, 15.440673828125, 16.40087890625, 17.361083984375, 18.3212890625, 19.281494140625, 20.24169921875, 21.201904296875, 22.162109375, 23.122314453125, 24.08251953125, 25.042724609375, 26.0029296875, 26.963134765625, 27.92333984375, 28.883544921875, 29.84375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 7.0, 12.0, 13.0, 8.0, 14.0, 9.0, 23.0, 17.0, 19.0, 27.0, 24.0, 35.0, 29.0, 33.0, 35.0, 32.0, 48.0, 29.0, 39.0, 38.0, 51.0, 32.0, 40.0, 30.0, 34.0, 30.0, 38.0, 40.0, 24.0, 22.0, 32.0, 27.0, 13.0, 21.0, 17.0, 9.0, 8.0, 12.0, 10.0, 8.0, 3.0, 5.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.8125, -28.909912109375, -28.00732421875, -27.104736328125, -26.2021484375, -25.299560546875, -24.39697265625, -23.494384765625, -22.591796875, -21.689208984375, -20.78662109375, -19.884033203125, -18.9814453125, -18.078857421875, -17.17626953125, -16.273681640625, -15.37109375, -14.468505859375, -13.56591796875, -12.663330078125, -11.7607421875, -10.858154296875, -9.95556640625, -9.052978515625, -8.150390625, -7.247802734375, -6.34521484375, -5.442626953125, -4.5400390625, -3.637451171875, -2.73486328125, -1.832275390625, -0.9296875, -0.027099609375, 0.87548828125, 1.778076171875, 2.6806640625, 3.583251953125, 4.48583984375, 5.388427734375, 6.291015625, 7.193603515625, 8.09619140625, 8.998779296875, 9.9013671875, 10.803955078125, 11.70654296875, 12.609130859375, 13.51171875, 14.414306640625, 15.31689453125, 16.219482421875, 17.1220703125, 18.024658203125, 18.92724609375, 19.829833984375, 20.732421875, 21.635009765625, 22.53759765625, 23.440185546875, 24.3427734375, 25.245361328125, 26.14794921875, 27.050537109375, 27.953125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 15.0, 20.0, 28.0, 44.0, 57.0, 89.0, 141.0, 220.0, 353.0, 669.0, 1111.0, 2059.0, 4123.0, 8280.0, 18096.0, 43980.0, 113613.0, 276261.0, 326034.0, 150552.0, 58059.0, 23451.0, 10538.0, 4911.0, 2566.0, 1406.0, 701.0, 443.0, 255.0, 163.0, 114.0, 58.0, 45.0, 35.0, 24.0, 6.0, 5.0, 7.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.859375, -30.868408203125, -29.87744140625, -28.886474609375, -27.8955078125, -26.904541015625, -25.91357421875, -24.922607421875, -23.931640625, -22.940673828125, -21.94970703125, -20.958740234375, -19.9677734375, -18.976806640625, -17.98583984375, -16.994873046875, -16.00390625, -15.012939453125, -14.02197265625, -13.031005859375, -12.0400390625, -11.049072265625, -10.05810546875, -9.067138671875, -8.076171875, -7.085205078125, -6.09423828125, -5.103271484375, -4.1123046875, -3.121337890625, -2.13037109375, -1.139404296875, -0.1484375, 0.842529296875, 1.83349609375, 2.824462890625, 3.8154296875, 4.806396484375, 5.79736328125, 6.788330078125, 7.779296875, 8.770263671875, 9.76123046875, 10.752197265625, 11.7431640625, 12.734130859375, 13.72509765625, 14.716064453125, 15.70703125, 16.697998046875, 17.68896484375, 18.679931640625, 19.6708984375, 20.661865234375, 21.65283203125, 22.643798828125, 23.634765625, 24.625732421875, 25.61669921875, 26.607666015625, 27.5986328125, 28.589599609375, 29.58056640625, 30.571533203125, 31.5625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 5.0, 5.0, 6.0, 11.0, 6.0, 12.0, 13.0, 17.0, 18.0, 29.0, 28.0, 29.0, 34.0, 37.0, 35.0, 43.0, 56.0, 59.0, 39.0, 42.0, 41.0, 58.0, 41.0, 47.0, 34.0, 41.0, 36.0, 30.0, 29.0, 27.0, 20.0, 17.0, 11.0, 14.0, 6.0, 10.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.0, -30.181640625, -29.36328125, -28.544921875, -27.7265625, -26.908203125, -26.08984375, -25.271484375, -24.453125, -23.634765625, -22.81640625, -21.998046875, -21.1796875, -20.361328125, -19.54296875, -18.724609375, -17.90625, -17.087890625, -16.26953125, -15.451171875, -14.6328125, -13.814453125, -12.99609375, -12.177734375, -11.359375, -10.541015625, -9.72265625, -8.904296875, -8.0859375, -7.267578125, -6.44921875, -5.630859375, -4.8125, -3.994140625, -3.17578125, -2.357421875, -1.5390625, -0.720703125, 0.09765625, 0.916015625, 1.734375, 2.552734375, 3.37109375, 4.189453125, 5.0078125, 5.826171875, 6.64453125, 7.462890625, 8.28125, 9.099609375, 9.91796875, 10.736328125, 11.5546875, 12.373046875, 13.19140625, 14.009765625, 14.828125, 15.646484375, 16.46484375, 17.283203125, 18.1015625, 18.919921875, 19.73828125, 20.556640625, 21.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 6.0, 10.0, 11.0, 18.0, 19.0, 50.0, 50.0, 87.0, 108.0, 188.0, 273.0, 392.0, 612.0, 976.0, 1595.0, 2771.0, 4793.0, 8853.0, 17967.0, 42655.0, 129639.0, 475948.0, 243066.0, 65991.0, 25803.0, 11802.0, 6152.0, 3424.0, 1937.0, 1183.0, 728.0, 489.0, 325.0, 222.0, 138.0, 79.0, 69.0, 40.0, 33.0, 20.0, 15.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.89892578125, -23.0947265625, -22.29052734375, -21.486328125, -20.68212890625, -19.8779296875, -19.07373046875, -18.26953125, -17.46533203125, -16.6611328125, -15.85693359375, -15.052734375, -14.24853515625, -13.4443359375, -12.64013671875, -11.8359375, -11.03173828125, -10.2275390625, -9.42333984375, -8.619140625, -7.81494140625, -7.0107421875, -6.20654296875, -5.40234375, -4.59814453125, -3.7939453125, -2.98974609375, -2.185546875, -1.38134765625, -0.5771484375, 0.22705078125, 1.03125, 1.83544921875, 2.6396484375, 3.44384765625, 4.248046875, 5.05224609375, 5.8564453125, 6.66064453125, 7.46484375, 8.26904296875, 9.0732421875, 9.87744140625, 10.681640625, 11.48583984375, 12.2900390625, 13.09423828125, 13.8984375, 14.70263671875, 15.5068359375, 16.31103515625, 17.115234375, 17.91943359375, 18.7236328125, 19.52783203125, 20.33203125, 21.13623046875, 21.9404296875, 22.74462890625, 23.548828125, 24.35302734375, 25.1572265625, 25.96142578125, 26.765625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 2.0, 10.0, 4.0, 4.0, 11.0, 12.0, 14.0, 20.0, 12.0, 10.0, 28.0, 28.0, 33.0, 38.0, 63.0, 82.0, 101.0, 93.0, 99.0, 61.0, 38.0, 35.0, 38.0, 31.0, 25.0, 12.0, 13.0, 6.0, 10.0, 10.0, 7.0, 12.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002422332763671875, -0.0023520290851593018, -0.0022817254066467285, -0.0022114217281341553, -0.002141118049621582, -0.002070814371109009, -0.0020005106925964355, -0.0019302070140838623, -0.001859903335571289, -0.0017895996570587158, -0.0017192959785461426, -0.0016489923000335693, -0.001578688621520996, -0.0015083849430084229, -0.0014380812644958496, -0.0013677775859832764, -0.0012974739074707031, -0.0012271702289581299, -0.0011568665504455566, -0.0010865628719329834, -0.0010162591934204102, -0.0009459555149078369, -0.0008756518363952637, -0.0008053481578826904, -0.0007350444793701172, -0.0006647408008575439, -0.0005944371223449707, -0.0005241334438323975, -0.0004538297653198242, -0.000383526086807251, -0.00031322240829467773, -0.0002429187297821045, -0.00017261505126953125, -0.00010231137275695801, -3.2007694244384766e-05, 3.8295984268188477e-05, 0.00010859966278076172, 0.00017890334129333496, 0.0002492070198059082, 0.00031951069831848145, 0.0003898143768310547, 0.00046011805534362793, 0.0005304217338562012, 0.0006007254123687744, 0.0006710290908813477, 0.0007413327693939209, 0.0008116364479064941, 0.0008819401264190674, 0.0009522438049316406, 0.0010225474834442139, 0.0010928511619567871, 0.0011631548404693604, 0.0012334585189819336, 0.0013037621974945068, 0.00137406587600708, 0.0014443695545196533, 0.0015146732330322266, 0.0015849769115447998, 0.001655280590057373, 0.0017255842685699463, 0.0017958879470825195, 0.0018661916255950928, 0.001936495304107666, 0.0020067989826202393, 0.0020771026611328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 7.0, 3.0, 5.0, 7.0, 10.0, 14.0, 22.0, 23.0, 24.0, 40.0, 53.0, 68.0, 116.0, 144.0, 219.0, 305.0, 463.0, 644.0, 1090.0, 1723.0, 2826.0, 4917.0, 8967.0, 16637.0, 33943.0, 73119.0, 175090.0, 340515.0, 214910.0, 88313.0, 40176.0, 19447.0, 10344.0, 5562.0, 3389.0, 1876.0, 1162.0, 760.0, 492.0, 305.0, 230.0, 152.0, 146.0, 85.0, 59.0, 39.0, 23.0, 27.0, 14.0, 18.0, 11.0, 18.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0], "bins": [-26.03125, -25.2568359375, -24.482421875, -23.7080078125, -22.93359375, -22.1591796875, -21.384765625, -20.6103515625, -19.8359375, -19.0615234375, -18.287109375, -17.5126953125, -16.73828125, -15.9638671875, -15.189453125, -14.4150390625, -13.640625, -12.8662109375, -12.091796875, -11.3173828125, -10.54296875, -9.7685546875, -8.994140625, -8.2197265625, -7.4453125, -6.6708984375, -5.896484375, -5.1220703125, -4.34765625, -3.5732421875, -2.798828125, -2.0244140625, -1.25, -0.4755859375, 0.298828125, 1.0732421875, 1.84765625, 2.6220703125, 3.396484375, 4.1708984375, 4.9453125, 5.7197265625, 6.494140625, 7.2685546875, 8.04296875, 8.8173828125, 9.591796875, 10.3662109375, 11.140625, 11.9150390625, 12.689453125, 13.4638671875, 14.23828125, 15.0126953125, 15.787109375, 16.5615234375, 17.3359375, 18.1103515625, 18.884765625, 19.6591796875, 20.43359375, 21.2080078125, 21.982421875, 22.7568359375, 23.53125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 5.0, 4.0, 17.0, 22.0, 24.0, 49.0, 53.0, 86.0, 187.0, 192.0, 132.0, 77.0, 40.0, 22.0, 24.0, 18.0, 13.0, 12.0, 1.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.40625, -14.896484375, -14.38671875, -13.876953125, -13.3671875, -12.857421875, -12.34765625, -11.837890625, -11.328125, -10.818359375, -10.30859375, -9.798828125, -9.2890625, -8.779296875, -8.26953125, -7.759765625, -7.25, -6.740234375, -6.23046875, -5.720703125, -5.2109375, -4.701171875, -4.19140625, -3.681640625, -3.171875, -2.662109375, -2.15234375, -1.642578125, -1.1328125, -0.623046875, -0.11328125, 0.396484375, 0.90625, 1.416015625, 1.92578125, 2.435546875, 2.9453125, 3.455078125, 3.96484375, 4.474609375, 4.984375, 5.494140625, 6.00390625, 6.513671875, 7.0234375, 7.533203125, 8.04296875, 8.552734375, 9.0625, 9.572265625, 10.08203125, 10.591796875, 11.1015625, 11.611328125, 12.12109375, 12.630859375, 13.140625, 13.650390625, 14.16015625, 14.669921875, 15.1796875, 15.689453125, 16.19921875, 16.708984375, 17.21875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 8.0, 3.0, 5.0, 15.0, 9.0, 7.0, 14.0, 21.0, 23.0, 31.0, 28.0, 42.0, 36.0, 38.0, 29.0, 43.0, 57.0, 42.0, 51.0, 46.0, 46.0, 49.0, 44.0, 40.0, 51.0, 28.0, 33.0, 30.0, 23.0, 23.0, 20.0, 23.0, 10.0, 13.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-29.059724807739258, -28.15408706665039, -27.248449325561523, -26.342811584472656, -25.43717384338379, -24.531536102294922, -23.625898361206055, -22.720260620117188, -21.81462287902832, -20.908985137939453, -20.003347396850586, -19.09770965576172, -18.19207191467285, -17.286434173583984, -16.380796432495117, -15.47515869140625, -14.569520950317383, -13.663883209228516, -12.758245468139648, -11.852607727050781, -10.946969985961914, -10.041332244873047, -9.13569450378418, -8.230056762695312, -7.324419021606445, -6.418781280517578, -5.513143539428711, -4.607505798339844, -3.7018680572509766, -2.7962303161621094, -1.8905925750732422, -0.984954833984375, -0.07931900024414062, 0.8263187408447266, 1.7319564819335938, 2.637594223022461, 3.543231964111328, 4.448869705200195, 5.3545074462890625, 6.26014518737793, 7.165782928466797, 8.071420669555664, 8.977058410644531, 9.882696151733398, 10.788333892822266, 11.693971633911133, 12.599609375, 13.505247116088867, 14.410884857177734, 15.316522598266602, 16.22216033935547, 17.127798080444336, 18.033435821533203, 18.93907356262207, 19.844711303710938, 20.750349044799805, 21.655986785888672, 22.56162452697754, 23.467262268066406, 24.372900009155273, 25.27853775024414, 26.184175491333008, 27.089813232421875, 27.995450973510742, 28.90108871459961]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 5.0, 4.0, 7.0, 11.0, 10.0, 10.0, 12.0, 18.0, 20.0, 14.0, 31.0, 30.0, 16.0, 32.0, 32.0, 34.0, 35.0, 35.0, 37.0, 38.0, 39.0, 29.0, 28.0, 41.0, 24.0, 34.0, 44.0, 35.0, 26.0, 27.0, 20.0, 32.0, 32.0, 21.0, 17.0, 13.0, 21.0, 16.0, 11.0, 15.0, 11.0, 3.0, 10.0, 4.0, 8.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.29692840576172, -24.493085861206055, -23.689241409301758, -22.885398864746094, -22.081554412841797, -21.277711868286133, -20.47386932373047, -19.670024871826172, -18.866180419921875, -18.06233787536621, -17.258493423461914, -16.45465087890625, -15.650806427001953, -14.846963882446289, -14.043120384216309, -13.239276885986328, -12.435434341430664, -11.631590843200684, -10.827747344970703, -10.023904800415039, -9.220060348510742, -8.416217803955078, -7.612374305725098, -6.808530807495117, -6.004687309265137, -5.200843811035156, -4.397000312805176, -3.5931572914123535, -2.789313793182373, -1.9854702949523926, -1.1816272735595703, -0.37778377532958984, 0.4260578155517578, 1.2299011945724487, 2.0337445735931396, 2.837587833404541, 3.6414313316345215, 4.445274829864502, 5.249117851257324, 6.052961349487305, 6.856804847717285, 7.660648345947266, 8.464491844177246, 9.268335342407227, 10.07217788696289, 10.876022338867188, 11.679864883422852, 12.483708381652832, 13.287551879882812, 14.091395378112793, 14.895238876342773, 15.699081420898438, 16.502925872802734, 17.3067684173584, 18.110610961914062, 18.91445541381836, 19.718299865722656, 20.52214241027832, 21.325986862182617, 22.12982940673828, 22.933673858642578, 23.737516403198242, 24.541358947753906, 25.345203399658203, 26.149045944213867]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 10.0, 8.0, 22.0, 31.0, 50.0, 66.0, 112.0, 158.0, 221.0, 310.0, 545.0, 896.0, 1256.0, 2012.0, 3201.0, 4808.0, 7785.0, 11677.0, 17826.0, 26748.0, 39234.0, 54791.0, 74144.0, 94439.0, 109726.0, 116220.0, 112338.0, 98721.0, 80459.0, 60048.0, 43216.0, 29934.0, 19945.0, 13291.0, 8553.0, 5667.0, 3577.0, 2256.0, 1489.0, 991.0, 596.0, 423.0, 266.0, 164.0, 101.0, 74.0, 42.0, 32.0, 32.0, 13.0, 6.0, 11.0, 10.0, 2.0, 2.0, 2.0, 1.0], "bins": [-25.875, -25.082275390625, -24.28955078125, -23.496826171875, -22.7041015625, -21.911376953125, -21.11865234375, -20.325927734375, -19.533203125, -18.740478515625, -17.94775390625, -17.155029296875, -16.3623046875, -15.569580078125, -14.77685546875, -13.984130859375, -13.19140625, -12.398681640625, -11.60595703125, -10.813232421875, -10.0205078125, -9.227783203125, -8.43505859375, -7.642333984375, -6.849609375, -6.056884765625, -5.26416015625, -4.471435546875, -3.6787109375, -2.885986328125, -2.09326171875, -1.300537109375, -0.5078125, 0.284912109375, 1.07763671875, 1.870361328125, 2.6630859375, 3.455810546875, 4.24853515625, 5.041259765625, 5.833984375, 6.626708984375, 7.41943359375, 8.212158203125, 9.0048828125, 9.797607421875, 10.59033203125, 11.383056640625, 12.17578125, 12.968505859375, 13.76123046875, 14.553955078125, 15.3466796875, 16.139404296875, 16.93212890625, 17.724853515625, 18.517578125, 19.310302734375, 20.10302734375, 20.895751953125, 21.6884765625, 22.481201171875, 23.27392578125, 24.066650390625, 24.859375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 14.0, 12.0, 15.0, 12.0, 24.0, 29.0, 23.0, 25.0, 24.0, 37.0, 22.0, 35.0, 28.0, 35.0, 40.0, 27.0, 48.0, 37.0, 38.0, 38.0, 45.0, 30.0, 35.0, 34.0, 32.0, 28.0, 23.0, 23.0, 22.0, 30.0, 14.0, 14.0, 14.0, 16.0, 14.0, 3.0, 8.0, 7.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.9375, -23.16748046875, -22.3974609375, -21.62744140625, -20.857421875, -20.08740234375, -19.3173828125, -18.54736328125, -17.77734375, -17.00732421875, -16.2373046875, -15.46728515625, -14.697265625, -13.92724609375, -13.1572265625, -12.38720703125, -11.6171875, -10.84716796875, -10.0771484375, -9.30712890625, -8.537109375, -7.76708984375, -6.9970703125, -6.22705078125, -5.45703125, -4.68701171875, -3.9169921875, -3.14697265625, -2.376953125, -1.60693359375, -0.8369140625, -0.06689453125, 0.703125, 1.47314453125, 2.2431640625, 3.01318359375, 3.783203125, 4.55322265625, 5.3232421875, 6.09326171875, 6.86328125, 7.63330078125, 8.4033203125, 9.17333984375, 9.943359375, 10.71337890625, 11.4833984375, 12.25341796875, 13.0234375, 13.79345703125, 14.5634765625, 15.33349609375, 16.103515625, 16.87353515625, 17.6435546875, 18.41357421875, 19.18359375, 19.95361328125, 20.7236328125, 21.49365234375, 22.263671875, 23.03369140625, 23.8037109375, 24.57373046875, 25.34375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 11.0, 10.0, 21.0, 43.0, 69.0, 85.0, 136.0, 190.0, 311.0, 530.0, 797.0, 1229.0, 1877.0, 2947.0, 4709.0, 7379.0, 11361.0, 17389.0, 26345.0, 38745.0, 55218.0, 73798.0, 93523.0, 110313.0, 117332.0, 113864.0, 99359.0, 80168.0, 60990.0, 43744.0, 29826.0, 19867.0, 13050.0, 8420.0, 5357.0, 3420.0, 2232.0, 1363.0, 906.0, 577.0, 363.0, 247.0, 145.0, 110.0, 60.0, 40.0, 37.0, 8.0, 11.0, 5.0, 8.0, 2.0, 5.0, 3.0], "bins": [-26.6875, -25.91748046875, -25.1474609375, -24.37744140625, -23.607421875, -22.83740234375, -22.0673828125, -21.29736328125, -20.52734375, -19.75732421875, -18.9873046875, -18.21728515625, -17.447265625, -16.67724609375, -15.9072265625, -15.13720703125, -14.3671875, -13.59716796875, -12.8271484375, -12.05712890625, -11.287109375, -10.51708984375, -9.7470703125, -8.97705078125, -8.20703125, -7.43701171875, -6.6669921875, -5.89697265625, -5.126953125, -4.35693359375, -3.5869140625, -2.81689453125, -2.046875, -1.27685546875, -0.5068359375, 0.26318359375, 1.033203125, 1.80322265625, 2.5732421875, 3.34326171875, 4.11328125, 4.88330078125, 5.6533203125, 6.42333984375, 7.193359375, 7.96337890625, 8.7333984375, 9.50341796875, 10.2734375, 11.04345703125, 11.8134765625, 12.58349609375, 13.353515625, 14.12353515625, 14.8935546875, 15.66357421875, 16.43359375, 17.20361328125, 17.9736328125, 18.74365234375, 19.513671875, 20.28369140625, 21.0537109375, 21.82373046875, 22.59375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 6.0, 9.0, 7.0, 14.0, 10.0, 14.0, 14.0, 19.0, 16.0, 25.0, 27.0, 26.0, 25.0, 26.0, 29.0, 33.0, 31.0, 35.0, 47.0, 52.0, 39.0, 31.0, 29.0, 47.0, 33.0, 34.0, 40.0, 26.0, 34.0, 26.0, 28.0, 33.0, 19.0, 15.0, 16.0, 14.0, 13.0, 9.0, 4.0, 11.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0], "bins": [-17.203125, -16.697265625, -16.19140625, -15.685546875, -15.1796875, -14.673828125, -14.16796875, -13.662109375, -13.15625, -12.650390625, -12.14453125, -11.638671875, -11.1328125, -10.626953125, -10.12109375, -9.615234375, -9.109375, -8.603515625, -8.09765625, -7.591796875, -7.0859375, -6.580078125, -6.07421875, -5.568359375, -5.0625, -4.556640625, -4.05078125, -3.544921875, -3.0390625, -2.533203125, -2.02734375, -1.521484375, -1.015625, -0.509765625, -0.00390625, 0.501953125, 1.0078125, 1.513671875, 2.01953125, 2.525390625, 3.03125, 3.537109375, 4.04296875, 4.548828125, 5.0546875, 5.560546875, 6.06640625, 6.572265625, 7.078125, 7.583984375, 8.08984375, 8.595703125, 9.1015625, 9.607421875, 10.11328125, 10.619140625, 11.125, 11.630859375, 12.13671875, 12.642578125, 13.1484375, 13.654296875, 14.16015625, 14.666015625, 15.171875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 1.0, 8.0, 7.0, 7.0, 12.0, 23.0, 29.0, 45.0, 70.0, 82.0, 127.0, 147.0, 279.0, 386.0, 583.0, 879.0, 1357.0, 2179.0, 3604.0, 6189.0, 10691.0, 18804.0, 34640.0, 64264.0, 117155.0, 183905.0, 214154.0, 166369.0, 99603.0, 54325.0, 29282.0, 16168.0, 9121.0, 5435.0, 3224.0, 1806.0, 1230.0, 750.0, 555.0, 343.0, 245.0, 165.0, 102.0, 55.0, 44.0, 34.0, 23.0, 26.0, 11.0, 7.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.609375, -16.9658203125, -16.322265625, -15.6787109375, -15.03515625, -14.3916015625, -13.748046875, -13.1044921875, -12.4609375, -11.8173828125, -11.173828125, -10.5302734375, -9.88671875, -9.2431640625, -8.599609375, -7.9560546875, -7.3125, -6.6689453125, -6.025390625, -5.3818359375, -4.73828125, -4.0947265625, -3.451171875, -2.8076171875, -2.1640625, -1.5205078125, -0.876953125, -0.2333984375, 0.41015625, 1.0537109375, 1.697265625, 2.3408203125, 2.984375, 3.6279296875, 4.271484375, 4.9150390625, 5.55859375, 6.2021484375, 6.845703125, 7.4892578125, 8.1328125, 8.7763671875, 9.419921875, 10.0634765625, 10.70703125, 11.3505859375, 11.994140625, 12.6376953125, 13.28125, 13.9248046875, 14.568359375, 15.2119140625, 15.85546875, 16.4990234375, 17.142578125, 17.7861328125, 18.4296875, 19.0732421875, 19.716796875, 20.3603515625, 21.00390625, 21.6474609375, 22.291015625, 22.9345703125, 23.578125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 5.0, 8.0, 13.0, 13.0, 28.0, 28.0, 38.0, 66.0, 64.0, 96.0, 97.0, 95.0, 95.0, 82.0, 60.0, 46.0, 39.0, 30.0, 24.0, 15.0, 10.0, 12.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0028324127197265625, -0.0027543604373931885, -0.0026763081550598145, -0.0025982558727264404, -0.0025202035903930664, -0.0024421513080596924, -0.0023640990257263184, -0.0022860467433929443, -0.0022079944610595703, -0.0021299421787261963, -0.0020518898963928223, -0.0019738376140594482, -0.0018957853317260742, -0.0018177330493927002, -0.0017396807670593262, -0.0016616284847259521, -0.0015835762023925781, -0.001505523920059204, -0.00142747163772583, -0.001349419355392456, -0.001271367073059082, -0.001193314790725708, -0.001115262508392334, -0.00103721022605896, -0.0009591579437255859, -0.0008811056613922119, -0.0008030533790588379, -0.0007250010967254639, -0.0006469488143920898, -0.0005688965320587158, -0.0004908442497253418, -0.0004127919673919678, -0.00033473968505859375, -0.0002566874027252197, -0.0001786351203918457, -0.00010058283805847168, -2.2530555725097656e-05, 5.552172660827637e-05, 0.0001335740089416504, 0.00021162629127502441, 0.00028967857360839844, 0.00036773085594177246, 0.0004457831382751465, 0.0005238354206085205, 0.0006018877029418945, 0.0006799399852752686, 0.0007579922676086426, 0.0008360445499420166, 0.0009140968322753906, 0.0009921491146087646, 0.0010702013969421387, 0.0011482536792755127, 0.0012263059616088867, 0.0013043582439422607, 0.0013824105262756348, 0.0014604628086090088, 0.0015385150909423828, 0.0016165673732757568, 0.0016946196556091309, 0.0017726719379425049, 0.001850724220275879, 0.001928776502609253, 0.002006828784942627, 0.002084881067276001, 0.002162933349609375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 16.0, 16.0, 25.0, 43.0, 80.0, 101.0, 126.0, 229.0, 404.0, 553.0, 910.0, 1480.0, 2442.0, 4008.0, 6775.0, 11900.0, 21121.0, 37522.0, 65955.0, 107523.0, 153300.0, 179084.0, 162638.0, 118350.0, 73744.0, 43115.0, 24049.0, 13618.0, 7788.0, 4484.0, 2716.0, 1628.0, 1007.0, 657.0, 420.0, 237.0, 165.0, 96.0, 77.0, 38.0, 33.0, 14.0, 20.0, 17.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.015625, -14.525146484375, -14.03466796875, -13.544189453125, -13.0537109375, -12.563232421875, -12.07275390625, -11.582275390625, -11.091796875, -10.601318359375, -10.11083984375, -9.620361328125, -9.1298828125, -8.639404296875, -8.14892578125, -7.658447265625, -7.16796875, -6.677490234375, -6.18701171875, -5.696533203125, -5.2060546875, -4.715576171875, -4.22509765625, -3.734619140625, -3.244140625, -2.753662109375, -2.26318359375, -1.772705078125, -1.2822265625, -0.791748046875, -0.30126953125, 0.189208984375, 0.6796875, 1.170166015625, 1.66064453125, 2.151123046875, 2.6416015625, 3.132080078125, 3.62255859375, 4.113037109375, 4.603515625, 5.093994140625, 5.58447265625, 6.074951171875, 6.5654296875, 7.055908203125, 7.54638671875, 8.036865234375, 8.52734375, 9.017822265625, 9.50830078125, 9.998779296875, 10.4892578125, 10.979736328125, 11.47021484375, 11.960693359375, 12.451171875, 12.941650390625, 13.43212890625, 13.922607421875, 14.4130859375, 14.903564453125, 15.39404296875, 15.884521484375, 16.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 0.0, 8.0, 9.0, 6.0, 13.0, 12.0, 18.0, 19.0, 20.0, 23.0, 29.0, 27.0, 44.0, 47.0, 61.0, 60.0, 51.0, 51.0, 55.0, 44.0, 47.0, 73.0, 44.0, 40.0, 39.0, 28.0, 28.0, 19.0, 21.0, 10.0, 12.0, 5.0, 3.0, 11.0, 4.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-7.45703125, -7.2685546875, -7.080078125, -6.8916015625, -6.703125, -6.5146484375, -6.326171875, -6.1376953125, -5.94921875, -5.7607421875, -5.572265625, -5.3837890625, -5.1953125, -5.0068359375, -4.818359375, -4.6298828125, -4.44140625, -4.2529296875, -4.064453125, -3.8759765625, -3.6875, -3.4990234375, -3.310546875, -3.1220703125, -2.93359375, -2.7451171875, -2.556640625, -2.3681640625, -2.1796875, -1.9912109375, -1.802734375, -1.6142578125, -1.42578125, -1.2373046875, -1.048828125, -0.8603515625, -0.671875, -0.4833984375, -0.294921875, -0.1064453125, 0.08203125, 0.2705078125, 0.458984375, 0.6474609375, 0.8359375, 1.0244140625, 1.212890625, 1.4013671875, 1.58984375, 1.7783203125, 1.966796875, 2.1552734375, 2.34375, 2.5322265625, 2.720703125, 2.9091796875, 3.09765625, 3.2861328125, 3.474609375, 3.6630859375, 3.8515625, 4.0400390625, 4.228515625, 4.4169921875, 4.60546875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 8.0, 7.0, 18.0, 10.0, 21.0, 15.0, 16.0, 28.0, 38.0, 47.0, 45.0, 53.0, 62.0, 51.0, 54.0, 43.0, 51.0, 55.0, 59.0, 46.0, 42.0, 41.0, 46.0, 23.0, 29.0, 22.0, 15.0, 12.0, 12.0, 12.0, 6.0, 7.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.955902099609375, -32.97262954711914, -31.98935317993164, -31.006078720092773, -30.022804260253906, -29.039531707763672, -28.056257247924805, -27.072982788085938, -26.08970832824707, -25.106433868408203, -24.123159408569336, -23.13988494873047, -22.156612396240234, -21.173336029052734, -20.1900634765625, -19.206789016723633, -18.223514556884766, -17.2402400970459, -16.25696563720703, -15.27369213104248, -14.290417671203613, -13.307143211364746, -12.323869705200195, -11.340595245361328, -10.357320785522461, -9.374046325683594, -8.390771865844727, -7.407498359680176, -6.424223899841309, -5.440949440002441, -4.457675457000732, -3.4744014739990234, -2.4911270141601562, -1.5078527927398682, -0.5245785713195801, 0.458695650100708, 1.441969871520996, 2.4252443313598633, 3.4085183143615723, 4.391792297363281, 5.375066757202148, 6.358341217041016, 7.341615200042725, 8.324889183044434, 9.3081636428833, 10.291438102722168, 11.274711608886719, 12.257986068725586, 13.241260528564453, 14.22453498840332, 15.207809448242188, 16.191083908081055, 17.174358367919922, 18.157630920410156, 19.140905380249023, 20.12417984008789, 21.107454299926758, 22.090728759765625, 23.074003219604492, 24.05727767944336, 25.040550231933594, 26.023826599121094, 27.007099151611328, 27.990373611450195, 28.973648071289062]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 12.0, 16.0, 10.0, 14.0, 20.0, 22.0, 33.0, 26.0, 20.0, 29.0, 29.0, 31.0, 32.0, 45.0, 43.0, 41.0, 37.0, 32.0, 40.0, 32.0, 36.0, 32.0, 35.0, 36.0, 27.0, 33.0, 28.0, 28.0, 32.0, 12.0, 20.0, 15.0, 19.0, 14.0, 17.0, 7.0, 9.0, 3.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.039749145507812, -26.171367645263672, -25.30298614501953, -24.43460464477539, -23.566221237182617, -22.697839736938477, -21.829458236694336, -20.961076736450195, -20.092693328857422, -19.22431182861328, -18.35593032836914, -17.487548828125, -16.619165420532227, -15.750783920288086, -14.882402420043945, -14.014020919799805, -13.145639419555664, -12.277257919311523, -11.408875465393066, -10.540493965148926, -9.672111511230469, -8.803730010986328, -7.9353485107421875, -7.066966533660889, -6.19858455657959, -5.330202579498291, -4.461820602416992, -3.5934391021728516, -2.7250571250915527, -1.856675148010254, -0.9882936477661133, -0.11991167068481445, 0.7484683990478516, 1.6168502569198608, 2.48523211479187, 3.35361385345459, 4.221995830535889, 5.0903778076171875, 5.958759307861328, 6.827141284942627, 7.695523262023926, 8.563904762268066, 9.432287216186523, 10.300668716430664, 11.169050216674805, 12.037432670593262, 12.905814170837402, 13.77419662475586, 14.642578125, 15.51095962524414, 16.37934112548828, 17.247722625732422, 18.116106033325195, 18.984487533569336, 19.852869033813477, 20.721250534057617, 21.58963394165039, 22.45801544189453, 23.326396942138672, 24.194778442382812, 25.063161849975586, 25.931543350219727, 26.799924850463867, 27.668306350708008, 28.53668785095215]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 17.0, 26.0, 57.0, 80.0, 130.0, 213.0, 355.0, 682.0, 1154.0, 1933.0, 3472.0, 6186.0, 11442.0, 21141.0, 39655.0, 74094.0, 135711.0, 246564.0, 419776.0, 624995.0, 750695.0, 687072.0, 496261.0, 303845.0, 170197.0, 91831.0, 49177.0, 26129.0, 14114.0, 7576.0, 4240.0, 2299.0, 1323.0, 765.0, 423.0, 259.0, 160.0, 96.0, 42.0, 38.0, 23.0, 8.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.9375, -23.18212890625, -22.4267578125, -21.67138671875, -20.916015625, -20.16064453125, -19.4052734375, -18.64990234375, -17.89453125, -17.13916015625, -16.3837890625, -15.62841796875, -14.873046875, -14.11767578125, -13.3623046875, -12.60693359375, -11.8515625, -11.09619140625, -10.3408203125, -9.58544921875, -8.830078125, -8.07470703125, -7.3193359375, -6.56396484375, -5.80859375, -5.05322265625, -4.2978515625, -3.54248046875, -2.787109375, -2.03173828125, -1.2763671875, -0.52099609375, 0.234375, 0.98974609375, 1.7451171875, 2.50048828125, 3.255859375, 4.01123046875, 4.7666015625, 5.52197265625, 6.27734375, 7.03271484375, 7.7880859375, 8.54345703125, 9.298828125, 10.05419921875, 10.8095703125, 11.56494140625, 12.3203125, 13.07568359375, 13.8310546875, 14.58642578125, 15.341796875, 16.09716796875, 16.8525390625, 17.60791015625, 18.36328125, 19.11865234375, 19.8740234375, 20.62939453125, 21.384765625, 22.14013671875, 22.8955078125, 23.65087890625, 24.40625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 13.0, 8.0, 15.0, 14.0, 32.0, 23.0, 17.0, 36.0, 28.0, 25.0, 40.0, 29.0, 37.0, 48.0, 42.0, 40.0, 41.0, 49.0, 21.0, 42.0, 44.0, 42.0, 23.0, 44.0, 35.0, 27.0, 24.0, 17.0, 24.0, 28.0, 12.0, 14.0, 12.0, 16.0, 7.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.15625, -18.499267578125, -17.84228515625, -17.185302734375, -16.5283203125, -15.871337890625, -15.21435546875, -14.557373046875, -13.900390625, -13.243408203125, -12.58642578125, -11.929443359375, -11.2724609375, -10.615478515625, -9.95849609375, -9.301513671875, -8.64453125, -7.987548828125, -7.33056640625, -6.673583984375, -6.0166015625, -5.359619140625, -4.70263671875, -4.045654296875, -3.388671875, -2.731689453125, -2.07470703125, -1.417724609375, -0.7607421875, -0.103759765625, 0.55322265625, 1.210205078125, 1.8671875, 2.524169921875, 3.18115234375, 3.838134765625, 4.4951171875, 5.152099609375, 5.80908203125, 6.466064453125, 7.123046875, 7.780029296875, 8.43701171875, 9.093994140625, 9.7509765625, 10.407958984375, 11.06494140625, 11.721923828125, 12.37890625, 13.035888671875, 13.69287109375, 14.349853515625, 15.0068359375, 15.663818359375, 16.32080078125, 16.977783203125, 17.634765625, 18.291748046875, 18.94873046875, 19.605712890625, 20.2626953125, 20.919677734375, 21.57666015625, 22.233642578125, 22.890625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 10.0, 4.0, 10.0, 22.0, 37.0, 42.0, 86.0, 136.0, 192.0, 328.0, 521.0, 853.0, 1308.0, 2192.0, 3682.0, 5945.0, 9996.0, 16604.0, 27200.0, 45516.0, 73672.0, 116903.0, 180330.0, 265677.0, 370794.0, 472921.0, 536853.0, 531704.0, 460808.0, 358341.0, 254634.0, 170504.0, 110288.0, 68931.0, 42250.0, 25989.0, 15545.0, 9203.0, 5531.0, 3412.0, 2014.0, 1275.0, 773.0, 465.0, 275.0, 198.0, 121.0, 73.0, 42.0, 31.0, 17.0, 16.0, 10.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-17.484375, -16.919189453125, -16.35400390625, -15.788818359375, -15.2236328125, -14.658447265625, -14.09326171875, -13.528076171875, -12.962890625, -12.397705078125, -11.83251953125, -11.267333984375, -10.7021484375, -10.136962890625, -9.57177734375, -9.006591796875, -8.44140625, -7.876220703125, -7.31103515625, -6.745849609375, -6.1806640625, -5.615478515625, -5.05029296875, -4.485107421875, -3.919921875, -3.354736328125, -2.78955078125, -2.224365234375, -1.6591796875, -1.093994140625, -0.52880859375, 0.036376953125, 0.6015625, 1.166748046875, 1.73193359375, 2.297119140625, 2.8623046875, 3.427490234375, 3.99267578125, 4.557861328125, 5.123046875, 5.688232421875, 6.25341796875, 6.818603515625, 7.3837890625, 7.948974609375, 8.51416015625, 9.079345703125, 9.64453125, 10.209716796875, 10.77490234375, 11.340087890625, 11.9052734375, 12.470458984375, 13.03564453125, 13.600830078125, 14.166015625, 14.731201171875, 15.29638671875, 15.861572265625, 16.4267578125, 16.991943359375, 17.55712890625, 18.122314453125, 18.6875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 9.0, 7.0, 10.0, 10.0, 7.0, 13.0, 21.0, 31.0, 34.0, 34.0, 34.0, 78.0, 75.0, 98.0, 104.0, 139.0, 158.0, 183.0, 200.0, 207.0, 231.0, 224.0, 238.0, 209.0, 222.0, 198.0, 186.0, 166.0, 144.0, 130.0, 124.0, 103.0, 87.0, 72.0, 61.0, 46.0, 37.0, 31.0, 27.0, 26.0, 12.0, 8.0, 17.0, 3.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.810302734375, -7.52685546875, -7.243408203125, -6.9599609375, -6.676513671875, -6.39306640625, -6.109619140625, -5.826171875, -5.542724609375, -5.25927734375, -4.975830078125, -4.6923828125, -4.408935546875, -4.12548828125, -3.842041015625, -3.55859375, -3.275146484375, -2.99169921875, -2.708251953125, -2.4248046875, -2.141357421875, -1.85791015625, -1.574462890625, -1.291015625, -1.007568359375, -0.72412109375, -0.440673828125, -0.1572265625, 0.126220703125, 0.40966796875, 0.693115234375, 0.9765625, 1.260009765625, 1.54345703125, 1.826904296875, 2.1103515625, 2.393798828125, 2.67724609375, 2.960693359375, 3.244140625, 3.527587890625, 3.81103515625, 4.094482421875, 4.3779296875, 4.661376953125, 4.94482421875, 5.228271484375, 5.51171875, 5.795166015625, 6.07861328125, 6.362060546875, 6.6455078125, 6.928955078125, 7.21240234375, 7.495849609375, 7.779296875, 8.062744140625, 8.34619140625, 8.629638671875, 8.9130859375, 9.196533203125, 9.47998046875, 9.763427734375, 10.046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 2.0, 10.0, 11.0, 11.0, 15.0, 15.0, 10.0, 24.0, 25.0, 31.0, 29.0, 42.0, 47.0, 53.0, 53.0, 31.0, 43.0, 46.0, 53.0, 59.0, 54.0, 46.0, 45.0, 38.0, 28.0, 23.0, 25.0, 21.0, 19.0, 17.0, 10.0, 19.0, 9.0, 3.0, 4.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.62458610534668, -22.894315719604492, -22.164047241210938, -21.43377685546875, -20.703506469726562, -19.973236083984375, -19.242965698242188, -18.512697219848633, -17.782426834106445, -17.052156448364258, -16.321887969970703, -15.591617584228516, -14.861347198486328, -14.13107681274414, -13.40080738067627, -12.670537948608398, -11.940267562866211, -11.209997177124023, -10.479727745056152, -9.749458312988281, -9.019187927246094, -8.288917541503906, -7.558648109436035, -6.828378200531006, -6.098108291625977, -5.367838382720947, -4.637568473815918, -3.9072985649108887, -3.1770286560058594, -2.44675874710083, -1.7164888381958008, -0.9862189292907715, -0.2559471130371094, 0.4743227958679199, 1.2045927047729492, 1.9348626136779785, 2.665132522583008, 3.395402431488037, 4.125672340393066, 4.855942249298096, 5.586212158203125, 6.316482067108154, 7.046751976013184, 7.777021884918213, 8.507291793823242, 9.23756217956543, 9.9678316116333, 10.698101043701172, 11.42837142944336, 12.158641815185547, 12.888911247253418, 13.619180679321289, 14.349451065063477, 15.079721450805664, 15.809990882873535, 16.540260314941406, 17.270530700683594, 18.00080108642578, 18.73107147216797, 19.461339950561523, 20.19161033630371, 20.9218807220459, 21.652149200439453, 22.38241958618164, 23.112689971923828]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 9.0, 10.0, 14.0, 17.0, 13.0, 17.0, 18.0, 30.0, 32.0, 32.0, 31.0, 39.0, 29.0, 30.0, 39.0, 36.0, 33.0, 45.0, 33.0, 38.0, 45.0, 36.0, 47.0, 30.0, 36.0, 26.0, 34.0, 26.0, 25.0, 17.0, 18.0, 9.0, 21.0, 13.0, 12.0, 10.0, 9.0, 9.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.705747604370117, -21.97810935974121, -21.250471115112305, -20.5228328704834, -19.795194625854492, -19.067556381225586, -18.339920043945312, -17.612281799316406, -16.8846435546875, -16.157005310058594, -15.429367065429688, -14.701728820800781, -13.974090576171875, -13.246452331542969, -12.518815040588379, -11.791176795959473, -11.06353759765625, -10.335899353027344, -9.608261108398438, -8.880622863769531, -8.152984619140625, -7.425346851348877, -6.697709083557129, -5.970070838928223, -5.242432594299316, -4.51479434967041, -3.787156343460083, -3.059518337249756, -2.3318800926208496, -1.6042418479919434, -0.8766040802001953, -0.14896583557128906, 0.5786724090576172, 1.3063105344772339, 2.0339486598968506, 2.7615866661071777, 3.489224910736084, 4.21686315536499, 4.944500923156738, 5.6721391677856445, 6.399777412414551, 7.127415657043457, 7.855053901672363, 8.582691192626953, 9.31032943725586, 10.037967681884766, 10.765605926513672, 11.493244171142578, 12.220882415771484, 12.94852066040039, 13.676158905029297, 14.403797149658203, 15.13143539428711, 15.859073638916016, 16.586711883544922, 17.314350128173828, 18.041988372802734, 18.76962661743164, 19.497264862060547, 20.224903106689453, 20.95254135131836, 21.680179595947266, 22.407817840576172, 23.135456085205078, 23.86309242248535]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 14.0, 11.0, 27.0, 25.0, 59.0, 105.0, 166.0, 260.0, 403.0, 615.0, 985.0, 1531.0, 2534.0, 4236.0, 7005.0, 11554.0, 19133.0, 32257.0, 53553.0, 87318.0, 134627.0, 179745.0, 175950.0, 127904.0, 82883.0, 50149.0, 29833.0, 17894.0, 10842.0, 6535.0, 3926.0, 2496.0, 1486.0, 920.0, 620.0, 345.0, 239.0, 127.0, 94.0, 55.0, 33.0, 24.0, 12.0, 10.0, 7.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.828125, -19.207275390625, -18.58642578125, -17.965576171875, -17.3447265625, -16.723876953125, -16.10302734375, -15.482177734375, -14.861328125, -14.240478515625, -13.61962890625, -12.998779296875, -12.3779296875, -11.757080078125, -11.13623046875, -10.515380859375, -9.89453125, -9.273681640625, -8.65283203125, -8.031982421875, -7.4111328125, -6.790283203125, -6.16943359375, -5.548583984375, -4.927734375, -4.306884765625, -3.68603515625, -3.065185546875, -2.4443359375, -1.823486328125, -1.20263671875, -0.581787109375, 0.0390625, 0.659912109375, 1.28076171875, 1.901611328125, 2.5224609375, 3.143310546875, 3.76416015625, 4.385009765625, 5.005859375, 5.626708984375, 6.24755859375, 6.868408203125, 7.4892578125, 8.110107421875, 8.73095703125, 9.351806640625, 9.97265625, 10.593505859375, 11.21435546875, 11.835205078125, 12.4560546875, 13.076904296875, 13.69775390625, 14.318603515625, 14.939453125, 15.560302734375, 16.18115234375, 16.802001953125, 17.4228515625, 18.043701171875, 18.66455078125, 19.285400390625, 19.90625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 5.0, 9.0, 9.0, 15.0, 17.0, 11.0, 18.0, 18.0, 25.0, 28.0, 31.0, 26.0, 24.0, 40.0, 32.0, 40.0, 36.0, 31.0, 37.0, 46.0, 39.0, 44.0, 34.0, 36.0, 43.0, 31.0, 39.0, 37.0, 25.0, 29.0, 19.0, 13.0, 17.0, 14.0, 17.0, 13.0, 13.0, 9.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0], "bins": [-23.03125, -22.304443359375, -21.57763671875, -20.850830078125, -20.1240234375, -19.397216796875, -18.67041015625, -17.943603515625, -17.216796875, -16.489990234375, -15.76318359375, -15.036376953125, -14.3095703125, -13.582763671875, -12.85595703125, -12.129150390625, -11.40234375, -10.675537109375, -9.94873046875, -9.221923828125, -8.4951171875, -7.768310546875, -7.04150390625, -6.314697265625, -5.587890625, -4.861083984375, -4.13427734375, -3.407470703125, -2.6806640625, -1.953857421875, -1.22705078125, -0.500244140625, 0.2265625, 0.953369140625, 1.68017578125, 2.406982421875, 3.1337890625, 3.860595703125, 4.58740234375, 5.314208984375, 6.041015625, 6.767822265625, 7.49462890625, 8.221435546875, 8.9482421875, 9.675048828125, 10.40185546875, 11.128662109375, 11.85546875, 12.582275390625, 13.30908203125, 14.035888671875, 14.7626953125, 15.489501953125, 16.21630859375, 16.943115234375, 17.669921875, 18.396728515625, 19.12353515625, 19.850341796875, 20.5771484375, 21.303955078125, 22.03076171875, 22.757568359375, 23.484375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 11.0, 10.0, 19.0, 27.0, 34.0, 60.0, 104.0, 142.0, 206.0, 331.0, 631.0, 1050.0, 1897.0, 3644.0, 7117.0, 14599.0, 31527.0, 70930.0, 161243.0, 293229.0, 246761.0, 117741.0, 51365.0, 23129.0, 10805.0, 5460.0, 2810.0, 1512.0, 872.0, 492.0, 304.0, 183.0, 94.0, 70.0, 40.0, 25.0, 21.0, 16.0, 10.0, 8.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.09375, -20.408935546875, -19.72412109375, -19.039306640625, -18.3544921875, -17.669677734375, -16.98486328125, -16.300048828125, -15.615234375, -14.930419921875, -14.24560546875, -13.560791015625, -12.8759765625, -12.191162109375, -11.50634765625, -10.821533203125, -10.13671875, -9.451904296875, -8.76708984375, -8.082275390625, -7.3974609375, -6.712646484375, -6.02783203125, -5.343017578125, -4.658203125, -3.973388671875, -3.28857421875, -2.603759765625, -1.9189453125, -1.234130859375, -0.54931640625, 0.135498046875, 0.8203125, 1.505126953125, 2.18994140625, 2.874755859375, 3.5595703125, 4.244384765625, 4.92919921875, 5.614013671875, 6.298828125, 6.983642578125, 7.66845703125, 8.353271484375, 9.0380859375, 9.722900390625, 10.40771484375, 11.092529296875, 11.77734375, 12.462158203125, 13.14697265625, 13.831787109375, 14.5166015625, 15.201416015625, 15.88623046875, 16.571044921875, 17.255859375, 17.940673828125, 18.62548828125, 19.310302734375, 19.9951171875, 20.679931640625, 21.36474609375, 22.049560546875, 22.734375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 9.0, 10.0, 7.0, 15.0, 15.0, 17.0, 25.0, 21.0, 29.0, 20.0, 24.0, 34.0, 25.0, 35.0, 42.0, 37.0, 43.0, 40.0, 40.0, 49.0, 43.0, 37.0, 38.0, 38.0, 25.0, 38.0, 36.0, 30.0, 33.0, 15.0, 9.0, 28.0, 14.0, 10.0, 11.0, 13.0, 12.0, 4.0, 4.0, 3.0, 2.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.580322265625, -17.98876953125, -17.397216796875, -16.8056640625, -16.214111328125, -15.62255859375, -15.031005859375, -14.439453125, -13.847900390625, -13.25634765625, -12.664794921875, -12.0732421875, -11.481689453125, -10.89013671875, -10.298583984375, -9.70703125, -9.115478515625, -8.52392578125, -7.932373046875, -7.3408203125, -6.749267578125, -6.15771484375, -5.566162109375, -4.974609375, -4.383056640625, -3.79150390625, -3.199951171875, -2.6083984375, -2.016845703125, -1.42529296875, -0.833740234375, -0.2421875, 0.349365234375, 0.94091796875, 1.532470703125, 2.1240234375, 2.715576171875, 3.30712890625, 3.898681640625, 4.490234375, 5.081787109375, 5.67333984375, 6.264892578125, 6.8564453125, 7.447998046875, 8.03955078125, 8.631103515625, 9.22265625, 9.814208984375, 10.40576171875, 10.997314453125, 11.5888671875, 12.180419921875, 12.77197265625, 13.363525390625, 13.955078125, 14.546630859375, 15.13818359375, 15.729736328125, 16.3212890625, 16.912841796875, 17.50439453125, 18.095947265625, 18.6875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 8.0, 7.0, 5.0, 8.0, 21.0, 22.0, 22.0, 43.0, 67.0, 93.0, 103.0, 167.0, 221.0, 391.0, 664.0, 1172.0, 2426.0, 5469.0, 15441.0, 66065.0, 589396.0, 308903.0, 38723.0, 10571.0, 4143.0, 1840.0, 947.0, 539.0, 327.0, 234.0, 167.0, 94.0, 76.0, 44.0, 31.0, 31.0, 25.0, 15.0, 10.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.53125, -28.632080078125, -27.73291015625, -26.833740234375, -25.9345703125, -25.035400390625, -24.13623046875, -23.237060546875, -22.337890625, -21.438720703125, -20.53955078125, -19.640380859375, -18.7412109375, -17.842041015625, -16.94287109375, -16.043701171875, -15.14453125, -14.245361328125, -13.34619140625, -12.447021484375, -11.5478515625, -10.648681640625, -9.74951171875, -8.850341796875, -7.951171875, -7.052001953125, -6.15283203125, -5.253662109375, -4.3544921875, -3.455322265625, -2.55615234375, -1.656982421875, -0.7578125, 0.141357421875, 1.04052734375, 1.939697265625, 2.8388671875, 3.738037109375, 4.63720703125, 5.536376953125, 6.435546875, 7.334716796875, 8.23388671875, 9.133056640625, 10.0322265625, 10.931396484375, 11.83056640625, 12.729736328125, 13.62890625, 14.528076171875, 15.42724609375, 16.326416015625, 17.2255859375, 18.124755859375, 19.02392578125, 19.923095703125, 20.822265625, 21.721435546875, 22.62060546875, 23.519775390625, 24.4189453125, 25.318115234375, 26.21728515625, 27.116455078125, 28.015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 5.0, 6.0, 13.0, 8.0, 21.0, 20.0, 40.0, 44.0, 80.0, 113.0, 133.0, 161.0, 108.0, 72.0, 42.0, 34.0, 19.0, 21.0, 13.0, 9.0, 10.0, 4.0, 9.0, 2.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019989013671875, -0.0019301772117614746, -0.0018614530563354492, -0.0017927289009094238, -0.0017240047454833984, -0.001655280590057373, -0.0015865564346313477, -0.0015178322792053223, -0.0014491081237792969, -0.0013803839683532715, -0.001311659812927246, -0.0012429356575012207, -0.0011742115020751953, -0.00110548734664917, -0.0010367631912231445, -0.0009680390357971191, -0.0008993148803710938, -0.0008305907249450684, -0.000761866569519043, -0.0006931424140930176, -0.0006244182586669922, -0.0005556941032409668, -0.0004869699478149414, -0.000418245792388916, -0.0003495216369628906, -0.00028079748153686523, -0.00021207332611083984, -0.00014334917068481445, -7.462501525878906e-05, -5.900859832763672e-06, 6.282329559326172e-05, 0.0001315474510192871, 0.0002002716064453125, 0.0002689957618713379, 0.0003377199172973633, 0.00040644407272338867, 0.00047516822814941406, 0.0005438923835754395, 0.0006126165390014648, 0.0006813406944274902, 0.0007500648498535156, 0.000818789005279541, 0.0008875131607055664, 0.0009562373161315918, 0.0010249614715576172, 0.0010936856269836426, 0.001162409782409668, 0.0012311339378356934, 0.0012998580932617188, 0.0013685822486877441, 0.0014373064041137695, 0.001506030559539795, 0.0015747547149658203, 0.0016434788703918457, 0.001712203025817871, 0.0017809271812438965, 0.0018496513366699219, 0.0019183754920959473, 0.0019870996475219727, 0.002055823802947998, 0.0021245479583740234, 0.002193272113800049, 0.0022619962692260742, 0.0023307204246520996, 0.002399444580078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 13.0, 8.0, 20.0, 30.0, 43.0, 62.0, 71.0, 126.0, 193.0, 297.0, 413.0, 623.0, 982.0, 1499.0, 2420.0, 4065.0, 6890.0, 12715.0, 26633.0, 63738.0, 171710.0, 345629.0, 242402.0, 93016.0, 36565.0, 16804.0, 8566.0, 5020.0, 2899.0, 1758.0, 1131.0, 760.0, 495.0, 341.0, 205.0, 132.0, 94.0, 59.0, 43.0, 23.0, 23.0, 14.0, 13.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.0728759765625, -14.528564453125, -13.9842529296875, -13.43994140625, -12.8956298828125, -12.351318359375, -11.8070068359375, -11.2626953125, -10.7183837890625, -10.174072265625, -9.6297607421875, -9.08544921875, -8.5411376953125, -7.996826171875, -7.4525146484375, -6.908203125, -6.3638916015625, -5.819580078125, -5.2752685546875, -4.73095703125, -4.1866455078125, -3.642333984375, -3.0980224609375, -2.5537109375, -2.0093994140625, -1.465087890625, -0.9207763671875, -0.37646484375, 0.1678466796875, 0.712158203125, 1.2564697265625, 1.80078125, 2.3450927734375, 2.889404296875, 3.4337158203125, 3.97802734375, 4.5223388671875, 5.066650390625, 5.6109619140625, 6.1552734375, 6.6995849609375, 7.243896484375, 7.7882080078125, 8.33251953125, 8.8768310546875, 9.421142578125, 9.9654541015625, 10.509765625, 11.0540771484375, 11.598388671875, 12.1427001953125, 12.68701171875, 13.2313232421875, 13.775634765625, 14.3199462890625, 14.8642578125, 15.4085693359375, 15.952880859375, 16.4971923828125, 17.04150390625, 17.5858154296875, 18.130126953125, 18.6744384765625, 19.21875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 10.0, 8.0, 8.0, 16.0, 19.0, 30.0, 44.0, 45.0, 66.0, 78.0, 105.0, 103.0, 102.0, 75.0, 63.0, 56.0, 38.0, 24.0, 16.0, 13.0, 11.0, 7.0, 9.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.6484375, -6.4447021484375, -6.240966796875, -6.0372314453125, -5.83349609375, -5.6297607421875, -5.426025390625, -5.2222900390625, -5.0185546875, -4.8148193359375, -4.611083984375, -4.4073486328125, -4.20361328125, -3.9998779296875, -3.796142578125, -3.5924072265625, -3.388671875, -3.1849365234375, -2.981201171875, -2.7774658203125, -2.57373046875, -2.3699951171875, -2.166259765625, -1.9625244140625, -1.7587890625, -1.5550537109375, -1.351318359375, -1.1475830078125, -0.94384765625, -0.7401123046875, -0.536376953125, -0.3326416015625, -0.12890625, 0.0748291015625, 0.278564453125, 0.4822998046875, 0.68603515625, 0.8897705078125, 1.093505859375, 1.2972412109375, 1.5009765625, 1.7047119140625, 1.908447265625, 2.1121826171875, 2.31591796875, 2.5196533203125, 2.723388671875, 2.9271240234375, 3.130859375, 3.3345947265625, 3.538330078125, 3.7420654296875, 3.94580078125, 4.1495361328125, 4.353271484375, 4.5570068359375, 4.7607421875, 4.9644775390625, 5.168212890625, 5.3719482421875, 5.57568359375, 5.7794189453125, 5.983154296875, 6.1868896484375, 6.390625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 1.0, 10.0, 7.0, 10.0, 12.0, 18.0, 17.0, 22.0, 33.0, 38.0, 30.0, 48.0, 50.0, 44.0, 52.0, 58.0, 64.0, 66.0, 66.0, 49.0, 48.0, 46.0, 37.0, 38.0, 31.0, 20.0, 20.0, 16.0, 13.0, 11.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.093067169189453, -25.244964599609375, -24.396862030029297, -23.54875946044922, -22.70065689086914, -21.852554321289062, -21.004451751708984, -20.156349182128906, -19.308246612548828, -18.46014404296875, -17.612041473388672, -16.763938903808594, -15.915836334228516, -15.067733764648438, -14.219632148742676, -13.371529579162598, -12.523427963256836, -11.675325393676758, -10.82722282409668, -9.979120254516602, -9.131017684936523, -8.282915115356445, -7.434813499450684, -6.5867109298706055, -5.738608360290527, -4.890505790710449, -4.042403221130371, -3.194301128387451, -2.346198558807373, -1.498095989227295, -0.649993896484375, 0.19810867309570312, 1.046213150024414, 1.8943156003952026, 2.742418050765991, 3.5905203819274902, 4.438622951507568, 5.2867255210876465, 6.134827613830566, 6.9829301834106445, 7.831032752990723, 8.6791353225708, 9.527237892150879, 10.37533950805664, 11.223442077636719, 12.071544647216797, 12.919647216796875, 13.767749786376953, 14.615852355957031, 15.46395492553711, 16.312057495117188, 17.160160064697266, 18.008262634277344, 18.856365203857422, 19.7044677734375, 20.552570343017578, 21.400672912597656, 22.248775482177734, 23.096878051757812, 23.94498062133789, 24.79308319091797, 25.641185760498047, 26.489288330078125, 27.337390899658203, 28.18549156188965]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 3.0, 8.0, 14.0, 18.0, 12.0, 23.0, 24.0, 31.0, 29.0, 38.0, 36.0, 24.0, 29.0, 46.0, 35.0, 45.0, 38.0, 36.0, 40.0, 42.0, 51.0, 32.0, 41.0, 32.0, 37.0, 26.0, 22.0, 22.0, 34.0, 19.0, 19.0, 15.0, 11.0, 8.0, 11.0, 10.0, 10.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.562864303588867, -21.806659698486328, -21.050457000732422, -20.294252395629883, -19.538049697875977, -18.781845092773438, -18.02564239501953, -17.269437789916992, -16.513233184814453, -15.75702953338623, -15.000825881958008, -14.244621276855469, -13.488418579101562, -12.732213973999023, -11.9760103225708, -11.219806671142578, -10.463603973388672, -9.70740032196045, -8.951196670532227, -8.194992065429688, -7.438788890838623, -6.6825852394104, -5.9263811111450195, -5.170177459716797, -4.413973808288574, -3.6577701568603516, -2.90156626701355, -2.145362377166748, -1.3891587257385254, -0.6329550743103027, 0.12324905395507812, 0.8794527053833008, 1.6356544494628906, 2.3918581008911133, 3.148061990737915, 3.904265880584717, 4.6604695320129395, 5.416673183441162, 6.172877311706543, 6.929080963134766, 7.685284614562988, 8.441488265991211, 9.197691917419434, 9.953895568847656, 10.710100173950195, 11.466302871704102, 12.22250747680664, 12.978711128234863, 13.734914779663086, 14.491118431091309, 15.247322082519531, 16.00352668762207, 16.759729385375977, 17.515933990478516, 18.272136688232422, 19.02834129333496, 19.7845458984375, 20.54075050354004, 21.296953201293945, 22.053157806396484, 22.80936050415039, 23.56556510925293, 24.32176971435547, 25.077972412109375, 25.83417510986328]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 9.0, 18.0, 15.0, 17.0, 39.0, 47.0, 80.0, 102.0, 160.0, 242.0, 378.0, 543.0, 924.0, 1541.0, 2512.0, 4195.0, 7271.0, 12795.0, 21847.0, 37774.0, 61536.0, 94476.0, 130070.0, 154761.0, 153415.0, 127048.0, 90832.0, 59057.0, 35998.0, 21066.0, 12197.0, 7100.0, 4062.0, 2456.0, 1447.0, 855.0, 572.0, 369.0, 249.0, 148.0, 123.0, 71.0, 39.0, 25.0, 16.0, 13.0, 11.0, 14.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-28.515625, -27.650390625, -26.78515625, -25.919921875, -25.0546875, -24.189453125, -23.32421875, -22.458984375, -21.59375, -20.728515625, -19.86328125, -18.998046875, -18.1328125, -17.267578125, -16.40234375, -15.537109375, -14.671875, -13.806640625, -12.94140625, -12.076171875, -11.2109375, -10.345703125, -9.48046875, -8.615234375, -7.75, -6.884765625, -6.01953125, -5.154296875, -4.2890625, -3.423828125, -2.55859375, -1.693359375, -0.828125, 0.037109375, 0.90234375, 1.767578125, 2.6328125, 3.498046875, 4.36328125, 5.228515625, 6.09375, 6.958984375, 7.82421875, 8.689453125, 9.5546875, 10.419921875, 11.28515625, 12.150390625, 13.015625, 13.880859375, 14.74609375, 15.611328125, 16.4765625, 17.341796875, 18.20703125, 19.072265625, 19.9375, 20.802734375, 21.66796875, 22.533203125, 23.3984375, 24.263671875, 25.12890625, 25.994140625, 26.859375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 10.0, 8.0, 15.0, 17.0, 17.0, 22.0, 22.0, 33.0, 24.0, 29.0, 40.0, 36.0, 41.0, 40.0, 39.0, 39.0, 28.0, 42.0, 45.0, 37.0, 43.0, 43.0, 36.0, 34.0, 27.0, 28.0, 32.0, 25.0, 21.0, 18.0, 16.0, 11.0, 20.0, 17.0, 7.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.28125, -20.564697265625, -19.84814453125, -19.131591796875, -18.4150390625, -17.698486328125, -16.98193359375, -16.265380859375, -15.548828125, -14.832275390625, -14.11572265625, -13.399169921875, -12.6826171875, -11.966064453125, -11.24951171875, -10.532958984375, -9.81640625, -9.099853515625, -8.38330078125, -7.666748046875, -6.9501953125, -6.233642578125, -5.51708984375, -4.800537109375, -4.083984375, -3.367431640625, -2.65087890625, -1.934326171875, -1.2177734375, -0.501220703125, 0.21533203125, 0.931884765625, 1.6484375, 2.364990234375, 3.08154296875, 3.798095703125, 4.5146484375, 5.231201171875, 5.94775390625, 6.664306640625, 7.380859375, 8.097412109375, 8.81396484375, 9.530517578125, 10.2470703125, 10.963623046875, 11.68017578125, 12.396728515625, 13.11328125, 13.829833984375, 14.54638671875, 15.262939453125, 15.9794921875, 16.696044921875, 17.41259765625, 18.129150390625, 18.845703125, 19.562255859375, 20.27880859375, 20.995361328125, 21.7119140625, 22.428466796875, 23.14501953125, 23.861572265625, 24.578125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 9.0, 11.0, 15.0, 26.0, 22.0, 39.0, 50.0, 85.0, 129.0, 183.0, 231.0, 379.0, 480.0, 711.0, 1140.0, 1611.0, 2417.0, 3762.0, 5757.0, 8688.0, 13936.0, 20967.0, 31212.0, 46535.0, 65750.0, 88640.0, 109765.0, 124007.0, 123250.0, 109063.0, 87942.0, 65503.0, 45614.0, 31075.0, 20465.0, 13577.0, 8586.0, 5707.0, 3650.0, 2468.0, 1728.0, 1088.0, 760.0, 470.0, 329.0, 242.0, 149.0, 110.0, 69.0, 45.0, 27.0, 26.0, 22.0, 15.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0], "bins": [-19.515625, -18.8857421875, -18.255859375, -17.6259765625, -16.99609375, -16.3662109375, -15.736328125, -15.1064453125, -14.4765625, -13.8466796875, -13.216796875, -12.5869140625, -11.95703125, -11.3271484375, -10.697265625, -10.0673828125, -9.4375, -8.8076171875, -8.177734375, -7.5478515625, -6.91796875, -6.2880859375, -5.658203125, -5.0283203125, -4.3984375, -3.7685546875, -3.138671875, -2.5087890625, -1.87890625, -1.2490234375, -0.619140625, 0.0107421875, 0.640625, 1.2705078125, 1.900390625, 2.5302734375, 3.16015625, 3.7900390625, 4.419921875, 5.0498046875, 5.6796875, 6.3095703125, 6.939453125, 7.5693359375, 8.19921875, 8.8291015625, 9.458984375, 10.0888671875, 10.71875, 11.3486328125, 11.978515625, 12.6083984375, 13.23828125, 13.8681640625, 14.498046875, 15.1279296875, 15.7578125, 16.3876953125, 17.017578125, 17.6474609375, 18.27734375, 18.9072265625, 19.537109375, 20.1669921875, 20.796875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 4.0, 7.0, 13.0, 10.0, 12.0, 16.0, 21.0, 19.0, 20.0, 34.0, 24.0, 34.0, 42.0, 51.0, 41.0, 32.0, 46.0, 46.0, 50.0, 41.0, 39.0, 46.0, 39.0, 45.0, 39.0, 28.0, 31.0, 15.0, 24.0, 24.0, 19.0, 23.0, 8.0, 10.0, 10.0, 7.0, 5.0, 3.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.078125, -14.56591796875, -14.0537109375, -13.54150390625, -13.029296875, -12.51708984375, -12.0048828125, -11.49267578125, -10.98046875, -10.46826171875, -9.9560546875, -9.44384765625, -8.931640625, -8.41943359375, -7.9072265625, -7.39501953125, -6.8828125, -6.37060546875, -5.8583984375, -5.34619140625, -4.833984375, -4.32177734375, -3.8095703125, -3.29736328125, -2.78515625, -2.27294921875, -1.7607421875, -1.24853515625, -0.736328125, -0.22412109375, 0.2880859375, 0.80029296875, 1.3125, 1.82470703125, 2.3369140625, 2.84912109375, 3.361328125, 3.87353515625, 4.3857421875, 4.89794921875, 5.41015625, 5.92236328125, 6.4345703125, 6.94677734375, 7.458984375, 7.97119140625, 8.4833984375, 8.99560546875, 9.5078125, 10.02001953125, 10.5322265625, 11.04443359375, 11.556640625, 12.06884765625, 12.5810546875, 13.09326171875, 13.60546875, 14.11767578125, 14.6298828125, 15.14208984375, 15.654296875, 16.16650390625, 16.6787109375, 17.19091796875, 17.703125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 9.0, 17.0, 13.0, 22.0, 37.0, 42.0, 50.0, 66.0, 103.0, 138.0, 239.0, 331.0, 516.0, 853.0, 1382.0, 2455.0, 4275.0, 8228.0, 16574.0, 36143.0, 83671.0, 183142.0, 285719.0, 223940.0, 108871.0, 47582.0, 21242.0, 10157.0, 5307.0, 2901.0, 1705.0, 1001.0, 576.0, 372.0, 263.0, 178.0, 124.0, 76.0, 49.0, 41.0, 37.0, 32.0, 18.0, 13.0, 6.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0], "bins": [-25.5625, -24.755126953125, -23.94775390625, -23.140380859375, -22.3330078125, -21.525634765625, -20.71826171875, -19.910888671875, -19.103515625, -18.296142578125, -17.48876953125, -16.681396484375, -15.8740234375, -15.066650390625, -14.25927734375, -13.451904296875, -12.64453125, -11.837158203125, -11.02978515625, -10.222412109375, -9.4150390625, -8.607666015625, -7.80029296875, -6.992919921875, -6.185546875, -5.378173828125, -4.57080078125, -3.763427734375, -2.9560546875, -2.148681640625, -1.34130859375, -0.533935546875, 0.2734375, 1.080810546875, 1.88818359375, 2.695556640625, 3.5029296875, 4.310302734375, 5.11767578125, 5.925048828125, 6.732421875, 7.539794921875, 8.34716796875, 9.154541015625, 9.9619140625, 10.769287109375, 11.57666015625, 12.384033203125, 13.19140625, 13.998779296875, 14.80615234375, 15.613525390625, 16.4208984375, 17.228271484375, 18.03564453125, 18.843017578125, 19.650390625, 20.457763671875, 21.26513671875, 22.072509765625, 22.8798828125, 23.687255859375, 24.49462890625, 25.302001953125, 26.109375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 6.0, 8.0, 8.0, 11.0, 21.0, 21.0, 21.0, 34.0, 34.0, 37.0, 54.0, 71.0, 77.0, 72.0, 80.0, 72.0, 57.0, 59.0, 48.0, 42.0, 34.0, 31.0, 16.0, 21.0, 14.0, 13.0, 10.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00173187255859375, -0.0016799569129943848, -0.0016280412673950195, -0.0015761256217956543, -0.001524209976196289, -0.0014722943305969238, -0.0014203786849975586, -0.0013684630393981934, -0.0013165473937988281, -0.0012646317481994629, -0.0012127161026000977, -0.0011608004570007324, -0.0011088848114013672, -0.001056969165802002, -0.0010050535202026367, -0.0009531378746032715, -0.0009012222290039062, -0.000849306583404541, -0.0007973909378051758, -0.0007454752922058105, -0.0006935596466064453, -0.0006416440010070801, -0.0005897283554077148, -0.0005378127098083496, -0.0004858970642089844, -0.00043398141860961914, -0.0003820657730102539, -0.00033015012741088867, -0.00027823448181152344, -0.0002263188362121582, -0.00017440319061279297, -0.00012248754501342773, -7.05718994140625e-05, -1.8656253814697266e-05, 3.325939178466797e-05, 8.51750373840332e-05, 0.00013709068298339844, 0.00018900632858276367, 0.0002409219741821289, 0.00029283761978149414, 0.0003447532653808594, 0.0003966689109802246, 0.00044858455657958984, 0.0005005002021789551, 0.0005524158477783203, 0.0006043314933776855, 0.0006562471389770508, 0.000708162784576416, 0.0007600784301757812, 0.0008119940757751465, 0.0008639097213745117, 0.000915825366973877, 0.0009677410125732422, 0.0010196566581726074, 0.0010715723037719727, 0.0011234879493713379, 0.0011754035949707031, 0.0012273192405700684, 0.0012792348861694336, 0.0013311505317687988, 0.001383066177368164, 0.0014349818229675293, 0.0014868974685668945, 0.0015388131141662598, 0.001590728759765625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 9.0, 5.0, 7.0, 6.0, 12.0, 17.0, 20.0, 20.0, 32.0, 46.0, 61.0, 81.0, 106.0, 163.0, 231.0, 365.0, 541.0, 829.0, 1395.0, 2442.0, 4389.0, 8688.0, 18771.0, 44732.0, 112642.0, 244044.0, 300461.0, 177748.0, 73658.0, 29380.0, 13058.0, 6151.0, 3337.0, 1898.0, 1124.0, 657.0, 428.0, 290.0, 203.0, 130.0, 84.0, 77.0, 54.0, 56.0, 25.0, 24.0, 15.0, 11.0, 14.0, 8.0, 7.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0], "bins": [-28.296875, -27.4462890625, -26.595703125, -25.7451171875, -24.89453125, -24.0439453125, -23.193359375, -22.3427734375, -21.4921875, -20.6416015625, -19.791015625, -18.9404296875, -18.08984375, -17.2392578125, -16.388671875, -15.5380859375, -14.6875, -13.8369140625, -12.986328125, -12.1357421875, -11.28515625, -10.4345703125, -9.583984375, -8.7333984375, -7.8828125, -7.0322265625, -6.181640625, -5.3310546875, -4.48046875, -3.6298828125, -2.779296875, -1.9287109375, -1.078125, -0.2275390625, 0.623046875, 1.4736328125, 2.32421875, 3.1748046875, 4.025390625, 4.8759765625, 5.7265625, 6.5771484375, 7.427734375, 8.2783203125, 9.12890625, 9.9794921875, 10.830078125, 11.6806640625, 12.53125, 13.3818359375, 14.232421875, 15.0830078125, 15.93359375, 16.7841796875, 17.634765625, 18.4853515625, 19.3359375, 20.1865234375, 21.037109375, 21.8876953125, 22.73828125, 23.5888671875, 24.439453125, 25.2900390625, 26.140625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 11.0, 4.0, 7.0, 7.0, 19.0, 21.0, 22.0, 38.0, 45.0, 65.0, 62.0, 90.0, 75.0, 102.0, 83.0, 82.0, 72.0, 44.0, 38.0, 31.0, 20.0, 21.0, 9.0, 10.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.078125, -9.793212890625, -9.50830078125, -9.223388671875, -8.9384765625, -8.653564453125, -8.36865234375, -8.083740234375, -7.798828125, -7.513916015625, -7.22900390625, -6.944091796875, -6.6591796875, -6.374267578125, -6.08935546875, -5.804443359375, -5.51953125, -5.234619140625, -4.94970703125, -4.664794921875, -4.3798828125, -4.094970703125, -3.81005859375, -3.525146484375, -3.240234375, -2.955322265625, -2.67041015625, -2.385498046875, -2.1005859375, -1.815673828125, -1.53076171875, -1.245849609375, -0.9609375, -0.676025390625, -0.39111328125, -0.106201171875, 0.1787109375, 0.463623046875, 0.74853515625, 1.033447265625, 1.318359375, 1.603271484375, 1.88818359375, 2.173095703125, 2.4580078125, 2.742919921875, 3.02783203125, 3.312744140625, 3.59765625, 3.882568359375, 4.16748046875, 4.452392578125, 4.7373046875, 5.022216796875, 5.30712890625, 5.592041015625, 5.876953125, 6.161865234375, 6.44677734375, 6.731689453125, 7.0166015625, 7.301513671875, 7.58642578125, 7.871337890625, 8.15625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 4.0, 13.0, 15.0, 17.0, 25.0, 34.0, 32.0, 49.0, 41.0, 48.0, 57.0, 47.0, 47.0, 54.0, 51.0, 56.0, 49.0, 56.0, 50.0, 54.0, 46.0, 24.0, 20.0, 24.0, 25.0, 9.0, 9.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.972904205322266, -28.169275283813477, -27.365646362304688, -26.562015533447266, -25.758386611938477, -24.954757690429688, -24.151126861572266, -23.347497940063477, -22.543869018554688, -21.7402400970459, -20.93661117553711, -20.132980346679688, -19.3293514251709, -18.52572250366211, -17.722091674804688, -16.9184627532959, -16.11483383178711, -15.31120491027832, -14.507575035095215, -13.70394515991211, -12.90031623840332, -12.096687316894531, -11.293057441711426, -10.48942756652832, -9.685798645019531, -8.882169723510742, -8.078539848327637, -7.2749104499816895, -6.471281051635742, -5.667651653289795, -4.864022254943848, -4.0603928565979, -3.256765365600586, -2.4531359672546387, -1.6495065689086914, -0.8458771705627441, -0.042247772216796875, 0.7613816261291504, 1.5650110244750977, 2.368640422821045, 3.172269821166992, 3.9758992195129395, 4.779528617858887, 5.583158016204834, 6.386787414550781, 7.1904168128967285, 7.994046211242676, 8.797676086425781, 9.60130500793457, 10.40493392944336, 11.208563804626465, 12.01219367980957, 12.81582260131836, 13.619451522827148, 14.423081398010254, 15.22671127319336, 16.03034019470215, 16.833969116210938, 17.63759994506836, 18.44122886657715, 19.244857788085938, 20.048486709594727, 20.852115631103516, 21.655746459960938, 22.459375381469727]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 12.0, 18.0, 21.0, 27.0, 19.0, 22.0, 39.0, 32.0, 38.0, 49.0, 40.0, 47.0, 45.0, 46.0, 36.0, 39.0, 48.0, 43.0, 38.0, 47.0, 32.0, 43.0, 28.0, 29.0, 22.0, 21.0, 13.0, 13.0, 17.0, 9.0, 7.0, 13.0, 12.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.88239097595215, -24.017698287963867, -23.153003692626953, -22.288311004638672, -21.42361831665039, -20.55892562866211, -19.694231033325195, -18.829538345336914, -17.964845657348633, -17.10015296936035, -16.235458374023438, -15.370765686035156, -14.506072998046875, -13.641379356384277, -12.77668571472168, -11.911993026733398, -11.0472993850708, -10.182605743408203, -9.317913055419922, -8.453219413757324, -7.588526725769043, -6.723833084106445, -5.859139919281006, -4.994446754455566, -4.129753589630127, -3.2650604248046875, -2.400367259979248, -1.5356738567352295, -0.67098069190979, 0.19371271133422852, 1.058405876159668, 1.9230990409851074, 2.787792205810547, 3.6524853706359863, 4.517178535461426, 5.381872177124023, 6.246564865112305, 7.111258506774902, 7.975951671600342, 8.840644836425781, 9.705337524414062, 10.57003116607666, 11.434723854064941, 12.299417495727539, 13.16411018371582, 14.028803825378418, 14.893497467041016, 15.758190155029297, 16.622882843017578, 17.48757553100586, 18.352270126342773, 19.216962814331055, 20.081655502319336, 20.94635009765625, 21.81104278564453, 22.675735473632812, 23.540430068969727, 24.405122756958008, 25.269817352294922, 26.134510040283203, 26.999202728271484, 27.863895416259766, 28.72859001159668, 29.59328269958496, 30.457975387573242]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 13.0, 19.0, 24.0, 38.0, 56.0, 75.0, 114.0, 154.0, 304.0, 473.0, 785.0, 1451.0, 2394.0, 4222.0, 7253.0, 13014.0, 22667.0, 40539.0, 71161.0, 124818.0, 212699.0, 346833.0, 512911.0, 650034.0, 668191.0, 552550.0, 385754.0, 240599.0, 143140.0, 82422.0, 46945.0, 26599.0, 15007.0, 8757.0, 4951.0, 2945.0, 1720.0, 1030.0, 591.0, 401.0, 235.0, 141.0, 86.0, 66.0, 27.0, 25.0, 23.0, 15.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.8125, -18.24462890625, -17.6767578125, -17.10888671875, -16.541015625, -15.97314453125, -15.4052734375, -14.83740234375, -14.26953125, -13.70166015625, -13.1337890625, -12.56591796875, -11.998046875, -11.43017578125, -10.8623046875, -10.29443359375, -9.7265625, -9.15869140625, -8.5908203125, -8.02294921875, -7.455078125, -6.88720703125, -6.3193359375, -5.75146484375, -5.18359375, -4.61572265625, -4.0478515625, -3.47998046875, -2.912109375, -2.34423828125, -1.7763671875, -1.20849609375, -0.640625, -0.07275390625, 0.4951171875, 1.06298828125, 1.630859375, 2.19873046875, 2.7666015625, 3.33447265625, 3.90234375, 4.47021484375, 5.0380859375, 5.60595703125, 6.173828125, 6.74169921875, 7.3095703125, 7.87744140625, 8.4453125, 9.01318359375, 9.5810546875, 10.14892578125, 10.716796875, 11.28466796875, 11.8525390625, 12.42041015625, 12.98828125, 13.55615234375, 14.1240234375, 14.69189453125, 15.259765625, 15.82763671875, 16.3955078125, 16.96337890625, 17.53125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 9.0, 12.0, 17.0, 13.0, 17.0, 23.0, 26.0, 20.0, 24.0, 27.0, 41.0, 42.0, 45.0, 47.0, 30.0, 51.0, 43.0, 28.0, 45.0, 36.0, 46.0, 39.0, 36.0, 31.0, 29.0, 27.0, 26.0, 24.0, 23.0, 24.0, 14.0, 7.0, 12.0, 12.0, 4.0, 14.0, 7.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.623291015625, -15.10595703125, -14.588623046875, -14.0712890625, -13.553955078125, -13.03662109375, -12.519287109375, -12.001953125, -11.484619140625, -10.96728515625, -10.449951171875, -9.9326171875, -9.415283203125, -8.89794921875, -8.380615234375, -7.86328125, -7.345947265625, -6.82861328125, -6.311279296875, -5.7939453125, -5.276611328125, -4.75927734375, -4.241943359375, -3.724609375, -3.207275390625, -2.68994140625, -2.172607421875, -1.6552734375, -1.137939453125, -0.62060546875, -0.103271484375, 0.4140625, 0.931396484375, 1.44873046875, 1.966064453125, 2.4833984375, 3.000732421875, 3.51806640625, 4.035400390625, 4.552734375, 5.070068359375, 5.58740234375, 6.104736328125, 6.6220703125, 7.139404296875, 7.65673828125, 8.174072265625, 8.69140625, 9.208740234375, 9.72607421875, 10.243408203125, 10.7607421875, 11.278076171875, 11.79541015625, 12.312744140625, 12.830078125, 13.347412109375, 13.86474609375, 14.382080078125, 14.8994140625, 15.416748046875, 15.93408203125, 16.451416015625, 16.96875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 14.0, 21.0, 42.0, 54.0, 75.0, 111.0, 172.0, 350.0, 471.0, 774.0, 1359.0, 2305.0, 3763.0, 6367.0, 10729.0, 18285.0, 30501.0, 50967.0, 83506.0, 133131.0, 204549.0, 298799.0, 403940.0, 497146.0, 541356.0, 517367.0, 435076.0, 329444.0, 229474.0, 151319.0, 95657.0, 59077.0, 35461.0, 21190.0, 12711.0, 7454.0, 4316.0, 2727.0, 1609.0, 966.0, 598.0, 373.0, 254.0, 131.0, 91.0, 62.0, 49.0, 28.0, 26.0, 6.0, 15.0, 9.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-14.703125, -14.238525390625, -13.77392578125, -13.309326171875, -12.8447265625, -12.380126953125, -11.91552734375, -11.450927734375, -10.986328125, -10.521728515625, -10.05712890625, -9.592529296875, -9.1279296875, -8.663330078125, -8.19873046875, -7.734130859375, -7.26953125, -6.804931640625, -6.34033203125, -5.875732421875, -5.4111328125, -4.946533203125, -4.48193359375, -4.017333984375, -3.552734375, -3.088134765625, -2.62353515625, -2.158935546875, -1.6943359375, -1.229736328125, -0.76513671875, -0.300537109375, 0.1640625, 0.628662109375, 1.09326171875, 1.557861328125, 2.0224609375, 2.487060546875, 2.95166015625, 3.416259765625, 3.880859375, 4.345458984375, 4.81005859375, 5.274658203125, 5.7392578125, 6.203857421875, 6.66845703125, 7.133056640625, 7.59765625, 8.062255859375, 8.52685546875, 8.991455078125, 9.4560546875, 9.920654296875, 10.38525390625, 10.849853515625, 11.314453125, 11.779052734375, 12.24365234375, 12.708251953125, 13.1728515625, 13.637451171875, 14.10205078125, 14.566650390625, 15.03125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 6.0, 9.0, 14.0, 20.0, 19.0, 25.0, 38.0, 39.0, 69.0, 75.0, 75.0, 105.0, 123.0, 165.0, 137.0, 157.0, 172.0, 213.0, 209.0, 234.0, 235.0, 210.0, 212.0, 203.0, 170.0, 181.0, 167.0, 148.0, 125.0, 89.0, 72.0, 69.0, 59.0, 52.0, 40.0, 28.0, 15.0, 20.0, 12.0, 21.0, 14.0, 12.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.16796875, -6.93292236328125, -6.6978759765625, -6.46282958984375, -6.227783203125, -5.99273681640625, -5.7576904296875, -5.52264404296875, -5.28759765625, -5.05255126953125, -4.8175048828125, -4.58245849609375, -4.347412109375, -4.11236572265625, -3.8773193359375, -3.64227294921875, -3.4072265625, -3.17218017578125, -2.9371337890625, -2.70208740234375, -2.467041015625, -2.23199462890625, -1.9969482421875, -1.76190185546875, -1.52685546875, -1.29180908203125, -1.0567626953125, -0.82171630859375, -0.586669921875, -0.35162353515625, -0.1165771484375, 0.11846923828125, 0.353515625, 0.58856201171875, 0.8236083984375, 1.05865478515625, 1.293701171875, 1.52874755859375, 1.7637939453125, 1.99884033203125, 2.23388671875, 2.46893310546875, 2.7039794921875, 2.93902587890625, 3.174072265625, 3.40911865234375, 3.6441650390625, 3.87921142578125, 4.1142578125, 4.34930419921875, 4.5843505859375, 4.81939697265625, 5.054443359375, 5.28948974609375, 5.5245361328125, 5.75958251953125, 5.99462890625, 6.22967529296875, 6.4647216796875, 6.69976806640625, 6.934814453125, 7.16986083984375, 7.4049072265625, 7.63995361328125, 7.875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 7.0, 10.0, 12.0, 13.0, 27.0, 19.0, 23.0, 32.0, 33.0, 37.0, 38.0, 46.0, 43.0, 55.0, 53.0, 57.0, 50.0, 59.0, 49.0, 57.0, 45.0, 33.0, 26.0, 29.0, 18.0, 21.0, 21.0, 12.0, 8.0, 11.0, 10.0, 5.0, 9.0, 6.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-19.732757568359375, -19.13155174255371, -18.530345916748047, -17.929140090942383, -17.32793426513672, -16.726726531982422, -16.125520706176758, -15.524314880371094, -14.92310905456543, -14.321903228759766, -13.720697402954102, -13.119490623474121, -12.518284797668457, -11.917078971862793, -11.315872192382812, -10.714666366577148, -10.113460540771484, -9.51225471496582, -8.911048889160156, -8.309842109680176, -7.708636283874512, -7.107430458068848, -6.506224155426025, -5.905017852783203, -5.303812026977539, -4.702606201171875, -4.101399898529053, -3.5001938343048096, -2.8989877700805664, -2.2977817058563232, -1.69657564163208, -1.0953693389892578, -0.49416160583496094, 0.10704445838928223, 0.7082505226135254, 1.3094565868377686, 1.9106626510620117, 2.511868715286255, 3.113074779510498, 3.7142810821533203, 4.315486907958984, 4.916692733764648, 5.517899036407471, 6.119105339050293, 6.720311164855957, 7.321516990661621, 7.922723293304443, 8.523929595947266, 9.12513542175293, 9.726341247558594, 10.327547073364258, 10.928753852844238, 11.529959678649902, 12.131165504455566, 12.732372283935547, 13.333578109741211, 13.934783935546875, 14.535989761352539, 15.137195587158203, 15.738402366638184, 16.33960723876953, 16.940814971923828, 17.542020797729492, 18.143226623535156, 18.74443244934082]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 5.0, 9.0, 9.0, 13.0, 14.0, 23.0, 17.0, 17.0, 22.0, 30.0, 31.0, 41.0, 42.0, 49.0, 50.0, 44.0, 33.0, 44.0, 52.0, 36.0, 37.0, 47.0, 39.0, 37.0, 44.0, 31.0, 24.0, 26.0, 17.0, 13.0, 15.0, 10.0, 15.0, 12.0, 14.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.35784149169922, -18.696195602416992, -18.034549713134766, -17.37290382385254, -16.711257934570312, -16.049612045288086, -15.387967109680176, -14.72632122039795, -14.064675331115723, -13.403029441833496, -12.74138355255127, -12.079737663269043, -11.418092727661133, -10.756446838378906, -10.09480094909668, -9.433155059814453, -8.771509170532227, -8.10986328125, -7.448217391967773, -6.786571979522705, -6.1249260902404785, -5.463280200958252, -4.801634788513184, -4.139988899230957, -3.4783430099487305, -2.816697120666504, -2.1550514698028564, -1.4934056997299194, -0.8317599296569824, -0.17011404037475586, 0.4915316104888916, 1.153177261352539, 1.8148212432861328, 2.4764671325683594, 3.138112783432007, 3.7997584342956543, 4.461404323577881, 5.123050212860107, 5.784695625305176, 6.446341514587402, 7.107987403869629, 7.7696332931518555, 8.431279182434082, 9.092925071716309, 9.754570007324219, 10.416215896606445, 11.077861785888672, 11.739507675170898, 12.401153564453125, 13.062799453735352, 13.724445343017578, 14.386091232299805, 15.047737121582031, 15.709383010864258, 16.371028900146484, 17.032672882080078, 17.694320678710938, 18.355966567993164, 19.01761245727539, 19.679258346557617, 20.340904235839844, 21.00255012512207, 21.664196014404297, 22.32583999633789, 22.987485885620117]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 13.0, 21.0, 15.0, 39.0, 44.0, 60.0, 89.0, 117.0, 174.0, 223.0, 333.0, 420.0, 660.0, 872.0, 1284.0, 1925.0, 2654.0, 4019.0, 6161.0, 9274.0, 14447.0, 23130.0, 36894.0, 60210.0, 96205.0, 146595.0, 182219.0, 161168.0, 110806.0, 69711.0, 43116.0, 26467.0, 16839.0, 10853.0, 6964.0, 4465.0, 3108.0, 2123.0, 1440.0, 1038.0, 721.0, 470.0, 343.0, 237.0, 156.0, 98.0, 82.0, 70.0, 57.0, 38.0, 29.0, 21.0, 17.0, 9.0, 4.0, 4.0, 5.0], "bins": [-11.6015625, -11.2568359375, -10.912109375, -10.5673828125, -10.22265625, -9.8779296875, -9.533203125, -9.1884765625, -8.84375, -8.4990234375, -8.154296875, -7.8095703125, -7.46484375, -7.1201171875, -6.775390625, -6.4306640625, -6.0859375, -5.7412109375, -5.396484375, -5.0517578125, -4.70703125, -4.3623046875, -4.017578125, -3.6728515625, -3.328125, -2.9833984375, -2.638671875, -2.2939453125, -1.94921875, -1.6044921875, -1.259765625, -0.9150390625, -0.5703125, -0.2255859375, 0.119140625, 0.4638671875, 0.80859375, 1.1533203125, 1.498046875, 1.8427734375, 2.1875, 2.5322265625, 2.876953125, 3.2216796875, 3.56640625, 3.9111328125, 4.255859375, 4.6005859375, 4.9453125, 5.2900390625, 5.634765625, 5.9794921875, 6.32421875, 6.6689453125, 7.013671875, 7.3583984375, 7.703125, 8.0478515625, 8.392578125, 8.7373046875, 9.08203125, 9.4267578125, 9.771484375, 10.1162109375, 10.4609375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 13.0, 13.0, 19.0, 17.0, 17.0, 17.0, 25.0, 27.0, 26.0, 27.0, 34.0, 38.0, 62.0, 49.0, 39.0, 37.0, 43.0, 39.0, 40.0, 38.0, 47.0, 32.0, 32.0, 35.0, 30.0, 26.0, 19.0, 22.0, 12.0, 18.0, 12.0, 17.0, 9.0, 9.0, 12.0, 8.0, 8.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.171875, -18.528564453125, -17.88525390625, -17.241943359375, -16.5986328125, -15.955322265625, -15.31201171875, -14.668701171875, -14.025390625, -13.382080078125, -12.73876953125, -12.095458984375, -11.4521484375, -10.808837890625, -10.16552734375, -9.522216796875, -8.87890625, -8.235595703125, -7.59228515625, -6.948974609375, -6.3056640625, -5.662353515625, -5.01904296875, -4.375732421875, -3.732421875, -3.089111328125, -2.44580078125, -1.802490234375, -1.1591796875, -0.515869140625, 0.12744140625, 0.770751953125, 1.4140625, 2.057373046875, 2.70068359375, 3.343994140625, 3.9873046875, 4.630615234375, 5.27392578125, 5.917236328125, 6.560546875, 7.203857421875, 7.84716796875, 8.490478515625, 9.1337890625, 9.777099609375, 10.42041015625, 11.063720703125, 11.70703125, 12.350341796875, 12.99365234375, 13.636962890625, 14.2802734375, 14.923583984375, 15.56689453125, 16.210205078125, 16.853515625, 17.496826171875, 18.14013671875, 18.783447265625, 19.4267578125, 20.070068359375, 20.71337890625, 21.356689453125, 22.0]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 5.0, 8.0, 8.0, 6.0, 24.0, 29.0, 44.0, 55.0, 116.0, 157.0, 229.0, 372.0, 573.0, 912.0, 1558.0, 2549.0, 4555.0, 8771.0, 17267.0, 35217.0, 76076.0, 164028.0, 283301.0, 233140.0, 114400.0, 52432.0, 24789.0, 12659.0, 6573.0, 3469.0, 2001.0, 1227.0, 716.0, 451.0, 284.0, 171.0, 118.0, 84.0, 63.0, 50.0, 26.0, 16.0, 7.0, 6.0, 4.0, 0.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-14.5078125, -14.0904541015625, -13.673095703125, -13.2557373046875, -12.83837890625, -12.4210205078125, -12.003662109375, -11.5863037109375, -11.1689453125, -10.7515869140625, -10.334228515625, -9.9168701171875, -9.49951171875, -9.0821533203125, -8.664794921875, -8.2474365234375, -7.830078125, -7.4127197265625, -6.995361328125, -6.5780029296875, -6.16064453125, -5.7432861328125, -5.325927734375, -4.9085693359375, -4.4912109375, -4.0738525390625, -3.656494140625, -3.2391357421875, -2.82177734375, -2.4044189453125, -1.987060546875, -1.5697021484375, -1.15234375, -0.7349853515625, -0.317626953125, 0.0997314453125, 0.51708984375, 0.9344482421875, 1.351806640625, 1.7691650390625, 2.1865234375, 2.6038818359375, 3.021240234375, 3.4385986328125, 3.85595703125, 4.2733154296875, 4.690673828125, 5.1080322265625, 5.525390625, 5.9427490234375, 6.360107421875, 6.7774658203125, 7.19482421875, 7.6121826171875, 8.029541015625, 8.4468994140625, 8.8642578125, 9.2816162109375, 9.698974609375, 10.1163330078125, 10.53369140625, 10.9510498046875, 11.368408203125, 11.7857666015625, 12.203125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 9.0, 6.0, 3.0, 2.0, 7.0, 7.0, 5.0, 4.0, 7.0, 13.0, 10.0, 13.0, 11.0, 23.0, 28.0, 31.0, 27.0, 33.0, 31.0, 38.0, 40.0, 37.0, 31.0, 32.0, 50.0, 31.0, 52.0, 40.0, 42.0, 50.0, 35.0, 44.0, 32.0, 25.0, 27.0, 17.0, 21.0, 17.0, 22.0, 8.0, 15.0, 5.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.4375, -13.9840087890625, -13.530517578125, -13.0770263671875, -12.62353515625, -12.1700439453125, -11.716552734375, -11.2630615234375, -10.8095703125, -10.3560791015625, -9.902587890625, -9.4490966796875, -8.99560546875, -8.5421142578125, -8.088623046875, -7.6351318359375, -7.181640625, -6.7281494140625, -6.274658203125, -5.8211669921875, -5.36767578125, -4.9141845703125, -4.460693359375, -4.0072021484375, -3.5537109375, -3.1002197265625, -2.646728515625, -2.1932373046875, -1.73974609375, -1.2862548828125, -0.832763671875, -0.3792724609375, 0.07421875, 0.5277099609375, 0.981201171875, 1.4346923828125, 1.88818359375, 2.3416748046875, 2.795166015625, 3.2486572265625, 3.7021484375, 4.1556396484375, 4.609130859375, 5.0626220703125, 5.51611328125, 5.9696044921875, 6.423095703125, 6.8765869140625, 7.330078125, 7.7835693359375, 8.237060546875, 8.6905517578125, 9.14404296875, 9.5975341796875, 10.051025390625, 10.5045166015625, 10.9580078125, 11.4114990234375, 11.864990234375, 12.3184814453125, 12.77197265625, 13.2254638671875, 13.678955078125, 14.1324462890625, 14.5859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 13.0, 16.0, 13.0, 30.0, 35.0, 46.0, 82.0, 124.0, 136.0, 214.0, 330.0, 479.0, 873.0, 1338.0, 2520.0, 5249.0, 12166.0, 36495.0, 159332.0, 568150.0, 193090.0, 42114.0, 13589.0, 5526.0, 2586.0, 1505.0, 868.0, 498.0, 372.0, 216.0, 166.0, 101.0, 81.0, 53.0, 49.0, 25.0, 21.0, 8.0, 17.0, 8.0, 2.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.84375, -9.5413818359375, -9.239013671875, -8.9366455078125, -8.63427734375, -8.3319091796875, -8.029541015625, -7.7271728515625, -7.4248046875, -7.1224365234375, -6.820068359375, -6.5177001953125, -6.21533203125, -5.9129638671875, -5.610595703125, -5.3082275390625, -5.005859375, -4.7034912109375, -4.401123046875, -4.0987548828125, -3.79638671875, -3.4940185546875, -3.191650390625, -2.8892822265625, -2.5869140625, -2.2845458984375, -1.982177734375, -1.6798095703125, -1.37744140625, -1.0750732421875, -0.772705078125, -0.4703369140625, -0.16796875, 0.1343994140625, 0.436767578125, 0.7391357421875, 1.04150390625, 1.3438720703125, 1.646240234375, 1.9486083984375, 2.2509765625, 2.5533447265625, 2.855712890625, 3.1580810546875, 3.46044921875, 3.7628173828125, 4.065185546875, 4.3675537109375, 4.669921875, 4.9722900390625, 5.274658203125, 5.5770263671875, 5.87939453125, 6.1817626953125, 6.484130859375, 6.7864990234375, 7.0888671875, 7.3912353515625, 7.693603515625, 7.9959716796875, 8.29833984375, 8.6007080078125, 8.903076171875, 9.2054443359375, 9.5078125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 4.0, 14.0, 16.0, 21.0, 9.0, 29.0, 24.0, 42.0, 41.0, 87.0, 92.0, 97.0, 111.0, 85.0, 76.0, 45.0, 35.0, 25.0, 20.0, 17.0, 10.0, 14.0, 10.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004925727844238281, -0.00047606974840164185, -0.00045956671237945557, -0.0004430636763572693, -0.000426560640335083, -0.00041005760431289673, -0.00039355456829071045, -0.00037705153226852417, -0.0003605484962463379, -0.0003440454602241516, -0.00032754242420196533, -0.00031103938817977905, -0.0002945363521575928, -0.0002780333161354065, -0.0002615302801132202, -0.00024502724409103394, -0.00022852420806884766, -0.00021202117204666138, -0.0001955181360244751, -0.00017901510000228882, -0.00016251206398010254, -0.00014600902795791626, -0.00012950599193572998, -0.0001130029559135437, -9.649991989135742e-05, -7.999688386917114e-05, -6.349384784698486e-05, -4.6990811824798584e-05, -3.0487775802612305e-05, -1.3984739780426025e-05, 2.518296241760254e-06, 1.9021332263946533e-05, 3.552436828613281e-05, 5.202740430831909e-05, 6.853044033050537e-05, 8.503347635269165e-05, 0.00010153651237487793, 0.00011803954839706421, 0.0001345425844192505, 0.00015104562044143677, 0.00016754865646362305, 0.00018405169248580933, 0.0002005547285079956, 0.00021705776453018188, 0.00023356080055236816, 0.00025006383657455444, 0.0002665668725967407, 0.000283069908618927, 0.0002995729446411133, 0.00031607598066329956, 0.00033257901668548584, 0.0003490820527076721, 0.0003655850887298584, 0.0003820881247520447, 0.00039859116077423096, 0.00041509419679641724, 0.0004315972328186035, 0.0004481002688407898, 0.0004646033048629761, 0.00048110634088516235, 0.0004976093769073486, 0.0005141124129295349, 0.0005306154489517212, 0.0005471184849739075, 0.0005636215209960938]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 10.0, 2.0, 12.0, 16.0, 18.0, 28.0, 43.0, 62.0, 81.0, 113.0, 167.0, 249.0, 326.0, 442.0, 670.0, 919.0, 1425.0, 2238.0, 3562.0, 5670.0, 10208.0, 18745.0, 37215.0, 82922.0, 201919.0, 345207.0, 184032.0, 75472.0, 34195.0, 17477.0, 9666.0, 5508.0, 3409.0, 1991.0, 1454.0, 874.0, 596.0, 448.0, 311.0, 232.0, 155.0, 118.0, 96.0, 77.0, 50.0, 41.0, 19.0, 29.0, 17.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.2109375, -7.9654541015625, -7.719970703125, -7.4744873046875, -7.22900390625, -6.9835205078125, -6.738037109375, -6.4925537109375, -6.2470703125, -6.0015869140625, -5.756103515625, -5.5106201171875, -5.26513671875, -5.0196533203125, -4.774169921875, -4.5286865234375, -4.283203125, -4.0377197265625, -3.792236328125, -3.5467529296875, -3.30126953125, -3.0557861328125, -2.810302734375, -2.5648193359375, -2.3193359375, -2.0738525390625, -1.828369140625, -1.5828857421875, -1.33740234375, -1.0919189453125, -0.846435546875, -0.6009521484375, -0.35546875, -0.1099853515625, 0.135498046875, 0.3809814453125, 0.62646484375, 0.8719482421875, 1.117431640625, 1.3629150390625, 1.6083984375, 1.8538818359375, 2.099365234375, 2.3448486328125, 2.59033203125, 2.8358154296875, 3.081298828125, 3.3267822265625, 3.572265625, 3.8177490234375, 4.063232421875, 4.3087158203125, 4.55419921875, 4.7996826171875, 5.045166015625, 5.2906494140625, 5.5361328125, 5.7816162109375, 6.027099609375, 6.2725830078125, 6.51806640625, 6.7635498046875, 7.009033203125, 7.2545166015625, 7.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 5.0, 9.0, 3.0, 11.0, 8.0, 20.0, 11.0, 26.0, 30.0, 32.0, 42.0, 67.0, 61.0, 92.0, 87.0, 83.0, 73.0, 67.0, 56.0, 29.0, 32.0, 23.0, 22.0, 13.0, 11.0, 13.0, 5.0, 9.0, 5.0, 7.0, 3.0, 4.0, 7.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.09765625, -3.008575439453125, -2.91949462890625, -2.830413818359375, -2.7413330078125, -2.652252197265625, -2.56317138671875, -2.474090576171875, -2.385009765625, -2.295928955078125, -2.20684814453125, -2.117767333984375, -2.0286865234375, -1.939605712890625, -1.85052490234375, -1.761444091796875, -1.67236328125, -1.583282470703125, -1.49420166015625, -1.405120849609375, -1.3160400390625, -1.226959228515625, -1.13787841796875, -1.048797607421875, -0.959716796875, -0.870635986328125, -0.78155517578125, -0.692474365234375, -0.6033935546875, -0.514312744140625, -0.42523193359375, -0.336151123046875, -0.2470703125, -0.157989501953125, -0.06890869140625, 0.020172119140625, 0.1092529296875, 0.198333740234375, 0.28741455078125, 0.376495361328125, 0.465576171875, 0.554656982421875, 0.64373779296875, 0.732818603515625, 0.8218994140625, 0.910980224609375, 1.00006103515625, 1.089141845703125, 1.17822265625, 1.267303466796875, 1.35638427734375, 1.445465087890625, 1.5345458984375, 1.623626708984375, 1.71270751953125, 1.801788330078125, 1.890869140625, 1.979949951171875, 2.06903076171875, 2.158111572265625, 2.2471923828125, 2.336273193359375, 2.42535400390625, 2.514434814453125, 2.603515625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 14.0, 18.0, 16.0, 21.0, 28.0, 31.0, 39.0, 29.0, 30.0, 53.0, 49.0, 56.0, 65.0, 57.0, 65.0, 69.0, 39.0, 50.0, 47.0, 31.0, 27.0, 18.0, 27.0, 14.0, 17.0, 16.0, 11.0, 6.0, 8.0, 9.0, 7.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-21.192150115966797, -20.558141708374023, -19.924131393432617, -19.290122985839844, -18.656112670898438, -18.022104263305664, -17.38809585571289, -16.754085540771484, -16.12007713317871, -15.486067771911621, -14.852058410644531, -14.218050003051758, -13.584040641784668, -12.950031280517578, -12.316022872924805, -11.682013511657715, -11.048004150390625, -10.413994789123535, -9.779985427856445, -9.145977020263672, -8.511967658996582, -7.877958297729492, -7.2439494132995605, -6.609940528869629, -5.975931167602539, -5.341921806335449, -4.707912921905518, -4.073904037475586, -3.439894676208496, -2.8058855533599854, -2.1718764305114746, -1.537867546081543, -0.9038600921630859, -0.2698509693145752, 0.36415815353393555, 0.9981672763824463, 1.632176399230957, 2.2661855220794678, 2.9001946449279785, 3.53420352935791, 4.168212890625, 4.80222225189209, 5.4362311363220215, 6.070240020751953, 6.704249382019043, 7.338258743286133, 7.9722676277160645, 8.606276512145996, 9.240285873413086, 9.874295234680176, 10.508304595947266, 11.142313003540039, 11.776322364807129, 12.410331726074219, 13.044340133666992, 13.678349494934082, 14.312358856201172, 14.946368217468262, 15.580377578735352, 16.214385986328125, 16.84839630126953, 17.482404708862305, 18.116413116455078, 18.750423431396484, 19.384431838989258]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 9.0, 4.0, 8.0, 6.0, 14.0, 9.0, 19.0, 20.0, 23.0, 15.0, 20.0, 42.0, 29.0, 33.0, 45.0, 46.0, 52.0, 44.0, 36.0, 44.0, 46.0, 43.0, 35.0, 50.0, 39.0, 43.0, 32.0, 27.0, 26.0, 19.0, 19.0, 15.0, 15.0, 13.0, 14.0, 9.0, 9.0, 11.0, 7.0, 4.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.311397552490234, -17.65253448486328, -16.993669509887695, -16.334806442260742, -15.675941467285156, -15.017077445983887, -14.358213424682617, -13.699350357055664, -13.040485382080078, -12.381621360778809, -11.722757339477539, -11.06389331817627, -10.405029296875, -9.74616527557373, -9.087301254272461, -8.428438186645508, -7.769574165344238, -7.110710144042969, -6.451846122741699, -5.79298210144043, -5.13411808013916, -4.475254058837891, -3.8163905143737793, -3.1575264930725098, -2.4986624717712402, -1.8397984504699707, -1.1809345483779907, -0.5220706462860107, 0.1367933750152588, 0.7956573963165283, 1.4545211791992188, 2.1133852005004883, 2.772249221801758, 3.4311132431030273, 4.089977264404297, 4.748841285705566, 5.407705307006836, 6.0665693283081055, 6.725432872772217, 7.384296894073486, 8.043161392211914, 8.702025413513184, 9.360889434814453, 10.019753456115723, 10.678617477416992, 11.337481498718262, 11.996345520019531, 12.655208587646484, 13.314072608947754, 13.972936630249023, 14.631800651550293, 15.290664672851562, 15.949528694152832, 16.6083927154541, 17.267255783081055, 17.92612075805664, 18.584983825683594, 19.243846893310547, 19.902711868286133, 20.561574935913086, 21.220439910888672, 21.879302978515625, 22.53816795349121, 23.197031021118164, 23.85589599609375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 12.0, 18.0, 23.0, 39.0, 61.0, 87.0, 140.0, 218.0, 317.0, 483.0, 766.0, 1228.0, 1783.0, 2851.0, 4474.0, 7125.0, 11569.0, 18014.0, 28249.0, 42658.0, 62537.0, 86414.0, 109583.0, 126508.0, 127992.0, 115770.0, 93586.0, 69465.0, 47807.0, 31729.0, 20762.0, 13308.0, 8462.0, 5215.0, 3401.0, 2126.0, 1331.0, 866.0, 568.0, 338.0, 219.0, 159.0, 94.0, 79.0, 45.0, 21.0, 23.0, 11.0, 10.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-18.296875, -17.727783203125, -17.15869140625, -16.589599609375, -16.0205078125, -15.451416015625, -14.88232421875, -14.313232421875, -13.744140625, -13.175048828125, -12.60595703125, -12.036865234375, -11.4677734375, -10.898681640625, -10.32958984375, -9.760498046875, -9.19140625, -8.622314453125, -8.05322265625, -7.484130859375, -6.9150390625, -6.345947265625, -5.77685546875, -5.207763671875, -4.638671875, -4.069580078125, -3.50048828125, -2.931396484375, -2.3623046875, -1.793212890625, -1.22412109375, -0.655029296875, -0.0859375, 0.483154296875, 1.05224609375, 1.621337890625, 2.1904296875, 2.759521484375, 3.32861328125, 3.897705078125, 4.466796875, 5.035888671875, 5.60498046875, 6.174072265625, 6.7431640625, 7.312255859375, 7.88134765625, 8.450439453125, 9.01953125, 9.588623046875, 10.15771484375, 10.726806640625, 11.2958984375, 11.864990234375, 12.43408203125, 13.003173828125, 13.572265625, 14.141357421875, 14.71044921875, 15.279541015625, 15.8486328125, 16.417724609375, 16.98681640625, 17.555908203125, 18.125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 9.0, 12.0, 14.0, 12.0, 20.0, 29.0, 32.0, 21.0, 33.0, 36.0, 38.0, 34.0, 45.0, 53.0, 38.0, 44.0, 50.0, 43.0, 40.0, 33.0, 46.0, 44.0, 31.0, 28.0, 32.0, 28.0, 20.0, 22.0, 9.0, 17.0, 18.0, 11.0, 9.0, 4.0, 9.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.146484375, -15.51171875, -14.876953125, -14.2421875, -13.607421875, -12.97265625, -12.337890625, -11.703125, -11.068359375, -10.43359375, -9.798828125, -9.1640625, -8.529296875, -7.89453125, -7.259765625, -6.625, -5.990234375, -5.35546875, -4.720703125, -4.0859375, -3.451171875, -2.81640625, -2.181640625, -1.546875, -0.912109375, -0.27734375, 0.357421875, 0.9921875, 1.626953125, 2.26171875, 2.896484375, 3.53125, 4.166015625, 4.80078125, 5.435546875, 6.0703125, 6.705078125, 7.33984375, 7.974609375, 8.609375, 9.244140625, 9.87890625, 10.513671875, 11.1484375, 11.783203125, 12.41796875, 13.052734375, 13.6875, 14.322265625, 14.95703125, 15.591796875, 16.2265625, 16.861328125, 17.49609375, 18.130859375, 18.765625, 19.400390625, 20.03515625, 20.669921875, 21.3046875, 21.939453125, 22.57421875, 23.208984375, 23.84375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 7.0, 13.0, 14.0, 22.0, 46.0, 55.0, 74.0, 131.0, 188.0, 290.0, 421.0, 666.0, 1032.0, 1519.0, 2318.0, 3581.0, 5364.0, 8543.0, 12935.0, 20003.0, 29006.0, 42325.0, 59430.0, 79452.0, 98607.0, 112774.0, 116986.0, 110618.0, 94306.0, 74519.0, 55527.0, 39194.0, 26709.0, 17894.0, 11874.0, 7786.0, 5100.0, 3167.0, 2140.0, 1375.0, 883.0, 535.0, 372.0, 264.0, 173.0, 115.0, 66.0, 41.0, 34.0, 25.0, 15.0, 12.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0], "bins": [-15.703125, -15.21826171875, -14.7333984375, -14.24853515625, -13.763671875, -13.27880859375, -12.7939453125, -12.30908203125, -11.82421875, -11.33935546875, -10.8544921875, -10.36962890625, -9.884765625, -9.39990234375, -8.9150390625, -8.43017578125, -7.9453125, -7.46044921875, -6.9755859375, -6.49072265625, -6.005859375, -5.52099609375, -5.0361328125, -4.55126953125, -4.06640625, -3.58154296875, -3.0966796875, -2.61181640625, -2.126953125, -1.64208984375, -1.1572265625, -0.67236328125, -0.1875, 0.29736328125, 0.7822265625, 1.26708984375, 1.751953125, 2.23681640625, 2.7216796875, 3.20654296875, 3.69140625, 4.17626953125, 4.6611328125, 5.14599609375, 5.630859375, 6.11572265625, 6.6005859375, 7.08544921875, 7.5703125, 8.05517578125, 8.5400390625, 9.02490234375, 9.509765625, 9.99462890625, 10.4794921875, 10.96435546875, 11.44921875, 11.93408203125, 12.4189453125, 12.90380859375, 13.388671875, 13.87353515625, 14.3583984375, 14.84326171875, 15.328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 2.0, 7.0, 3.0, 12.0, 12.0, 16.0, 23.0, 14.0, 18.0, 28.0, 34.0, 40.0, 34.0, 33.0, 46.0, 31.0, 46.0, 64.0, 47.0, 41.0, 36.0, 33.0, 44.0, 35.0, 36.0, 38.0, 27.0, 39.0, 31.0, 21.0, 14.0, 17.0, 10.0, 14.0, 13.0, 3.0, 8.0, 8.0, 10.0, 3.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.67236328125, -13.2666015625, -12.86083984375, -12.455078125, -12.04931640625, -11.6435546875, -11.23779296875, -10.83203125, -10.42626953125, -10.0205078125, -9.61474609375, -9.208984375, -8.80322265625, -8.3974609375, -7.99169921875, -7.5859375, -7.18017578125, -6.7744140625, -6.36865234375, -5.962890625, -5.55712890625, -5.1513671875, -4.74560546875, -4.33984375, -3.93408203125, -3.5283203125, -3.12255859375, -2.716796875, -2.31103515625, -1.9052734375, -1.49951171875, -1.09375, -0.68798828125, -0.2822265625, 0.12353515625, 0.529296875, 0.93505859375, 1.3408203125, 1.74658203125, 2.15234375, 2.55810546875, 2.9638671875, 3.36962890625, 3.775390625, 4.18115234375, 4.5869140625, 4.99267578125, 5.3984375, 5.80419921875, 6.2099609375, 6.61572265625, 7.021484375, 7.42724609375, 7.8330078125, 8.23876953125, 8.64453125, 9.05029296875, 9.4560546875, 9.86181640625, 10.267578125, 10.67333984375, 11.0791015625, 11.48486328125, 11.890625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 16.0, 18.0, 24.0, 31.0, 68.0, 74.0, 88.0, 146.0, 181.0, 279.0, 368.0, 575.0, 892.0, 1270.0, 2101.0, 3865.0, 7845.0, 22199.0, 93456.0, 423680.0, 376713.0, 78360.0, 19700.0, 7292.0, 3471.0, 1902.0, 1290.0, 809.0, 567.0, 375.0, 256.0, 173.0, 131.0, 88.0, 75.0, 44.0, 40.0, 23.0, 19.0, 16.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.5625, -39.1611328125, -37.759765625, -36.3583984375, -34.95703125, -33.5556640625, -32.154296875, -30.7529296875, -29.3515625, -27.9501953125, -26.548828125, -25.1474609375, -23.74609375, -22.3447265625, -20.943359375, -19.5419921875, -18.140625, -16.7392578125, -15.337890625, -13.9365234375, -12.53515625, -11.1337890625, -9.732421875, -8.3310546875, -6.9296875, -5.5283203125, -4.126953125, -2.7255859375, -1.32421875, 0.0771484375, 1.478515625, 2.8798828125, 4.28125, 5.6826171875, 7.083984375, 8.4853515625, 9.88671875, 11.2880859375, 12.689453125, 14.0908203125, 15.4921875, 16.8935546875, 18.294921875, 19.6962890625, 21.09765625, 22.4990234375, 23.900390625, 25.3017578125, 26.703125, 28.1044921875, 29.505859375, 30.9072265625, 32.30859375, 33.7099609375, 35.111328125, 36.5126953125, 37.9140625, 39.3154296875, 40.716796875, 42.1181640625, 43.51953125, 44.9208984375, 46.322265625, 47.7236328125, 49.125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 7.0, 10.0, 18.0, 26.0, 46.0, 81.0, 119.0, 156.0, 161.0, 135.0, 81.0, 64.0, 31.0, 22.0, 14.0, 7.0, 6.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024013519287109375, -0.0023057162761688232, -0.002210080623626709, -0.0021144449710845947, -0.0020188093185424805, -0.0019231736660003662, -0.001827538013458252, -0.0017319023609161377, -0.0016362667083740234, -0.0015406310558319092, -0.001444995403289795, -0.0013493597507476807, -0.0012537240982055664, -0.0011580884456634521, -0.0010624527931213379, -0.0009668171405792236, -0.0008711814880371094, -0.0007755458354949951, -0.0006799101829528809, -0.0005842745304107666, -0.0004886388778686523, -0.0003930032253265381, -0.00029736757278442383, -0.00020173192024230957, -0.00010609626770019531, -1.0460615158081055e-05, 8.51750373840332e-05, 0.00018081068992614746, 0.0002764463424682617, 0.000372081995010376, 0.00046771764755249023, 0.0005633533000946045, 0.0006589889526367188, 0.000754624605178833, 0.0008502602577209473, 0.0009458959102630615, 0.0010415315628051758, 0.00113716721534729, 0.0012328028678894043, 0.0013284385204315186, 0.0014240741729736328, 0.001519709825515747, 0.0016153454780578613, 0.0017109811305999756, 0.0018066167831420898, 0.001902252435684204, 0.0019978880882263184, 0.0020935237407684326, 0.002189159393310547, 0.002284795045852661, 0.0023804306983947754, 0.0024760663509368896, 0.002571702003479004, 0.002667337656021118, 0.0027629733085632324, 0.0028586089611053467, 0.002954244613647461, 0.003049880266189575, 0.0031455159187316895, 0.0032411515712738037, 0.003336787223815918, 0.0034324228763580322, 0.0035280585289001465, 0.0036236941814422607, 0.003719329833984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 10.0, 13.0, 14.0, 25.0, 32.0, 43.0, 80.0, 125.0, 208.0, 300.0, 447.0, 649.0, 1079.0, 1722.0, 2869.0, 4721.0, 8032.0, 14255.0, 27756.0, 58457.0, 124029.0, 221255.0, 252568.0, 165809.0, 81436.0, 37983.0, 19136.0, 10153.0, 5894.0, 3532.0, 2191.0, 1338.0, 821.0, 560.0, 375.0, 224.0, 135.0, 99.0, 59.0, 39.0, 28.0, 16.0, 8.0, 14.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.609375, -20.007080078125, -19.40478515625, -18.802490234375, -18.2001953125, -17.597900390625, -16.99560546875, -16.393310546875, -15.791015625, -15.188720703125, -14.58642578125, -13.984130859375, -13.3818359375, -12.779541015625, -12.17724609375, -11.574951171875, -10.97265625, -10.370361328125, -9.76806640625, -9.165771484375, -8.5634765625, -7.961181640625, -7.35888671875, -6.756591796875, -6.154296875, -5.552001953125, -4.94970703125, -4.347412109375, -3.7451171875, -3.142822265625, -2.54052734375, -1.938232421875, -1.3359375, -0.733642578125, -0.13134765625, 0.470947265625, 1.0732421875, 1.675537109375, 2.27783203125, 2.880126953125, 3.482421875, 4.084716796875, 4.68701171875, 5.289306640625, 5.8916015625, 6.493896484375, 7.09619140625, 7.698486328125, 8.30078125, 8.903076171875, 9.50537109375, 10.107666015625, 10.7099609375, 11.312255859375, 11.91455078125, 12.516845703125, 13.119140625, 13.721435546875, 14.32373046875, 14.926025390625, 15.5283203125, 16.130615234375, 16.73291015625, 17.335205078125, 17.9375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 6.0, 9.0, 11.0, 13.0, 13.0, 26.0, 13.0, 30.0, 41.0, 41.0, 61.0, 82.0, 61.0, 64.0, 62.0, 81.0, 81.0, 58.0, 43.0, 43.0, 33.0, 34.0, 18.0, 20.0, 17.0, 9.0, 6.0, 5.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.80078125, -6.59033203125, -6.3798828125, -6.16943359375, -5.958984375, -5.74853515625, -5.5380859375, -5.32763671875, -5.1171875, -4.90673828125, -4.6962890625, -4.48583984375, -4.275390625, -4.06494140625, -3.8544921875, -3.64404296875, -3.43359375, -3.22314453125, -3.0126953125, -2.80224609375, -2.591796875, -2.38134765625, -2.1708984375, -1.96044921875, -1.75, -1.53955078125, -1.3291015625, -1.11865234375, -0.908203125, -0.69775390625, -0.4873046875, -0.27685546875, -0.06640625, 0.14404296875, 0.3544921875, 0.56494140625, 0.775390625, 0.98583984375, 1.1962890625, 1.40673828125, 1.6171875, 1.82763671875, 2.0380859375, 2.24853515625, 2.458984375, 2.66943359375, 2.8798828125, 3.09033203125, 3.30078125, 3.51123046875, 3.7216796875, 3.93212890625, 4.142578125, 4.35302734375, 4.5634765625, 4.77392578125, 4.984375, 5.19482421875, 5.4052734375, 5.61572265625, 5.826171875, 6.03662109375, 6.2470703125, 6.45751953125, 6.66796875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 5.0, 9.0, 18.0, 15.0, 26.0, 21.0, 40.0, 31.0, 44.0, 49.0, 65.0, 44.0, 55.0, 66.0, 70.0, 60.0, 64.0, 54.0, 44.0, 36.0, 30.0, 26.0, 27.0, 15.0, 15.0, 18.0, 8.0, 13.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.826841354370117, -22.11463165283203, -21.402421951293945, -20.690210342407227, -19.97800064086914, -19.265790939331055, -18.55358123779297, -17.84136962890625, -17.129159927368164, -16.416950225830078, -15.704739570617676, -14.99252986907959, -14.280319213867188, -13.568109512329102, -12.855899810791016, -12.143689155578613, -11.431479454040527, -10.719269752502441, -10.007059097290039, -9.294849395751953, -8.58263874053955, -7.870429039001465, -7.158218860626221, -6.446008682250977, -5.733798503875732, -5.021588325500488, -4.309378147125244, -3.597168207168579, -2.884958028793335, -2.172747850418091, -1.4605379104614258, -0.7483277320861816, -0.0361175537109375, 0.6760925650596619, 1.3883026838302612, 2.100512742996216, 2.81272292137146, 3.524933099746704, 4.237143039703369, 4.949353218078613, 5.661563396453857, 6.373773574829102, 7.085983753204346, 7.79819393157959, 8.510403633117676, 9.222614288330078, 9.934823989868164, 10.64703369140625, 11.359244346618652, 12.071454048156738, 12.78366470336914, 13.495874404907227, 14.208085060119629, 14.920294761657715, 15.632505416870117, 16.344715118408203, 17.05692481994629, 17.769134521484375, 18.48134422302246, 19.19355583190918, 19.905765533447266, 20.61797523498535, 21.330184936523438, 22.042396545410156, 22.754606246948242]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 7.0, 6.0, 14.0, 15.0, 18.0, 14.0, 12.0, 35.0, 25.0, 23.0, 34.0, 33.0, 47.0, 36.0, 32.0, 45.0, 31.0, 45.0, 44.0, 43.0, 46.0, 38.0, 39.0, 34.0, 34.0, 21.0, 29.0, 20.0, 23.0, 18.0, 16.0, 13.0, 21.0, 12.0, 11.0, 12.0, 7.0, 10.0, 12.0, 4.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.465261459350586, -18.8212890625, -18.17731475830078, -17.533342361450195, -16.88936996459961, -16.245397567749023, -15.601424217224121, -14.957450866699219, -14.313478469848633, -13.669506072998047, -13.025532722473145, -12.381559371948242, -11.737586975097656, -11.09361457824707, -10.449641227722168, -9.805667877197266, -9.16169548034668, -8.517723083496094, -7.873749732971191, -7.229776859283447, -6.585803985595703, -5.941831111907959, -5.297858238220215, -4.653885364532471, -4.009912490844727, -3.3659396171569824, -2.7219667434692383, -2.077993869781494, -1.43402099609375, -0.7900481224060059, -0.14607524871826172, 0.4978976249694824, 1.1418724060058594, 1.7858452796936035, 2.4298181533813477, 3.073791027069092, 3.717763900756836, 4.36173677444458, 5.005709648132324, 5.649682521820068, 6.2936553955078125, 6.937628269195557, 7.581601142883301, 8.225574493408203, 8.869546890258789, 9.513519287109375, 10.157492637634277, 10.80146598815918, 11.445438385009766, 12.089410781860352, 12.733384132385254, 13.377357482910156, 14.021329879760742, 14.665302276611328, 15.30927562713623, 15.953248977661133, 16.59722137451172, 17.241193771362305, 17.88516616821289, 18.52914047241211, 19.173112869262695, 19.81708526611328, 20.4610595703125, 21.105031967163086, 21.749004364013672]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 9.0, 10.0, 7.0, 24.0, 34.0, 66.0, 91.0, 118.0, 198.0, 323.0, 530.0, 835.0, 1370.0, 2222.0, 3526.0, 5884.0, 9290.0, 14941.0, 24227.0, 39596.0, 63509.0, 101642.0, 160864.0, 246675.0, 360717.0, 481444.0, 565720.0, 568082.0, 486516.0, 364521.0, 251697.0, 164075.0, 104040.0, 65516.0, 40663.0, 24938.0, 15312.0, 9530.0, 5735.0, 3617.0, 2218.0, 1435.0, 885.0, 598.0, 358.0, 238.0, 163.0, 106.0, 65.0, 36.0, 30.0, 17.0, 10.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0], "bins": [-13.3828125, -12.96484375, -12.546875, -12.12890625, -11.7109375, -11.29296875, -10.875, -10.45703125, -10.0390625, -9.62109375, -9.203125, -8.78515625, -8.3671875, -7.94921875, -7.53125, -7.11328125, -6.6953125, -6.27734375, -5.859375, -5.44140625, -5.0234375, -4.60546875, -4.1875, -3.76953125, -3.3515625, -2.93359375, -2.515625, -2.09765625, -1.6796875, -1.26171875, -0.84375, -0.42578125, -0.0078125, 0.41015625, 0.828125, 1.24609375, 1.6640625, 2.08203125, 2.5, 2.91796875, 3.3359375, 3.75390625, 4.171875, 4.58984375, 5.0078125, 5.42578125, 5.84375, 6.26171875, 6.6796875, 7.09765625, 7.515625, 7.93359375, 8.3515625, 8.76953125, 9.1875, 9.60546875, 10.0234375, 10.44140625, 10.859375, 11.27734375, 11.6953125, 12.11328125, 12.53125, 12.94921875, 13.3671875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 9.0, 7.0, 8.0, 7.0, 11.0, 8.0, 13.0, 16.0, 16.0, 31.0, 35.0, 24.0, 36.0, 35.0, 22.0, 41.0, 33.0, 28.0, 44.0, 39.0, 49.0, 30.0, 44.0, 43.0, 33.0, 45.0, 35.0, 29.0, 21.0, 31.0, 27.0, 18.0, 13.0, 20.0, 13.0, 13.0, 17.0, 13.0, 7.0, 6.0, 7.0, 7.0, 2.0, 8.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.078125, -11.673095703125, -11.26806640625, -10.863037109375, -10.4580078125, -10.052978515625, -9.64794921875, -9.242919921875, -8.837890625, -8.432861328125, -8.02783203125, -7.622802734375, -7.2177734375, -6.812744140625, -6.40771484375, -6.002685546875, -5.59765625, -5.192626953125, -4.78759765625, -4.382568359375, -3.9775390625, -3.572509765625, -3.16748046875, -2.762451171875, -2.357421875, -1.952392578125, -1.54736328125, -1.142333984375, -0.7373046875, -0.332275390625, 0.07275390625, 0.477783203125, 0.8828125, 1.287841796875, 1.69287109375, 2.097900390625, 2.5029296875, 2.907958984375, 3.31298828125, 3.718017578125, 4.123046875, 4.528076171875, 4.93310546875, 5.338134765625, 5.7431640625, 6.148193359375, 6.55322265625, 6.958251953125, 7.36328125, 7.768310546875, 8.17333984375, 8.578369140625, 8.9833984375, 9.388427734375, 9.79345703125, 10.198486328125, 10.603515625, 11.008544921875, 11.41357421875, 11.818603515625, 12.2236328125, 12.628662109375, 13.03369140625, 13.438720703125, 13.84375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 18.0, 21.0, 40.0, 65.0, 93.0, 145.0, 217.0, 416.0, 710.0, 1074.0, 1724.0, 3057.0, 4802.0, 7950.0, 13037.0, 21641.0, 35154.0, 56996.0, 90990.0, 140853.0, 213103.0, 304964.0, 406012.0, 491743.0, 529541.0, 500564.0, 420543.0, 318897.0, 224502.0, 150810.0, 96934.0, 60611.0, 37705.0, 23286.0, 13940.0, 8534.0, 5298.0, 3131.0, 1994.0, 1230.0, 706.0, 428.0, 294.0, 170.0, 104.0, 86.0, 48.0, 29.0, 27.0, 13.0, 8.0, 5.0, 1.0, 5.0, 1.0, 2.0], "bins": [-12.4609375, -12.078369140625, -11.69580078125, -11.313232421875, -10.9306640625, -10.548095703125, -10.16552734375, -9.782958984375, -9.400390625, -9.017822265625, -8.63525390625, -8.252685546875, -7.8701171875, -7.487548828125, -7.10498046875, -6.722412109375, -6.33984375, -5.957275390625, -5.57470703125, -5.192138671875, -4.8095703125, -4.427001953125, -4.04443359375, -3.661865234375, -3.279296875, -2.896728515625, -2.51416015625, -2.131591796875, -1.7490234375, -1.366455078125, -0.98388671875, -0.601318359375, -0.21875, 0.163818359375, 0.54638671875, 0.928955078125, 1.3115234375, 1.694091796875, 2.07666015625, 2.459228515625, 2.841796875, 3.224365234375, 3.60693359375, 3.989501953125, 4.3720703125, 4.754638671875, 5.13720703125, 5.519775390625, 5.90234375, 6.284912109375, 6.66748046875, 7.050048828125, 7.4326171875, 7.815185546875, 8.19775390625, 8.580322265625, 8.962890625, 9.345458984375, 9.72802734375, 10.110595703125, 10.4931640625, 10.875732421875, 11.25830078125, 11.640869140625, 12.0234375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 10.0, 7.0, 14.0, 12.0, 17.0, 17.0, 34.0, 37.0, 39.0, 56.0, 72.0, 95.0, 100.0, 117.0, 127.0, 183.0, 167.0, 215.0, 178.0, 232.0, 220.0, 230.0, 230.0, 214.0, 188.0, 163.0, 159.0, 167.0, 127.0, 118.0, 107.0, 83.0, 55.0, 55.0, 48.0, 40.0, 41.0, 32.0, 13.0, 15.0, 15.0, 8.0, 9.0, 5.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.7734375, -5.57672119140625, -5.3800048828125, -5.18328857421875, -4.986572265625, -4.78985595703125, -4.5931396484375, -4.39642333984375, -4.19970703125, -4.00299072265625, -3.8062744140625, -3.60955810546875, -3.412841796875, -3.21612548828125, -3.0194091796875, -2.82269287109375, -2.6259765625, -2.42926025390625, -2.2325439453125, -2.03582763671875, -1.839111328125, -1.64239501953125, -1.4456787109375, -1.24896240234375, -1.05224609375, -0.85552978515625, -0.6588134765625, -0.46209716796875, -0.265380859375, -0.06866455078125, 0.1280517578125, 0.32476806640625, 0.521484375, 0.71820068359375, 0.9149169921875, 1.11163330078125, 1.308349609375, 1.50506591796875, 1.7017822265625, 1.89849853515625, 2.09521484375, 2.29193115234375, 2.4886474609375, 2.68536376953125, 2.882080078125, 3.07879638671875, 3.2755126953125, 3.47222900390625, 3.6689453125, 3.86566162109375, 4.0623779296875, 4.25909423828125, 4.455810546875, 4.65252685546875, 4.8492431640625, 5.04595947265625, 5.24267578125, 5.43939208984375, 5.6361083984375, 5.83282470703125, 6.029541015625, 6.22625732421875, 6.4229736328125, 6.61968994140625, 6.81640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 6.0, 3.0, 5.0, 9.0, 11.0, 18.0, 17.0, 20.0, 15.0, 42.0, 33.0, 26.0, 53.0, 52.0, 50.0, 70.0, 44.0, 61.0, 58.0, 48.0, 44.0, 39.0, 43.0, 31.0, 32.0, 38.0, 18.0, 22.0, 16.0, 11.0, 7.0, 16.0, 13.0, 3.0, 8.0, 2.0, 1.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-18.666393280029297, -18.12498664855957, -17.58357810974121, -17.042171478271484, -16.500762939453125, -15.959356307983398, -15.417948722839355, -14.876541137695312, -14.335134506225586, -13.793726921081543, -13.2523193359375, -12.710912704467773, -12.16950511932373, -11.628097534179688, -11.086689949035645, -10.545282363891602, -10.003874778747559, -9.462467193603516, -8.921059608459473, -8.37965202331543, -7.838245391845703, -7.29683780670166, -6.755430221557617, -6.214022636413574, -5.6726155281066895, -5.1312079429626465, -4.589800834655762, -4.048393249511719, -3.506985902786255, -2.965578556060791, -2.424170970916748, -1.8827636241912842, -1.341355323791504, -0.7999479174613953, -0.2585405111312866, 0.2828669548034668, 0.8242743015289307, 1.3656816482543945, 1.9070892333984375, 2.4484965801239014, 2.9899039268493652, 3.531311273574829, 4.072718620300293, 4.614126205444336, 5.155533790588379, 5.696940898895264, 6.238348484039307, 6.779755592346191, 7.321163177490234, 7.862570762634277, 8.40397834777832, 8.945384979248047, 9.48679256439209, 10.028200149536133, 10.569607734680176, 11.111015319824219, 11.652421951293945, 12.193829536437988, 12.735237121582031, 13.276643753051758, 13.8180513381958, 14.359458923339844, 14.900866508483887, 15.44227409362793, 15.983681678771973]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 15.0, 10.0, 9.0, 13.0, 12.0, 19.0, 17.0, 19.0, 30.0, 30.0, 28.0, 45.0, 36.0, 40.0, 38.0, 36.0, 38.0, 35.0, 39.0, 40.0, 44.0, 39.0, 52.0, 27.0, 30.0, 31.0, 33.0, 25.0, 25.0, 16.0, 19.0, 21.0, 10.0, 9.0, 10.0, 5.0, 14.0, 5.0, 6.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.412023544311523, -15.893648147583008, -15.375272750854492, -14.85689640045166, -14.338521003723145, -13.820145606994629, -13.301769256591797, -12.783393859863281, -12.265018463134766, -11.74664306640625, -11.228267669677734, -10.709891319274902, -10.191515922546387, -9.673140525817871, -9.154764175415039, -8.636388778686523, -8.118013381958008, -7.599637985229492, -7.081262111663818, -6.5628862380981445, -6.044510841369629, -5.526135444641113, -5.0077595710754395, -4.489383697509766, -3.97100830078125, -3.4526326656341553, -2.9342570304870605, -2.415881395339966, -1.897505760192871, -1.3791301250457764, -0.8607544898986816, -0.3423788547515869, 0.175994873046875, 0.6943705081939697, 1.2127461433410645, 1.7311217784881592, 2.249497413635254, 2.7678730487823486, 3.2862486839294434, 3.804624319076538, 4.322999954223633, 4.841375350952148, 5.359751224517822, 5.878127098083496, 6.396502494812012, 6.914877891540527, 7.433253765106201, 7.951629638671875, 8.47000503540039, 8.988380432128906, 9.506755828857422, 10.025132179260254, 10.54350757598877, 11.061882972717285, 11.580259323120117, 12.098634719848633, 12.617010116577148, 13.135385513305664, 13.65376091003418, 14.172137260437012, 14.690512657165527, 15.208888053894043, 15.727264404296875, 16.24563980102539, 16.764015197753906]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 10.0, 17.0, 33.0, 30.0, 41.0, 51.0, 67.0, 98.0, 112.0, 178.0, 195.0, 336.0, 465.0, 708.0, 1060.0, 1739.0, 3339.0, 6993.0, 17241.0, 47585.0, 140417.0, 334159.0, 304459.0, 119779.0, 40371.0, 15050.0, 6180.0, 3005.0, 1625.0, 1009.0, 636.0, 444.0, 304.0, 211.0, 149.0, 110.0, 89.0, 69.0, 51.0, 39.0, 37.0, 15.0, 18.0, 13.0, 4.0, 0.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-17.28125, -16.75634765625, -16.2314453125, -15.70654296875, -15.181640625, -14.65673828125, -14.1318359375, -13.60693359375, -13.08203125, -12.55712890625, -12.0322265625, -11.50732421875, -10.982421875, -10.45751953125, -9.9326171875, -9.40771484375, -8.8828125, -8.35791015625, -7.8330078125, -7.30810546875, -6.783203125, -6.25830078125, -5.7333984375, -5.20849609375, -4.68359375, -4.15869140625, -3.6337890625, -3.10888671875, -2.583984375, -2.05908203125, -1.5341796875, -1.00927734375, -0.484375, 0.04052734375, 0.5654296875, 1.09033203125, 1.615234375, 2.14013671875, 2.6650390625, 3.18994140625, 3.71484375, 4.23974609375, 4.7646484375, 5.28955078125, 5.814453125, 6.33935546875, 6.8642578125, 7.38916015625, 7.9140625, 8.43896484375, 8.9638671875, 9.48876953125, 10.013671875, 10.53857421875, 11.0634765625, 11.58837890625, 12.11328125, 12.63818359375, 13.1630859375, 13.68798828125, 14.212890625, 14.73779296875, 15.2626953125, 15.78759765625, 16.3125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 9.0, 19.0, 9.0, 15.0, 29.0, 25.0, 31.0, 32.0, 28.0, 42.0, 28.0, 40.0, 40.0, 28.0, 36.0, 38.0, 34.0, 44.0, 42.0, 33.0, 60.0, 38.0, 33.0, 22.0, 27.0, 27.0, 24.0, 16.0, 16.0, 12.0, 12.0, 14.0, 10.0, 9.0, 12.0, 8.0, 7.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-16.359375, -15.839111328125, -15.31884765625, -14.798583984375, -14.2783203125, -13.758056640625, -13.23779296875, -12.717529296875, -12.197265625, -11.677001953125, -11.15673828125, -10.636474609375, -10.1162109375, -9.595947265625, -9.07568359375, -8.555419921875, -8.03515625, -7.514892578125, -6.99462890625, -6.474365234375, -5.9541015625, -5.433837890625, -4.91357421875, -4.393310546875, -3.873046875, -3.352783203125, -2.83251953125, -2.312255859375, -1.7919921875, -1.271728515625, -0.75146484375, -0.231201171875, 0.2890625, 0.809326171875, 1.32958984375, 1.849853515625, 2.3701171875, 2.890380859375, 3.41064453125, 3.930908203125, 4.451171875, 4.971435546875, 5.49169921875, 6.011962890625, 6.5322265625, 7.052490234375, 7.57275390625, 8.093017578125, 8.61328125, 9.133544921875, 9.65380859375, 10.174072265625, 10.6943359375, 11.214599609375, 11.73486328125, 12.255126953125, 12.775390625, 13.295654296875, 13.81591796875, 14.336181640625, 14.8564453125, 15.376708984375, 15.89697265625, 16.417236328125, 16.9375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 16.0, 27.0, 41.0, 64.0, 91.0, 135.0, 211.0, 375.0, 762.0, 1697.0, 4907.0, 19725.0, 112628.0, 542952.0, 302311.0, 47835.0, 9597.0, 2834.0, 1048.0, 484.0, 272.0, 186.0, 102.0, 77.0, 46.0, 41.0, 21.0, 15.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.34375, -22.60888671875, -21.8740234375, -21.13916015625, -20.404296875, -19.66943359375, -18.9345703125, -18.19970703125, -17.46484375, -16.72998046875, -15.9951171875, -15.26025390625, -14.525390625, -13.79052734375, -13.0556640625, -12.32080078125, -11.5859375, -10.85107421875, -10.1162109375, -9.38134765625, -8.646484375, -7.91162109375, -7.1767578125, -6.44189453125, -5.70703125, -4.97216796875, -4.2373046875, -3.50244140625, -2.767578125, -2.03271484375, -1.2978515625, -0.56298828125, 0.171875, 0.90673828125, 1.6416015625, 2.37646484375, 3.111328125, 3.84619140625, 4.5810546875, 5.31591796875, 6.05078125, 6.78564453125, 7.5205078125, 8.25537109375, 8.990234375, 9.72509765625, 10.4599609375, 11.19482421875, 11.9296875, 12.66455078125, 13.3994140625, 14.13427734375, 14.869140625, 15.60400390625, 16.3388671875, 17.07373046875, 17.80859375, 18.54345703125, 19.2783203125, 20.01318359375, 20.748046875, 21.48291015625, 22.2177734375, 22.95263671875, 23.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 3.0, 9.0, 10.0, 11.0, 1.0, 8.0, 17.0, 22.0, 12.0, 24.0, 21.0, 29.0, 18.0, 23.0, 18.0, 28.0, 30.0, 30.0, 39.0, 23.0, 41.0, 31.0, 37.0, 33.0, 25.0, 32.0, 41.0, 32.0, 30.0, 34.0, 30.0, 24.0, 18.0, 25.0, 24.0, 20.0, 19.0, 22.0, 14.0, 5.0, 15.0, 8.0, 15.0, 13.0, 8.0, 5.0, 9.0, 6.0, 0.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.4296875, -10.094970703125, -9.76025390625, -9.425537109375, -9.0908203125, -8.756103515625, -8.42138671875, -8.086669921875, -7.751953125, -7.417236328125, -7.08251953125, -6.747802734375, -6.4130859375, -6.078369140625, -5.74365234375, -5.408935546875, -5.07421875, -4.739501953125, -4.40478515625, -4.070068359375, -3.7353515625, -3.400634765625, -3.06591796875, -2.731201171875, -2.396484375, -2.061767578125, -1.72705078125, -1.392333984375, -1.0576171875, -0.722900390625, -0.38818359375, -0.053466796875, 0.28125, 0.615966796875, 0.95068359375, 1.285400390625, 1.6201171875, 1.954833984375, 2.28955078125, 2.624267578125, 2.958984375, 3.293701171875, 3.62841796875, 3.963134765625, 4.2978515625, 4.632568359375, 4.96728515625, 5.302001953125, 5.63671875, 5.971435546875, 6.30615234375, 6.640869140625, 6.9755859375, 7.310302734375, 7.64501953125, 7.979736328125, 8.314453125, 8.649169921875, 8.98388671875, 9.318603515625, 9.6533203125, 9.988037109375, 10.32275390625, 10.657470703125, 10.9921875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 12.0, 22.0, 25.0, 41.0, 67.0, 86.0, 146.0, 214.0, 344.0, 566.0, 941.0, 1720.0, 3306.0, 7027.0, 16627.0, 46706.0, 154290.0, 414136.0, 273805.0, 81389.0, 26411.0, 10402.0, 4724.0, 2346.0, 1273.0, 719.0, 431.0, 262.0, 189.0, 101.0, 61.0, 58.0, 25.0, 24.0, 17.0, 10.0, 12.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3671875, -4.2203369140625, -4.073486328125, -3.9266357421875, -3.77978515625, -3.6329345703125, -3.486083984375, -3.3392333984375, -3.1923828125, -3.0455322265625, -2.898681640625, -2.7518310546875, -2.60498046875, -2.4581298828125, -2.311279296875, -2.1644287109375, -2.017578125, -1.8707275390625, -1.723876953125, -1.5770263671875, -1.43017578125, -1.2833251953125, -1.136474609375, -0.9896240234375, -0.8427734375, -0.6959228515625, -0.549072265625, -0.4022216796875, -0.25537109375, -0.1085205078125, 0.038330078125, 0.1851806640625, 0.33203125, 0.4788818359375, 0.625732421875, 0.7725830078125, 0.91943359375, 1.0662841796875, 1.213134765625, 1.3599853515625, 1.5068359375, 1.6536865234375, 1.800537109375, 1.9473876953125, 2.09423828125, 2.2410888671875, 2.387939453125, 2.5347900390625, 2.681640625, 2.8284912109375, 2.975341796875, 3.1221923828125, 3.26904296875, 3.4158935546875, 3.562744140625, 3.7095947265625, 3.8564453125, 4.0032958984375, 4.150146484375, 4.2969970703125, 4.44384765625, 4.5906982421875, 4.737548828125, 4.8843994140625, 5.03125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 8.0, 22.0, 28.0, 38.0, 91.0, 128.0, 156.0, 165.0, 115.0, 82.0, 44.0, 25.0, 21.0, 15.0, 6.0, 12.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038433074951171875, -0.0003683045506477356, -0.00035227835178375244, -0.0003362521529197693, -0.00032022595405578613, -0.000304199755191803, -0.0002881735563278198, -0.00027214735746383667, -0.0002561211585998535, -0.00024009495973587036, -0.0002240687608718872, -0.00020804256200790405, -0.0001920163631439209, -0.00017599016427993774, -0.0001599639654159546, -0.00014393776655197144, -0.00012791156768798828, -0.00011188536882400513, -9.585916996002197e-05, -7.983297109603882e-05, -6.380677223205566e-05, -4.778057336807251e-05, -3.1754374504089355e-05, -1.57281756401062e-05, 2.980232238769531e-07, 1.6324222087860107e-05, 3.235042095184326e-05, 4.8376619815826416e-05, 6.440281867980957e-05, 8.042901754379272e-05, 9.645521640777588e-05, 0.00011248141527175903, 0.0001285076141357422, 0.00014453381299972534, 0.0001605600118637085, 0.00017658621072769165, 0.0001926124095916748, 0.00020863860845565796, 0.0002246648073196411, 0.00024069100618362427, 0.0002567172050476074, 0.0002727434039115906, 0.00028876960277557373, 0.0003047958016395569, 0.00032082200050354004, 0.0003368481993675232, 0.00035287439823150635, 0.0003689005970954895, 0.00038492679595947266, 0.0004009529948234558, 0.00041697919368743896, 0.0004330053925514221, 0.0004490315914154053, 0.00046505779027938843, 0.0004810839891433716, 0.0004971101880073547, 0.0005131363868713379, 0.000529162585735321, 0.0005451887845993042, 0.0005612149834632874, 0.0005772411823272705, 0.0005932673811912537, 0.0006092935800552368, 0.00062531977891922, 0.0006413459777832031]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 13.0, 10.0, 13.0, 17.0, 33.0, 53.0, 66.0, 87.0, 121.0, 171.0, 256.0, 398.0, 541.0, 769.0, 1108.0, 1587.0, 2365.0, 3524.0, 5345.0, 8296.0, 12541.0, 19696.0, 32207.0, 52849.0, 86262.0, 137710.0, 186912.0, 175593.0, 121716.0, 74855.0, 45351.0, 27722.0, 17411.0, 11023.0, 7121.0, 4798.0, 3089.0, 2178.0, 1436.0, 1050.0, 694.0, 468.0, 304.0, 254.0, 162.0, 121.0, 86.0, 60.0, 52.0, 27.0, 15.0, 12.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0], "bins": [-2.859375, -2.7723388671875, -2.685302734375, -2.5982666015625, -2.51123046875, -2.4241943359375, -2.337158203125, -2.2501220703125, -2.1630859375, -2.0760498046875, -1.989013671875, -1.9019775390625, -1.81494140625, -1.7279052734375, -1.640869140625, -1.5538330078125, -1.466796875, -1.3797607421875, -1.292724609375, -1.2056884765625, -1.11865234375, -1.0316162109375, -0.944580078125, -0.8575439453125, -0.7705078125, -0.6834716796875, -0.596435546875, -0.5093994140625, -0.42236328125, -0.3353271484375, -0.248291015625, -0.1612548828125, -0.07421875, 0.0128173828125, 0.099853515625, 0.1868896484375, 0.27392578125, 0.3609619140625, 0.447998046875, 0.5350341796875, 0.6220703125, 0.7091064453125, 0.796142578125, 0.8831787109375, 0.97021484375, 1.0572509765625, 1.144287109375, 1.2313232421875, 1.318359375, 1.4053955078125, 1.492431640625, 1.5794677734375, 1.66650390625, 1.7535400390625, 1.840576171875, 1.9276123046875, 2.0146484375, 2.1016845703125, 2.188720703125, 2.2757568359375, 2.36279296875, 2.4498291015625, 2.536865234375, 2.6239013671875, 2.7109375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 10.0, 10.0, 6.0, 12.0, 8.0, 8.0, 15.0, 25.0, 24.0, 24.0, 25.0, 44.0, 50.0, 44.0, 51.0, 57.0, 58.0, 63.0, 40.0, 45.0, 58.0, 38.0, 43.0, 33.0, 27.0, 25.0, 20.0, 26.0, 22.0, 13.0, 16.0, 12.0, 7.0, 5.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1138916015625, -1.077392578125, -1.0408935546875, -1.00439453125, -0.9678955078125, -0.931396484375, -0.8948974609375, -0.8583984375, -0.8218994140625, -0.785400390625, -0.7489013671875, -0.71240234375, -0.6759033203125, -0.639404296875, -0.6029052734375, -0.56640625, -0.5299072265625, -0.493408203125, -0.4569091796875, -0.42041015625, -0.3839111328125, -0.347412109375, -0.3109130859375, -0.2744140625, -0.2379150390625, -0.201416015625, -0.1649169921875, -0.12841796875, -0.0919189453125, -0.055419921875, -0.0189208984375, 0.017578125, 0.0540771484375, 0.090576171875, 0.1270751953125, 0.16357421875, 0.2000732421875, 0.236572265625, 0.2730712890625, 0.3095703125, 0.3460693359375, 0.382568359375, 0.4190673828125, 0.45556640625, 0.4920654296875, 0.528564453125, 0.5650634765625, 0.6015625, 0.6380615234375, 0.674560546875, 0.7110595703125, 0.74755859375, 0.7840576171875, 0.820556640625, 0.8570556640625, 0.8935546875, 0.9300537109375, 0.966552734375, 1.0030517578125, 1.03955078125, 1.0760498046875, 1.112548828125, 1.1490478515625, 1.185546875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 1.0, 4.0, 7.0, 10.0, 14.0, 18.0, 16.0, 10.0, 28.0, 28.0, 35.0, 30.0, 37.0, 50.0, 54.0, 58.0, 56.0, 68.0, 50.0, 48.0, 40.0, 41.0, 46.0, 39.0, 41.0, 24.0, 21.0, 24.0, 19.0, 10.0, 17.0, 11.0, 11.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-18.613073348999023, -18.07569694519043, -17.53832244873047, -17.000946044921875, -16.46356964111328, -15.926193237304688, -15.38881778717041, -14.851442337036133, -14.314065933227539, -13.776689529418945, -13.239314079284668, -12.70193862915039, -12.164562225341797, -11.627185821533203, -11.089810371398926, -10.552434921264648, -10.015058517456055, -9.477682113647461, -8.940306663513184, -8.402931213378906, -7.8655548095703125, -7.328178882598877, -6.790802955627441, -6.253427028656006, -5.71605110168457, -5.178675174713135, -4.641299247741699, -4.103923320770264, -3.566547393798828, -3.0291714668273926, -2.491795539855957, -1.9544196128845215, -1.4170417785644531, -0.8796658515930176, -0.34228992462158203, 0.19508600234985352, 0.7324619293212891, 1.2698378562927246, 1.8072137832641602, 2.3445897102355957, 2.8819656372070312, 3.419341564178467, 3.9567174911499023, 4.494093418121338, 5.031469345092773, 5.568845272064209, 6.1062211990356445, 6.64359712600708, 7.180973052978516, 7.718348979949951, 8.255724906921387, 8.793100357055664, 9.330476760864258, 9.867853164672852, 10.405228614807129, 10.942604064941406, 11.47998046875, 12.017356872558594, 12.554732322692871, 13.092107772827148, 13.629484176635742, 14.166860580444336, 14.704236030578613, 15.24161148071289, 15.778987884521484]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 18.0, 10.0, 9.0, 10.0, 14.0, 14.0, 15.0, 22.0, 22.0, 36.0, 29.0, 39.0, 42.0, 35.0, 44.0, 30.0, 34.0, 36.0, 39.0, 36.0, 43.0, 38.0, 49.0, 38.0, 28.0, 33.0, 33.0, 26.0, 24.0, 22.0, 13.0, 22.0, 11.0, 14.0, 8.0, 12.0, 6.0, 10.0, 6.0, 6.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-16.14914321899414, -15.641006469726562, -15.1328706741333, -14.624733924865723, -14.116598129272461, -13.608461380004883, -13.100324630737305, -12.592187881469727, -12.084052085876465, -11.575915336608887, -11.067779541015625, -10.559642791748047, -10.051506042480469, -9.543370246887207, -9.035233497619629, -8.527097702026367, -8.018960952758789, -7.510824680328369, -7.002688407897949, -6.494551658630371, -5.986415386199951, -5.478279113769531, -4.970142364501953, -4.462006092071533, -3.9538698196411133, -3.4457335472106934, -2.9375970363616943, -2.4294605255126953, -1.9213242530822754, -1.4131879806518555, -0.9050514698028564, -0.3969149589538574, 0.1112213134765625, 0.619357705116272, 1.1274940967559814, 1.635630488395691, 2.1437668800354004, 2.6519031524658203, 3.1600396633148193, 3.6681761741638184, 4.176312446594238, 4.684448719024658, 5.192584991455078, 5.700721740722656, 6.208858013153076, 6.716994285583496, 7.225131034851074, 7.733267307281494, 8.241403579711914, 8.749540328979492, 9.257676124572754, 9.765812873840332, 10.273948669433594, 10.782085418701172, 11.29022216796875, 11.798358917236328, 12.30649471282959, 12.814631462097168, 13.32276725769043, 13.830904006958008, 14.339040756225586, 14.847176551818848, 15.355313301086426, 15.863449096679688, 16.371585845947266]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 9.0, 4.0, 13.0, 12.0, 22.0, 39.0, 58.0, 109.0, 152.0, 268.0, 389.0, 625.0, 1025.0, 1684.0, 2691.0, 4392.0, 6877.0, 10995.0, 17165.0, 26466.0, 39476.0, 56927.0, 78198.0, 98787.0, 115531.0, 122056.0, 115852.0, 99784.0, 77976.0, 57695.0, 39941.0, 26649.0, 17348.0, 11020.0, 7037.0, 4297.0, 2656.0, 1651.0, 983.0, 634.0, 401.0, 240.0, 162.0, 109.0, 61.0, 42.0, 32.0, 13.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.2421875, -12.7777099609375, -12.313232421875, -11.8487548828125, -11.38427734375, -10.9197998046875, -10.455322265625, -9.9908447265625, -9.5263671875, -9.0618896484375, -8.597412109375, -8.1329345703125, -7.66845703125, -7.2039794921875, -6.739501953125, -6.2750244140625, -5.810546875, -5.3460693359375, -4.881591796875, -4.4171142578125, -3.95263671875, -3.4881591796875, -3.023681640625, -2.5592041015625, -2.0947265625, -1.6302490234375, -1.165771484375, -0.7012939453125, -0.23681640625, 0.2276611328125, 0.692138671875, 1.1566162109375, 1.62109375, 2.0855712890625, 2.550048828125, 3.0145263671875, 3.47900390625, 3.9434814453125, 4.407958984375, 4.8724365234375, 5.3369140625, 5.8013916015625, 6.265869140625, 6.7303466796875, 7.19482421875, 7.6593017578125, 8.123779296875, 8.5882568359375, 9.052734375, 9.5172119140625, 9.981689453125, 10.4461669921875, 10.91064453125, 11.3751220703125, 11.839599609375, 12.3040771484375, 12.7685546875, 13.2330322265625, 13.697509765625, 14.1619873046875, 14.62646484375, 15.0909423828125, 15.555419921875, 16.0198974609375, 16.484375]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 4.0, 11.0, 4.0, 19.0, 18.0, 15.0, 14.0, 18.0, 23.0, 24.0, 28.0, 42.0, 35.0, 39.0, 43.0, 36.0, 35.0, 43.0, 38.0, 27.0, 45.0, 35.0, 53.0, 43.0, 26.0, 34.0, 28.0, 33.0, 32.0, 23.0, 13.0, 21.0, 15.0, 13.0, 14.0, 11.0, 7.0, 6.0, 5.0, 7.0, 6.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.490234375, -14.99609375, -14.501953125, -14.0078125, -13.513671875, -13.01953125, -12.525390625, -12.03125, -11.537109375, -11.04296875, -10.548828125, -10.0546875, -9.560546875, -9.06640625, -8.572265625, -8.078125, -7.583984375, -7.08984375, -6.595703125, -6.1015625, -5.607421875, -5.11328125, -4.619140625, -4.125, -3.630859375, -3.13671875, -2.642578125, -2.1484375, -1.654296875, -1.16015625, -0.666015625, -0.171875, 0.322265625, 0.81640625, 1.310546875, 1.8046875, 2.298828125, 2.79296875, 3.287109375, 3.78125, 4.275390625, 4.76953125, 5.263671875, 5.7578125, 6.251953125, 6.74609375, 7.240234375, 7.734375, 8.228515625, 8.72265625, 9.216796875, 9.7109375, 10.205078125, 10.69921875, 11.193359375, 11.6875, 12.181640625, 12.67578125, 13.169921875, 13.6640625, 14.158203125, 14.65234375, 15.146484375, 15.640625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 17.0, 24.0, 48.0, 52.0, 89.0, 155.0, 221.0, 347.0, 579.0, 950.0, 1519.0, 2428.0, 3986.0, 6254.0, 10164.0, 15764.0, 25148.0, 38052.0, 56044.0, 77274.0, 100805.0, 119826.0, 126658.0, 119940.0, 101112.0, 77827.0, 56190.0, 38207.0, 25400.0, 16246.0, 10212.0, 6416.0, 4032.0, 2449.0, 1592.0, 969.0, 585.0, 356.0, 216.0, 160.0, 84.0, 55.0, 39.0, 16.0, 15.0, 14.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.765625, -13.314453125, -12.86328125, -12.412109375, -11.9609375, -11.509765625, -11.05859375, -10.607421875, -10.15625, -9.705078125, -9.25390625, -8.802734375, -8.3515625, -7.900390625, -7.44921875, -6.998046875, -6.546875, -6.095703125, -5.64453125, -5.193359375, -4.7421875, -4.291015625, -3.83984375, -3.388671875, -2.9375, -2.486328125, -2.03515625, -1.583984375, -1.1328125, -0.681640625, -0.23046875, 0.220703125, 0.671875, 1.123046875, 1.57421875, 2.025390625, 2.4765625, 2.927734375, 3.37890625, 3.830078125, 4.28125, 4.732421875, 5.18359375, 5.634765625, 6.0859375, 6.537109375, 6.98828125, 7.439453125, 7.890625, 8.341796875, 8.79296875, 9.244140625, 9.6953125, 10.146484375, 10.59765625, 11.048828125, 11.5, 11.951171875, 12.40234375, 12.853515625, 13.3046875, 13.755859375, 14.20703125, 14.658203125, 15.109375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 6.0, 4.0, 4.0, 12.0, 12.0, 16.0, 15.0, 19.0, 18.0, 26.0, 33.0, 32.0, 34.0, 39.0, 25.0, 34.0, 45.0, 40.0, 45.0, 48.0, 47.0, 48.0, 37.0, 43.0, 31.0, 37.0, 36.0, 21.0, 33.0, 24.0, 18.0, 24.0, 17.0, 15.0, 13.0, 5.0, 11.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.875, -11.5216064453125, -11.168212890625, -10.8148193359375, -10.46142578125, -10.1080322265625, -9.754638671875, -9.4012451171875, -9.0478515625, -8.6944580078125, -8.341064453125, -7.9876708984375, -7.63427734375, -7.2808837890625, -6.927490234375, -6.5740966796875, -6.220703125, -5.8673095703125, -5.513916015625, -5.1605224609375, -4.80712890625, -4.4537353515625, -4.100341796875, -3.7469482421875, -3.3935546875, -3.0401611328125, -2.686767578125, -2.3333740234375, -1.97998046875, -1.6265869140625, -1.273193359375, -0.9197998046875, -0.56640625, -0.2130126953125, 0.140380859375, 0.4937744140625, 0.84716796875, 1.2005615234375, 1.553955078125, 1.9073486328125, 2.2607421875, 2.6141357421875, 2.967529296875, 3.3209228515625, 3.67431640625, 4.0277099609375, 4.381103515625, 4.7344970703125, 5.087890625, 5.4412841796875, 5.794677734375, 6.1480712890625, 6.50146484375, 6.8548583984375, 7.208251953125, 7.5616455078125, 7.9150390625, 8.2684326171875, 8.621826171875, 8.9752197265625, 9.32861328125, 9.6820068359375, 10.035400390625, 10.3887939453125, 10.7421875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 11.0, 11.0, 20.0, 36.0, 51.0, 83.0, 123.0, 194.0, 262.0, 433.0, 635.0, 980.0, 1642.0, 2732.0, 4301.0, 6999.0, 11850.0, 20238.0, 34121.0, 57769.0, 94590.0, 139592.0, 172753.0, 166359.0, 126872.0, 82848.0, 49945.0, 29473.0, 17424.0, 10027.0, 6242.0, 3743.0, 2254.0, 1390.0, 876.0, 591.0, 375.0, 239.0, 169.0, 105.0, 74.0, 38.0, 26.0, 21.0, 12.0, 12.0, 7.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3671875, -11.0103759765625, -10.653564453125, -10.2967529296875, -9.93994140625, -9.5831298828125, -9.226318359375, -8.8695068359375, -8.5126953125, -8.1558837890625, -7.799072265625, -7.4422607421875, -7.08544921875, -6.7286376953125, -6.371826171875, -6.0150146484375, -5.658203125, -5.3013916015625, -4.944580078125, -4.5877685546875, -4.23095703125, -3.8741455078125, -3.517333984375, -3.1605224609375, -2.8037109375, -2.4468994140625, -2.090087890625, -1.7332763671875, -1.37646484375, -1.0196533203125, -0.662841796875, -0.3060302734375, 0.05078125, 0.4075927734375, 0.764404296875, 1.1212158203125, 1.47802734375, 1.8348388671875, 2.191650390625, 2.5484619140625, 2.9052734375, 3.2620849609375, 3.618896484375, 3.9757080078125, 4.33251953125, 4.6893310546875, 5.046142578125, 5.4029541015625, 5.759765625, 6.1165771484375, 6.473388671875, 6.8302001953125, 7.18701171875, 7.5438232421875, 7.900634765625, 8.2574462890625, 8.6142578125, 8.9710693359375, 9.327880859375, 9.6846923828125, 10.04150390625, 10.3983154296875, 10.755126953125, 11.1119384765625, 11.46875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 6.0, 9.0, 7.0, 10.0, 16.0, 16.0, 17.0, 26.0, 25.0, 35.0, 39.0, 46.0, 54.0, 51.0, 64.0, 55.0, 58.0, 59.0, 66.0, 61.0, 48.0, 42.0, 33.0, 31.0, 31.0, 21.0, 15.0, 10.0, 11.0, 7.0, 3.0, 9.0, 3.0, 5.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0010356903076171875, -0.0010036379098892212, -0.0009715855121612549, -0.0009395331144332886, -0.0009074807167053223, -0.000875428318977356, -0.0008433759212493896, -0.0008113235235214233, -0.000779271125793457, -0.0007472187280654907, -0.0007151663303375244, -0.0006831139326095581, -0.0006510615348815918, -0.0006190091371536255, -0.0005869567394256592, -0.0005549043416976929, -0.0005228519439697266, -0.0004907995462417603, -0.00045874714851379395, -0.00042669475078582764, -0.00039464235305786133, -0.000362589955329895, -0.0003305375576019287, -0.0002984851598739624, -0.0002664327621459961, -0.00023438036441802979, -0.00020232796669006348, -0.00017027556896209717, -0.00013822317123413086, -0.00010617077350616455, -7.411837577819824e-05, -4.2065978050231934e-05, -1.0013580322265625e-05, 2.2038817405700684e-05, 5.409121513366699e-05, 8.61436128616333e-05, 0.00011819601058959961, 0.00015024840831756592, 0.00018230080604553223, 0.00021435320377349854, 0.00024640560150146484, 0.00027845799922943115, 0.00031051039695739746, 0.00034256279468536377, 0.0003746151924133301, 0.0004066675901412964, 0.0004387199878692627, 0.000470772385597229, 0.0005028247833251953, 0.0005348771810531616, 0.0005669295787811279, 0.0005989819765090942, 0.0006310343742370605, 0.0006630867719650269, 0.0006951391696929932, 0.0007271915674209595, 0.0007592439651489258, 0.0007912963628768921, 0.0008233487606048584, 0.0008554011583328247, 0.000887453556060791, 0.0009195059537887573, 0.0009515583515167236, 0.00098361074924469, 0.0010156631469726562]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 16.0, 16.0, 24.0, 56.0, 77.0, 113.0, 210.0, 330.0, 550.0, 887.0, 1433.0, 2592.0, 4413.0, 7965.0, 13706.0, 24160.0, 41199.0, 68887.0, 107003.0, 148826.0, 170629.0, 155096.0, 115699.0, 75911.0, 45734.0, 26932.0, 15473.0, 8749.0, 4894.0, 2908.0, 1610.0, 941.0, 559.0, 377.0, 198.0, 137.0, 73.0, 65.0, 28.0, 25.0, 12.0, 10.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 3.0], "bins": [-11.6328125, -11.3060302734375, -10.979248046875, -10.6524658203125, -10.32568359375, -9.9989013671875, -9.672119140625, -9.3453369140625, -9.0185546875, -8.6917724609375, -8.364990234375, -8.0382080078125, -7.71142578125, -7.3846435546875, -7.057861328125, -6.7310791015625, -6.404296875, -6.0775146484375, -5.750732421875, -5.4239501953125, -5.09716796875, -4.7703857421875, -4.443603515625, -4.1168212890625, -3.7900390625, -3.4632568359375, -3.136474609375, -2.8096923828125, -2.48291015625, -2.1561279296875, -1.829345703125, -1.5025634765625, -1.17578125, -0.8489990234375, -0.522216796875, -0.1954345703125, 0.13134765625, 0.4581298828125, 0.784912109375, 1.1116943359375, 1.4384765625, 1.7652587890625, 2.092041015625, 2.4188232421875, 2.74560546875, 3.0723876953125, 3.399169921875, 3.7259521484375, 4.052734375, 4.3795166015625, 4.706298828125, 5.0330810546875, 5.35986328125, 5.6866455078125, 6.013427734375, 6.3402099609375, 6.6669921875, 6.9937744140625, 7.320556640625, 7.6473388671875, 7.97412109375, 8.3009033203125, 8.627685546875, 8.9544677734375, 9.28125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 8.0, 8.0, 10.0, 17.0, 19.0, 24.0, 25.0, 25.0, 37.0, 43.0, 60.0, 49.0, 63.0, 53.0, 64.0, 61.0, 55.0, 48.0, 60.0, 44.0, 41.0, 37.0, 34.0, 27.0, 19.0, 16.0, 12.0, 12.0, 12.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.5301513671875, -4.392333984375, -4.2545166015625, -4.11669921875, -3.9788818359375, -3.841064453125, -3.7032470703125, -3.5654296875, -3.4276123046875, -3.289794921875, -3.1519775390625, -3.01416015625, -2.8763427734375, -2.738525390625, -2.6007080078125, -2.462890625, -2.3250732421875, -2.187255859375, -2.0494384765625, -1.91162109375, -1.7738037109375, -1.635986328125, -1.4981689453125, -1.3603515625, -1.2225341796875, -1.084716796875, -0.9468994140625, -0.80908203125, -0.6712646484375, -0.533447265625, -0.3956298828125, -0.2578125, -0.1199951171875, 0.017822265625, 0.1556396484375, 0.29345703125, 0.4312744140625, 0.569091796875, 0.7069091796875, 0.8447265625, 0.9825439453125, 1.120361328125, 1.2581787109375, 1.39599609375, 1.5338134765625, 1.671630859375, 1.8094482421875, 1.947265625, 2.0850830078125, 2.222900390625, 2.3607177734375, 2.49853515625, 2.6363525390625, 2.774169921875, 2.9119873046875, 3.0498046875, 3.1876220703125, 3.325439453125, 3.4632568359375, 3.60107421875, 3.7388916015625, 3.876708984375, 4.0145263671875, 4.15234375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 6.0, 5.0, 7.0, 12.0, 15.0, 27.0, 19.0, 19.0, 25.0, 32.0, 43.0, 49.0, 62.0, 49.0, 49.0, 59.0, 52.0, 48.0, 50.0, 49.0, 59.0, 47.0, 38.0, 28.0, 22.0, 26.0, 21.0, 17.0, 13.0, 13.0, 10.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.10588836669922, -19.526273727416992, -18.9466609954834, -18.367046356201172, -17.787433624267578, -17.20781898498535, -16.628206253051758, -16.04859161376953, -15.468978881835938, -14.889365196228027, -14.309751510620117, -13.730137825012207, -13.150524139404297, -12.570910453796387, -11.991296768188477, -11.41168212890625, -10.83206844329834, -10.25245475769043, -9.67284107208252, -9.09322738647461, -8.5136137008667, -7.934000015258789, -7.354385852813721, -6.7747721672058105, -6.1951584815979, -5.61554479598999, -5.03593111038208, -4.456316947937012, -3.8767035007476807, -3.2970898151397705, -2.7174758911132812, -2.137862205505371, -1.558248519897461, -0.978634774684906, -0.3990210294723511, 0.18059277534484863, 0.7602064609527588, 1.339820146560669, 1.9194340705871582, 2.4990477561950684, 3.0786614418029785, 3.6582751274108887, 4.237888813018799, 4.817502975463867, 5.397116661071777, 5.9767303466796875, 6.556344032287598, 7.135957717895508, 7.715571403503418, 8.295185089111328, 8.874798774719238, 9.454412460327148, 10.034026145935059, 10.613639831542969, 11.193254470825195, 11.772867202758789, 12.352481842041016, 12.932095527648926, 13.511709213256836, 14.091322898864746, 14.670936584472656, 15.250550270080566, 15.830163955688477, 16.409778594970703, 16.989391326904297]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 4.0, 14.0, 16.0, 12.0, 13.0, 19.0, 12.0, 32.0, 37.0, 24.0, 42.0, 28.0, 37.0, 36.0, 40.0, 42.0, 41.0, 39.0, 37.0, 44.0, 32.0, 39.0, 38.0, 34.0, 44.0, 44.0, 28.0, 15.0, 17.0, 20.0, 16.0, 15.0, 19.0, 15.0, 11.0, 10.0, 3.0, 2.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.94496726989746, -17.39909553527832, -16.85322380065918, -16.307350158691406, -15.761478424072266, -15.215606689453125, -14.669734954833984, -14.123863220214844, -13.577990531921387, -13.032118797302246, -12.486246109008789, -11.940374374389648, -11.394502639770508, -10.84862995147705, -10.30275821685791, -9.756885528564453, -9.211013793945312, -8.665142059326172, -8.119269371032715, -7.573397636413574, -7.027525424957275, -6.481653213500977, -5.935781478881836, -5.389909267425537, -4.844037055969238, -4.2981648445129395, -3.7522928714752197, -3.2064208984375, -2.660548686981201, -2.1146764755249023, -1.5688045024871826, -1.022932529449463, -0.47705841064453125, 0.06881368160247803, 0.6146857738494873, 1.1605578660964966, 1.7064299583435059, 2.2523021697998047, 2.7981741428375244, 3.344046115875244, 3.889918327331543, 4.435790538787842, 4.981662750244141, 5.527534484863281, 6.07340669631958, 6.619278907775879, 7.1651506423950195, 7.711022853851318, 8.256895065307617, 8.802766799926758, 9.348639488220215, 9.894511222839355, 10.440383911132812, 10.986255645751953, 11.532127380371094, 12.077999114990234, 12.623871803283691, 13.169743537902832, 13.715616226196289, 14.26148796081543, 14.80735969543457, 15.353232383728027, 15.899104118347168, 16.444976806640625, 16.990848541259766]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 6.0, 6.0, 11.0, 23.0, 32.0, 43.0, 65.0, 110.0, 185.0, 243.0, 390.0, 619.0, 1014.0, 1585.0, 2695.0, 4264.0, 7156.0, 11936.0, 19766.0, 33508.0, 56012.0, 93276.0, 153718.0, 246096.0, 376545.0, 526608.0, 629303.0, 616128.0, 497676.0, 347717.0, 224737.0, 138123.0, 83248.0, 49172.0, 29212.0, 17110.0, 10240.0, 6181.0, 3693.0, 2252.0, 1407.0, 853.0, 457.0, 313.0, 200.0, 119.0, 88.0, 43.0, 33.0, 22.0, 22.0, 6.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-11.3046875, -10.913330078125, -10.52197265625, -10.130615234375, -9.7392578125, -9.347900390625, -8.95654296875, -8.565185546875, -8.173828125, -7.782470703125, -7.39111328125, -6.999755859375, -6.6083984375, -6.217041015625, -5.82568359375, -5.434326171875, -5.04296875, -4.651611328125, -4.26025390625, -3.868896484375, -3.4775390625, -3.086181640625, -2.69482421875, -2.303466796875, -1.912109375, -1.520751953125, -1.12939453125, -0.738037109375, -0.3466796875, 0.044677734375, 0.43603515625, 0.827392578125, 1.21875, 1.610107421875, 2.00146484375, 2.392822265625, 2.7841796875, 3.175537109375, 3.56689453125, 3.958251953125, 4.349609375, 4.740966796875, 5.13232421875, 5.523681640625, 5.9150390625, 6.306396484375, 6.69775390625, 7.089111328125, 7.48046875, 7.871826171875, 8.26318359375, 8.654541015625, 9.0458984375, 9.437255859375, 9.82861328125, 10.219970703125, 10.611328125, 11.002685546875, 11.39404296875, 11.785400390625, 12.1767578125, 12.568115234375, 12.95947265625, 13.350830078125, 13.7421875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 8.0, 3.0, 7.0, 9.0, 12.0, 11.0, 12.0, 14.0, 21.0, 25.0, 38.0, 41.0, 36.0, 26.0, 40.0, 46.0, 38.0, 44.0, 43.0, 38.0, 43.0, 44.0, 35.0, 37.0, 43.0, 37.0, 37.0, 30.0, 30.0, 25.0, 24.0, 18.0, 17.0, 15.0, 15.0, 11.0, 7.0, 8.0, 6.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.4228515625, -11.041015625, -10.6591796875, -10.27734375, -9.8955078125, -9.513671875, -9.1318359375, -8.75, -8.3681640625, -7.986328125, -7.6044921875, -7.22265625, -6.8408203125, -6.458984375, -6.0771484375, -5.6953125, -5.3134765625, -4.931640625, -4.5498046875, -4.16796875, -3.7861328125, -3.404296875, -3.0224609375, -2.640625, -2.2587890625, -1.876953125, -1.4951171875, -1.11328125, -0.7314453125, -0.349609375, 0.0322265625, 0.4140625, 0.7958984375, 1.177734375, 1.5595703125, 1.94140625, 2.3232421875, 2.705078125, 3.0869140625, 3.46875, 3.8505859375, 4.232421875, 4.6142578125, 4.99609375, 5.3779296875, 5.759765625, 6.1416015625, 6.5234375, 6.9052734375, 7.287109375, 7.6689453125, 8.05078125, 8.4326171875, 8.814453125, 9.1962890625, 9.578125, 9.9599609375, 10.341796875, 10.7236328125, 11.10546875, 11.4873046875, 11.869140625, 12.2509765625, 12.6328125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 13.0, 15.0, 34.0, 40.0, 53.0, 106.0, 158.0, 286.0, 503.0, 737.0, 1222.0, 2082.0, 3416.0, 5693.0, 9678.0, 16594.0, 27908.0, 47230.0, 80130.0, 131844.0, 208808.0, 313977.0, 435798.0, 541788.0, 583312.0, 535498.0, 427375.0, 303972.0, 201563.0, 125855.0, 76884.0, 46099.0, 26996.0, 15931.0, 9189.0, 5287.0, 3194.0, 1866.0, 1194.0, 722.0, 471.0, 273.0, 175.0, 108.0, 76.0, 41.0, 34.0, 19.0, 12.0, 6.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0], "bins": [-11.6015625, -11.244140625, -10.88671875, -10.529296875, -10.171875, -9.814453125, -9.45703125, -9.099609375, -8.7421875, -8.384765625, -8.02734375, -7.669921875, -7.3125, -6.955078125, -6.59765625, -6.240234375, -5.8828125, -5.525390625, -5.16796875, -4.810546875, -4.453125, -4.095703125, -3.73828125, -3.380859375, -3.0234375, -2.666015625, -2.30859375, -1.951171875, -1.59375, -1.236328125, -0.87890625, -0.521484375, -0.1640625, 0.193359375, 0.55078125, 0.908203125, 1.265625, 1.623046875, 1.98046875, 2.337890625, 2.6953125, 3.052734375, 3.41015625, 3.767578125, 4.125, 4.482421875, 4.83984375, 5.197265625, 5.5546875, 5.912109375, 6.26953125, 6.626953125, 6.984375, 7.341796875, 7.69921875, 8.056640625, 8.4140625, 8.771484375, 9.12890625, 9.486328125, 9.84375, 10.201171875, 10.55859375, 10.916015625, 11.2734375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 10.0, 12.0, 24.0, 28.0, 23.0, 46.0, 53.0, 52.0, 65.0, 114.0, 105.0, 128.0, 166.0, 150.0, 187.0, 227.0, 249.0, 226.0, 217.0, 244.0, 240.0, 232.0, 181.0, 181.0, 152.0, 137.0, 127.0, 110.0, 80.0, 58.0, 47.0, 34.0, 39.0, 25.0, 25.0, 20.0, 14.0, 12.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.375, -5.1934814453125, -5.011962890625, -4.8304443359375, -4.64892578125, -4.4674072265625, -4.285888671875, -4.1043701171875, -3.9228515625, -3.7413330078125, -3.559814453125, -3.3782958984375, -3.19677734375, -3.0152587890625, -2.833740234375, -2.6522216796875, -2.470703125, -2.2891845703125, -2.107666015625, -1.9261474609375, -1.74462890625, -1.5631103515625, -1.381591796875, -1.2000732421875, -1.0185546875, -0.8370361328125, -0.655517578125, -0.4739990234375, -0.29248046875, -0.1109619140625, 0.070556640625, 0.2520751953125, 0.43359375, 0.6151123046875, 0.796630859375, 0.9781494140625, 1.15966796875, 1.3411865234375, 1.522705078125, 1.7042236328125, 1.8857421875, 2.0672607421875, 2.248779296875, 2.4302978515625, 2.61181640625, 2.7933349609375, 2.974853515625, 3.1563720703125, 3.337890625, 3.5194091796875, 3.700927734375, 3.8824462890625, 4.06396484375, 4.2454833984375, 4.427001953125, 4.6085205078125, 4.7900390625, 4.9715576171875, 5.153076171875, 5.3345947265625, 5.51611328125, 5.6976318359375, 5.879150390625, 6.0606689453125, 6.2421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 7.0, 4.0, 5.0, 8.0, 9.0, 15.0, 17.0, 24.0, 35.0, 35.0, 35.0, 56.0, 62.0, 50.0, 66.0, 55.0, 70.0, 64.0, 62.0, 70.0, 49.0, 27.0, 39.0, 31.0, 23.0, 14.0, 17.0, 9.0, 9.0, 10.0, 9.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.511024475097656, -22.925106048583984, -22.339189529418945, -21.753271102905273, -21.1673526763916, -20.58143424987793, -19.99551773071289, -19.40959930419922, -18.823680877685547, -18.237762451171875, -17.651845932006836, -17.065927505493164, -16.480009078979492, -15.894091606140137, -15.308174133300781, -14.72225570678711, -14.136338233947754, -13.550420761108398, -12.964502334594727, -12.378584861755371, -11.7926664352417, -11.206748962402344, -10.620830535888672, -10.034913063049316, -9.448995590209961, -8.863078117370605, -8.277159690856934, -7.691242218017578, -7.105323791503906, -6.519406318664551, -5.933488368988037, -5.347570419311523, -4.761651039123535, -4.1757330894470215, -3.589815139770508, -3.0038974285125732, -2.4179794788360596, -1.832061529159546, -1.2461438179016113, -0.6602258682250977, -0.07430791854858398, 0.5116099715232849, 1.0975278615951538, 1.683445692062378, 2.2693636417388916, 2.8552815914154053, 3.44119930267334, 4.0271172523498535, 4.613035202026367, 5.198953151702881, 5.7848711013793945, 6.37078857421875, 6.956707000732422, 7.542624473571777, 8.128541946411133, 8.714460372924805, 9.300378799438477, 9.886296272277832, 10.472214698791504, 11.05813217163086, 11.644050598144531, 12.229968070983887, 12.815885543823242, 13.401803970336914, 13.98772144317627]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 8.0, 9.0, 12.0, 17.0, 18.0, 16.0, 22.0, 26.0, 32.0, 28.0, 31.0, 32.0, 25.0, 29.0, 37.0, 42.0, 42.0, 37.0, 38.0, 39.0, 44.0, 46.0, 28.0, 50.0, 28.0, 36.0, 22.0, 32.0, 22.0, 15.0, 24.0, 14.0, 9.0, 10.0, 14.0, 12.0, 15.0, 8.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.461763381958008, -14.01747989654541, -13.573196411132812, -13.128912925720215, -12.684629440307617, -12.240346908569336, -11.796063423156738, -11.35177993774414, -10.907496452331543, -10.463212966918945, -10.018929481506348, -9.57464599609375, -9.130363464355469, -8.686079025268555, -8.241796493530273, -7.797513008117676, -7.353229522705078, -6.9089460372924805, -6.464662551879883, -6.020379543304443, -5.576096057891846, -5.131812572479248, -4.687529563903809, -4.243246078491211, -3.7989625930786133, -3.3546791076660156, -2.910395860671997, -2.4661126136779785, -2.021829128265381, -1.5775456428527832, -1.1332623958587646, -0.6889791488647461, -0.24469566345214844, 0.19958770275115967, 0.6438710689544678, 1.0881544351577759, 1.532437801361084, 1.9767212867736816, 2.4210045337677, 2.8652877807617188, 3.3095712661743164, 3.753854751586914, 4.198138236999512, 4.642421245574951, 5.086704730987549, 5.5309882164001465, 5.975271224975586, 6.419554710388184, 6.863838195800781, 7.308121681213379, 7.752405166625977, 8.196688652038574, 8.640972137451172, 9.085254669189453, 9.52953815460205, 9.973821640014648, 10.418105125427246, 10.862388610839844, 11.306672096252441, 11.750955581665039, 12.19523811340332, 12.639522552490234, 13.083805084228516, 13.528088569641113, 13.972372055053711]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 15.0, 28.0, 30.0, 55.0, 78.0, 119.0, 179.0, 264.0, 428.0, 693.0, 1067.0, 1868.0, 3190.0, 5598.0, 9991.0, 17748.0, 32443.0, 59033.0, 104572.0, 166919.0, 206711.0, 176975.0, 114473.0, 64881.0, 35844.0, 19557.0, 10672.0, 6171.0, 3629.0, 2038.0, 1252.0, 746.0, 465.0, 264.0, 184.0, 109.0, 87.0, 59.0, 28.0, 27.0, 15.0, 8.0, 14.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.19140625, -5.98895263671875, -5.7864990234375, -5.58404541015625, -5.381591796875, -5.17913818359375, -4.9766845703125, -4.77423095703125, -4.57177734375, -4.36932373046875, -4.1668701171875, -3.96441650390625, -3.761962890625, -3.55950927734375, -3.3570556640625, -3.15460205078125, -2.9521484375, -2.74969482421875, -2.5472412109375, -2.34478759765625, -2.142333984375, -1.93988037109375, -1.7374267578125, -1.53497314453125, -1.33251953125, -1.13006591796875, -0.9276123046875, -0.72515869140625, -0.522705078125, -0.32025146484375, -0.1177978515625, 0.08465576171875, 0.287109375, 0.48956298828125, 0.6920166015625, 0.89447021484375, 1.096923828125, 1.29937744140625, 1.5018310546875, 1.70428466796875, 1.90673828125, 2.10919189453125, 2.3116455078125, 2.51409912109375, 2.716552734375, 2.91900634765625, 3.1214599609375, 3.32391357421875, 3.5263671875, 3.72882080078125, 3.9312744140625, 4.13372802734375, 4.336181640625, 4.53863525390625, 4.7410888671875, 4.94354248046875, 5.14599609375, 5.34844970703125, 5.5509033203125, 5.75335693359375, 5.955810546875, 6.15826416015625, 6.3607177734375, 6.56317138671875, 6.765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 3.0, 6.0, 9.0, 10.0, 15.0, 14.0, 20.0, 26.0, 24.0, 15.0, 31.0, 36.0, 31.0, 33.0, 36.0, 25.0, 34.0, 41.0, 45.0, 38.0, 44.0, 43.0, 39.0, 35.0, 32.0, 37.0, 35.0, 27.0, 28.0, 27.0, 23.0, 14.0, 21.0, 11.0, 18.0, 13.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.0, -13.5455322265625, -13.091064453125, -12.6365966796875, -12.18212890625, -11.7276611328125, -11.273193359375, -10.8187255859375, -10.3642578125, -9.9097900390625, -9.455322265625, -9.0008544921875, -8.54638671875, -8.0919189453125, -7.637451171875, -7.1829833984375, -6.728515625, -6.2740478515625, -5.819580078125, -5.3651123046875, -4.91064453125, -4.4561767578125, -4.001708984375, -3.5472412109375, -3.0927734375, -2.6383056640625, -2.183837890625, -1.7293701171875, -1.27490234375, -0.8204345703125, -0.365966796875, 0.0885009765625, 0.54296875, 0.9974365234375, 1.451904296875, 1.9063720703125, 2.36083984375, 2.8153076171875, 3.269775390625, 3.7242431640625, 4.1787109375, 4.6331787109375, 5.087646484375, 5.5421142578125, 5.99658203125, 6.4510498046875, 6.905517578125, 7.3599853515625, 7.814453125, 8.2689208984375, 8.723388671875, 9.1778564453125, 9.63232421875, 10.0867919921875, 10.541259765625, 10.9957275390625, 11.4501953125, 11.9046630859375, 12.359130859375, 12.8135986328125, 13.26806640625, 13.7225341796875, 14.177001953125, 14.6314697265625, 15.0859375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 5.0, 12.0, 17.0, 29.0, 38.0, 64.0, 102.0, 168.0, 296.0, 461.0, 861.0, 1556.0, 2928.0, 5834.0, 12064.0, 25864.0, 58138.0, 129337.0, 247142.0, 272160.0, 158006.0, 72090.0, 31967.0, 14610.0, 7122.0, 3601.0, 1800.0, 964.0, 544.0, 285.0, 183.0, 108.0, 79.0, 37.0, 26.0, 23.0, 10.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.45703125, -6.21905517578125, -5.9810791015625, -5.74310302734375, -5.505126953125, -5.26715087890625, -5.0291748046875, -4.79119873046875, -4.55322265625, -4.31524658203125, -4.0772705078125, -3.83929443359375, -3.601318359375, -3.36334228515625, -3.1253662109375, -2.88739013671875, -2.6494140625, -2.41143798828125, -2.1734619140625, -1.93548583984375, -1.697509765625, -1.45953369140625, -1.2215576171875, -0.98358154296875, -0.74560546875, -0.50762939453125, -0.2696533203125, -0.03167724609375, 0.206298828125, 0.44427490234375, 0.6822509765625, 0.92022705078125, 1.158203125, 1.39617919921875, 1.6341552734375, 1.87213134765625, 2.110107421875, 2.34808349609375, 2.5860595703125, 2.82403564453125, 3.06201171875, 3.29998779296875, 3.5379638671875, 3.77593994140625, 4.013916015625, 4.25189208984375, 4.4898681640625, 4.72784423828125, 4.9658203125, 5.20379638671875, 5.4417724609375, 5.67974853515625, 5.917724609375, 6.15570068359375, 6.3936767578125, 6.63165283203125, 6.86962890625, 7.10760498046875, 7.3455810546875, 7.58355712890625, 7.821533203125, 8.05950927734375, 8.2974853515625, 8.53546142578125, 8.7734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 14.0, 3.0, 11.0, 16.0, 15.0, 15.0, 18.0, 26.0, 18.0, 24.0, 32.0, 23.0, 32.0, 38.0, 38.0, 35.0, 39.0, 25.0, 37.0, 42.0, 50.0, 44.0, 43.0, 37.0, 42.0, 28.0, 38.0, 26.0, 40.0, 35.0, 19.0, 16.0, 10.0, 20.0, 15.0, 9.0, 7.0, 4.0, 6.0, 3.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.6484375, -11.319091796875, -10.98974609375, -10.660400390625, -10.3310546875, -10.001708984375, -9.67236328125, -9.343017578125, -9.013671875, -8.684326171875, -8.35498046875, -8.025634765625, -7.6962890625, -7.366943359375, -7.03759765625, -6.708251953125, -6.37890625, -6.049560546875, -5.72021484375, -5.390869140625, -5.0615234375, -4.732177734375, -4.40283203125, -4.073486328125, -3.744140625, -3.414794921875, -3.08544921875, -2.756103515625, -2.4267578125, -2.097412109375, -1.76806640625, -1.438720703125, -1.109375, -0.780029296875, -0.45068359375, -0.121337890625, 0.2080078125, 0.537353515625, 0.86669921875, 1.196044921875, 1.525390625, 1.854736328125, 2.18408203125, 2.513427734375, 2.8427734375, 3.172119140625, 3.50146484375, 3.830810546875, 4.16015625, 4.489501953125, 4.81884765625, 5.148193359375, 5.4775390625, 5.806884765625, 6.13623046875, 6.465576171875, 6.794921875, 7.124267578125, 7.45361328125, 7.782958984375, 8.1123046875, 8.441650390625, 8.77099609375, 9.100341796875, 9.4296875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 12.0, 21.0, 45.0, 30.0, 80.0, 139.0, 222.0, 349.0, 753.0, 1489.0, 3334.0, 8708.0, 27054.0, 98672.0, 329512.0, 391082.0, 132952.0, 35408.0, 10951.0, 3999.0, 1779.0, 863.0, 448.0, 248.0, 142.0, 92.0, 55.0, 29.0, 29.0, 16.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.6796875, -3.580535888671875, -3.48138427734375, -3.382232666015625, -3.2830810546875, -3.183929443359375, -3.08477783203125, -2.985626220703125, -2.886474609375, -2.787322998046875, -2.68817138671875, -2.589019775390625, -2.4898681640625, -2.390716552734375, -2.29156494140625, -2.192413330078125, -2.09326171875, -1.994110107421875, -1.89495849609375, -1.795806884765625, -1.6966552734375, -1.597503662109375, -1.49835205078125, -1.399200439453125, -1.300048828125, -1.200897216796875, -1.10174560546875, -1.002593994140625, -0.9034423828125, -0.804290771484375, -0.70513916015625, -0.605987548828125, -0.5068359375, -0.407684326171875, -0.30853271484375, -0.209381103515625, -0.1102294921875, -0.011077880859375, 0.08807373046875, 0.187225341796875, 0.286376953125, 0.385528564453125, 0.48468017578125, 0.583831787109375, 0.6829833984375, 0.782135009765625, 0.88128662109375, 0.980438232421875, 1.07958984375, 1.178741455078125, 1.27789306640625, 1.377044677734375, 1.4761962890625, 1.575347900390625, 1.67449951171875, 1.773651123046875, 1.872802734375, 1.971954345703125, 2.07110595703125, 2.170257568359375, 2.2694091796875, 2.368560791015625, 2.46771240234375, 2.566864013671875, 2.666015625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 9.0, 7.0, 8.0, 11.0, 16.0, 29.0, 43.0, 72.0, 88.0, 100.0, 106.0, 111.0, 90.0, 91.0, 70.0, 44.0, 30.0, 28.0, 14.0, 10.0, 7.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027680397033691406, -0.00026993080973625183, -0.0002630576491355896, -0.00025618448853492737, -0.00024931132793426514, -0.0002424381673336029, -0.00023556500673294067, -0.00022869184613227844, -0.0002218186855316162, -0.00021494552493095398, -0.00020807236433029175, -0.00020119920372962952, -0.00019432604312896729, -0.00018745288252830505, -0.00018057972192764282, -0.0001737065613269806, -0.00016683340072631836, -0.00015996024012565613, -0.0001530870795249939, -0.00014621391892433167, -0.00013934075832366943, -0.0001324675977230072, -0.00012559443712234497, -0.00011872127652168274, -0.00011184811592102051, -0.00010497495532035828, -9.810179471969604e-05, -9.122863411903381e-05, -8.435547351837158e-05, -7.748231291770935e-05, -7.060915231704712e-05, -6.373599171638489e-05, -5.6862831115722656e-05, -4.9989670515060425e-05, -4.311650991439819e-05, -3.624334931373596e-05, -2.937018871307373e-05, -2.24970281124115e-05, -1.5623867511749268e-05, -8.750706911087036e-06, -1.8775463104248047e-06, 4.995614290237427e-06, 1.1868774890899658e-05, 1.874193549156189e-05, 2.561509609222412e-05, 3.248825669288635e-05, 3.9361417293548584e-05, 4.6234577894210815e-05, 5.310773849487305e-05, 5.998089909553528e-05, 6.685405969619751e-05, 7.372722029685974e-05, 8.060038089752197e-05, 8.74735414981842e-05, 9.434670209884644e-05, 0.00010121986269950867, 0.0001080930233001709, 0.00011496618390083313, 0.00012183934450149536, 0.0001287125051021576, 0.00013558566570281982, 0.00014245882630348206, 0.0001493319869041443, 0.00015620514750480652, 0.00016307830810546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 7.0, 8.0, 6.0, 18.0, 36.0, 31.0, 54.0, 91.0, 144.0, 204.0, 321.0, 522.0, 863.0, 1369.0, 2298.0, 3856.0, 6147.0, 10495.0, 17646.0, 29282.0, 49445.0, 80832.0, 125642.0, 173383.0, 180133.0, 137084.0, 89811.0, 55300.0, 33328.0, 20101.0, 12119.0, 7045.0, 4257.0, 2532.0, 1584.0, 938.0, 611.0, 348.0, 232.0, 154.0, 101.0, 64.0, 36.0, 29.0, 26.0, 12.0, 10.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.001953125, -1.9449462890625, -1.887939453125, -1.8309326171875, -1.77392578125, -1.7169189453125, -1.659912109375, -1.6029052734375, -1.5458984375, -1.4888916015625, -1.431884765625, -1.3748779296875, -1.31787109375, -1.2608642578125, -1.203857421875, -1.1468505859375, -1.08984375, -1.0328369140625, -0.975830078125, -0.9188232421875, -0.86181640625, -0.8048095703125, -0.747802734375, -0.6907958984375, -0.6337890625, -0.5767822265625, -0.519775390625, -0.4627685546875, -0.40576171875, -0.3487548828125, -0.291748046875, -0.2347412109375, -0.177734375, -0.1207275390625, -0.063720703125, -0.0067138671875, 0.05029296875, 0.1072998046875, 0.164306640625, 0.2213134765625, 0.2783203125, 0.3353271484375, 0.392333984375, 0.4493408203125, 0.50634765625, 0.5633544921875, 0.620361328125, 0.6773681640625, 0.734375, 0.7913818359375, 0.848388671875, 0.9053955078125, 0.96240234375, 1.0194091796875, 1.076416015625, 1.1334228515625, 1.1904296875, 1.2474365234375, 1.304443359375, 1.3614501953125, 1.41845703125, 1.4754638671875, 1.532470703125, 1.5894775390625, 1.646484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 9.0, 2.0, 9.0, 12.0, 23.0, 24.0, 21.0, 31.0, 45.0, 42.0, 45.0, 46.0, 58.0, 44.0, 58.0, 61.0, 59.0, 54.0, 59.0, 35.0, 43.0, 54.0, 26.0, 25.0, 18.0, 11.0, 17.0, 9.0, 7.0, 12.0, 6.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.119140625, -1.088134765625, -1.05712890625, -1.026123046875, -0.9951171875, -0.964111328125, -0.93310546875, -0.902099609375, -0.87109375, -0.840087890625, -0.80908203125, -0.778076171875, -0.7470703125, -0.716064453125, -0.68505859375, -0.654052734375, -0.623046875, -0.592041015625, -0.56103515625, -0.530029296875, -0.4990234375, -0.468017578125, -0.43701171875, -0.406005859375, -0.375, -0.343994140625, -0.31298828125, -0.281982421875, -0.2509765625, -0.219970703125, -0.18896484375, -0.157958984375, -0.126953125, -0.095947265625, -0.06494140625, -0.033935546875, -0.0029296875, 0.028076171875, 0.05908203125, 0.090087890625, 0.12109375, 0.152099609375, 0.18310546875, 0.214111328125, 0.2451171875, 0.276123046875, 0.30712890625, 0.338134765625, 0.369140625, 0.400146484375, 0.43115234375, 0.462158203125, 0.4931640625, 0.524169921875, 0.55517578125, 0.586181640625, 0.6171875, 0.648193359375, 0.67919921875, 0.710205078125, 0.7412109375, 0.772216796875, 0.80322265625, 0.834228515625, 0.865234375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 7.0, 2.0, 14.0, 6.0, 13.0, 26.0, 27.0, 40.0, 33.0, 44.0, 53.0, 71.0, 63.0, 57.0, 57.0, 67.0, 67.0, 56.0, 55.0, 36.0, 53.0, 29.0, 27.0, 18.0, 14.0, 13.0, 12.0, 8.0, 9.0, 7.0, 3.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.028072357177734, -22.44537353515625, -21.8626766204834, -21.279977798461914, -20.69727897644043, -20.114580154418945, -19.531883239746094, -18.94918441772461, -18.366485595703125, -17.78378677368164, -17.20108985900879, -16.618391036987305, -16.03569221496582, -15.452994346618652, -14.870296478271484, -14.28759765625, -13.704899787902832, -13.122201919555664, -12.53950309753418, -11.956805229187012, -11.374106407165527, -10.79140853881836, -10.208709716796875, -9.626011848449707, -9.043313980102539, -8.460616111755371, -7.877917289733887, -7.295219421386719, -6.712520599365234, -6.129822731018066, -5.54712438583374, -4.964426040649414, -4.381728172302246, -3.79902982711792, -3.2163314819335938, -2.6336333751678467, -2.0509350299835205, -1.4682366847991943, -0.8855385780334473, -0.3028402328491211, 0.2798581123352051, 0.8625563979148865, 1.4452546834945679, 2.0279529094696045, 2.6106512546539307, 3.193349599838257, 3.776047706604004, 4.35874605178833, 4.941444396972656, 5.524142742156982, 6.106841087341309, 6.689538955688477, 7.272237777709961, 7.854935646057129, 8.437633514404297, 9.020332336425781, 9.603031158447266, 10.185729026794434, 10.768427848815918, 11.351125717163086, 11.93382453918457, 12.516522407531738, 13.099220275878906, 13.68191909790039, 14.264616966247559]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 3.0, 2.0, 6.0, 4.0, 7.0, 11.0, 12.0, 14.0, 23.0, 17.0, 23.0, 22.0, 38.0, 26.0, 32.0, 37.0, 25.0, 30.0, 38.0, 41.0, 41.0, 36.0, 42.0, 34.0, 52.0, 41.0, 39.0, 43.0, 32.0, 25.0, 29.0, 24.0, 19.0, 19.0, 20.0, 12.0, 9.0, 13.0, 18.0, 10.0, 9.0, 6.0, 7.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.479897499084473, -14.029635429382324, -13.579374313354492, -13.129112243652344, -12.678850173950195, -12.228589057922363, -11.778326988220215, -11.328065872192383, -10.877803802490234, -10.427541732788086, -9.977280616760254, -9.527018547058105, -9.076757431030273, -8.626495361328125, -8.176233291625977, -7.725971698760986, -7.275710105895996, -6.825448513031006, -6.375186920166016, -5.924924850463867, -5.474663257598877, -5.024401664733887, -4.574139595031738, -4.123878002166748, -3.673616409301758, -3.2233548164367676, -2.7730929851531982, -2.322831153869629, -1.8725695610046387, -1.4223079681396484, -0.9720461368560791, -0.5217843055725098, -0.07152175903320312, 0.37873995304107666, 0.8290016651153564, 1.2792633771896362, 1.729525089263916, 2.1797866821289062, 2.6300485134124756, 3.080310344696045, 3.530571937561035, 3.9808335304260254, 4.431095123291016, 4.881357192993164, 5.331618785858154, 5.7818803787231445, 6.232142448425293, 6.682404041290283, 7.132665634155273, 7.582927227020264, 8.033188819885254, 8.483450889587402, 8.933712005615234, 9.383974075317383, 9.834236145019531, 10.28449821472168, 10.734759330749512, 11.18502140045166, 11.635282516479492, 12.08554458618164, 12.535806655883789, 12.986067771911621, 13.43632984161377, 13.886590957641602, 14.33685302734375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 1.0, 3.0, 6.0, 5.0, 8.0, 14.0, 18.0, 27.0, 57.0, 72.0, 105.0, 163.0, 262.0, 421.0, 655.0, 1010.0, 1527.0, 2446.0, 4010.0, 6558.0, 10834.0, 17265.0, 26588.0, 41061.0, 60385.0, 83595.0, 108144.0, 125246.0, 129888.0, 118182.0, 96543.0, 72114.0, 50205.0, 33409.0, 21610.0, 13484.0, 8661.0, 5163.0, 3294.0, 2026.0, 1283.0, 797.0, 466.0, 366.0, 180.0, 139.0, 93.0, 54.0, 56.0, 23.0, 10.0, 12.0, 7.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-12.640625, -12.248779296875, -11.85693359375, -11.465087890625, -11.0732421875, -10.681396484375, -10.28955078125, -9.897705078125, -9.505859375, -9.114013671875, -8.72216796875, -8.330322265625, -7.9384765625, -7.546630859375, -7.15478515625, -6.762939453125, -6.37109375, -5.979248046875, -5.58740234375, -5.195556640625, -4.8037109375, -4.411865234375, -4.02001953125, -3.628173828125, -3.236328125, -2.844482421875, -2.45263671875, -2.060791015625, -1.6689453125, -1.277099609375, -0.88525390625, -0.493408203125, -0.1015625, 0.290283203125, 0.68212890625, 1.073974609375, 1.4658203125, 1.857666015625, 2.24951171875, 2.641357421875, 3.033203125, 3.425048828125, 3.81689453125, 4.208740234375, 4.6005859375, 4.992431640625, 5.38427734375, 5.776123046875, 6.16796875, 6.559814453125, 6.95166015625, 7.343505859375, 7.7353515625, 8.127197265625, 8.51904296875, 8.910888671875, 9.302734375, 9.694580078125, 10.08642578125, 10.478271484375, 10.8701171875, 11.261962890625, 11.65380859375, 12.045654296875, 12.4375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 8.0, 6.0, 10.0, 11.0, 13.0, 19.0, 20.0, 17.0, 20.0, 29.0, 28.0, 26.0, 31.0, 31.0, 21.0, 46.0, 38.0, 45.0, 40.0, 54.0, 54.0, 39.0, 37.0, 33.0, 35.0, 38.0, 37.0, 21.0, 18.0, 28.0, 25.0, 20.0, 11.0, 13.0, 19.0, 11.0, 11.0, 6.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.0546875, -13.610595703125, -13.16650390625, -12.722412109375, -12.2783203125, -11.834228515625, -11.39013671875, -10.946044921875, -10.501953125, -10.057861328125, -9.61376953125, -9.169677734375, -8.7255859375, -8.281494140625, -7.83740234375, -7.393310546875, -6.94921875, -6.505126953125, -6.06103515625, -5.616943359375, -5.1728515625, -4.728759765625, -4.28466796875, -3.840576171875, -3.396484375, -2.952392578125, -2.50830078125, -2.064208984375, -1.6201171875, -1.176025390625, -0.73193359375, -0.287841796875, 0.15625, 0.600341796875, 1.04443359375, 1.488525390625, 1.9326171875, 2.376708984375, 2.82080078125, 3.264892578125, 3.708984375, 4.153076171875, 4.59716796875, 5.041259765625, 5.4853515625, 5.929443359375, 6.37353515625, 6.817626953125, 7.26171875, 7.705810546875, 8.14990234375, 8.593994140625, 9.0380859375, 9.482177734375, 9.92626953125, 10.370361328125, 10.814453125, 11.258544921875, 11.70263671875, 12.146728515625, 12.5908203125, 13.034912109375, 13.47900390625, 13.923095703125, 14.3671875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 15.0, 15.0, 21.0, 27.0, 49.0, 78.0, 135.0, 166.0, 253.0, 457.0, 695.0, 1104.0, 1684.0, 2575.0, 4155.0, 6344.0, 9828.0, 14962.0, 22983.0, 33955.0, 49352.0, 68768.0, 89439.0, 108703.0, 119811.0, 118124.0, 105030.0, 85885.0, 65002.0, 46464.0, 31678.0, 21297.0, 14019.0, 9143.0, 5780.0, 3843.0, 2448.0, 1584.0, 944.0, 624.0, 414.0, 250.0, 165.0, 114.0, 72.0, 29.0, 23.0, 14.0, 14.0, 4.0, 9.0, 5.0, 3.0, 1.0, 2.0], "bins": [-12.0, -11.6461181640625, -11.292236328125, -10.9383544921875, -10.58447265625, -10.2305908203125, -9.876708984375, -9.5228271484375, -9.1689453125, -8.8150634765625, -8.461181640625, -8.1072998046875, -7.75341796875, -7.3995361328125, -7.045654296875, -6.6917724609375, -6.337890625, -5.9840087890625, -5.630126953125, -5.2762451171875, -4.92236328125, -4.5684814453125, -4.214599609375, -3.8607177734375, -3.5068359375, -3.1529541015625, -2.799072265625, -2.4451904296875, -2.09130859375, -1.7374267578125, -1.383544921875, -1.0296630859375, -0.67578125, -0.3218994140625, 0.031982421875, 0.3858642578125, 0.73974609375, 1.0936279296875, 1.447509765625, 1.8013916015625, 2.1552734375, 2.5091552734375, 2.863037109375, 3.2169189453125, 3.57080078125, 3.9246826171875, 4.278564453125, 4.6324462890625, 4.986328125, 5.3402099609375, 5.694091796875, 6.0479736328125, 6.40185546875, 6.7557373046875, 7.109619140625, 7.4635009765625, 7.8173828125, 8.1712646484375, 8.525146484375, 8.8790283203125, 9.23291015625, 9.5867919921875, 9.940673828125, 10.2945556640625, 10.6484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 15.0, 15.0, 13.0, 26.0, 16.0, 19.0, 33.0, 24.0, 39.0, 25.0, 45.0, 30.0, 31.0, 32.0, 42.0, 41.0, 36.0, 38.0, 53.0, 33.0, 34.0, 24.0, 37.0, 38.0, 27.0, 31.0, 21.0, 26.0, 18.0, 18.0, 14.0, 23.0, 8.0, 7.0, 10.0, 11.0, 6.0, 5.0, 4.0, 7.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.7265625, -9.439697265625, -9.15283203125, -8.865966796875, -8.5791015625, -8.292236328125, -8.00537109375, -7.718505859375, -7.431640625, -7.144775390625, -6.85791015625, -6.571044921875, -6.2841796875, -5.997314453125, -5.71044921875, -5.423583984375, -5.13671875, -4.849853515625, -4.56298828125, -4.276123046875, -3.9892578125, -3.702392578125, -3.41552734375, -3.128662109375, -2.841796875, -2.554931640625, -2.26806640625, -1.981201171875, -1.6943359375, -1.407470703125, -1.12060546875, -0.833740234375, -0.546875, -0.260009765625, 0.02685546875, 0.313720703125, 0.6005859375, 0.887451171875, 1.17431640625, 1.461181640625, 1.748046875, 2.034912109375, 2.32177734375, 2.608642578125, 2.8955078125, 3.182373046875, 3.46923828125, 3.756103515625, 4.04296875, 4.329833984375, 4.61669921875, 4.903564453125, 5.1904296875, 5.477294921875, 5.76416015625, 6.051025390625, 6.337890625, 6.624755859375, 6.91162109375, 7.198486328125, 7.4853515625, 7.772216796875, 8.05908203125, 8.345947265625, 8.6328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 1.0, 2.0, 3.0, 6.0, 6.0, 12.0, 11.0, 28.0, 39.0, 51.0, 88.0, 128.0, 198.0, 242.0, 373.0, 569.0, 1056.0, 1713.0, 2873.0, 5206.0, 9639.0, 18732.0, 37993.0, 76853.0, 146563.0, 225553.0, 223698.0, 144435.0, 75225.0, 37011.0, 18458.0, 9500.0, 4991.0, 2863.0, 1658.0, 998.0, 660.0, 393.0, 231.0, 170.0, 106.0, 65.0, 50.0, 38.0, 27.0, 12.0, 13.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.5859375, -15.1273193359375, -14.668701171875, -14.2100830078125, -13.75146484375, -13.2928466796875, -12.834228515625, -12.3756103515625, -11.9169921875, -11.4583740234375, -10.999755859375, -10.5411376953125, -10.08251953125, -9.6239013671875, -9.165283203125, -8.7066650390625, -8.248046875, -7.7894287109375, -7.330810546875, -6.8721923828125, -6.41357421875, -5.9549560546875, -5.496337890625, -5.0377197265625, -4.5791015625, -4.1204833984375, -3.661865234375, -3.2032470703125, -2.74462890625, -2.2860107421875, -1.827392578125, -1.3687744140625, -0.91015625, -0.4515380859375, 0.007080078125, 0.4656982421875, 0.92431640625, 1.3829345703125, 1.841552734375, 2.3001708984375, 2.7587890625, 3.2174072265625, 3.676025390625, 4.1346435546875, 4.59326171875, 5.0518798828125, 5.510498046875, 5.9691162109375, 6.427734375, 6.8863525390625, 7.344970703125, 7.8035888671875, 8.26220703125, 8.7208251953125, 9.179443359375, 9.6380615234375, 10.0966796875, 10.5552978515625, 11.013916015625, 11.4725341796875, 11.93115234375, 12.3897705078125, 12.848388671875, 13.3070068359375, 13.765625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 3.0, 6.0, 5.0, 11.0, 11.0, 8.0, 16.0, 20.0, 12.0, 28.0, 33.0, 34.0, 31.0, 39.0, 51.0, 57.0, 54.0, 50.0, 55.0, 58.0, 56.0, 47.0, 60.0, 36.0, 30.0, 31.0, 17.0, 19.0, 16.0, 19.0, 14.0, 14.0, 4.0, 10.0, 8.0, 6.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000766754150390625, -0.0007396489381790161, -0.0007125437259674072, -0.0006854385137557983, -0.0006583333015441895, -0.0006312280893325806, -0.0006041228771209717, -0.0005770176649093628, -0.0005499124526977539, -0.000522807240486145, -0.0004957020282745361, -0.00046859681606292725, -0.00044149160385131836, -0.00041438639163970947, -0.0003872811794281006, -0.0003601759672164917, -0.0003330707550048828, -0.0003059655427932739, -0.00027886033058166504, -0.00025175511837005615, -0.00022464990615844727, -0.00019754469394683838, -0.0001704394817352295, -0.0001433342695236206, -0.00011622905731201172, -8.912384510040283e-05, -6.201863288879395e-05, -3.491342067718506e-05, -7.808208465576172e-06, 1.9297003746032715e-05, 4.64022159576416e-05, 7.350742816925049e-05, 0.00010061264038085938, 0.00012771785259246826, 0.00015482306480407715, 0.00018192827701568604, 0.00020903348922729492, 0.0002361387014389038, 0.0002632439136505127, 0.0002903491258621216, 0.00031745433807373047, 0.00034455955028533936, 0.00037166476249694824, 0.00039876997470855713, 0.000425875186920166, 0.0004529803991317749, 0.0004800856113433838, 0.0005071908235549927, 0.0005342960357666016, 0.0005614012479782104, 0.0005885064601898193, 0.0006156116724014282, 0.0006427168846130371, 0.000669822096824646, 0.0006969273090362549, 0.0007240325212478638, 0.0007511377334594727, 0.0007782429456710815, 0.0008053481578826904, 0.0008324533700942993, 0.0008595585823059082, 0.0008866637945175171, 0.000913769006729126, 0.0009408742189407349, 0.0009679794311523438]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 5.0, 13.0, 13.0, 36.0, 36.0, 62.0, 77.0, 93.0, 156.0, 242.0, 384.0, 587.0, 847.0, 1359.0, 2037.0, 3206.0, 4874.0, 7731.0, 12018.0, 19554.0, 30642.0, 48293.0, 73337.0, 105289.0, 136042.0, 149433.0, 137291.0, 106180.0, 74442.0, 48839.0, 31248.0, 19731.0, 12483.0, 7806.0, 4861.0, 3157.0, 2099.0, 1301.0, 911.0, 623.0, 416.0, 253.0, 178.0, 130.0, 78.0, 61.0, 35.0, 20.0, 7.0, 16.0, 8.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.38916015625, -8.1142578125, -7.83935546875, -7.564453125, -7.28955078125, -7.0146484375, -6.73974609375, -6.46484375, -6.18994140625, -5.9150390625, -5.64013671875, -5.365234375, -5.09033203125, -4.8154296875, -4.54052734375, -4.265625, -3.99072265625, -3.7158203125, -3.44091796875, -3.166015625, -2.89111328125, -2.6162109375, -2.34130859375, -2.06640625, -1.79150390625, -1.5166015625, -1.24169921875, -0.966796875, -0.69189453125, -0.4169921875, -0.14208984375, 0.1328125, 0.40771484375, 0.6826171875, 0.95751953125, 1.232421875, 1.50732421875, 1.7822265625, 2.05712890625, 2.33203125, 2.60693359375, 2.8818359375, 3.15673828125, 3.431640625, 3.70654296875, 3.9814453125, 4.25634765625, 4.53125, 4.80615234375, 5.0810546875, 5.35595703125, 5.630859375, 5.90576171875, 6.1806640625, 6.45556640625, 6.73046875, 7.00537109375, 7.2802734375, 7.55517578125, 7.830078125, 8.10498046875, 8.3798828125, 8.65478515625, 8.9296875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 6.0, 7.0, 10.0, 17.0, 15.0, 12.0, 26.0, 23.0, 22.0, 32.0, 30.0, 33.0, 44.0, 41.0, 41.0, 55.0, 58.0, 52.0, 46.0, 51.0, 50.0, 35.0, 51.0, 32.0, 36.0, 19.0, 41.0, 21.0, 20.0, 16.0, 13.0, 5.0, 8.0, 6.0, 8.0, 5.0, 5.0, 1.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.951171875, -3.845367431640625, -3.73956298828125, -3.633758544921875, -3.5279541015625, -3.422149658203125, -3.31634521484375, -3.210540771484375, -3.104736328125, -2.998931884765625, -2.89312744140625, -2.787322998046875, -2.6815185546875, -2.575714111328125, -2.46990966796875, -2.364105224609375, -2.25830078125, -2.152496337890625, -2.04669189453125, -1.940887451171875, -1.8350830078125, -1.729278564453125, -1.62347412109375, -1.517669677734375, -1.411865234375, -1.306060791015625, -1.20025634765625, -1.094451904296875, -0.9886474609375, -0.882843017578125, -0.77703857421875, -0.671234130859375, -0.5654296875, -0.459625244140625, -0.35382080078125, -0.248016357421875, -0.1422119140625, -0.036407470703125, 0.06939697265625, 0.175201416015625, 0.281005859375, 0.386810302734375, 0.49261474609375, 0.598419189453125, 0.7042236328125, 0.810028076171875, 0.91583251953125, 1.021636962890625, 1.12744140625, 1.233245849609375, 1.33905029296875, 1.444854736328125, 1.5506591796875, 1.656463623046875, 1.76226806640625, 1.868072509765625, 1.973876953125, 2.079681396484375, 2.18548583984375, 2.291290283203125, 2.3970947265625, 2.502899169921875, 2.60870361328125, 2.714508056640625, 2.8203125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 14.0, 10.0, 13.0, 18.0, 23.0, 38.0, 31.0, 32.0, 56.0, 50.0, 54.0, 63.0, 58.0, 52.0, 73.0, 69.0, 62.0, 51.0, 49.0, 36.0, 34.0, 26.0, 21.0, 12.0, 10.0, 15.0, 11.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-24.050546646118164, -23.466747283935547, -22.88294792175293, -22.299148559570312, -21.715347290039062, -21.131547927856445, -20.547748565673828, -19.96394920349121, -19.380149841308594, -18.796350479125977, -18.21255111694336, -17.628751754760742, -17.044952392578125, -16.461151123046875, -15.877351760864258, -15.29355239868164, -14.709753036499023, -14.125953674316406, -13.542154312133789, -12.958353996276855, -12.374554634094238, -11.790755271911621, -11.206954956054688, -10.62315559387207, -10.039356231689453, -9.455556869506836, -8.871757507324219, -8.287957191467285, -7.704157829284668, -7.120358467102051, -6.536558628082275, -5.9527587890625, -5.368960380554199, -4.785161018371582, -4.201361179351807, -3.6175615787506104, -3.033761978149414, -2.4499623775482178, -1.8661627769470215, -1.282362937927246, -0.6985635757446289, -0.11476397514343262, 0.46903562545776367, 1.05283522605896, 1.6366348266601562, 2.2204344272613525, 2.804234027862549, 3.388033866882324, 3.9718332290649414, 4.555632591247559, 5.139432430267334, 5.723232269287109, 6.307031631469727, 6.890830993652344, 7.474630832672119, 8.058430671691895, 8.642230033874512, 9.226029396057129, 9.809829711914062, 10.39362907409668, 10.977428436279297, 11.561227798461914, 12.145027160644531, 12.728827476501465, 13.312626838684082]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 14.0, 11.0, 9.0, 17.0, 14.0, 22.0, 22.0, 24.0, 34.0, 25.0, 31.0, 55.0, 23.0, 41.0, 36.0, 33.0, 34.0, 44.0, 42.0, 50.0, 47.0, 27.0, 38.0, 31.0, 21.0, 23.0, 37.0, 30.0, 22.0, 23.0, 22.0, 15.0, 11.0, 16.0, 11.0, 9.0, 2.0, 6.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.633767127990723, -14.180418014526367, -13.727068901062012, -13.273719787597656, -12.8203706741333, -12.367021560668945, -11.913671493530273, -11.460323333740234, -11.006973266601562, -10.553624153137207, -10.100275039672852, -9.646925926208496, -9.19357681274414, -8.740227699279785, -8.28687858581543, -7.833528995513916, -7.380180358886719, -6.926831245422363, -6.473482131958008, -6.020133018493652, -5.566783905029297, -5.113434791564941, -4.660085201263428, -4.206736087799072, -3.753386974334717, -3.3000378608703613, -2.846688747406006, -2.3933393955230713, -1.9399902820587158, -1.4866411685943604, -1.0332918167114258, -0.5799427032470703, -0.12659358978271484, 0.3267555832862854, 0.7801047563552856, 1.2334539890289307, 1.6868031024932861, 2.1401522159576416, 2.593501567840576, 3.0468506813049316, 3.500199794769287, 3.9535489082336426, 4.406898021697998, 4.860247611999512, 5.313596725463867, 5.766945838928223, 6.220294952392578, 6.673644065856934, 7.126993179321289, 7.5803422927856445, 8.03369140625, 8.487040519714355, 8.940389633178711, 9.393738746643066, 9.847087860107422, 10.300437927246094, 10.753786087036133, 11.207135200500488, 11.660484313964844, 12.1138334274292, 12.567182540893555, 13.02053165435791, 13.473880767822266, 13.927230834960938, 14.380579948425293]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 11.0, 11.0, 5.0, 24.0, 26.0, 41.0, 69.0, 88.0, 153.0, 228.0, 410.0, 635.0, 1030.0, 1681.0, 2658.0, 4359.0, 7133.0, 11942.0, 19412.0, 32662.0, 54347.0, 90348.0, 148043.0, 236576.0, 362670.0, 506887.0, 611195.0, 610318.0, 504791.0, 362591.0, 240009.0, 150157.0, 91972.0, 56114.0, 34223.0, 20263.0, 12192.0, 7539.0, 4344.0, 2632.0, 1685.0, 1024.0, 679.0, 414.0, 240.0, 139.0, 115.0, 73.0, 52.0, 35.0, 16.0, 12.0, 6.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.6875, -9.353515625, -9.01953125, -8.685546875, -8.3515625, -8.017578125, -7.68359375, -7.349609375, -7.015625, -6.681640625, -6.34765625, -6.013671875, -5.6796875, -5.345703125, -5.01171875, -4.677734375, -4.34375, -4.009765625, -3.67578125, -3.341796875, -3.0078125, -2.673828125, -2.33984375, -2.005859375, -1.671875, -1.337890625, -1.00390625, -0.669921875, -0.3359375, -0.001953125, 0.33203125, 0.666015625, 1.0, 1.333984375, 1.66796875, 2.001953125, 2.3359375, 2.669921875, 3.00390625, 3.337890625, 3.671875, 4.005859375, 4.33984375, 4.673828125, 5.0078125, 5.341796875, 5.67578125, 6.009765625, 6.34375, 6.677734375, 7.01171875, 7.345703125, 7.6796875, 8.013671875, 8.34765625, 8.681640625, 9.015625, 9.349609375, 9.68359375, 10.017578125, 10.3515625, 10.685546875, 11.01953125, 11.353515625, 11.6875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 10.0, 11.0, 15.0, 16.0, 16.0, 22.0, 17.0, 33.0, 32.0, 29.0, 33.0, 40.0, 49.0, 33.0, 46.0, 44.0, 37.0, 43.0, 38.0, 47.0, 43.0, 36.0, 34.0, 31.0, 33.0, 28.0, 28.0, 19.0, 19.0, 18.0, 19.0, 12.0, 9.0, 8.0, 8.0, 6.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.6640625, -10.3499755859375, -10.035888671875, -9.7218017578125, -9.40771484375, -9.0936279296875, -8.779541015625, -8.4654541015625, -8.1513671875, -7.8372802734375, -7.523193359375, -7.2091064453125, -6.89501953125, -6.5809326171875, -6.266845703125, -5.9527587890625, -5.638671875, -5.3245849609375, -5.010498046875, -4.6964111328125, -4.38232421875, -4.0682373046875, -3.754150390625, -3.4400634765625, -3.1259765625, -2.8118896484375, -2.497802734375, -2.1837158203125, -1.86962890625, -1.5555419921875, -1.241455078125, -0.9273681640625, -0.61328125, -0.2991943359375, 0.014892578125, 0.3289794921875, 0.64306640625, 0.9571533203125, 1.271240234375, 1.5853271484375, 1.8994140625, 2.2135009765625, 2.527587890625, 2.8416748046875, 3.15576171875, 3.4698486328125, 3.783935546875, 4.0980224609375, 4.412109375, 4.7261962890625, 5.040283203125, 5.3543701171875, 5.66845703125, 5.9825439453125, 6.296630859375, 6.6107177734375, 6.9248046875, 7.2388916015625, 7.552978515625, 7.8670654296875, 8.18115234375, 8.4952392578125, 8.809326171875, 9.1234130859375, 9.4375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 16.0, 20.0, 22.0, 43.0, 66.0, 111.0, 207.0, 329.0, 537.0, 829.0, 1388.0, 2383.0, 4067.0, 6871.0, 11718.0, 19685.0, 33458.0, 56628.0, 95001.0, 153597.0, 238980.0, 352391.0, 472324.0, 560211.0, 574036.0, 503427.0, 386357.0, 271865.0, 176576.0, 109484.0, 66088.0, 39397.0, 23084.0, 13386.0, 8102.0, 4688.0, 2723.0, 1676.0, 965.0, 563.0, 386.0, 201.0, 143.0, 94.0, 69.0, 42.0, 22.0, 15.0, 3.0, 6.0, 3.0, 1.0, 5.0], "bins": [-11.078125, -10.762939453125, -10.44775390625, -10.132568359375, -9.8173828125, -9.502197265625, -9.18701171875, -8.871826171875, -8.556640625, -8.241455078125, -7.92626953125, -7.611083984375, -7.2958984375, -6.980712890625, -6.66552734375, -6.350341796875, -6.03515625, -5.719970703125, -5.40478515625, -5.089599609375, -4.7744140625, -4.459228515625, -4.14404296875, -3.828857421875, -3.513671875, -3.198486328125, -2.88330078125, -2.568115234375, -2.2529296875, -1.937744140625, -1.62255859375, -1.307373046875, -0.9921875, -0.677001953125, -0.36181640625, -0.046630859375, 0.2685546875, 0.583740234375, 0.89892578125, 1.214111328125, 1.529296875, 1.844482421875, 2.15966796875, 2.474853515625, 2.7900390625, 3.105224609375, 3.42041015625, 3.735595703125, 4.05078125, 4.365966796875, 4.68115234375, 4.996337890625, 5.3115234375, 5.626708984375, 5.94189453125, 6.257080078125, 6.572265625, 6.887451171875, 7.20263671875, 7.517822265625, 7.8330078125, 8.148193359375, 8.46337890625, 8.778564453125, 9.09375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 6.0, 8.0, 13.0, 23.0, 24.0, 40.0, 49.0, 59.0, 69.0, 70.0, 123.0, 127.0, 146.0, 150.0, 185.0, 211.0, 244.0, 233.0, 230.0, 222.0, 207.0, 203.0, 213.0, 187.0, 147.0, 157.0, 134.0, 115.0, 121.0, 79.0, 56.0, 47.0, 43.0, 28.0, 30.0, 19.0, 12.0, 12.0, 4.0, 3.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.58880615234375, -4.4354248046875, -4.28204345703125, -4.128662109375, -3.97528076171875, -3.8218994140625, -3.66851806640625, -3.51513671875, -3.36175537109375, -3.2083740234375, -3.05499267578125, -2.901611328125, -2.74822998046875, -2.5948486328125, -2.44146728515625, -2.2880859375, -2.13470458984375, -1.9813232421875, -1.82794189453125, -1.674560546875, -1.52117919921875, -1.3677978515625, -1.21441650390625, -1.06103515625, -0.90765380859375, -0.7542724609375, -0.60089111328125, -0.447509765625, -0.29412841796875, -0.1407470703125, 0.01263427734375, 0.166015625, 0.31939697265625, 0.4727783203125, 0.62615966796875, 0.779541015625, 0.93292236328125, 1.0863037109375, 1.23968505859375, 1.39306640625, 1.54644775390625, 1.6998291015625, 1.85321044921875, 2.006591796875, 2.15997314453125, 2.3133544921875, 2.46673583984375, 2.6201171875, 2.77349853515625, 2.9268798828125, 3.08026123046875, 3.233642578125, 3.38702392578125, 3.5404052734375, 3.69378662109375, 3.84716796875, 4.00054931640625, 4.1539306640625, 4.30731201171875, 4.460693359375, 4.61407470703125, 4.7674560546875, 4.92083740234375, 5.07421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 5.0, 8.0, 10.0, 14.0, 20.0, 26.0, 26.0, 30.0, 42.0, 42.0, 43.0, 53.0, 63.0, 64.0, 44.0, 73.0, 55.0, 46.0, 53.0, 39.0, 36.0, 40.0, 35.0, 23.0, 17.0, 21.0, 10.0, 11.0, 9.0, 6.0, 11.0, 4.0, 1.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.228256225585938, -14.76685905456543, -14.305462837219238, -13.84406566619873, -13.382668495178223, -12.921272277832031, -12.459875106811523, -11.998477935791016, -11.537081718444824, -11.075684547424316, -10.614288330078125, -10.152891159057617, -9.69149398803711, -9.230097770690918, -8.76870059967041, -8.307304382324219, -7.845906734466553, -7.384510040283203, -6.923112869262695, -6.461716175079346, -6.000319480895996, -5.538922309875488, -5.077525615692139, -4.616128921508789, -4.154731750488281, -3.6933348178863525, -3.231938123703003, -2.770541191101074, -2.3091444969177246, -1.847747564315796, -1.3863506317138672, -0.9249539375305176, -0.46355724334716797, -0.002160400152206421, 0.4592364430427551, 0.9206333160400391, 1.3820301294326782, 1.8434269428253174, 2.304823875427246, 2.7662205696105957, 3.2276175022125244, 3.689014434814453, 4.150411128997803, 4.611807823181152, 5.07320499420166, 5.53460168838501, 5.995998382568359, 6.457395553588867, 6.918792247772217, 7.380188941955566, 7.841586112976074, 8.302982330322266, 8.764379501342773, 9.225776672363281, 9.687173843383789, 10.14857006072998, 10.609967231750488, 11.071364402770996, 11.532760620117188, 11.994157791137695, 12.455554962158203, 12.916951179504395, 13.378348350524902, 13.839744567871094, 14.301141738891602]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 5.0, 11.0, 12.0, 7.0, 17.0, 9.0, 23.0, 25.0, 21.0, 34.0, 23.0, 32.0, 34.0, 37.0, 41.0, 53.0, 53.0, 51.0, 35.0, 43.0, 48.0, 46.0, 33.0, 36.0, 40.0, 30.0, 28.0, 20.0, 21.0, 22.0, 22.0, 17.0, 14.0, 15.0, 9.0, 11.0, 9.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.497854232788086, -13.082695960998535, -12.667536735534668, -12.252378463745117, -11.83721923828125, -11.4220609664917, -11.006902694702148, -10.591743469238281, -10.17658519744873, -9.76142692565918, -9.346267700195312, -8.931109428405762, -8.515951156616211, -8.100791931152344, -7.685633659362793, -7.270474910736084, -6.855316162109375, -6.440157413482666, -6.024998664855957, -5.609840393066406, -5.194681644439697, -4.779522895812988, -4.3643646240234375, -3.9492058753967285, -3.5340471267700195, -3.1188883781433105, -2.7037298679351807, -2.288571357727051, -1.8734126091003418, -1.4582538604736328, -1.043095350265503, -0.627936840057373, -0.21277713775634766, 0.20238149166107178, 0.6175401210784912, 1.0326987504959106, 1.44785737991333, 1.863016128540039, 2.278174638748169, 2.693333148956299, 3.108491897583008, 3.523650646209717, 3.9388091564178467, 4.353967666625977, 4.7691264152526855, 5.1842851638793945, 5.599443435668945, 6.014602184295654, 6.429760932922363, 6.844919681549072, 7.260078430175781, 7.675236701965332, 8.090394973754883, 8.50555419921875, 8.9207124710083, 9.335870742797852, 9.751029968261719, 10.16618824005127, 10.581347465515137, 10.996505737304688, 11.411664962768555, 11.826823234558105, 12.241981506347656, 12.657140731811523, 13.072299003601074]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 9.0, 21.0, 29.0, 58.0, 72.0, 157.0, 262.0, 357.0, 648.0, 1071.0, 1761.0, 2981.0, 5270.0, 8822.0, 15339.0, 26712.0, 45799.0, 76018.0, 120460.0, 168105.0, 184043.0, 147518.0, 98137.0, 59769.0, 35899.0, 20459.0, 11868.0, 6827.0, 4012.0, 2399.0, 1405.0, 895.0, 511.0, 319.0, 186.0, 108.0, 82.0, 59.0, 42.0, 16.0, 14.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.95849609375, -3.8232421875, -3.68798828125, -3.552734375, -3.41748046875, -3.2822265625, -3.14697265625, -3.01171875, -2.87646484375, -2.7412109375, -2.60595703125, -2.470703125, -2.33544921875, -2.2001953125, -2.06494140625, -1.9296875, -1.79443359375, -1.6591796875, -1.52392578125, -1.388671875, -1.25341796875, -1.1181640625, -0.98291015625, -0.84765625, -0.71240234375, -0.5771484375, -0.44189453125, -0.306640625, -0.17138671875, -0.0361328125, 0.09912109375, 0.234375, 0.36962890625, 0.5048828125, 0.64013671875, 0.775390625, 0.91064453125, 1.0458984375, 1.18115234375, 1.31640625, 1.45166015625, 1.5869140625, 1.72216796875, 1.857421875, 1.99267578125, 2.1279296875, 2.26318359375, 2.3984375, 2.53369140625, 2.6689453125, 2.80419921875, 2.939453125, 3.07470703125, 3.2099609375, 3.34521484375, 3.48046875, 3.61572265625, 3.7509765625, 3.88623046875, 4.021484375, 4.15673828125, 4.2919921875, 4.42724609375, 4.5625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 2.0, 3.0, 6.0, 5.0, 11.0, 13.0, 16.0, 20.0, 21.0, 14.0, 17.0, 29.0, 38.0, 36.0, 34.0, 35.0, 44.0, 53.0, 62.0, 42.0, 37.0, 34.0, 37.0, 36.0, 39.0, 31.0, 39.0, 31.0, 37.0, 26.0, 23.0, 18.0, 15.0, 14.0, 18.0, 10.0, 12.0, 12.0, 10.0, 9.0, 3.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.609375, -13.2052001953125, -12.801025390625, -12.3968505859375, -11.99267578125, -11.5885009765625, -11.184326171875, -10.7801513671875, -10.3759765625, -9.9718017578125, -9.567626953125, -9.1634521484375, -8.75927734375, -8.3551025390625, -7.950927734375, -7.5467529296875, -7.142578125, -6.7384033203125, -6.334228515625, -5.9300537109375, -5.52587890625, -5.1217041015625, -4.717529296875, -4.3133544921875, -3.9091796875, -3.5050048828125, -3.100830078125, -2.6966552734375, -2.29248046875, -1.8883056640625, -1.484130859375, -1.0799560546875, -0.67578125, -0.2716064453125, 0.132568359375, 0.5367431640625, 0.94091796875, 1.3450927734375, 1.749267578125, 2.1534423828125, 2.5576171875, 2.9617919921875, 3.365966796875, 3.7701416015625, 4.17431640625, 4.5784912109375, 4.982666015625, 5.3868408203125, 5.791015625, 6.1951904296875, 6.599365234375, 7.0035400390625, 7.40771484375, 7.8118896484375, 8.216064453125, 8.6202392578125, 9.0244140625, 9.4285888671875, 9.832763671875, 10.2369384765625, 10.64111328125, 11.0452880859375, 11.449462890625, 11.8536376953125, 12.2578125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 4.0, 9.0, 24.0, 22.0, 27.0, 49.0, 57.0, 75.0, 114.0, 185.0, 279.0, 456.0, 748.0, 1170.0, 2002.0, 3266.0, 5791.0, 10617.0, 19681.0, 36093.0, 67675.0, 121535.0, 189717.0, 213966.0, 162247.0, 96761.0, 52514.0, 28074.0, 15234.0, 8337.0, 4837.0, 2738.0, 1561.0, 963.0, 602.0, 384.0, 238.0, 174.0, 115.0, 66.0, 51.0, 25.0, 15.0, 9.0, 14.0, 6.0, 7.0, 3.0, 6.0, 1.0, 1.0, 5.0, 1.0, 2.0], "bins": [-4.6328125, -4.49365234375, -4.3544921875, -4.21533203125, -4.076171875, -3.93701171875, -3.7978515625, -3.65869140625, -3.51953125, -3.38037109375, -3.2412109375, -3.10205078125, -2.962890625, -2.82373046875, -2.6845703125, -2.54541015625, -2.40625, -2.26708984375, -2.1279296875, -1.98876953125, -1.849609375, -1.71044921875, -1.5712890625, -1.43212890625, -1.29296875, -1.15380859375, -1.0146484375, -0.87548828125, -0.736328125, -0.59716796875, -0.4580078125, -0.31884765625, -0.1796875, -0.04052734375, 0.0986328125, 0.23779296875, 0.376953125, 0.51611328125, 0.6552734375, 0.79443359375, 0.93359375, 1.07275390625, 1.2119140625, 1.35107421875, 1.490234375, 1.62939453125, 1.7685546875, 1.90771484375, 2.046875, 2.18603515625, 2.3251953125, 2.46435546875, 2.603515625, 2.74267578125, 2.8818359375, 3.02099609375, 3.16015625, 3.29931640625, 3.4384765625, 3.57763671875, 3.716796875, 3.85595703125, 3.9951171875, 4.13427734375, 4.2734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 4.0, 10.0, 8.0, 16.0, 11.0, 13.0, 19.0, 21.0, 24.0, 35.0, 27.0, 43.0, 33.0, 35.0, 38.0, 50.0, 45.0, 37.0, 44.0, 40.0, 46.0, 35.0, 39.0, 41.0, 29.0, 36.0, 34.0, 32.0, 19.0, 21.0, 14.0, 15.0, 15.0, 12.0, 12.0, 9.0, 10.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3359375, -8.0501708984375, -7.764404296875, -7.4786376953125, -7.19287109375, -6.9071044921875, -6.621337890625, -6.3355712890625, -6.0498046875, -5.7640380859375, -5.478271484375, -5.1925048828125, -4.90673828125, -4.6209716796875, -4.335205078125, -4.0494384765625, -3.763671875, -3.4779052734375, -3.192138671875, -2.9063720703125, -2.62060546875, -2.3348388671875, -2.049072265625, -1.7633056640625, -1.4775390625, -1.1917724609375, -0.906005859375, -0.6202392578125, -0.33447265625, -0.0487060546875, 0.237060546875, 0.5228271484375, 0.80859375, 1.0943603515625, 1.380126953125, 1.6658935546875, 1.95166015625, 2.2374267578125, 2.523193359375, 2.8089599609375, 3.0947265625, 3.3804931640625, 3.666259765625, 3.9520263671875, 4.23779296875, 4.5235595703125, 4.809326171875, 5.0950927734375, 5.380859375, 5.6666259765625, 5.952392578125, 6.2381591796875, 6.52392578125, 6.8096923828125, 7.095458984375, 7.3812255859375, 7.6669921875, 7.9527587890625, 8.238525390625, 8.5242919921875, 8.81005859375, 9.0958251953125, 9.381591796875, 9.6673583984375, 9.953125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 9.0, 11.0, 6.0, 20.0, 39.0, 43.0, 77.0, 156.0, 232.0, 461.0, 946.0, 2225.0, 5514.0, 16041.0, 56940.0, 220451.0, 461232.0, 206414.0, 53177.0, 15272.0, 5214.0, 2152.0, 897.0, 450.0, 228.0, 117.0, 78.0, 50.0, 41.0, 18.0, 16.0, 15.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.818359375, -2.736602783203125, -2.65484619140625, -2.573089599609375, -2.4913330078125, -2.409576416015625, -2.32781982421875, -2.246063232421875, -2.164306640625, -2.082550048828125, -2.00079345703125, -1.919036865234375, -1.8372802734375, -1.755523681640625, -1.67376708984375, -1.592010498046875, -1.51025390625, -1.428497314453125, -1.34674072265625, -1.264984130859375, -1.1832275390625, -1.101470947265625, -1.01971435546875, -0.937957763671875, -0.856201171875, -0.774444580078125, -0.69268798828125, -0.610931396484375, -0.5291748046875, -0.447418212890625, -0.36566162109375, -0.283905029296875, -0.2021484375, -0.120391845703125, -0.03863525390625, 0.043121337890625, 0.1248779296875, 0.206634521484375, 0.28839111328125, 0.370147705078125, 0.451904296875, 0.533660888671875, 0.61541748046875, 0.697174072265625, 0.7789306640625, 0.860687255859375, 0.94244384765625, 1.024200439453125, 1.10595703125, 1.187713623046875, 1.26947021484375, 1.351226806640625, 1.4329833984375, 1.514739990234375, 1.59649658203125, 1.678253173828125, 1.760009765625, 1.841766357421875, 1.92352294921875, 2.005279541015625, 2.0870361328125, 2.168792724609375, 2.25054931640625, 2.332305908203125, 2.4140625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 5.0, 6.0, 6.0, 13.0, 12.0, 11.0, 16.0, 23.0, 34.0, 34.0, 48.0, 42.0, 46.0, 63.0, 58.0, 89.0, 65.0, 52.0, 76.0, 45.0, 44.0, 47.0, 44.0, 32.0, 18.0, 12.0, 13.0, 9.0, 14.0, 8.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.244680404663086e-05, -8.973106741905212e-05, -8.701533079147339e-05, -8.429959416389465e-05, -8.158385753631592e-05, -7.886812090873718e-05, -7.615238428115845e-05, -7.343664765357971e-05, -7.072091102600098e-05, -6.800517439842224e-05, -6.52894377708435e-05, -6.257370114326477e-05, -5.9857964515686035e-05, -5.71422278881073e-05, -5.4426491260528564e-05, -5.171075463294983e-05, -4.8995018005371094e-05, -4.627928137779236e-05, -4.356354475021362e-05, -4.084780812263489e-05, -3.813207149505615e-05, -3.541633486747742e-05, -3.270059823989868e-05, -2.9984861612319946e-05, -2.726912498474121e-05, -2.4553388357162476e-05, -2.183765172958374e-05, -1.9121915102005005e-05, -1.640617847442627e-05, -1.3690441846847534e-05, -1.0974705219268799e-05, -8.258968591690063e-06, -5.543231964111328e-06, -2.8274953365325928e-06, -1.1175870895385742e-07, 2.603977918624878e-06, 5.319714546203613e-06, 8.035451173782349e-06, 1.0751187801361084e-05, 1.346692442893982e-05, 1.6182661056518555e-05, 1.889839768409729e-05, 2.1614134311676025e-05, 2.432987093925476e-05, 2.7045607566833496e-05, 2.976134419441223e-05, 3.247708082199097e-05, 3.51928174495697e-05, 3.790855407714844e-05, 4.062429070472717e-05, 4.334002733230591e-05, 4.6055763959884644e-05, 4.877150058746338e-05, 5.1487237215042114e-05, 5.420297384262085e-05, 5.6918710470199585e-05, 5.963444709777832e-05, 6.235018372535706e-05, 6.506592035293579e-05, 6.778165698051453e-05, 7.049739360809326e-05, 7.3213130235672e-05, 7.592886686325073e-05, 7.864460349082947e-05, 8.13603401184082e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 10.0, 14.0, 15.0, 25.0, 35.0, 42.0, 57.0, 73.0, 129.0, 188.0, 302.0, 488.0, 775.0, 1252.0, 2156.0, 3947.0, 7486.0, 14076.0, 28801.0, 58503.0, 120374.0, 224489.0, 262908.0, 162264.0, 79917.0, 38961.0, 19287.0, 9828.0, 5198.0, 2827.0, 1500.0, 984.0, 543.0, 392.0, 217.0, 147.0, 111.0, 66.0, 50.0, 42.0, 31.0, 11.0, 11.0, 4.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9541015625, -1.8934478759765625, -1.832794189453125, -1.7721405029296875, -1.71148681640625, -1.6508331298828125, -1.590179443359375, -1.5295257568359375, -1.4688720703125, -1.4082183837890625, -1.347564697265625, -1.2869110107421875, -1.22625732421875, -1.1656036376953125, -1.104949951171875, -1.0442962646484375, -0.983642578125, -0.9229888916015625, -0.862335205078125, -0.8016815185546875, -0.74102783203125, -0.6803741455078125, -0.619720458984375, -0.5590667724609375, -0.4984130859375, -0.4377593994140625, -0.377105712890625, -0.3164520263671875, -0.25579833984375, -0.1951446533203125, -0.134490966796875, -0.0738372802734375, -0.01318359375, 0.0474700927734375, 0.108123779296875, 0.1687774658203125, 0.22943115234375, 0.2900848388671875, 0.350738525390625, 0.4113922119140625, 0.4720458984375, 0.5326995849609375, 0.593353271484375, 0.6540069580078125, 0.71466064453125, 0.7753143310546875, 0.835968017578125, 0.8966217041015625, 0.957275390625, 1.0179290771484375, 1.078582763671875, 1.1392364501953125, 1.19989013671875, 1.2605438232421875, 1.321197509765625, 1.3818511962890625, 1.4425048828125, 1.5031585693359375, 1.563812255859375, 1.6244659423828125, 1.68511962890625, 1.7457733154296875, 1.806427001953125, 1.8670806884765625, 1.927734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 12.0, 8.0, 11.0, 15.0, 20.0, 26.0, 12.0, 42.0, 38.0, 41.0, 38.0, 45.0, 50.0, 72.0, 62.0, 52.0, 79.0, 43.0, 58.0, 63.0, 45.0, 30.0, 20.0, 22.0, 15.0, 28.0, 6.0, 9.0, 4.0, 8.0, 6.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6185760498046875, -0.594573974609375, -0.5705718994140625, -0.54656982421875, -0.5225677490234375, -0.498565673828125, -0.4745635986328125, -0.4505615234375, -0.4265594482421875, -0.402557373046875, -0.3785552978515625, -0.35455322265625, -0.3305511474609375, -0.306549072265625, -0.2825469970703125, -0.258544921875, -0.2345428466796875, -0.210540771484375, -0.1865386962890625, -0.16253662109375, -0.1385345458984375, -0.114532470703125, -0.0905303955078125, -0.0665283203125, -0.0425262451171875, -0.018524169921875, 0.0054779052734375, 0.02947998046875, 0.0534820556640625, 0.077484130859375, 0.1014862060546875, 0.12548828125, 0.1494903564453125, 0.173492431640625, 0.1974945068359375, 0.22149658203125, 0.2454986572265625, 0.269500732421875, 0.2935028076171875, 0.3175048828125, 0.3415069580078125, 0.365509033203125, 0.3895111083984375, 0.41351318359375, 0.4375152587890625, 0.461517333984375, 0.4855194091796875, 0.509521484375, 0.5335235595703125, 0.557525634765625, 0.5815277099609375, 0.60552978515625, 0.6295318603515625, 0.653533935546875, 0.6775360107421875, 0.7015380859375, 0.7255401611328125, 0.749542236328125, 0.7735443115234375, 0.79754638671875, 0.8215484619140625, 0.845550537109375, 0.8695526123046875, 0.8935546875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 4.0, 9.0, 9.0, 11.0, 15.0, 25.0, 29.0, 16.0, 35.0, 51.0, 38.0, 65.0, 56.0, 63.0, 41.0, 83.0, 69.0, 38.0, 46.0, 43.0, 47.0, 40.0, 32.0, 25.0, 24.0, 20.0, 12.0, 13.0, 10.0, 4.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.322518348693848, -14.847289085388184, -14.37205982208252, -13.896830558776855, -13.421602249145508, -12.946372985839844, -12.47114372253418, -11.995914459228516, -11.520685195922852, -11.045455932617188, -10.570226669311523, -10.09499740600586, -9.619768142700195, -9.144538879394531, -8.669310569763184, -8.19408130645752, -7.7188520431518555, -7.243622779846191, -6.768393516540527, -6.2931647300720215, -5.817935466766357, -5.342706203460693, -4.8674774169921875, -4.392248153686523, -3.9170188903808594, -3.4417896270751953, -2.9665606021881104, -2.4913315773010254, -2.0161023139953613, -1.5408730506896973, -1.0656440258026123, -0.5904150009155273, -0.11518669128417969, 0.3600424528121948, 0.8352715969085693, 1.3105007410049438, 1.7857298851013184, 2.2609591484069824, 2.7361881732940674, 3.2114171981811523, 3.6866464614868164, 4.1618757247924805, 4.6371049880981445, 5.11233377456665, 5.5875630378723145, 6.0627923011779785, 6.538021087646484, 7.013250350952148, 7.4884796142578125, 7.963708877563477, 8.43893814086914, 8.914167404174805, 9.389396667480469, 9.864625930786133, 10.33985424041748, 10.815083503723145, 11.290312767028809, 11.765542030334473, 12.240771293640137, 12.7160005569458, 13.191228866577148, 13.666458129882812, 14.141687393188477, 14.61691665649414, 15.092145919799805]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 10.0, 9.0, 10.0, 17.0, 10.0, 21.0, 18.0, 28.0, 32.0, 25.0, 30.0, 33.0, 38.0, 45.0, 52.0, 57.0, 43.0, 37.0, 43.0, 44.0, 48.0, 35.0, 32.0, 38.0, 29.0, 34.0, 24.0, 20.0, 21.0, 19.0, 18.0, 16.0, 11.0, 14.0, 7.0, 10.0, 9.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.431235313415527, -13.019692420959473, -12.608149528503418, -12.196606636047363, -11.785063743591309, -11.373520851135254, -10.961978912353516, -10.550436019897461, -10.138893127441406, -9.727350234985352, -9.315807342529297, -8.904264450073242, -8.492721557617188, -8.081178665161133, -7.669636249542236, -7.258093357086182, -6.846549987792969, -6.435007095336914, -6.023464202880859, -5.611921310424805, -5.20037841796875, -4.788835525512695, -4.377293109893799, -3.965750217437744, -3.5542073249816895, -3.1426644325256348, -2.73112154006958, -2.3195788860321045, -1.9080359935760498, -1.4964931011199951, -1.0849504470825195, -0.6734075546264648, -0.26186561584472656, 0.14967721700668335, 0.5612200498580933, 0.9727628231048584, 1.384305715560913, 1.7958486080169678, 2.2073912620544434, 2.618934154510498, 3.0304770469665527, 3.4420199394226074, 3.853562831878662, 4.265105247497559, 4.676648139953613, 5.088191032409668, 5.499733924865723, 5.911276817321777, 6.322819709777832, 6.734362602233887, 7.145905494689941, 7.557448387145996, 7.968991279602051, 8.380534172058105, 8.792076110839844, 9.203619003295898, 9.615161895751953, 10.026704788208008, 10.438247680664062, 10.849790573120117, 11.261333465576172, 11.672876358032227, 12.084419250488281, 12.495962142944336, 12.90750503540039]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 9.0, 6.0, 12.0, 17.0, 19.0, 29.0, 57.0, 71.0, 137.0, 232.0, 331.0, 591.0, 1071.0, 1937.0, 3600.0, 7065.0, 13760.0, 27357.0, 52024.0, 93449.0, 149323.0, 191404.0, 185858.0, 139225.0, 84832.0, 46265.0, 24170.0, 12190.0, 6169.0, 3263.0, 1741.0, 943.0, 516.0, 315.0, 193.0, 111.0, 89.0, 51.0, 27.0, 33.0, 20.0, 14.0, 6.0, 5.0, 8.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -15.95263671875, -15.4365234375, -14.92041015625, -14.404296875, -13.88818359375, -13.3720703125, -12.85595703125, -12.33984375, -11.82373046875, -11.3076171875, -10.79150390625, -10.275390625, -9.75927734375, -9.2431640625, -8.72705078125, -8.2109375, -7.69482421875, -7.1787109375, -6.66259765625, -6.146484375, -5.63037109375, -5.1142578125, -4.59814453125, -4.08203125, -3.56591796875, -3.0498046875, -2.53369140625, -2.017578125, -1.50146484375, -0.9853515625, -0.46923828125, 0.046875, 0.56298828125, 1.0791015625, 1.59521484375, 2.111328125, 2.62744140625, 3.1435546875, 3.65966796875, 4.17578125, 4.69189453125, 5.2080078125, 5.72412109375, 6.240234375, 6.75634765625, 7.2724609375, 7.78857421875, 8.3046875, 8.82080078125, 9.3369140625, 9.85302734375, 10.369140625, 10.88525390625, 11.4013671875, 11.91748046875, 12.43359375, 12.94970703125, 13.4658203125, 13.98193359375, 14.498046875, 15.01416015625, 15.5302734375, 16.04638671875, 16.5625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 8.0, 15.0, 16.0, 8.0, 22.0, 20.0, 26.0, 26.0, 21.0, 35.0, 37.0, 24.0, 37.0, 53.0, 49.0, 57.0, 41.0, 50.0, 50.0, 34.0, 39.0, 30.0, 34.0, 32.0, 38.0, 26.0, 28.0, 11.0, 20.0, 16.0, 20.0, 16.0, 14.0, 6.0, 11.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.359375, -12.9664306640625, -12.573486328125, -12.1805419921875, -11.78759765625, -11.3946533203125, -11.001708984375, -10.6087646484375, -10.2158203125, -9.8228759765625, -9.429931640625, -9.0369873046875, -8.64404296875, -8.2510986328125, -7.858154296875, -7.4652099609375, -7.072265625, -6.6793212890625, -6.286376953125, -5.8934326171875, -5.50048828125, -5.1075439453125, -4.714599609375, -4.3216552734375, -3.9287109375, -3.5357666015625, -3.142822265625, -2.7498779296875, -2.35693359375, -1.9639892578125, -1.571044921875, -1.1781005859375, -0.78515625, -0.3922119140625, 0.000732421875, 0.3936767578125, 0.78662109375, 1.1795654296875, 1.572509765625, 1.9654541015625, 2.3583984375, 2.7513427734375, 3.144287109375, 3.5372314453125, 3.93017578125, 4.3231201171875, 4.716064453125, 5.1090087890625, 5.501953125, 5.8948974609375, 6.287841796875, 6.6807861328125, 7.07373046875, 7.4666748046875, 7.859619140625, 8.2525634765625, 8.6455078125, 9.0384521484375, 9.431396484375, 9.8243408203125, 10.21728515625, 10.6102294921875, 11.003173828125, 11.3961181640625, 11.7890625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 13.0, 20.0, 21.0, 32.0, 63.0, 109.0, 148.0, 248.0, 367.0, 505.0, 780.0, 1085.0, 1698.0, 2530.0, 3656.0, 5456.0, 8085.0, 11934.0, 17318.0, 24988.0, 35497.0, 48416.0, 65261.0, 81846.0, 97314.0, 107187.0, 108004.0, 99466.0, 85071.0, 67748.0, 51972.0, 37394.0, 26649.0, 18524.0, 12580.0, 8623.0, 5862.0, 3964.0, 2635.0, 1829.0, 1188.0, 774.0, 550.0, 364.0, 235.0, 192.0, 117.0, 71.0, 48.0, 36.0, 29.0, 10.0, 10.0, 13.0, 8.0, 2.0, 1.0, 4.0], "bins": [-8.59375, -8.325927734375, -8.05810546875, -7.790283203125, -7.5224609375, -7.254638671875, -6.98681640625, -6.718994140625, -6.451171875, -6.183349609375, -5.91552734375, -5.647705078125, -5.3798828125, -5.112060546875, -4.84423828125, -4.576416015625, -4.30859375, -4.040771484375, -3.77294921875, -3.505126953125, -3.2373046875, -2.969482421875, -2.70166015625, -2.433837890625, -2.166015625, -1.898193359375, -1.63037109375, -1.362548828125, -1.0947265625, -0.826904296875, -0.55908203125, -0.291259765625, -0.0234375, 0.244384765625, 0.51220703125, 0.780029296875, 1.0478515625, 1.315673828125, 1.58349609375, 1.851318359375, 2.119140625, 2.386962890625, 2.65478515625, 2.922607421875, 3.1904296875, 3.458251953125, 3.72607421875, 3.993896484375, 4.26171875, 4.529541015625, 4.79736328125, 5.065185546875, 5.3330078125, 5.600830078125, 5.86865234375, 6.136474609375, 6.404296875, 6.672119140625, 6.93994140625, 7.207763671875, 7.4755859375, 7.743408203125, 8.01123046875, 8.279052734375, 8.546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 3.0, 3.0, 6.0, 9.0, 8.0, 11.0, 8.0, 15.0, 21.0, 26.0, 25.0, 26.0, 27.0, 32.0, 26.0, 32.0, 30.0, 30.0, 44.0, 31.0, 38.0, 36.0, 41.0, 34.0, 40.0, 36.0, 48.0, 36.0, 37.0, 34.0, 27.0, 24.0, 16.0, 31.0, 24.0, 18.0, 17.0, 6.0, 10.0, 9.0, 5.0, 4.0, 4.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2109375, -5.9879150390625, -5.764892578125, -5.5418701171875, -5.31884765625, -5.0958251953125, -4.872802734375, -4.6497802734375, -4.4267578125, -4.2037353515625, -3.980712890625, -3.7576904296875, -3.53466796875, -3.3116455078125, -3.088623046875, -2.8656005859375, -2.642578125, -2.4195556640625, -2.196533203125, -1.9735107421875, -1.75048828125, -1.5274658203125, -1.304443359375, -1.0814208984375, -0.8583984375, -0.6353759765625, -0.412353515625, -0.1893310546875, 0.03369140625, 0.2567138671875, 0.479736328125, 0.7027587890625, 0.92578125, 1.1488037109375, 1.371826171875, 1.5948486328125, 1.81787109375, 2.0408935546875, 2.263916015625, 2.4869384765625, 2.7099609375, 2.9329833984375, 3.156005859375, 3.3790283203125, 3.60205078125, 3.8250732421875, 4.048095703125, 4.2711181640625, 4.494140625, 4.7171630859375, 4.940185546875, 5.1632080078125, 5.38623046875, 5.6092529296875, 5.832275390625, 6.0552978515625, 6.2783203125, 6.5013427734375, 6.724365234375, 6.9473876953125, 7.17041015625, 7.3934326171875, 7.616455078125, 7.8394775390625, 8.0625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 12.0, 17.0, 37.0, 34.0, 51.0, 75.0, 84.0, 136.0, 188.0, 284.0, 371.0, 517.0, 800.0, 1183.0, 1757.0, 2572.0, 4308.0, 7990.0, 17848.0, 52798.0, 216529.0, 476239.0, 183593.0, 45610.0, 16165.0, 7570.0, 4076.0, 2435.0, 1582.0, 1122.0, 749.0, 544.0, 368.0, 273.0, 189.0, 135.0, 79.0, 53.0, 49.0, 35.0, 22.0, 14.0, 17.0, 4.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.015625, -25.188232421875, -24.36083984375, -23.533447265625, -22.7060546875, -21.878662109375, -21.05126953125, -20.223876953125, -19.396484375, -18.569091796875, -17.74169921875, -16.914306640625, -16.0869140625, -15.259521484375, -14.43212890625, -13.604736328125, -12.77734375, -11.949951171875, -11.12255859375, -10.295166015625, -9.4677734375, -8.640380859375, -7.81298828125, -6.985595703125, -6.158203125, -5.330810546875, -4.50341796875, -3.676025390625, -2.8486328125, -2.021240234375, -1.19384765625, -0.366455078125, 0.4609375, 1.288330078125, 2.11572265625, 2.943115234375, 3.7705078125, 4.597900390625, 5.42529296875, 6.252685546875, 7.080078125, 7.907470703125, 8.73486328125, 9.562255859375, 10.3896484375, 11.217041015625, 12.04443359375, 12.871826171875, 13.69921875, 14.526611328125, 15.35400390625, 16.181396484375, 17.0087890625, 17.836181640625, 18.66357421875, 19.490966796875, 20.318359375, 21.145751953125, 21.97314453125, 22.800537109375, 23.6279296875, 24.455322265625, 25.28271484375, 26.110107421875, 26.9375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 22.0, 25.0, 49.0, 72.0, 158.0, 142.0, 191.0, 129.0, 65.0, 43.0, 23.0, 13.0, 9.0, 9.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017957687377929688, -0.0017336159944534302, -0.0016714632511138916, -0.001609310507774353, -0.0015471577644348145, -0.0014850050210952759, -0.0014228522777557373, -0.0013606995344161987, -0.0012985467910766602, -0.0012363940477371216, -0.001174241304397583, -0.0011120885610580444, -0.0010499358177185059, -0.0009877830743789673, -0.0009256303310394287, -0.0008634775876998901, -0.0008013248443603516, -0.000739172101020813, -0.0006770193576812744, -0.0006148666143417358, -0.0005527138710021973, -0.0004905611276626587, -0.0004284083843231201, -0.00036625564098358154, -0.00030410289764404297, -0.0002419501543045044, -0.00017979741096496582, -0.00011764466762542725, -5.549192428588867e-05, 6.660819053649902e-06, 6.881356239318848e-05, 0.00013096630573272705, 0.00019311904907226562, 0.0002552717924118042, 0.0003174245357513428, 0.00037957727909088135, 0.0004417300224304199, 0.0005038827657699585, 0.0005660355091094971, 0.0006281882524490356, 0.0006903409957885742, 0.0007524937391281128, 0.0008146464824676514, 0.0008767992258071899, 0.0009389519691467285, 0.001001104712486267, 0.0010632574558258057, 0.0011254101991653442, 0.0011875629425048828, 0.0012497156858444214, 0.00131186842918396, 0.0013740211725234985, 0.0014361739158630371, 0.0014983266592025757, 0.0015604794025421143, 0.0016226321458816528, 0.0016847848892211914, 0.00174693763256073, 0.0018090903759002686, 0.0018712431192398071, 0.0019333958625793457, 0.0019955486059188843, 0.002057701349258423, 0.0021198540925979614, 0.0021820068359375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 5.0, 15.0, 9.0, 33.0, 20.0, 37.0, 59.0, 78.0, 128.0, 146.0, 251.0, 349.0, 492.0, 762.0, 1077.0, 1626.0, 2562.0, 3965.0, 6742.0, 12235.0, 23997.0, 50282.0, 109553.0, 212634.0, 266036.0, 181143.0, 87834.0, 40570.0, 19681.0, 10244.0, 5798.0, 3423.0, 2149.0, 1472.0, 996.0, 660.0, 458.0, 321.0, 238.0, 143.0, 96.0, 72.0, 55.0, 37.0, 30.0, 13.0, 12.0, 10.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.4609375, -13.044921875, -12.62890625, -12.212890625, -11.796875, -11.380859375, -10.96484375, -10.548828125, -10.1328125, -9.716796875, -9.30078125, -8.884765625, -8.46875, -8.052734375, -7.63671875, -7.220703125, -6.8046875, -6.388671875, -5.97265625, -5.556640625, -5.140625, -4.724609375, -4.30859375, -3.892578125, -3.4765625, -3.060546875, -2.64453125, -2.228515625, -1.8125, -1.396484375, -0.98046875, -0.564453125, -0.1484375, 0.267578125, 0.68359375, 1.099609375, 1.515625, 1.931640625, 2.34765625, 2.763671875, 3.1796875, 3.595703125, 4.01171875, 4.427734375, 4.84375, 5.259765625, 5.67578125, 6.091796875, 6.5078125, 6.923828125, 7.33984375, 7.755859375, 8.171875, 8.587890625, 9.00390625, 9.419921875, 9.8359375, 10.251953125, 10.66796875, 11.083984375, 11.5, 11.916015625, 12.33203125, 12.748046875, 13.1640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 6.0, 6.0, 9.0, 6.0, 15.0, 17.0, 26.0, 47.0, 52.0, 51.0, 63.0, 84.0, 98.0, 86.0, 89.0, 73.0, 60.0, 51.0, 50.0, 39.0, 15.0, 12.0, 17.0, 5.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.55078125, -4.40447998046875, -4.2581787109375, -4.11187744140625, -3.965576171875, -3.81927490234375, -3.6729736328125, -3.52667236328125, -3.38037109375, -3.23406982421875, -3.0877685546875, -2.94146728515625, -2.795166015625, -2.64886474609375, -2.5025634765625, -2.35626220703125, -2.2099609375, -2.06365966796875, -1.9173583984375, -1.77105712890625, -1.624755859375, -1.47845458984375, -1.3321533203125, -1.18585205078125, -1.03955078125, -0.89324951171875, -0.7469482421875, -0.60064697265625, -0.454345703125, -0.30804443359375, -0.1617431640625, -0.01544189453125, 0.130859375, 0.27716064453125, 0.4234619140625, 0.56976318359375, 0.716064453125, 0.86236572265625, 1.0086669921875, 1.15496826171875, 1.30126953125, 1.44757080078125, 1.5938720703125, 1.74017333984375, 1.886474609375, 2.03277587890625, 2.1790771484375, 2.32537841796875, 2.4716796875, 2.61798095703125, 2.7642822265625, 2.91058349609375, 3.056884765625, 3.20318603515625, 3.3494873046875, 3.49578857421875, 3.64208984375, 3.78839111328125, 3.9346923828125, 4.08099365234375, 4.227294921875, 4.37359619140625, 4.5198974609375, 4.66619873046875, 4.8125]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 10.0, 12.0, 21.0, 23.0, 38.0, 29.0, 32.0, 38.0, 44.0, 55.0, 52.0, 58.0, 59.0, 61.0, 57.0, 60.0, 47.0, 42.0, 46.0, 36.0, 32.0, 23.0, 16.0, 14.0, 12.0, 17.0, 11.0, 7.0, 5.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-16.181367874145508, -15.691378593444824, -15.20138931274414, -14.711400032043457, -14.221410751342773, -13.73142147064209, -13.241432189941406, -12.751442909240723, -12.261453628540039, -11.771464347839355, -11.281475067138672, -10.791485786437988, -10.301496505737305, -9.811507225036621, -9.321517944335938, -8.831528663635254, -8.34153938293457, -7.851550102233887, -7.361560821533203, -6.8715715408325195, -6.381582260131836, -5.891592979431152, -5.401603698730469, -4.911614418029785, -4.421625137329102, -3.931635856628418, -3.4416465759277344, -2.951657295227051, -2.461668014526367, -1.9716787338256836, -1.481689453125, -0.9917001724243164, -0.5017108917236328, -0.011721611022949219, 0.4782676696777344, 0.968256950378418, 1.4582462310791016, 1.9482355117797852, 2.4382247924804688, 2.9282140731811523, 3.418203353881836, 3.9081926345825195, 4.398181915283203, 4.888171195983887, 5.37816047668457, 5.868149757385254, 6.3581390380859375, 6.848128318786621, 7.338117599487305, 7.828106880187988, 8.318096160888672, 8.808085441589355, 9.298074722290039, 9.788064002990723, 10.278053283691406, 10.76804256439209, 11.258031845092773, 11.748021125793457, 12.23801040649414, 12.727999687194824, 13.217988967895508, 13.707978248596191, 14.197967529296875, 14.687956809997559, 15.177946090698242]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 7.0, 8.0, 11.0, 15.0, 11.0, 13.0, 19.0, 31.0, 21.0, 33.0, 34.0, 33.0, 33.0, 43.0, 40.0, 44.0, 43.0, 54.0, 45.0, 43.0, 38.0, 32.0, 45.0, 31.0, 37.0, 20.0, 32.0, 26.0, 22.0, 11.0, 20.0, 13.0, 16.0, 8.0, 12.0, 11.0, 14.0, 7.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.362497329711914, -12.960062980651855, -12.557628631591797, -12.155194282531738, -11.75275993347168, -11.350325584411621, -10.947891235351562, -10.545456886291504, -10.143022537231445, -9.740588188171387, -9.338153839111328, -8.93571949005127, -8.533285140991211, -8.130850791931152, -7.728416442871094, -7.325982093811035, -6.923548221588135, -6.521113872528076, -6.118679523468018, -5.716245174407959, -5.3138108253479, -4.911376953125, -4.508942604064941, -4.106508255004883, -3.704073667526245, -3.3016393184661865, -2.899204969406128, -2.4967708587646484, -2.09433650970459, -1.6919021606445312, -1.2894678115844727, -0.8870334625244141, -0.48459911346435547, -0.08216479420661926, 0.32026952505111694, 0.7227038145065308, 1.1251381635665894, 1.5275723934173584, 1.930006742477417, 2.3324410915374756, 2.734875440597534, 3.1373097896575928, 3.5397441387176514, 3.942178249359131, 4.3446125984191895, 4.747046947479248, 5.149481296539307, 5.551915645599365, 5.954349994659424, 6.356784343719482, 6.759218692779541, 7.1616530418396, 7.564087390899658, 7.966521263122559, 8.368955612182617, 8.771389961242676, 9.173824310302734, 9.576258659362793, 9.978693008422852, 10.38112735748291, 10.783561706542969, 11.185996055603027, 11.588430404663086, 11.990864753723145, 12.393299102783203]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 5.0, 10.0, 10.0, 20.0, 25.0, 29.0, 44.0, 72.0, 114.0, 181.0, 294.0, 514.0, 795.0, 1243.0, 2022.0, 3385.0, 5457.0, 8801.0, 14388.0, 23759.0, 39408.0, 63731.0, 105313.0, 169981.0, 269879.0, 405372.0, 549206.0, 632820.0, 595264.0, 463044.0, 316672.0, 203535.0, 125419.0, 76191.0, 46232.0, 27840.0, 17054.0, 10299.0, 6105.0, 3798.0, 2362.0, 1367.0, 840.0, 550.0, 334.0, 188.0, 95.0, 78.0, 55.0, 33.0, 24.0, 13.0, 6.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.625, -9.3114013671875, -8.997802734375, -8.6842041015625, -8.37060546875, -8.0570068359375, -7.743408203125, -7.4298095703125, -7.1162109375, -6.8026123046875, -6.489013671875, -6.1754150390625, -5.86181640625, -5.5482177734375, -5.234619140625, -4.9210205078125, -4.607421875, -4.2938232421875, -3.980224609375, -3.6666259765625, -3.35302734375, -3.0394287109375, -2.725830078125, -2.4122314453125, -2.0986328125, -1.7850341796875, -1.471435546875, -1.1578369140625, -0.84423828125, -0.5306396484375, -0.217041015625, 0.0965576171875, 0.41015625, 0.7237548828125, 1.037353515625, 1.3509521484375, 1.66455078125, 1.9781494140625, 2.291748046875, 2.6053466796875, 2.9189453125, 3.2325439453125, 3.546142578125, 3.8597412109375, 4.17333984375, 4.4869384765625, 4.800537109375, 5.1141357421875, 5.427734375, 5.7413330078125, 6.054931640625, 6.3685302734375, 6.68212890625, 6.9957275390625, 7.309326171875, 7.6229248046875, 7.9365234375, 8.2501220703125, 8.563720703125, 8.8773193359375, 9.19091796875, 9.5045166015625, 9.818115234375, 10.1317138671875, 10.4453125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 3.0, 5.0, 5.0, 5.0, 11.0, 5.0, 9.0, 19.0, 11.0, 13.0, 22.0, 25.0, 23.0, 27.0, 32.0, 30.0, 38.0, 45.0, 34.0, 41.0, 35.0, 50.0, 35.0, 44.0, 39.0, 44.0, 48.0, 29.0, 30.0, 24.0, 24.0, 22.0, 26.0, 16.0, 24.0, 15.0, 10.0, 13.0, 16.0, 12.0, 6.0, 12.0, 12.0, 8.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.5078125, -8.2552490234375, -8.002685546875, -7.7501220703125, -7.49755859375, -7.2449951171875, -6.992431640625, -6.7398681640625, -6.4873046875, -6.2347412109375, -5.982177734375, -5.7296142578125, -5.47705078125, -5.2244873046875, -4.971923828125, -4.7193603515625, -4.466796875, -4.2142333984375, -3.961669921875, -3.7091064453125, -3.45654296875, -3.2039794921875, -2.951416015625, -2.6988525390625, -2.4462890625, -2.1937255859375, -1.941162109375, -1.6885986328125, -1.43603515625, -1.1834716796875, -0.930908203125, -0.6783447265625, -0.42578125, -0.1732177734375, 0.079345703125, 0.3319091796875, 0.58447265625, 0.8370361328125, 1.089599609375, 1.3421630859375, 1.5947265625, 1.8472900390625, 2.099853515625, 2.3524169921875, 2.60498046875, 2.8575439453125, 3.110107421875, 3.3626708984375, 3.615234375, 3.8677978515625, 4.120361328125, 4.3729248046875, 4.62548828125, 4.8780517578125, 5.130615234375, 5.3831787109375, 5.6357421875, 5.8883056640625, 6.140869140625, 6.3934326171875, 6.64599609375, 6.8985595703125, 7.151123046875, 7.4036865234375, 7.65625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 11.0, 17.0, 12.0, 28.0, 51.0, 65.0, 97.0, 141.0, 245.0, 344.0, 548.0, 916.0, 1414.0, 2336.0, 3885.0, 6376.0, 10329.0, 17266.0, 29029.0, 48874.0, 81396.0, 133101.0, 211735.0, 318337.0, 445237.0, 551902.0, 588140.0, 533232.0, 418878.0, 295078.0, 192461.0, 120113.0, 73015.0, 44110.0, 25864.0, 15512.0, 9329.0, 5702.0, 3406.0, 2075.0, 1399.0, 842.0, 536.0, 309.0, 199.0, 151.0, 88.0, 50.0, 33.0, 27.0, 16.0, 9.0, 9.0, 2.0, 4.0, 5.0], "bins": [-10.375, -10.0733642578125, -9.771728515625, -9.4700927734375, -9.16845703125, -8.8668212890625, -8.565185546875, -8.2635498046875, -7.9619140625, -7.6602783203125, -7.358642578125, -7.0570068359375, -6.75537109375, -6.4537353515625, -6.152099609375, -5.8504638671875, -5.548828125, -5.2471923828125, -4.945556640625, -4.6439208984375, -4.34228515625, -4.0406494140625, -3.739013671875, -3.4373779296875, -3.1357421875, -2.8341064453125, -2.532470703125, -2.2308349609375, -1.92919921875, -1.6275634765625, -1.325927734375, -1.0242919921875, -0.72265625, -0.4210205078125, -0.119384765625, 0.1822509765625, 0.48388671875, 0.7855224609375, 1.087158203125, 1.3887939453125, 1.6904296875, 1.9920654296875, 2.293701171875, 2.5953369140625, 2.89697265625, 3.1986083984375, 3.500244140625, 3.8018798828125, 4.103515625, 4.4051513671875, 4.706787109375, 5.0084228515625, 5.31005859375, 5.6116943359375, 5.913330078125, 6.2149658203125, 6.5166015625, 6.8182373046875, 7.119873046875, 7.4215087890625, 7.72314453125, 8.0247802734375, 8.326416015625, 8.6280517578125, 8.9296875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 13.0, 18.0, 11.0, 19.0, 35.0, 34.0, 42.0, 62.0, 75.0, 103.0, 117.0, 146.0, 176.0, 171.0, 192.0, 241.0, 228.0, 225.0, 220.0, 257.0, 216.0, 211.0, 231.0, 162.0, 184.0, 147.0, 98.0, 107.0, 72.0, 46.0, 49.0, 43.0, 29.0, 30.0, 16.0, 11.0, 2.0, 16.0, 6.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.09375, -4.9488525390625, -4.803955078125, -4.6590576171875, -4.51416015625, -4.3692626953125, -4.224365234375, -4.0794677734375, -3.9345703125, -3.7896728515625, -3.644775390625, -3.4998779296875, -3.35498046875, -3.2100830078125, -3.065185546875, -2.9202880859375, -2.775390625, -2.6304931640625, -2.485595703125, -2.3406982421875, -2.19580078125, -2.0509033203125, -1.906005859375, -1.7611083984375, -1.6162109375, -1.4713134765625, -1.326416015625, -1.1815185546875, -1.03662109375, -0.8917236328125, -0.746826171875, -0.6019287109375, -0.45703125, -0.3121337890625, -0.167236328125, -0.0223388671875, 0.12255859375, 0.2674560546875, 0.412353515625, 0.5572509765625, 0.7021484375, 0.8470458984375, 0.991943359375, 1.1368408203125, 1.28173828125, 1.4266357421875, 1.571533203125, 1.7164306640625, 1.861328125, 2.0062255859375, 2.151123046875, 2.2960205078125, 2.44091796875, 2.5858154296875, 2.730712890625, 2.8756103515625, 3.0205078125, 3.1654052734375, 3.310302734375, 3.4552001953125, 3.60009765625, 3.7449951171875, 3.889892578125, 4.0347900390625, 4.1796875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 12.0, 14.0, 25.0, 17.0, 24.0, 28.0, 51.0, 40.0, 48.0, 48.0, 37.0, 69.0, 58.0, 65.0, 66.0, 53.0, 61.0, 50.0, 33.0, 43.0, 25.0, 22.0, 15.0, 17.0, 19.0, 11.0, 4.0, 4.0, 7.0, 6.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.664194107055664, -14.20682144165039, -13.7494478225708, -13.292075157165527, -12.834702491760254, -12.377328872680664, -11.91995620727539, -11.462583541870117, -11.005210876464844, -10.54783821105957, -10.09046459197998, -9.633091926574707, -9.175719261169434, -8.718345642089844, -8.26097297668457, -7.803600311279297, -7.346226692199707, -6.888853549957275, -6.431480884552002, -5.97410774230957, -5.516735076904297, -5.059361934661865, -4.601988792419434, -4.14461612701416, -3.6872429847717285, -3.229870080947876, -2.7724971771240234, -2.315124034881592, -1.8577511310577393, -1.4003782272338867, -0.9430050849914551, -0.48563218116760254, -0.02825927734375, 0.4291136860847473, 0.8864866495132446, 1.3438596725463867, 1.8012325763702393, 2.258605480194092, 2.7159786224365234, 3.173351526260376, 3.6307244300842285, 4.08809757232666, 4.545470237731934, 5.002843379974365, 5.460216522216797, 5.91758918762207, 6.374962329864502, 6.832335472106934, 7.289708137512207, 7.747081279754639, 8.20445442199707, 8.661827087402344, 9.119199752807617, 9.57657241821289, 10.03394603729248, 10.491318702697754, 10.948692321777344, 11.406064987182617, 11.863438606262207, 12.32081127166748, 12.778183937072754, 13.235557556152344, 13.692930221557617, 14.15030288696289, 14.607675552368164]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 4.0, 8.0, 7.0, 8.0, 14.0, 11.0, 17.0, 25.0, 19.0, 26.0, 27.0, 34.0, 44.0, 33.0, 40.0, 29.0, 32.0, 42.0, 40.0, 48.0, 47.0, 42.0, 29.0, 43.0, 31.0, 34.0, 34.0, 34.0, 17.0, 25.0, 23.0, 25.0, 18.0, 11.0, 18.0, 18.0, 9.0, 9.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.138998031616211, -10.810748100280762, -10.482499122619629, -10.15424919128418, -9.826000213623047, -9.497750282287598, -9.169501304626465, -8.841251373291016, -8.513002395629883, -8.184752464294434, -7.856503486633301, -7.52825403213501, -7.200004577636719, -6.871755123138428, -6.543505668640137, -6.2152557373046875, -5.8870062828063965, -5.5587568283081055, -5.2305073738098145, -4.902257919311523, -4.574008464813232, -4.245759010314941, -3.9175093173980713, -3.5892598628997803, -3.2610104084014893, -2.9327609539031982, -2.6045114994049072, -2.276261806488037, -1.9480124711990356, -1.6197630167007446, -1.291513442993164, -0.963263988494873, -0.635014533996582, -0.30676504969596863, 0.021484434604644775, 0.34973394870758057, 0.6779834032058716, 1.0062328577041626, 1.3344824314117432, 1.6627318859100342, 1.9909813404083252, 2.319230794906616, 2.6474802494049072, 2.9757299423217773, 3.3039793968200684, 3.6322288513183594, 3.9604783058166504, 4.288727760314941, 4.616977214813232, 4.945226669311523, 5.2734761238098145, 5.6017255783081055, 5.9299750328063965, 6.2582244873046875, 6.586474418640137, 6.9147233963012695, 7.242973327636719, 7.57122278213501, 7.899472236633301, 8.22772216796875, 8.555971145629883, 8.884221076965332, 9.212470054626465, 9.540719985961914, 9.868968963623047]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 5.0, 22.0, 21.0, 23.0, 35.0, 39.0, 73.0, 104.0, 161.0, 221.0, 342.0, 471.0, 649.0, 1011.0, 1623.0, 2412.0, 3730.0, 5790.0, 8932.0, 14209.0, 22620.0, 35864.0, 56395.0, 87055.0, 125747.0, 157606.0, 157737.0, 125611.0, 86528.0, 55864.0, 35581.0, 22211.0, 14010.0, 9067.0, 5805.0, 3761.0, 2379.0, 1578.0, 1010.0, 680.0, 455.0, 342.0, 222.0, 159.0, 121.0, 79.0, 57.0, 38.0, 35.0, 23.0, 11.0, 7.0, 9.0, 3.0, 4.0, 1.0, 3.0], "bins": [-2.986328125, -2.89581298828125, -2.8052978515625, -2.71478271484375, -2.624267578125, -2.53375244140625, -2.4432373046875, -2.35272216796875, -2.26220703125, -2.17169189453125, -2.0811767578125, -1.99066162109375, -1.900146484375, -1.80963134765625, -1.7191162109375, -1.62860107421875, -1.5380859375, -1.44757080078125, -1.3570556640625, -1.26654052734375, -1.176025390625, -1.08551025390625, -0.9949951171875, -0.90447998046875, -0.81396484375, -0.72344970703125, -0.6329345703125, -0.54241943359375, -0.451904296875, -0.36138916015625, -0.2708740234375, -0.18035888671875, -0.08984375, 0.00067138671875, 0.0911865234375, 0.18170166015625, 0.272216796875, 0.36273193359375, 0.4532470703125, 0.54376220703125, 0.63427734375, 0.72479248046875, 0.8153076171875, 0.90582275390625, 0.996337890625, 1.08685302734375, 1.1773681640625, 1.26788330078125, 1.3583984375, 1.44891357421875, 1.5394287109375, 1.62994384765625, 1.720458984375, 1.81097412109375, 1.9014892578125, 1.99200439453125, 2.08251953125, 2.17303466796875, 2.2635498046875, 2.35406494140625, 2.444580078125, 2.53509521484375, 2.6256103515625, 2.71612548828125, 2.806640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 7.0, 7.0, 10.0, 8.0, 9.0, 18.0, 13.0, 26.0, 21.0, 30.0, 31.0, 28.0, 30.0, 33.0, 40.0, 37.0, 31.0, 40.0, 37.0, 42.0, 46.0, 39.0, 35.0, 36.0, 32.0, 36.0, 33.0, 26.0, 32.0, 26.0, 22.0, 21.0, 15.0, 18.0, 22.0, 17.0, 11.0, 13.0, 5.0, 6.0, 5.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.3046875, -9.972900390625, -9.64111328125, -9.309326171875, -8.9775390625, -8.645751953125, -8.31396484375, -7.982177734375, -7.650390625, -7.318603515625, -6.98681640625, -6.655029296875, -6.3232421875, -5.991455078125, -5.65966796875, -5.327880859375, -4.99609375, -4.664306640625, -4.33251953125, -4.000732421875, -3.6689453125, -3.337158203125, -3.00537109375, -2.673583984375, -2.341796875, -2.010009765625, -1.67822265625, -1.346435546875, -1.0146484375, -0.682861328125, -0.35107421875, -0.019287109375, 0.3125, 0.644287109375, 0.97607421875, 1.307861328125, 1.6396484375, 1.971435546875, 2.30322265625, 2.635009765625, 2.966796875, 3.298583984375, 3.63037109375, 3.962158203125, 4.2939453125, 4.625732421875, 4.95751953125, 5.289306640625, 5.62109375, 5.952880859375, 6.28466796875, 6.616455078125, 6.9482421875, 7.280029296875, 7.61181640625, 7.943603515625, 8.275390625, 8.607177734375, 8.93896484375, 9.270751953125, 9.6025390625, 9.934326171875, 10.26611328125, 10.597900390625, 10.9296875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 11.0, 11.0, 18.0, 26.0, 35.0, 46.0, 89.0, 135.0, 172.0, 290.0, 502.0, 862.0, 1439.0, 2527.0, 4366.0, 7901.0, 15088.0, 28608.0, 56181.0, 105824.0, 182706.0, 233140.0, 182809.0, 106467.0, 56305.0, 29161.0, 15107.0, 8066.0, 4457.0, 2529.0, 1452.0, 865.0, 481.0, 294.0, 192.0, 144.0, 70.0, 58.0, 39.0, 24.0, 18.0, 13.0, 2.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.04296875, -3.92230224609375, -3.8016357421875, -3.68096923828125, -3.560302734375, -3.43963623046875, -3.3189697265625, -3.19830322265625, -3.07763671875, -2.95697021484375, -2.8363037109375, -2.71563720703125, -2.594970703125, -2.47430419921875, -2.3536376953125, -2.23297119140625, -2.1123046875, -1.99163818359375, -1.8709716796875, -1.75030517578125, -1.629638671875, -1.50897216796875, -1.3883056640625, -1.26763916015625, -1.14697265625, -1.02630615234375, -0.9056396484375, -0.78497314453125, -0.664306640625, -0.54364013671875, -0.4229736328125, -0.30230712890625, -0.181640625, -0.06097412109375, 0.0596923828125, 0.18035888671875, 0.301025390625, 0.42169189453125, 0.5423583984375, 0.66302490234375, 0.78369140625, 0.90435791015625, 1.0250244140625, 1.14569091796875, 1.266357421875, 1.38702392578125, 1.5076904296875, 1.62835693359375, 1.7490234375, 1.86968994140625, 1.9903564453125, 2.11102294921875, 2.231689453125, 2.35235595703125, 2.4730224609375, 2.59368896484375, 2.71435546875, 2.83502197265625, 2.9556884765625, 3.07635498046875, 3.197021484375, 3.31768798828125, 3.4383544921875, 3.55902099609375, 3.6796875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 4.0, 9.0, 4.0, 4.0, 11.0, 6.0, 11.0, 21.0, 18.0, 15.0, 20.0, 20.0, 32.0, 22.0, 40.0, 37.0, 28.0, 34.0, 43.0, 37.0, 43.0, 39.0, 50.0, 38.0, 40.0, 39.0, 33.0, 35.0, 33.0, 36.0, 31.0, 32.0, 8.0, 16.0, 23.0, 19.0, 18.0, 7.0, 7.0, 11.0, 9.0, 6.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.609375, -6.39508056640625, -6.1807861328125, -5.96649169921875, -5.752197265625, -5.53790283203125, -5.3236083984375, -5.10931396484375, -4.89501953125, -4.68072509765625, -4.4664306640625, -4.25213623046875, -4.037841796875, -3.82354736328125, -3.6092529296875, -3.39495849609375, -3.1806640625, -2.96636962890625, -2.7520751953125, -2.53778076171875, -2.323486328125, -2.10919189453125, -1.8948974609375, -1.68060302734375, -1.46630859375, -1.25201416015625, -1.0377197265625, -0.82342529296875, -0.609130859375, -0.39483642578125, -0.1805419921875, 0.03375244140625, 0.248046875, 0.46234130859375, 0.6766357421875, 0.89093017578125, 1.105224609375, 1.31951904296875, 1.5338134765625, 1.74810791015625, 1.96240234375, 2.17669677734375, 2.3909912109375, 2.60528564453125, 2.819580078125, 3.03387451171875, 3.2481689453125, 3.46246337890625, 3.6767578125, 3.89105224609375, 4.1053466796875, 4.31964111328125, 4.533935546875, 4.74822998046875, 4.9625244140625, 5.17681884765625, 5.39111328125, 5.60540771484375, 5.8197021484375, 6.03399658203125, 6.248291015625, 6.46258544921875, 6.6768798828125, 6.89117431640625, 7.10546875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 4.0, 10.0, 24.0, 23.0, 35.0, 53.0, 75.0, 123.0, 179.0, 313.0, 583.0, 934.0, 1645.0, 3462.0, 7886.0, 20622.0, 64336.0, 223367.0, 424487.0, 206252.0, 60097.0, 19382.0, 7476.0, 3294.0, 1642.0, 869.0, 486.0, 301.0, 210.0, 143.0, 71.0, 61.0, 28.0, 24.0, 13.0, 9.0, 9.0, 5.0, 2.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8408203125, -1.78411865234375, -1.7274169921875, -1.67071533203125, -1.614013671875, -1.55731201171875, -1.5006103515625, -1.44390869140625, -1.38720703125, -1.33050537109375, -1.2738037109375, -1.21710205078125, -1.160400390625, -1.10369873046875, -1.0469970703125, -0.99029541015625, -0.93359375, -0.87689208984375, -0.8201904296875, -0.76348876953125, -0.706787109375, -0.65008544921875, -0.5933837890625, -0.53668212890625, -0.47998046875, -0.42327880859375, -0.3665771484375, -0.30987548828125, -0.253173828125, -0.19647216796875, -0.1397705078125, -0.08306884765625, -0.0263671875, 0.03033447265625, 0.0870361328125, 0.14373779296875, 0.200439453125, 0.25714111328125, 0.3138427734375, 0.37054443359375, 0.42724609375, 0.48394775390625, 0.5406494140625, 0.59735107421875, 0.654052734375, 0.71075439453125, 0.7674560546875, 0.82415771484375, 0.880859375, 0.93756103515625, 0.9942626953125, 1.05096435546875, 1.107666015625, 1.16436767578125, 1.2210693359375, 1.27777099609375, 1.33447265625, 1.39117431640625, 1.4478759765625, 1.50457763671875, 1.561279296875, 1.61798095703125, 1.6746826171875, 1.73138427734375, 1.7880859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 2.0, 8.0, 7.0, 7.0, 12.0, 20.0, 18.0, 23.0, 25.0, 22.0, 34.0, 38.0, 33.0, 47.0, 50.0, 51.0, 60.0, 65.0, 69.0, 56.0, 54.0, 54.0, 36.0, 33.0, 32.0, 35.0, 20.0, 15.0, 19.0, 11.0, 8.0, 7.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.965066909790039e-05, -4.78941947221756e-05, -4.6137720346450806e-05, -4.438124597072601e-05, -4.262477159500122e-05, -4.086829721927643e-05, -3.9111822843551636e-05, -3.735534846782684e-05, -3.559887409210205e-05, -3.384239971637726e-05, -3.2085925340652466e-05, -3.0329450964927673e-05, -2.857297658920288e-05, -2.681650221347809e-05, -2.5060027837753296e-05, -2.3303553462028503e-05, -2.154707908630371e-05, -1.979060471057892e-05, -1.8034130334854126e-05, -1.6277655959129333e-05, -1.4521181583404541e-05, -1.2764707207679749e-05, -1.1008232831954956e-05, -9.251758456230164e-06, -7.495284080505371e-06, -5.738809704780579e-06, -3.982335329055786e-06, -2.2258609533309937e-06, -4.6938657760620117e-07, 1.2870877981185913e-06, 3.043562173843384e-06, 4.800036549568176e-06, 6.556510925292969e-06, 8.312985301017761e-06, 1.0069459676742554e-05, 1.1825934052467346e-05, 1.3582408428192139e-05, 1.533888280391693e-05, 1.7095357179641724e-05, 1.8851831555366516e-05, 2.060830593109131e-05, 2.23647803068161e-05, 2.4121254682540894e-05, 2.5877729058265686e-05, 2.763420343399048e-05, 2.939067780971527e-05, 3.1147152185440063e-05, 3.2903626561164856e-05, 3.466010093688965e-05, 3.641657531261444e-05, 3.8173049688339233e-05, 3.9929524064064026e-05, 4.168599843978882e-05, 4.344247281551361e-05, 4.51989471912384e-05, 4.6955421566963196e-05, 4.871189594268799e-05, 5.046837031841278e-05, 5.222484469413757e-05, 5.3981319069862366e-05, 5.573779344558716e-05, 5.749426782131195e-05, 5.925074219703674e-05, 6.1007216572761536e-05, 6.276369094848633e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 6.0, 3.0, 4.0, 7.0, 11.0, 13.0, 18.0, 31.0, 43.0, 56.0, 106.0, 190.0, 299.0, 539.0, 911.0, 1638.0, 3089.0, 5677.0, 11189.0, 22688.0, 48330.0, 109929.0, 235858.0, 298490.0, 168225.0, 73873.0, 33609.0, 16053.0, 8169.0, 4206.0, 2205.0, 1323.0, 729.0, 424.0, 246.0, 131.0, 79.0, 52.0, 41.0, 21.0, 19.0, 12.0, 3.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3486328125, -1.299163818359375, -1.24969482421875, -1.200225830078125, -1.1507568359375, -1.101287841796875, -1.05181884765625, -1.002349853515625, -0.952880859375, -0.903411865234375, -0.85394287109375, -0.804473876953125, -0.7550048828125, -0.705535888671875, -0.65606689453125, -0.606597900390625, -0.55712890625, -0.507659912109375, -0.45819091796875, -0.408721923828125, -0.3592529296875, -0.309783935546875, -0.26031494140625, -0.210845947265625, -0.161376953125, -0.111907958984375, -0.06243896484375, -0.012969970703125, 0.0364990234375, 0.085968017578125, 0.13543701171875, 0.184906005859375, 0.234375, 0.283843994140625, 0.33331298828125, 0.382781982421875, 0.4322509765625, 0.481719970703125, 0.53118896484375, 0.580657958984375, 0.630126953125, 0.679595947265625, 0.72906494140625, 0.778533935546875, 0.8280029296875, 0.877471923828125, 0.92694091796875, 0.976409912109375, 1.02587890625, 1.075347900390625, 1.12481689453125, 1.174285888671875, 1.2237548828125, 1.273223876953125, 1.32269287109375, 1.372161865234375, 1.421630859375, 1.471099853515625, 1.52056884765625, 1.570037841796875, 1.6195068359375, 1.668975830078125, 1.71844482421875, 1.767913818359375, 1.8173828125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 5.0, 5.0, 9.0, 9.0, 15.0, 17.0, 23.0, 29.0, 27.0, 35.0, 36.0, 54.0, 57.0, 56.0, 62.0, 61.0, 70.0, 64.0, 71.0, 52.0, 45.0, 38.0, 39.0, 29.0, 15.0, 23.0, 13.0, 9.0, 10.0, 5.0, 5.0, 2.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.537109375, -0.5211334228515625, -0.505157470703125, -0.4891815185546875, -0.47320556640625, -0.4572296142578125, -0.441253662109375, -0.4252777099609375, -0.4093017578125, -0.3933258056640625, -0.377349853515625, -0.3613739013671875, -0.34539794921875, -0.3294219970703125, -0.313446044921875, -0.2974700927734375, -0.281494140625, -0.2655181884765625, -0.249542236328125, -0.2335662841796875, -0.21759033203125, -0.2016143798828125, -0.185638427734375, -0.1696624755859375, -0.1536865234375, -0.1377105712890625, -0.121734619140625, -0.1057586669921875, -0.08978271484375, -0.0738067626953125, -0.057830810546875, -0.0418548583984375, -0.02587890625, -0.0099029541015625, 0.006072998046875, 0.0220489501953125, 0.03802490234375, 0.0540008544921875, 0.069976806640625, 0.0859527587890625, 0.1019287109375, 0.1179046630859375, 0.133880615234375, 0.1498565673828125, 0.16583251953125, 0.1818084716796875, 0.197784423828125, 0.2137603759765625, 0.229736328125, 0.2457122802734375, 0.261688232421875, 0.2776641845703125, 0.29364013671875, 0.3096160888671875, 0.325592041015625, 0.3415679931640625, 0.3575439453125, 0.3735198974609375, 0.389495849609375, 0.4054718017578125, 0.42144775390625, 0.4374237060546875, 0.453399658203125, 0.4693756103515625, 0.4853515625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 20.0, 19.0, 15.0, 30.0, 37.0, 49.0, 44.0, 40.0, 46.0, 57.0, 67.0, 63.0, 72.0, 56.0, 61.0, 55.0, 39.0, 37.0, 37.0, 25.0, 17.0, 15.0, 20.0, 13.0, 7.0, 3.0, 5.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.116645812988281, -14.653024673461914, -14.18940258026123, -13.725781440734863, -13.26215934753418, -12.798538208007812, -12.334917068481445, -11.871294975280762, -11.407672882080078, -10.944051742553711, -10.480429649353027, -10.01680850982666, -9.553186416625977, -9.08956527709961, -8.625944137573242, -8.162322044372559, -7.698700904846191, -7.235079288482666, -6.771457672119141, -6.307836532592773, -5.84421443939209, -5.380593299865723, -4.916971683502197, -4.453350067138672, -3.9897284507751465, -3.526106834411621, -3.0624852180480957, -2.5988638401031494, -2.135242223739624, -1.6716206073760986, -1.2079992294311523, -0.744377613067627, -0.28075504302978516, 0.18286651372909546, 0.6464880704879761, 1.110109567642212, 1.5737311840057373, 2.0373528003692627, 2.500974178314209, 2.9645957946777344, 3.4282174110412598, 3.891839027404785, 4.3554606437683105, 4.819082260131836, 5.282703399658203, 5.746325492858887, 6.209946632385254, 6.673568248748779, 7.137189865112305, 7.60081148147583, 8.064433097839355, 8.528054237365723, 8.991676330566406, 9.455297470092773, 9.91891860961914, 10.382540702819824, 10.846162796020508, 11.309783935546875, 11.773406028747559, 12.237027168273926, 12.70064926147461, 13.164270401000977, 13.627891540527344, 14.091513633728027, 14.555134773254395]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 9.0, 4.0, 7.0, 7.0, 11.0, 15.0, 10.0, 21.0, 21.0, 19.0, 22.0, 36.0, 33.0, 43.0, 34.0, 33.0, 32.0, 34.0, 44.0, 38.0, 48.0, 54.0, 38.0, 31.0, 32.0, 37.0, 35.0, 34.0, 28.0, 21.0, 26.0, 22.0, 23.0, 18.0, 13.0, 20.0, 12.0, 12.0, 7.0, 5.0, 6.0, 3.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.011168479919434, -10.68464183807373, -10.358116149902344, -10.03158950805664, -9.705062866210938, -9.378536224365234, -9.052009582519531, -8.725483894348145, -8.398957252502441, -8.072430610656738, -7.745904445648193, -7.419378280639648, -7.092851638793945, -6.766324996948242, -6.439798831939697, -6.113272666931152, -5.786746025085449, -5.460219383239746, -5.133693218231201, -4.807167053222656, -4.480640411376953, -4.15411376953125, -3.827587604522705, -3.501061201095581, -3.174534797668457, -2.848008394241333, -2.521481990814209, -2.194955587387085, -1.868429183959961, -1.541902780532837, -1.215376377105713, -0.8888499736785889, -0.5623235702514648, -0.23579716682434082, 0.0907292366027832, 0.4172556400299072, 0.7437820434570312, 1.0703084468841553, 1.3968348503112793, 1.7233612537384033, 2.0498876571655273, 2.3764140605926514, 2.7029404640197754, 3.0294668674468994, 3.3559932708740234, 3.6825196743011475, 4.0090460777282715, 4.335572242736816, 4.6620988845825195, 4.988625526428223, 5.315151691436768, 5.6416778564453125, 5.968204498291016, 6.294731140136719, 6.621257305145264, 6.947783470153809, 7.274310111999512, 7.600836753845215, 7.92736291885376, 8.253889083862305, 8.580415725708008, 8.906942367553711, 9.233469009399414, 9.5599946975708, 9.886521339416504]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 8.0, 10.0, 13.0, 20.0, 27.0, 54.0, 60.0, 122.0, 147.0, 253.0, 388.0, 574.0, 930.0, 1478.0, 2372.0, 3738.0, 6314.0, 10142.0, 17390.0, 28401.0, 45508.0, 70989.0, 103385.0, 133663.0, 150149.0, 141431.0, 112981.0, 80163.0, 53227.0, 33198.0, 20302.0, 11984.0, 7248.0, 4476.0, 2773.0, 1668.0, 1079.0, 687.0, 439.0, 310.0, 154.0, 122.0, 67.0, 40.0, 29.0, 20.0, 12.0, 11.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.5303955078125, -9.185791015625, -8.8411865234375, -8.49658203125, -8.1519775390625, -7.807373046875, -7.4627685546875, -7.1181640625, -6.7735595703125, -6.428955078125, -6.0843505859375, -5.73974609375, -5.3951416015625, -5.050537109375, -4.7059326171875, -4.361328125, -4.0167236328125, -3.672119140625, -3.3275146484375, -2.98291015625, -2.6383056640625, -2.293701171875, -1.9490966796875, -1.6044921875, -1.2598876953125, -0.915283203125, -0.5706787109375, -0.22607421875, 0.1185302734375, 0.463134765625, 0.8077392578125, 1.15234375, 1.4969482421875, 1.841552734375, 2.1861572265625, 2.53076171875, 2.8753662109375, 3.219970703125, 3.5645751953125, 3.9091796875, 4.2537841796875, 4.598388671875, 4.9429931640625, 5.28759765625, 5.6322021484375, 5.976806640625, 6.3214111328125, 6.666015625, 7.0106201171875, 7.355224609375, 7.6998291015625, 8.04443359375, 8.3890380859375, 8.733642578125, 9.0782470703125, 9.4228515625, 9.7674560546875, 10.112060546875, 10.4566650390625, 10.80126953125, 11.1458740234375, 11.490478515625, 11.8350830078125, 12.1796875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 4.0, 12.0, 11.0, 6.0, 16.0, 15.0, 13.0, 20.0, 20.0, 18.0, 19.0, 40.0, 42.0, 29.0, 39.0, 40.0, 36.0, 42.0, 46.0, 44.0, 33.0, 49.0, 38.0, 33.0, 34.0, 30.0, 34.0, 28.0, 26.0, 22.0, 27.0, 26.0, 23.0, 9.0, 10.0, 10.0, 15.0, 12.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-10.671875, -10.3480224609375, -10.024169921875, -9.7003173828125, -9.37646484375, -9.0526123046875, -8.728759765625, -8.4049072265625, -8.0810546875, -7.7572021484375, -7.433349609375, -7.1094970703125, -6.78564453125, -6.4617919921875, -6.137939453125, -5.8140869140625, -5.490234375, -5.1663818359375, -4.842529296875, -4.5186767578125, -4.19482421875, -3.8709716796875, -3.547119140625, -3.2232666015625, -2.8994140625, -2.5755615234375, -2.251708984375, -1.9278564453125, -1.60400390625, -1.2801513671875, -0.956298828125, -0.6324462890625, -0.30859375, 0.0152587890625, 0.339111328125, 0.6629638671875, 0.98681640625, 1.3106689453125, 1.634521484375, 1.9583740234375, 2.2822265625, 2.6060791015625, 2.929931640625, 3.2537841796875, 3.57763671875, 3.9014892578125, 4.225341796875, 4.5491943359375, 4.873046875, 5.1968994140625, 5.520751953125, 5.8446044921875, 6.16845703125, 6.4923095703125, 6.816162109375, 7.1400146484375, 7.4638671875, 7.7877197265625, 8.111572265625, 8.4354248046875, 8.75927734375, 9.0831298828125, 9.406982421875, 9.7308349609375, 10.0546875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [5.0, 2.0, 7.0, 7.0, 7.0, 10.0, 22.0, 25.0, 39.0, 53.0, 99.0, 114.0, 158.0, 303.0, 416.0, 606.0, 1003.0, 1603.0, 2540.0, 4079.0, 6798.0, 11066.0, 17795.0, 28655.0, 45577.0, 69033.0, 97844.0, 126721.0, 142268.0, 137320.0, 114041.0, 84761.0, 57894.0, 36583.0, 23349.0, 14205.0, 8809.0, 5474.0, 3444.0, 2099.0, 1281.0, 834.0, 560.0, 339.0, 240.0, 155.0, 124.0, 71.0, 52.0, 33.0, 17.0, 13.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.88330078125, -8.5634765625, -8.24365234375, -7.923828125, -7.60400390625, -7.2841796875, -6.96435546875, -6.64453125, -6.32470703125, -6.0048828125, -5.68505859375, -5.365234375, -5.04541015625, -4.7255859375, -4.40576171875, -4.0859375, -3.76611328125, -3.4462890625, -3.12646484375, -2.806640625, -2.48681640625, -2.1669921875, -1.84716796875, -1.52734375, -1.20751953125, -0.8876953125, -0.56787109375, -0.248046875, 0.07177734375, 0.3916015625, 0.71142578125, 1.03125, 1.35107421875, 1.6708984375, 1.99072265625, 2.310546875, 2.63037109375, 2.9501953125, 3.27001953125, 3.58984375, 3.90966796875, 4.2294921875, 4.54931640625, 4.869140625, 5.18896484375, 5.5087890625, 5.82861328125, 6.1484375, 6.46826171875, 6.7880859375, 7.10791015625, 7.427734375, 7.74755859375, 8.0673828125, 8.38720703125, 8.70703125, 9.02685546875, 9.3466796875, 9.66650390625, 9.986328125, 10.30615234375, 10.6259765625, 10.94580078125, 11.265625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 6.0, 10.0, 4.0, 16.0, 5.0, 8.0, 12.0, 17.0, 22.0, 17.0, 27.0, 28.0, 24.0, 33.0, 40.0, 32.0, 46.0, 41.0, 34.0, 44.0, 51.0, 30.0, 51.0, 35.0, 29.0, 39.0, 35.0, 26.0, 39.0, 26.0, 24.0, 16.0, 16.0, 22.0, 17.0, 10.0, 12.0, 9.0, 14.0, 9.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.1658935546875, -5.964599609375, -5.7633056640625, -5.56201171875, -5.3607177734375, -5.159423828125, -4.9581298828125, -4.7568359375, -4.5555419921875, -4.354248046875, -4.1529541015625, -3.95166015625, -3.7503662109375, -3.549072265625, -3.3477783203125, -3.146484375, -2.9451904296875, -2.743896484375, -2.5426025390625, -2.34130859375, -2.1400146484375, -1.938720703125, -1.7374267578125, -1.5361328125, -1.3348388671875, -1.133544921875, -0.9322509765625, -0.73095703125, -0.5296630859375, -0.328369140625, -0.1270751953125, 0.07421875, 0.2755126953125, 0.476806640625, 0.6781005859375, 0.87939453125, 1.0806884765625, 1.281982421875, 1.4832763671875, 1.6845703125, 1.8858642578125, 2.087158203125, 2.2884521484375, 2.48974609375, 2.6910400390625, 2.892333984375, 3.0936279296875, 3.294921875, 3.4962158203125, 3.697509765625, 3.8988037109375, 4.10009765625, 4.3013916015625, 4.502685546875, 4.7039794921875, 4.9052734375, 5.1065673828125, 5.307861328125, 5.5091552734375, 5.71044921875, 5.9117431640625, 6.113037109375, 6.3143310546875, 6.515625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 7.0, 3.0, 13.0, 21.0, 15.0, 34.0, 46.0, 73.0, 110.0, 140.0, 191.0, 305.0, 444.0, 586.0, 881.0, 1342.0, 2060.0, 3118.0, 5049.0, 7961.0, 12936.0, 21369.0, 35930.0, 61446.0, 102221.0, 154415.0, 187464.0, 164235.0, 113253.0, 69072.0, 40940.0, 24033.0, 14212.0, 8741.0, 5557.0, 3423.0, 2298.0, 1460.0, 1000.0, 669.0, 436.0, 316.0, 231.0, 153.0, 90.0, 86.0, 57.0, 38.0, 25.0, 18.0, 13.0, 7.0, 9.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.5703125, -8.3074951171875, -8.044677734375, -7.7818603515625, -7.51904296875, -7.2562255859375, -6.993408203125, -6.7305908203125, -6.4677734375, -6.2049560546875, -5.942138671875, -5.6793212890625, -5.41650390625, -5.1536865234375, -4.890869140625, -4.6280517578125, -4.365234375, -4.1024169921875, -3.839599609375, -3.5767822265625, -3.31396484375, -3.0511474609375, -2.788330078125, -2.5255126953125, -2.2626953125, -1.9998779296875, -1.737060546875, -1.4742431640625, -1.21142578125, -0.9486083984375, -0.685791015625, -0.4229736328125, -0.16015625, 0.1026611328125, 0.365478515625, 0.6282958984375, 0.89111328125, 1.1539306640625, 1.416748046875, 1.6795654296875, 1.9423828125, 2.2052001953125, 2.468017578125, 2.7308349609375, 2.99365234375, 3.2564697265625, 3.519287109375, 3.7821044921875, 4.044921875, 4.3077392578125, 4.570556640625, 4.8333740234375, 5.09619140625, 5.3590087890625, 5.621826171875, 5.8846435546875, 6.1474609375, 6.4102783203125, 6.673095703125, 6.9359130859375, 7.19873046875, 7.4615478515625, 7.724365234375, 7.9871826171875, 8.25]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 11.0, 8.0, 9.0, 8.0, 20.0, 19.0, 32.0, 54.0, 53.0, 72.0, 80.0, 74.0, 89.0, 71.0, 78.0, 71.0, 57.0, 41.0, 45.0, 32.0, 23.0, 11.0, 9.0, 4.0, 7.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008616447448730469, -0.0008344501256942749, -0.0008072555065155029, -0.000780060887336731, -0.000752866268157959, -0.000725671648979187, -0.000698477029800415, -0.0006712824106216431, -0.0006440877914428711, -0.0006168931722640991, -0.0005896985530853271, -0.0005625039339065552, -0.0005353093147277832, -0.0005081146955490112, -0.00048092007637023926, -0.0004537254571914673, -0.0004265308380126953, -0.00039933621883392334, -0.00037214159965515137, -0.0003449469804763794, -0.0003177523612976074, -0.00029055774211883545, -0.0002633631229400635, -0.0002361685037612915, -0.00020897388458251953, -0.00018177926540374756, -0.00015458464622497559, -0.0001273900270462036, -0.00010019540786743164, -7.300078868865967e-05, -4.5806169509887695e-05, -1.8611550331115723e-05, 8.58306884765625e-06, 3.577768802642822e-05, 6.29723072052002e-05, 9.016692638397217e-05, 0.00011736154556274414, 0.0001445561647415161, 0.00017175078392028809, 0.00019894540309906006, 0.00022614002227783203, 0.000253334641456604, 0.000280529260635376, 0.00030772387981414795, 0.0003349184989929199, 0.0003621131181716919, 0.00038930773735046387, 0.00041650235652923584, 0.0004436969757080078, 0.0004708915948867798, 0.0004980862140655518, 0.0005252808332443237, 0.0005524754524230957, 0.0005796700716018677, 0.0006068646907806396, 0.0006340593099594116, 0.0006612539291381836, 0.0006884485483169556, 0.0007156431674957275, 0.0007428377866744995, 0.0007700324058532715, 0.0007972270250320435, 0.0008244216442108154, 0.0008516162633895874, 0.0008788108825683594]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 14.0, 19.0, 21.0, 39.0, 46.0, 54.0, 90.0, 156.0, 209.0, 302.0, 501.0, 693.0, 1124.0, 1863.0, 3014.0, 5097.0, 8594.0, 15482.0, 28155.0, 51374.0, 92652.0, 153653.0, 203741.0, 189273.0, 127324.0, 72652.0, 40563.0, 21893.0, 12188.0, 6892.0, 4050.0, 2499.0, 1498.0, 929.0, 669.0, 391.0, 271.0, 174.0, 123.0, 88.0, 49.0, 50.0, 23.0, 28.0, 11.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.328125, -9.043701171875, -8.75927734375, -8.474853515625, -8.1904296875, -7.906005859375, -7.62158203125, -7.337158203125, -7.052734375, -6.768310546875, -6.48388671875, -6.199462890625, -5.9150390625, -5.630615234375, -5.34619140625, -5.061767578125, -4.77734375, -4.492919921875, -4.20849609375, -3.924072265625, -3.6396484375, -3.355224609375, -3.07080078125, -2.786376953125, -2.501953125, -2.217529296875, -1.93310546875, -1.648681640625, -1.3642578125, -1.079833984375, -0.79541015625, -0.510986328125, -0.2265625, 0.057861328125, 0.34228515625, 0.626708984375, 0.9111328125, 1.195556640625, 1.47998046875, 1.764404296875, 2.048828125, 2.333251953125, 2.61767578125, 2.902099609375, 3.1865234375, 3.470947265625, 3.75537109375, 4.039794921875, 4.32421875, 4.608642578125, 4.89306640625, 5.177490234375, 5.4619140625, 5.746337890625, 6.03076171875, 6.315185546875, 6.599609375, 6.884033203125, 7.16845703125, 7.452880859375, 7.7373046875, 8.021728515625, 8.30615234375, 8.590576171875, 8.875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 7.0, 11.0, 4.0, 13.0, 16.0, 13.0, 21.0, 20.0, 36.0, 37.0, 30.0, 40.0, 52.0, 55.0, 59.0, 49.0, 65.0, 85.0, 61.0, 58.0, 45.0, 34.0, 37.0, 32.0, 20.0, 13.0, 16.0, 8.0, 13.0, 14.0, 9.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.560546875, -2.4774169921875, -2.394287109375, -2.3111572265625, -2.22802734375, -2.1448974609375, -2.061767578125, -1.9786376953125, -1.8955078125, -1.8123779296875, -1.729248046875, -1.6461181640625, -1.56298828125, -1.4798583984375, -1.396728515625, -1.3135986328125, -1.23046875, -1.1473388671875, -1.064208984375, -0.9810791015625, -0.89794921875, -0.8148193359375, -0.731689453125, -0.6485595703125, -0.5654296875, -0.4822998046875, -0.399169921875, -0.3160400390625, -0.23291015625, -0.1497802734375, -0.066650390625, 0.0164794921875, 0.099609375, 0.1827392578125, 0.265869140625, 0.3489990234375, 0.43212890625, 0.5152587890625, 0.598388671875, 0.6815185546875, 0.7646484375, 0.8477783203125, 0.930908203125, 1.0140380859375, 1.09716796875, 1.1802978515625, 1.263427734375, 1.3465576171875, 1.4296875, 1.5128173828125, 1.595947265625, 1.6790771484375, 1.76220703125, 1.8453369140625, 1.928466796875, 2.0115966796875, 2.0947265625, 2.1778564453125, 2.260986328125, 2.3441162109375, 2.42724609375, 2.5103759765625, 2.593505859375, 2.6766357421875, 2.759765625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 10.0, 9.0, 5.0, 14.0, 16.0, 21.0, 15.0, 30.0, 26.0, 56.0, 38.0, 59.0, 50.0, 54.0, 62.0, 74.0, 60.0, 70.0, 65.0, 40.0, 38.0, 33.0, 33.0, 22.0, 21.0, 19.0, 16.0, 9.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.324382781982422, -15.844747543334961, -15.365111351013184, -14.885476112365723, -14.405840873718262, -13.926204681396484, -13.446569442749023, -12.966934204101562, -12.487298965454102, -12.00766372680664, -11.528027534484863, -11.048392295837402, -10.568757057189941, -10.089120864868164, -9.609485626220703, -9.129850387573242, -8.650215148925781, -8.17057991027832, -7.690944194793701, -7.211308479309082, -6.731673240661621, -6.252037525177002, -5.772401809692383, -5.292766571044922, -4.8131303787231445, -4.333494663238525, -3.8538594245910645, -3.3742237091064453, -2.8945884704589844, -2.4149527549743652, -1.9353172779083252, -1.4556818008422852, -0.9760465621948242, -0.4964110553264618, -0.016775548458099365, 0.46285998821258545, 0.9424954652786255, 1.422131061553955, 1.9017665386199951, 2.381402015686035, 2.861037492752075, 3.3406729698181152, 3.8203084468841553, 4.299943923950195, 4.7795796394348145, 5.259215354919434, 5.7388505935668945, 6.2184858322143555, 6.698121547698975, 7.177757263183594, 7.657392501831055, 8.137027740478516, 8.616663932800293, 9.096299171447754, 9.575934410095215, 10.055570602416992, 10.535205841064453, 11.014841079711914, 11.494477272033691, 11.974112510681152, 12.453747749328613, 12.93338394165039, 13.413019180297852, 13.892654418945312, 14.372289657592773]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 11.0, 10.0, 10.0, 17.0, 18.0, 19.0, 30.0, 25.0, 25.0, 26.0, 27.0, 33.0, 31.0, 45.0, 35.0, 39.0, 40.0, 42.0, 44.0, 33.0, 43.0, 39.0, 29.0, 29.0, 28.0, 31.0, 31.0, 30.0, 20.0, 21.0, 17.0, 20.0, 16.0, 18.0, 10.0, 14.0, 5.0, 5.0, 6.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.885758399963379, -10.55757999420166, -10.229402542114258, -9.901224136352539, -9.57304573059082, -9.244867324829102, -8.9166898727417, -8.58851146697998, -8.260334014892578, -7.932156085968018, -7.603977680206299, -7.275799751281738, -6.9476213455200195, -6.619443416595459, -6.291265487670898, -5.96308708190918, -5.634908676147461, -5.3067307472229, -4.978552341461182, -4.650374412536621, -4.322196006774902, -3.994018077850342, -3.6658401489257812, -3.3376619815826416, -3.009483814239502, -2.6813056468963623, -2.3531274795532227, -2.024949550628662, -1.6967713832855225, -1.3685932159423828, -1.0404151678085327, -0.7122371196746826, -0.38405799865722656, -0.05587989091873169, 0.2722982168197632, 0.6004763245582581, 0.9286544322967529, 1.2568325996398926, 1.5850106477737427, 1.9131886959075928, 2.2413668632507324, 2.569545030593872, 2.8977231979370117, 3.2259011268615723, 3.554079294204712, 3.8822574615478516, 4.210435390472412, 4.538613319396973, 4.866791725158691, 5.194969654083252, 5.523148059844971, 5.851325988769531, 6.17950439453125, 6.5076823234558105, 6.835860252380371, 7.16403865814209, 7.49221658706665, 7.820394515991211, 8.14857292175293, 8.476751327514648, 8.80492877960205, 9.13310718536377, 9.461285591125488, 9.78946304321289, 10.11764144897461]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 4.0, 6.0, 8.0, 18.0, 19.0, 32.0, 46.0, 74.0, 104.0, 194.0, 322.0, 481.0, 627.0, 1050.0, 1690.0, 2635.0, 4246.0, 6602.0, 10457.0, 16936.0, 27234.0, 44491.0, 72332.0, 117970.0, 190899.0, 299182.0, 442164.0, 579241.0, 636789.0, 565708.0, 422254.0, 282220.0, 180656.0, 110414.0, 67984.0, 41482.0, 25629.0, 15686.0, 9874.0, 6103.0, 3826.0, 2406.0, 1533.0, 919.0, 655.0, 397.0, 267.0, 164.0, 90.0, 63.0, 37.0, 30.0, 24.0, 12.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.2265625, -8.942138671875, -8.65771484375, -8.373291015625, -8.0888671875, -7.804443359375, -7.52001953125, -7.235595703125, -6.951171875, -6.666748046875, -6.38232421875, -6.097900390625, -5.8134765625, -5.529052734375, -5.24462890625, -4.960205078125, -4.67578125, -4.391357421875, -4.10693359375, -3.822509765625, -3.5380859375, -3.253662109375, -2.96923828125, -2.684814453125, -2.400390625, -2.115966796875, -1.83154296875, -1.547119140625, -1.2626953125, -0.978271484375, -0.69384765625, -0.409423828125, -0.125, 0.159423828125, 0.44384765625, 0.728271484375, 1.0126953125, 1.297119140625, 1.58154296875, 1.865966796875, 2.150390625, 2.434814453125, 2.71923828125, 3.003662109375, 3.2880859375, 3.572509765625, 3.85693359375, 4.141357421875, 4.42578125, 4.710205078125, 4.99462890625, 5.279052734375, 5.5634765625, 5.847900390625, 6.13232421875, 6.416748046875, 6.701171875, 6.985595703125, 7.27001953125, 7.554443359375, 7.8388671875, 8.123291015625, 8.40771484375, 8.692138671875, 8.9765625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 7.0, 8.0, 16.0, 13.0, 20.0, 19.0, 13.0, 22.0, 37.0, 48.0, 30.0, 30.0, 39.0, 41.0, 43.0, 44.0, 53.0, 47.0, 46.0, 45.0, 36.0, 46.0, 38.0, 31.0, 39.0, 31.0, 17.0, 25.0, 21.0, 16.0, 14.0, 20.0, 14.0, 8.0, 4.0, 2.0, 8.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.046875, -7.79791259765625, -7.5489501953125, -7.29998779296875, -7.051025390625, -6.80206298828125, -6.5531005859375, -6.30413818359375, -6.05517578125, -5.80621337890625, -5.5572509765625, -5.30828857421875, -5.059326171875, -4.81036376953125, -4.5614013671875, -4.31243896484375, -4.0634765625, -3.81451416015625, -3.5655517578125, -3.31658935546875, -3.067626953125, -2.81866455078125, -2.5697021484375, -2.32073974609375, -2.07177734375, -1.82281494140625, -1.5738525390625, -1.32489013671875, -1.075927734375, -0.82696533203125, -0.5780029296875, -0.32904052734375, -0.080078125, 0.16888427734375, 0.4178466796875, 0.66680908203125, 0.915771484375, 1.16473388671875, 1.4136962890625, 1.66265869140625, 1.91162109375, 2.16058349609375, 2.4095458984375, 2.65850830078125, 2.907470703125, 3.15643310546875, 3.4053955078125, 3.65435791015625, 3.9033203125, 4.15228271484375, 4.4012451171875, 4.65020751953125, 4.899169921875, 5.14813232421875, 5.3970947265625, 5.64605712890625, 5.89501953125, 6.14398193359375, 6.3929443359375, 6.64190673828125, 6.890869140625, 7.13983154296875, 7.3887939453125, 7.63775634765625, 7.88671875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 9.0, 20.0, 19.0, 37.0, 61.0, 120.0, 163.0, 265.0, 429.0, 714.0, 1125.0, 1791.0, 2964.0, 4925.0, 8310.0, 14342.0, 23668.0, 40800.0, 69050.0, 115130.0, 187993.0, 294698.0, 427810.0, 555153.0, 614901.0, 567101.0, 445722.0, 310378.0, 201087.0, 124018.0, 74215.0, 44051.0, 25749.0, 15144.0, 8896.0, 5124.0, 3226.0, 2001.0, 1184.0, 650.0, 475.0, 286.0, 197.0, 120.0, 73.0, 38.0, 16.0, 17.0, 6.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.84375, -8.5635986328125, -8.283447265625, -8.0032958984375, -7.72314453125, -7.4429931640625, -7.162841796875, -6.8826904296875, -6.6025390625, -6.3223876953125, -6.042236328125, -5.7620849609375, -5.48193359375, -5.2017822265625, -4.921630859375, -4.6414794921875, -4.361328125, -4.0811767578125, -3.801025390625, -3.5208740234375, -3.24072265625, -2.9605712890625, -2.680419921875, -2.4002685546875, -2.1201171875, -1.8399658203125, -1.559814453125, -1.2796630859375, -0.99951171875, -0.7193603515625, -0.439208984375, -0.1590576171875, 0.12109375, 0.4012451171875, 0.681396484375, 0.9615478515625, 1.24169921875, 1.5218505859375, 1.802001953125, 2.0821533203125, 2.3623046875, 2.6424560546875, 2.922607421875, 3.2027587890625, 3.48291015625, 3.7630615234375, 4.043212890625, 4.3233642578125, 4.603515625, 4.8836669921875, 5.163818359375, 5.4439697265625, 5.72412109375, 6.0042724609375, 6.284423828125, 6.5645751953125, 6.8447265625, 7.1248779296875, 7.405029296875, 7.6851806640625, 7.96533203125, 8.2454833984375, 8.525634765625, 8.8057861328125, 9.0859375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 13.0, 20.0, 17.0, 34.0, 44.0, 45.0, 67.0, 89.0, 119.0, 128.0, 110.0, 159.0, 193.0, 208.0, 238.0, 267.0, 264.0, 263.0, 229.0, 232.0, 183.0, 193.0, 185.0, 131.0, 129.0, 107.0, 81.0, 73.0, 56.0, 47.0, 43.0, 29.0, 24.0, 13.0, 10.0, 4.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.09442138671875, -3.9622802734375, -3.83013916015625, -3.697998046875, -3.56585693359375, -3.4337158203125, -3.30157470703125, -3.16943359375, -3.03729248046875, -2.9051513671875, -2.77301025390625, -2.640869140625, -2.50872802734375, -2.3765869140625, -2.24444580078125, -2.1123046875, -1.98016357421875, -1.8480224609375, -1.71588134765625, -1.583740234375, -1.45159912109375, -1.3194580078125, -1.18731689453125, -1.05517578125, -0.92303466796875, -0.7908935546875, -0.65875244140625, -0.526611328125, -0.39447021484375, -0.2623291015625, -0.13018798828125, 0.001953125, 0.13409423828125, 0.2662353515625, 0.39837646484375, 0.530517578125, 0.66265869140625, 0.7947998046875, 0.92694091796875, 1.05908203125, 1.19122314453125, 1.3233642578125, 1.45550537109375, 1.587646484375, 1.71978759765625, 1.8519287109375, 1.98406982421875, 2.1162109375, 2.24835205078125, 2.3804931640625, 2.51263427734375, 2.644775390625, 2.77691650390625, 2.9090576171875, 3.04119873046875, 3.17333984375, 3.30548095703125, 3.4376220703125, 3.56976318359375, 3.701904296875, 3.83404541015625, 3.9661865234375, 4.09832763671875, 4.23046875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 8.0, 6.0, 5.0, 8.0, 5.0, 11.0, 19.0, 16.0, 23.0, 28.0, 31.0, 41.0, 52.0, 67.0, 76.0, 71.0, 90.0, 77.0, 62.0, 69.0, 35.0, 42.0, 39.0, 26.0, 15.0, 18.0, 12.0, 13.0, 7.0, 6.0, 12.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.437036514282227, -13.960897445678711, -13.484758377075195, -13.00861930847168, -12.532480239868164, -12.056341171264648, -11.580202102661133, -11.104063987731934, -10.627924919128418, -10.151785850524902, -9.675646781921387, -9.199507713317871, -8.723368644714355, -8.247230529785156, -7.771090984344482, -7.294952392578125, -6.818812847137451, -6.3426737785339355, -5.86653470993042, -5.3903961181640625, -4.914257049560547, -4.438117980957031, -3.9619789123535156, -3.485840082168579, -3.0097010135650635, -2.533561944961548, -2.0574231147766113, -1.5812840461730957, -1.1051450967788696, -0.6290061473846436, -0.15286707878112793, 0.3232717514038086, 0.7994108200073242, 1.2755497694015503, 1.7516887187957764, 2.227827787399292, 2.7039666175842285, 3.180105686187744, 3.6562447547912598, 4.132383346557617, 4.608522415161133, 5.084661483764648, 5.560800552368164, 6.03693962097168, 6.513078212738037, 6.989217281341553, 7.465356349945068, 7.941494941711426, 8.417634963989258, 8.893774032592773, 9.369913101196289, 9.846052169799805, 10.32219123840332, 10.798330307006836, 11.274469375610352, 11.75060749053955, 12.226746559143066, 12.702885627746582, 13.179024696350098, 13.655163764953613, 14.131302833557129, 14.607440948486328, 15.083580017089844, 15.55971908569336, 16.035858154296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 7.0, 4.0, 7.0, 12.0, 17.0, 8.0, 17.0, 13.0, 24.0, 23.0, 24.0, 25.0, 21.0, 25.0, 34.0, 28.0, 40.0, 40.0, 33.0, 42.0, 39.0, 43.0, 34.0, 42.0, 27.0, 30.0, 30.0, 33.0, 26.0, 39.0, 22.0, 36.0, 21.0, 25.0, 17.0, 12.0, 12.0, 11.0, 13.0, 8.0, 10.0, 5.0, 2.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.54083776473999, -7.280722141265869, -7.02060604095459, -6.760490417480469, -6.500374794006348, -6.240258693695068, -5.980143070220947, -5.720026969909668, -5.459911346435547, -5.199795722961426, -4.9396796226501465, -4.679563999176025, -4.419447898864746, -4.159332275390625, -3.899216651916504, -3.6391007900238037, -3.3789849281311035, -3.1188690662384033, -2.858753204345703, -2.598637580871582, -2.338521718978882, -2.0784058570861816, -1.818290114402771, -1.5581743717193604, -1.2980585098266602, -1.03794264793396, -0.7778269052505493, -0.5177111029624939, -0.2575953006744385, 0.0025205612182617188, 0.26263630390167236, 0.522752046585083, 0.782867431640625, 1.0429832935333252, 1.3030990362167358, 1.5632147789001465, 1.8233306407928467, 2.083446502685547, 2.343562126159668, 2.603677988052368, 2.8637938499450684, 3.1239097118377686, 3.3840255737304688, 3.64414119720459, 3.90425705909729, 4.16437292098999, 4.424488544464111, 4.684604644775391, 4.944720268249512, 5.204835891723633, 5.464951992034912, 5.725067615509033, 5.9851837158203125, 6.245299339294434, 6.505414962768555, 6.765530586242676, 7.025646686553955, 7.285762310028076, 7.5458784103393555, 7.805994033813477, 8.066109657287598, 8.326225280761719, 8.586341857910156, 8.846457481384277, 9.106573104858398]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 6.0, 12.0, 10.0, 22.0, 26.0, 29.0, 32.0, 49.0, 72.0, 93.0, 110.0, 178.0, 274.0, 408.0, 615.0, 926.0, 1585.0, 3169.0, 9818.0, 63880.0, 482637.0, 417448.0, 51511.0, 8485.0, 2862.0, 1550.0, 893.0, 586.0, 360.0, 258.0, 169.0, 109.0, 70.0, 62.0, 64.0, 43.0, 22.0, 24.0, 19.0, 20.0, 10.0, 7.0, 6.0, 1.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.1619873046875, -9.784912109375, -9.4078369140625, -9.03076171875, -8.6536865234375, -8.276611328125, -7.8995361328125, -7.5224609375, -7.1453857421875, -6.768310546875, -6.3912353515625, -6.01416015625, -5.6370849609375, -5.260009765625, -4.8829345703125, -4.505859375, -4.1287841796875, -3.751708984375, -3.3746337890625, -2.99755859375, -2.6204833984375, -2.243408203125, -1.8663330078125, -1.4892578125, -1.1121826171875, -0.735107421875, -0.3580322265625, 0.01904296875, 0.3961181640625, 0.773193359375, 1.1502685546875, 1.52734375, 1.9044189453125, 2.281494140625, 2.6585693359375, 3.03564453125, 3.4127197265625, 3.789794921875, 4.1668701171875, 4.5439453125, 4.9210205078125, 5.298095703125, 5.6751708984375, 6.05224609375, 6.4293212890625, 6.806396484375, 7.1834716796875, 7.560546875, 7.9376220703125, 8.314697265625, 8.6917724609375, 9.06884765625, 9.4459228515625, 9.822998046875, 10.2000732421875, 10.5771484375, 10.9542236328125, 11.331298828125, 11.7083740234375, 12.08544921875, 12.4625244140625, 12.839599609375, 13.2166748046875, 13.59375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 6.0, 5.0, 8.0, 14.0, 16.0, 16.0, 12.0, 21.0, 20.0, 20.0, 30.0, 30.0, 31.0, 41.0, 29.0, 25.0, 40.0, 56.0, 50.0, 40.0, 41.0, 38.0, 26.0, 41.0, 35.0, 37.0, 32.0, 26.0, 29.0, 27.0, 23.0, 16.0, 23.0, 22.0, 18.0, 15.0, 6.0, 7.0, 6.0, 0.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3671875, -9.0716552734375, -8.776123046875, -8.4805908203125, -8.18505859375, -7.8895263671875, -7.593994140625, -7.2984619140625, -7.0029296875, -6.7073974609375, -6.411865234375, -6.1163330078125, -5.82080078125, -5.5252685546875, -5.229736328125, -4.9342041015625, -4.638671875, -4.3431396484375, -4.047607421875, -3.7520751953125, -3.45654296875, -3.1610107421875, -2.865478515625, -2.5699462890625, -2.2744140625, -1.9788818359375, -1.683349609375, -1.3878173828125, -1.09228515625, -0.7967529296875, -0.501220703125, -0.2056884765625, 0.08984375, 0.3853759765625, 0.680908203125, 0.9764404296875, 1.27197265625, 1.5675048828125, 1.863037109375, 2.1585693359375, 2.4541015625, 2.7496337890625, 3.045166015625, 3.3406982421875, 3.63623046875, 3.9317626953125, 4.227294921875, 4.5228271484375, 4.818359375, 5.1138916015625, 5.409423828125, 5.7049560546875, 6.00048828125, 6.2960205078125, 6.591552734375, 6.8870849609375, 7.1826171875, 7.4781494140625, 7.773681640625, 8.0692138671875, 8.36474609375, 8.6602783203125, 8.955810546875, 9.2513427734375, 9.546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 16.0, 18.0, 26.0, 39.0, 47.0, 61.0, 83.0, 123.0, 152.0, 223.0, 381.0, 701.0, 1539.0, 4127.0, 15843.0, 88146.0, 475032.0, 380422.0, 62995.0, 11998.0, 3451.0, 1327.0, 634.0, 334.0, 219.0, 139.0, 127.0, 81.0, 53.0, 42.0, 37.0, 26.0, 23.0, 10.0, 14.0, 10.0, 11.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.6484375, -9.3460693359375, -9.043701171875, -8.7413330078125, -8.43896484375, -8.1365966796875, -7.834228515625, -7.5318603515625, -7.2294921875, -6.9271240234375, -6.624755859375, -6.3223876953125, -6.02001953125, -5.7176513671875, -5.415283203125, -5.1129150390625, -4.810546875, -4.5081787109375, -4.205810546875, -3.9034423828125, -3.60107421875, -3.2987060546875, -2.996337890625, -2.6939697265625, -2.3916015625, -2.0892333984375, -1.786865234375, -1.4844970703125, -1.18212890625, -0.8797607421875, -0.577392578125, -0.2750244140625, 0.02734375, 0.3297119140625, 0.632080078125, 0.9344482421875, 1.23681640625, 1.5391845703125, 1.841552734375, 2.1439208984375, 2.4462890625, 2.7486572265625, 3.051025390625, 3.3533935546875, 3.65576171875, 3.9581298828125, 4.260498046875, 4.5628662109375, 4.865234375, 5.1676025390625, 5.469970703125, 5.7723388671875, 6.07470703125, 6.3770751953125, 6.679443359375, 6.9818115234375, 7.2841796875, 7.5865478515625, 7.888916015625, 8.1912841796875, 8.49365234375, 8.7960205078125, 9.098388671875, 9.4007568359375, 9.703125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 13.0, 10.0, 16.0, 11.0, 18.0, 16.0, 23.0, 28.0, 31.0, 29.0, 35.0, 28.0, 45.0, 38.0, 44.0, 50.0, 51.0, 59.0, 37.0, 56.0, 30.0, 43.0, 29.0, 27.0, 37.0, 28.0, 34.0, 26.0, 19.0, 11.0, 19.0, 9.0, 6.0, 9.0, 10.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.59375, -7.3873291015625, -7.180908203125, -6.9744873046875, -6.76806640625, -6.5616455078125, -6.355224609375, -6.1488037109375, -5.9423828125, -5.7359619140625, -5.529541015625, -5.3231201171875, -5.11669921875, -4.9102783203125, -4.703857421875, -4.4974365234375, -4.291015625, -4.0845947265625, -3.878173828125, -3.6717529296875, -3.46533203125, -3.2589111328125, -3.052490234375, -2.8460693359375, -2.6396484375, -2.4332275390625, -2.226806640625, -2.0203857421875, -1.81396484375, -1.6075439453125, -1.401123046875, -1.1947021484375, -0.98828125, -0.7818603515625, -0.575439453125, -0.3690185546875, -0.16259765625, 0.0438232421875, 0.250244140625, 0.4566650390625, 0.6630859375, 0.8695068359375, 1.075927734375, 1.2823486328125, 1.48876953125, 1.6951904296875, 1.901611328125, 2.1080322265625, 2.314453125, 2.5208740234375, 2.727294921875, 2.9337158203125, 3.14013671875, 3.3465576171875, 3.552978515625, 3.7593994140625, 3.9658203125, 4.1722412109375, 4.378662109375, 4.5850830078125, 4.79150390625, 4.9979248046875, 5.204345703125, 5.4107666015625, 5.6171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 9.0, 14.0, 18.0, 17.0, 17.0, 29.0, 44.0, 59.0, 101.0, 118.0, 220.0, 342.0, 534.0, 867.0, 1560.0, 2819.0, 5723.0, 13919.0, 40827.0, 147643.0, 437885.0, 280495.0, 74799.0, 22772.0, 8697.0, 4051.0, 1986.0, 1106.0, 694.0, 416.0, 242.0, 168.0, 115.0, 72.0, 44.0, 41.0, 25.0, 13.0, 17.0, 13.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5302734375, -1.480499267578125, -1.43072509765625, -1.380950927734375, -1.3311767578125, -1.281402587890625, -1.23162841796875, -1.181854248046875, -1.132080078125, -1.082305908203125, -1.03253173828125, -0.982757568359375, -0.9329833984375, -0.883209228515625, -0.83343505859375, -0.783660888671875, -0.73388671875, -0.684112548828125, -0.63433837890625, -0.584564208984375, -0.5347900390625, -0.485015869140625, -0.43524169921875, -0.385467529296875, -0.335693359375, -0.285919189453125, -0.23614501953125, -0.186370849609375, -0.1365966796875, -0.086822509765625, -0.03704833984375, 0.012725830078125, 0.0625, 0.112274169921875, 0.16204833984375, 0.211822509765625, 0.2615966796875, 0.311370849609375, 0.36114501953125, 0.410919189453125, 0.460693359375, 0.510467529296875, 0.56024169921875, 0.610015869140625, 0.6597900390625, 0.709564208984375, 0.75933837890625, 0.809112548828125, 0.85888671875, 0.908660888671875, 0.95843505859375, 1.008209228515625, 1.0579833984375, 1.107757568359375, 1.15753173828125, 1.207305908203125, 1.257080078125, 1.306854248046875, 1.35662841796875, 1.406402587890625, 1.4561767578125, 1.505950927734375, 1.55572509765625, 1.605499267578125, 1.6552734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 7.0, 13.0, 30.0, 66.0, 117.0, 180.0, 186.0, 141.0, 112.0, 66.0, 34.0, 18.0, 10.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001456737518310547, -0.0001413356512784958, -0.0001369975507259369, -0.000132659450173378, -0.0001283213496208191, -0.0001239832490682602, -0.0001196451485157013, -0.0001153070479631424, -0.0001109689474105835, -0.0001066308468580246, -0.0001022927463054657, -9.79546457529068e-05, -9.36165452003479e-05, -8.9278444647789e-05, -8.49403440952301e-05, -8.06022435426712e-05, -7.62641429901123e-05, -7.19260424375534e-05, -6.758794188499451e-05, -6.324984133243561e-05, -5.891174077987671e-05, -5.457364022731781e-05, -5.023553967475891e-05, -4.589743912220001e-05, -4.155933856964111e-05, -3.7221238017082214e-05, -3.2883137464523315e-05, -2.8545036911964417e-05, -2.4206936359405518e-05, -1.986883580684662e-05, -1.553073525428772e-05, -1.119263470172882e-05, -6.854534149169922e-06, -2.516433596611023e-06, 1.821666955947876e-06, 6.159767508506775e-06, 1.0497868061065674e-05, 1.4835968613624573e-05, 1.917406916618347e-05, 2.351216971874237e-05, 2.785027027130127e-05, 3.218837082386017e-05, 3.652647137641907e-05, 4.0864571928977966e-05, 4.5202672481536865e-05, 4.9540773034095764e-05, 5.387887358665466e-05, 5.821697413921356e-05, 6.255507469177246e-05, 6.689317524433136e-05, 7.123127579689026e-05, 7.556937634944916e-05, 7.990747690200806e-05, 8.424557745456696e-05, 8.858367800712585e-05, 9.292177855968475e-05, 9.725987911224365e-05, 0.00010159797966480255, 0.00010593608021736145, 0.00011027418076992035, 0.00011461228132247925, 0.00011895038187503815, 0.00012328848242759705, 0.00012762658298015594, 0.00013196468353271484]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 7.0, 5.0, 3.0, 8.0, 9.0, 13.0, 19.0, 20.0, 36.0, 35.0, 52.0, 79.0, 135.0, 147.0, 171.0, 224.0, 293.0, 349.0, 439.0, 637.0, 917.0, 1374.0, 1932.0, 3095.0, 5684.0, 11446.0, 26589.0, 75840.0, 261454.0, 418680.0, 153186.0, 46522.0, 18081.0, 8337.0, 4320.0, 2579.0, 1558.0, 1105.0, 813.0, 543.0, 428.0, 336.0, 232.0, 168.0, 118.0, 108.0, 95.0, 73.0, 70.0, 42.0, 44.0, 32.0, 20.0, 15.0, 15.0, 11.0, 14.0, 4.0, 2.0, 3.0], "bins": [-2.013671875, -1.9531707763671875, -1.892669677734375, -1.8321685791015625, -1.77166748046875, -1.7111663818359375, -1.650665283203125, -1.5901641845703125, -1.5296630859375, -1.4691619873046875, -1.408660888671875, -1.3481597900390625, -1.28765869140625, -1.2271575927734375, -1.166656494140625, -1.1061553955078125, -1.045654296875, -0.9851531982421875, -0.924652099609375, -0.8641510009765625, -0.80364990234375, -0.7431488037109375, -0.682647705078125, -0.6221466064453125, -0.5616455078125, -0.5011444091796875, -0.440643310546875, -0.3801422119140625, -0.31964111328125, -0.2591400146484375, -0.198638916015625, -0.1381378173828125, -0.07763671875, -0.0171356201171875, 0.043365478515625, 0.1038665771484375, 0.16436767578125, 0.2248687744140625, 0.285369873046875, 0.3458709716796875, 0.4063720703125, 0.4668731689453125, 0.527374267578125, 0.5878753662109375, 0.64837646484375, 0.7088775634765625, 0.769378662109375, 0.8298797607421875, 0.890380859375, 0.9508819580078125, 1.011383056640625, 1.0718841552734375, 1.13238525390625, 1.1928863525390625, 1.253387451171875, 1.3138885498046875, 1.3743896484375, 1.4348907470703125, 1.495391845703125, 1.5558929443359375, 1.61639404296875, 1.6768951416015625, 1.737396240234375, 1.7978973388671875, 1.8583984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 4.0, 1.0, 4.0, 9.0, 10.0, 8.0, 8.0, 12.0, 7.0, 13.0, 10.0, 16.0, 25.0, 29.0, 27.0, 43.0, 54.0, 46.0, 41.0, 57.0, 68.0, 82.0, 62.0, 59.0, 49.0, 43.0, 30.0, 31.0, 21.0, 23.0, 20.0, 17.0, 12.0, 5.0, 11.0, 9.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.42138671875, -0.4091072082519531, -0.39682769775390625, -0.3845481872558594, -0.3722686767578125, -0.3599891662597656, -0.34770965576171875, -0.3354301452636719, -0.323150634765625, -0.3108711242675781, -0.29859161376953125, -0.2863121032714844, -0.2740325927734375, -0.2617530822753906, -0.24947357177734375, -0.23719406127929688, -0.22491455078125, -0.21263504028320312, -0.20035552978515625, -0.18807601928710938, -0.1757965087890625, -0.16351699829101562, -0.15123748779296875, -0.13895797729492188, -0.126678466796875, -0.11439895629882812, -0.10211944580078125, -0.08983993530273438, -0.0775604248046875, -0.06528091430664062, -0.05300140380859375, -0.040721893310546875, -0.0284423828125, -0.016162872314453125, -0.00388336181640625, 0.008396148681640625, 0.0206756591796875, 0.032955169677734375, 0.04523468017578125, 0.057514190673828125, 0.069793701171875, 0.08207321166992188, 0.09435272216796875, 0.10663223266601562, 0.1189117431640625, 0.13119125366210938, 0.14347076416015625, 0.15575027465820312, 0.16802978515625, 0.18030929565429688, 0.19258880615234375, 0.20486831665039062, 0.2171478271484375, 0.22942733764648438, 0.24170684814453125, 0.2539863586425781, 0.266265869140625, 0.2785453796386719, 0.29082489013671875, 0.3031044006347656, 0.3153839111328125, 0.3276634216308594, 0.33994293212890625, 0.3522224426269531, 0.364501953125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 11.0, 5.0, 6.0, 4.0, 7.0, 15.0, 18.0, 17.0, 27.0, 31.0, 33.0, 51.0, 52.0, 67.0, 77.0, 73.0, 78.0, 89.0, 58.0, 60.0, 38.0, 41.0, 24.0, 29.0, 16.0, 16.0, 13.0, 11.0, 4.0, 6.0, 9.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.17252254486084, -13.698163986206055, -13.223804473876953, -12.749445915222168, -12.275087356567383, -11.800727844238281, -11.326369285583496, -10.852010726928711, -10.37765121459961, -9.903292655944824, -9.428933143615723, -8.954574584960938, -8.480216026306152, -8.005857467651367, -7.531497955322266, -7.0571393966674805, -6.582780838012695, -6.108421802520752, -5.634063243865967, -5.159704208374023, -4.685345649719238, -4.210986614227295, -3.7366275787353516, -3.2622687816619873, -2.787909984588623, -2.313551187515259, -1.839192271232605, -1.3648333549499512, -0.8904745578765869, -0.41611576080322266, 0.0582432746887207, 0.532602071762085, 1.0069618225097656, 1.4813206195831299, 1.9556795358657837, 2.4300384521484375, 2.9043972492218018, 3.378756046295166, 3.8531150817871094, 4.3274736404418945, 4.801832675933838, 5.276191711425781, 5.750550270080566, 6.22490930557251, 6.699268341064453, 7.173626899719238, 7.647985935211182, 8.122344970703125, 8.59670352935791, 9.071062088012695, 9.545421600341797, 10.019780158996582, 10.494138717651367, 10.968498229980469, 11.442856788635254, 11.917215347290039, 12.39157485961914, 12.865933418273926, 13.340292930603027, 13.814651489257812, 14.289010047912598, 14.763368606567383, 15.237728118896484, 15.71208667755127, 16.186445236206055]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 5.0, 6.0, 14.0, 19.0, 4.0, 21.0, 14.0, 18.0, 24.0, 23.0, 28.0, 19.0, 27.0, 31.0, 34.0, 34.0, 40.0, 33.0, 42.0, 46.0, 31.0, 37.0, 42.0, 29.0, 32.0, 27.0, 34.0, 28.0, 31.0, 28.0, 37.0, 19.0, 22.0, 18.0, 15.0, 10.0, 15.0, 12.0, 8.0, 9.0, 6.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.589195728302002, -7.3310770988464355, -7.072958946228027, -6.814840316772461, -6.5567216873168945, -6.298603057861328, -6.040484428405762, -5.7823662757873535, -5.524247646331787, -5.266129016876221, -5.0080108642578125, -4.749892234802246, -4.49177360534668, -4.233654975891113, -3.975536584854126, -3.7174181938171387, -3.4592995643615723, -3.201180934906006, -2.9430625438690186, -2.6849441528320312, -2.426825523376465, -2.1687068939208984, -1.9105885028839111, -1.6524699926376343, -1.3943514823913574, -1.1362329721450806, -0.8781144618988037, -0.6199959516525269, -0.36187744140625, -0.10375893115997314, 0.1543595790863037, 0.41247808933258057, 0.6705961227416992, 0.9287146329879761, 1.186833143234253, 1.4449516534805298, 1.7030701637268066, 1.9611886739730835, 2.2193071842193604, 2.4774255752563477, 2.735544204711914, 2.9936628341674805, 3.2517812252044678, 3.509899616241455, 3.7680182456970215, 4.026136875152588, 4.284255027770996, 4.5423736572265625, 4.800492286682129, 5.058610916137695, 5.316729545593262, 5.57484769821167, 5.832966327667236, 6.091084957122803, 6.349203109741211, 6.607321739196777, 6.865440368652344, 7.12355899810791, 7.381677627563477, 7.639795780181885, 7.897914409637451, 8.15603256225586, 8.414151191711426, 8.672269821166992, 8.930388450622559]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 2.0, 9.0, 4.0, 12.0, 9.0, 19.0, 28.0, 35.0, 42.0, 67.0, 73.0, 120.0, 209.0, 298.0, 459.0, 787.0, 1379.0, 2535.0, 4685.0, 9530.0, 19036.0, 38261.0, 73986.0, 129095.0, 186818.0, 203055.0, 163264.0, 102440.0, 55237.0, 28018.0, 13829.0, 7013.0, 3489.0, 1849.0, 1079.0, 605.0, 386.0, 258.0, 175.0, 102.0, 60.0, 56.0, 33.0, 21.0, 23.0, 16.0, 13.0, 10.0, 11.0, 4.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0], "bins": [-12.3671875, -11.9840087890625, -11.600830078125, -11.2176513671875, -10.83447265625, -10.4512939453125, -10.068115234375, -9.6849365234375, -9.3017578125, -8.9185791015625, -8.535400390625, -8.1522216796875, -7.76904296875, -7.3858642578125, -7.002685546875, -6.6195068359375, -6.236328125, -5.8531494140625, -5.469970703125, -5.0867919921875, -4.70361328125, -4.3204345703125, -3.937255859375, -3.5540771484375, -3.1708984375, -2.7877197265625, -2.404541015625, -2.0213623046875, -1.63818359375, -1.2550048828125, -0.871826171875, -0.4886474609375, -0.10546875, 0.2777099609375, 0.660888671875, 1.0440673828125, 1.42724609375, 1.8104248046875, 2.193603515625, 2.5767822265625, 2.9599609375, 3.3431396484375, 3.726318359375, 4.1094970703125, 4.49267578125, 4.8758544921875, 5.259033203125, 5.6422119140625, 6.025390625, 6.4085693359375, 6.791748046875, 7.1749267578125, 7.55810546875, 7.9412841796875, 8.324462890625, 8.7076416015625, 9.0908203125, 9.4739990234375, 9.857177734375, 10.2403564453125, 10.62353515625, 11.0067138671875, 11.389892578125, 11.7730712890625, 12.15625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 5.0, 5.0, 5.0, 11.0, 11.0, 13.0, 17.0, 18.0, 21.0, 18.0, 24.0, 34.0, 30.0, 17.0, 38.0, 39.0, 34.0, 42.0, 31.0, 48.0, 33.0, 35.0, 35.0, 45.0, 36.0, 34.0, 41.0, 30.0, 26.0, 14.0, 22.0, 36.0, 23.0, 20.0, 15.0, 20.0, 16.0, 10.0, 12.0, 6.0, 7.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7109375, -8.4384765625, -8.166015625, -7.8935546875, -7.62109375, -7.3486328125, -7.076171875, -6.8037109375, -6.53125, -6.2587890625, -5.986328125, -5.7138671875, -5.44140625, -5.1689453125, -4.896484375, -4.6240234375, -4.3515625, -4.0791015625, -3.806640625, -3.5341796875, -3.26171875, -2.9892578125, -2.716796875, -2.4443359375, -2.171875, -1.8994140625, -1.626953125, -1.3544921875, -1.08203125, -0.8095703125, -0.537109375, -0.2646484375, 0.0078125, 0.2802734375, 0.552734375, 0.8251953125, 1.09765625, 1.3701171875, 1.642578125, 1.9150390625, 2.1875, 2.4599609375, 2.732421875, 3.0048828125, 3.27734375, 3.5498046875, 3.822265625, 4.0947265625, 4.3671875, 4.6396484375, 4.912109375, 5.1845703125, 5.45703125, 5.7294921875, 6.001953125, 6.2744140625, 6.546875, 6.8193359375, 7.091796875, 7.3642578125, 7.63671875, 7.9091796875, 8.181640625, 8.4541015625, 8.7265625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 9.0, 5.0, 17.0, 17.0, 22.0, 29.0, 31.0, 38.0, 55.0, 65.0, 119.0, 171.0, 263.0, 444.0, 694.0, 1358.0, 2732.0, 5299.0, 11422.0, 24024.0, 51898.0, 101416.0, 171580.0, 218714.0, 197264.0, 128876.0, 68313.0, 33106.0, 15511.0, 7341.0, 3478.0, 1784.0, 910.0, 513.0, 334.0, 196.0, 135.0, 90.0, 65.0, 54.0, 36.0, 33.0, 20.0, 25.0, 12.0, 8.0, 8.0, 5.0, 8.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-12.9140625, -12.5067138671875, -12.099365234375, -11.6920166015625, -11.28466796875, -10.8773193359375, -10.469970703125, -10.0626220703125, -9.6552734375, -9.2479248046875, -8.840576171875, -8.4332275390625, -8.02587890625, -7.6185302734375, -7.211181640625, -6.8038330078125, -6.396484375, -5.9891357421875, -5.581787109375, -5.1744384765625, -4.76708984375, -4.3597412109375, -3.952392578125, -3.5450439453125, -3.1376953125, -2.7303466796875, -2.322998046875, -1.9156494140625, -1.50830078125, -1.1009521484375, -0.693603515625, -0.2862548828125, 0.12109375, 0.5284423828125, 0.935791015625, 1.3431396484375, 1.75048828125, 2.1578369140625, 2.565185546875, 2.9725341796875, 3.3798828125, 3.7872314453125, 4.194580078125, 4.6019287109375, 5.00927734375, 5.4166259765625, 5.823974609375, 6.2313232421875, 6.638671875, 7.0460205078125, 7.453369140625, 7.8607177734375, 8.26806640625, 8.6754150390625, 9.082763671875, 9.4901123046875, 9.8974609375, 10.3048095703125, 10.712158203125, 11.1195068359375, 11.52685546875, 11.9342041015625, 12.341552734375, 12.7489013671875, 13.15625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 7.0, 6.0, 15.0, 13.0, 10.0, 10.0, 19.0, 23.0, 21.0, 31.0, 28.0, 26.0, 35.0, 33.0, 37.0, 40.0, 31.0, 44.0, 46.0, 38.0, 33.0, 41.0, 41.0, 32.0, 36.0, 26.0, 32.0, 22.0, 27.0, 27.0, 31.0, 16.0, 20.0, 14.0, 18.0, 14.0, 8.0, 9.0, 9.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.7265625, -5.55419921875, -5.3818359375, -5.20947265625, -5.037109375, -4.86474609375, -4.6923828125, -4.52001953125, -4.34765625, -4.17529296875, -4.0029296875, -3.83056640625, -3.658203125, -3.48583984375, -3.3134765625, -3.14111328125, -2.96875, -2.79638671875, -2.6240234375, -2.45166015625, -2.279296875, -2.10693359375, -1.9345703125, -1.76220703125, -1.58984375, -1.41748046875, -1.2451171875, -1.07275390625, -0.900390625, -0.72802734375, -0.5556640625, -0.38330078125, -0.2109375, -0.03857421875, 0.1337890625, 0.30615234375, 0.478515625, 0.65087890625, 0.8232421875, 0.99560546875, 1.16796875, 1.34033203125, 1.5126953125, 1.68505859375, 1.857421875, 2.02978515625, 2.2021484375, 2.37451171875, 2.546875, 2.71923828125, 2.8916015625, 3.06396484375, 3.236328125, 3.40869140625, 3.5810546875, 3.75341796875, 3.92578125, 4.09814453125, 4.2705078125, 4.44287109375, 4.615234375, 4.78759765625, 4.9599609375, 5.13232421875, 5.3046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 8.0, 3.0, 9.0, 9.0, 19.0, 26.0, 31.0, 54.0, 62.0, 101.0, 122.0, 155.0, 317.0, 589.0, 1027.0, 2156.0, 4924.0, 13435.0, 44489.0, 175972.0, 449907.0, 258795.0, 65548.0, 18590.0, 6560.0, 2713.0, 1204.0, 671.0, 399.0, 219.0, 129.0, 89.0, 68.0, 33.0, 31.0, 30.0, 16.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.328125, -16.7626953125, -16.197265625, -15.6318359375, -15.06640625, -14.5009765625, -13.935546875, -13.3701171875, -12.8046875, -12.2392578125, -11.673828125, -11.1083984375, -10.54296875, -9.9775390625, -9.412109375, -8.8466796875, -8.28125, -7.7158203125, -7.150390625, -6.5849609375, -6.01953125, -5.4541015625, -4.888671875, -4.3232421875, -3.7578125, -3.1923828125, -2.626953125, -2.0615234375, -1.49609375, -0.9306640625, -0.365234375, 0.2001953125, 0.765625, 1.3310546875, 1.896484375, 2.4619140625, 3.02734375, 3.5927734375, 4.158203125, 4.7236328125, 5.2890625, 5.8544921875, 6.419921875, 6.9853515625, 7.55078125, 8.1162109375, 8.681640625, 9.2470703125, 9.8125, 10.3779296875, 10.943359375, 11.5087890625, 12.07421875, 12.6396484375, 13.205078125, 13.7705078125, 14.3359375, 14.9013671875, 15.466796875, 16.0322265625, 16.59765625, 17.1630859375, 17.728515625, 18.2939453125, 18.859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 5.0, 7.0, 16.0, 14.0, 17.0, 21.0, 22.0, 26.0, 35.0, 42.0, 53.0, 64.0, 69.0, 66.0, 67.0, 64.0, 72.0, 63.0, 49.0, 49.0, 37.0, 40.0, 24.0, 18.0, 11.0, 13.0, 5.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0007619857788085938, -0.0007436051964759827, -0.0007252246141433716, -0.0007068440318107605, -0.0006884634494781494, -0.0006700828671455383, -0.0006517022848129272, -0.0006333217024803162, -0.0006149411201477051, -0.000596560537815094, -0.0005781799554824829, -0.0005597993731498718, -0.0005414187908172607, -0.0005230382084846497, -0.0005046576261520386, -0.0004862770438194275, -0.0004678964614868164, -0.0004495158791542053, -0.00043113529682159424, -0.00041275471448898315, -0.00039437413215637207, -0.000375993549823761, -0.0003576129674911499, -0.0003392323851585388, -0.00032085180282592773, -0.00030247122049331665, -0.00028409063816070557, -0.0002657100558280945, -0.0002473294734954834, -0.00022894889116287231, -0.00021056830883026123, -0.00019218772649765015, -0.00017380714416503906, -0.00015542656183242798, -0.0001370459794998169, -0.00011866539716720581, -0.00010028481483459473, -8.190423250198364e-05, -6.352365016937256e-05, -4.5143067836761475e-05, -2.676248550415039e-05, -8.381903171539307e-06, 9.998679161071777e-06, 2.837926149368286e-05, 4.6759843826293945e-05, 6.514042615890503e-05, 8.352100849151611e-05, 0.0001019015908241272, 0.00012028217315673828, 0.00013866275548934937, 0.00015704333782196045, 0.00017542392015457153, 0.00019380450248718262, 0.0002121850848197937, 0.00023056566715240479, 0.00024894624948501587, 0.00026732683181762695, 0.00028570741415023804, 0.0003040879964828491, 0.0003224685788154602, 0.0003408491611480713, 0.0003592297434806824, 0.00037761032581329346, 0.00039599090814590454, 0.0004143714904785156]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 14.0, 23.0, 36.0, 48.0, 70.0, 102.0, 149.0, 230.0, 322.0, 498.0, 763.0, 1119.0, 1658.0, 2459.0, 3838.0, 5874.0, 8919.0, 14137.0, 22117.0, 34600.0, 54114.0, 81142.0, 114980.0, 143969.0, 150020.0, 128508.0, 95373.0, 65286.0, 42823.0, 26700.0, 17156.0, 10758.0, 7001.0, 4787.0, 2997.0, 1903.0, 1349.0, 883.0, 567.0, 411.0, 261.0, 190.0, 117.0, 89.0, 63.0, 34.0, 29.0, 18.0, 12.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0], "bins": [-5.5859375, -5.41778564453125, -5.2496337890625, -5.08148193359375, -4.913330078125, -4.74517822265625, -4.5770263671875, -4.40887451171875, -4.24072265625, -4.07257080078125, -3.9044189453125, -3.73626708984375, -3.568115234375, -3.39996337890625, -3.2318115234375, -3.06365966796875, -2.8955078125, -2.72735595703125, -2.5592041015625, -2.39105224609375, -2.222900390625, -2.05474853515625, -1.8865966796875, -1.71844482421875, -1.55029296875, -1.38214111328125, -1.2139892578125, -1.04583740234375, -0.877685546875, -0.70953369140625, -0.5413818359375, -0.37322998046875, -0.205078125, -0.03692626953125, 0.1312255859375, 0.29937744140625, 0.467529296875, 0.63568115234375, 0.8038330078125, 0.97198486328125, 1.14013671875, 1.30828857421875, 1.4764404296875, 1.64459228515625, 1.812744140625, 1.98089599609375, 2.1490478515625, 2.31719970703125, 2.4853515625, 2.65350341796875, 2.8216552734375, 2.98980712890625, 3.157958984375, 3.32611083984375, 3.4942626953125, 3.66241455078125, 3.83056640625, 3.99871826171875, 4.1668701171875, 4.33502197265625, 4.503173828125, 4.67132568359375, 4.8394775390625, 5.00762939453125, 5.17578125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 7.0, 15.0, 6.0, 11.0, 17.0, 15.0, 18.0, 19.0, 26.0, 29.0, 43.0, 47.0, 39.0, 46.0, 39.0, 63.0, 56.0, 48.0, 55.0, 50.0, 28.0, 46.0, 39.0, 29.0, 25.0, 20.0, 22.0, 19.0, 15.0, 15.0, 18.0, 9.0, 8.0, 7.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.8076171875, -1.748809814453125, -1.69000244140625, -1.631195068359375, -1.5723876953125, -1.513580322265625, -1.45477294921875, -1.395965576171875, -1.337158203125, -1.278350830078125, -1.21954345703125, -1.160736083984375, -1.1019287109375, -1.043121337890625, -0.98431396484375, -0.925506591796875, -0.86669921875, -0.807891845703125, -0.74908447265625, -0.690277099609375, -0.6314697265625, -0.572662353515625, -0.51385498046875, -0.455047607421875, -0.396240234375, -0.337432861328125, -0.27862548828125, -0.219818115234375, -0.1610107421875, -0.102203369140625, -0.04339599609375, 0.015411376953125, 0.07421875, 0.133026123046875, 0.19183349609375, 0.250640869140625, 0.3094482421875, 0.368255615234375, 0.42706298828125, 0.485870361328125, 0.544677734375, 0.603485107421875, 0.66229248046875, 0.721099853515625, 0.7799072265625, 0.838714599609375, 0.89752197265625, 0.956329345703125, 1.01513671875, 1.073944091796875, 1.13275146484375, 1.191558837890625, 1.2503662109375, 1.309173583984375, 1.36798095703125, 1.426788330078125, 1.485595703125, 1.544403076171875, 1.60321044921875, 1.662017822265625, 1.7208251953125, 1.779632568359375, 1.83843994140625, 1.897247314453125, 1.9560546875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 2.0, 7.0, 6.0, 6.0, 5.0, 8.0, 12.0, 20.0, 19.0, 16.0, 35.0, 36.0, 48.0, 56.0, 80.0, 72.0, 71.0, 77.0, 72.0, 72.0, 46.0, 47.0, 39.0, 37.0, 22.0, 10.0, 24.0, 13.0, 10.0, 6.0, 8.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.887171745300293, -15.402544975280762, -14.917919158935547, -14.433292388916016, -13.9486665725708, -13.46403980255127, -12.979413986206055, -12.494787216186523, -12.010160446166992, -11.525533676147461, -11.040907859802246, -10.556281089782715, -10.0716552734375, -9.587028503417969, -9.102401733398438, -8.617775917053223, -8.133150100708008, -7.648523807525635, -7.163897514343262, -6.6792707443237305, -6.194644451141357, -5.710018157958984, -5.225391864776611, -4.740765571594238, -4.256138801574707, -3.771512508392334, -3.286885976791382, -2.802259683609009, -2.3176331520080566, -1.8330068588256836, -1.3483805656433105, -0.8637540340423584, -0.37912750244140625, 0.10549888014793396, 0.5901252627372742, 1.074751615524292, 1.5593780279159546, 2.044004440307617, 2.5286307334899902, 3.0132572650909424, 3.4978835582733154, 3.9825098514556885, 4.467136383056641, 4.951762676239014, 5.436388969421387, 5.921015739440918, 6.405641555786133, 6.890268325805664, 7.374894618988037, 7.85952091217041, 8.344147682189941, 8.828773498535156, 9.313400268554688, 9.798027038574219, 10.282652854919434, 10.767279624938965, 11.25190544128418, 11.736532211303711, 12.221158027648926, 12.705784797668457, 13.190410614013672, 13.675037384033203, 14.159664154052734, 14.64428997039795, 15.12891674041748]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 11.0, 15.0, 14.0, 13.0, 16.0, 17.0, 26.0, 29.0, 31.0, 24.0, 26.0, 30.0, 35.0, 31.0, 48.0, 42.0, 38.0, 46.0, 46.0, 48.0, 31.0, 43.0, 39.0, 31.0, 27.0, 30.0, 30.0, 36.0, 23.0, 25.0, 16.0, 12.0, 15.0, 11.0, 10.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.606806755065918, -8.29892635345459, -7.991044998168945, -7.683164119720459, -7.375283241271973, -7.067402362823486, -6.759521484375, -6.451641082763672, -6.143759727478027, -5.835878849029541, -5.527997970581055, -5.220117092132568, -4.912236213684082, -4.604355335235596, -4.296474456787109, -3.988593816757202, -3.680713176727295, -3.3728322982788086, -3.0649514198303223, -2.757070541381836, -2.4491896629333496, -2.1413087844848633, -1.833428144454956, -1.5255472660064697, -1.2176663875579834, -0.9097855091094971, -0.6019046902656555, -0.29402387142181396, 0.013857007026672363, 0.3217378854751587, 0.6296186447143555, 0.9374995231628418, 1.2453804016113281, 1.5532612800598145, 1.8611421585083008, 2.169023036956787, 2.4769039154052734, 2.7847847938537598, 3.092665433883667, 3.4005463123321533, 3.7084271907806396, 4.016307830810547, 4.324188709259033, 4.6320695877075195, 4.939950466156006, 5.247831344604492, 5.5557122230529785, 5.863593101501465, 6.171473979949951, 6.4793548583984375, 6.787235736846924, 7.09511661529541, 7.4029974937438965, 7.710878372192383, 8.018758773803711, 8.326640129089355, 8.634520530700684, 8.942400932312012, 9.250282287597656, 9.558162689208984, 9.866044044494629, 10.173924446105957, 10.481805801391602, 10.78968620300293, 11.097567558288574]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 9.0, 5.0, 10.0, 8.0, 28.0, 39.0, 51.0, 57.0, 121.0, 150.0, 212.0, 371.0, 658.0, 967.0, 1509.0, 2311.0, 3869.0, 5930.0, 9284.0, 15177.0, 24936.0, 39939.0, 64682.0, 106368.0, 171193.0, 269825.0, 406926.0, 553110.0, 635445.0, 591285.0, 456362.0, 311277.0, 200095.0, 123679.0, 76388.0, 46735.0, 28546.0, 17395.0, 11034.0, 6847.0, 4044.0, 2613.0, 1700.0, 1087.0, 749.0, 421.0, 298.0, 204.0, 123.0, 85.0, 49.0, 33.0, 27.0, 9.0, 10.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.73828125, -7.48590087890625, -7.2335205078125, -6.98114013671875, -6.728759765625, -6.47637939453125, -6.2239990234375, -5.97161865234375, -5.71923828125, -5.46685791015625, -5.2144775390625, -4.96209716796875, -4.709716796875, -4.45733642578125, -4.2049560546875, -3.95257568359375, -3.7001953125, -3.44781494140625, -3.1954345703125, -2.94305419921875, -2.690673828125, -2.43829345703125, -2.1859130859375, -1.93353271484375, -1.68115234375, -1.42877197265625, -1.1763916015625, -0.92401123046875, -0.671630859375, -0.41925048828125, -0.1668701171875, 0.08551025390625, 0.337890625, 0.59027099609375, 0.8426513671875, 1.09503173828125, 1.347412109375, 1.59979248046875, 1.8521728515625, 2.10455322265625, 2.35693359375, 2.60931396484375, 2.8616943359375, 3.11407470703125, 3.366455078125, 3.61883544921875, 3.8712158203125, 4.12359619140625, 4.3759765625, 4.62835693359375, 4.8807373046875, 5.13311767578125, 5.385498046875, 5.63787841796875, 5.8902587890625, 6.14263916015625, 6.39501953125, 6.64739990234375, 6.8997802734375, 7.15216064453125, 7.404541015625, 7.65692138671875, 7.9093017578125, 8.16168212890625, 8.4140625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 7.0, 11.0, 18.0, 6.0, 18.0, 18.0, 20.0, 25.0, 24.0, 28.0, 27.0, 34.0, 37.0, 46.0, 37.0, 42.0, 37.0, 46.0, 46.0, 53.0, 42.0, 47.0, 40.0, 31.0, 37.0, 39.0, 28.0, 24.0, 23.0, 21.0, 17.0, 18.0, 12.0, 7.0, 5.0, 11.0, 5.0, 5.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28125, -6.0732421875, -5.865234375, -5.6572265625, -5.44921875, -5.2412109375, -5.033203125, -4.8251953125, -4.6171875, -4.4091796875, -4.201171875, -3.9931640625, -3.78515625, -3.5771484375, -3.369140625, -3.1611328125, -2.953125, -2.7451171875, -2.537109375, -2.3291015625, -2.12109375, -1.9130859375, -1.705078125, -1.4970703125, -1.2890625, -1.0810546875, -0.873046875, -0.6650390625, -0.45703125, -0.2490234375, -0.041015625, 0.1669921875, 0.375, 0.5830078125, 0.791015625, 0.9990234375, 1.20703125, 1.4150390625, 1.623046875, 1.8310546875, 2.0390625, 2.2470703125, 2.455078125, 2.6630859375, 2.87109375, 3.0791015625, 3.287109375, 3.4951171875, 3.703125, 3.9111328125, 4.119140625, 4.3271484375, 4.53515625, 4.7431640625, 4.951171875, 5.1591796875, 5.3671875, 5.5751953125, 5.783203125, 5.9912109375, 6.19921875, 6.4072265625, 6.615234375, 6.8232421875, 7.03125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 13.0, 18.0, 27.0, 37.0, 74.0, 105.0, 191.0, 255.0, 511.0, 826.0, 1502.0, 2522.0, 4536.0, 8080.0, 14453.0, 26513.0, 47997.0, 87908.0, 155909.0, 268816.0, 431195.0, 606978.0, 701389.0, 642164.0, 476604.0, 307213.0, 181105.0, 102066.0, 56348.0, 30627.0, 16922.0, 9211.0, 5118.0, 2952.0, 1669.0, 1008.0, 575.0, 323.0, 193.0, 131.0, 85.0, 46.0, 23.0, 11.0, 11.0, 8.0, 8.0, 5.0, 4.0], "bins": [-11.046875, -10.7532958984375, -10.459716796875, -10.1661376953125, -9.87255859375, -9.5789794921875, -9.285400390625, -8.9918212890625, -8.6982421875, -8.4046630859375, -8.111083984375, -7.8175048828125, -7.52392578125, -7.2303466796875, -6.936767578125, -6.6431884765625, -6.349609375, -6.0560302734375, -5.762451171875, -5.4688720703125, -5.17529296875, -4.8817138671875, -4.588134765625, -4.2945556640625, -4.0009765625, -3.7073974609375, -3.413818359375, -3.1202392578125, -2.82666015625, -2.5330810546875, -2.239501953125, -1.9459228515625, -1.65234375, -1.3587646484375, -1.065185546875, -0.7716064453125, -0.47802734375, -0.1844482421875, 0.109130859375, 0.4027099609375, 0.6962890625, 0.9898681640625, 1.283447265625, 1.5770263671875, 1.87060546875, 2.1641845703125, 2.457763671875, 2.7513427734375, 3.044921875, 3.3385009765625, 3.632080078125, 3.9256591796875, 4.21923828125, 4.5128173828125, 4.806396484375, 5.0999755859375, 5.3935546875, 5.6871337890625, 5.980712890625, 6.2742919921875, 6.56787109375, 6.8614501953125, 7.155029296875, 7.4486083984375, 7.7421875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 1.0, 0.0, 9.0, 6.0, 7.0, 15.0, 17.0, 32.0, 39.0, 47.0, 63.0, 69.0, 64.0, 108.0, 117.0, 147.0, 143.0, 159.0, 195.0, 203.0, 194.0, 224.0, 221.0, 209.0, 221.0, 221.0, 170.0, 184.0, 143.0, 139.0, 124.0, 119.0, 84.0, 75.0, 67.0, 45.0, 40.0, 28.0, 29.0, 22.0, 16.0, 14.0, 11.0, 10.0, 13.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.45703125, -3.35430908203125, -3.2515869140625, -3.14886474609375, -3.046142578125, -2.94342041015625, -2.8406982421875, -2.73797607421875, -2.63525390625, -2.53253173828125, -2.4298095703125, -2.32708740234375, -2.224365234375, -2.12164306640625, -2.0189208984375, -1.91619873046875, -1.8134765625, -1.71075439453125, -1.6080322265625, -1.50531005859375, -1.402587890625, -1.29986572265625, -1.1971435546875, -1.09442138671875, -0.99169921875, -0.88897705078125, -0.7862548828125, -0.68353271484375, -0.580810546875, -0.47808837890625, -0.3753662109375, -0.27264404296875, -0.169921875, -0.06719970703125, 0.0355224609375, 0.13824462890625, 0.240966796875, 0.34368896484375, 0.4464111328125, 0.54913330078125, 0.65185546875, 0.75457763671875, 0.8572998046875, 0.96002197265625, 1.062744140625, 1.16546630859375, 1.2681884765625, 1.37091064453125, 1.4736328125, 1.57635498046875, 1.6790771484375, 1.78179931640625, 1.884521484375, 1.98724365234375, 2.0899658203125, 2.19268798828125, 2.29541015625, 2.39813232421875, 2.5008544921875, 2.60357666015625, 2.706298828125, 2.80902099609375, 2.9117431640625, 3.01446533203125, 3.1171875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 11.0, 11.0, 17.0, 12.0, 28.0, 34.0, 51.0, 64.0, 58.0, 76.0, 76.0, 81.0, 84.0, 99.0, 59.0, 44.0, 30.0, 36.0, 32.0, 20.0, 16.0, 15.0, 7.0, 8.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.02396297454834, -14.513556480407715, -14.00314998626709, -13.492743492126465, -12.982336044311523, -12.471929550170898, -11.961523056030273, -11.451116561889648, -10.940710067749023, -10.430303573608398, -9.919897079467773, -9.409490585327148, -8.899084091186523, -8.388677597045898, -7.878270149230957, -7.367863655090332, -6.857457160949707, -6.347050666809082, -5.836644172668457, -5.326237201690674, -4.815830707550049, -4.305424213409424, -3.7950174808502197, -3.2846107482910156, -2.7742042541503906, -2.2637977600097656, -1.7533910274505615, -1.242984414100647, -0.7325778007507324, -0.22217130661010742, 0.2882354259490967, 0.7986421585083008, 1.3090496063232422, 1.8194562196731567, 2.3298628330230713, 2.8402695655822754, 3.3506760597229004, 3.8610825538635254, 4.371489524841309, 4.881896018981934, 5.392302513122559, 5.902709007263184, 6.413115501403809, 6.923522472381592, 7.433928966522217, 7.944335460662842, 8.454742431640625, 8.96514892578125, 9.475555419921875, 9.9859619140625, 10.496368408203125, 11.00677490234375, 11.517181396484375, 12.027587890625, 12.537995338439941, 13.048401832580566, 13.558808326721191, 14.069214820861816, 14.579621315002441, 15.090027809143066, 15.600435256958008, 16.110841751098633, 16.621248245239258, 17.131654739379883, 17.642061233520508]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 10.0, 6.0, 7.0, 4.0, 14.0, 9.0, 13.0, 21.0, 16.0, 20.0, 19.0, 21.0, 30.0, 26.0, 38.0, 31.0, 34.0, 43.0, 39.0, 42.0, 33.0, 46.0, 33.0, 42.0, 38.0, 34.0, 44.0, 26.0, 32.0, 40.0, 22.0, 27.0, 37.0, 16.0, 15.0, 5.0, 9.0, 20.0, 8.0, 7.0, 9.0, 4.0, 9.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.622216701507568, -6.375519752502441, -6.128823280334473, -5.882126808166504, -5.635429859161377, -5.38873291015625, -5.142036437988281, -4.8953399658203125, -4.6486430168151855, -4.401946067810059, -4.15524959564209, -3.908552885055542, -3.661856174468994, -3.4151594638824463, -3.1684627532958984, -2.9217660427093506, -2.6750693321228027, -2.428372621536255, -2.181675910949707, -1.9349792003631592, -1.6882824897766113, -1.4415857791900635, -1.1948890686035156, -0.9481923580169678, -0.7014956474304199, -0.45479893684387207, -0.20810222625732422, 0.03859448432922363, 0.2852911949157715, 0.5319879055023193, 0.7786846160888672, 1.025381326675415, 1.272078514099121, 1.518775224685669, 1.7654719352722168, 2.0121686458587646, 2.2588653564453125, 2.5055620670318604, 2.752258777618408, 2.998955488204956, 3.245652198791504, 3.4923489093780518, 3.7390456199645996, 3.9857423305511475, 4.232439041137695, 4.479135513305664, 4.725832462310791, 4.972529411315918, 5.219225883483887, 5.4659223556518555, 5.712619304656982, 5.959316253662109, 6.206012725830078, 6.452709197998047, 6.699406147003174, 6.946103096008301, 7.1927995681762695, 7.439496040344238, 7.686192989349365, 7.932889938354492, 8.179586410522461, 8.42628288269043, 8.672979354858398, 8.919676780700684, 9.166373252868652]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 7.0, 11.0, 12.0, 23.0, 30.0, 37.0, 42.0, 105.0, 129.0, 194.0, 269.0, 414.0, 664.0, 1082.0, 1706.0, 3008.0, 5231.0, 9594.0, 17964.0, 34213.0, 65674.0, 118760.0, 188567.0, 219978.0, 166665.0, 99340.0, 53476.0, 27919.0, 14793.0, 7776.0, 4287.0, 2484.0, 1472.0, 881.0, 566.0, 415.0, 242.0, 160.0, 139.0, 71.0, 45.0, 39.0, 21.0, 18.0, 9.0, 11.0, 5.0, 6.0, 3.0, 2.0, 3.0], "bins": [-3.025390625, -2.942138671875, -2.85888671875, -2.775634765625, -2.6923828125, -2.609130859375, -2.52587890625, -2.442626953125, -2.359375, -2.276123046875, -2.19287109375, -2.109619140625, -2.0263671875, -1.943115234375, -1.85986328125, -1.776611328125, -1.693359375, -1.610107421875, -1.52685546875, -1.443603515625, -1.3603515625, -1.277099609375, -1.19384765625, -1.110595703125, -1.02734375, -0.944091796875, -0.86083984375, -0.777587890625, -0.6943359375, -0.611083984375, -0.52783203125, -0.444580078125, -0.361328125, -0.278076171875, -0.19482421875, -0.111572265625, -0.0283203125, 0.054931640625, 0.13818359375, 0.221435546875, 0.3046875, 0.387939453125, 0.47119140625, 0.554443359375, 0.6376953125, 0.720947265625, 0.80419921875, 0.887451171875, 0.970703125, 1.053955078125, 1.13720703125, 1.220458984375, 1.3037109375, 1.386962890625, 1.47021484375, 1.553466796875, 1.63671875, 1.719970703125, 1.80322265625, 1.886474609375, 1.9697265625, 2.052978515625, 2.13623046875, 2.219482421875, 2.302734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 10.0, 13.0, 13.0, 16.0, 21.0, 17.0, 19.0, 20.0, 23.0, 29.0, 27.0, 25.0, 34.0, 37.0, 42.0, 39.0, 43.0, 44.0, 28.0, 43.0, 42.0, 26.0, 45.0, 37.0, 43.0, 29.0, 30.0, 24.0, 20.0, 28.0, 15.0, 19.0, 16.0, 7.0, 13.0, 12.0, 10.0, 9.0, 9.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3984375, -7.139892578125, -6.88134765625, -6.622802734375, -6.3642578125, -6.105712890625, -5.84716796875, -5.588623046875, -5.330078125, -5.071533203125, -4.81298828125, -4.554443359375, -4.2958984375, -4.037353515625, -3.77880859375, -3.520263671875, -3.26171875, -3.003173828125, -2.74462890625, -2.486083984375, -2.2275390625, -1.968994140625, -1.71044921875, -1.451904296875, -1.193359375, -0.934814453125, -0.67626953125, -0.417724609375, -0.1591796875, 0.099365234375, 0.35791015625, 0.616455078125, 0.875, 1.133544921875, 1.39208984375, 1.650634765625, 1.9091796875, 2.167724609375, 2.42626953125, 2.684814453125, 2.943359375, 3.201904296875, 3.46044921875, 3.718994140625, 3.9775390625, 4.236083984375, 4.49462890625, 4.753173828125, 5.01171875, 5.270263671875, 5.52880859375, 5.787353515625, 6.0458984375, 6.304443359375, 6.56298828125, 6.821533203125, 7.080078125, 7.338623046875, 7.59716796875, 7.855712890625, 8.1142578125, 8.372802734375, 8.63134765625, 8.889892578125, 9.1484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 16.0, 14.0, 28.0, 32.0, 47.0, 61.0, 81.0, 127.0, 190.0, 283.0, 525.0, 777.0, 1287.0, 2133.0, 3957.0, 7222.0, 13291.0, 25544.0, 51123.0, 99443.0, 175428.0, 233109.0, 194221.0, 114580.0, 59918.0, 30484.0, 15658.0, 8170.0, 4365.0, 2539.0, 1486.0, 881.0, 551.0, 318.0, 218.0, 126.0, 110.0, 73.0, 37.0, 21.0, 19.0, 17.0, 14.0, 5.0, 5.0, 7.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.72265625, -2.63372802734375, -2.5447998046875, -2.45587158203125, -2.366943359375, -2.27801513671875, -2.1890869140625, -2.10015869140625, -2.01123046875, -1.92230224609375, -1.8333740234375, -1.74444580078125, -1.655517578125, -1.56658935546875, -1.4776611328125, -1.38873291015625, -1.2998046875, -1.21087646484375, -1.1219482421875, -1.03302001953125, -0.944091796875, -0.85516357421875, -0.7662353515625, -0.67730712890625, -0.58837890625, -0.49945068359375, -0.4105224609375, -0.32159423828125, -0.232666015625, -0.14373779296875, -0.0548095703125, 0.03411865234375, 0.123046875, 0.21197509765625, 0.3009033203125, 0.38983154296875, 0.478759765625, 0.56768798828125, 0.6566162109375, 0.74554443359375, 0.83447265625, 0.92340087890625, 1.0123291015625, 1.10125732421875, 1.190185546875, 1.27911376953125, 1.3680419921875, 1.45697021484375, 1.5458984375, 1.63482666015625, 1.7237548828125, 1.81268310546875, 1.901611328125, 1.99053955078125, 2.0794677734375, 2.16839599609375, 2.25732421875, 2.34625244140625, 2.4351806640625, 2.52410888671875, 2.613037109375, 2.70196533203125, 2.7908935546875, 2.87982177734375, 2.96875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 4.0, 7.0, 6.0, 12.0, 13.0, 11.0, 13.0, 19.0, 16.0, 31.0, 20.0, 22.0, 27.0, 29.0, 30.0, 41.0, 34.0, 36.0, 40.0, 49.0, 50.0, 45.0, 49.0, 41.0, 38.0, 37.0, 28.0, 35.0, 24.0, 26.0, 18.0, 20.0, 13.0, 15.0, 18.0, 18.0, 10.0, 9.0, 8.0, 7.0, 1.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0], "bins": [-5.640625, -5.4808349609375, -5.321044921875, -5.1612548828125, -5.00146484375, -4.8416748046875, -4.681884765625, -4.5220947265625, -4.3623046875, -4.2025146484375, -4.042724609375, -3.8829345703125, -3.72314453125, -3.5633544921875, -3.403564453125, -3.2437744140625, -3.083984375, -2.9241943359375, -2.764404296875, -2.6046142578125, -2.44482421875, -2.2850341796875, -2.125244140625, -1.9654541015625, -1.8056640625, -1.6458740234375, -1.486083984375, -1.3262939453125, -1.16650390625, -1.0067138671875, -0.846923828125, -0.6871337890625, -0.52734375, -0.3675537109375, -0.207763671875, -0.0479736328125, 0.11181640625, 0.2716064453125, 0.431396484375, 0.5911865234375, 0.7509765625, 0.9107666015625, 1.070556640625, 1.2303466796875, 1.39013671875, 1.5499267578125, 1.709716796875, 1.8695068359375, 2.029296875, 2.1890869140625, 2.348876953125, 2.5086669921875, 2.66845703125, 2.8282470703125, 2.988037109375, 3.1478271484375, 3.3076171875, 3.4674072265625, 3.627197265625, 3.7869873046875, 3.94677734375, 4.1065673828125, 4.266357421875, 4.4261474609375, 4.5859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 7.0, 9.0, 11.0, 22.0, 25.0, 33.0, 58.0, 79.0, 93.0, 162.0, 213.0, 344.0, 551.0, 933.0, 1765.0, 3715.0, 9663.0, 34583.0, 179297.0, 550632.0, 207869.0, 39396.0, 10764.0, 3916.0, 1810.0, 947.0, 591.0, 349.0, 224.0, 136.0, 104.0, 58.0, 43.0, 41.0, 26.0, 18.0, 19.0, 11.0, 8.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51953125, -1.47283935546875, -1.4261474609375, -1.37945556640625, -1.332763671875, -1.28607177734375, -1.2393798828125, -1.19268798828125, -1.14599609375, -1.09930419921875, -1.0526123046875, -1.00592041015625, -0.959228515625, -0.91253662109375, -0.8658447265625, -0.81915283203125, -0.7724609375, -0.72576904296875, -0.6790771484375, -0.63238525390625, -0.585693359375, -0.53900146484375, -0.4923095703125, -0.44561767578125, -0.39892578125, -0.35223388671875, -0.3055419921875, -0.25885009765625, -0.212158203125, -0.16546630859375, -0.1187744140625, -0.07208251953125, -0.025390625, 0.02130126953125, 0.0679931640625, 0.11468505859375, 0.161376953125, 0.20806884765625, 0.2547607421875, 0.30145263671875, 0.34814453125, 0.39483642578125, 0.4415283203125, 0.48822021484375, 0.534912109375, 0.58160400390625, 0.6282958984375, 0.67498779296875, 0.7216796875, 0.76837158203125, 0.8150634765625, 0.86175537109375, 0.908447265625, 0.95513916015625, 1.0018310546875, 1.04852294921875, 1.09521484375, 1.14190673828125, 1.1885986328125, 1.23529052734375, 1.281982421875, 1.32867431640625, 1.3753662109375, 1.42205810546875, 1.46875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 9.0, 17.0, 28.0, 56.0, 93.0, 143.0, 206.0, 164.0, 105.0, 84.0, 32.0, 18.0, 9.0, 7.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013113021850585938, -0.00012734532356262207, -0.00012356042861938477, -0.00011977553367614746, -0.00011599063873291016, -0.00011220574378967285, -0.00010842084884643555, -0.00010463595390319824, -0.00010085105895996094, -9.706616401672363e-05, -9.328126907348633e-05, -8.949637413024902e-05, -8.571147918701172e-05, -8.192658424377441e-05, -7.814168930053711e-05, -7.43567943572998e-05, -7.05718994140625e-05, -6.67870044708252e-05, -6.300210952758789e-05, -5.9217214584350586e-05, -5.543231964111328e-05, -5.1647424697875977e-05, -4.786252975463867e-05, -4.407763481140137e-05, -4.029273986816406e-05, -3.650784492492676e-05, -3.272294998168945e-05, -2.893805503845215e-05, -2.5153160095214844e-05, -2.136826515197754e-05, -1.7583370208740234e-05, -1.379847526550293e-05, -1.0013580322265625e-05, -6.22868537902832e-06, -2.4437904357910156e-06, 1.341104507446289e-06, 5.125999450683594e-06, 8.910894393920898e-06, 1.2695789337158203e-05, 1.6480684280395508e-05, 2.0265579223632812e-05, 2.4050474166870117e-05, 2.7835369110107422e-05, 3.1620264053344727e-05, 3.540515899658203e-05, 3.9190053939819336e-05, 4.297494888305664e-05, 4.6759843826293945e-05, 5.054473876953125e-05, 5.4329633712768555e-05, 5.811452865600586e-05, 6.189942359924316e-05, 6.568431854248047e-05, 6.946921348571777e-05, 7.325410842895508e-05, 7.703900337219238e-05, 8.082389831542969e-05, 8.460879325866699e-05, 8.83936882019043e-05, 9.21785831451416e-05, 9.59634780883789e-05, 9.974837303161621e-05, 0.00010353326797485352, 0.00010731816291809082, 0.00011110305786132812]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 2.0, 7.0, 7.0, 19.0, 28.0, 27.0, 52.0, 62.0, 91.0, 107.0, 193.0, 253.0, 447.0, 693.0, 1144.0, 1984.0, 3797.0, 7840.0, 18148.0, 46740.0, 130464.0, 323589.0, 312128.0, 123361.0, 44060.0, 17057.0, 7557.0, 3745.0, 1898.0, 1147.0, 656.0, 419.0, 262.0, 177.0, 119.0, 82.0, 54.0, 27.0, 34.0, 24.0, 14.0, 8.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2099609375, -1.1732635498046875, -1.136566162109375, -1.0998687744140625, -1.06317138671875, -1.0264739990234375, -0.989776611328125, -0.9530792236328125, -0.9163818359375, -0.8796844482421875, -0.842987060546875, -0.8062896728515625, -0.76959228515625, -0.7328948974609375, -0.696197509765625, -0.6595001220703125, -0.622802734375, -0.5861053466796875, -0.549407958984375, -0.5127105712890625, -0.47601318359375, -0.4393157958984375, -0.402618408203125, -0.3659210205078125, -0.3292236328125, -0.2925262451171875, -0.255828857421875, -0.2191314697265625, -0.18243408203125, -0.1457366943359375, -0.109039306640625, -0.0723419189453125, -0.03564453125, 0.0010528564453125, 0.037750244140625, 0.0744476318359375, 0.11114501953125, 0.1478424072265625, 0.184539794921875, 0.2212371826171875, 0.2579345703125, 0.2946319580078125, 0.331329345703125, 0.3680267333984375, 0.40472412109375, 0.4414215087890625, 0.478118896484375, 0.5148162841796875, 0.551513671875, 0.5882110595703125, 0.624908447265625, 0.6616058349609375, 0.69830322265625, 0.7350006103515625, 0.771697998046875, 0.8083953857421875, 0.8450927734375, 0.8817901611328125, 0.918487548828125, 0.9551849365234375, 0.99188232421875, 1.0285797119140625, 1.065277099609375, 1.1019744873046875, 1.138671875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 6.0, 11.0, 9.0, 10.0, 15.0, 22.0, 37.0, 44.0, 45.0, 80.0, 99.0, 102.0, 115.0, 94.0, 82.0, 57.0, 40.0, 37.0, 24.0, 18.0, 15.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.456787109375, -0.4448089599609375, -0.432830810546875, -0.4208526611328125, -0.40887451171875, -0.3968963623046875, -0.384918212890625, -0.3729400634765625, -0.3609619140625, -0.3489837646484375, -0.337005615234375, -0.3250274658203125, -0.31304931640625, -0.3010711669921875, -0.289093017578125, -0.2771148681640625, -0.26513671875, -0.2531585693359375, -0.241180419921875, -0.2292022705078125, -0.21722412109375, -0.2052459716796875, -0.193267822265625, -0.1812896728515625, -0.1693115234375, -0.1573333740234375, -0.145355224609375, -0.1333770751953125, -0.12139892578125, -0.1094207763671875, -0.097442626953125, -0.0854644775390625, -0.073486328125, -0.0615081787109375, -0.049530029296875, -0.0375518798828125, -0.02557373046875, -0.0135955810546875, -0.001617431640625, 0.0103607177734375, 0.0223388671875, 0.0343170166015625, 0.046295166015625, 0.0582733154296875, 0.07025146484375, 0.0822296142578125, 0.094207763671875, 0.1061859130859375, 0.1181640625, 0.1301422119140625, 0.142120361328125, 0.1540985107421875, 0.16607666015625, 0.1780548095703125, 0.190032958984375, 0.2020111083984375, 0.2139892578125, 0.2259674072265625, 0.237945556640625, 0.2499237060546875, 0.26190185546875, 0.2738800048828125, 0.285858154296875, 0.2978363037109375, 0.309814453125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 10.0, 11.0, 18.0, 12.0, 26.0, 39.0, 51.0, 57.0, 58.0, 74.0, 85.0, 81.0, 82.0, 91.0, 75.0, 25.0, 35.0, 34.0, 31.0, 24.0, 14.0, 19.0, 8.0, 10.0, 4.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.803836822509766, -14.299918174743652, -13.796000480651855, -13.292081832885742, -12.788164138793945, -12.284245491027832, -11.780326843261719, -11.276409149169922, -10.772490501403809, -10.268571853637695, -9.764654159545898, -9.260735511779785, -8.756816864013672, -8.252899169921875, -7.748980522155762, -7.245062351226807, -6.741144180297852, -6.2372260093688965, -5.733307838439941, -5.229389190673828, -4.725471019744873, -4.221552848815918, -3.717634439468384, -3.2137160301208496, -2.7097978591918945, -2.2058796882629395, -1.7019612789154053, -1.1980429887771606, -0.694124698638916, -0.19020652770996094, 0.31371188163757324, 0.8176302909851074, 1.3215465545654297, 1.8254648447036743, 2.329383134841919, 2.833301544189453, 3.337219715118408, 3.8411378860473633, 4.345056533813477, 4.848974704742432, 5.352892875671387, 5.856811046600342, 6.360729217529297, 6.86464786529541, 7.368566036224365, 7.87248420715332, 8.376402854919434, 8.880321502685547, 9.384239196777344, 9.888157844543457, 10.392075538635254, 10.895994186401367, 11.399911880493164, 11.903830528259277, 12.40774917602539, 12.911666870117188, 13.4155855178833, 13.919504165649414, 14.423421859741211, 14.927340507507324, 15.431259155273438, 15.935176849365234, 16.43909454345703, 16.94301414489746, 17.446931838989258]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 9.0, 8.0, 6.0, 7.0, 9.0, 10.0, 14.0, 19.0, 18.0, 22.0, 16.0, 24.0, 27.0, 28.0, 42.0, 30.0, 29.0, 47.0, 38.0, 39.0, 34.0, 48.0, 29.0, 46.0, 34.0, 38.0, 38.0, 30.0, 34.0, 37.0, 23.0, 29.0, 37.0, 16.0, 12.0, 7.0, 10.0, 18.0, 10.0, 7.0, 8.0, 5.0, 8.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.60030460357666, -6.354197978973389, -6.108090877532959, -5.8619842529296875, -5.615877628326416, -5.3697710037231445, -5.123663902282715, -4.877557277679443, -4.631450653076172, -4.3853440284729, -4.139236927032471, -3.893130302429199, -3.6470236778259277, -3.400916814804077, -3.1548099517822266, -2.908703327178955, -2.6625964641571045, -2.416489601135254, -2.1703829765319824, -1.9242761135101318, -1.6781694889068604, -1.4320626258850098, -1.1859558820724487, -0.9398491382598877, -0.6937423944473267, -0.4476356506347656, -0.2015288770198822, 0.04457789659500122, 0.29068464040756226, 0.5367914438247681, 0.7828981876373291, 1.0290049314498901, 1.2751116752624512, 1.5212184190750122, 1.7673251628875732, 2.013432025909424, 2.2595386505126953, 2.505645513534546, 2.7517523765563965, 2.997859001159668, 3.2439656257629395, 3.49007248878479, 3.7361791133880615, 3.982285976409912, 4.228392601013184, 4.474499702453613, 4.720606327056885, 4.966712951660156, 5.212820053100586, 5.458926677703857, 5.705033779144287, 5.951140403747559, 6.19724702835083, 6.443353652954102, 6.689460754394531, 6.935567378997803, 7.181674003601074, 7.427780628204346, 7.673887729644775, 7.919994354248047, 8.166101455688477, 8.41220760345459, 8.65831470489502, 8.904420852661133, 9.150527954101562]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 17.0, 16.0, 23.0, 32.0, 58.0, 81.0, 126.0, 177.0, 352.0, 542.0, 821.0, 1406.0, 2269.0, 3735.0, 6475.0, 11089.0, 18288.0, 30810.0, 50162.0, 76921.0, 108503.0, 137252.0, 148929.0, 137236.0, 108834.0, 77473.0, 50502.0, 31027.0, 18503.0, 10920.0, 6291.0, 3818.0, 2290.0, 1277.0, 855.0, 488.0, 327.0, 204.0, 148.0, 92.0, 55.0, 35.0, 29.0, 21.0, 15.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0], "bins": [-7.06640625, -6.8489990234375, -6.631591796875, -6.4141845703125, -6.19677734375, -5.9793701171875, -5.761962890625, -5.5445556640625, -5.3271484375, -5.1097412109375, -4.892333984375, -4.6749267578125, -4.45751953125, -4.2401123046875, -4.022705078125, -3.8052978515625, -3.587890625, -3.3704833984375, -3.153076171875, -2.9356689453125, -2.71826171875, -2.5008544921875, -2.283447265625, -2.0660400390625, -1.8486328125, -1.6312255859375, -1.413818359375, -1.1964111328125, -0.97900390625, -0.7615966796875, -0.544189453125, -0.3267822265625, -0.109375, 0.1080322265625, 0.325439453125, 0.5428466796875, 0.76025390625, 0.9776611328125, 1.195068359375, 1.4124755859375, 1.6298828125, 1.8472900390625, 2.064697265625, 2.2821044921875, 2.49951171875, 2.7169189453125, 2.934326171875, 3.1517333984375, 3.369140625, 3.5865478515625, 3.803955078125, 4.0213623046875, 4.23876953125, 4.4561767578125, 4.673583984375, 4.8909912109375, 5.1083984375, 5.3258056640625, 5.543212890625, 5.7606201171875, 5.97802734375, 6.1954345703125, 6.412841796875, 6.6302490234375, 6.84765625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 11.0, 9.0, 17.0, 13.0, 12.0, 23.0, 19.0, 15.0, 34.0, 25.0, 29.0, 30.0, 35.0, 43.0, 43.0, 42.0, 44.0, 37.0, 47.0, 32.0, 37.0, 39.0, 31.0, 40.0, 32.0, 36.0, 31.0, 28.0, 24.0, 23.0, 9.0, 19.0, 16.0, 8.0, 10.0, 12.0, 12.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83984375, -6.58197021484375, -6.3240966796875, -6.06622314453125, -5.808349609375, -5.55047607421875, -5.2926025390625, -5.03472900390625, -4.77685546875, -4.51898193359375, -4.2611083984375, -4.00323486328125, -3.745361328125, -3.48748779296875, -3.2296142578125, -2.97174072265625, -2.7138671875, -2.45599365234375, -2.1981201171875, -1.94024658203125, -1.682373046875, -1.42449951171875, -1.1666259765625, -0.90875244140625, -0.65087890625, -0.39300537109375, -0.1351318359375, 0.12274169921875, 0.380615234375, 0.63848876953125, 0.8963623046875, 1.15423583984375, 1.412109375, 1.66998291015625, 1.9278564453125, 2.18572998046875, 2.443603515625, 2.70147705078125, 2.9593505859375, 3.21722412109375, 3.47509765625, 3.73297119140625, 3.9908447265625, 4.24871826171875, 4.506591796875, 4.76446533203125, 5.0223388671875, 5.28021240234375, 5.5380859375, 5.79595947265625, 6.0538330078125, 6.31170654296875, 6.569580078125, 6.82745361328125, 7.0853271484375, 7.34320068359375, 7.60107421875, 7.85894775390625, 8.1168212890625, 8.37469482421875, 8.632568359375, 8.89044189453125, 9.1483154296875, 9.40618896484375, 9.6640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 15.0, 22.0, 29.0, 31.0, 54.0, 106.0, 116.0, 219.0, 333.0, 513.0, 908.0, 1680.0, 3478.0, 8144.0, 21127.0, 53513.0, 123458.0, 225033.0, 266152.0, 187250.0, 91912.0, 37727.0, 14753.0, 6052.0, 2596.0, 1373.0, 712.0, 409.0, 257.0, 196.0, 127.0, 96.0, 50.0, 26.0, 21.0, 20.0, 14.0, 12.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4765625, -13.072021484375, -12.66748046875, -12.262939453125, -11.8583984375, -11.453857421875, -11.04931640625, -10.644775390625, -10.240234375, -9.835693359375, -9.43115234375, -9.026611328125, -8.6220703125, -8.217529296875, -7.81298828125, -7.408447265625, -7.00390625, -6.599365234375, -6.19482421875, -5.790283203125, -5.3857421875, -4.981201171875, -4.57666015625, -4.172119140625, -3.767578125, -3.363037109375, -2.95849609375, -2.553955078125, -2.1494140625, -1.744873046875, -1.34033203125, -0.935791015625, -0.53125, -0.126708984375, 0.27783203125, 0.682373046875, 1.0869140625, 1.491455078125, 1.89599609375, 2.300537109375, 2.705078125, 3.109619140625, 3.51416015625, 3.918701171875, 4.3232421875, 4.727783203125, 5.13232421875, 5.536865234375, 5.94140625, 6.345947265625, 6.75048828125, 7.155029296875, 7.5595703125, 7.964111328125, 8.36865234375, 8.773193359375, 9.177734375, 9.582275390625, 9.98681640625, 10.391357421875, 10.7958984375, 11.200439453125, 11.60498046875, 12.009521484375, 12.4140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 6.0, 9.0, 6.0, 8.0, 12.0, 5.0, 16.0, 15.0, 16.0, 27.0, 24.0, 33.0, 27.0, 24.0, 29.0, 34.0, 34.0, 34.0, 41.0, 34.0, 35.0, 31.0, 40.0, 33.0, 33.0, 28.0, 32.0, 37.0, 31.0, 37.0, 22.0, 26.0, 22.0, 26.0, 19.0, 15.0, 12.0, 12.0, 14.0, 8.0, 6.0, 7.0, 2.0, 3.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 4.0], "bins": [-4.3984375, -4.26251220703125, -4.1265869140625, -3.99066162109375, -3.854736328125, -3.71881103515625, -3.5828857421875, -3.44696044921875, -3.31103515625, -3.17510986328125, -3.0391845703125, -2.90325927734375, -2.767333984375, -2.63140869140625, -2.4954833984375, -2.35955810546875, -2.2236328125, -2.08770751953125, -1.9517822265625, -1.81585693359375, -1.679931640625, -1.54400634765625, -1.4080810546875, -1.27215576171875, -1.13623046875, -1.00030517578125, -0.8643798828125, -0.72845458984375, -0.592529296875, -0.45660400390625, -0.3206787109375, -0.18475341796875, -0.048828125, 0.08709716796875, 0.2230224609375, 0.35894775390625, 0.494873046875, 0.63079833984375, 0.7667236328125, 0.90264892578125, 1.03857421875, 1.17449951171875, 1.3104248046875, 1.44635009765625, 1.582275390625, 1.71820068359375, 1.8541259765625, 1.99005126953125, 2.1259765625, 2.26190185546875, 2.3978271484375, 2.53375244140625, 2.669677734375, 2.80560302734375, 2.9415283203125, 3.07745361328125, 3.21337890625, 3.34930419921875, 3.4852294921875, 3.62115478515625, 3.757080078125, 3.89300537109375, 4.0289306640625, 4.16485595703125, 4.30078125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 6.0, 7.0, 13.0, 15.0, 28.0, 46.0, 63.0, 82.0, 149.0, 245.0, 349.0, 639.0, 999.0, 1688.0, 2962.0, 5277.0, 9395.0, 18078.0, 36343.0, 75540.0, 152651.0, 241608.0, 230311.0, 136547.0, 66974.0, 32608.0, 16144.0, 8465.0, 4665.0, 2644.0, 1551.0, 938.0, 524.0, 357.0, 206.0, 143.0, 100.0, 63.0, 38.0, 29.0, 28.0, 12.0, 4.0, 4.0, 5.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.453125, -7.2196044921875, -6.986083984375, -6.7525634765625, -6.51904296875, -6.2855224609375, -6.052001953125, -5.8184814453125, -5.5849609375, -5.3514404296875, -5.117919921875, -4.8843994140625, -4.65087890625, -4.4173583984375, -4.183837890625, -3.9503173828125, -3.716796875, -3.4832763671875, -3.249755859375, -3.0162353515625, -2.78271484375, -2.5491943359375, -2.315673828125, -2.0821533203125, -1.8486328125, -1.6151123046875, -1.381591796875, -1.1480712890625, -0.91455078125, -0.6810302734375, -0.447509765625, -0.2139892578125, 0.01953125, 0.2530517578125, 0.486572265625, 0.7200927734375, 0.95361328125, 1.1871337890625, 1.420654296875, 1.6541748046875, 1.8876953125, 2.1212158203125, 2.354736328125, 2.5882568359375, 2.82177734375, 3.0552978515625, 3.288818359375, 3.5223388671875, 3.755859375, 3.9893798828125, 4.222900390625, 4.4564208984375, 4.68994140625, 4.9234619140625, 5.156982421875, 5.3905029296875, 5.6240234375, 5.8575439453125, 6.091064453125, 6.3245849609375, 6.55810546875, 6.7916259765625, 7.025146484375, 7.2586669921875, 7.4921875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 9.0, 9.0, 7.0, 15.0, 19.0, 21.0, 17.0, 19.0, 36.0, 43.0, 73.0, 90.0, 77.0, 103.0, 107.0, 68.0, 66.0, 55.0, 38.0, 32.0, 26.0, 19.0, 13.0, 6.0, 9.0, 7.0, 2.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006246566772460938, -0.0006067454814910889, -0.000588834285736084, -0.0005709230899810791, -0.0005530118942260742, -0.0005351006984710693, -0.0005171895027160645, -0.0004992783069610596, -0.0004813671112060547, -0.0004634559154510498, -0.0004455447196960449, -0.00042763352394104004, -0.00040972232818603516, -0.0003918111324310303, -0.0003738999366760254, -0.0003559887409210205, -0.0003380775451660156, -0.00032016634941101074, -0.00030225515365600586, -0.000284343957901001, -0.0002664327621459961, -0.0002485215663909912, -0.00023061037063598633, -0.00021269917488098145, -0.00019478797912597656, -0.00017687678337097168, -0.0001589655876159668, -0.00014105439186096191, -0.00012314319610595703, -0.00010523200035095215, -8.732080459594727e-05, -6.940960884094238e-05, -5.14984130859375e-05, -3.358721733093262e-05, -1.5676021575927734e-05, 2.2351741790771484e-06, 2.014636993408203e-05, 3.8057565689086914e-05, 5.59687614440918e-05, 7.387995719909668e-05, 9.179115295410156e-05, 0.00010970234870910645, 0.00012761354446411133, 0.0001455247402191162, 0.0001634359359741211, 0.00018134713172912598, 0.00019925832748413086, 0.00021716952323913574, 0.00023508071899414062, 0.0002529919147491455, 0.0002709031105041504, 0.0002888143062591553, 0.00030672550201416016, 0.00032463669776916504, 0.0003425478935241699, 0.0003604590892791748, 0.0003783702850341797, 0.00039628148078918457, 0.00041419267654418945, 0.00043210387229919434, 0.0004500150680541992, 0.0004679262638092041, 0.000485837459564209, 0.0005037486553192139, 0.0005216598510742188]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 11.0, 9.0, 31.0, 26.0, 41.0, 47.0, 93.0, 140.0, 224.0, 350.0, 621.0, 977.0, 1587.0, 2626.0, 4323.0, 7583.0, 13238.0, 23399.0, 42383.0, 75272.0, 126654.0, 180742.0, 194746.0, 152029.0, 95663.0, 54708.0, 30654.0, 17132.0, 9525.0, 5507.0, 3198.0, 1895.0, 1187.0, 709.0, 426.0, 268.0, 171.0, 131.0, 79.0, 55.0, 35.0, 18.0, 13.0, 8.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.21038818359375, -5.0379638671875, -4.86553955078125, -4.693115234375, -4.52069091796875, -4.3482666015625, -4.17584228515625, -4.00341796875, -3.83099365234375, -3.6585693359375, -3.48614501953125, -3.313720703125, -3.14129638671875, -2.9688720703125, -2.79644775390625, -2.6240234375, -2.45159912109375, -2.2791748046875, -2.10675048828125, -1.934326171875, -1.76190185546875, -1.5894775390625, -1.41705322265625, -1.24462890625, -1.07220458984375, -0.8997802734375, -0.72735595703125, -0.554931640625, -0.38250732421875, -0.2100830078125, -0.03765869140625, 0.134765625, 0.30718994140625, 0.4796142578125, 0.65203857421875, 0.824462890625, 0.99688720703125, 1.1693115234375, 1.34173583984375, 1.51416015625, 1.68658447265625, 1.8590087890625, 2.03143310546875, 2.203857421875, 2.37628173828125, 2.5487060546875, 2.72113037109375, 2.8935546875, 3.06597900390625, 3.2384033203125, 3.41082763671875, 3.583251953125, 3.75567626953125, 3.9281005859375, 4.10052490234375, 4.27294921875, 4.44537353515625, 4.6177978515625, 4.79022216796875, 4.962646484375, 5.13507080078125, 5.3074951171875, 5.47991943359375, 5.65234375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 1.0, 3.0, 6.0, 6.0, 12.0, 9.0, 15.0, 16.0, 22.0, 10.0, 22.0, 30.0, 37.0, 40.0, 47.0, 42.0, 56.0, 53.0, 44.0, 49.0, 45.0, 51.0, 41.0, 35.0, 40.0, 46.0, 36.0, 25.0, 34.0, 26.0, 17.0, 13.0, 16.0, 7.0, 9.0, 9.0, 5.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.4892578125, -1.4448394775390625, -1.400421142578125, -1.3560028076171875, -1.31158447265625, -1.2671661376953125, -1.222747802734375, -1.1783294677734375, -1.1339111328125, -1.0894927978515625, -1.045074462890625, -1.0006561279296875, -0.95623779296875, -0.9118194580078125, -0.867401123046875, -0.8229827880859375, -0.778564453125, -0.7341461181640625, -0.689727783203125, -0.6453094482421875, -0.60089111328125, -0.5564727783203125, -0.512054443359375, -0.4676361083984375, -0.4232177734375, -0.3787994384765625, -0.334381103515625, -0.2899627685546875, -0.24554443359375, -0.2011260986328125, -0.156707763671875, -0.1122894287109375, -0.06787109375, -0.0234527587890625, 0.020965576171875, 0.0653839111328125, 0.10980224609375, 0.1542205810546875, 0.198638916015625, 0.2430572509765625, 0.2874755859375, 0.3318939208984375, 0.376312255859375, 0.4207305908203125, 0.46514892578125, 0.5095672607421875, 0.553985595703125, 0.5984039306640625, 0.642822265625, 0.6872406005859375, 0.731658935546875, 0.7760772705078125, 0.82049560546875, 0.8649139404296875, 0.909332275390625, 0.9537506103515625, 0.9981689453125, 1.0425872802734375, 1.087005615234375, 1.1314239501953125, 1.17584228515625, 1.2202606201171875, 1.264678955078125, 1.3090972900390625, 1.353515625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 1.0, 6.0, 6.0, 13.0, 8.0, 16.0, 14.0, 25.0, 41.0, 39.0, 55.0, 58.0, 73.0, 84.0, 86.0, 78.0, 63.0, 71.0, 47.0, 59.0, 28.0, 29.0, 14.0, 20.0, 20.0, 11.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.905106544494629, -14.417510986328125, -13.929915428161621, -13.442319869995117, -12.954724311828613, -12.46712875366211, -11.979533195495605, -11.491937637329102, -11.004342079162598, -10.516746520996094, -10.02915096282959, -9.541555404663086, -9.053959846496582, -8.566364288330078, -8.078768730163574, -7.59117317199707, -7.103577613830566, -6.6159820556640625, -6.128386497497559, -5.640790939331055, -5.153195381164551, -4.665599822998047, -4.178004264831543, -3.690408706665039, -3.202813148498535, -2.7152175903320312, -2.2276220321655273, -1.7400264739990234, -1.2524309158325195, -0.7648353576660156, -0.2772397994995117, 0.2103557586669922, 0.6979522705078125, 1.1855478286743164, 1.6731433868408203, 2.160738945007324, 2.648334503173828, 3.135930061340332, 3.623525619506836, 4.11112117767334, 4.598716735839844, 5.086312294006348, 5.573907852172852, 6.0615034103393555, 6.549098968505859, 7.036694526672363, 7.524290084838867, 8.011885643005371, 8.499481201171875, 8.987076759338379, 9.474672317504883, 9.962267875671387, 10.44986343383789, 10.937458992004395, 11.425054550170898, 11.912650108337402, 12.400245666503906, 12.88784122467041, 13.375436782836914, 13.863032341003418, 14.350627899169922, 14.838223457336426, 15.32581901550293, 15.813414573669434, 16.301010131835938]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 11.0, 7.0, 14.0, 15.0, 20.0, 16.0, 19.0, 28.0, 31.0, 34.0, 19.0, 35.0, 30.0, 34.0, 41.0, 41.0, 44.0, 34.0, 30.0, 44.0, 40.0, 37.0, 43.0, 37.0, 34.0, 33.0, 30.0, 28.0, 24.0, 18.0, 26.0, 14.0, 15.0, 12.0, 8.0, 6.0, 7.0, 8.0, 8.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.769217491149902, -7.513876914978027, -7.258536338806152, -7.003195762634277, -6.747855186462402, -6.492514610290527, -6.237174034118652, -5.981833457946777, -5.726492881774902, -5.471152305603027, -5.215811729431152, -4.960471153259277, -4.705130577087402, -4.449790000915527, -4.194449424743652, -3.9391088485717773, -3.6837682723999023, -3.4284276962280273, -3.1730871200561523, -2.9177465438842773, -2.6624059677124023, -2.4070653915405273, -2.1517248153686523, -1.8963842391967773, -1.6410436630249023, -1.3857030868530273, -1.1303625106811523, -0.8750219345092773, -0.6196813583374023, -0.36434078216552734, -0.10900020599365234, 0.14634037017822266, 0.40168094635009766, 0.6570215225219727, 0.9123620986938477, 1.1677026748657227, 1.4230432510375977, 1.6783838272094727, 1.9337244033813477, 2.1890649795532227, 2.4444055557250977, 2.6997461318969727, 2.9550867080688477, 3.2104272842407227, 3.4657678604125977, 3.7211084365844727, 3.9764490127563477, 4.231789588928223, 4.487130165100098, 4.742470741271973, 4.997811317443848, 5.253151893615723, 5.508492469787598, 5.763833045959473, 6.019173622131348, 6.274514198303223, 6.529854774475098, 6.785195350646973, 7.040535926818848, 7.295876502990723, 7.551217079162598, 7.806557655334473, 8.061898231506348, 8.317238807678223, 8.572579383850098]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 11.0, 19.0, 22.0, 45.0, 66.0, 84.0, 126.0, 187.0, 287.0, 437.0, 681.0, 1074.0, 1555.0, 2444.0, 3792.0, 6005.0, 9473.0, 15090.0, 24533.0, 39136.0, 64692.0, 105205.0, 168615.0, 267434.0, 400731.0, 545534.0, 629071.0, 591333.0, 461686.0, 317936.0, 203811.0, 127324.0, 78210.0, 48078.0, 29470.0, 18302.0, 11250.0, 7389.0, 4595.0, 2940.0, 1886.0, 1292.0, 845.0, 539.0, 349.0, 254.0, 159.0, 103.0, 60.0, 49.0, 19.0, 21.0, 17.0, 11.0, 7.0, 5.0, 2.0], "bins": [-7.79296875, -7.56170654296875, -7.3304443359375, -7.09918212890625, -6.867919921875, -6.63665771484375, -6.4053955078125, -6.17413330078125, -5.94287109375, -5.71160888671875, -5.4803466796875, -5.24908447265625, -5.017822265625, -4.78656005859375, -4.5552978515625, -4.32403564453125, -4.0927734375, -3.86151123046875, -3.6302490234375, -3.39898681640625, -3.167724609375, -2.93646240234375, -2.7052001953125, -2.47393798828125, -2.24267578125, -2.01141357421875, -1.7801513671875, -1.54888916015625, -1.317626953125, -1.08636474609375, -0.8551025390625, -0.62384033203125, -0.392578125, -0.16131591796875, 0.0699462890625, 0.30120849609375, 0.532470703125, 0.76373291015625, 0.9949951171875, 1.22625732421875, 1.45751953125, 1.68878173828125, 1.9200439453125, 2.15130615234375, 2.382568359375, 2.61383056640625, 2.8450927734375, 3.07635498046875, 3.3076171875, 3.53887939453125, 3.7701416015625, 4.00140380859375, 4.232666015625, 4.46392822265625, 4.6951904296875, 4.92645263671875, 5.15771484375, 5.38897705078125, 5.6202392578125, 5.85150146484375, 6.082763671875, 6.31402587890625, 6.5452880859375, 6.77655029296875, 7.0078125]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 10.0, 8.0, 7.0, 14.0, 9.0, 14.0, 20.0, 18.0, 23.0, 15.0, 28.0, 32.0, 33.0, 32.0, 30.0, 35.0, 39.0, 46.0, 46.0, 24.0, 44.0, 37.0, 44.0, 33.0, 44.0, 36.0, 40.0, 30.0, 30.0, 26.0, 27.0, 22.0, 15.0, 14.0, 15.0, 8.0, 17.0, 4.0, 9.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.87890625, -4.70654296875, -4.5341796875, -4.36181640625, -4.189453125, -4.01708984375, -3.8447265625, -3.67236328125, -3.5, -3.32763671875, -3.1552734375, -2.98291015625, -2.810546875, -2.63818359375, -2.4658203125, -2.29345703125, -2.12109375, -1.94873046875, -1.7763671875, -1.60400390625, -1.431640625, -1.25927734375, -1.0869140625, -0.91455078125, -0.7421875, -0.56982421875, -0.3974609375, -0.22509765625, -0.052734375, 0.11962890625, 0.2919921875, 0.46435546875, 0.63671875, 0.80908203125, 0.9814453125, 1.15380859375, 1.326171875, 1.49853515625, 1.6708984375, 1.84326171875, 2.015625, 2.18798828125, 2.3603515625, 2.53271484375, 2.705078125, 2.87744140625, 3.0498046875, 3.22216796875, 3.39453125, 3.56689453125, 3.7392578125, 3.91162109375, 4.083984375, 4.25634765625, 4.4287109375, 4.60107421875, 4.7734375, 4.94580078125, 5.1181640625, 5.29052734375, 5.462890625, 5.63525390625, 5.8076171875, 5.97998046875, 6.15234375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 10.0, 30.0, 34.0, 38.0, 83.0, 135.0, 212.0, 288.0, 483.0, 740.0, 1319.0, 1900.0, 3084.0, 5116.0, 8265.0, 13060.0, 21140.0, 34328.0, 54797.0, 87357.0, 139057.0, 214048.0, 314545.0, 432599.0, 530884.0, 566670.0, 516547.0, 410631.0, 295554.0, 197733.0, 128712.0, 81265.0, 50551.0, 31366.0, 19457.0, 11963.0, 7512.0, 4784.0, 2861.0, 1864.0, 1215.0, 703.0, 508.0, 304.0, 208.0, 107.0, 80.0, 48.0, 31.0, 22.0, 7.0, 7.0, 4.0, 5.0, 1.0], "bins": [-7.55078125, -7.33135986328125, -7.1119384765625, -6.89251708984375, -6.673095703125, -6.45367431640625, -6.2342529296875, -6.01483154296875, -5.79541015625, -5.57598876953125, -5.3565673828125, -5.13714599609375, -4.917724609375, -4.69830322265625, -4.4788818359375, -4.25946044921875, -4.0400390625, -3.82061767578125, -3.6011962890625, -3.38177490234375, -3.162353515625, -2.94293212890625, -2.7235107421875, -2.50408935546875, -2.28466796875, -2.06524658203125, -1.8458251953125, -1.62640380859375, -1.406982421875, -1.18756103515625, -0.9681396484375, -0.74871826171875, -0.529296875, -0.30987548828125, -0.0904541015625, 0.12896728515625, 0.348388671875, 0.56781005859375, 0.7872314453125, 1.00665283203125, 1.22607421875, 1.44549560546875, 1.6649169921875, 1.88433837890625, 2.103759765625, 2.32318115234375, 2.5426025390625, 2.76202392578125, 2.9814453125, 3.20086669921875, 3.4202880859375, 3.63970947265625, 3.859130859375, 4.07855224609375, 4.2979736328125, 4.51739501953125, 4.73681640625, 4.95623779296875, 5.1756591796875, 5.39508056640625, 5.614501953125, 5.83392333984375, 6.0533447265625, 6.27276611328125, 6.4921875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 8.0, 10.0, 9.0, 12.0, 14.0, 21.0, 20.0, 30.0, 35.0, 40.0, 61.0, 64.0, 84.0, 78.0, 96.0, 124.0, 148.0, 159.0, 154.0, 172.0, 219.0, 214.0, 224.0, 221.0, 193.0, 211.0, 202.0, 179.0, 177.0, 165.0, 126.0, 100.0, 107.0, 70.0, 54.0, 43.0, 42.0, 42.0, 27.0, 26.0, 19.0, 20.0, 15.0, 9.0, 6.0, 2.0, 6.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.67578125, -2.5859375, -2.49609375, -2.40625, -2.31640625, -2.2265625, -2.13671875, -2.046875, -1.95703125, -1.8671875, -1.77734375, -1.6875, -1.59765625, -1.5078125, -1.41796875, -1.328125, -1.23828125, -1.1484375, -1.05859375, -0.96875, -0.87890625, -0.7890625, -0.69921875, -0.609375, -0.51953125, -0.4296875, -0.33984375, -0.25, -0.16015625, -0.0703125, 0.01953125, 0.109375, 0.19921875, 0.2890625, 0.37890625, 0.46875, 0.55859375, 0.6484375, 0.73828125, 0.828125, 0.91796875, 1.0078125, 1.09765625, 1.1875, 1.27734375, 1.3671875, 1.45703125, 1.546875, 1.63671875, 1.7265625, 1.81640625, 1.90625, 1.99609375, 2.0859375, 2.17578125, 2.265625, 2.35546875, 2.4453125, 2.53515625, 2.625, 2.71484375, 2.8046875, 2.89453125, 2.984375, 3.07421875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 3.0, 9.0, 9.0, 12.0, 12.0, 15.0, 22.0, 26.0, 46.0, 57.0, 71.0, 62.0, 83.0, 88.0, 79.0, 71.0, 61.0, 53.0, 49.0, 38.0, 30.0, 21.0, 10.0, 13.0, 13.0, 13.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.690620422363281, -15.239558219909668, -14.788495063781738, -14.337432861328125, -13.886370658874512, -13.435308456420898, -12.984245300292969, -12.533183097839355, -12.082120895385742, -11.631058692932129, -11.1799955368042, -10.728933334350586, -10.277871131896973, -9.82680892944336, -9.37574577331543, -8.924683570861816, -8.473620414733887, -8.022558212280273, -7.571495532989502, -7.1204328536987305, -6.669370651245117, -6.218307971954346, -5.767245292663574, -5.316183090209961, -4.8651204109191895, -4.414057731628418, -3.9629955291748047, -3.511932849884033, -3.060870409011841, -2.6098079681396484, -2.158745288848877, -1.7076828479766846, -1.2566194534301758, -0.8055569529533386, -0.35449445247650146, 0.09656810760498047, 0.5476305484771729, 0.9986929893493652, 1.4497556686401367, 1.900818109512329, 2.3518805503845215, 2.802942991256714, 3.2540054321289062, 3.7050681114196777, 4.156130790710449, 4.6071929931640625, 5.058255672454834, 5.5093183517456055, 5.960380554199219, 6.41144323348999, 6.8625054359436035, 7.313568115234375, 7.764630317687988, 8.215692520141602, 8.666755676269531, 9.117817878723145, 9.568880081176758, 10.019942283630371, 10.4710054397583, 10.922067642211914, 11.373129844665527, 11.82419204711914, 12.27525520324707, 12.726317405700684, 13.177380561828613]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 8.0, 4.0, 5.0, 9.0, 17.0, 17.0, 19.0, 26.0, 26.0, 32.0, 25.0, 23.0, 30.0, 38.0, 41.0, 37.0, 37.0, 43.0, 49.0, 38.0, 49.0, 35.0, 44.0, 33.0, 41.0, 27.0, 25.0, 32.0, 20.0, 31.0, 17.0, 17.0, 24.0, 18.0, 15.0, 6.0, 12.0, 5.0, 3.0, 7.0, 0.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.987983703613281, -6.75785493850708, -6.527725696563721, -6.2975969314575195, -6.06746768951416, -5.837338924407959, -5.6072096824646, -5.377080917358398, -5.146951675415039, -4.916822910308838, -4.6866936683654785, -4.456564903259277, -4.226435661315918, -3.996306896209717, -3.7661776542663574, -3.5360488891601562, -3.305919885635376, -3.0757908821105957, -2.8456618785858154, -2.615532875061035, -2.385403871536255, -2.1552748680114746, -1.9251459836959839, -1.6950169801712036, -1.4648879766464233, -1.234758973121643, -1.0046299695968628, -0.7745010256767273, -0.544372022151947, -0.3142430782318115, -0.08411407470703125, 0.14601492881774902, 0.3761439323425293, 0.6062729358673096, 0.8364019393920898, 1.0665309429168701, 1.2966599464416504, 1.5267888307571411, 1.7569178342819214, 1.9870468378067017, 2.2171759605407715, 2.4473049640655518, 2.677433967590332, 2.9075629711151123, 3.1376919746398926, 3.3678207397460938, 3.597949981689453, 3.8280787467956543, 4.0582075119018555, 4.288336277008057, 4.518465518951416, 4.748594284057617, 4.978723526000977, 5.208852291107178, 5.438981533050537, 5.669110298156738, 5.899239540100098, 6.129368305206299, 6.359497547149658, 6.589626312255859, 6.819755554199219, 7.04988431930542, 7.280013561248779, 7.5101423263549805, 7.74027156829834]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 9.0, 14.0, 14.0, 28.0, 31.0, 40.0, 60.0, 77.0, 102.0, 149.0, 210.0, 302.0, 372.0, 551.0, 875.0, 1318.0, 2199.0, 3909.0, 7653.0, 17216.0, 42320.0, 105677.0, 231100.0, 305914.0, 188005.0, 79970.0, 32032.0, 13571.0, 6141.0, 3198.0, 1848.0, 1124.0, 730.0, 525.0, 380.0, 252.0, 159.0, 131.0, 96.0, 72.0, 51.0, 41.0, 21.0, 17.0, 11.0, 11.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.609375, -3.494232177734375, -3.37908935546875, -3.263946533203125, -3.1488037109375, -3.033660888671875, -2.91851806640625, -2.803375244140625, -2.688232421875, -2.573089599609375, -2.45794677734375, -2.342803955078125, -2.2276611328125, -2.112518310546875, -1.99737548828125, -1.882232666015625, -1.76708984375, -1.651947021484375, -1.53680419921875, -1.421661376953125, -1.3065185546875, -1.191375732421875, -1.07623291015625, -0.961090087890625, -0.845947265625, -0.730804443359375, -0.61566162109375, -0.500518798828125, -0.3853759765625, -0.270233154296875, -0.15509033203125, -0.039947509765625, 0.0751953125, 0.190338134765625, 0.30548095703125, 0.420623779296875, 0.5357666015625, 0.650909423828125, 0.76605224609375, 0.881195068359375, 0.996337890625, 1.111480712890625, 1.22662353515625, 1.341766357421875, 1.4569091796875, 1.572052001953125, 1.68719482421875, 1.802337646484375, 1.91748046875, 2.032623291015625, 2.14776611328125, 2.262908935546875, 2.3780517578125, 2.493194580078125, 2.60833740234375, 2.723480224609375, 2.838623046875, 2.953765869140625, 3.06890869140625, 3.184051513671875, 3.2991943359375, 3.414337158203125, 3.52947998046875, 3.644622802734375, 3.759765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 9.0, 9.0, 19.0, 10.0, 17.0, 14.0, 12.0, 23.0, 29.0, 34.0, 33.0, 30.0, 27.0, 36.0, 34.0, 39.0, 49.0, 48.0, 45.0, 48.0, 49.0, 37.0, 44.0, 36.0, 38.0, 23.0, 24.0, 23.0, 17.0, 22.0, 25.0, 18.0, 18.0, 16.0, 14.0, 5.0, 2.0, 10.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.47265625, -7.21978759765625, -6.9669189453125, -6.71405029296875, -6.461181640625, -6.20831298828125, -5.9554443359375, -5.70257568359375, -5.44970703125, -5.19683837890625, -4.9439697265625, -4.69110107421875, -4.438232421875, -4.18536376953125, -3.9324951171875, -3.67962646484375, -3.4267578125, -3.17388916015625, -2.9210205078125, -2.66815185546875, -2.415283203125, -2.16241455078125, -1.9095458984375, -1.65667724609375, -1.40380859375, -1.15093994140625, -0.8980712890625, -0.64520263671875, -0.392333984375, -0.13946533203125, 0.1134033203125, 0.36627197265625, 0.619140625, 0.87200927734375, 1.1248779296875, 1.37774658203125, 1.630615234375, 1.88348388671875, 2.1363525390625, 2.38922119140625, 2.64208984375, 2.89495849609375, 3.1478271484375, 3.40069580078125, 3.653564453125, 3.90643310546875, 4.1593017578125, 4.41217041015625, 4.6650390625, 4.91790771484375, 5.1707763671875, 5.42364501953125, 5.676513671875, 5.92938232421875, 6.1822509765625, 6.43511962890625, 6.68798828125, 6.94085693359375, 7.1937255859375, 7.44659423828125, 7.699462890625, 7.95233154296875, 8.2052001953125, 8.45806884765625, 8.7109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 9.0, 6.0, 14.0, 19.0, 16.0, 31.0, 43.0, 63.0, 112.0, 168.0, 304.0, 607.0, 1375.0, 3922.0, 14964.0, 78010.0, 389290.0, 439065.0, 95184.0, 17892.0, 4401.0, 1557.0, 653.0, 332.0, 167.0, 109.0, 81.0, 50.0, 31.0, 22.0, 16.0, 12.0, 10.0, 3.0, 3.0, 4.0, 7.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.4234619140625, -6.202392578125, -5.9813232421875, -5.76025390625, -5.5391845703125, -5.318115234375, -5.0970458984375, -4.8759765625, -4.6549072265625, -4.433837890625, -4.2127685546875, -3.99169921875, -3.7706298828125, -3.549560546875, -3.3284912109375, -3.107421875, -2.8863525390625, -2.665283203125, -2.4442138671875, -2.22314453125, -2.0020751953125, -1.781005859375, -1.5599365234375, -1.3388671875, -1.1177978515625, -0.896728515625, -0.6756591796875, -0.45458984375, -0.2335205078125, -0.012451171875, 0.2086181640625, 0.4296875, 0.6507568359375, 0.871826171875, 1.0928955078125, 1.31396484375, 1.5350341796875, 1.756103515625, 1.9771728515625, 2.1982421875, 2.4193115234375, 2.640380859375, 2.8614501953125, 3.08251953125, 3.3035888671875, 3.524658203125, 3.7457275390625, 3.966796875, 4.1878662109375, 4.408935546875, 4.6300048828125, 4.85107421875, 5.0721435546875, 5.293212890625, 5.5142822265625, 5.7353515625, 5.9564208984375, 6.177490234375, 6.3985595703125, 6.61962890625, 6.8406982421875, 7.061767578125, 7.2828369140625, 7.50390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 8.0, 5.0, 7.0, 10.0, 8.0, 10.0, 19.0, 22.0, 15.0, 15.0, 25.0, 19.0, 20.0, 32.0, 31.0, 44.0, 41.0, 29.0, 44.0, 31.0, 43.0, 46.0, 36.0, 35.0, 43.0, 43.0, 40.0, 37.0, 36.0, 29.0, 35.0, 19.0, 19.0, 26.0, 13.0, 12.0, 16.0, 9.0, 10.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.484375, -4.3353271484375, -4.186279296875, -4.0372314453125, -3.88818359375, -3.7391357421875, -3.590087890625, -3.4410400390625, -3.2919921875, -3.1429443359375, -2.993896484375, -2.8448486328125, -2.69580078125, -2.5467529296875, -2.397705078125, -2.2486572265625, -2.099609375, -1.9505615234375, -1.801513671875, -1.6524658203125, -1.50341796875, -1.3543701171875, -1.205322265625, -1.0562744140625, -0.9072265625, -0.7581787109375, -0.609130859375, -0.4600830078125, -0.31103515625, -0.1619873046875, -0.012939453125, 0.1361083984375, 0.28515625, 0.4342041015625, 0.583251953125, 0.7322998046875, 0.88134765625, 1.0303955078125, 1.179443359375, 1.3284912109375, 1.4775390625, 1.6265869140625, 1.775634765625, 1.9246826171875, 2.07373046875, 2.2227783203125, 2.371826171875, 2.5208740234375, 2.669921875, 2.8189697265625, 2.968017578125, 3.1170654296875, 3.26611328125, 3.4151611328125, 3.564208984375, 3.7132568359375, 3.8623046875, 4.0113525390625, 4.160400390625, 4.3094482421875, 4.45849609375, 4.6075439453125, 4.756591796875, 4.9056396484375, 5.0546875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 4.0, 5.0, 13.0, 11.0, 27.0, 23.0, 39.0, 36.0, 57.0, 80.0, 138.0, 182.0, 294.0, 431.0, 763.0, 1330.0, 2942.0, 8832.0, 63495.0, 677413.0, 260980.0, 21764.0, 4925.0, 2005.0, 1019.0, 561.0, 348.0, 251.0, 155.0, 119.0, 81.0, 60.0, 37.0, 25.0, 32.0, 19.0, 9.0, 17.0, 3.0, 7.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.650390625, -2.569488525390625, -2.48858642578125, -2.407684326171875, -2.3267822265625, -2.245880126953125, -2.16497802734375, -2.084075927734375, -2.003173828125, -1.922271728515625, -1.84136962890625, -1.760467529296875, -1.6795654296875, -1.598663330078125, -1.51776123046875, -1.436859130859375, -1.35595703125, -1.275054931640625, -1.19415283203125, -1.113250732421875, -1.0323486328125, -0.951446533203125, -0.87054443359375, -0.789642333984375, -0.708740234375, -0.627838134765625, -0.54693603515625, -0.466033935546875, -0.3851318359375, -0.304229736328125, -0.22332763671875, -0.142425537109375, -0.0615234375, 0.019378662109375, 0.10028076171875, 0.181182861328125, 0.2620849609375, 0.342987060546875, 0.42388916015625, 0.504791259765625, 0.585693359375, 0.666595458984375, 0.74749755859375, 0.828399658203125, 0.9093017578125, 0.990203857421875, 1.07110595703125, 1.152008056640625, 1.23291015625, 1.313812255859375, 1.39471435546875, 1.475616455078125, 1.5565185546875, 1.637420654296875, 1.71832275390625, 1.799224853515625, 1.880126953125, 1.961029052734375, 2.04193115234375, 2.122833251953125, 2.2037353515625, 2.284637451171875, 2.36553955078125, 2.446441650390625, 2.52734375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 10.0, 43.0, 90.0, 215.0, 307.0, 191.0, 82.0, 29.0, 8.0, 4.0, 6.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019478797912597656, -0.00018912367522716522, -0.00018345937132835388, -0.00017779506742954254, -0.0001721307635307312, -0.00016646645963191986, -0.00016080215573310852, -0.00015513785183429718, -0.00014947354793548584, -0.0001438092440366745, -0.00013814494013786316, -0.00013248063623905182, -0.00012681633234024048, -0.00012115202844142914, -0.0001154877245426178, -0.00010982342064380646, -0.00010415911674499512, -9.849481284618378e-05, -9.283050894737244e-05, -8.71662050485611e-05, -8.150190114974976e-05, -7.583759725093842e-05, -7.017329335212708e-05, -6.450898945331573e-05, -5.8844685554504395e-05, -5.3180381655693054e-05, -4.7516077756881714e-05, -4.1851773858070374e-05, -3.618746995925903e-05, -3.052316606044769e-05, -2.4858862161636353e-05, -1.9194558262825012e-05, -1.3530254364013672e-05, -7.865950465202332e-06, -2.201646566390991e-06, 3.462657332420349e-06, 9.12696123123169e-06, 1.479126513004303e-05, 2.045556902885437e-05, 2.611987292766571e-05, 3.178417682647705e-05, 3.744848072528839e-05, 4.311278462409973e-05, 4.877708852291107e-05, 5.444139242172241e-05, 6.010569632053375e-05, 6.577000021934509e-05, 7.143430411815643e-05, 7.709860801696777e-05, 8.276291191577911e-05, 8.842721581459045e-05, 9.40915197134018e-05, 9.975582361221313e-05, 0.00010542012751102448, 0.00011108443140983582, 0.00011674873530864716, 0.0001224130392074585, 0.00012807734310626984, 0.00013374164700508118, 0.00013940595090389252, 0.00014507025480270386, 0.0001507345587015152, 0.00015639886260032654, 0.00016206316649913788, 0.00016772747039794922]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 11.0, 16.0, 17.0, 29.0, 27.0, 24.0, 56.0, 88.0, 102.0, 112.0, 160.0, 205.0, 274.0, 363.0, 501.0, 626.0, 890.0, 1338.0, 1964.0, 3322.0, 6611.0, 14457.0, 36296.0, 101731.0, 275239.0, 354350.0, 154276.0, 54040.0, 20289.0, 8943.0, 4278.0, 2493.0, 1524.0, 943.0, 727.0, 543.0, 404.0, 315.0, 221.0, 194.0, 144.0, 96.0, 84.0, 52.0, 48.0, 29.0, 25.0, 23.0, 12.0, 17.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0], "bins": [-1.1953125, -1.1581878662109375, -1.121063232421875, -1.0839385986328125, -1.04681396484375, -1.0096893310546875, -0.972564697265625, -0.9354400634765625, -0.8983154296875, -0.8611907958984375, -0.824066162109375, -0.7869415283203125, -0.74981689453125, -0.7126922607421875, -0.675567626953125, -0.6384429931640625, -0.601318359375, -0.5641937255859375, -0.527069091796875, -0.4899444580078125, -0.45281982421875, -0.4156951904296875, -0.378570556640625, -0.3414459228515625, -0.3043212890625, -0.2671966552734375, -0.230072021484375, -0.1929473876953125, -0.15582275390625, -0.1186981201171875, -0.081573486328125, -0.0444488525390625, -0.00732421875, 0.0298004150390625, 0.066925048828125, 0.1040496826171875, 0.14117431640625, 0.1782989501953125, 0.215423583984375, 0.2525482177734375, 0.2896728515625, 0.3267974853515625, 0.363922119140625, 0.4010467529296875, 0.43817138671875, 0.4752960205078125, 0.512420654296875, 0.5495452880859375, 0.586669921875, 0.6237945556640625, 0.660919189453125, 0.6980438232421875, 0.73516845703125, 0.7722930908203125, 0.809417724609375, 0.8465423583984375, 0.8836669921875, 0.9207916259765625, 0.957916259765625, 0.9950408935546875, 1.03216552734375, 1.0692901611328125, 1.106414794921875, 1.1435394287109375, 1.1806640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 4.0, 14.0, 18.0, 35.0, 47.0, 48.0, 60.0, 98.0, 91.0, 116.0, 96.0, 96.0, 60.0, 59.0, 30.0, 22.0, 25.0, 17.0, 9.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.34814453125, -0.3382911682128906, -0.32843780517578125, -0.3185844421386719, -0.3087310791015625, -0.2988777160644531, -0.28902435302734375, -0.2791709899902344, -0.269317626953125, -0.2594642639160156, -0.24961090087890625, -0.23975753784179688, -0.2299041748046875, -0.22005081176757812, -0.21019744873046875, -0.20034408569335938, -0.19049072265625, -0.18063735961914062, -0.17078399658203125, -0.16093063354492188, -0.1510772705078125, -0.14122390747070312, -0.13137054443359375, -0.12151718139648438, -0.111663818359375, -0.10181045532226562, -0.09195709228515625, -0.08210372924804688, -0.0722503662109375, -0.062397003173828125, -0.05254364013671875, -0.042690277099609375, -0.0328369140625, -0.022983551025390625, -0.01313018798828125, -0.003276824951171875, 0.0065765380859375, 0.016429901123046875, 0.02628326416015625, 0.036136627197265625, 0.045989990234375, 0.055843353271484375, 0.06569671630859375, 0.07555007934570312, 0.0854034423828125, 0.09525680541992188, 0.10511016845703125, 0.11496353149414062, 0.12481689453125, 0.13467025756835938, 0.14452362060546875, 0.15437698364257812, 0.1642303466796875, 0.17408370971679688, 0.18393707275390625, 0.19379043579101562, 0.203643798828125, 0.21349716186523438, 0.22335052490234375, 0.23320388793945312, 0.2430572509765625, 0.2529106140136719, 0.26276397705078125, 0.2726173400878906, 0.282470703125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 3.0, 3.0, 13.0, 9.0, 9.0, 11.0, 16.0, 19.0, 28.0, 52.0, 46.0, 69.0, 61.0, 84.0, 76.0, 82.0, 71.0, 62.0, 58.0, 48.0, 40.0, 31.0, 21.0, 16.0, 12.0, 11.0, 13.0, 7.0, 5.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.299629211425781, -14.861589431762695, -14.42354965209961, -13.98551082611084, -13.547471046447754, -13.109431266784668, -12.671392440795898, -12.233352661132812, -11.795312881469727, -11.35727310180664, -10.919233322143555, -10.481194496154785, -10.0431547164917, -9.605114936828613, -9.167076110839844, -8.729036331176758, -8.290996551513672, -7.852956771850586, -7.414917469024658, -6.9768781661987305, -6.5388383865356445, -6.100798606872559, -5.662759304046631, -5.224720001220703, -4.786680221557617, -4.348640441894531, -3.9106011390686035, -3.4725615978240967, -3.03452205657959, -2.596482515335083, -2.158442974090576, -1.7204034328460693, -1.282364845275879, -0.8443253040313721, -0.40628576278686523, 0.0317537784576416, 0.46979331970214844, 0.9078328609466553, 1.345872402191162, 1.783911943435669, 2.221951484680176, 2.6599910259246826, 3.0980305671691895, 3.5360701084136963, 3.974109649658203, 4.412149429321289, 4.850188732147217, 5.2882280349731445, 5.7262678146362305, 6.164307594299316, 6.602346897125244, 7.040386199951172, 7.478425979614258, 7.916465759277344, 8.35450553894043, 8.7925443649292, 9.230584144592285, 9.668623924255371, 10.10666275024414, 10.544702529907227, 10.982742309570312, 11.420782089233398, 11.858821868896484, 12.296860694885254, 12.73490047454834]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 4.0, 6.0, 10.0, 13.0, 17.0, 21.0, 27.0, 28.0, 28.0, 29.0, 25.0, 28.0, 42.0, 34.0, 39.0, 38.0, 47.0, 46.0, 43.0, 47.0, 31.0, 45.0, 31.0, 41.0, 28.0, 27.0, 32.0, 17.0, 34.0, 15.0, 17.0, 25.0, 14.0, 16.0, 11.0, 7.0, 4.0, 4.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.965717792510986, -6.735640048980713, -6.5055623054504395, -6.275484561920166, -6.045406818389893, -5.815329074859619, -5.585251331329346, -5.355173587799072, -5.125095844268799, -4.895018100738525, -4.664940357208252, -4.4348626136779785, -4.204784870147705, -3.9747071266174316, -3.744629383087158, -3.5145516395568848, -3.2844741344451904, -3.054396390914917, -2.8243186473846436, -2.59424090385437, -2.3641631603240967, -2.1340856552124023, -1.9040077924728394, -1.673930048942566, -1.4438523054122925, -1.213774561882019, -0.9836968183517456, -0.7536191344261169, -0.5235413908958435, -0.29346370697021484, -0.0633859634399414, 0.16669178009033203, 0.39676952362060547, 0.6268472671508789, 0.8569250106811523, 1.0870027542114258, 1.3170804977416992, 1.547158122062683, 1.7772358655929565, 2.0073137283325195, 2.237391471862793, 2.4674692153930664, 2.69754695892334, 2.9276247024536133, 3.1577024459838867, 3.38778018951416, 3.6178579330444336, 3.847935676574707, 4.0780134201049805, 4.308091163635254, 4.538168907165527, 4.768246650695801, 4.998324394226074, 5.228402137756348, 5.458479881286621, 5.6885576248168945, 5.91863489151001, 6.148712635040283, 6.378790378570557, 6.60886812210083, 6.8389458656311035, 7.069023609161377, 7.29910135269165, 7.529179096221924, 7.759256839752197]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 7.0, 5.0, 20.0, 20.0, 32.0, 51.0, 98.0, 162.0, 204.0, 306.0, 497.0, 749.0, 1258.0, 2023.0, 3137.0, 5248.0, 8227.0, 13740.0, 21266.0, 32986.0, 49607.0, 71182.0, 94816.0, 115574.0, 126883.0, 124346.0, 108146.0, 86054.0, 62309.0, 43441.0, 28197.0, 17998.0, 11366.0, 7013.0, 4423.0, 2697.0, 1680.0, 977.0, 610.0, 412.0, 309.0, 168.0, 112.0, 71.0, 46.0, 27.0, 22.0, 16.0, 7.0, 5.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.78515625, -5.61407470703125, -5.4429931640625, -5.27191162109375, -5.100830078125, -4.92974853515625, -4.7586669921875, -4.58758544921875, -4.41650390625, -4.24542236328125, -4.0743408203125, -3.90325927734375, -3.732177734375, -3.56109619140625, -3.3900146484375, -3.21893310546875, -3.0478515625, -2.87677001953125, -2.7056884765625, -2.53460693359375, -2.363525390625, -2.19244384765625, -2.0213623046875, -1.85028076171875, -1.67919921875, -1.50811767578125, -1.3370361328125, -1.16595458984375, -0.994873046875, -0.82379150390625, -0.6527099609375, -0.48162841796875, -0.310546875, -0.13946533203125, 0.0316162109375, 0.20269775390625, 0.373779296875, 0.54486083984375, 0.7159423828125, 0.88702392578125, 1.05810546875, 1.22918701171875, 1.4002685546875, 1.57135009765625, 1.742431640625, 1.91351318359375, 2.0845947265625, 2.25567626953125, 2.4267578125, 2.59783935546875, 2.7689208984375, 2.94000244140625, 3.111083984375, 3.28216552734375, 3.4532470703125, 3.62432861328125, 3.79541015625, 3.96649169921875, 4.1375732421875, 4.30865478515625, 4.479736328125, 4.65081787109375, 4.8218994140625, 4.99298095703125, 5.1640625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 3.0, 8.0, 12.0, 12.0, 12.0, 15.0, 15.0, 27.0, 26.0, 24.0, 17.0, 31.0, 31.0, 37.0, 45.0, 29.0, 54.0, 48.0, 41.0, 46.0, 38.0, 38.0, 35.0, 33.0, 34.0, 42.0, 34.0, 20.0, 20.0, 20.0, 14.0, 25.0, 26.0, 19.0, 17.0, 7.0, 11.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.9140625, -6.678466796875, -6.44287109375, -6.207275390625, -5.9716796875, -5.736083984375, -5.50048828125, -5.264892578125, -5.029296875, -4.793701171875, -4.55810546875, -4.322509765625, -4.0869140625, -3.851318359375, -3.61572265625, -3.380126953125, -3.14453125, -2.908935546875, -2.67333984375, -2.437744140625, -2.2021484375, -1.966552734375, -1.73095703125, -1.495361328125, -1.259765625, -1.024169921875, -0.78857421875, -0.552978515625, -0.3173828125, -0.081787109375, 0.15380859375, 0.389404296875, 0.625, 0.860595703125, 1.09619140625, 1.331787109375, 1.5673828125, 1.802978515625, 2.03857421875, 2.274169921875, 2.509765625, 2.745361328125, 2.98095703125, 3.216552734375, 3.4521484375, 3.687744140625, 3.92333984375, 4.158935546875, 4.39453125, 4.630126953125, 4.86572265625, 5.101318359375, 5.3369140625, 5.572509765625, 5.80810546875, 6.043701171875, 6.279296875, 6.514892578125, 6.75048828125, 6.986083984375, 7.2216796875, 7.457275390625, 7.69287109375, 7.928466796875, 8.1640625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 8.0, 12.0, 15.0, 22.0, 25.0, 31.0, 63.0, 59.0, 114.0, 169.0, 241.0, 375.0, 610.0, 957.0, 1633.0, 2784.0, 4967.0, 8590.0, 15270.0, 26554.0, 45162.0, 72447.0, 108634.0, 142681.0, 158974.0, 147935.0, 114738.0, 78268.0, 48946.0, 29072.0, 16649.0, 9487.0, 5230.0, 3112.0, 1753.0, 1105.0, 685.0, 398.0, 263.0, 167.0, 111.0, 76.0, 48.0, 31.0, 21.0, 18.0, 14.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-7.796875, -7.5714111328125, -7.345947265625, -7.1204833984375, -6.89501953125, -6.6695556640625, -6.444091796875, -6.2186279296875, -5.9931640625, -5.7677001953125, -5.542236328125, -5.3167724609375, -5.09130859375, -4.8658447265625, -4.640380859375, -4.4149169921875, -4.189453125, -3.9639892578125, -3.738525390625, -3.5130615234375, -3.28759765625, -3.0621337890625, -2.836669921875, -2.6112060546875, -2.3857421875, -2.1602783203125, -1.934814453125, -1.7093505859375, -1.48388671875, -1.2584228515625, -1.032958984375, -0.8074951171875, -0.58203125, -0.3565673828125, -0.131103515625, 0.0943603515625, 0.31982421875, 0.5452880859375, 0.770751953125, 0.9962158203125, 1.2216796875, 1.4471435546875, 1.672607421875, 1.8980712890625, 2.12353515625, 2.3489990234375, 2.574462890625, 2.7999267578125, 3.025390625, 3.2508544921875, 3.476318359375, 3.7017822265625, 3.92724609375, 4.1527099609375, 4.378173828125, 4.6036376953125, 4.8291015625, 5.0545654296875, 5.280029296875, 5.5054931640625, 5.73095703125, 5.9564208984375, 6.181884765625, 6.4073486328125, 6.6328125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 4.0, 6.0, 2.0, 5.0, 11.0, 13.0, 15.0, 11.0, 23.0, 15.0, 22.0, 21.0, 37.0, 27.0, 28.0, 38.0, 34.0, 39.0, 41.0, 43.0, 41.0, 43.0, 40.0, 52.0, 28.0, 34.0, 30.0, 43.0, 38.0, 40.0, 25.0, 30.0, 21.0, 22.0, 19.0, 14.0, 19.0, 7.0, 2.0, 6.0, 8.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.78515625, -4.63287353515625, -4.4805908203125, -4.32830810546875, -4.176025390625, -4.02374267578125, -3.8714599609375, -3.71917724609375, -3.56689453125, -3.41461181640625, -3.2623291015625, -3.11004638671875, -2.957763671875, -2.80548095703125, -2.6531982421875, -2.50091552734375, -2.3486328125, -2.19635009765625, -2.0440673828125, -1.89178466796875, -1.739501953125, -1.58721923828125, -1.4349365234375, -1.28265380859375, -1.13037109375, -0.97808837890625, -0.8258056640625, -0.67352294921875, -0.521240234375, -0.36895751953125, -0.2166748046875, -0.06439208984375, 0.087890625, 0.24017333984375, 0.3924560546875, 0.54473876953125, 0.697021484375, 0.84930419921875, 1.0015869140625, 1.15386962890625, 1.30615234375, 1.45843505859375, 1.6107177734375, 1.76300048828125, 1.915283203125, 2.06756591796875, 2.2198486328125, 2.37213134765625, 2.5244140625, 2.67669677734375, 2.8289794921875, 2.98126220703125, 3.133544921875, 3.28582763671875, 3.4381103515625, 3.59039306640625, 3.74267578125, 3.89495849609375, 4.0472412109375, 4.19952392578125, 4.351806640625, 4.50408935546875, 4.6563720703125, 4.80865478515625, 4.9609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 6.0, 10.0, 10.0, 17.0, 25.0, 20.0, 38.0, 52.0, 94.0, 151.0, 189.0, 303.0, 411.0, 663.0, 996.0, 1535.0, 2399.0, 3838.0, 6398.0, 10990.0, 19373.0, 34460.0, 61273.0, 102368.0, 153342.0, 185219.0, 168800.0, 121384.0, 74254.0, 42552.0, 23685.0, 13328.0, 7615.0, 4658.0, 2835.0, 1789.0, 1127.0, 745.0, 524.0, 347.0, 213.0, 188.0, 114.0, 70.0, 50.0, 26.0, 28.0, 16.0, 13.0, 9.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.32421875, -4.19189453125, -4.0595703125, -3.92724609375, -3.794921875, -3.66259765625, -3.5302734375, -3.39794921875, -3.265625, -3.13330078125, -3.0009765625, -2.86865234375, -2.736328125, -2.60400390625, -2.4716796875, -2.33935546875, -2.20703125, -2.07470703125, -1.9423828125, -1.81005859375, -1.677734375, -1.54541015625, -1.4130859375, -1.28076171875, -1.1484375, -1.01611328125, -0.8837890625, -0.75146484375, -0.619140625, -0.48681640625, -0.3544921875, -0.22216796875, -0.08984375, 0.04248046875, 0.1748046875, 0.30712890625, 0.439453125, 0.57177734375, 0.7041015625, 0.83642578125, 0.96875, 1.10107421875, 1.2333984375, 1.36572265625, 1.498046875, 1.63037109375, 1.7626953125, 1.89501953125, 2.02734375, 2.15966796875, 2.2919921875, 2.42431640625, 2.556640625, 2.68896484375, 2.8212890625, 2.95361328125, 3.0859375, 3.21826171875, 3.3505859375, 3.48291015625, 3.615234375, 3.74755859375, 3.8798828125, 4.01220703125, 4.14453125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 12.0, 11.0, 12.0, 14.0, 19.0, 24.0, 38.0, 35.0, 42.0, 43.0, 60.0, 46.0, 59.0, 56.0, 71.0, 65.0, 50.0, 50.0, 51.0, 50.0, 32.0, 24.0, 25.0, 14.0, 13.0, 17.0, 16.0, 11.0, 4.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00032210350036621094, -0.00031204521656036377, -0.0003019869327545166, -0.00029192864894866943, -0.00028187036514282227, -0.0002718120813369751, -0.00026175379753112793, -0.00025169551372528076, -0.0002416372299194336, -0.00023157894611358643, -0.00022152066230773926, -0.0002114623785018921, -0.00020140409469604492, -0.00019134581089019775, -0.00018128752708435059, -0.00017122924327850342, -0.00016117095947265625, -0.00015111267566680908, -0.00014105439186096191, -0.00013099610805511475, -0.00012093782424926758, -0.00011087954044342041, -0.00010082125663757324, -9.076297283172607e-05, -8.07046890258789e-05, -7.064640522003174e-05, -6.058812141418457e-05, -5.05298376083374e-05, -4.0471553802490234e-05, -3.0413269996643066e-05, -2.03549861907959e-05, -1.029670238494873e-05, -2.384185791015625e-07, 9.819865226745605e-06, 1.9878149032592773e-05, 2.993643283843994e-05, 3.999471664428711e-05, 5.005300045013428e-05, 6.0111284255981445e-05, 7.016956806182861e-05, 8.022785186767578e-05, 9.028613567352295e-05, 0.00010034441947937012, 0.00011040270328521729, 0.00012046098709106445, 0.00013051927089691162, 0.0001405775547027588, 0.00015063583850860596, 0.00016069412231445312, 0.0001707524061203003, 0.00018081068992614746, 0.00019086897373199463, 0.0002009272575378418, 0.00021098554134368896, 0.00022104382514953613, 0.0002311021089553833, 0.00024116039276123047, 0.00025121867656707764, 0.0002612769603729248, 0.00027133524417877197, 0.00028139352798461914, 0.0002914518117904663, 0.0003015100955963135, 0.00031156837940216064, 0.0003216266632080078]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 4.0, 7.0, 14.0, 20.0, 31.0, 36.0, 37.0, 70.0, 107.0, 186.0, 236.0, 435.0, 706.0, 1074.0, 1869.0, 3265.0, 5354.0, 9698.0, 16462.0, 28852.0, 49942.0, 81760.0, 125499.0, 164587.0, 172967.0, 142325.0, 97654.0, 60492.0, 35821.0, 20450.0, 11678.0, 6938.0, 3969.0, 2327.0, 1374.0, 812.0, 494.0, 325.0, 235.0, 136.0, 80.0, 62.0, 49.0, 31.0, 20.0, 15.0, 17.0, 11.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.07421875, -3.95147705078125, -3.8287353515625, -3.70599365234375, -3.583251953125, -3.46051025390625, -3.3377685546875, -3.21502685546875, -3.09228515625, -2.96954345703125, -2.8468017578125, -2.72406005859375, -2.601318359375, -2.47857666015625, -2.3558349609375, -2.23309326171875, -2.1103515625, -1.98760986328125, -1.8648681640625, -1.74212646484375, -1.619384765625, -1.49664306640625, -1.3739013671875, -1.25115966796875, -1.12841796875, -1.00567626953125, -0.8829345703125, -0.76019287109375, -0.637451171875, -0.51470947265625, -0.3919677734375, -0.26922607421875, -0.146484375, -0.02374267578125, 0.0989990234375, 0.22174072265625, 0.344482421875, 0.46722412109375, 0.5899658203125, 0.71270751953125, 0.83544921875, 0.95819091796875, 1.0809326171875, 1.20367431640625, 1.326416015625, 1.44915771484375, 1.5718994140625, 1.69464111328125, 1.8173828125, 1.94012451171875, 2.0628662109375, 2.18560791015625, 2.308349609375, 2.43109130859375, 2.5538330078125, 2.67657470703125, 2.79931640625, 2.92205810546875, 3.0447998046875, 3.16754150390625, 3.290283203125, 3.41302490234375, 3.5357666015625, 3.65850830078125, 3.78125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 9.0, 4.0, 7.0, 8.0, 3.0, 13.0, 18.0, 13.0, 15.0, 15.0, 19.0, 17.0, 30.0, 24.0, 29.0, 34.0, 26.0, 32.0, 44.0, 41.0, 38.0, 44.0, 38.0, 50.0, 49.0, 43.0, 34.0, 38.0, 28.0, 34.0, 19.0, 45.0, 21.0, 20.0, 17.0, 13.0, 11.0, 13.0, 10.0, 6.0, 5.0, 6.0, 8.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.828125, -0.8000869750976562, -0.7720489501953125, -0.7440109252929688, -0.715972900390625, -0.6879348754882812, -0.6598968505859375, -0.6318588256835938, -0.60382080078125, -0.5757827758789062, -0.5477447509765625, -0.5197067260742188, -0.491668701171875, -0.46363067626953125, -0.4355926513671875, -0.40755462646484375, -0.3795166015625, -0.35147857666015625, -0.3234405517578125, -0.29540252685546875, -0.267364501953125, -0.23932647705078125, -0.2112884521484375, -0.18325042724609375, -0.15521240234375, -0.12717437744140625, -0.0991363525390625, -0.07109832763671875, -0.043060302734375, -0.01502227783203125, 0.0130157470703125, 0.04105377197265625, 0.069091796875, 0.09712982177734375, 0.1251678466796875, 0.15320587158203125, 0.181243896484375, 0.20928192138671875, 0.2373199462890625, 0.26535797119140625, 0.29339599609375, 0.32143402099609375, 0.3494720458984375, 0.37751007080078125, 0.405548095703125, 0.43358612060546875, 0.4616241455078125, 0.48966217041015625, 0.5177001953125, 0.5457382202148438, 0.5737762451171875, 0.6018142700195312, 0.629852294921875, 0.6578903198242188, 0.6859283447265625, 0.7139663696289062, 0.74200439453125, 0.7700424194335938, 0.7980804443359375, 0.8261184692382812, 0.854156494140625, 0.8821945190429688, 0.9102325439453125, 0.9382705688476562, 0.96630859375]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 9.0, 6.0, 7.0, 12.0, 13.0, 13.0, 23.0, 24.0, 32.0, 63.0, 59.0, 60.0, 64.0, 64.0, 76.0, 61.0, 70.0, 55.0, 64.0, 42.0, 30.0, 32.0, 29.0, 15.0, 11.0, 10.0, 10.0, 6.0, 4.0, 3.0, 7.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.503911018371582, -13.099896430969238, -12.695881843566895, -12.29186725616455, -11.88785171508789, -11.483837127685547, -11.079822540283203, -10.67580795288086, -10.271793365478516, -9.867778778076172, -9.463764190673828, -9.059749603271484, -8.65573501586914, -8.251720428466797, -7.847704887390137, -7.443690299987793, -7.039675712585449, -6.6356611251831055, -6.231646537780762, -5.82763147354126, -5.423616886138916, -5.019602298736572, -4.61558723449707, -4.211572647094727, -3.807558059692383, -3.403543472290039, -2.999528646469116, -2.5955138206481934, -2.1914992332458496, -1.7874846458435059, -1.383469820022583, -0.9794549942016602, -0.575439453125, -0.1714247465133667, 0.2325899600982666, 0.6366046667098999, 1.0406193733215332, 1.444633960723877, 1.8486487865447998, 2.2526636123657227, 2.6566781997680664, 3.06069278717041, 3.464707612991333, 3.868722438812256, 4.2727370262146, 4.676751613616943, 5.080766677856445, 5.484781265258789, 5.888795852661133, 6.292810440063477, 6.69682502746582, 7.100840091705322, 7.504854679107666, 7.90886926651001, 8.312884330749512, 8.716898918151855, 9.1209135055542, 9.524928092956543, 9.928942680358887, 10.33295726776123, 10.73697280883789, 11.140987396240234, 11.545001983642578, 11.949016571044922, 12.353031158447266]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 14.0, 11.0, 22.0, 16.0, 14.0, 23.0, 23.0, 27.0, 23.0, 29.0, 33.0, 34.0, 43.0, 34.0, 38.0, 38.0, 37.0, 33.0, 38.0, 32.0, 34.0, 38.0, 24.0, 36.0, 37.0, 29.0, 30.0, 26.0, 18.0, 17.0, 22.0, 19.0, 18.0, 11.0, 13.0, 10.0, 4.0, 4.0, 6.0, 2.0, 4.0, 5.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.619550704956055, -6.404935359954834, -6.1903204917907715, -5.975705146789551, -5.76108980178833, -5.546474456787109, -5.331859588623047, -5.117244243621826, -4.9026288986206055, -4.688013553619385, -4.473398685455322, -4.258783340454102, -4.044167995452881, -3.8295528888702393, -3.6149377822875977, -3.400322437286377, -3.1857073307037354, -2.9710922241210938, -2.756476879119873, -2.5418617725372314, -2.3272464275360107, -2.112631320953369, -1.898016095161438, -1.6834008693695068, -1.4687856435775757, -1.2541704177856445, -1.0395551919937134, -0.824940025806427, -0.6103248000144958, -0.3957096338272095, -0.18109440803527832, 0.03352081775665283, 0.24813604354858398, 0.46275126934051514, 0.6773664951324463, 0.8919816613197327, 1.1065969467163086, 1.3212120532989502, 1.5358272790908813, 1.7504425048828125, 1.9650577306747437, 2.179672956466675, 2.3942880630493164, 2.608903408050537, 2.8235185146331787, 3.0381336212158203, 3.252748966217041, 3.4673643112182617, 3.6819794178009033, 3.896594524383545, 4.111209869384766, 4.325825214385986, 4.540440082550049, 4.7550554275512695, 4.96967077255249, 5.184286117553711, 5.398900985717773, 5.613516330718994, 5.828131198883057, 6.042746543884277, 6.257361888885498, 6.471977233886719, 6.686592102050781, 6.901207447052002, 7.115822792053223]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 12.0, 23.0, 37.0, 46.0, 90.0, 137.0, 227.0, 329.0, 511.0, 817.0, 1473.0, 2396.0, 3949.0, 6559.0, 11378.0, 19275.0, 33190.0, 58564.0, 101900.0, 178617.0, 302719.0, 482711.0, 669453.0, 729576.0, 602813.0, 404648.0, 245675.0, 142277.0, 81376.0, 46940.0, 27155.0, 15878.0, 9197.0, 5535.0, 3365.0, 2045.0, 1236.0, 805.0, 540.0, 322.0, 179.0, 97.0, 72.0, 56.0, 30.0, 20.0, 17.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.390625, -8.138671875, -7.88671875, -7.634765625, -7.3828125, -7.130859375, -6.87890625, -6.626953125, -6.375, -6.123046875, -5.87109375, -5.619140625, -5.3671875, -5.115234375, -4.86328125, -4.611328125, -4.359375, -4.107421875, -3.85546875, -3.603515625, -3.3515625, -3.099609375, -2.84765625, -2.595703125, -2.34375, -2.091796875, -1.83984375, -1.587890625, -1.3359375, -1.083984375, -0.83203125, -0.580078125, -0.328125, -0.076171875, 0.17578125, 0.427734375, 0.6796875, 0.931640625, 1.18359375, 1.435546875, 1.6875, 1.939453125, 2.19140625, 2.443359375, 2.6953125, 2.947265625, 3.19921875, 3.451171875, 3.703125, 3.955078125, 4.20703125, 4.458984375, 4.7109375, 4.962890625, 5.21484375, 5.466796875, 5.71875, 5.970703125, 6.22265625, 6.474609375, 6.7265625, 6.978515625, 7.23046875, 7.482421875, 7.734375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 5.0, 3.0, 6.0, 2.0, 6.0, 6.0, 11.0, 15.0, 17.0, 20.0, 20.0, 12.0, 25.0, 36.0, 21.0, 40.0, 44.0, 42.0, 39.0, 31.0, 43.0, 46.0, 35.0, 32.0, 34.0, 35.0, 39.0, 34.0, 41.0, 31.0, 35.0, 31.0, 28.0, 25.0, 24.0, 14.0, 14.0, 11.0, 10.0, 9.0, 8.0, 6.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.13330078125, -3.9736328125, -3.81396484375, -3.654296875, -3.49462890625, -3.3349609375, -3.17529296875, -3.015625, -2.85595703125, -2.6962890625, -2.53662109375, -2.376953125, -2.21728515625, -2.0576171875, -1.89794921875, -1.73828125, -1.57861328125, -1.4189453125, -1.25927734375, -1.099609375, -0.93994140625, -0.7802734375, -0.62060546875, -0.4609375, -0.30126953125, -0.1416015625, 0.01806640625, 0.177734375, 0.33740234375, 0.4970703125, 0.65673828125, 0.81640625, 0.97607421875, 1.1357421875, 1.29541015625, 1.455078125, 1.61474609375, 1.7744140625, 1.93408203125, 2.09375, 2.25341796875, 2.4130859375, 2.57275390625, 2.732421875, 2.89208984375, 3.0517578125, 3.21142578125, 3.37109375, 3.53076171875, 3.6904296875, 3.85009765625, 4.009765625, 4.16943359375, 4.3291015625, 4.48876953125, 4.6484375, 4.80810546875, 4.9677734375, 5.12744140625, 5.287109375, 5.44677734375, 5.6064453125, 5.76611328125, 5.92578125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 5.0, 8.0, 17.0, 29.0, 40.0, 68.0, 83.0, 161.0, 240.0, 395.0, 666.0, 1104.0, 1878.0, 3027.0, 5110.0, 9139.0, 15486.0, 27528.0, 48672.0, 84652.0, 146808.0, 248043.0, 393507.0, 559215.0, 667419.0, 643569.0, 503408.0, 339371.0, 208881.0, 122348.0, 69854.0, 39579.0, 22752.0, 12895.0, 7421.0, 4361.0, 2569.0, 1569.0, 951.0, 535.0, 358.0, 194.0, 145.0, 91.0, 49.0, 31.0, 15.0, 10.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-8.0078125, -7.7562255859375, -7.504638671875, -7.2530517578125, -7.00146484375, -6.7498779296875, -6.498291015625, -6.2467041015625, -5.9951171875, -5.7435302734375, -5.491943359375, -5.2403564453125, -4.98876953125, -4.7371826171875, -4.485595703125, -4.2340087890625, -3.982421875, -3.7308349609375, -3.479248046875, -3.2276611328125, -2.97607421875, -2.7244873046875, -2.472900390625, -2.2213134765625, -1.9697265625, -1.7181396484375, -1.466552734375, -1.2149658203125, -0.96337890625, -0.7117919921875, -0.460205078125, -0.2086181640625, 0.04296875, 0.2945556640625, 0.546142578125, 0.7977294921875, 1.04931640625, 1.3009033203125, 1.552490234375, 1.8040771484375, 2.0556640625, 2.3072509765625, 2.558837890625, 2.8104248046875, 3.06201171875, 3.3135986328125, 3.565185546875, 3.8167724609375, 4.068359375, 4.3199462890625, 4.571533203125, 4.8231201171875, 5.07470703125, 5.3262939453125, 5.577880859375, 5.8294677734375, 6.0810546875, 6.3326416015625, 6.584228515625, 6.8358154296875, 7.08740234375, 7.3389892578125, 7.590576171875, 7.8421630859375, 8.09375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 0.0, 6.0, 5.0, 5.0, 11.0, 27.0, 21.0, 43.0, 41.0, 56.0, 55.0, 111.0, 111.0, 146.0, 180.0, 216.0, 210.0, 231.0, 256.0, 284.0, 248.0, 243.0, 236.0, 221.0, 207.0, 169.0, 160.0, 112.0, 107.0, 87.0, 70.0, 42.0, 46.0, 32.0, 20.0, 16.0, 12.0, 12.0, 7.0, 3.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.78125, -2.678680419921875, -2.57611083984375, -2.473541259765625, -2.3709716796875, -2.268402099609375, -2.16583251953125, -2.063262939453125, -1.960693359375, -1.858123779296875, -1.75555419921875, -1.652984619140625, -1.5504150390625, -1.447845458984375, -1.34527587890625, -1.242706298828125, -1.14013671875, -1.037567138671875, -0.93499755859375, -0.832427978515625, -0.7298583984375, -0.627288818359375, -0.52471923828125, -0.422149658203125, -0.319580078125, -0.217010498046875, -0.11444091796875, -0.011871337890625, 0.0906982421875, 0.193267822265625, 0.29583740234375, 0.398406982421875, 0.5009765625, 0.603546142578125, 0.70611572265625, 0.808685302734375, 0.9112548828125, 1.013824462890625, 1.11639404296875, 1.218963623046875, 1.321533203125, 1.424102783203125, 1.52667236328125, 1.629241943359375, 1.7318115234375, 1.834381103515625, 1.93695068359375, 2.039520263671875, 2.14208984375, 2.244659423828125, 2.34722900390625, 2.449798583984375, 2.5523681640625, 2.654937744140625, 2.75750732421875, 2.860076904296875, 2.962646484375, 3.065216064453125, 3.16778564453125, 3.270355224609375, 3.3729248046875, 3.475494384765625, 3.57806396484375, 3.680633544921875, 3.783203125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 8.0, 16.0, 16.0, 13.0, 16.0, 36.0, 42.0, 42.0, 45.0, 55.0, 65.0, 68.0, 70.0, 77.0, 58.0, 55.0, 49.0, 39.0, 45.0, 31.0, 29.0, 21.0, 21.0, 13.0, 9.0, 15.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.835649490356445, -11.461814880371094, -11.087981224060059, -10.714146614074707, -10.340312957763672, -9.96647834777832, -9.592643737792969, -9.218809127807617, -8.844975471496582, -8.47114086151123, -8.097307205200195, -7.723472595214844, -7.34963846206665, -6.975804328918457, -6.6019697189331055, -6.228135585784912, -5.854301452636719, -5.480467319488525, -5.106633186340332, -4.7327985763549805, -4.358964443206787, -3.9851303100585938, -3.6112959384918213, -3.237461566925049, -2.8636274337768555, -2.489793300628662, -2.1159589290618896, -1.7421246767044067, -1.3682904243469238, -0.9944561719894409, -0.620621919631958, -0.24678754806518555, 0.1270456314086914, 0.5008798837661743, 0.8747141361236572, 1.2485483884811401, 1.622382640838623, 1.996216893196106, 2.370051145553589, 2.7438855171203613, 3.1177196502685547, 3.491553783416748, 3.8653881549835205, 4.239222526550293, 4.613056659698486, 4.98689079284668, 5.360725402832031, 5.734559535980225, 6.108393669128418, 6.482227802276611, 6.856061935424805, 7.229896545410156, 7.60373067855835, 7.977564811706543, 8.351399421691895, 8.72523307800293, 9.099067687988281, 9.472902297973633, 9.846735954284668, 10.22057056427002, 10.594404220581055, 10.968238830566406, 11.342073440551758, 11.71590805053711, 12.089741706848145]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 3.0, 6.0, 9.0, 11.0, 13.0, 17.0, 12.0, 27.0, 27.0, 31.0, 27.0, 29.0, 35.0, 60.0, 43.0, 44.0, 39.0, 47.0, 42.0, 41.0, 44.0, 34.0, 31.0, 39.0, 42.0, 29.0, 30.0, 32.0, 28.0, 23.0, 12.0, 11.0, 20.0, 7.0, 10.0, 10.0, 9.0, 6.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0097503662109375, -6.790735721588135, -6.571721076965332, -6.352705955505371, -6.133691310882568, -5.914676666259766, -5.695662021636963, -5.47664737701416, -5.257632255554199, -5.0386176109313965, -4.819602966308594, -4.600587844848633, -4.38157320022583, -4.162558555603027, -3.9435439109802246, -3.7245290279388428, -3.50551438331604, -3.2864997386932373, -3.0674848556518555, -2.8484702110290527, -2.629455327987671, -2.410440683364868, -2.1914258003234863, -1.9724111557006836, -1.7533963918685913, -1.534381628036499, -1.3153668642044067, -1.0963521003723145, -0.8773373961448669, -0.6583226919174194, -0.43930792808532715, -0.22029316425323486, -0.0012784004211425781, 0.2177363485097885, 0.4367510974407196, 0.6557658314704895, 0.8747805953025818, 1.0937952995300293, 1.3128100633621216, 1.5318248271942139, 1.7508395910263062, 1.9698543548583984, 2.188868999481201, 2.407883882522583, 2.6268985271453857, 2.8459134101867676, 3.0649280548095703, 3.283942699432373, 3.502957582473755, 3.7219722270965576, 3.9409871101379395, 4.160001754760742, 4.379016399383545, 4.598031044006348, 4.817046165466309, 5.036060810089111, 5.255075454711914, 5.474090099334717, 5.6931047439575195, 5.9121198654174805, 6.131134510040283, 6.350149154663086, 6.569163799285889, 6.788178443908691, 7.007193565368652]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 17.0, 16.0, 29.0, 37.0, 38.0, 64.0, 95.0, 137.0, 167.0, 246.0, 293.0, 431.0, 599.0, 906.0, 1347.0, 2064.0, 3314.0, 5624.0, 11025.0, 25813.0, 76136.0, 246429.0, 400795.0, 176884.0, 53958.0, 19628.0, 8957.0, 4745.0, 2841.0, 1803.0, 1175.0, 849.0, 565.0, 443.0, 287.0, 213.0, 164.0, 118.0, 81.0, 55.0, 43.0, 37.0, 24.0, 14.0, 13.0, 3.0, 7.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-4.67578125, -4.53125, -4.38671875, -4.2421875, -4.09765625, -3.953125, -3.80859375, -3.6640625, -3.51953125, -3.375, -3.23046875, -3.0859375, -2.94140625, -2.796875, -2.65234375, -2.5078125, -2.36328125, -2.21875, -2.07421875, -1.9296875, -1.78515625, -1.640625, -1.49609375, -1.3515625, -1.20703125, -1.0625, -0.91796875, -0.7734375, -0.62890625, -0.484375, -0.33984375, -0.1953125, -0.05078125, 0.09375, 0.23828125, 0.3828125, 0.52734375, 0.671875, 0.81640625, 0.9609375, 1.10546875, 1.25, 1.39453125, 1.5390625, 1.68359375, 1.828125, 1.97265625, 2.1171875, 2.26171875, 2.40625, 2.55078125, 2.6953125, 2.83984375, 2.984375, 3.12890625, 3.2734375, 3.41796875, 3.5625, 3.70703125, 3.8515625, 3.99609375, 4.140625, 4.28515625, 4.4296875, 4.57421875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 6.0, 8.0, 12.0, 15.0, 26.0, 19.0, 26.0, 17.0, 27.0, 29.0, 49.0, 34.0, 50.0, 43.0, 48.0, 32.0, 36.0, 41.0, 34.0, 41.0, 29.0, 29.0, 33.0, 33.0, 29.0, 30.0, 39.0, 17.0, 24.0, 17.0, 15.0, 16.0, 12.0, 14.0, 5.0, 7.0, 4.0, 12.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.8359375, -6.61749267578125, -6.3990478515625, -6.18060302734375, -5.962158203125, -5.74371337890625, -5.5252685546875, -5.30682373046875, -5.08837890625, -4.86993408203125, -4.6514892578125, -4.43304443359375, -4.214599609375, -3.99615478515625, -3.7777099609375, -3.55926513671875, -3.3408203125, -3.12237548828125, -2.9039306640625, -2.68548583984375, -2.467041015625, -2.24859619140625, -2.0301513671875, -1.81170654296875, -1.59326171875, -1.37481689453125, -1.1563720703125, -0.93792724609375, -0.719482421875, -0.50103759765625, -0.2825927734375, -0.06414794921875, 0.154296875, 0.37274169921875, 0.5911865234375, 0.80963134765625, 1.028076171875, 1.24652099609375, 1.4649658203125, 1.68341064453125, 1.90185546875, 2.12030029296875, 2.3387451171875, 2.55718994140625, 2.775634765625, 2.99407958984375, 3.2125244140625, 3.43096923828125, 3.6494140625, 3.86785888671875, 4.0863037109375, 4.30474853515625, 4.523193359375, 4.74163818359375, 4.9600830078125, 5.17852783203125, 5.39697265625, 5.61541748046875, 5.8338623046875, 6.05230712890625, 6.270751953125, 6.48919677734375, 6.7076416015625, 6.92608642578125, 7.14453125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 10.0, 14.0, 15.0, 26.0, 45.0, 67.0, 105.0, 185.0, 249.0, 451.0, 868.0, 1700.0, 3803.0, 10554.0, 39748.0, 211217.0, 552938.0, 176054.0, 34085.0, 9401.0, 3526.0, 1544.0, 811.0, 427.0, 249.0, 158.0, 104.0, 49.0, 46.0, 26.0, 22.0, 15.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.44921875, -7.22650146484375, -7.0037841796875, -6.78106689453125, -6.558349609375, -6.33563232421875, -6.1129150390625, -5.89019775390625, -5.66748046875, -5.44476318359375, -5.2220458984375, -4.99932861328125, -4.776611328125, -4.55389404296875, -4.3311767578125, -4.10845947265625, -3.8857421875, -3.66302490234375, -3.4403076171875, -3.21759033203125, -2.994873046875, -2.77215576171875, -2.5494384765625, -2.32672119140625, -2.10400390625, -1.88128662109375, -1.6585693359375, -1.43585205078125, -1.213134765625, -0.99041748046875, -0.7677001953125, -0.54498291015625, -0.322265625, -0.09954833984375, 0.1231689453125, 0.34588623046875, 0.568603515625, 0.79132080078125, 1.0140380859375, 1.23675537109375, 1.45947265625, 1.68218994140625, 1.9049072265625, 2.12762451171875, 2.350341796875, 2.57305908203125, 2.7957763671875, 3.01849365234375, 3.2412109375, 3.46392822265625, 3.6866455078125, 3.90936279296875, 4.132080078125, 4.35479736328125, 4.5775146484375, 4.80023193359375, 5.02294921875, 5.24566650390625, 5.4683837890625, 5.69110107421875, 5.913818359375, 6.13653564453125, 6.3592529296875, 6.58197021484375, 6.8046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 6.0, 3.0, 6.0, 8.0, 5.0, 7.0, 16.0, 18.0, 17.0, 18.0, 14.0, 23.0, 17.0, 25.0, 22.0, 26.0, 19.0, 34.0, 30.0, 27.0, 47.0, 42.0, 35.0, 40.0, 40.0, 28.0, 41.0, 43.0, 29.0, 43.0, 31.0, 21.0, 23.0, 42.0, 23.0, 16.0, 17.0, 14.0, 18.0, 11.0, 11.0, 6.0, 9.0, 5.0, 4.0, 6.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.958984375, -3.831817626953125, -3.70465087890625, -3.577484130859375, -3.4503173828125, -3.323150634765625, -3.19598388671875, -3.068817138671875, -2.941650390625, -2.814483642578125, -2.68731689453125, -2.560150146484375, -2.4329833984375, -2.305816650390625, -2.17864990234375, -2.051483154296875, -1.92431640625, -1.797149658203125, -1.66998291015625, -1.542816162109375, -1.4156494140625, -1.288482666015625, -1.16131591796875, -1.034149169921875, -0.906982421875, -0.779815673828125, -0.65264892578125, -0.525482177734375, -0.3983154296875, -0.271148681640625, -0.14398193359375, -0.016815185546875, 0.1103515625, 0.237518310546875, 0.36468505859375, 0.491851806640625, 0.6190185546875, 0.746185302734375, 0.87335205078125, 1.000518798828125, 1.127685546875, 1.254852294921875, 1.38201904296875, 1.509185791015625, 1.6363525390625, 1.763519287109375, 1.89068603515625, 2.017852783203125, 2.14501953125, 2.272186279296875, 2.39935302734375, 2.526519775390625, 2.6536865234375, 2.780853271484375, 2.90802001953125, 3.035186767578125, 3.162353515625, 3.289520263671875, 3.41668701171875, 3.543853759765625, 3.6710205078125, 3.798187255859375, 3.92535400390625, 4.052520751953125, 4.1796875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 11.0, 26.0, 31.0, 59.0, 69.0, 108.0, 170.0, 278.0, 461.0, 739.0, 1345.0, 2510.0, 5298.0, 13097.0, 45856.0, 370790.0, 517462.0, 61793.0, 15944.0, 6057.0, 2772.0, 1428.0, 855.0, 479.0, 304.0, 213.0, 110.0, 94.0, 55.0, 38.0, 20.0, 12.0, 9.0, 8.0, 9.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.603515625, -2.53515625, -2.466796875, -2.3984375, -2.330078125, -2.26171875, -2.193359375, -2.125, -2.056640625, -1.98828125, -1.919921875, -1.8515625, -1.783203125, -1.71484375, -1.646484375, -1.578125, -1.509765625, -1.44140625, -1.373046875, -1.3046875, -1.236328125, -1.16796875, -1.099609375, -1.03125, -0.962890625, -0.89453125, -0.826171875, -0.7578125, -0.689453125, -0.62109375, -0.552734375, -0.484375, -0.416015625, -0.34765625, -0.279296875, -0.2109375, -0.142578125, -0.07421875, -0.005859375, 0.0625, 0.130859375, 0.19921875, 0.267578125, 0.3359375, 0.404296875, 0.47265625, 0.541015625, 0.609375, 0.677734375, 0.74609375, 0.814453125, 0.8828125, 0.951171875, 1.01953125, 1.087890625, 1.15625, 1.224609375, 1.29296875, 1.361328125, 1.4296875, 1.498046875, 1.56640625, 1.634765625, 1.703125, 1.771484375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 8.0, 6.0, 9.0, 9.0, 8.0, 22.0, 32.0, 137.0, 300.0, 242.0, 105.0, 33.0, 12.0, 8.0, 3.0, 7.0, 10.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00021541118621826172, -0.00020972080528736115, -0.00020403042435646057, -0.00019834004342556, -0.00019264966249465942, -0.00018695928156375885, -0.00018126890063285828, -0.0001755785197019577, -0.00016988813877105713, -0.00016419775784015656, -0.00015850737690925598, -0.0001528169959783554, -0.00014712661504745483, -0.00014143623411655426, -0.0001357458531856537, -0.0001300554722547531, -0.00012436509132385254, -0.00011867471039295197, -0.00011298432946205139, -0.00010729394853115082, -0.00010160356760025024, -9.591318666934967e-05, -9.02228057384491e-05, -8.453242480754852e-05, -7.884204387664795e-05, -7.315166294574738e-05, -6.74612820148468e-05, -6.177090108394623e-05, -5.6080520153045654e-05, -5.039013922214508e-05, -4.469975829124451e-05, -3.900937736034393e-05, -3.331899642944336e-05, -2.7628615498542786e-05, -2.1938234567642212e-05, -1.6247853636741638e-05, -1.0557472705841064e-05, -4.867091774940491e-06, 8.23289155960083e-07, 6.513670086860657e-06, 1.220405101776123e-05, 1.7894431948661804e-05, 2.3584812879562378e-05, 2.927519381046295e-05, 3.4965574741363525e-05, 4.06559556722641e-05, 4.634633660316467e-05, 5.2036717534065247e-05, 5.772709846496582e-05, 6.34174793958664e-05, 6.910786032676697e-05, 7.479824125766754e-05, 8.048862218856812e-05, 8.617900311946869e-05, 9.186938405036926e-05, 9.755976498126984e-05, 0.00010325014591217041, 0.00010894052684307098, 0.00011463090777397156, 0.00012032128870487213, 0.0001260116696357727, 0.00013170205056667328, 0.00013739243149757385, 0.00014308281242847443, 0.000148773193359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 12.0, 21.0, 28.0, 31.0, 42.0, 62.0, 91.0, 127.0, 210.0, 251.0, 394.0, 562.0, 790.0, 1268.0, 1764.0, 2843.0, 4475.0, 7503.0, 13968.0, 31169.0, 107327.0, 454537.0, 302721.0, 66860.0, 22797.0, 11008.0, 6401.0, 3760.0, 2467.0, 1569.0, 1123.0, 746.0, 453.0, 342.0, 253.0, 160.0, 118.0, 75.0, 67.0, 49.0, 30.0, 21.0, 13.0, 10.0, 10.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.66015625, -1.608001708984375, -1.55584716796875, -1.503692626953125, -1.4515380859375, -1.399383544921875, -1.34722900390625, -1.295074462890625, -1.242919921875, -1.190765380859375, -1.13861083984375, -1.086456298828125, -1.0343017578125, -0.982147216796875, -0.92999267578125, -0.877838134765625, -0.82568359375, -0.773529052734375, -0.72137451171875, -0.669219970703125, -0.6170654296875, -0.564910888671875, -0.51275634765625, -0.460601806640625, -0.408447265625, -0.356292724609375, -0.30413818359375, -0.251983642578125, -0.1998291015625, -0.147674560546875, -0.09552001953125, -0.043365478515625, 0.0087890625, 0.060943603515625, 0.11309814453125, 0.165252685546875, 0.2174072265625, 0.269561767578125, 0.32171630859375, 0.373870849609375, 0.426025390625, 0.478179931640625, 0.53033447265625, 0.582489013671875, 0.6346435546875, 0.686798095703125, 0.73895263671875, 0.791107177734375, 0.84326171875, 0.895416259765625, 0.94757080078125, 0.999725341796875, 1.0518798828125, 1.104034423828125, 1.15618896484375, 1.208343505859375, 1.260498046875, 1.312652587890625, 1.36480712890625, 1.416961669921875, 1.4691162109375, 1.521270751953125, 1.57342529296875, 1.625579833984375, 1.677734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 11.0, 15.0, 8.0, 19.0, 30.0, 28.0, 72.0, 88.0, 126.0, 122.0, 125.0, 86.0, 62.0, 44.0, 34.0, 30.0, 17.0, 5.0, 9.0, 8.0, 9.0, 7.0, 5.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.263671875, -0.2547874450683594, -0.24590301513671875, -0.23701858520507812, -0.2281341552734375, -0.21924972534179688, -0.21036529541015625, -0.20148086547851562, -0.192596435546875, -0.18371200561523438, -0.17482757568359375, -0.16594314575195312, -0.1570587158203125, -0.14817428588867188, -0.13928985595703125, -0.13040542602539062, -0.12152099609375, -0.11263656616210938, -0.10375213623046875, -0.09486770629882812, -0.0859832763671875, -0.07709884643554688, -0.06821441650390625, -0.059329986572265625, -0.050445556640625, -0.041561126708984375, -0.03267669677734375, -0.023792266845703125, -0.0149078369140625, -0.006023406982421875, 0.00286102294921875, 0.011745452880859375, 0.0206298828125, 0.029514312744140625, 0.03839874267578125, 0.047283172607421875, 0.0561676025390625, 0.06505203247070312, 0.07393646240234375, 0.08282089233398438, 0.091705322265625, 0.10058975219726562, 0.10947418212890625, 0.11835861206054688, 0.1272430419921875, 0.13612747192382812, 0.14501190185546875, 0.15389633178710938, 0.16278076171875, 0.17166519165039062, 0.18054962158203125, 0.18943405151367188, 0.1983184814453125, 0.20720291137695312, 0.21608734130859375, 0.22497177124023438, 0.233856201171875, 0.24274063110351562, 0.25162506103515625, 0.2605094909667969, 0.2693939208984375, 0.2782783508300781, 0.28716278076171875, 0.2960472106933594, 0.304931640625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 6.0, 4.0, 3.0, 8.0, 10.0, 24.0, 16.0, 15.0, 21.0, 37.0, 40.0, 35.0, 54.0, 51.0, 79.0, 61.0, 78.0, 65.0, 61.0, 54.0, 48.0, 43.0, 38.0, 39.0, 20.0, 27.0, 10.0, 13.0, 12.0, 7.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.176722526550293, -11.800043106079102, -11.423364639282227, -11.046685218811035, -10.67000675201416, -10.293327331542969, -9.916648864746094, -9.539969444274902, -9.163290977478027, -8.786611557006836, -8.409933090209961, -8.03325366973877, -7.6565752029418945, -7.279896259307861, -6.903217315673828, -6.526537895202637, -6.1498589515686035, -5.77318000793457, -5.396501064300537, -5.019822120666504, -4.643143177032471, -4.2664642333984375, -3.889785051345825, -3.513106107711792, -3.136427164077759, -2.7597482204437256, -2.3830692768096924, -2.00639009475708, -1.6297112703323364, -1.2530323266983032, -0.8763532638549805, -0.49967432022094727, -0.12299537658691406, 0.25368359684944153, 0.6303625702857971, 1.007041573524475, 1.3837205171585083, 1.7603994607925415, 2.1370785236358643, 2.5137574672698975, 2.8904364109039307, 3.267115354537964, 3.643794298171997, 4.020473480224609, 4.397152423858643, 4.773831367492676, 5.150510311126709, 5.527189254760742, 5.903868198394775, 6.280547142028809, 6.657226085662842, 7.033905029296875, 7.410583972930908, 7.787262916564941, 8.163942337036133, 8.540620803833008, 8.9173002243042, 9.29397964477539, 9.670658111572266, 10.047337532043457, 10.424015998840332, 10.800695419311523, 11.177373886108398, 11.55405330657959, 11.930731773376465]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 10.0, 11.0, 19.0, 12.0, 24.0, 29.0, 30.0, 27.0, 34.0, 33.0, 56.0, 44.0, 46.0, 41.0, 41.0, 46.0, 43.0, 44.0, 31.0, 30.0, 43.0, 39.0, 32.0, 33.0, 25.0, 35.0, 19.0, 13.0, 15.0, 15.0, 8.0, 10.0, 10.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.024806976318359, -6.805076599121094, -6.58534574508667, -6.365615367889404, -6.145884990692139, -5.926154136657715, -5.706423759460449, -5.486693382263184, -5.266963005065918, -5.047232627868652, -4.8275017738342285, -4.607771396636963, -4.388041019439697, -4.168310165405273, -3.948579788208008, -3.728849411010742, -3.5091185569763184, -3.2893879413604736, -3.069657564163208, -2.8499269485473633, -2.6301965713500977, -2.410465955734253, -2.190735340118408, -1.971004843711853, -1.7512743473052979, -1.5315438508987427, -1.3118133544921875, -1.0920827388763428, -0.8723522424697876, -0.6526217460632324, -0.4328911304473877, -0.21316063404083252, 0.006569862365722656, 0.22630038857460022, 0.4460309147834778, 0.6657614707946777, 0.8854919672012329, 1.105222463607788, 1.3249530792236328, 1.544683575630188, 1.7644140720367432, 1.9841445684432983, 2.2038750648498535, 2.4236056804656982, 2.643336296081543, 2.8630666732788086, 3.0827972888946533, 3.302527904510498, 3.5222582817077637, 3.7419888973236084, 3.961719274520874, 4.181449890136719, 4.401180267333984, 4.62091064453125, 4.840641498565674, 5.0603718757629395, 5.280102729797363, 5.499833106994629, 5.719563961029053, 5.939294338226318, 6.159024715423584, 6.378755569458008, 6.598485946655273, 6.818216323852539, 7.037946701049805]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 15.0, 29.0, 37.0, 60.0, 77.0, 125.0, 228.0, 325.0, 541.0, 899.0, 1496.0, 2709.0, 4668.0, 7991.0, 14544.0, 25276.0, 42037.0, 67245.0, 100479.0, 132853.0, 152003.0, 147341.0, 120951.0, 87551.0, 57153.0, 34669.0, 19951.0, 11538.0, 6530.0, 3846.0, 2140.0, 1240.0, 787.0, 467.0, 268.0, 159.0, 116.0, 74.0, 48.0, 24.0, 22.0, 10.0, 8.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.02703857421875, -5.8314208984375, -5.63580322265625, -5.440185546875, -5.24456787109375, -5.0489501953125, -4.85333251953125, -4.65771484375, -4.46209716796875, -4.2664794921875, -4.07086181640625, -3.875244140625, -3.67962646484375, -3.4840087890625, -3.28839111328125, -3.0927734375, -2.89715576171875, -2.7015380859375, -2.50592041015625, -2.310302734375, -2.11468505859375, -1.9190673828125, -1.72344970703125, -1.52783203125, -1.33221435546875, -1.1365966796875, -0.94097900390625, -0.745361328125, -0.54974365234375, -0.3541259765625, -0.15850830078125, 0.037109375, 0.23272705078125, 0.4283447265625, 0.62396240234375, 0.819580078125, 1.01519775390625, 1.2108154296875, 1.40643310546875, 1.60205078125, 1.79766845703125, 1.9932861328125, 2.18890380859375, 2.384521484375, 2.58013916015625, 2.7757568359375, 2.97137451171875, 3.1669921875, 3.36260986328125, 3.5582275390625, 3.75384521484375, 3.949462890625, 4.14508056640625, 4.3406982421875, 4.53631591796875, 4.73193359375, 4.92755126953125, 5.1231689453125, 5.31878662109375, 5.514404296875, 5.71002197265625, 5.9056396484375, 6.10125732421875, 6.296875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 7.0, 10.0, 19.0, 15.0, 26.0, 27.0, 34.0, 29.0, 39.0, 32.0, 41.0, 56.0, 34.0, 43.0, 47.0, 47.0, 32.0, 54.0, 40.0, 37.0, 49.0, 33.0, 37.0, 30.0, 18.0, 18.0, 26.0, 15.0, 16.0, 14.0, 10.0, 10.0, 14.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-8.59375, -8.35284423828125, -8.1119384765625, -7.87103271484375, -7.630126953125, -7.38922119140625, -7.1483154296875, -6.90740966796875, -6.66650390625, -6.42559814453125, -6.1846923828125, -5.94378662109375, -5.702880859375, -5.46197509765625, -5.2210693359375, -4.98016357421875, -4.7392578125, -4.49835205078125, -4.2574462890625, -4.01654052734375, -3.775634765625, -3.53472900390625, -3.2938232421875, -3.05291748046875, -2.81201171875, -2.57110595703125, -2.3302001953125, -2.08929443359375, -1.848388671875, -1.60748291015625, -1.3665771484375, -1.12567138671875, -0.884765625, -0.64385986328125, -0.4029541015625, -0.16204833984375, 0.078857421875, 0.31976318359375, 0.5606689453125, 0.80157470703125, 1.04248046875, 1.28338623046875, 1.5242919921875, 1.76519775390625, 2.006103515625, 2.24700927734375, 2.4879150390625, 2.72882080078125, 2.9697265625, 3.21063232421875, 3.4515380859375, 3.69244384765625, 3.933349609375, 4.17425537109375, 4.4151611328125, 4.65606689453125, 4.89697265625, 5.13787841796875, 5.3787841796875, 5.61968994140625, 5.860595703125, 6.10150146484375, 6.3424072265625, 6.58331298828125, 6.82421875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 8.0, 7.0, 14.0, 14.0, 13.0, 40.0, 48.0, 67.0, 86.0, 173.0, 230.0, 410.0, 670.0, 1143.0, 1822.0, 3152.0, 5813.0, 10214.0, 18216.0, 31394.0, 53501.0, 84460.0, 121407.0, 150950.0, 158874.0, 138139.0, 102823.0, 67504.0, 41410.0, 24310.0, 13534.0, 7592.0, 4455.0, 2450.0, 1399.0, 829.0, 498.0, 333.0, 190.0, 104.0, 82.0, 48.0, 45.0, 23.0, 16.0, 14.0, 11.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-6.77734375, -6.56719970703125, -6.3570556640625, -6.14691162109375, -5.936767578125, -5.72662353515625, -5.5164794921875, -5.30633544921875, -5.09619140625, -4.88604736328125, -4.6759033203125, -4.46575927734375, -4.255615234375, -4.04547119140625, -3.8353271484375, -3.62518310546875, -3.4150390625, -3.20489501953125, -2.9947509765625, -2.78460693359375, -2.574462890625, -2.36431884765625, -2.1541748046875, -1.94403076171875, -1.73388671875, -1.52374267578125, -1.3135986328125, -1.10345458984375, -0.893310546875, -0.68316650390625, -0.4730224609375, -0.26287841796875, -0.052734375, 0.15740966796875, 0.3675537109375, 0.57769775390625, 0.787841796875, 0.99798583984375, 1.2081298828125, 1.41827392578125, 1.62841796875, 1.83856201171875, 2.0487060546875, 2.25885009765625, 2.468994140625, 2.67913818359375, 2.8892822265625, 3.09942626953125, 3.3095703125, 3.51971435546875, 3.7298583984375, 3.94000244140625, 4.150146484375, 4.36029052734375, 4.5704345703125, 4.78057861328125, 4.99072265625, 5.20086669921875, 5.4110107421875, 5.62115478515625, 5.831298828125, 6.04144287109375, 6.2515869140625, 6.46173095703125, 6.671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 2.0, 6.0, 13.0, 6.0, 11.0, 10.0, 7.0, 9.0, 25.0, 15.0, 23.0, 29.0, 34.0, 14.0, 24.0, 28.0, 34.0, 35.0, 35.0, 32.0, 39.0, 51.0, 34.0, 37.0, 41.0, 29.0, 31.0, 37.0, 34.0, 32.0, 28.0, 24.0, 27.0, 16.0, 24.0, 17.0, 14.0, 17.0, 20.0, 9.0, 9.0, 6.0, 5.0, 8.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.79296875, -3.67340087890625, -3.5538330078125, -3.43426513671875, -3.314697265625, -3.19512939453125, -3.0755615234375, -2.95599365234375, -2.83642578125, -2.71685791015625, -2.5972900390625, -2.47772216796875, -2.358154296875, -2.23858642578125, -2.1190185546875, -1.99945068359375, -1.8798828125, -1.76031494140625, -1.6407470703125, -1.52117919921875, -1.401611328125, -1.28204345703125, -1.1624755859375, -1.04290771484375, -0.92333984375, -0.80377197265625, -0.6842041015625, -0.56463623046875, -0.445068359375, -0.32550048828125, -0.2059326171875, -0.08636474609375, 0.033203125, 0.15277099609375, 0.2723388671875, 0.39190673828125, 0.511474609375, 0.63104248046875, 0.7506103515625, 0.87017822265625, 0.98974609375, 1.10931396484375, 1.2288818359375, 1.34844970703125, 1.468017578125, 1.58758544921875, 1.7071533203125, 1.82672119140625, 1.9462890625, 2.06585693359375, 2.1854248046875, 2.30499267578125, 2.424560546875, 2.54412841796875, 2.6636962890625, 2.78326416015625, 2.90283203125, 3.02239990234375, 3.1419677734375, 3.26153564453125, 3.381103515625, 3.50067138671875, 3.6202392578125, 3.73980712890625, 3.859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 2.0, 7.0, 10.0, 11.0, 18.0, 26.0, 28.0, 36.0, 66.0, 94.0, 122.0, 182.0, 262.0, 396.0, 572.0, 1003.0, 1527.0, 2429.0, 4094.0, 7461.0, 13549.0, 25819.0, 51805.0, 102275.0, 180364.0, 234370.0, 191341.0, 111261.0, 56870.0, 28294.0, 14768.0, 7816.0, 4451.0, 2651.0, 1571.0, 1034.0, 654.0, 401.0, 281.0, 216.0, 140.0, 89.0, 65.0, 33.0, 28.0, 21.0, 9.0, 12.0, 8.0, 8.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.03515625, -4.85888671875, -4.6826171875, -4.50634765625, -4.330078125, -4.15380859375, -3.9775390625, -3.80126953125, -3.625, -3.44873046875, -3.2724609375, -3.09619140625, -2.919921875, -2.74365234375, -2.5673828125, -2.39111328125, -2.21484375, -2.03857421875, -1.8623046875, -1.68603515625, -1.509765625, -1.33349609375, -1.1572265625, -0.98095703125, -0.8046875, -0.62841796875, -0.4521484375, -0.27587890625, -0.099609375, 0.07666015625, 0.2529296875, 0.42919921875, 0.60546875, 0.78173828125, 0.9580078125, 1.13427734375, 1.310546875, 1.48681640625, 1.6630859375, 1.83935546875, 2.015625, 2.19189453125, 2.3681640625, 2.54443359375, 2.720703125, 2.89697265625, 3.0732421875, 3.24951171875, 3.42578125, 3.60205078125, 3.7783203125, 3.95458984375, 4.130859375, 4.30712890625, 4.4833984375, 4.65966796875, 4.8359375, 5.01220703125, 5.1884765625, 5.36474609375, 5.541015625, 5.71728515625, 5.8935546875, 6.06982421875, 6.24609375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 14.0, 18.0, 15.0, 29.0, 35.0, 38.0, 33.0, 56.0, 62.0, 68.0, 50.0, 59.0, 60.0, 71.0, 47.0, 42.0, 42.0, 42.0, 38.0, 37.0, 25.0, 20.0, 19.0, 8.0, 7.0, 4.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.000362396240234375, -0.00035066157579421997, -0.00033892691135406494, -0.0003271922469139099, -0.0003154575824737549, -0.00030372291803359985, -0.0002919882535934448, -0.0002802535891532898, -0.00026851892471313477, -0.00025678426027297974, -0.0002450495958328247, -0.00023331493139266968, -0.00022158026695251465, -0.00020984560251235962, -0.0001981109380722046, -0.00018637627363204956, -0.00017464160919189453, -0.0001629069447517395, -0.00015117228031158447, -0.00013943761587142944, -0.00012770295143127441, -0.00011596828699111938, -0.00010423362255096436, -9.249895811080933e-05, -8.07642936706543e-05, -6.902962923049927e-05, -5.729496479034424e-05, -4.556030035018921e-05, -3.382563591003418e-05, -2.209097146987915e-05, -1.0356307029724121e-05, 1.3783574104309082e-06, 1.3113021850585938e-05, 2.4847686290740967e-05, 3.6582350730895996e-05, 4.8317015171051025e-05, 6.0051679611206055e-05, 7.178634405136108e-05, 8.352100849151611e-05, 9.525567293167114e-05, 0.00010699033737182617, 0.0001187250018119812, 0.00013045966625213623, 0.00014219433069229126, 0.0001539289951324463, 0.00016566365957260132, 0.00017739832401275635, 0.00018913298845291138, 0.0002008676528930664, 0.00021260231733322144, 0.00022433698177337646, 0.0002360716462135315, 0.0002478063106536865, 0.00025954097509384155, 0.0002712756395339966, 0.0002830103039741516, 0.00029474496841430664, 0.00030647963285446167, 0.0003182142972946167, 0.00032994896173477173, 0.00034168362617492676, 0.0003534182906150818, 0.0003651529550552368, 0.00037688761949539185, 0.0003886222839355469]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 8.0, 2.0, 1.0, 8.0, 12.0, 29.0, 12.0, 28.0, 37.0, 42.0, 70.0, 121.0, 133.0, 250.0, 306.0, 497.0, 809.0, 1235.0, 2119.0, 3574.0, 5899.0, 10660.0, 19134.0, 35606.0, 64832.0, 113719.0, 172506.0, 201679.0, 168330.0, 108356.0, 61723.0, 33806.0, 18208.0, 10272.0, 5736.0, 3217.0, 2017.0, 1231.0, 781.0, 525.0, 329.0, 238.0, 142.0, 96.0, 75.0, 45.0, 38.0, 22.0, 21.0, 14.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.27734375, -4.13214111328125, -3.9869384765625, -3.84173583984375, -3.696533203125, -3.55133056640625, -3.4061279296875, -3.26092529296875, -3.11572265625, -2.97052001953125, -2.8253173828125, -2.68011474609375, -2.534912109375, -2.38970947265625, -2.2445068359375, -2.09930419921875, -1.9541015625, -1.80889892578125, -1.6636962890625, -1.51849365234375, -1.373291015625, -1.22808837890625, -1.0828857421875, -0.93768310546875, -0.79248046875, -0.64727783203125, -0.5020751953125, -0.35687255859375, -0.211669921875, -0.06646728515625, 0.0787353515625, 0.22393798828125, 0.369140625, 0.51434326171875, 0.6595458984375, 0.80474853515625, 0.949951171875, 1.09515380859375, 1.2403564453125, 1.38555908203125, 1.53076171875, 1.67596435546875, 1.8211669921875, 1.96636962890625, 2.111572265625, 2.25677490234375, 2.4019775390625, 2.54718017578125, 2.6923828125, 2.83758544921875, 2.9827880859375, 3.12799072265625, 3.273193359375, 3.41839599609375, 3.5635986328125, 3.70880126953125, 3.85400390625, 3.99920654296875, 4.1444091796875, 4.28961181640625, 4.434814453125, 4.58001708984375, 4.7252197265625, 4.87042236328125, 5.015625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 9.0, 5.0, 7.0, 7.0, 8.0, 14.0, 15.0, 24.0, 21.0, 23.0, 33.0, 30.0, 40.0, 30.0, 68.0, 45.0, 62.0, 60.0, 52.0, 52.0, 50.0, 45.0, 37.0, 41.0, 37.0, 37.0, 26.0, 25.0, 14.0, 16.0, 14.0, 12.0, 8.0, 7.0, 9.0, 6.0, 2.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95849609375, -0.9236221313476562, -0.8887481689453125, -0.8538742065429688, -0.819000244140625, -0.7841262817382812, -0.7492523193359375, -0.7143783569335938, -0.67950439453125, -0.6446304321289062, -0.6097564697265625, -0.5748825073242188, -0.540008544921875, -0.5051345825195312, -0.4702606201171875, -0.43538665771484375, -0.4005126953125, -0.36563873291015625, -0.3307647705078125, -0.29589080810546875, -0.261016845703125, -0.22614288330078125, -0.1912689208984375, -0.15639495849609375, -0.12152099609375, -0.08664703369140625, -0.0517730712890625, -0.01689910888671875, 0.017974853515625, 0.05284881591796875, 0.0877227783203125, 0.12259674072265625, 0.157470703125, 0.19234466552734375, 0.2272186279296875, 0.26209259033203125, 0.296966552734375, 0.33184051513671875, 0.3667144775390625, 0.40158843994140625, 0.43646240234375, 0.47133636474609375, 0.5062103271484375, 0.5410842895507812, 0.575958251953125, 0.6108322143554688, 0.6457061767578125, 0.6805801391601562, 0.7154541015625, 0.7503280639648438, 0.7852020263671875, 0.8200759887695312, 0.854949951171875, 0.8898239135742188, 0.9246978759765625, 0.9595718383789062, 0.99444580078125, 1.0293197631835938, 1.0641937255859375, 1.0990676879882812, 1.133941650390625, 1.1688156127929688, 1.2036895751953125, 1.2385635375976562, 1.2734375]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 7.0, 5.0, 6.0, 6.0, 13.0, 12.0, 15.0, 19.0, 19.0, 27.0, 37.0, 37.0, 50.0, 61.0, 52.0, 77.0, 69.0, 70.0, 70.0, 69.0, 50.0, 54.0, 42.0, 25.0, 33.0, 21.0, 15.0, 12.0, 7.0, 8.0, 5.0, 11.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.064947128295898, -11.671323776245117, -11.27769947052002, -10.884076118469238, -10.490452766418457, -10.09682846069336, -9.703205108642578, -9.309581756591797, -8.9159574508667, -8.522334098815918, -8.12870979309082, -7.735086441040039, -7.3414626121521, -6.94783878326416, -6.554215431213379, -6.1605916023254395, -5.766968250274658, -5.373344421386719, -4.9797210693359375, -4.586097240447998, -4.192473411560059, -3.7988498210906982, -3.405226230621338, -3.0116024017333984, -2.617978811264038, -2.2243552207946777, -1.8307313919067383, -1.437107801437378, -1.043484091758728, -0.6498603820800781, -0.2562367916107178, 0.13738703727722168, 0.531010627746582, 0.9246343374252319, 1.3182580471038818, 1.7118816375732422, 2.1055054664611816, 2.499129056930542, 2.8927526473999023, 3.286376476287842, 3.680000066757202, 4.0736236572265625, 4.467247486114502, 4.860871315002441, 5.254494667053223, 5.648118495941162, 6.041742324829102, 6.435365676879883, 6.828989505767822, 7.222613334655762, 7.616236686706543, 8.00986099243164, 8.403484344482422, 8.797107696533203, 9.190731048583984, 9.584355354309082, 9.977978706359863, 10.371602058410645, 10.765226364135742, 11.158849716186523, 11.552473068237305, 11.946097373962402, 12.339720726013184, 12.733345031738281, 13.126968383789062]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 5.0, 6.0, 9.0, 13.0, 16.0, 20.0, 21.0, 22.0, 29.0, 33.0, 24.0, 33.0, 43.0, 43.0, 48.0, 47.0, 42.0, 43.0, 49.0, 48.0, 43.0, 47.0, 31.0, 36.0, 29.0, 42.0, 23.0, 28.0, 22.0, 13.0, 11.0, 12.0, 16.0, 11.0, 5.0, 6.0, 3.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.656757831573486, -7.42542839050293, -7.194098949432373, -6.962769508361816, -6.73144006729126, -6.500110626220703, -6.268781661987305, -6.03745174407959, -5.806122779846191, -5.574793338775635, -5.343463897705078, -5.1121344566345215, -4.880805015563965, -4.649475574493408, -4.418146133422852, -4.186817169189453, -3.9554872512817383, -3.7241578102111816, -3.492828369140625, -3.2614989280700684, -3.0301694869995117, -2.798840045928955, -2.5675108432769775, -2.336181402206421, -2.1048519611358643, -1.8735225200653076, -1.642193078994751, -1.4108637571334839, -1.1795343160629272, -0.9482048749923706, -0.7168755531311035, -0.4855461120605469, -0.25421619415283203, -0.02288678288459778, 0.20844262838363647, 0.43977200984954834, 0.671101450920105, 0.9024308919906616, 1.1337602138519287, 1.3650896549224854, 1.596419095993042, 1.8277485370635986, 2.0590779781341553, 2.290407180786133, 2.5217366218566895, 2.753066062927246, 2.9843955039978027, 3.2157249450683594, 3.447054386138916, 3.6783838272094727, 3.9097132682800293, 4.141042709350586, 4.372372150421143, 4.603701591491699, 4.835030555725098, 5.0663604736328125, 5.297689437866211, 5.529018878936768, 5.760348320007324, 5.991677761077881, 6.2230072021484375, 6.454336643218994, 6.685666084289551, 6.916995048522949, 7.148324966430664]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 24.0, 41.0, 44.0, 71.0, 97.0, 153.0, 229.0, 338.0, 500.0, 855.0, 1280.0, 1994.0, 3266.0, 5514.0, 9107.0, 15553.0, 26266.0, 46019.0, 82161.0, 142890.0, 248610.0, 410685.0, 606109.0, 729395.0, 668253.0, 481001.0, 301952.0, 175677.0, 100724.0, 56849.0, 32483.0, 18752.0, 10824.0, 6415.0, 3832.0, 2310.0, 1452.0, 944.0, 554.0, 360.0, 234.0, 169.0, 109.0, 73.0, 40.0, 28.0, 12.0, 7.0, 8.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.512939453125, -7.26806640625, -7.023193359375, -6.7783203125, -6.533447265625, -6.28857421875, -6.043701171875, -5.798828125, -5.553955078125, -5.30908203125, -5.064208984375, -4.8193359375, -4.574462890625, -4.32958984375, -4.084716796875, -3.83984375, -3.594970703125, -3.35009765625, -3.105224609375, -2.8603515625, -2.615478515625, -2.37060546875, -2.125732421875, -1.880859375, -1.635986328125, -1.39111328125, -1.146240234375, -0.9013671875, -0.656494140625, -0.41162109375, -0.166748046875, 0.078125, 0.322998046875, 0.56787109375, 0.812744140625, 1.0576171875, 1.302490234375, 1.54736328125, 1.792236328125, 2.037109375, 2.281982421875, 2.52685546875, 2.771728515625, 3.0166015625, 3.261474609375, 3.50634765625, 3.751220703125, 3.99609375, 4.240966796875, 4.48583984375, 4.730712890625, 4.9755859375, 5.220458984375, 5.46533203125, 5.710205078125, 5.955078125, 6.199951171875, 6.44482421875, 6.689697265625, 6.9345703125, 7.179443359375, 7.42431640625, 7.669189453125, 7.9140625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 9.0, 2.0, 14.0, 14.0, 12.0, 19.0, 28.0, 30.0, 21.0, 30.0, 24.0, 37.0, 31.0, 43.0, 57.0, 45.0, 50.0, 43.0, 59.0, 50.0, 33.0, 35.0, 26.0, 39.0, 44.0, 22.0, 35.0, 21.0, 17.0, 14.0, 16.0, 17.0, 14.0, 8.0, 9.0, 4.0, 4.0, 4.0, 6.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.0703125, -4.91058349609375, -4.7508544921875, -4.59112548828125, -4.431396484375, -4.27166748046875, -4.1119384765625, -3.95220947265625, -3.79248046875, -3.63275146484375, -3.4730224609375, -3.31329345703125, -3.153564453125, -2.99383544921875, -2.8341064453125, -2.67437744140625, -2.5146484375, -2.35491943359375, -2.1951904296875, -2.03546142578125, -1.875732421875, -1.71600341796875, -1.5562744140625, -1.39654541015625, -1.23681640625, -1.07708740234375, -0.9173583984375, -0.75762939453125, -0.597900390625, -0.43817138671875, -0.2784423828125, -0.11871337890625, 0.041015625, 0.20074462890625, 0.3604736328125, 0.52020263671875, 0.679931640625, 0.83966064453125, 0.9993896484375, 1.15911865234375, 1.31884765625, 1.47857666015625, 1.6383056640625, 1.79803466796875, 1.957763671875, 2.11749267578125, 2.2772216796875, 2.43695068359375, 2.5966796875, 2.75640869140625, 2.9161376953125, 3.07586669921875, 3.235595703125, 3.39532470703125, 3.5550537109375, 3.71478271484375, 3.87451171875, 4.03424072265625, 4.1939697265625, 4.35369873046875, 4.513427734375, 4.67315673828125, 4.8328857421875, 4.99261474609375, 5.15234375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 9.0, 7.0, 10.0, 31.0, 43.0, 30.0, 80.0, 123.0, 191.0, 297.0, 462.0, 732.0, 1156.0, 1953.0, 3006.0, 4909.0, 7714.0, 12412.0, 20058.0, 32362.0, 52116.0, 82967.0, 129680.0, 198820.0, 296626.0, 409911.0, 515899.0, 564133.0, 528461.0, 428552.0, 311815.0, 212048.0, 140196.0, 89301.0, 56096.0, 35044.0, 21448.0, 13589.0, 8365.0, 5189.0, 3187.0, 2004.0, 1262.0, 726.0, 483.0, 299.0, 181.0, 124.0, 76.0, 39.0, 25.0, 21.0, 5.0, 12.0, 4.0, 0.0, 2.0, 4.0, 1.0, 1.0], "bins": [-6.421875, -6.218505859375, -6.01513671875, -5.811767578125, -5.6083984375, -5.405029296875, -5.20166015625, -4.998291015625, -4.794921875, -4.591552734375, -4.38818359375, -4.184814453125, -3.9814453125, -3.778076171875, -3.57470703125, -3.371337890625, -3.16796875, -2.964599609375, -2.76123046875, -2.557861328125, -2.3544921875, -2.151123046875, -1.94775390625, -1.744384765625, -1.541015625, -1.337646484375, -1.13427734375, -0.930908203125, -0.7275390625, -0.524169921875, -0.32080078125, -0.117431640625, 0.0859375, 0.289306640625, 0.49267578125, 0.696044921875, 0.8994140625, 1.102783203125, 1.30615234375, 1.509521484375, 1.712890625, 1.916259765625, 2.11962890625, 2.322998046875, 2.5263671875, 2.729736328125, 2.93310546875, 3.136474609375, 3.33984375, 3.543212890625, 3.74658203125, 3.949951171875, 4.1533203125, 4.356689453125, 4.56005859375, 4.763427734375, 4.966796875, 5.170166015625, 5.37353515625, 5.576904296875, 5.7802734375, 5.983642578125, 6.18701171875, 6.390380859375, 6.59375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 7.0, 12.0, 15.0, 24.0, 31.0, 32.0, 51.0, 67.0, 75.0, 111.0, 121.0, 155.0, 153.0, 215.0, 202.0, 213.0, 231.0, 245.0, 278.0, 247.0, 236.0, 188.0, 197.0, 152.0, 165.0, 126.0, 112.0, 96.0, 79.0, 51.0, 44.0, 30.0, 29.0, 23.0, 19.0, 10.0, 7.0, 5.0, 5.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6953125, -2.602996826171875, -2.51068115234375, -2.418365478515625, -2.3260498046875, -2.233734130859375, -2.14141845703125, -2.049102783203125, -1.956787109375, -1.864471435546875, -1.77215576171875, -1.679840087890625, -1.5875244140625, -1.495208740234375, -1.40289306640625, -1.310577392578125, -1.21826171875, -1.125946044921875, -1.03363037109375, -0.941314697265625, -0.8489990234375, -0.756683349609375, -0.66436767578125, -0.572052001953125, -0.479736328125, -0.387420654296875, -0.29510498046875, -0.202789306640625, -0.1104736328125, -0.018157958984375, 0.07415771484375, 0.166473388671875, 0.2587890625, 0.351104736328125, 0.44342041015625, 0.535736083984375, 0.6280517578125, 0.720367431640625, 0.81268310546875, 0.904998779296875, 0.997314453125, 1.089630126953125, 1.18194580078125, 1.274261474609375, 1.3665771484375, 1.458892822265625, 1.55120849609375, 1.643524169921875, 1.73583984375, 1.828155517578125, 1.92047119140625, 2.012786865234375, 2.1051025390625, 2.197418212890625, 2.28973388671875, 2.382049560546875, 2.474365234375, 2.566680908203125, 2.65899658203125, 2.751312255859375, 2.8436279296875, 2.935943603515625, 3.02825927734375, 3.120574951171875, 3.212890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 0.0, 3.0, 3.0, 11.0, 15.0, 11.0, 17.0, 21.0, 21.0, 27.0, 33.0, 48.0, 56.0, 51.0, 63.0, 63.0, 80.0, 57.0, 54.0, 59.0, 58.0, 47.0, 39.0, 36.0, 18.0, 20.0, 21.0, 13.0, 12.0, 8.0, 6.0, 9.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.856048583984375, -10.500896453857422, -10.145745277404785, -9.790593147277832, -9.435441017150879, -9.080289840698242, -8.725137710571289, -8.369985580444336, -8.014833450317383, -7.659681797027588, -7.304529666900635, -6.94937801361084, -6.594225883483887, -6.239074230194092, -5.883922576904297, -5.528770446777344, -5.173619270324707, -4.818467617034912, -4.463315486907959, -4.108163833618164, -3.75301194190979, -3.397860050201416, -3.042708396911621, -2.687556505203247, -2.332404613494873, -1.977252721786499, -1.6221009492874146, -1.26694917678833, -0.911797285079956, -0.556645393371582, -0.2014937400817871, 0.15365815162658691, 0.5088090896606445, 0.8639609217643738, 1.219112753868103, 1.5742645263671875, 1.9294164180755615, 2.2845683097839355, 2.6397199630737305, 2.9948718547821045, 3.3500237464904785, 3.7051756381988525, 4.060327529907227, 4.4154791831970215, 4.770630836486816, 5.1257829666137695, 5.4809346199035645, 5.836086273193359, 6.1912384033203125, 6.546390056610107, 6.9015421867370605, 7.2566938400268555, 7.611845970153809, 7.9669976234436035, 8.322149276733398, 8.677301406860352, 9.032453536987305, 9.387605667114258, 9.742756843566895, 10.097908973693848, 10.4530611038208, 10.808212280273438, 11.16336441040039, 11.518516540527344, 11.87366771697998]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 5.0, 2.0, 4.0, 12.0, 12.0, 8.0, 15.0, 28.0, 24.0, 26.0, 22.0, 24.0, 20.0, 38.0, 32.0, 41.0, 32.0, 42.0, 34.0, 51.0, 28.0, 33.0, 41.0, 41.0, 40.0, 39.0, 35.0, 36.0, 22.0, 33.0, 24.0, 27.0, 21.0, 20.0, 15.0, 12.0, 8.0, 7.0, 4.0, 7.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.018222332000732, -5.823577880859375, -5.628933429718018, -5.43428897857666, -5.2396440505981445, -5.044999599456787, -4.85035514831543, -4.655710697174072, -4.461066246032715, -4.266421794891357, -4.07177734375, -3.8771326541900635, -3.682488203048706, -3.4878437519073486, -3.293199062347412, -3.0985546112060547, -2.9039101600646973, -2.70926570892334, -2.5146212577819824, -2.319976568222046, -2.1253321170806885, -1.930687665939331, -1.736043095588684, -1.541398525238037, -1.3467540740966797, -1.1521096229553223, -0.9574650526046753, -0.7628205418586731, -0.5681760311126709, -0.3735315203666687, -0.1788870096206665, 0.01575756072998047, 0.2104015350341797, 0.4050460457801819, 0.5996905565261841, 0.7943350672721863, 0.9889795780181885, 1.183624029159546, 1.3782685995101929, 1.5729131698608398, 1.7675576210021973, 1.9622020721435547, 2.156846523284912, 2.3514912128448486, 2.546135663986206, 2.7407801151275635, 2.9354248046875, 3.1300692558288574, 3.324713706970215, 3.5193581581115723, 3.7140026092529297, 3.908647298812866, 4.1032915115356445, 4.29793643951416, 4.492580890655518, 4.687225341796875, 4.881869792938232, 5.07651424407959, 5.271158695220947, 5.465803146362305, 5.66044807434082, 5.855092525482178, 6.049736976623535, 6.244381427764893, 6.43902587890625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 11.0, 7.0, 10.0, 10.0, 27.0, 25.0, 43.0, 70.0, 103.0, 156.0, 231.0, 340.0, 515.0, 832.0, 1305.0, 2133.0, 3355.0, 5435.0, 8859.0, 14874.0, 25021.0, 41392.0, 67323.0, 104182.0, 147665.0, 171378.0, 153289.0, 111801.0, 72872.0, 45258.0, 27480.0, 16738.0, 9865.0, 6106.0, 3648.0, 2257.0, 1394.0, 870.0, 600.0, 379.0, 238.0, 141.0, 99.0, 71.0, 56.0, 28.0, 21.0, 17.0, 12.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4609375, -1.413177490234375, -1.36541748046875, -1.317657470703125, -1.2698974609375, -1.222137451171875, -1.17437744140625, -1.126617431640625, -1.078857421875, -1.031097412109375, -0.98333740234375, -0.935577392578125, -0.8878173828125, -0.840057373046875, -0.79229736328125, -0.744537353515625, -0.69677734375, -0.649017333984375, -0.60125732421875, -0.553497314453125, -0.5057373046875, -0.457977294921875, -0.41021728515625, -0.362457275390625, -0.314697265625, -0.266937255859375, -0.21917724609375, -0.171417236328125, -0.1236572265625, -0.075897216796875, -0.02813720703125, 0.019622802734375, 0.0673828125, 0.115142822265625, 0.16290283203125, 0.210662841796875, 0.2584228515625, 0.306182861328125, 0.35394287109375, 0.401702880859375, 0.449462890625, 0.497222900390625, 0.54498291015625, 0.592742919921875, 0.6405029296875, 0.688262939453125, 0.73602294921875, 0.783782958984375, 0.83154296875, 0.879302978515625, 0.92706298828125, 0.974822998046875, 1.0225830078125, 1.070343017578125, 1.11810302734375, 1.165863037109375, 1.213623046875, 1.261383056640625, 1.30914306640625, 1.356903076171875, 1.4046630859375, 1.452423095703125, 1.50018310546875, 1.547943115234375, 1.595703125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 12.0, 18.0, 20.0, 18.0, 14.0, 15.0, 31.0, 28.0, 41.0, 23.0, 38.0, 30.0, 37.0, 44.0, 51.0, 45.0, 44.0, 39.0, 42.0, 42.0, 40.0, 35.0, 32.0, 31.0, 27.0, 24.0, 27.0, 23.0, 17.0, 21.0, 15.0, 5.0, 10.0, 9.0, 8.0, 4.0, 2.0, 8.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.27734375, -6.05633544921875, -5.8353271484375, -5.61431884765625, -5.393310546875, -5.17230224609375, -4.9512939453125, -4.73028564453125, -4.50927734375, -4.28826904296875, -4.0672607421875, -3.84625244140625, -3.625244140625, -3.40423583984375, -3.1832275390625, -2.96221923828125, -2.7412109375, -2.52020263671875, -2.2991943359375, -2.07818603515625, -1.857177734375, -1.63616943359375, -1.4151611328125, -1.19415283203125, -0.97314453125, -0.75213623046875, -0.5311279296875, -0.31011962890625, -0.089111328125, 0.13189697265625, 0.3529052734375, 0.57391357421875, 0.794921875, 1.01593017578125, 1.2369384765625, 1.45794677734375, 1.678955078125, 1.89996337890625, 2.1209716796875, 2.34197998046875, 2.56298828125, 2.78399658203125, 3.0050048828125, 3.22601318359375, 3.447021484375, 3.66802978515625, 3.8890380859375, 4.11004638671875, 4.3310546875, 4.55206298828125, 4.7730712890625, 4.99407958984375, 5.215087890625, 5.43609619140625, 5.6571044921875, 5.87811279296875, 6.09912109375, 6.32012939453125, 6.5411376953125, 6.76214599609375, 6.983154296875, 7.20416259765625, 7.4251708984375, 7.64617919921875, 7.8671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 5.0, 7.0, 9.0, 16.0, 17.0, 34.0, 50.0, 70.0, 127.0, 167.0, 283.0, 395.0, 755.0, 1228.0, 1982.0, 3445.0, 6130.0, 11454.0, 21217.0, 39993.0, 74950.0, 132660.0, 201158.0, 212559.0, 150688.0, 86916.0, 46961.0, 24883.0, 13201.0, 7287.0, 4037.0, 2288.0, 1404.0, 806.0, 494.0, 307.0, 188.0, 134.0, 68.0, 53.0, 33.0, 30.0, 23.0, 16.0, 10.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9453125, -1.8807373046875, -1.816162109375, -1.7515869140625, -1.68701171875, -1.6224365234375, -1.557861328125, -1.4932861328125, -1.4287109375, -1.3641357421875, -1.299560546875, -1.2349853515625, -1.17041015625, -1.1058349609375, -1.041259765625, -0.9766845703125, -0.912109375, -0.8475341796875, -0.782958984375, -0.7183837890625, -0.65380859375, -0.5892333984375, -0.524658203125, -0.4600830078125, -0.3955078125, -0.3309326171875, -0.266357421875, -0.2017822265625, -0.13720703125, -0.0726318359375, -0.008056640625, 0.0565185546875, 0.12109375, 0.1856689453125, 0.250244140625, 0.3148193359375, 0.37939453125, 0.4439697265625, 0.508544921875, 0.5731201171875, 0.6376953125, 0.7022705078125, 0.766845703125, 0.8314208984375, 0.89599609375, 0.9605712890625, 1.025146484375, 1.0897216796875, 1.154296875, 1.2188720703125, 1.283447265625, 1.3480224609375, 1.41259765625, 1.4771728515625, 1.541748046875, 1.6063232421875, 1.6708984375, 1.7354736328125, 1.800048828125, 1.8646240234375, 1.92919921875, 1.9937744140625, 2.058349609375, 2.1229248046875, 2.1875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 6.0, 3.0, 3.0, 3.0, 5.0, 9.0, 17.0, 18.0, 13.0, 17.0, 18.0, 13.0, 16.0, 29.0, 21.0, 23.0, 36.0, 35.0, 24.0, 34.0, 42.0, 32.0, 38.0, 32.0, 30.0, 44.0, 39.0, 29.0, 45.0, 40.0, 34.0, 25.0, 34.0, 18.0, 34.0, 17.0, 19.0, 13.0, 20.0, 12.0, 13.0, 13.0, 9.0, 6.0, 9.0, 5.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.546875, -3.432098388671875, -3.31732177734375, -3.202545166015625, -3.0877685546875, -2.972991943359375, -2.85821533203125, -2.743438720703125, -2.628662109375, -2.513885498046875, -2.39910888671875, -2.284332275390625, -2.1695556640625, -2.054779052734375, -1.94000244140625, -1.825225830078125, -1.71044921875, -1.595672607421875, -1.48089599609375, -1.366119384765625, -1.2513427734375, -1.136566162109375, -1.02178955078125, -0.907012939453125, -0.792236328125, -0.677459716796875, -0.56268310546875, -0.447906494140625, -0.3331298828125, -0.218353271484375, -0.10357666015625, 0.011199951171875, 0.1259765625, 0.240753173828125, 0.35552978515625, 0.470306396484375, 0.5850830078125, 0.699859619140625, 0.81463623046875, 0.929412841796875, 1.044189453125, 1.158966064453125, 1.27374267578125, 1.388519287109375, 1.5032958984375, 1.618072509765625, 1.73284912109375, 1.847625732421875, 1.96240234375, 2.077178955078125, 2.19195556640625, 2.306732177734375, 2.4215087890625, 2.536285400390625, 2.65106201171875, 2.765838623046875, 2.880615234375, 2.995391845703125, 3.11016845703125, 3.224945068359375, 3.3397216796875, 3.454498291015625, 3.56927490234375, 3.684051513671875, 3.798828125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 12.0, 10.0, 20.0, 16.0, 42.0, 46.0, 43.0, 83.0, 103.0, 155.0, 250.0, 347.0, 473.0, 768.0, 1304.0, 2132.0, 3650.0, 6594.0, 12702.0, 26407.0, 58592.0, 134589.0, 270207.0, 274713.0, 138767.0, 60231.0, 27007.0, 13069.0, 6697.0, 3748.0, 2059.0, 1271.0, 831.0, 510.0, 364.0, 221.0, 157.0, 109.0, 67.0, 55.0, 34.0, 22.0, 25.0, 19.0, 9.0, 5.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0], "bins": [-0.64013671875, -0.6194992065429688, -0.5988616943359375, -0.5782241821289062, -0.557586669921875, -0.5369491577148438, -0.5163116455078125, -0.49567413330078125, -0.47503662109375, -0.45439910888671875, -0.4337615966796875, -0.41312408447265625, -0.392486572265625, -0.37184906005859375, -0.3512115478515625, -0.33057403564453125, -0.3099365234375, -0.28929901123046875, -0.2686614990234375, -0.24802398681640625, -0.227386474609375, -0.20674896240234375, -0.1861114501953125, -0.16547393798828125, -0.14483642578125, -0.12419891357421875, -0.1035614013671875, -0.08292388916015625, -0.062286376953125, -0.04164886474609375, -0.0210113525390625, -0.00037384033203125, 0.020263671875, 0.04090118408203125, 0.0615386962890625, 0.08217620849609375, 0.102813720703125, 0.12345123291015625, 0.1440887451171875, 0.16472625732421875, 0.18536376953125, 0.20600128173828125, 0.2266387939453125, 0.24727630615234375, 0.267913818359375, 0.28855133056640625, 0.3091888427734375, 0.32982635498046875, 0.3504638671875, 0.37110137939453125, 0.3917388916015625, 0.41237640380859375, 0.433013916015625, 0.45365142822265625, 0.4742889404296875, 0.49492645263671875, 0.51556396484375, 0.5362014770507812, 0.5568389892578125, 0.5774765014648438, 0.598114013671875, 0.6187515258789062, 0.6393890380859375, 0.6600265502929688, 0.6806640625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 4.0, 7.0, 11.0, 15.0, 19.0, 16.0, 20.0, 37.0, 26.0, 40.0, 53.0, 51.0, 67.0, 64.0, 83.0, 67.0, 53.0, 60.0, 59.0, 34.0, 43.0, 32.0, 21.0, 19.0, 17.0, 17.0, 13.0, 10.0, 5.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4689903259277344e-05, -3.349222242832184e-05, -3.229454159736633e-05, -3.109686076641083e-05, -2.9899179935455322e-05, -2.8701499104499817e-05, -2.750381827354431e-05, -2.6306137442588806e-05, -2.51084566116333e-05, -2.3910775780677795e-05, -2.271309494972229e-05, -2.1515414118766785e-05, -2.031773328781128e-05, -1.9120052456855774e-05, -1.792237162590027e-05, -1.6724690794944763e-05, -1.5527009963989258e-05, -1.4329329133033752e-05, -1.3131648302078247e-05, -1.1933967471122742e-05, -1.0736286640167236e-05, -9.538605809211731e-06, -8.340924978256226e-06, -7.14324414730072e-06, -5.945563316345215e-06, -4.7478824853897095e-06, -3.550201654434204e-06, -2.3525208234786987e-06, -1.1548399925231934e-06, 4.284083843231201e-08, 1.2405216693878174e-06, 2.4382025003433228e-06, 3.635883331298828e-06, 4.8335641622543335e-06, 6.031244993209839e-06, 7.228925824165344e-06, 8.42660665512085e-06, 9.624287486076355e-06, 1.082196831703186e-05, 1.2019649147987366e-05, 1.3217329978942871e-05, 1.4415010809898376e-05, 1.5612691640853882e-05, 1.6810372471809387e-05, 1.8008053302764893e-05, 1.9205734133720398e-05, 2.0403414964675903e-05, 2.160109579563141e-05, 2.2798776626586914e-05, 2.399645745754242e-05, 2.5194138288497925e-05, 2.639181911945343e-05, 2.7589499950408936e-05, 2.878718078136444e-05, 2.9984861612319946e-05, 3.118254244327545e-05, 3.238022327423096e-05, 3.357790410518646e-05, 3.477558493614197e-05, 3.597326576709747e-05, 3.717094659805298e-05, 3.8368627429008484e-05, 3.956630825996399e-05, 4.0763989090919495e-05, 4.1961669921875e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 7.0, 14.0, 17.0, 32.0, 33.0, 48.0, 57.0, 108.0, 174.0, 246.0, 347.0, 527.0, 802.0, 1193.0, 1844.0, 2911.0, 4379.0, 7119.0, 11566.0, 19320.0, 32750.0, 57305.0, 101870.0, 171600.0, 220937.0, 172458.0, 101514.0, 56438.0, 32316.0, 18879.0, 11453.0, 7180.0, 4536.0, 2854.0, 1938.0, 1274.0, 798.0, 569.0, 392.0, 249.0, 171.0, 121.0, 65.0, 48.0, 34.0, 27.0, 15.0, 9.0, 5.0, 3.0, 1.0, 3.0], "bins": [-0.6103515625, -0.5936279296875, -0.576904296875, -0.5601806640625, -0.54345703125, -0.5267333984375, -0.510009765625, -0.4932861328125, -0.4765625, -0.4598388671875, -0.443115234375, -0.4263916015625, -0.40966796875, -0.3929443359375, -0.376220703125, -0.3594970703125, -0.3427734375, -0.3260498046875, -0.309326171875, -0.2926025390625, -0.27587890625, -0.2591552734375, -0.242431640625, -0.2257080078125, -0.208984375, -0.1922607421875, -0.175537109375, -0.1588134765625, -0.14208984375, -0.1253662109375, -0.108642578125, -0.0919189453125, -0.0751953125, -0.0584716796875, -0.041748046875, -0.0250244140625, -0.00830078125, 0.0084228515625, 0.025146484375, 0.0418701171875, 0.05859375, 0.0753173828125, 0.092041015625, 0.1087646484375, 0.12548828125, 0.1422119140625, 0.158935546875, 0.1756591796875, 0.1923828125, 0.2091064453125, 0.225830078125, 0.2425537109375, 0.25927734375, 0.2760009765625, 0.292724609375, 0.3094482421875, 0.326171875, 0.3428955078125, 0.359619140625, 0.3763427734375, 0.39306640625, 0.4097900390625, 0.426513671875, 0.4432373046875, 0.4599609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 13.0, 14.0, 17.0, 20.0, 19.0, 23.0, 26.0, 44.0, 49.0, 56.0, 58.0, 70.0, 66.0, 80.0, 68.0, 58.0, 56.0, 48.0, 38.0, 27.0, 23.0, 24.0, 13.0, 15.0, 15.0, 6.0, 10.0, 2.0, 4.0, 3.0, 9.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1285400390625, -0.12466621398925781, -0.12079238891601562, -0.11691856384277344, -0.11304473876953125, -0.10917091369628906, -0.10529708862304688, -0.10142326354980469, -0.0975494384765625, -0.09367561340332031, -0.08980178833007812, -0.08592796325683594, -0.08205413818359375, -0.07818031311035156, -0.07430648803710938, -0.07043266296386719, -0.066558837890625, -0.06268501281738281, -0.058811187744140625, -0.05493736267089844, -0.05106353759765625, -0.04718971252441406, -0.043315887451171875, -0.03944206237792969, -0.0355682373046875, -0.03169441223144531, -0.027820587158203125, -0.023946762084960938, -0.02007293701171875, -0.016199111938476562, -0.012325286865234375, -0.008451461791992188, -0.00457763671875, -0.0007038116455078125, 0.003170013427734375, 0.0070438385009765625, 0.01091766357421875, 0.014791488647460938, 0.018665313720703125, 0.022539138793945312, 0.0264129638671875, 0.030286788940429688, 0.034160614013671875, 0.03803443908691406, 0.04190826416015625, 0.04578208923339844, 0.049655914306640625, 0.05352973937988281, 0.057403564453125, 0.06127738952636719, 0.06515121459960938, 0.06902503967285156, 0.07289886474609375, 0.07677268981933594, 0.08064651489257812, 0.08452033996582031, 0.0883941650390625, 0.09226799011230469, 0.09614181518554688, 0.10001564025878906, 0.10388946533203125, 0.10776329040527344, 0.11163711547851562, 0.11551094055175781, 0.119384765625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 2.0, 1.0, 5.0, 3.0, 18.0, 7.0, 12.0, 18.0, 25.0, 25.0, 25.0, 35.0, 44.0, 57.0, 53.0, 69.0, 59.0, 77.0, 65.0, 49.0, 62.0, 42.0, 52.0, 39.0, 29.0, 21.0, 20.0, 18.0, 15.0, 10.0, 10.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.602386474609375, -10.252541542053223, -9.90269660949707, -9.552851676940918, -9.203006744384766, -8.853160858154297, -8.503315925598145, -8.153470993041992, -7.80362606048584, -7.4537811279296875, -7.103936195373535, -6.754090785980225, -6.404245853424072, -6.05440092086792, -5.704555511474609, -5.354710578918457, -5.004865646362305, -4.655020713806152, -4.30517578125, -3.9553303718566895, -3.605485439300537, -3.2556405067443848, -2.9057953357696533, -2.555950164794922, -2.2061052322387695, -1.8562601804733276, -1.5064151287078857, -1.1565700769424438, -0.806725025177002, -0.45687997341156006, -0.10703492164611816, 0.24281024932861328, 0.5926551818847656, 0.9425002336502075, 1.2923452854156494, 1.6421903371810913, 1.9920353889465332, 2.3418803215026855, 2.691725492477417, 3.0415706634521484, 3.391415596008301, 3.741260528564453, 4.0911054611206055, 4.440950870513916, 4.790795803070068, 5.140640735626221, 5.490486145019531, 5.840331077575684, 6.190176010131836, 6.540020942687988, 6.889865875244141, 7.239711284637451, 7.5895562171936035, 7.939401149749756, 8.289246559143066, 8.639091491699219, 8.988936424255371, 9.338781356811523, 9.688626289367676, 10.038471221923828, 10.388317108154297, 10.73816204071045, 11.088006973266602, 11.437851905822754, 11.787696838378906]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 4.0, 12.0, 10.0, 9.0, 13.0, 28.0, 26.0, 24.0, 25.0, 24.0, 18.0, 34.0, 31.0, 44.0, 34.0, 38.0, 35.0, 54.0, 27.0, 27.0, 43.0, 47.0, 35.0, 41.0, 37.0, 38.0, 22.0, 32.0, 25.0, 27.0, 21.0, 20.0, 16.0, 12.0, 6.0, 8.0, 5.0, 8.0, 5.0, 7.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.995700836181641, -5.801371097564697, -5.607040882110596, -5.412711143493652, -5.218381404876709, -5.024051666259766, -4.829721450805664, -4.635391712188721, -4.441061973571777, -4.246732234954834, -4.052402019500732, -3.858072280883789, -3.6637425422668457, -3.4694125652313232, -3.275082588195801, -3.0807528495788574, -2.886422634124756, -2.6920926570892334, -2.49776291847229, -2.3034329414367676, -2.109103202819824, -1.9147732257843018, -1.7204432487487793, -1.5261133909225464, -1.3317835330963135, -1.1374536752700806, -0.9431237578392029, -0.7487938404083252, -0.5544639825820923, -0.3601341247558594, -0.16580414772033691, 0.028525710105895996, 0.2228560447692871, 0.4171859323978424, 0.6115158200263977, 0.8058457374572754, 1.0001755952835083, 1.1945054531097412, 1.3888354301452637, 1.5831652879714966, 1.7774951457977295, 1.9718250036239624, 2.1661548614501953, 2.3604848384857178, 2.5548148155212402, 2.7491445541381836, 2.943474531173706, 3.1378045082092285, 3.332134246826172, 3.5264642238616943, 3.7207939624786377, 3.91512393951416, 4.1094536781311035, 4.303783416748047, 4.498113632202148, 4.692443370819092, 4.886773109436035, 5.0811028480529785, 5.27543306350708, 5.469762802124023, 5.664092540740967, 5.85842227935791, 6.052752494812012, 6.247082233428955, 6.441412448883057]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 5.0, 24.0, 29.0, 37.0, 63.0, 78.0, 139.0, 241.0, 364.0, 622.0, 812.0, 1315.0, 2002.0, 3033.0, 4919.0, 7079.0, 10682.0, 16236.0, 23898.0, 34070.0, 47032.0, 62905.0, 80537.0, 96487.0, 106918.0, 108626.0, 101725.0, 87292.0, 70909.0, 54453.0, 40147.0, 28101.0, 19091.0, 13348.0, 8744.0, 5780.0, 3774.0, 2555.0, 1595.0, 1021.0, 656.0, 441.0, 268.0, 190.0, 114.0, 82.0, 47.0, 29.0, 17.0, 12.0, 10.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.32421875, -4.1900634765625, -4.055908203125, -3.9217529296875, -3.78759765625, -3.6534423828125, -3.519287109375, -3.3851318359375, -3.2509765625, -3.1168212890625, -2.982666015625, -2.8485107421875, -2.71435546875, -2.5802001953125, -2.446044921875, -2.3118896484375, -2.177734375, -2.0435791015625, -1.909423828125, -1.7752685546875, -1.64111328125, -1.5069580078125, -1.372802734375, -1.2386474609375, -1.1044921875, -0.9703369140625, -0.836181640625, -0.7020263671875, -0.56787109375, -0.4337158203125, -0.299560546875, -0.1654052734375, -0.03125, 0.1029052734375, 0.237060546875, 0.3712158203125, 0.50537109375, 0.6395263671875, 0.773681640625, 0.9078369140625, 1.0419921875, 1.1761474609375, 1.310302734375, 1.4444580078125, 1.57861328125, 1.7127685546875, 1.846923828125, 1.9810791015625, 2.115234375, 2.2493896484375, 2.383544921875, 2.5177001953125, 2.65185546875, 2.7860107421875, 2.920166015625, 3.0543212890625, 3.1884765625, 3.3226318359375, 3.456787109375, 3.5909423828125, 3.72509765625, 3.8592529296875, 3.993408203125, 4.1275634765625, 4.26171875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 8.0, 8.0, 7.0, 16.0, 20.0, 23.0, 25.0, 19.0, 17.0, 23.0, 23.0, 27.0, 24.0, 38.0, 37.0, 49.0, 33.0, 50.0, 48.0, 40.0, 31.0, 32.0, 43.0, 40.0, 34.0, 29.0, 31.0, 27.0, 27.0, 25.0, 20.0, 19.0, 19.0, 14.0, 10.0, 12.0, 10.0, 7.0, 3.0, 2.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-6.3828125, -6.17626953125, -5.9697265625, -5.76318359375, -5.556640625, -5.35009765625, -5.1435546875, -4.93701171875, -4.73046875, -4.52392578125, -4.3173828125, -4.11083984375, -3.904296875, -3.69775390625, -3.4912109375, -3.28466796875, -3.078125, -2.87158203125, -2.6650390625, -2.45849609375, -2.251953125, -2.04541015625, -1.8388671875, -1.63232421875, -1.42578125, -1.21923828125, -1.0126953125, -0.80615234375, -0.599609375, -0.39306640625, -0.1865234375, 0.02001953125, 0.2265625, 0.43310546875, 0.6396484375, 0.84619140625, 1.052734375, 1.25927734375, 1.4658203125, 1.67236328125, 1.87890625, 2.08544921875, 2.2919921875, 2.49853515625, 2.705078125, 2.91162109375, 3.1181640625, 3.32470703125, 3.53125, 3.73779296875, 3.9443359375, 4.15087890625, 4.357421875, 4.56396484375, 4.7705078125, 4.97705078125, 5.18359375, 5.39013671875, 5.5966796875, 5.80322265625, 6.009765625, 6.21630859375, 6.4228515625, 6.62939453125, 6.8359375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 16.0, 20.0, 37.0, 60.0, 92.0, 174.0, 278.0, 524.0, 854.0, 1496.0, 2617.0, 4442.0, 7510.0, 12504.0, 20701.0, 32827.0, 50425.0, 73433.0, 98992.0, 121209.0, 133151.0, 128609.0, 109285.0, 85220.0, 59596.0, 40158.0, 25599.0, 15625.0, 9545.0, 5677.0, 3316.0, 1902.0, 1070.0, 652.0, 382.0, 196.0, 136.0, 70.0, 47.0, 35.0, 21.0, 8.0, 14.0, 9.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.37109375, -5.2017822265625, -5.032470703125, -4.8631591796875, -4.69384765625, -4.5245361328125, -4.355224609375, -4.1859130859375, -4.0166015625, -3.8472900390625, -3.677978515625, -3.5086669921875, -3.33935546875, -3.1700439453125, -3.000732421875, -2.8314208984375, -2.662109375, -2.4927978515625, -2.323486328125, -2.1541748046875, -1.98486328125, -1.8155517578125, -1.646240234375, -1.4769287109375, -1.3076171875, -1.1383056640625, -0.968994140625, -0.7996826171875, -0.63037109375, -0.4610595703125, -0.291748046875, -0.1224365234375, 0.046875, 0.2161865234375, 0.385498046875, 0.5548095703125, 0.72412109375, 0.8934326171875, 1.062744140625, 1.2320556640625, 1.4013671875, 1.5706787109375, 1.739990234375, 1.9093017578125, 2.07861328125, 2.2479248046875, 2.417236328125, 2.5865478515625, 2.755859375, 2.9251708984375, 3.094482421875, 3.2637939453125, 3.43310546875, 3.6024169921875, 3.771728515625, 3.9410400390625, 4.1103515625, 4.2796630859375, 4.448974609375, 4.6182861328125, 4.78759765625, 4.9569091796875, 5.126220703125, 5.2955322265625, 5.46484375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 6.0, 5.0, 9.0, 11.0, 14.0, 21.0, 16.0, 19.0, 17.0, 32.0, 35.0, 33.0, 28.0, 35.0, 37.0, 36.0, 38.0, 38.0, 35.0, 36.0, 46.0, 27.0, 41.0, 51.0, 40.0, 33.0, 45.0, 29.0, 25.0, 28.0, 14.0, 16.0, 23.0, 19.0, 17.0, 12.0, 4.0, 7.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.822265625, -3.694244384765625, -3.56622314453125, -3.438201904296875, -3.3101806640625, -3.182159423828125, -3.05413818359375, -2.926116943359375, -2.798095703125, -2.670074462890625, -2.54205322265625, -2.414031982421875, -2.2860107421875, -2.157989501953125, -2.02996826171875, -1.901947021484375, -1.77392578125, -1.645904541015625, -1.51788330078125, -1.389862060546875, -1.2618408203125, -1.133819580078125, -1.00579833984375, -0.877777099609375, -0.749755859375, -0.621734619140625, -0.49371337890625, -0.365692138671875, -0.2376708984375, -0.109649658203125, 0.01837158203125, 0.146392822265625, 0.2744140625, 0.402435302734375, 0.53045654296875, 0.658477783203125, 0.7864990234375, 0.914520263671875, 1.04254150390625, 1.170562744140625, 1.298583984375, 1.426605224609375, 1.55462646484375, 1.682647705078125, 1.8106689453125, 1.938690185546875, 2.06671142578125, 2.194732666015625, 2.32275390625, 2.450775146484375, 2.57879638671875, 2.706817626953125, 2.8348388671875, 2.962860107421875, 3.09088134765625, 3.218902587890625, 3.346923828125, 3.474945068359375, 3.60296630859375, 3.730987548828125, 3.8590087890625, 3.987030029296875, 4.11505126953125, 4.243072509765625, 4.37109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 8.0, 3.0, 5.0, 15.0, 23.0, 44.0, 58.0, 84.0, 108.0, 198.0, 295.0, 455.0, 739.0, 1119.0, 1848.0, 3130.0, 5137.0, 8577.0, 14243.0, 24542.0, 40672.0, 65398.0, 100125.0, 139690.0, 163460.0, 154232.0, 117916.0, 79677.0, 50332.0, 30395.0, 18310.0, 10748.0, 6535.0, 4039.0, 2370.0, 1513.0, 881.0, 566.0, 377.0, 245.0, 142.0, 99.0, 59.0, 66.0, 31.0, 23.0, 13.0, 9.0, 7.0, 1.0, 3.0, 1.0, 4.0], "bins": [-4.21484375, -4.09686279296875, -3.9788818359375, -3.86090087890625, -3.742919921875, -3.62493896484375, -3.5069580078125, -3.38897705078125, -3.27099609375, -3.15301513671875, -3.0350341796875, -2.91705322265625, -2.799072265625, -2.68109130859375, -2.5631103515625, -2.44512939453125, -2.3271484375, -2.20916748046875, -2.0911865234375, -1.97320556640625, -1.855224609375, -1.73724365234375, -1.6192626953125, -1.50128173828125, -1.38330078125, -1.26531982421875, -1.1473388671875, -1.02935791015625, -0.911376953125, -0.79339599609375, -0.6754150390625, -0.55743408203125, -0.439453125, -0.32147216796875, -0.2034912109375, -0.08551025390625, 0.032470703125, 0.15045166015625, 0.2684326171875, 0.38641357421875, 0.50439453125, 0.62237548828125, 0.7403564453125, 0.85833740234375, 0.976318359375, 1.09429931640625, 1.2122802734375, 1.33026123046875, 1.4482421875, 1.56622314453125, 1.6842041015625, 1.80218505859375, 1.920166015625, 2.03814697265625, 2.1561279296875, 2.27410888671875, 2.39208984375, 2.51007080078125, 2.6280517578125, 2.74603271484375, 2.864013671875, 2.98199462890625, 3.0999755859375, 3.21795654296875, 3.3359375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 3.0, 5.0, 1.0, 6.0, 17.0, 12.0, 15.0, 19.0, 36.0, 32.0, 31.0, 41.0, 46.0, 49.0, 71.0, 59.0, 53.0, 63.0, 60.0, 67.0, 59.0, 52.0, 33.0, 36.0, 23.0, 28.0, 20.0, 7.0, 11.0, 11.0, 11.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003414154052734375, -0.0003311522305011749, -0.00032088905572891235, -0.0003106258809566498, -0.0003003627061843872, -0.00029009953141212463, -0.00027983635663986206, -0.0002695731818675995, -0.0002593100070953369, -0.00024904683232307434, -0.00023878365755081177, -0.0002285204827785492, -0.00021825730800628662, -0.00020799413323402405, -0.00019773095846176147, -0.0001874677836894989, -0.00017720460891723633, -0.00016694143414497375, -0.00015667825937271118, -0.0001464150846004486, -0.00013615190982818604, -0.00012588873505592346, -0.00011562556028366089, -0.00010536238551139832, -9.509921073913574e-05, -8.483603596687317e-05, -7.45728611946106e-05, -6.430968642234802e-05, -5.404651165008545e-05, -4.3783336877822876e-05, -3.35201621055603e-05, -2.325698733329773e-05, -1.2993812561035156e-05, -2.730637788772583e-06, 7.53253698348999e-06, 1.7795711755752563e-05, 2.8058886528015137e-05, 3.832206130027771e-05, 4.858523607254028e-05, 5.8848410844802856e-05, 6.911158561706543e-05, 7.9374760389328e-05, 8.963793516159058e-05, 9.990110993385315e-05, 0.00011016428470611572, 0.0001204274594783783, 0.00013069063425064087, 0.00014095380902290344, 0.00015121698379516602, 0.0001614801585674286, 0.00017174333333969116, 0.00018200650811195374, 0.0001922696828842163, 0.00020253285765647888, 0.00021279603242874146, 0.00022305920720100403, 0.0002333223819732666, 0.00024358555674552917, 0.00025384873151779175, 0.0002641119062900543, 0.0002743750810623169, 0.00028463825583457947, 0.00029490143060684204, 0.0003051646053791046, 0.0003154277801513672]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 10.0, 15.0, 20.0, 26.0, 58.0, 59.0, 104.0, 150.0, 197.0, 339.0, 541.0, 841.0, 1353.0, 2078.0, 3520.0, 5684.0, 9186.0, 14696.0, 23767.0, 37298.0, 57912.0, 84993.0, 116804.0, 141225.0, 144605.0, 126178.0, 95123.0, 66133.0, 42985.0, 27642.0, 17090.0, 10513.0, 6431.0, 4128.0, 2533.0, 1587.0, 985.0, 636.0, 391.0, 244.0, 173.0, 103.0, 72.0, 56.0, 26.0, 12.0, 15.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.134765625, -3.03082275390625, -2.9268798828125, -2.82293701171875, -2.718994140625, -2.61505126953125, -2.5111083984375, -2.40716552734375, -2.30322265625, -2.19927978515625, -2.0953369140625, -1.99139404296875, -1.887451171875, -1.78350830078125, -1.6795654296875, -1.57562255859375, -1.4716796875, -1.36773681640625, -1.2637939453125, -1.15985107421875, -1.055908203125, -0.95196533203125, -0.8480224609375, -0.74407958984375, -0.64013671875, -0.53619384765625, -0.4322509765625, -0.32830810546875, -0.224365234375, -0.12042236328125, -0.0164794921875, 0.08746337890625, 0.19140625, 0.29534912109375, 0.3992919921875, 0.50323486328125, 0.607177734375, 0.71112060546875, 0.8150634765625, 0.91900634765625, 1.02294921875, 1.12689208984375, 1.2308349609375, 1.33477783203125, 1.438720703125, 1.54266357421875, 1.6466064453125, 1.75054931640625, 1.8544921875, 1.95843505859375, 2.0623779296875, 2.16632080078125, 2.270263671875, 2.37420654296875, 2.4781494140625, 2.58209228515625, 2.68603515625, 2.78997802734375, 2.8939208984375, 2.99786376953125, 3.101806640625, 3.20574951171875, 3.3096923828125, 3.41363525390625, 3.517578125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 8.0, 4.0, 0.0, 5.0, 11.0, 2.0, 13.0, 11.0, 23.0, 14.0, 24.0, 29.0, 35.0, 42.0, 37.0, 39.0, 48.0, 46.0, 54.0, 58.0, 52.0, 48.0, 54.0, 42.0, 41.0, 41.0, 35.0, 40.0, 32.0, 19.0, 23.0, 17.0, 12.0, 18.0, 6.0, 8.0, 5.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.2548828125, -1.2220840454101562, -1.1892852783203125, -1.1564865112304688, -1.123687744140625, -1.0908889770507812, -1.0580902099609375, -1.0252914428710938, -0.99249267578125, -0.9596939086914062, -0.9268951416015625, -0.8940963745117188, -0.861297607421875, -0.8284988403320312, -0.7957000732421875, -0.7629013061523438, -0.7301025390625, -0.6973037719726562, -0.6645050048828125, -0.6317062377929688, -0.598907470703125, -0.5661087036132812, -0.5333099365234375, -0.5005111694335938, -0.46771240234375, -0.43491363525390625, -0.4021148681640625, -0.36931610107421875, -0.336517333984375, -0.30371856689453125, -0.2709197998046875, -0.23812103271484375, -0.205322265625, -0.17252349853515625, -0.1397247314453125, -0.10692596435546875, -0.074127197265625, -0.04132843017578125, -0.0085296630859375, 0.02426910400390625, 0.05706787109375, 0.08986663818359375, 0.1226654052734375, 0.15546417236328125, 0.188262939453125, 0.22106170654296875, 0.2538604736328125, 0.28665924072265625, 0.3194580078125, 0.35225677490234375, 0.3850555419921875, 0.41785430908203125, 0.450653076171875, 0.48345184326171875, 0.5162506103515625, 0.5490493774414062, 0.58184814453125, 0.6146469116210938, 0.6474456787109375, 0.6802444458007812, 0.713043212890625, 0.7458419799804688, 0.7786407470703125, 0.8114395141601562, 0.84423828125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 4.0, 6.0, 12.0, 12.0, 15.0, 12.0, 29.0, 21.0, 27.0, 46.0, 52.0, 51.0, 51.0, 74.0, 65.0, 59.0, 54.0, 61.0, 67.0, 43.0, 37.0, 32.0, 27.0, 18.0, 22.0, 32.0, 9.0, 8.0, 6.0, 9.0, 6.0, 8.0, 0.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.150920867919922, -9.811415672302246, -9.471909523010254, -9.132404327392578, -8.792899131774902, -8.45339298248291, -8.113887786865234, -7.7743821144104, -7.434876441955566, -7.095370769500732, -6.755865573883057, -6.416359901428223, -6.076854228973389, -5.737348556518555, -5.397843360900879, -5.058337688446045, -4.718832492828369, -4.379326820373535, -4.039821624755859, -3.7003159523010254, -3.3608102798461914, -3.0213048458099365, -2.6817994117736816, -2.3422937393188477, -2.0027883052825928, -1.6632827520370483, -1.323777198791504, -0.984271764755249, -0.6447662115097046, -0.30526065826416016, 0.03424477577209473, 0.3737504482269287, 0.7132558822631836, 1.052761435508728, 1.3922669887542725, 1.7317724227905273, 2.0712780952453613, 2.410783529281616, 2.750288963317871, 3.089794635772705, 3.42930006980896, 3.768805503845215, 4.108311176300049, 4.447816848754883, 4.787322044372559, 5.126827716827393, 5.466333389282227, 5.805838584899902, 6.145344257354736, 6.48484992980957, 6.824355125427246, 7.16386079788208, 7.503366470336914, 7.84287166595459, 8.182376861572266, 8.521883010864258, 8.861388206481934, 9.20089340209961, 9.540399551391602, 9.879904747009277, 10.219409942626953, 10.558916091918945, 10.898421287536621, 11.237926483154297, 11.577432632446289]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 11.0, 13.0, 14.0, 12.0, 17.0, 24.0, 23.0, 24.0, 29.0, 29.0, 35.0, 35.0, 33.0, 50.0, 37.0, 52.0, 40.0, 30.0, 40.0, 36.0, 49.0, 37.0, 44.0, 38.0, 33.0, 30.0, 33.0, 21.0, 26.0, 24.0, 17.0, 6.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.818230628967285, -6.6018829345703125, -6.38553524017334, -6.169187545776367, -5.9528398513793945, -5.736492156982422, -5.520144939422607, -5.303797245025635, -5.087449550628662, -4.8711018562316895, -4.654754161834717, -4.438406467437744, -4.22205924987793, -4.005711555480957, -3.7893638610839844, -3.5730161666870117, -3.356668472290039, -3.1403207778930664, -2.9239730834960938, -2.7076256275177, -2.4912779331207275, -2.274930238723755, -2.0585827827453613, -1.8422350883483887, -1.625887393951416, -1.4095396995544434, -1.1931921243667603, -0.9768444895744324, -0.7604968547821045, -0.5441491603851318, -0.32780158519744873, -0.11145401000976562, 0.10489320755004883, 0.3212408423423767, 0.5375884771347046, 0.7539361119270325, 0.9702837467193604, 1.186631441116333, 1.4029790163040161, 1.6193265914916992, 1.8356742858886719, 2.0520219802856445, 2.268369674682617, 2.4847171306610107, 2.7010648250579834, 2.917412519454956, 3.1337599754333496, 3.3501076698303223, 3.566455364227295, 3.7828030586242676, 3.9991507530212402, 4.215498447418213, 4.431845664978027, 4.648193359375, 4.864541053771973, 5.080888748168945, 5.297236442565918, 5.513584136962891, 5.729931831359863, 5.946279525756836, 6.162627220153809, 6.378974914550781, 6.595322132110596, 6.811669826507568, 7.028017520904541]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 5.0, 7.0, 17.0, 14.0, 21.0, 27.0, 60.0, 67.0, 134.0, 160.0, 292.0, 467.0, 798.0, 1412.0, 2313.0, 4062.0, 7095.0, 12769.0, 23403.0, 43945.0, 83309.0, 158127.0, 296654.0, 520570.0, 767291.0, 829361.0, 627555.0, 377958.0, 203717.0, 107704.0, 56864.0, 30493.0, 16214.0, 9186.0, 5259.0, 2899.0, 1701.0, 954.0, 558.0, 315.0, 200.0, 131.0, 71.0, 51.0, 23.0, 18.0, 13.0, 13.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.640625, -7.3697509765625, -7.098876953125, -6.8280029296875, -6.55712890625, -6.2862548828125, -6.015380859375, -5.7445068359375, -5.4736328125, -5.2027587890625, -4.931884765625, -4.6610107421875, -4.39013671875, -4.1192626953125, -3.848388671875, -3.5775146484375, -3.306640625, -3.0357666015625, -2.764892578125, -2.4940185546875, -2.22314453125, -1.9522705078125, -1.681396484375, -1.4105224609375, -1.1396484375, -0.8687744140625, -0.597900390625, -0.3270263671875, -0.05615234375, 0.2147216796875, 0.485595703125, 0.7564697265625, 1.02734375, 1.2982177734375, 1.569091796875, 1.8399658203125, 2.11083984375, 2.3817138671875, 2.652587890625, 2.9234619140625, 3.1943359375, 3.4652099609375, 3.736083984375, 4.0069580078125, 4.27783203125, 4.5487060546875, 4.819580078125, 5.0904541015625, 5.361328125, 5.6322021484375, 5.903076171875, 6.1739501953125, 6.44482421875, 6.7156982421875, 6.986572265625, 7.2574462890625, 7.5283203125, 7.7991943359375, 8.070068359375, 8.3409423828125, 8.61181640625, 8.8826904296875, 9.153564453125, 9.4244384765625, 9.6953125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 7.0, 7.0, 6.0, 18.0, 15.0, 11.0, 16.0, 21.0, 25.0, 44.0, 26.0, 27.0, 31.0, 35.0, 39.0, 46.0, 53.0, 43.0, 49.0, 34.0, 37.0, 38.0, 40.0, 34.0, 43.0, 34.0, 27.0, 44.0, 26.0, 24.0, 25.0, 16.0, 8.0, 8.0, 8.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.22991943359375, -4.0770263671875, -3.92413330078125, -3.771240234375, -3.61834716796875, -3.4654541015625, -3.31256103515625, -3.15966796875, -3.00677490234375, -2.8538818359375, -2.70098876953125, -2.548095703125, -2.39520263671875, -2.2423095703125, -2.08941650390625, -1.9365234375, -1.78363037109375, -1.6307373046875, -1.47784423828125, -1.324951171875, -1.17205810546875, -1.0191650390625, -0.86627197265625, -0.71337890625, -0.56048583984375, -0.4075927734375, -0.25469970703125, -0.101806640625, 0.05108642578125, 0.2039794921875, 0.35687255859375, 0.509765625, 0.66265869140625, 0.8155517578125, 0.96844482421875, 1.121337890625, 1.27423095703125, 1.4271240234375, 1.58001708984375, 1.73291015625, 1.88580322265625, 2.0386962890625, 2.19158935546875, 2.344482421875, 2.49737548828125, 2.6502685546875, 2.80316162109375, 2.9560546875, 3.10894775390625, 3.2618408203125, 3.41473388671875, 3.567626953125, 3.72052001953125, 3.8734130859375, 4.02630615234375, 4.17919921875, 4.33209228515625, 4.4849853515625, 4.63787841796875, 4.790771484375, 4.94366455078125, 5.0965576171875, 5.24945068359375, 5.40234375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 12.0, 15.0, 32.0, 35.0, 49.0, 83.0, 143.0, 170.0, 285.0, 455.0, 688.0, 1081.0, 1687.0, 2705.0, 4417.0, 7024.0, 11400.0, 18168.0, 30066.0, 49229.0, 80159.0, 129200.0, 205751.0, 309724.0, 439617.0, 553361.0, 596685.0, 538210.0, 418434.0, 291360.0, 191607.0, 120292.0, 74340.0, 45067.0, 27633.0, 17125.0, 10482.0, 6513.0, 3972.0, 2531.0, 1659.0, 999.0, 611.0, 430.0, 271.0, 160.0, 122.0, 73.0, 59.0, 27.0, 24.0, 18.0, 11.0, 7.0, 1.0, 3.0, 4.0, 4.0], "bins": [-6.9296875, -6.7159423828125, -6.502197265625, -6.2884521484375, -6.07470703125, -5.8609619140625, -5.647216796875, -5.4334716796875, -5.2197265625, -5.0059814453125, -4.792236328125, -4.5784912109375, -4.36474609375, -4.1510009765625, -3.937255859375, -3.7235107421875, -3.509765625, -3.2960205078125, -3.082275390625, -2.8685302734375, -2.65478515625, -2.4410400390625, -2.227294921875, -2.0135498046875, -1.7998046875, -1.5860595703125, -1.372314453125, -1.1585693359375, -0.94482421875, -0.7310791015625, -0.517333984375, -0.3035888671875, -0.08984375, 0.1239013671875, 0.337646484375, 0.5513916015625, 0.76513671875, 0.9788818359375, 1.192626953125, 1.4063720703125, 1.6201171875, 1.8338623046875, 2.047607421875, 2.2613525390625, 2.47509765625, 2.6888427734375, 2.902587890625, 3.1163330078125, 3.330078125, 3.5438232421875, 3.757568359375, 3.9713134765625, 4.18505859375, 4.3988037109375, 4.612548828125, 4.8262939453125, 5.0400390625, 5.2537841796875, 5.467529296875, 5.6812744140625, 5.89501953125, 6.1087646484375, 6.322509765625, 6.5362548828125, 6.75]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 8.0, 13.0, 13.0, 24.0, 21.0, 26.0, 38.0, 46.0, 57.0, 55.0, 63.0, 90.0, 97.0, 112.0, 130.0, 143.0, 144.0, 188.0, 175.0, 200.0, 210.0, 230.0, 218.0, 220.0, 207.0, 183.0, 156.0, 153.0, 138.0, 127.0, 112.0, 80.0, 65.0, 72.0, 47.0, 38.0, 36.0, 32.0, 23.0, 17.0, 13.0, 10.0, 9.0, 6.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.421875, -2.345306396484375, -2.26873779296875, -2.192169189453125, -2.1156005859375, -2.039031982421875, -1.96246337890625, -1.885894775390625, -1.809326171875, -1.732757568359375, -1.65618896484375, -1.579620361328125, -1.5030517578125, -1.426483154296875, -1.34991455078125, -1.273345947265625, -1.19677734375, -1.120208740234375, -1.04364013671875, -0.967071533203125, -0.8905029296875, -0.813934326171875, -0.73736572265625, -0.660797119140625, -0.584228515625, -0.507659912109375, -0.43109130859375, -0.354522705078125, -0.2779541015625, -0.201385498046875, -0.12481689453125, -0.048248291015625, 0.0283203125, 0.104888916015625, 0.18145751953125, 0.258026123046875, 0.3345947265625, 0.411163330078125, 0.48773193359375, 0.564300537109375, 0.640869140625, 0.717437744140625, 0.79400634765625, 0.870574951171875, 0.9471435546875, 1.023712158203125, 1.10028076171875, 1.176849365234375, 1.25341796875, 1.329986572265625, 1.40655517578125, 1.483123779296875, 1.5596923828125, 1.636260986328125, 1.71282958984375, 1.789398193359375, 1.865966796875, 1.942535400390625, 2.01910400390625, 2.095672607421875, 2.1722412109375, 2.248809814453125, 2.32537841796875, 2.401947021484375, 2.478515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 4.0, 8.0, 10.0, 19.0, 13.0, 22.0, 16.0, 34.0, 34.0, 36.0, 61.0, 60.0, 68.0, 85.0, 69.0, 58.0, 62.0, 53.0, 51.0, 52.0, 37.0, 27.0, 30.0, 14.0, 15.0, 9.0, 12.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.30174732208252, -9.950090408325195, -9.598432540893555, -9.24677562713623, -8.895118713378906, -8.543460845947266, -8.191803932189941, -7.840147018432617, -7.488489627838135, -7.136832237243652, -6.785175323486328, -6.433517932891846, -6.081860542297363, -5.730203628540039, -5.378546237945557, -5.026888847351074, -4.67523193359375, -4.323574542999268, -3.9719176292419434, -3.620260238647461, -3.2686030864715576, -2.9169459342956543, -2.565288543701172, -2.2136313915252686, -1.8619742393493652, -1.510317087173462, -1.158659815788269, -0.8070025444030762, -0.45534539222717285, -0.10368824005126953, 0.2479691505432129, 0.5996263027191162, 0.9512825012207031, 1.3029396533966064, 1.6545969247817993, 2.006254196166992, 2.3579113483428955, 2.709568500518799, 3.0612258911132812, 3.4128830432891846, 3.764540195465088, 4.11619758605957, 4.4678544998168945, 4.819511890411377, 5.171169281005859, 5.522826194763184, 5.874483585357666, 6.226140975952148, 6.577797889709473, 6.929455280303955, 7.281112194061279, 7.632769584655762, 7.984426498413086, 8.336084365844727, 8.68774127960205, 9.039398193359375, 9.391056060791016, 9.74271297454834, 10.09437084197998, 10.446027755737305, 10.797684669494629, 11.149341583251953, 11.500999450683594, 11.852656364440918, 12.204313278198242]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 6.0, 9.0, 16.0, 13.0, 30.0, 35.0, 34.0, 26.0, 32.0, 33.0, 47.0, 42.0, 52.0, 50.0, 54.0, 51.0, 61.0, 45.0, 54.0, 39.0, 32.0, 48.0, 35.0, 27.0, 39.0, 15.0, 14.0, 16.0, 3.0, 8.0, 7.0, 1.0, 2.0, 8.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.52358341217041, -8.279224395751953, -8.034865379333496, -7.790506362915039, -7.546147346496582, -7.301788330078125, -7.057429313659668, -6.813070297241211, -6.568711280822754, -6.324352264404297, -6.07999324798584, -5.835634231567383, -5.591275215148926, -5.346916198730469, -5.102557182312012, -4.858198165893555, -4.613839149475098, -4.369480133056641, -4.125121116638184, -3.8807621002197266, -3.6364030838012695, -3.3920440673828125, -3.1476850509643555, -2.9033260345458984, -2.6589670181274414, -2.4146080017089844, -2.1702489852905273, -1.9258899688720703, -1.6815309524536133, -1.4371719360351562, -1.1928129196166992, -0.9484539031982422, -0.7040953636169434, -0.45973634719848633, -0.2153773307800293, 0.028981685638427734, 0.27334070205688477, 0.5176997184753418, 0.7620587348937988, 1.0064177513122559, 1.250776767730713, 1.49513578414917, 1.739494800567627, 1.983853816986084, 2.228212833404541, 2.472571849822998, 2.716930866241455, 2.961289882659912, 3.205648899078369, 3.450007915496826, 3.694366931915283, 3.9387259483337402, 4.183084964752197, 4.427443981170654, 4.671802997589111, 4.916162014007568, 5.160521030426025, 5.404880046844482, 5.6492390632629395, 5.8935980796813965, 6.1379570960998535, 6.3823161125183105, 6.626675128936768, 6.871034145355225, 7.115393161773682]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 7.0, 18.0, 17.0, 23.0, 44.0, 61.0, 117.0, 184.0, 427.0, 803.0, 1599.0, 3378.0, 7297.0, 16941.0, 38787.0, 90390.0, 186997.0, 277886.0, 220821.0, 113757.0, 49759.0, 21533.0, 9484.0, 4179.0, 1984.0, 914.0, 501.0, 288.0, 152.0, 71.0, 40.0, 34.0, 7.0, 18.0, 8.0, 9.0, 5.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0], "bins": [-2.826171875, -2.7510986328125, -2.676025390625, -2.6009521484375, -2.52587890625, -2.4508056640625, -2.375732421875, -2.3006591796875, -2.2255859375, -2.1505126953125, -2.075439453125, -2.0003662109375, -1.92529296875, -1.8502197265625, -1.775146484375, -1.7000732421875, -1.625, -1.5499267578125, -1.474853515625, -1.3997802734375, -1.32470703125, -1.2496337890625, -1.174560546875, -1.0994873046875, -1.0244140625, -0.9493408203125, -0.874267578125, -0.7991943359375, -0.72412109375, -0.6490478515625, -0.573974609375, -0.4989013671875, -0.423828125, -0.3487548828125, -0.273681640625, -0.1986083984375, -0.12353515625, -0.0484619140625, 0.026611328125, 0.1016845703125, 0.1767578125, 0.2518310546875, 0.326904296875, 0.4019775390625, 0.47705078125, 0.5521240234375, 0.627197265625, 0.7022705078125, 0.77734375, 0.8524169921875, 0.927490234375, 1.0025634765625, 1.07763671875, 1.1527099609375, 1.227783203125, 1.3028564453125, 1.3779296875, 1.4530029296875, 1.528076171875, 1.6031494140625, 1.67822265625, 1.7532958984375, 1.828369140625, 1.9034423828125, 1.978515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 7.0, 5.0, 9.0, 12.0, 20.0, 24.0, 26.0, 31.0, 33.0, 38.0, 33.0, 36.0, 44.0, 53.0, 56.0, 51.0, 51.0, 55.0, 49.0, 44.0, 52.0, 37.0, 41.0, 33.0, 29.0, 28.0, 17.0, 23.0, 13.0, 9.0, 9.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.28125, -9.0228271484375, -8.764404296875, -8.5059814453125, -8.24755859375, -7.9891357421875, -7.730712890625, -7.4722900390625, -7.2138671875, -6.9554443359375, -6.697021484375, -6.4385986328125, -6.18017578125, -5.9217529296875, -5.663330078125, -5.4049072265625, -5.146484375, -4.8880615234375, -4.629638671875, -4.3712158203125, -4.11279296875, -3.8543701171875, -3.595947265625, -3.3375244140625, -3.0791015625, -2.8206787109375, -2.562255859375, -2.3038330078125, -2.04541015625, -1.7869873046875, -1.528564453125, -1.2701416015625, -1.01171875, -0.7532958984375, -0.494873046875, -0.2364501953125, 0.02197265625, 0.2803955078125, 0.538818359375, 0.7972412109375, 1.0556640625, 1.3140869140625, 1.572509765625, 1.8309326171875, 2.08935546875, 2.3477783203125, 2.606201171875, 2.8646240234375, 3.123046875, 3.3814697265625, 3.639892578125, 3.8983154296875, 4.15673828125, 4.4151611328125, 4.673583984375, 4.9320068359375, 5.1904296875, 5.4488525390625, 5.707275390625, 5.9656982421875, 6.22412109375, 6.4825439453125, 6.740966796875, 6.9993896484375, 7.2578125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 10.0, 15.0, 33.0, 42.0, 46.0, 84.0, 124.0, 218.0, 299.0, 520.0, 903.0, 1502.0, 2494.0, 4474.0, 8021.0, 15561.0, 29242.0, 56170.0, 103086.0, 172761.0, 218868.0, 185261.0, 114947.0, 62443.0, 32815.0, 17270.0, 9196.0, 5032.0, 2873.0, 1645.0, 1021.0, 572.0, 350.0, 207.0, 147.0, 93.0, 79.0, 52.0, 25.0, 14.0, 11.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.959381103515625, -1.89532470703125, -1.831268310546875, -1.7672119140625, -1.703155517578125, -1.63909912109375, -1.575042724609375, -1.510986328125, -1.446929931640625, -1.38287353515625, -1.318817138671875, -1.2547607421875, -1.190704345703125, -1.12664794921875, -1.062591552734375, -0.99853515625, -0.934478759765625, -0.87042236328125, -0.806365966796875, -0.7423095703125, -0.678253173828125, -0.61419677734375, -0.550140380859375, -0.486083984375, -0.422027587890625, -0.35797119140625, -0.293914794921875, -0.2298583984375, -0.165802001953125, -0.10174560546875, -0.037689208984375, 0.0263671875, 0.090423583984375, 0.15447998046875, 0.218536376953125, 0.2825927734375, 0.346649169921875, 0.41070556640625, 0.474761962890625, 0.538818359375, 0.602874755859375, 0.66693115234375, 0.730987548828125, 0.7950439453125, 0.859100341796875, 0.92315673828125, 0.987213134765625, 1.05126953125, 1.115325927734375, 1.17938232421875, 1.243438720703125, 1.3074951171875, 1.371551513671875, 1.43560791015625, 1.499664306640625, 1.563720703125, 1.627777099609375, 1.69183349609375, 1.755889892578125, 1.8199462890625, 1.884002685546875, 1.94805908203125, 2.012115478515625, 2.076171875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 10.0, 7.0, 22.0, 9.0, 20.0, 20.0, 30.0, 30.0, 22.0, 39.0, 36.0, 41.0, 39.0, 35.0, 40.0, 42.0, 44.0, 48.0, 42.0, 40.0, 41.0, 36.0, 40.0, 31.0, 33.0, 29.0, 31.0, 24.0, 25.0, 19.0, 11.0, 9.0, 19.0, 4.0, 2.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.90234375, -4.764312744140625, -4.62628173828125, -4.488250732421875, -4.3502197265625, -4.212188720703125, -4.07415771484375, -3.936126708984375, -3.798095703125, -3.660064697265625, -3.52203369140625, -3.384002685546875, -3.2459716796875, -3.107940673828125, -2.96990966796875, -2.831878662109375, -2.69384765625, -2.555816650390625, -2.41778564453125, -2.279754638671875, -2.1417236328125, -2.003692626953125, -1.86566162109375, -1.727630615234375, -1.589599609375, -1.451568603515625, -1.31353759765625, -1.175506591796875, -1.0374755859375, -0.899444580078125, -0.76141357421875, -0.623382568359375, -0.4853515625, -0.347320556640625, -0.20928955078125, -0.071258544921875, 0.0667724609375, 0.204803466796875, 0.34283447265625, 0.480865478515625, 0.618896484375, 0.756927490234375, 0.89495849609375, 1.032989501953125, 1.1710205078125, 1.309051513671875, 1.44708251953125, 1.585113525390625, 1.72314453125, 1.861175537109375, 1.99920654296875, 2.137237548828125, 2.2752685546875, 2.413299560546875, 2.55133056640625, 2.689361572265625, 2.827392578125, 2.965423583984375, 3.10345458984375, 3.241485595703125, 3.3795166015625, 3.517547607421875, 3.65557861328125, 3.793609619140625, 3.931640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 10.0, 13.0, 9.0, 17.0, 23.0, 40.0, 45.0, 49.0, 110.0, 153.0, 234.0, 355.0, 542.0, 931.0, 1516.0, 2938.0, 5727.0, 11238.0, 23909.0, 57783.0, 152515.0, 338033.0, 268941.0, 105624.0, 41159.0, 17989.0, 8501.0, 4370.0, 2325.0, 1290.0, 772.0, 479.0, 318.0, 164.0, 121.0, 80.0, 64.0, 51.0, 28.0, 25.0, 14.0, 14.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.732421875, -0.7107620239257812, -0.6891021728515625, -0.6674423217773438, -0.645782470703125, -0.6241226196289062, -0.6024627685546875, -0.5808029174804688, -0.55914306640625, -0.5374832153320312, -0.5158233642578125, -0.49416351318359375, -0.472503662109375, -0.45084381103515625, -0.4291839599609375, -0.40752410888671875, -0.3858642578125, -0.36420440673828125, -0.3425445556640625, -0.32088470458984375, -0.299224853515625, -0.27756500244140625, -0.2559051513671875, -0.23424530029296875, -0.21258544921875, -0.19092559814453125, -0.1692657470703125, -0.14760589599609375, -0.125946044921875, -0.10428619384765625, -0.0826263427734375, -0.06096649169921875, -0.039306640625, -0.01764678955078125, 0.0040130615234375, 0.02567291259765625, 0.047332763671875, 0.06899261474609375, 0.0906524658203125, 0.11231231689453125, 0.13397216796875, 0.15563201904296875, 0.1772918701171875, 0.19895172119140625, 0.220611572265625, 0.24227142333984375, 0.2639312744140625, 0.28559112548828125, 0.3072509765625, 0.32891082763671875, 0.3505706787109375, 0.37223052978515625, 0.393890380859375, 0.41555023193359375, 0.4372100830078125, 0.45886993408203125, 0.48052978515625, 0.5021896362304688, 0.5238494873046875, 0.5455093383789062, 0.567169189453125, 0.5888290405273438, 0.6104888916015625, 0.6321487426757812, 0.65380859375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 6.0, 2.0, 11.0, 4.0, 8.0, 18.0, 18.0, 23.0, 23.0, 28.0, 36.0, 39.0, 39.0, 35.0, 58.0, 57.0, 64.0, 63.0, 61.0, 50.0, 56.0, 50.0, 29.0, 40.0, 46.0, 20.0, 21.0, 18.0, 13.0, 14.0, 9.0, 7.0, 6.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7298927307128906e-05, -2.6444904506206512e-05, -2.559088170528412e-05, -2.4736858904361725e-05, -2.388283610343933e-05, -2.3028813302516937e-05, -2.2174790501594543e-05, -2.132076770067215e-05, -2.0466744899749756e-05, -1.9612722098827362e-05, -1.8758699297904968e-05, -1.7904676496982574e-05, -1.705065369606018e-05, -1.6196630895137787e-05, -1.5342608094215393e-05, -1.4488585293293e-05, -1.3634562492370605e-05, -1.2780539691448212e-05, -1.1926516890525818e-05, -1.1072494089603424e-05, -1.021847128868103e-05, -9.364448487758636e-06, -8.510425686836243e-06, -7.656402885913849e-06, -6.802380084991455e-06, -5.948357284069061e-06, -5.0943344831466675e-06, -4.240311682224274e-06, -3.38628888130188e-06, -2.532266080379486e-06, -1.6782432794570923e-06, -8.242204785346985e-07, 2.9802322387695312e-08, 8.838251233100891e-07, 1.737847924232483e-06, 2.5918707251548767e-06, 3.4458935260772705e-06, 4.299916326999664e-06, 5.153939127922058e-06, 6.007961928844452e-06, 6.861984729766846e-06, 7.71600753068924e-06, 8.570030331611633e-06, 9.424053132534027e-06, 1.0278075933456421e-05, 1.1132098734378815e-05, 1.1986121535301208e-05, 1.2840144336223602e-05, 1.3694167137145996e-05, 1.454818993806839e-05, 1.5402212738990784e-05, 1.6256235539913177e-05, 1.711025834083557e-05, 1.7964281141757965e-05, 1.881830394268036e-05, 1.9672326743602753e-05, 2.0526349544525146e-05, 2.138037234544754e-05, 2.2234395146369934e-05, 2.3088417947292328e-05, 2.394244074821472e-05, 2.4796463549137115e-05, 2.565048635005951e-05, 2.6504509150981903e-05, 2.7358531951904297e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 2.0, 3.0, 6.0, 10.0, 11.0, 21.0, 28.0, 40.0, 51.0, 77.0, 133.0, 169.0, 279.0, 474.0, 740.0, 1089.0, 1848.0, 2821.0, 4722.0, 7959.0, 13726.0, 24930.0, 46666.0, 90862.0, 171910.0, 247295.0, 198640.0, 109126.0, 55853.0, 29250.0, 16156.0, 9282.0, 5417.0, 3315.0, 2114.0, 1268.0, 789.0, 520.0, 338.0, 204.0, 127.0, 95.0, 60.0, 53.0, 22.0, 15.0, 15.0, 9.0, 7.0, 3.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5751953125, -0.5575714111328125, -0.539947509765625, -0.5223236083984375, -0.50469970703125, -0.4870758056640625, -0.469451904296875, -0.4518280029296875, -0.4342041015625, -0.4165802001953125, -0.398956298828125, -0.3813323974609375, -0.36370849609375, -0.3460845947265625, -0.328460693359375, -0.3108367919921875, -0.293212890625, -0.2755889892578125, -0.257965087890625, -0.2403411865234375, -0.22271728515625, -0.2050933837890625, -0.187469482421875, -0.1698455810546875, -0.1522216796875, -0.1345977783203125, -0.116973876953125, -0.0993499755859375, -0.08172607421875, -0.0641021728515625, -0.046478271484375, -0.0288543701171875, -0.01123046875, 0.0063934326171875, 0.024017333984375, 0.0416412353515625, 0.05926513671875, 0.0768890380859375, 0.094512939453125, 0.1121368408203125, 0.1297607421875, 0.1473846435546875, 0.165008544921875, 0.1826324462890625, 0.20025634765625, 0.2178802490234375, 0.235504150390625, 0.2531280517578125, 0.270751953125, 0.2883758544921875, 0.305999755859375, 0.3236236572265625, 0.34124755859375, 0.3588714599609375, 0.376495361328125, 0.3941192626953125, 0.4117431640625, 0.4293670654296875, 0.446990966796875, 0.4646148681640625, 0.48223876953125, 0.4998626708984375, 0.517486572265625, 0.5351104736328125, 0.552734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 4.0, 14.0, 18.0, 16.0, 21.0, 25.0, 33.0, 34.0, 41.0, 49.0, 53.0, 67.0, 65.0, 74.0, 58.0, 62.0, 57.0, 44.0, 44.0, 37.0, 28.0, 24.0, 20.0, 22.0, 12.0, 8.0, 14.0, 8.0, 12.0, 4.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.185791015625, -0.1806621551513672, -0.17553329467773438, -0.17040443420410156, -0.16527557373046875, -0.16014671325683594, -0.15501785278320312, -0.1498889923095703, -0.1447601318359375, -0.1396312713623047, -0.13450241088867188, -0.12937355041503906, -0.12424468994140625, -0.11911582946777344, -0.11398696899414062, -0.10885810852050781, -0.103729248046875, -0.09860038757324219, -0.09347152709960938, -0.08834266662597656, -0.08321380615234375, -0.07808494567871094, -0.07295608520507812, -0.06782722473144531, -0.0626983642578125, -0.05756950378417969, -0.052440643310546875, -0.04731178283691406, -0.04218292236328125, -0.03705406188964844, -0.031925201416015625, -0.026796340942382812, -0.02166748046875, -0.016538619995117188, -0.011409759521484375, -0.0062808990478515625, -0.00115203857421875, 0.0039768218994140625, 0.009105682373046875, 0.014234542846679688, 0.0193634033203125, 0.024492263793945312, 0.029621124267578125, 0.03474998474121094, 0.03987884521484375, 0.04500770568847656, 0.050136566162109375, 0.05526542663574219, 0.060394287109375, 0.06552314758300781, 0.07065200805664062, 0.07578086853027344, 0.08090972900390625, 0.08603858947753906, 0.09116744995117188, 0.09629631042480469, 0.1014251708984375, 0.10655403137207031, 0.11168289184570312, 0.11681175231933594, 0.12194061279296875, 0.12706947326660156, 0.13219833374023438, 0.1373271942138672, 0.1424560546875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 15.0, 16.0, 22.0, 20.0, 25.0, 33.0, 39.0, 54.0, 62.0, 57.0, 85.0, 72.0, 58.0, 60.0, 48.0, 53.0, 50.0, 43.0, 32.0, 28.0, 21.0, 15.0, 12.0, 9.0, 12.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.76326847076416, -9.42093276977539, -9.078598022460938, -8.736262321472168, -8.393926620483398, -8.051591873168945, -7.709256172180176, -7.3669209480285645, -7.024585723876953, -6.682250499725342, -6.3399152755737305, -5.997579574584961, -5.65524435043335, -5.312909126281738, -4.970573425292969, -4.628238201141357, -4.285902976989746, -3.9435677528381348, -3.6012322902679443, -3.258896827697754, -2.9165616035461426, -2.5742263793945312, -2.231890916824341, -1.8895554542541504, -1.547220230102539, -1.2048848867416382, -0.8625495433807373, -0.5202142000198364, -0.17787885665893555, 0.16445648670196533, 0.5067918300628662, 0.8491272926330566, 1.1914615631103516, 1.5337969064712524, 1.8761322498321533, 2.2184677124023438, 2.560802936553955, 2.9031381607055664, 3.245473623275757, 3.5878090858459473, 3.9301443099975586, 4.27247953414917, 4.614814758300781, 4.957150459289551, 5.299485683441162, 5.641820907592773, 5.984156608581543, 6.326491832733154, 6.668827056884766, 7.011162281036377, 7.353497505187988, 7.695833206176758, 8.038167953491211, 8.38050365447998, 8.72283935546875, 9.065174102783203, 9.407509803771973, 9.749845504760742, 10.092180252075195, 10.434515953063965, 10.776851654052734, 11.119186401367188, 11.461522102355957, 11.803857803344727, 12.14619255065918]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 7.0, 8.0, 5.0, 10.0, 15.0, 16.0, 27.0, 35.0, 33.0, 25.0, 29.0, 37.0, 48.0, 37.0, 49.0, 51.0, 56.0, 45.0, 65.0, 48.0, 54.0, 38.0, 30.0, 44.0, 41.0, 31.0, 36.0, 20.0, 15.0, 14.0, 4.0, 8.0, 7.0, 2.0, 1.0, 8.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.499058723449707, -8.256243705749512, -8.013429641723633, -7.7706146240234375, -7.5278000831604, -7.284985542297363, -7.042170524597168, -6.799355983734131, -6.556541442871094, -6.313726902008057, -6.070911884307861, -5.828097343444824, -5.585282802581787, -5.34246826171875, -5.099653244018555, -4.856838703155518, -4.614023685455322, -4.371209144592285, -4.12839412689209, -3.8855795860290527, -3.6427650451660156, -3.3999502658843994, -3.157135486602783, -2.914320945739746, -2.67150616645813, -2.4286913871765137, -2.1858768463134766, -1.9430620670318604, -1.7002474069595337, -1.457432746887207, -1.2146179676055908, -0.9718033075332642, -0.7289881706237793, -0.48617348074913025, -0.2433587908744812, -0.0005440711975097656, 0.2422705888748169, 0.48508524894714355, 0.7279000282287598, 0.9707146883010864, 1.213529348373413, 1.4563440084457397, 1.6991586685180664, 1.9419734477996826, 2.184788227081299, 2.427602767944336, 2.670417547225952, 2.9132323265075684, 3.1560468673706055, 3.3988616466522217, 3.641676187515259, 3.884490966796875, 4.127305507659912, 4.370120048522949, 4.6129350662231445, 4.855749607086182, 5.098564147949219, 5.341378688812256, 5.584193706512451, 5.827008247375488, 6.069822788238525, 6.3126373291015625, 6.555452346801758, 6.798266887664795, 7.04108190536499]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 7.0, 22.0, 36.0, 46.0, 74.0, 114.0, 147.0, 266.0, 482.0, 760.0, 1289.0, 2098.0, 3641.0, 6242.0, 10480.0, 18049.0, 29697.0, 47461.0, 72904.0, 102262.0, 130436.0, 144371.0, 137272.0, 113481.0, 82920.0, 55740.0, 35289.0, 21432.0, 12806.0, 7565.0, 4518.0, 2663.0, 1596.0, 973.0, 548.0, 344.0, 213.0, 116.0, 78.0, 48.0, 21.0, 15.0, 7.0, 9.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.83203125, -5.653564453125, -5.47509765625, -5.296630859375, -5.1181640625, -4.939697265625, -4.76123046875, -4.582763671875, -4.404296875, -4.225830078125, -4.04736328125, -3.868896484375, -3.6904296875, -3.511962890625, -3.33349609375, -3.155029296875, -2.9765625, -2.798095703125, -2.61962890625, -2.441162109375, -2.2626953125, -2.084228515625, -1.90576171875, -1.727294921875, -1.548828125, -1.370361328125, -1.19189453125, -1.013427734375, -0.8349609375, -0.656494140625, -0.47802734375, -0.299560546875, -0.12109375, 0.057373046875, 0.23583984375, 0.414306640625, 0.5927734375, 0.771240234375, 0.94970703125, 1.128173828125, 1.306640625, 1.485107421875, 1.66357421875, 1.842041015625, 2.0205078125, 2.198974609375, 2.37744140625, 2.555908203125, 2.734375, 2.912841796875, 3.09130859375, 3.269775390625, 3.4482421875, 3.626708984375, 3.80517578125, 3.983642578125, 4.162109375, 4.340576171875, 4.51904296875, 4.697509765625, 4.8759765625, 5.054443359375, 5.23291015625, 5.411376953125, 5.58984375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 3.0, 7.0, 8.0, 6.0, 2.0, 17.0, 15.0, 22.0, 29.0, 30.0, 18.0, 35.0, 34.0, 40.0, 36.0, 36.0, 44.0, 34.0, 52.0, 43.0, 52.0, 56.0, 45.0, 46.0, 38.0, 32.0, 29.0, 33.0, 22.0, 29.0, 26.0, 17.0, 7.0, 14.0, 9.0, 5.0, 8.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5, -6.2774658203125, -6.054931640625, -5.8323974609375, -5.60986328125, -5.3873291015625, -5.164794921875, -4.9422607421875, -4.7197265625, -4.4971923828125, -4.274658203125, -4.0521240234375, -3.82958984375, -3.6070556640625, -3.384521484375, -3.1619873046875, -2.939453125, -2.7169189453125, -2.494384765625, -2.2718505859375, -2.04931640625, -1.8267822265625, -1.604248046875, -1.3817138671875, -1.1591796875, -0.9366455078125, -0.714111328125, -0.4915771484375, -0.26904296875, -0.0465087890625, 0.176025390625, 0.3985595703125, 0.62109375, 0.8436279296875, 1.066162109375, 1.2886962890625, 1.51123046875, 1.7337646484375, 1.956298828125, 2.1788330078125, 2.4013671875, 2.6239013671875, 2.846435546875, 3.0689697265625, 3.29150390625, 3.5140380859375, 3.736572265625, 3.9591064453125, 4.181640625, 4.4041748046875, 4.626708984375, 4.8492431640625, 5.07177734375, 5.2943115234375, 5.516845703125, 5.7393798828125, 5.9619140625, 6.1844482421875, 6.406982421875, 6.6295166015625, 6.85205078125, 7.0745849609375, 7.297119140625, 7.5196533203125, 7.7421875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 12.0, 10.0, 17.0, 36.0, 50.0, 100.0, 129.0, 288.0, 484.0, 935.0, 1970.0, 3773.0, 7515.0, 15132.0, 29696.0, 55508.0, 96385.0, 146245.0, 182706.0, 178744.0, 138162.0, 87616.0, 49837.0, 26297.0, 13404.0, 6576.0, 3369.0, 1671.0, 863.0, 460.0, 244.0, 116.0, 82.0, 36.0, 29.0, 24.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73046875, -6.48931884765625, -6.2481689453125, -6.00701904296875, -5.765869140625, -5.52471923828125, -5.2835693359375, -5.04241943359375, -4.80126953125, -4.56011962890625, -4.3189697265625, -4.07781982421875, -3.836669921875, -3.59552001953125, -3.3543701171875, -3.11322021484375, -2.8720703125, -2.63092041015625, -2.3897705078125, -2.14862060546875, -1.907470703125, -1.66632080078125, -1.4251708984375, -1.18402099609375, -0.94287109375, -0.70172119140625, -0.4605712890625, -0.21942138671875, 0.021728515625, 0.26287841796875, 0.5040283203125, 0.74517822265625, 0.986328125, 1.22747802734375, 1.4686279296875, 1.70977783203125, 1.950927734375, 2.19207763671875, 2.4332275390625, 2.67437744140625, 2.91552734375, 3.15667724609375, 3.3978271484375, 3.63897705078125, 3.880126953125, 4.12127685546875, 4.3624267578125, 4.60357666015625, 4.8447265625, 5.08587646484375, 5.3270263671875, 5.56817626953125, 5.809326171875, 6.05047607421875, 6.2916259765625, 6.53277587890625, 6.77392578125, 7.01507568359375, 7.2562255859375, 7.49737548828125, 7.738525390625, 7.97967529296875, 8.2208251953125, 8.46197509765625, 8.703125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 9.0, 12.0, 7.0, 15.0, 23.0, 21.0, 16.0, 15.0, 18.0, 24.0, 29.0, 23.0, 38.0, 35.0, 43.0, 42.0, 35.0, 42.0, 51.0, 50.0, 48.0, 45.0, 44.0, 31.0, 39.0, 27.0, 33.0, 26.0, 32.0, 32.0, 18.0, 14.0, 11.0, 12.0, 12.0, 8.0, 5.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.17578125, -4.049957275390625, -3.92413330078125, -3.798309326171875, -3.6724853515625, -3.546661376953125, -3.42083740234375, -3.295013427734375, -3.169189453125, -3.043365478515625, -2.91754150390625, -2.791717529296875, -2.6658935546875, -2.540069580078125, -2.41424560546875, -2.288421630859375, -2.16259765625, -2.036773681640625, -1.91094970703125, -1.785125732421875, -1.6593017578125, -1.533477783203125, -1.40765380859375, -1.281829833984375, -1.156005859375, -1.030181884765625, -0.90435791015625, -0.778533935546875, -0.6527099609375, -0.526885986328125, -0.40106201171875, -0.275238037109375, -0.1494140625, -0.023590087890625, 0.10223388671875, 0.228057861328125, 0.3538818359375, 0.479705810546875, 0.60552978515625, 0.731353759765625, 0.857177734375, 0.983001708984375, 1.10882568359375, 1.234649658203125, 1.3604736328125, 1.486297607421875, 1.61212158203125, 1.737945556640625, 1.86376953125, 1.989593505859375, 2.11541748046875, 2.241241455078125, 2.3670654296875, 2.492889404296875, 2.61871337890625, 2.744537353515625, 2.870361328125, 2.996185302734375, 3.12200927734375, 3.247833251953125, 3.3736572265625, 3.499481201171875, 3.62530517578125, 3.751129150390625, 3.876953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 10.0, 9.0, 13.0, 19.0, 20.0, 32.0, 42.0, 84.0, 110.0, 135.0, 241.0, 369.0, 513.0, 824.0, 1280.0, 2122.0, 3480.0, 5661.0, 9787.0, 17171.0, 30558.0, 54552.0, 96003.0, 150944.0, 194174.0, 180075.0, 125555.0, 75298.0, 42543.0, 23627.0, 13445.0, 7755.0, 4474.0, 2757.0, 1718.0, 1138.0, 708.0, 457.0, 279.0, 189.0, 125.0, 83.0, 61.0, 42.0, 26.0, 15.0, 9.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.23828125, -4.1005859375, -3.962890625, -3.8251953125, -3.6875, -3.5498046875, -3.412109375, -3.2744140625, -3.13671875, -2.9990234375, -2.861328125, -2.7236328125, -2.5859375, -2.4482421875, -2.310546875, -2.1728515625, -2.03515625, -1.8974609375, -1.759765625, -1.6220703125, -1.484375, -1.3466796875, -1.208984375, -1.0712890625, -0.93359375, -0.7958984375, -0.658203125, -0.5205078125, -0.3828125, -0.2451171875, -0.107421875, 0.0302734375, 0.16796875, 0.3056640625, 0.443359375, 0.5810546875, 0.71875, 0.8564453125, 0.994140625, 1.1318359375, 1.26953125, 1.4072265625, 1.544921875, 1.6826171875, 1.8203125, 1.9580078125, 2.095703125, 2.2333984375, 2.37109375, 2.5087890625, 2.646484375, 2.7841796875, 2.921875, 3.0595703125, 3.197265625, 3.3349609375, 3.47265625, 3.6103515625, 3.748046875, 3.8857421875, 4.0234375, 4.1611328125, 4.298828125, 4.4365234375, 4.57421875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 1.0, 4.0, 6.0, 7.0, 10.0, 10.0, 20.0, 26.0, 29.0, 34.0, 34.0, 59.0, 68.0, 46.0, 50.0, 66.0, 62.0, 72.0, 68.0, 66.0, 52.0, 42.0, 33.0, 33.0, 28.0, 21.0, 16.0, 13.0, 9.0, 6.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035643577575683594, -0.0003442205488681793, -0.0003320053219795227, -0.0003197900950908661, -0.00030757486820220947, -0.00029535964131355286, -0.00028314441442489624, -0.0002709291875362396, -0.000258713960647583, -0.0002464987337589264, -0.00023428350687026978, -0.00022206827998161316, -0.00020985305309295654, -0.00019763782620429993, -0.0001854225993156433, -0.0001732073724269867, -0.00016099214553833008, -0.00014877691864967346, -0.00013656169176101685, -0.00012434646487236023, -0.00011213123798370361, -9.9916011095047e-05, -8.770078420639038e-05, -7.548555731773376e-05, -6.327033042907715e-05, -5.105510354042053e-05, -3.8839876651763916e-05, -2.66246497631073e-05, -1.4409422874450684e-05, -2.1941959857940674e-06, 1.0021030902862549e-05, 2.2236257791519165e-05, 3.445148468017578e-05, 4.66667115688324e-05, 5.8881938457489014e-05, 7.109716534614563e-05, 8.331239223480225e-05, 9.552761912345886e-05, 0.00010774284601211548, 0.0001199580729007721, 0.0001321732997894287, 0.00014438852667808533, 0.00015660375356674194, 0.00016881898045539856, 0.00018103420734405518, 0.0001932494342327118, 0.0002054646611213684, 0.00021767988801002502, 0.00022989511489868164, 0.00024211034178733826, 0.0002543255686759949, 0.0002665407955646515, 0.0002787560224533081, 0.0002909712493419647, 0.00030318647623062134, 0.00031540170311927795, 0.00032761693000793457, 0.0003398321568965912, 0.0003520473837852478, 0.0003642626106739044, 0.00037647783756256104, 0.00038869306445121765, 0.00040090829133987427, 0.0004131235182285309, 0.0004253387451171875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 15.0, 22.0, 38.0, 32.0, 76.0, 97.0, 169.0, 272.0, 348.0, 587.0, 966.0, 1388.0, 2247.0, 3721.0, 6013.0, 9753.0, 16566.0, 27285.0, 46091.0, 73565.0, 110621.0, 147631.0, 164465.0, 145947.0, 108205.0, 71180.0, 44039.0, 26401.0, 15781.0, 9511.0, 5823.0, 3535.0, 2313.0, 1422.0, 859.0, 566.0, 353.0, 229.0, 148.0, 98.0, 64.0, 42.0, 15.0, 20.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0], "bins": [-4.140625, -4.027069091796875, -3.91351318359375, -3.799957275390625, -3.6864013671875, -3.572845458984375, -3.45928955078125, -3.345733642578125, -3.232177734375, -3.118621826171875, -3.00506591796875, -2.891510009765625, -2.7779541015625, -2.664398193359375, -2.55084228515625, -2.437286376953125, -2.32373046875, -2.210174560546875, -2.09661865234375, -1.983062744140625, -1.8695068359375, -1.755950927734375, -1.64239501953125, -1.528839111328125, -1.415283203125, -1.301727294921875, -1.18817138671875, -1.074615478515625, -0.9610595703125, -0.847503662109375, -0.73394775390625, -0.620391845703125, -0.5068359375, -0.393280029296875, -0.27972412109375, -0.166168212890625, -0.0526123046875, 0.060943603515625, 0.17449951171875, 0.288055419921875, 0.401611328125, 0.515167236328125, 0.62872314453125, 0.742279052734375, 0.8558349609375, 0.969390869140625, 1.08294677734375, 1.196502685546875, 1.31005859375, 1.423614501953125, 1.53717041015625, 1.650726318359375, 1.7642822265625, 1.877838134765625, 1.99139404296875, 2.104949951171875, 2.218505859375, 2.332061767578125, 2.44561767578125, 2.559173583984375, 2.6727294921875, 2.786285400390625, 2.89984130859375, 3.013397216796875, 3.126953125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 5.0, 7.0, 7.0, 7.0, 6.0, 16.0, 8.0, 9.0, 18.0, 22.0, 20.0, 18.0, 30.0, 35.0, 28.0, 43.0, 42.0, 45.0, 53.0, 61.0, 53.0, 54.0, 40.0, 35.0, 48.0, 41.0, 29.0, 36.0, 31.0, 22.0, 18.0, 14.0, 17.0, 13.0, 16.0, 8.0, 12.0, 8.0, 4.0, 2.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87744140625, -0.8489837646484375, -0.820526123046875, -0.7920684814453125, -0.76361083984375, -0.7351531982421875, -0.706695556640625, -0.6782379150390625, -0.6497802734375, -0.6213226318359375, -0.592864990234375, -0.5644073486328125, -0.53594970703125, -0.5074920654296875, -0.479034423828125, -0.4505767822265625, -0.422119140625, -0.3936614990234375, -0.365203857421875, -0.3367462158203125, -0.30828857421875, -0.2798309326171875, -0.251373291015625, -0.2229156494140625, -0.1944580078125, -0.1660003662109375, -0.137542724609375, -0.1090850830078125, -0.08062744140625, -0.0521697998046875, -0.023712158203125, 0.0047454833984375, 0.033203125, 0.0616607666015625, 0.090118408203125, 0.1185760498046875, 0.14703369140625, 0.1754913330078125, 0.203948974609375, 0.2324066162109375, 0.2608642578125, 0.2893218994140625, 0.317779541015625, 0.3462371826171875, 0.37469482421875, 0.4031524658203125, 0.431610107421875, 0.4600677490234375, 0.488525390625, 0.5169830322265625, 0.545440673828125, 0.5738983154296875, 0.60235595703125, 0.6308135986328125, 0.659271240234375, 0.6877288818359375, 0.7161865234375, 0.7446441650390625, 0.773101806640625, 0.8015594482421875, 0.83001708984375, 0.8584747314453125, 0.886932373046875, 0.9153900146484375, 0.94384765625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 11.0, 12.0, 13.0, 20.0, 17.0, 21.0, 36.0, 43.0, 49.0, 73.0, 75.0, 68.0, 67.0, 74.0, 72.0, 54.0, 59.0, 48.0, 47.0, 33.0, 29.0, 13.0, 11.0, 10.0, 6.0, 7.0, 8.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.292928695678711, -10.910783767700195, -10.528639793395996, -10.14649486541748, -9.764349937438965, -9.382205963134766, -9.00006103515625, -8.617916107177734, -8.235772132873535, -7.853627681732178, -7.471482753753662, -7.089338302612305, -6.707193851470947, -6.32504940032959, -5.942904472351074, -5.560760021209717, -5.178615093231201, -4.796470642089844, -4.414325714111328, -4.032181262969971, -3.6500368118286133, -3.2678921222686768, -2.8857474327087402, -2.503602981567383, -2.1214582920074463, -1.7393137216567993, -1.3571691513061523, -0.9750244617462158, -0.5928798913955688, -0.21073532104492188, 0.17140936851501465, 0.5535538196563721, 0.9356985092163086, 1.3178430795669556, 1.6999876499176025, 2.082132339477539, 2.4642767906188965, 2.846421480178833, 3.2285661697387695, 3.610710620880127, 3.9928553104400635, 4.375, 4.757144451141357, 5.139288902282715, 5.5214338302612305, 5.903578281402588, 6.285722732543945, 6.667867660522461, 7.050012111663818, 7.432156562805176, 7.814301490783691, 8.19644546508789, 8.578590393066406, 8.960735321044922, 9.342880249023438, 9.725024223327637, 10.107169151306152, 10.489314079284668, 10.871458053588867, 11.253602981567383, 11.635747909545898, 12.017891883850098, 12.400036811828613, 12.782180786132812, 13.164325714111328]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 5.0, 3.0, 5.0, 10.0, 7.0, 15.0, 15.0, 18.0, 20.0, 24.0, 24.0, 20.0, 36.0, 31.0, 36.0, 42.0, 44.0, 48.0, 34.0, 42.0, 50.0, 42.0, 45.0, 41.0, 46.0, 32.0, 47.0, 29.0, 32.0, 33.0, 20.0, 20.0, 19.0, 13.0, 13.0, 14.0, 11.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.322488784790039, -7.1039958000183105, -6.88550329208374, -6.667010307312012, -6.448517799377441, -6.230024814605713, -6.011531829833984, -5.793039321899414, -5.5745463371276855, -5.356053352355957, -5.137560844421387, -4.919067859649658, -4.70057487487793, -4.482082366943359, -4.263589382171631, -4.045096397399902, -3.826603889465332, -3.6081111431121826, -3.389618396759033, -3.1711254119873047, -2.9526326656341553, -2.734139919281006, -2.5156469345092773, -2.297154188156128, -2.0786614418029785, -1.860168695449829, -1.6416758298873901, -1.4231829643249512, -1.2046902179718018, -0.9861974716186523, -0.7677046060562134, -0.5492117404937744, -0.3307194709777832, -0.11222666501998901, 0.10626614093780518, 0.32475894689559937, 0.5432517528533936, 0.761744499206543, 0.9802373647689819, 1.198730230331421, 1.4172229766845703, 1.6357157230377197, 1.8542085886001587, 2.0727014541625977, 2.291194200515747, 2.5096869468688965, 2.728179931640625, 2.9466726779937744, 3.165165424346924, 3.3836581707000732, 3.6021509170532227, 3.820643901824951, 4.03913688659668, 4.25762939453125, 4.4761223793029785, 4.694615364074707, 4.913107872009277, 5.131600856781006, 5.350093364715576, 5.568586349487305, 5.787078857421875, 6.0055718421936035, 6.224064826965332, 6.442557334899902, 6.661050319671631]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 11.0, 9.0, 10.0, 16.0, 30.0, 31.0, 55.0, 82.0, 114.0, 192.0, 278.0, 387.0, 620.0, 957.0, 1340.0, 2099.0, 3361.0, 5246.0, 8318.0, 13530.0, 21862.0, 35989.0, 59042.0, 98607.0, 162258.0, 261307.0, 403459.0, 558484.0, 649954.0, 610010.0, 466983.0, 316047.0, 199595.0, 122262.0, 73721.0, 45296.0, 27392.0, 16802.0, 10582.0, 6407.0, 4187.0, 2627.0, 1659.0, 1018.0, 729.0, 454.0, 318.0, 210.0, 107.0, 86.0, 54.0, 29.0, 19.0, 18.0, 11.0, 10.0, 5.0, 4.0], "bins": [-7.37109375, -7.15875244140625, -6.9464111328125, -6.73406982421875, -6.521728515625, -6.30938720703125, -6.0970458984375, -5.88470458984375, -5.67236328125, -5.46002197265625, -5.2476806640625, -5.03533935546875, -4.822998046875, -4.61065673828125, -4.3983154296875, -4.18597412109375, -3.9736328125, -3.76129150390625, -3.5489501953125, -3.33660888671875, -3.124267578125, -2.91192626953125, -2.6995849609375, -2.48724365234375, -2.27490234375, -2.06256103515625, -1.8502197265625, -1.63787841796875, -1.425537109375, -1.21319580078125, -1.0008544921875, -0.78851318359375, -0.576171875, -0.36383056640625, -0.1514892578125, 0.06085205078125, 0.273193359375, 0.48553466796875, 0.6978759765625, 0.91021728515625, 1.12255859375, 1.33489990234375, 1.5472412109375, 1.75958251953125, 1.971923828125, 2.18426513671875, 2.3966064453125, 2.60894775390625, 2.8212890625, 3.03363037109375, 3.2459716796875, 3.45831298828125, 3.670654296875, 3.88299560546875, 4.0953369140625, 4.30767822265625, 4.52001953125, 4.73236083984375, 4.9447021484375, 5.15704345703125, 5.369384765625, 5.58172607421875, 5.7940673828125, 6.00640869140625, 6.21875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 0.0, 8.0, 14.0, 13.0, 15.0, 18.0, 13.0, 28.0, 28.0, 24.0, 34.0, 33.0, 25.0, 34.0, 36.0, 41.0, 41.0, 47.0, 50.0, 44.0, 36.0, 26.0, 41.0, 39.0, 44.0, 40.0, 31.0, 35.0, 35.0, 16.0, 16.0, 19.0, 21.0, 11.0, 6.0, 9.0, 5.0, 5.0, 6.0, 1.0, 1.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.73046875, -4.58154296875, -4.4326171875, -4.28369140625, -4.134765625, -3.98583984375, -3.8369140625, -3.68798828125, -3.5390625, -3.39013671875, -3.2412109375, -3.09228515625, -2.943359375, -2.79443359375, -2.6455078125, -2.49658203125, -2.34765625, -2.19873046875, -2.0498046875, -1.90087890625, -1.751953125, -1.60302734375, -1.4541015625, -1.30517578125, -1.15625, -1.00732421875, -0.8583984375, -0.70947265625, -0.560546875, -0.41162109375, -0.2626953125, -0.11376953125, 0.03515625, 0.18408203125, 0.3330078125, 0.48193359375, 0.630859375, 0.77978515625, 0.9287109375, 1.07763671875, 1.2265625, 1.37548828125, 1.5244140625, 1.67333984375, 1.822265625, 1.97119140625, 2.1201171875, 2.26904296875, 2.41796875, 2.56689453125, 2.7158203125, 2.86474609375, 3.013671875, 3.16259765625, 3.3115234375, 3.46044921875, 3.609375, 3.75830078125, 3.9072265625, 4.05615234375, 4.205078125, 4.35400390625, 4.5029296875, 4.65185546875, 4.80078125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 13.0, 26.0, 35.0, 53.0, 73.0, 123.0, 181.0, 322.0, 551.0, 842.0, 1368.0, 2271.0, 3799.0, 6172.0, 10182.0, 17248.0, 29354.0, 49361.0, 82850.0, 137599.0, 221263.0, 339520.0, 477015.0, 590845.0, 613046.0, 529922.0, 394969.0, 265226.0, 167296.0, 102395.0, 61167.0, 36162.0, 21393.0, 12465.0, 7617.0, 4575.0, 2733.0, 1663.0, 970.0, 590.0, 397.0, 234.0, 137.0, 105.0, 43.0, 41.0, 26.0, 12.0, 12.0, 7.0, 5.0, 3.0, 3.0], "bins": [-7.9453125, -7.7196044921875, -7.493896484375, -7.2681884765625, -7.04248046875, -6.8167724609375, -6.591064453125, -6.3653564453125, -6.1396484375, -5.9139404296875, -5.688232421875, -5.4625244140625, -5.23681640625, -5.0111083984375, -4.785400390625, -4.5596923828125, -4.333984375, -4.1082763671875, -3.882568359375, -3.6568603515625, -3.43115234375, -3.2054443359375, -2.979736328125, -2.7540283203125, -2.5283203125, -2.3026123046875, -2.076904296875, -1.8511962890625, -1.62548828125, -1.3997802734375, -1.174072265625, -0.9483642578125, -0.72265625, -0.4969482421875, -0.271240234375, -0.0455322265625, 0.18017578125, 0.4058837890625, 0.631591796875, 0.8572998046875, 1.0830078125, 1.3087158203125, 1.534423828125, 1.7601318359375, 1.98583984375, 2.2115478515625, 2.437255859375, 2.6629638671875, 2.888671875, 3.1143798828125, 3.340087890625, 3.5657958984375, 3.79150390625, 4.0172119140625, 4.242919921875, 4.4686279296875, 4.6943359375, 4.9200439453125, 5.145751953125, 5.3714599609375, 5.59716796875, 5.8228759765625, 6.048583984375, 6.2742919921875, 6.5]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 7.0, 14.0, 13.0, 24.0, 20.0, 20.0, 35.0, 60.0, 64.0, 93.0, 89.0, 111.0, 113.0, 138.0, 170.0, 184.0, 209.0, 207.0, 206.0, 247.0, 232.0, 232.0, 203.0, 197.0, 179.0, 173.0, 142.0, 124.0, 112.0, 89.0, 57.0, 75.0, 36.0, 50.0, 29.0, 20.0, 33.0, 19.0, 9.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.35247802734375, -2.2713623046875, -2.19024658203125, -2.109130859375, -2.02801513671875, -1.9468994140625, -1.86578369140625, -1.78466796875, -1.70355224609375, -1.6224365234375, -1.54132080078125, -1.460205078125, -1.37908935546875, -1.2979736328125, -1.21685791015625, -1.1357421875, -1.05462646484375, -0.9735107421875, -0.89239501953125, -0.811279296875, -0.73016357421875, -0.6490478515625, -0.56793212890625, -0.48681640625, -0.40570068359375, -0.3245849609375, -0.24346923828125, -0.162353515625, -0.08123779296875, -0.0001220703125, 0.08099365234375, 0.162109375, 0.24322509765625, 0.3243408203125, 0.40545654296875, 0.486572265625, 0.56768798828125, 0.6488037109375, 0.72991943359375, 0.81103515625, 0.89215087890625, 0.9732666015625, 1.05438232421875, 1.135498046875, 1.21661376953125, 1.2977294921875, 1.37884521484375, 1.4599609375, 1.54107666015625, 1.6221923828125, 1.70330810546875, 1.784423828125, 1.86553955078125, 1.9466552734375, 2.02777099609375, 2.10888671875, 2.19000244140625, 2.2711181640625, 2.35223388671875, 2.433349609375, 2.51446533203125, 2.5955810546875, 2.67669677734375, 2.7578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 6.0, 7.0, 10.0, 5.0, 7.0, 15.0, 25.0, 11.0, 23.0, 19.0, 52.0, 44.0, 67.0, 66.0, 65.0, 61.0, 93.0, 56.0, 68.0, 50.0, 52.0, 38.0, 46.0, 25.0, 25.0, 14.0, 10.0, 13.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.586697578430176, -11.213223457336426, -10.839749336242676, -10.466275215148926, -10.092802047729492, -9.719327926635742, -9.345853805541992, -8.972379684448242, -8.598905563354492, -8.225431442260742, -7.851957321166992, -7.4784836769104, -7.10500955581665, -6.7315354347229, -6.358061790466309, -5.984587669372559, -5.611113548278809, -5.237639427185059, -4.864165306091309, -4.490691661834717, -4.117217540740967, -3.743743419647217, -3.370269536972046, -2.996795654296875, -2.623321533203125, -2.249847412109375, -1.876373529434204, -1.5028995275497437, -1.1294255256652832, -0.7559515237808228, -0.3824775218963623, -0.009003639221191406, 0.364471435546875, 0.7379454374313354, 1.111419439315796, 1.4848934412002563, 1.8583674430847168, 2.231841564178467, 2.6053154468536377, 2.9787893295288086, 3.3522634506225586, 3.7257375717163086, 4.099211692810059, 4.47268533706665, 4.8461594581604, 5.21963357925415, 5.593107223510742, 5.966581344604492, 6.340055465698242, 6.713529586791992, 7.087003707885742, 7.460477352142334, 7.833951473236084, 8.207425117492676, 8.580899238586426, 8.954373359680176, 9.327847480773926, 9.701321601867676, 10.074795722961426, 10.448269844055176, 10.82174301147461, 11.19521713256836, 11.56869125366211, 11.94216537475586, 12.31563949584961]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 11.0, 7.0, 8.0, 11.0, 19.0, 13.0, 14.0, 30.0, 26.0, 34.0, 28.0, 37.0, 35.0, 40.0, 57.0, 44.0, 37.0, 44.0, 44.0, 52.0, 36.0, 40.0, 48.0, 42.0, 33.0, 25.0, 31.0, 24.0, 20.0, 20.0, 14.0, 8.0, 14.0, 17.0, 6.0, 4.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.685784816741943, -6.483177185058594, -6.280569553375244, -6.0779619216918945, -5.875354766845703, -5.6727471351623535, -5.470139503479004, -5.267531871795654, -5.064924240112305, -4.862316608428955, -4.6597089767456055, -4.457101821899414, -4.2544941902160645, -4.051886558532715, -3.8492789268493652, -3.6466712951660156, -3.444063901901245, -3.2414562702178955, -3.038848876953125, -2.8362412452697754, -2.633633613586426, -2.431025981903076, -2.2284185886383057, -2.025810956954956, -1.823203444480896, -1.620595932006836, -1.4179883003234863, -1.2153807878494263, -1.0127732753753662, -0.8101656436920166, -0.6075581312179565, -0.40495049953460693, -0.20234298706054688, 0.00026457011699676514, 0.2028721272945404, 0.40547966957092285, 0.6080872416496277, 0.8106948137283325, 1.0133023262023926, 1.2159099578857422, 1.4185174703598022, 1.6211249828338623, 1.823732614517212, 2.0263400077819824, 2.228947639465332, 2.4315552711486816, 2.6341629028320312, 2.836770534515381, 3.0393779277801514, 3.241985559463501, 3.4445929527282715, 3.647200584411621, 3.8498082160949707, 4.05241584777832, 4.255023002624512, 4.4576311111450195, 4.660238265991211, 4.8628458976745605, 5.06545352935791, 5.268060684204102, 5.470668315887451, 5.673275947570801, 5.87588357925415, 6.0784912109375, 6.28109884262085]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 1.0, 6.0, 11.0, 12.0, 15.0, 32.0, 27.0, 46.0, 55.0, 77.0, 99.0, 154.0, 196.0, 303.0, 403.0, 617.0, 976.0, 1529.0, 2374.0, 3954.0, 6796.0, 12108.0, 22191.0, 41579.0, 76883.0, 137821.0, 205506.0, 209368.0, 144359.0, 81887.0, 44102.0, 23364.0, 12815.0, 7380.0, 4222.0, 2541.0, 1518.0, 990.0, 685.0, 481.0, 302.0, 229.0, 163.0, 96.0, 79.0, 65.0, 42.0, 26.0, 19.0, 15.0, 15.0, 6.0, 8.0, 8.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8798828125, -1.8193359375, -1.7587890625, -1.6982421875, -1.6376953125, -1.5771484375, -1.5166015625, -1.4560546875, -1.3955078125, -1.3349609375, -1.2744140625, -1.2138671875, -1.1533203125, -1.0927734375, -1.0322265625, -0.9716796875, -0.9111328125, -0.8505859375, -0.7900390625, -0.7294921875, -0.6689453125, -0.6083984375, -0.5478515625, -0.4873046875, -0.4267578125, -0.3662109375, -0.3056640625, -0.2451171875, -0.1845703125, -0.1240234375, -0.0634765625, -0.0029296875, 0.0576171875, 0.1181640625, 0.1787109375, 0.2392578125, 0.2998046875, 0.3603515625, 0.4208984375, 0.4814453125, 0.5419921875, 0.6025390625, 0.6630859375, 0.7236328125, 0.7841796875, 0.8447265625, 0.9052734375, 0.9658203125, 1.0263671875, 1.0869140625, 1.1474609375, 1.2080078125, 1.2685546875, 1.3291015625, 1.3896484375, 1.4501953125, 1.5107421875, 1.5712890625, 1.6318359375, 1.6923828125, 1.7529296875, 1.8134765625, 1.8740234375, 1.9345703125, 1.9951171875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 5.0, 12.0, 18.0, 13.0, 14.0, 23.0, 21.0, 28.0, 35.0, 29.0, 35.0, 36.0, 38.0, 49.0, 41.0, 46.0, 48.0, 51.0, 57.0, 45.0, 35.0, 47.0, 43.0, 35.0, 39.0, 30.0, 18.0, 22.0, 14.0, 11.0, 10.0, 11.0, 12.0, 5.0, 7.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3203125, -6.0958251953125, -5.871337890625, -5.6468505859375, -5.42236328125, -5.1978759765625, -4.973388671875, -4.7489013671875, -4.5244140625, -4.2999267578125, -4.075439453125, -3.8509521484375, -3.62646484375, -3.4019775390625, -3.177490234375, -2.9530029296875, -2.728515625, -2.5040283203125, -2.279541015625, -2.0550537109375, -1.83056640625, -1.6060791015625, -1.381591796875, -1.1571044921875, -0.9326171875, -0.7081298828125, -0.483642578125, -0.2591552734375, -0.03466796875, 0.1898193359375, 0.414306640625, 0.6387939453125, 0.86328125, 1.0877685546875, 1.312255859375, 1.5367431640625, 1.76123046875, 1.9857177734375, 2.210205078125, 2.4346923828125, 2.6591796875, 2.8836669921875, 3.108154296875, 3.3326416015625, 3.55712890625, 3.7816162109375, 4.006103515625, 4.2305908203125, 4.455078125, 4.6795654296875, 4.904052734375, 5.1285400390625, 5.35302734375, 5.5775146484375, 5.802001953125, 6.0264892578125, 6.2509765625, 6.4754638671875, 6.699951171875, 6.9244384765625, 7.14892578125, 7.3734130859375, 7.597900390625, 7.8223876953125, 8.046875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 10.0, 28.0, 19.0, 40.0, 60.0, 97.0, 159.0, 250.0, 463.0, 945.0, 2059.0, 5172.0, 17373.0, 77130.0, 344952.0, 443660.0, 118717.0, 25310.0, 6993.0, 2606.0, 1143.0, 599.0, 285.0, 167.0, 98.0, 79.0, 39.0, 25.0, 16.0, 13.0, 10.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.47265625, -5.3074951171875, -5.142333984375, -4.9771728515625, -4.81201171875, -4.6468505859375, -4.481689453125, -4.3165283203125, -4.1513671875, -3.9862060546875, -3.821044921875, -3.6558837890625, -3.49072265625, -3.3255615234375, -3.160400390625, -2.9952392578125, -2.830078125, -2.6649169921875, -2.499755859375, -2.3345947265625, -2.16943359375, -2.0042724609375, -1.839111328125, -1.6739501953125, -1.5087890625, -1.3436279296875, -1.178466796875, -1.0133056640625, -0.84814453125, -0.6829833984375, -0.517822265625, -0.3526611328125, -0.1875, -0.0223388671875, 0.142822265625, 0.3079833984375, 0.47314453125, 0.6383056640625, 0.803466796875, 0.9686279296875, 1.1337890625, 1.2989501953125, 1.464111328125, 1.6292724609375, 1.79443359375, 1.9595947265625, 2.124755859375, 2.2899169921875, 2.455078125, 2.6202392578125, 2.785400390625, 2.9505615234375, 3.11572265625, 3.2808837890625, 3.446044921875, 3.6112060546875, 3.7763671875, 3.9415283203125, 4.106689453125, 4.2718505859375, 4.43701171875, 4.6021728515625, 4.767333984375, 4.9324951171875, 5.09765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 6.0, 8.0, 5.0, 6.0, 13.0, 8.0, 12.0, 15.0, 19.0, 25.0, 24.0, 26.0, 39.0, 34.0, 33.0, 43.0, 35.0, 29.0, 39.0, 43.0, 40.0, 44.0, 36.0, 39.0, 47.0, 33.0, 37.0, 25.0, 42.0, 24.0, 22.0, 20.0, 18.0, 25.0, 21.0, 6.0, 7.0, 10.0, 6.0, 4.0, 9.0, 5.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.58984375, -3.47161865234375, -3.3533935546875, -3.23516845703125, -3.116943359375, -2.99871826171875, -2.8804931640625, -2.76226806640625, -2.64404296875, -2.52581787109375, -2.4075927734375, -2.28936767578125, -2.171142578125, -2.05291748046875, -1.9346923828125, -1.81646728515625, -1.6982421875, -1.58001708984375, -1.4617919921875, -1.34356689453125, -1.225341796875, -1.10711669921875, -0.9888916015625, -0.87066650390625, -0.75244140625, -0.63421630859375, -0.5159912109375, -0.39776611328125, -0.279541015625, -0.16131591796875, -0.0430908203125, 0.07513427734375, 0.193359375, 0.31158447265625, 0.4298095703125, 0.54803466796875, 0.666259765625, 0.78448486328125, 0.9027099609375, 1.02093505859375, 1.13916015625, 1.25738525390625, 1.3756103515625, 1.49383544921875, 1.612060546875, 1.73028564453125, 1.8485107421875, 1.96673583984375, 2.0849609375, 2.20318603515625, 2.3214111328125, 2.43963623046875, 2.557861328125, 2.67608642578125, 2.7943115234375, 2.91253662109375, 3.03076171875, 3.14898681640625, 3.2672119140625, 3.38543701171875, 3.503662109375, 3.62188720703125, 3.7401123046875, 3.85833740234375, 3.9765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 9.0, 11.0, 17.0, 13.0, 21.0, 35.0, 40.0, 75.0, 106.0, 133.0, 212.0, 333.0, 498.0, 879.0, 1930.0, 4721.0, 19723.0, 459988.0, 528833.0, 21473.0, 4941.0, 1975.0, 1004.0, 557.0, 351.0, 218.0, 134.0, 82.0, 72.0, 38.0, 29.0, 37.0, 23.0, 17.0, 4.0, 5.0, 5.0, 4.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.99713134765625, -2.9063720703125, -2.81561279296875, -2.724853515625, -2.63409423828125, -2.5433349609375, -2.45257568359375, -2.36181640625, -2.27105712890625, -2.1802978515625, -2.08953857421875, -1.998779296875, -1.90802001953125, -1.8172607421875, -1.72650146484375, -1.6357421875, -1.54498291015625, -1.4542236328125, -1.36346435546875, -1.272705078125, -1.18194580078125, -1.0911865234375, -1.00042724609375, -0.90966796875, -0.81890869140625, -0.7281494140625, -0.63739013671875, -0.546630859375, -0.45587158203125, -0.3651123046875, -0.27435302734375, -0.18359375, -0.09283447265625, -0.0020751953125, 0.08868408203125, 0.179443359375, 0.27020263671875, 0.3609619140625, 0.45172119140625, 0.54248046875, 0.63323974609375, 0.7239990234375, 0.81475830078125, 0.905517578125, 0.99627685546875, 1.0870361328125, 1.17779541015625, 1.2685546875, 1.35931396484375, 1.4500732421875, 1.54083251953125, 1.631591796875, 1.72235107421875, 1.8131103515625, 1.90386962890625, 1.99462890625, 2.08538818359375, 2.1761474609375, 2.26690673828125, 2.357666015625, 2.44842529296875, 2.5391845703125, 2.62994384765625, 2.720703125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 19.0, 62.0, 172.0, 277.0, 254.0, 128.0, 36.0, 16.0, 10.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.703636169433594e-05, -9.212270379066467e-05, -8.720904588699341e-05, -8.229538798332214e-05, -7.738173007965088e-05, -7.246807217597961e-05, -6.755441427230835e-05, -6.264075636863708e-05, -5.772709846496582e-05, -5.2813440561294556e-05, -4.789978265762329e-05, -4.2986124753952026e-05, -3.807246685028076e-05, -3.31588089466095e-05, -2.8245151042938232e-05, -2.3331493139266968e-05, -1.8417835235595703e-05, -1.3504177331924438e-05, -8.590519428253174e-06, -3.676861524581909e-06, 1.2367963790893555e-06, 6.15045428276062e-06, 1.1064112186431885e-05, 1.597777009010315e-05, 2.0891427993774414e-05, 2.580508589744568e-05, 3.071874380111694e-05, 3.563240170478821e-05, 4.054605960845947e-05, 4.545971751213074e-05, 5.0373375415802e-05, 5.5287033319473267e-05, 6.020069122314453e-05, 6.51143491268158e-05, 7.002800703048706e-05, 7.494166493415833e-05, 7.985532283782959e-05, 8.476898074150085e-05, 8.968263864517212e-05, 9.459629654884338e-05, 9.950995445251465e-05, 0.00010442361235618591, 0.00010933727025985718, 0.00011425092816352844, 0.00011916458606719971, 0.00012407824397087097, 0.00012899190187454224, 0.0001339055597782135, 0.00013881921768188477, 0.00014373287558555603, 0.0001486465334892273, 0.00015356019139289856, 0.00015847384929656982, 0.0001633875072002411, 0.00016830116510391235, 0.00017321482300758362, 0.00017812848091125488, 0.00018304213881492615, 0.0001879557967185974, 0.00019286945462226868, 0.00019778311252593994, 0.0002026967704296112, 0.00020761042833328247, 0.00021252408623695374, 0.000217437744140625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 8.0, 17.0, 9.0, 14.0, 23.0, 20.0, 46.0, 60.0, 85.0, 110.0, 158.0, 269.0, 396.0, 636.0, 1054.0, 1637.0, 3040.0, 6046.0, 15170.0, 58440.0, 361695.0, 482565.0, 82310.0, 19204.0, 7129.0, 3402.0, 1944.0, 1069.0, 691.0, 425.0, 260.0, 180.0, 141.0, 95.0, 43.0, 46.0, 28.0, 19.0, 17.0, 13.0, 12.0, 10.0, 4.0, 2.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7138671875, -1.6604766845703125, -1.607086181640625, -1.5536956787109375, -1.50030517578125, -1.4469146728515625, -1.393524169921875, -1.3401336669921875, -1.2867431640625, -1.2333526611328125, -1.179962158203125, -1.1265716552734375, -1.07318115234375, -1.0197906494140625, -0.966400146484375, -0.9130096435546875, -0.859619140625, -0.8062286376953125, -0.752838134765625, -0.6994476318359375, -0.64605712890625, -0.5926666259765625, -0.539276123046875, -0.4858856201171875, -0.4324951171875, -0.3791046142578125, -0.325714111328125, -0.2723236083984375, -0.21893310546875, -0.1655426025390625, -0.112152099609375, -0.0587615966796875, -0.00537109375, 0.0480194091796875, 0.101409912109375, 0.1548004150390625, 0.20819091796875, 0.2615814208984375, 0.314971923828125, 0.3683624267578125, 0.4217529296875, 0.4751434326171875, 0.528533935546875, 0.5819244384765625, 0.63531494140625, 0.6887054443359375, 0.742095947265625, 0.7954864501953125, 0.848876953125, 0.9022674560546875, 0.955657958984375, 1.0090484619140625, 1.06243896484375, 1.1158294677734375, 1.169219970703125, 1.2226104736328125, 1.2760009765625, 1.3293914794921875, 1.382781982421875, 1.4361724853515625, 1.48956298828125, 1.5429534912109375, 1.596343994140625, 1.6497344970703125, 1.703125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 4.0, 10.0, 17.0, 30.0, 41.0, 84.0, 124.0, 185.0, 181.0, 121.0, 83.0, 46.0, 28.0, 15.0, 8.0, 4.0, 1.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37646484375, -0.365386962890625, -0.35430908203125, -0.343231201171875, -0.3321533203125, -0.321075439453125, -0.30999755859375, -0.298919677734375, -0.287841796875, -0.276763916015625, -0.26568603515625, -0.254608154296875, -0.2435302734375, -0.232452392578125, -0.22137451171875, -0.210296630859375, -0.19921875, -0.188140869140625, -0.17706298828125, -0.165985107421875, -0.1549072265625, -0.143829345703125, -0.13275146484375, -0.121673583984375, -0.110595703125, -0.099517822265625, -0.08843994140625, -0.077362060546875, -0.0662841796875, -0.055206298828125, -0.04412841796875, -0.033050537109375, -0.02197265625, -0.010894775390625, 0.00018310546875, 0.011260986328125, 0.0223388671875, 0.033416748046875, 0.04449462890625, 0.055572509765625, 0.066650390625, 0.077728271484375, 0.08880615234375, 0.099884033203125, 0.1109619140625, 0.122039794921875, 0.13311767578125, 0.144195556640625, 0.1552734375, 0.166351318359375, 0.17742919921875, 0.188507080078125, 0.1995849609375, 0.210662841796875, 0.22174072265625, 0.232818603515625, 0.243896484375, 0.254974365234375, 0.26605224609375, 0.277130126953125, 0.2882080078125, 0.299285888671875, 0.31036376953125, 0.321441650390625, 0.33251953125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 9.0, 9.0, 6.0, 7.0, 11.0, 21.0, 19.0, 13.0, 25.0, 35.0, 38.0, 62.0, 75.0, 56.0, 69.0, 76.0, 63.0, 60.0, 67.0, 45.0, 53.0, 39.0, 38.0, 24.0, 21.0, 11.0, 10.0, 13.0, 5.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.272560119628906, -10.903301239013672, -10.534042358398438, -10.16478443145752, -9.795525550842285, -9.42626667022705, -9.057008743286133, -8.687749862670898, -8.318490982055664, -7.94923210144043, -7.5799736976623535, -7.210715293884277, -6.841456413269043, -6.472197532653809, -6.102939128875732, -5.733680725097656, -5.364421844482422, -4.9951629638671875, -4.625904560089111, -4.256646156311035, -3.887387275695801, -3.5181286334991455, -3.1488699913024902, -2.779611349105835, -2.4103527069091797, -2.0410940647125244, -1.6718354225158691, -1.3025767803192139, -0.9333181381225586, -0.5640594959259033, -0.19480085372924805, 0.17445778846740723, 0.5437164306640625, 0.9129750728607178, 1.282233715057373, 1.6514923572540283, 2.0207509994506836, 2.390009641647339, 2.759268283843994, 3.1285269260406494, 3.4977855682373047, 3.86704421043396, 4.236302852630615, 4.605561256408691, 4.974820137023926, 5.34407901763916, 5.713337421417236, 6.0825958251953125, 6.451854705810547, 6.821113586425781, 7.190371990203857, 7.559630393981934, 7.928889274597168, 8.298148155212402, 8.66740608215332, 9.036664962768555, 9.405923843383789, 9.775182723999023, 10.144441604614258, 10.513699531555176, 10.88295841217041, 11.252217292785645, 11.621475219726562, 11.990734100341797, 12.359992980957031]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 5.0, 11.0, 7.0, 8.0, 12.0, 19.0, 12.0, 16.0, 30.0, 26.0, 34.0, 28.0, 36.0, 32.0, 48.0, 52.0, 44.0, 42.0, 40.0, 44.0, 55.0, 37.0, 39.0, 42.0, 44.0, 37.0, 23.0, 31.0, 24.0, 18.0, 22.0, 15.0, 5.0, 17.0, 16.0, 4.0, 5.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.671492099761963, -6.468455791473389, -6.265419960021973, -6.062383651733398, -5.859347820281982, -5.656311511993408, -5.453275680541992, -5.250239372253418, -5.047203063964844, -4.8441667556762695, -4.6411309242248535, -4.438094615936279, -4.235058784484863, -4.032022476196289, -3.828986406326294, -3.625950336456299, -3.422914505004883, -3.2198784351348877, -3.0168423652648926, -2.8138060569763184, -2.6107702255249023, -2.407733917236328, -2.204697847366333, -2.001661777496338, -1.7986257076263428, -1.5955896377563477, -1.3925535678863525, -1.1895173788070679, -0.9864813089370728, -0.7834452390670776, -0.580409049987793, -0.37737298011779785, -0.17433691024780273, 0.02869918942451477, 0.23173528909683228, 0.43477141857147217, 0.6378074884414673, 0.8408435583114624, 1.043879747390747, 1.2469158172607422, 1.4499518871307373, 1.6529879570007324, 1.8560240268707275, 2.0590600967407227, 2.262096405029297, 2.465132236480713, 2.668168544769287, 2.8712046146392822, 3.0742406845092773, 3.2772767543792725, 3.4803128242492676, 3.683349132537842, 3.886384963989258, 4.089421272277832, 4.292457580566406, 4.495493412017822, 4.698529243469238, 4.9015655517578125, 5.1046013832092285, 5.307637691497803, 5.510673522949219, 5.713709831237793, 5.916746139526367, 6.119781970977783, 6.322818279266357]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 11.0, 13.0, 15.0, 24.0, 36.0, 59.0, 73.0, 110.0, 174.0, 242.0, 404.0, 610.0, 1054.0, 1648.0, 2959.0, 5333.0, 9857.0, 18072.0, 34135.0, 62483.0, 106632.0, 159262.0, 189554.0, 171348.0, 121774.0, 73253.0, 41018.0, 21920.0, 11571.0, 6311.0, 3411.0, 1964.0, 1211.0, 746.0, 436.0, 295.0, 190.0, 108.0, 79.0, 53.0, 41.0, 27.0, 16.0, 12.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.917724609375, -6.64794921875, -6.378173828125, -6.1083984375, -5.838623046875, -5.56884765625, -5.299072265625, -5.029296875, -4.759521484375, -4.48974609375, -4.219970703125, -3.9501953125, -3.680419921875, -3.41064453125, -3.140869140625, -2.87109375, -2.601318359375, -2.33154296875, -2.061767578125, -1.7919921875, -1.522216796875, -1.25244140625, -0.982666015625, -0.712890625, -0.443115234375, -0.17333984375, 0.096435546875, 0.3662109375, 0.635986328125, 0.90576171875, 1.175537109375, 1.4453125, 1.715087890625, 1.98486328125, 2.254638671875, 2.5244140625, 2.794189453125, 3.06396484375, 3.333740234375, 3.603515625, 3.873291015625, 4.14306640625, 4.412841796875, 4.6826171875, 4.952392578125, 5.22216796875, 5.491943359375, 5.76171875, 6.031494140625, 6.30126953125, 6.571044921875, 6.8408203125, 7.110595703125, 7.38037109375, 7.650146484375, 7.919921875, 8.189697265625, 8.45947265625, 8.729248046875, 8.9990234375, 9.268798828125, 9.53857421875, 9.808349609375, 10.078125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 4.0, 5.0, 14.0, 11.0, 14.0, 14.0, 11.0, 22.0, 21.0, 23.0, 28.0, 36.0, 30.0, 27.0, 37.0, 35.0, 35.0, 36.0, 25.0, 52.0, 43.0, 45.0, 38.0, 40.0, 37.0, 49.0, 32.0, 23.0, 25.0, 18.0, 35.0, 24.0, 15.0, 22.0, 12.0, 5.0, 8.0, 11.0, 9.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3984375, -6.1982421875, -5.998046875, -5.7978515625, -5.59765625, -5.3974609375, -5.197265625, -4.9970703125, -4.796875, -4.5966796875, -4.396484375, -4.1962890625, -3.99609375, -3.7958984375, -3.595703125, -3.3955078125, -3.1953125, -2.9951171875, -2.794921875, -2.5947265625, -2.39453125, -2.1943359375, -1.994140625, -1.7939453125, -1.59375, -1.3935546875, -1.193359375, -0.9931640625, -0.79296875, -0.5927734375, -0.392578125, -0.1923828125, 0.0078125, 0.2080078125, 0.408203125, 0.6083984375, 0.80859375, 1.0087890625, 1.208984375, 1.4091796875, 1.609375, 1.8095703125, 2.009765625, 2.2099609375, 2.41015625, 2.6103515625, 2.810546875, 3.0107421875, 3.2109375, 3.4111328125, 3.611328125, 3.8115234375, 4.01171875, 4.2119140625, 4.412109375, 4.6123046875, 4.8125, 5.0126953125, 5.212890625, 5.4130859375, 5.61328125, 5.8134765625, 6.013671875, 6.2138671875, 6.4140625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 12.0, 14.0, 14.0, 22.0, 41.0, 49.0, 84.0, 88.0, 175.0, 224.0, 344.0, 464.0, 744.0, 1134.0, 1597.0, 2505.0, 4020.0, 6199.0, 10135.0, 16153.0, 25605.0, 40373.0, 60863.0, 86089.0, 112369.0, 131400.0, 134883.0, 120503.0, 95319.0, 69017.0, 46475.0, 30098.0, 18941.0, 11939.0, 7405.0, 4612.0, 2966.0, 1828.0, 1214.0, 837.0, 568.0, 356.0, 238.0, 206.0, 119.0, 103.0, 69.0, 44.0, 34.0, 23.0, 18.0, 7.0, 4.0, 7.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.9921875, -5.7935791015625, -5.594970703125, -5.3963623046875, -5.19775390625, -4.9991455078125, -4.800537109375, -4.6019287109375, -4.4033203125, -4.2047119140625, -4.006103515625, -3.8074951171875, -3.60888671875, -3.4102783203125, -3.211669921875, -3.0130615234375, -2.814453125, -2.6158447265625, -2.417236328125, -2.2186279296875, -2.02001953125, -1.8214111328125, -1.622802734375, -1.4241943359375, -1.2255859375, -1.0269775390625, -0.828369140625, -0.6297607421875, -0.43115234375, -0.2325439453125, -0.033935546875, 0.1646728515625, 0.36328125, 0.5618896484375, 0.760498046875, 0.9591064453125, 1.15771484375, 1.3563232421875, 1.554931640625, 1.7535400390625, 1.9521484375, 2.1507568359375, 2.349365234375, 2.5479736328125, 2.74658203125, 2.9451904296875, 3.143798828125, 3.3424072265625, 3.541015625, 3.7396240234375, 3.938232421875, 4.1368408203125, 4.33544921875, 4.5340576171875, 4.732666015625, 4.9312744140625, 5.1298828125, 5.3284912109375, 5.527099609375, 5.7257080078125, 5.92431640625, 6.1229248046875, 6.321533203125, 6.5201416015625, 6.71875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 2.0, 7.0, 6.0, 4.0, 12.0, 10.0, 9.0, 19.0, 21.0, 20.0, 27.0, 25.0, 22.0, 34.0, 30.0, 26.0, 34.0, 26.0, 53.0, 36.0, 38.0, 45.0, 30.0, 38.0, 41.0, 36.0, 40.0, 35.0, 27.0, 36.0, 29.0, 30.0, 21.0, 20.0, 11.0, 17.0, 25.0, 11.0, 11.0, 8.0, 6.0, 7.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.689453125, -3.5704345703125, -3.451416015625, -3.3323974609375, -3.21337890625, -3.0943603515625, -2.975341796875, -2.8563232421875, -2.7373046875, -2.6182861328125, -2.499267578125, -2.3802490234375, -2.26123046875, -2.1422119140625, -2.023193359375, -1.9041748046875, -1.78515625, -1.6661376953125, -1.547119140625, -1.4281005859375, -1.30908203125, -1.1900634765625, -1.071044921875, -0.9520263671875, -0.8330078125, -0.7139892578125, -0.594970703125, -0.4759521484375, -0.35693359375, -0.2379150390625, -0.118896484375, 0.0001220703125, 0.119140625, 0.2381591796875, 0.357177734375, 0.4761962890625, 0.59521484375, 0.7142333984375, 0.833251953125, 0.9522705078125, 1.0712890625, 1.1903076171875, 1.309326171875, 1.4283447265625, 1.54736328125, 1.6663818359375, 1.785400390625, 1.9044189453125, 2.0234375, 2.1424560546875, 2.261474609375, 2.3804931640625, 2.49951171875, 2.6185302734375, 2.737548828125, 2.8565673828125, 2.9755859375, 3.0946044921875, 3.213623046875, 3.3326416015625, 3.45166015625, 3.5706787109375, 3.689697265625, 3.8087158203125, 3.927734375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 8.0, 12.0, 14.0, 44.0, 57.0, 74.0, 114.0, 162.0, 277.0, 355.0, 579.0, 963.0, 1390.0, 2418.0, 3943.0, 7215.0, 12932.0, 23806.0, 45427.0, 87348.0, 157409.0, 224792.0, 205293.0, 127466.0, 67837.0, 35456.0, 18467.0, 10216.0, 5819.0, 3365.0, 1932.0, 1262.0, 696.0, 514.0, 325.0, 187.0, 129.0, 70.0, 60.0, 46.0, 29.0, 19.0, 9.0, 9.0, 5.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.53466796875, -6.3154296875, -6.09619140625, -5.876953125, -5.65771484375, -5.4384765625, -5.21923828125, -5.0, -4.78076171875, -4.5615234375, -4.34228515625, -4.123046875, -3.90380859375, -3.6845703125, -3.46533203125, -3.24609375, -3.02685546875, -2.8076171875, -2.58837890625, -2.369140625, -2.14990234375, -1.9306640625, -1.71142578125, -1.4921875, -1.27294921875, -1.0537109375, -0.83447265625, -0.615234375, -0.39599609375, -0.1767578125, 0.04248046875, 0.26171875, 0.48095703125, 0.7001953125, 0.91943359375, 1.138671875, 1.35791015625, 1.5771484375, 1.79638671875, 2.015625, 2.23486328125, 2.4541015625, 2.67333984375, 2.892578125, 3.11181640625, 3.3310546875, 3.55029296875, 3.76953125, 3.98876953125, 4.2080078125, 4.42724609375, 4.646484375, 4.86572265625, 5.0849609375, 5.30419921875, 5.5234375, 5.74267578125, 5.9619140625, 6.18115234375, 6.400390625, 6.61962890625, 6.8388671875, 7.05810546875, 7.27734375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 6.0, 13.0, 7.0, 19.0, 18.0, 28.0, 29.0, 31.0, 63.0, 65.0, 86.0, 62.0, 83.0, 95.0, 71.0, 73.0, 45.0, 55.0, 32.0, 23.0, 20.0, 17.0, 12.0, 10.0, 5.0, 3.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006594657897949219, -0.0006401613354682922, -0.0006208568811416626, -0.000601552426815033, -0.0005822479724884033, -0.0005629435181617737, -0.000543639063835144, -0.0005243346095085144, -0.0005050301551818848, -0.0004857257008552551, -0.0004664212465286255, -0.00044711679220199585, -0.0004278123378753662, -0.00040850788354873657, -0.00038920342922210693, -0.0003698989748954773, -0.00035059452056884766, -0.000331290066242218, -0.0003119856119155884, -0.00029268115758895874, -0.0002733767032623291, -0.00025407224893569946, -0.00023476779460906982, -0.00021546334028244019, -0.00019615888595581055, -0.0001768544316291809, -0.00015754997730255127, -0.00013824552297592163, -0.00011894106864929199, -9.963661432266235e-05, -8.033215999603271e-05, -6.1027705669403076e-05, -4.172325134277344e-05, -2.24187970161438e-05, -3.11434268951416e-06, 1.619011163711548e-05, 3.549456596374512e-05, 5.4799020290374756e-05, 7.41034746170044e-05, 9.340792894363403e-05, 0.00011271238327026367, 0.0001320168375968933, 0.00015132129192352295, 0.0001706257462501526, 0.00018993020057678223, 0.00020923465490341187, 0.0002285391092300415, 0.00024784356355667114, 0.0002671480178833008, 0.0002864524722099304, 0.00030575692653656006, 0.0003250613808631897, 0.00034436583518981934, 0.000363670289516449, 0.0003829747438430786, 0.00040227919816970825, 0.0004215836524963379, 0.00044088810682296753, 0.00046019256114959717, 0.0004794970154762268, 0.0004988014698028564, 0.0005181059241294861, 0.0005374103784561157, 0.0005567148327827454, 0.000576019287109375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 1.0, 5.0, 4.0, 8.0, 8.0, 19.0, 23.0, 37.0, 58.0, 90.0, 163.0, 248.0, 468.0, 729.0, 1287.0, 2320.0, 4370.0, 8232.0, 16410.0, 33622.0, 70044.0, 138349.0, 223919.0, 234862.0, 154864.0, 80423.0, 38877.0, 18683.0, 9571.0, 4818.0, 2603.0, 1443.0, 793.0, 425.0, 274.0, 201.0, 104.0, 68.0, 46.0, 30.0, 11.0, 17.0, 10.0, 10.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-7.6171875, -7.400146484375, -7.18310546875, -6.966064453125, -6.7490234375, -6.531982421875, -6.31494140625, -6.097900390625, -5.880859375, -5.663818359375, -5.44677734375, -5.229736328125, -5.0126953125, -4.795654296875, -4.57861328125, -4.361572265625, -4.14453125, -3.927490234375, -3.71044921875, -3.493408203125, -3.2763671875, -3.059326171875, -2.84228515625, -2.625244140625, -2.408203125, -2.191162109375, -1.97412109375, -1.757080078125, -1.5400390625, -1.322998046875, -1.10595703125, -0.888916015625, -0.671875, -0.454833984375, -0.23779296875, -0.020751953125, 0.1962890625, 0.413330078125, 0.63037109375, 0.847412109375, 1.064453125, 1.281494140625, 1.49853515625, 1.715576171875, 1.9326171875, 2.149658203125, 2.36669921875, 2.583740234375, 2.80078125, 3.017822265625, 3.23486328125, 3.451904296875, 3.6689453125, 3.885986328125, 4.10302734375, 4.320068359375, 4.537109375, 4.754150390625, 4.97119140625, 5.188232421875, 5.4052734375, 5.622314453125, 5.83935546875, 6.056396484375, 6.2734375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 3.0, 9.0, 6.0, 8.0, 12.0, 14.0, 19.0, 28.0, 40.0, 45.0, 68.0, 75.0, 89.0, 88.0, 91.0, 85.0, 76.0, 54.0, 54.0, 35.0, 30.0, 19.0, 12.0, 11.0, 9.0, 9.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8761444091796875, -1.800140380859375, -1.7241363525390625, -1.64813232421875, -1.5721282958984375, -1.496124267578125, -1.4201202392578125, -1.3441162109375, -1.2681121826171875, -1.192108154296875, -1.1161041259765625, -1.04010009765625, -0.9640960693359375, -0.888092041015625, -0.8120880126953125, -0.736083984375, -0.6600799560546875, -0.584075927734375, -0.5080718994140625, -0.43206787109375, -0.3560638427734375, -0.280059814453125, -0.2040557861328125, -0.1280517578125, -0.0520477294921875, 0.023956298828125, 0.0999603271484375, 0.17596435546875, 0.2519683837890625, 0.327972412109375, 0.4039764404296875, 0.47998046875, 0.5559844970703125, 0.631988525390625, 0.7079925537109375, 0.78399658203125, 0.8600006103515625, 0.936004638671875, 1.0120086669921875, 1.0880126953125, 1.1640167236328125, 1.240020751953125, 1.3160247802734375, 1.39202880859375, 1.4680328369140625, 1.544036865234375, 1.6200408935546875, 1.696044921875, 1.7720489501953125, 1.848052978515625, 1.9240570068359375, 2.00006103515625, 2.0760650634765625, 2.152069091796875, 2.2280731201171875, 2.3040771484375, 2.3800811767578125, 2.456085205078125, 2.5320892333984375, 2.60809326171875, 2.6840972900390625, 2.760101318359375, 2.8361053466796875, 2.912109375]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 12.0, 5.0, 8.0, 9.0, 17.0, 16.0, 21.0, 27.0, 30.0, 33.0, 41.0, 56.0, 63.0, 56.0, 55.0, 57.0, 67.0, 65.0, 52.0, 39.0, 55.0, 30.0, 44.0, 34.0, 22.0, 18.0, 14.0, 9.0, 9.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.519061088562012, -9.180553436279297, -8.842044830322266, -8.50353717803955, -8.165029525756836, -7.826521396636963, -7.48801326751709, -7.149505615234375, -6.810997486114502, -6.472489356994629, -6.133981704711914, -5.795473575592041, -5.456965446472168, -5.118457794189453, -4.77994966506958, -4.441441535949707, -4.102933883666992, -3.7644259929656982, -3.4259181022644043, -3.0874099731445312, -2.7489020824432373, -2.4103941917419434, -2.0718860626220703, -1.7333781719207764, -1.3948702812194824, -1.0563623905181885, -0.717854380607605, -0.3793463706970215, -0.04083847999572754, 0.2976694107055664, 0.6361775398254395, 0.9746854305267334, 1.3131933212280273, 1.6517012119293213, 1.9902092218399048, 2.3287172317504883, 2.6672251224517822, 3.005733013153076, 3.344241142272949, 3.682749032974243, 4.021256923675537, 4.35976505279541, 4.698272705078125, 5.036780834197998, 5.375288963317871, 5.713796615600586, 6.052304744720459, 6.390812873840332, 6.729320526123047, 7.06782865524292, 7.406336307525635, 7.744844436645508, 8.083352088928223, 8.421859741210938, 8.760368347167969, 9.098875999450684, 9.437383651733398, 9.775891304016113, 10.114399909973145, 10.45290756225586, 10.791415214538574, 11.129922866821289, 11.46843147277832, 11.806939125061035, 12.145447731018066]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 10.0, 17.0, 14.0, 9.0, 13.0, 19.0, 17.0, 16.0, 23.0, 32.0, 36.0, 23.0, 39.0, 39.0, 41.0, 50.0, 40.0, 52.0, 37.0, 46.0, 49.0, 43.0, 45.0, 37.0, 40.0, 29.0, 27.0, 25.0, 17.0, 18.0, 22.0, 16.0, 8.0, 8.0, 12.0, 5.0, 5.0, 2.0, 7.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.005425453186035, -6.794717788696289, -6.584010601043701, -6.373302936553955, -6.162595748901367, -5.951888084411621, -5.741180419921875, -5.530472755432129, -5.319765567779541, -5.109057903289795, -4.898350715637207, -4.687643051147461, -4.476935386657715, -4.266228199005127, -4.055520534515381, -3.844813108444214, -3.634105682373047, -3.42339825630188, -3.212690830230713, -3.001983165740967, -2.7912757396698, -2.580568313598633, -2.3698606491088867, -2.1591532230377197, -1.9484457969665527, -1.7377383708953857, -1.5270308256149292, -1.3163232803344727, -1.1056158542633057, -0.8949084281921387, -0.6842008829116821, -0.4734933376312256, -0.2627859115600586, -0.052078425884246826, 0.15862905979156494, 0.3693365454673767, 0.5800440311431885, 0.7907514572143555, 1.001459002494812, 1.2121665477752686, 1.4228739738464355, 1.6335813999176025, 1.844288945198059, 2.0549964904785156, 2.2657039165496826, 2.4764113426208496, 2.6871190071105957, 2.8978264331817627, 3.1085338592529297, 3.3192412853240967, 3.5299487113952637, 3.7406563758850098, 3.9513638019561768, 4.162071228027344, 4.37277889251709, 4.583486557006836, 4.794193744659424, 5.00490140914917, 5.215608596801758, 5.426316261291504, 5.63702392578125, 5.847731113433838, 6.058438777923584, 6.269145965576172, 6.479853630065918]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 10.0, 2.0, 8.0, 17.0, 31.0, 37.0, 48.0, 98.0, 131.0, 242.0, 359.0, 545.0, 853.0, 1480.0, 2420.0, 4194.0, 7017.0, 12175.0, 21369.0, 37709.0, 66775.0, 119748.0, 211627.0, 361629.0, 561868.0, 726801.0, 716542.0, 540513.0, 341801.0, 199220.0, 113228.0, 63013.0, 35472.0, 19805.0, 11378.0, 6565.0, 3884.0, 2259.0, 1400.0, 777.0, 451.0, 315.0, 185.0, 121.0, 51.0, 45.0, 38.0, 11.0, 8.0, 8.0, 5.0, 1.0, 0.0, 1.0, 3.0], "bins": [-9.015625, -8.7576904296875, -8.499755859375, -8.2418212890625, -7.98388671875, -7.7259521484375, -7.468017578125, -7.2100830078125, -6.9521484375, -6.6942138671875, -6.436279296875, -6.1783447265625, -5.92041015625, -5.6624755859375, -5.404541015625, -5.1466064453125, -4.888671875, -4.6307373046875, -4.372802734375, -4.1148681640625, -3.85693359375, -3.5989990234375, -3.341064453125, -3.0831298828125, -2.8251953125, -2.5672607421875, -2.309326171875, -2.0513916015625, -1.79345703125, -1.5355224609375, -1.277587890625, -1.0196533203125, -0.76171875, -0.5037841796875, -0.245849609375, 0.0120849609375, 0.27001953125, 0.5279541015625, 0.785888671875, 1.0438232421875, 1.3017578125, 1.5596923828125, 1.817626953125, 2.0755615234375, 2.33349609375, 2.5914306640625, 2.849365234375, 3.1072998046875, 3.365234375, 3.6231689453125, 3.881103515625, 4.1390380859375, 4.39697265625, 4.6549072265625, 4.912841796875, 5.1707763671875, 5.4287109375, 5.6866455078125, 5.944580078125, 6.2025146484375, 6.46044921875, 6.7183837890625, 6.976318359375, 7.2342529296875, 7.4921875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 3.0, 1.0, 3.0, 6.0, 12.0, 10.0, 9.0, 12.0, 16.0, 16.0, 13.0, 19.0, 32.0, 33.0, 30.0, 33.0, 33.0, 35.0, 41.0, 40.0, 49.0, 54.0, 38.0, 47.0, 46.0, 42.0, 45.0, 28.0, 34.0, 37.0, 26.0, 30.0, 27.0, 8.0, 17.0, 11.0, 10.0, 7.0, 8.0, 6.0, 9.0, 5.0, 4.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.37054443359375, -4.2254638671875, -4.08038330078125, -3.935302734375, -3.79022216796875, -3.6451416015625, -3.50006103515625, -3.35498046875, -3.20989990234375, -3.0648193359375, -2.91973876953125, -2.774658203125, -2.62957763671875, -2.4844970703125, -2.33941650390625, -2.1943359375, -2.04925537109375, -1.9041748046875, -1.75909423828125, -1.614013671875, -1.46893310546875, -1.3238525390625, -1.17877197265625, -1.03369140625, -0.88861083984375, -0.7435302734375, -0.59844970703125, -0.453369140625, -0.30828857421875, -0.1632080078125, -0.01812744140625, 0.126953125, 0.27203369140625, 0.4171142578125, 0.56219482421875, 0.707275390625, 0.85235595703125, 0.9974365234375, 1.14251708984375, 1.28759765625, 1.43267822265625, 1.5777587890625, 1.72283935546875, 1.867919921875, 2.01300048828125, 2.1580810546875, 2.30316162109375, 2.4482421875, 2.59332275390625, 2.7384033203125, 2.88348388671875, 3.028564453125, 3.17364501953125, 3.3187255859375, 3.46380615234375, 3.60888671875, 3.75396728515625, 3.8990478515625, 4.04412841796875, 4.189208984375, 4.33428955078125, 4.4793701171875, 4.62445068359375, 4.76953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 8.0, 1.0, 8.0, 10.0, 15.0, 22.0, 30.0, 48.0, 80.0, 102.0, 148.0, 241.0, 374.0, 549.0, 848.0, 1298.0, 2094.0, 3195.0, 5218.0, 8378.0, 13300.0, 21447.0, 34808.0, 56195.0, 89288.0, 140648.0, 217764.0, 319807.0, 437961.0, 537950.0, 569460.0, 515363.0, 403925.0, 289198.0, 192566.0, 124353.0, 78327.0, 48875.0, 30222.0, 18773.0, 11760.0, 7201.0, 4486.0, 2854.0, 1844.0, 1244.0, 698.0, 497.0, 284.0, 176.0, 129.0, 81.0, 47.0, 33.0, 33.0, 16.0, 5.0, 6.0, 3.0, 2.0, 3.0], "bins": [-7.24609375, -7.02886962890625, -6.8116455078125, -6.59442138671875, -6.377197265625, -6.15997314453125, -5.9427490234375, -5.72552490234375, -5.50830078125, -5.29107666015625, -5.0738525390625, -4.85662841796875, -4.639404296875, -4.42218017578125, -4.2049560546875, -3.98773193359375, -3.7705078125, -3.55328369140625, -3.3360595703125, -3.11883544921875, -2.901611328125, -2.68438720703125, -2.4671630859375, -2.24993896484375, -2.03271484375, -1.81549072265625, -1.5982666015625, -1.38104248046875, -1.163818359375, -0.94659423828125, -0.7293701171875, -0.51214599609375, -0.294921875, -0.07769775390625, 0.1395263671875, 0.35675048828125, 0.573974609375, 0.79119873046875, 1.0084228515625, 1.22564697265625, 1.44287109375, 1.66009521484375, 1.8773193359375, 2.09454345703125, 2.311767578125, 2.52899169921875, 2.7462158203125, 2.96343994140625, 3.1806640625, 3.39788818359375, 3.6151123046875, 3.83233642578125, 4.049560546875, 4.26678466796875, 4.4840087890625, 4.70123291015625, 4.91845703125, 5.13568115234375, 5.3529052734375, 5.57012939453125, 5.787353515625, 6.00457763671875, 6.2218017578125, 6.43902587890625, 6.65625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 5.0, 3.0, 6.0, 12.0, 13.0, 13.0, 11.0, 25.0, 43.0, 42.0, 56.0, 61.0, 79.0, 96.0, 114.0, 123.0, 165.0, 155.0, 208.0, 200.0, 220.0, 263.0, 238.0, 245.0, 222.0, 199.0, 205.0, 157.0, 135.0, 136.0, 116.0, 100.0, 97.0, 69.0, 61.0, 49.0, 30.0, 17.0, 16.0, 21.0, 10.0, 12.0, 4.0, 5.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.947265625, -2.8619384765625, -2.776611328125, -2.6912841796875, -2.60595703125, -2.5206298828125, -2.435302734375, -2.3499755859375, -2.2646484375, -2.1793212890625, -2.093994140625, -2.0086669921875, -1.92333984375, -1.8380126953125, -1.752685546875, -1.6673583984375, -1.58203125, -1.4967041015625, -1.411376953125, -1.3260498046875, -1.24072265625, -1.1553955078125, -1.070068359375, -0.9847412109375, -0.8994140625, -0.8140869140625, -0.728759765625, -0.6434326171875, -0.55810546875, -0.4727783203125, -0.387451171875, -0.3021240234375, -0.216796875, -0.1314697265625, -0.046142578125, 0.0391845703125, 0.12451171875, 0.2098388671875, 0.295166015625, 0.3804931640625, 0.4658203125, 0.5511474609375, 0.636474609375, 0.7218017578125, 0.80712890625, 0.8924560546875, 0.977783203125, 1.0631103515625, 1.1484375, 1.2337646484375, 1.319091796875, 1.4044189453125, 1.48974609375, 1.5750732421875, 1.660400390625, 1.7457275390625, 1.8310546875, 1.9163818359375, 2.001708984375, 2.0870361328125, 2.17236328125, 2.2576904296875, 2.343017578125, 2.4283447265625, 2.513671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 0.0, 1.0, 3.0, 6.0, 8.0, 4.0, 12.0, 11.0, 17.0, 21.0, 20.0, 19.0, 31.0, 32.0, 43.0, 64.0, 44.0, 65.0, 57.0, 66.0, 70.0, 61.0, 50.0, 65.0, 45.0, 32.0, 32.0, 23.0, 26.0, 22.0, 6.0, 11.0, 8.0, 6.0, 2.0, 4.0, 3.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.530740737915039, -11.185663223266602, -10.840585708618164, -10.495508193969727, -10.150429725646973, -9.805352210998535, -9.460274696350098, -9.11519718170166, -8.770118713378906, -8.425041198730469, -8.079963684082031, -7.7348856925964355, -7.38980770111084, -7.044730186462402, -6.699652671813965, -6.354575157165527, -6.00949764251709, -5.664420127868652, -5.319342136383057, -4.974264621734619, -4.629186630249023, -4.284109115600586, -3.9390316009521484, -3.593953847885132, -3.2488760948181152, -2.9037983417510986, -2.558720588684082, -2.2136430740356445, -1.868565320968628, -1.5234875679016113, -1.1784100532531738, -0.8333323001861572, -0.48825550079345703, -0.1431778073310852, 0.20189988613128662, 0.5469775199890137, 0.8920552730560303, 1.2371330261230469, 1.5822105407714844, 1.927288293838501, 2.2723660469055176, 2.617443799972534, 2.962521553039551, 3.3075990676879883, 3.652676820755005, 3.9977545738220215, 4.342832088470459, 4.687910079956055, 5.032987594604492, 5.37806510925293, 5.723143100738525, 6.068220615386963, 6.413298606872559, 6.758376121520996, 7.103453636169434, 7.448531150817871, 7.793609142303467, 8.138687133789062, 8.4837646484375, 8.828842163085938, 9.173919677734375, 9.518997192382812, 9.86407470703125, 10.209153175354004, 10.554230690002441]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 11.0, 11.0, 12.0, 15.0, 17.0, 15.0, 15.0, 32.0, 29.0, 30.0, 35.0, 38.0, 47.0, 43.0, 37.0, 48.0, 39.0, 42.0, 56.0, 39.0, 46.0, 39.0, 39.0, 46.0, 30.0, 25.0, 18.0, 23.0, 23.0, 13.0, 10.0, 8.0, 10.0, 16.0, 7.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.039371013641357, -6.8392333984375, -6.639096260070801, -6.438958644866943, -6.238821029663086, -6.038683891296387, -5.838546276092529, -5.638408660888672, -5.438271522521973, -5.238133907318115, -5.037996768951416, -4.837859153747559, -4.637721538543701, -4.437584400177002, -4.2374467849731445, -4.037309646606445, -3.837171792984009, -3.6370344161987305, -3.436896800994873, -3.2367594242095947, -3.0366220474243164, -2.836484432220459, -2.6363470554351807, -2.4362096786499023, -2.236072063446045, -2.0359346866607666, -1.8357971906661987, -1.6356596946716309, -1.4355223178863525, -1.2353848218917847, -1.0352473258972168, -0.8351099491119385, -0.6349725723266602, -0.43483513593673706, -0.23469766974449158, -0.034560203552246094, 0.165577232837677, 0.3657146692276001, 0.565852165222168, 0.7659895420074463, 0.9661270380020142, 1.166264533996582, 1.3664019107818604, 1.5665394067764282, 1.766676902770996, 1.9668142795562744, 2.1669516563415527, 2.36708927154541, 2.5672266483306885, 2.767364025115967, 2.967501640319824, 3.1676390171051025, 3.367776393890381, 3.5679140090942383, 3.7680513858795166, 3.968188762664795, 4.168326377868652, 4.36846399307251, 4.568601131439209, 4.768738746643066, 4.968876361846924, 5.169013500213623, 5.3691511154174805, 5.56928825378418, 5.769425868988037]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 8.0, 13.0, 15.0, 24.0, 45.0, 52.0, 84.0, 107.0, 171.0, 289.0, 377.0, 639.0, 935.0, 1440.0, 2171.0, 3284.0, 5118.0, 8038.0, 12100.0, 18894.0, 28010.0, 43476.0, 64637.0, 91934.0, 122040.0, 141481.0, 137578.0, 113700.0, 83916.0, 57609.0, 38040.0, 25304.0, 16418.0, 10672.0, 6925.0, 4482.0, 2833.0, 1976.0, 1258.0, 833.0, 530.0, 350.0, 264.0, 172.0, 105.0, 81.0, 40.0, 36.0, 21.0, 13.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.166015625, -1.126953125, -1.087890625, -1.048828125, -1.009765625, -0.970703125, -0.931640625, -0.892578125, -0.853515625, -0.814453125, -0.775390625, -0.736328125, -0.697265625, -0.658203125, -0.619140625, -0.580078125, -0.541015625, -0.501953125, -0.462890625, -0.423828125, -0.384765625, -0.345703125, -0.306640625, -0.267578125, -0.228515625, -0.189453125, -0.150390625, -0.111328125, -0.072265625, -0.033203125, 0.005859375, 0.044921875, 0.083984375, 0.123046875, 0.162109375, 0.201171875, 0.240234375, 0.279296875, 0.318359375, 0.357421875, 0.396484375, 0.435546875, 0.474609375, 0.513671875, 0.552734375, 0.591796875, 0.630859375, 0.669921875, 0.708984375, 0.748046875, 0.787109375, 0.826171875, 0.865234375, 0.904296875, 0.943359375, 0.982421875, 1.021484375, 1.060546875, 1.099609375, 1.138671875, 1.177734375, 1.216796875, 1.255859375, 1.294921875, 1.333984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 10.0, 12.0, 14.0, 24.0, 15.0, 24.0, 37.0, 28.0, 31.0, 50.0, 31.0, 59.0, 54.0, 54.0, 58.0, 48.0, 60.0, 43.0, 46.0, 46.0, 30.0, 31.0, 38.0, 26.0, 23.0, 17.0, 10.0, 13.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.26922607421875, -8.0150146484375, -7.76080322265625, -7.506591796875, -7.25238037109375, -6.9981689453125, -6.74395751953125, -6.48974609375, -6.23553466796875, -5.9813232421875, -5.72711181640625, -5.472900390625, -5.21868896484375, -4.9644775390625, -4.71026611328125, -4.4560546875, -4.20184326171875, -3.9476318359375, -3.69342041015625, -3.439208984375, -3.18499755859375, -2.9307861328125, -2.67657470703125, -2.42236328125, -2.16815185546875, -1.9139404296875, -1.65972900390625, -1.405517578125, -1.15130615234375, -0.8970947265625, -0.64288330078125, -0.388671875, -0.13446044921875, 0.1197509765625, 0.37396240234375, 0.628173828125, 0.88238525390625, 1.1365966796875, 1.39080810546875, 1.64501953125, 1.89923095703125, 2.1534423828125, 2.40765380859375, 2.661865234375, 2.91607666015625, 3.1702880859375, 3.42449951171875, 3.6787109375, 3.93292236328125, 4.1871337890625, 4.44134521484375, 4.695556640625, 4.94976806640625, 5.2039794921875, 5.45819091796875, 5.71240234375, 5.96661376953125, 6.2208251953125, 6.47503662109375, 6.729248046875, 6.98345947265625, 7.2376708984375, 7.49188232421875, 7.74609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 8.0, 14.0, 22.0, 32.0, 37.0, 43.0, 73.0, 109.0, 156.0, 309.0, 450.0, 745.0, 1191.0, 1971.0, 3258.0, 5636.0, 9828.0, 17154.0, 29649.0, 51320.0, 85767.0, 133504.0, 177139.0, 177980.0, 136220.0, 89160.0, 52978.0, 31051.0, 17914.0, 10158.0, 5894.0, 3417.0, 2074.0, 1168.0, 783.0, 470.0, 266.0, 207.0, 120.0, 85.0, 62.0, 32.0, 28.0, 24.0, 8.0, 5.0, 8.0, 9.0, 4.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.623046875, -1.5690155029296875, -1.514984130859375, -1.4609527587890625, -1.40692138671875, -1.3528900146484375, -1.298858642578125, -1.2448272705078125, -1.1907958984375, -1.1367645263671875, -1.082733154296875, -1.0287017822265625, -0.97467041015625, -0.9206390380859375, -0.866607666015625, -0.8125762939453125, -0.758544921875, -0.7045135498046875, -0.650482177734375, -0.5964508056640625, -0.54241943359375, -0.4883880615234375, -0.434356689453125, -0.3803253173828125, -0.3262939453125, -0.2722625732421875, -0.218231201171875, -0.1641998291015625, -0.11016845703125, -0.0561370849609375, -0.002105712890625, 0.0519256591796875, 0.10595703125, 0.1599884033203125, 0.214019775390625, 0.2680511474609375, 0.32208251953125, 0.3761138916015625, 0.430145263671875, 0.4841766357421875, 0.5382080078125, 0.5922393798828125, 0.646270751953125, 0.7003021240234375, 0.75433349609375, 0.8083648681640625, 0.862396240234375, 0.9164276123046875, 0.970458984375, 1.0244903564453125, 1.078521728515625, 1.1325531005859375, 1.18658447265625, 1.2406158447265625, 1.294647216796875, 1.3486785888671875, 1.4027099609375, 1.4567413330078125, 1.510772705078125, 1.5648040771484375, 1.61883544921875, 1.6728668212890625, 1.726898193359375, 1.7809295654296875, 1.8349609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 7.0, 9.0, 15.0, 10.0, 19.0, 22.0, 23.0, 27.0, 33.0, 28.0, 36.0, 42.0, 41.0, 43.0, 31.0, 41.0, 31.0, 42.0, 51.0, 40.0, 39.0, 35.0, 41.0, 36.0, 24.0, 35.0, 18.0, 21.0, 21.0, 13.0, 20.0, 20.0, 14.0, 10.0, 8.0, 4.0, 5.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.281036376953125, -4.15191650390625, -4.022796630859375, -3.8936767578125, -3.764556884765625, -3.63543701171875, -3.506317138671875, -3.377197265625, -3.248077392578125, -3.11895751953125, -2.989837646484375, -2.8607177734375, -2.731597900390625, -2.60247802734375, -2.473358154296875, -2.34423828125, -2.215118408203125, -2.08599853515625, -1.956878662109375, -1.8277587890625, -1.698638916015625, -1.56951904296875, -1.440399169921875, -1.311279296875, -1.182159423828125, -1.05303955078125, -0.923919677734375, -0.7947998046875, -0.665679931640625, -0.53656005859375, -0.407440185546875, -0.2783203125, -0.149200439453125, -0.02008056640625, 0.109039306640625, 0.2381591796875, 0.367279052734375, 0.49639892578125, 0.625518798828125, 0.754638671875, 0.883758544921875, 1.01287841796875, 1.141998291015625, 1.2711181640625, 1.400238037109375, 1.52935791015625, 1.658477783203125, 1.78759765625, 1.916717529296875, 2.04583740234375, 2.174957275390625, 2.3040771484375, 2.433197021484375, 2.56231689453125, 2.691436767578125, 2.820556640625, 2.949676513671875, 3.07879638671875, 3.207916259765625, 3.3370361328125, 3.466156005859375, 3.59527587890625, 3.724395751953125, 3.853515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 9.0, 9.0, 12.0, 11.0, 20.0, 34.0, 64.0, 129.0, 151.0, 285.0, 459.0, 791.0, 1410.0, 2714.0, 5513.0, 12501.0, 31013.0, 86680.0, 243427.0, 375179.0, 182121.0, 63603.0, 23298.0, 9730.0, 4341.0, 2148.0, 1180.0, 675.0, 379.0, 234.0, 154.0, 102.0, 74.0, 38.0, 19.0, 17.0, 10.0, 8.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7919921875, -0.7667312622070312, -0.7414703369140625, -0.7162094116210938, -0.690948486328125, -0.6656875610351562, -0.6404266357421875, -0.6151657104492188, -0.58990478515625, -0.5646438598632812, -0.5393829345703125, -0.5141220092773438, -0.488861083984375, -0.46360015869140625, -0.4383392333984375, -0.41307830810546875, -0.3878173828125, -0.36255645751953125, -0.3372955322265625, -0.31203460693359375, -0.286773681640625, -0.26151275634765625, -0.2362518310546875, -0.21099090576171875, -0.18572998046875, -0.16046905517578125, -0.1352081298828125, -0.10994720458984375, -0.084686279296875, -0.05942535400390625, -0.0341644287109375, -0.00890350341796875, 0.016357421875, 0.04161834716796875, 0.0668792724609375, 0.09214019775390625, 0.117401123046875, 0.14266204833984375, 0.1679229736328125, 0.19318389892578125, 0.21844482421875, 0.24370574951171875, 0.2689666748046875, 0.29422760009765625, 0.319488525390625, 0.34474945068359375, 0.3700103759765625, 0.39527130126953125, 0.4205322265625, 0.44579315185546875, 0.4710540771484375, 0.49631500244140625, 0.521575927734375, 0.5468368530273438, 0.5720977783203125, 0.5973587036132812, 0.62261962890625, 0.6478805541992188, 0.6731414794921875, 0.6984024047851562, 0.723663330078125, 0.7489242553710938, 0.7741851806640625, 0.7994461059570312, 0.82470703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 5.0, 7.0, 11.0, 15.0, 19.0, 18.0, 25.0, 34.0, 30.0, 42.0, 64.0, 66.0, 69.0, 65.0, 61.0, 72.0, 63.0, 50.0, 52.0, 44.0, 34.0, 26.0, 22.0, 20.0, 12.0, 14.0, 12.0, 5.0, 6.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.147125244140625e-05, -3.0423514544963837e-05, -2.9375776648521423e-05, -2.832803875207901e-05, -2.7280300855636597e-05, -2.6232562959194183e-05, -2.518482506275177e-05, -2.4137087166309357e-05, -2.3089349269866943e-05, -2.204161137342453e-05, -2.0993873476982117e-05, -1.9946135580539703e-05, -1.889839768409729e-05, -1.7850659787654877e-05, -1.6802921891212463e-05, -1.575518399477005e-05, -1.4707446098327637e-05, -1.3659708201885223e-05, -1.261197030544281e-05, -1.1564232409000397e-05, -1.0516494512557983e-05, -9.46875661611557e-06, -8.421018719673157e-06, -7.373280823230743e-06, -6.32554292678833e-06, -5.277805030345917e-06, -4.230067133903503e-06, -3.18232923746109e-06, -2.1345913410186768e-06, -1.0868534445762634e-06, -3.91155481338501e-08, 1.0086223483085632e-06, 2.0563602447509766e-06, 3.10409814119339e-06, 4.151836037635803e-06, 5.1995739340782166e-06, 6.24731183052063e-06, 7.295049726963043e-06, 8.342787623405457e-06, 9.39052551984787e-06, 1.0438263416290283e-05, 1.1486001312732697e-05, 1.253373920917511e-05, 1.3581477105617523e-05, 1.4629215002059937e-05, 1.567695289850235e-05, 1.6724690794944763e-05, 1.7772428691387177e-05, 1.882016658782959e-05, 1.9867904484272003e-05, 2.0915642380714417e-05, 2.196338027715683e-05, 2.3011118173599243e-05, 2.4058856070041656e-05, 2.510659396648407e-05, 2.6154331862926483e-05, 2.7202069759368896e-05, 2.824980765581131e-05, 2.9297545552253723e-05, 3.0345283448696136e-05, 3.139302134513855e-05, 3.244075924158096e-05, 3.3488497138023376e-05, 3.453623503446579e-05, 3.55839729309082e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 10.0, 10.0, 18.0, 18.0, 35.0, 52.0, 79.0, 115.0, 182.0, 262.0, 411.0, 629.0, 1019.0, 1547.0, 2494.0, 3988.0, 6662.0, 11060.0, 18791.0, 33171.0, 59173.0, 107235.0, 178240.0, 223430.0, 169370.0, 99970.0, 55335.0, 30786.0, 17692.0, 10169.0, 6263.0, 3771.0, 2382.0, 1438.0, 962.0, 596.0, 400.0, 271.0, 182.0, 112.0, 71.0, 46.0, 41.0, 14.0, 15.0, 11.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.5673828125, -0.5504150390625, -0.533447265625, -0.5164794921875, -0.49951171875, -0.4825439453125, -0.465576171875, -0.4486083984375, -0.431640625, -0.4146728515625, -0.397705078125, -0.3807373046875, -0.36376953125, -0.3468017578125, -0.329833984375, -0.3128662109375, -0.2958984375, -0.2789306640625, -0.261962890625, -0.2449951171875, -0.22802734375, -0.2110595703125, -0.194091796875, -0.1771240234375, -0.16015625, -0.1431884765625, -0.126220703125, -0.1092529296875, -0.09228515625, -0.0753173828125, -0.058349609375, -0.0413818359375, -0.0244140625, -0.0074462890625, 0.009521484375, 0.0264892578125, 0.04345703125, 0.0604248046875, 0.077392578125, 0.0943603515625, 0.111328125, 0.1282958984375, 0.145263671875, 0.1622314453125, 0.17919921875, 0.1961669921875, 0.213134765625, 0.2301025390625, 0.2470703125, 0.2640380859375, 0.281005859375, 0.2979736328125, 0.31494140625, 0.3319091796875, 0.348876953125, 0.3658447265625, 0.3828125, 0.3997802734375, 0.416748046875, 0.4337158203125, 0.45068359375, 0.4676513671875, 0.484619140625, 0.5015869140625, 0.5185546875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 7.0, 5.0, 11.0, 9.0, 14.0, 13.0, 20.0, 21.0, 27.0, 28.0, 27.0, 36.0, 31.0, 36.0, 34.0, 37.0, 48.0, 59.0, 52.0, 63.0, 44.0, 54.0, 37.0, 37.0, 32.0, 23.0, 29.0, 38.0, 17.0, 14.0, 22.0, 20.0, 11.0, 11.0, 4.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1324462890625, -0.12834930419921875, -0.1242523193359375, -0.12015533447265625, -0.116058349609375, -0.11196136474609375, -0.1078643798828125, -0.10376739501953125, -0.09967041015625, -0.09557342529296875, -0.0914764404296875, -0.08737945556640625, -0.083282470703125, -0.07918548583984375, -0.0750885009765625, -0.07099151611328125, -0.06689453125, -0.06279754638671875, -0.0587005615234375, -0.05460357666015625, -0.050506591796875, -0.04640960693359375, -0.0423126220703125, -0.03821563720703125, -0.03411865234375, -0.03002166748046875, -0.0259246826171875, -0.02182769775390625, -0.017730712890625, -0.01363372802734375, -0.0095367431640625, -0.00543975830078125, -0.0013427734375, 0.00275421142578125, 0.0068511962890625, 0.01094818115234375, 0.015045166015625, 0.01914215087890625, 0.0232391357421875, 0.02733612060546875, 0.03143310546875, 0.03553009033203125, 0.0396270751953125, 0.04372406005859375, 0.047821044921875, 0.05191802978515625, 0.0560150146484375, 0.06011199951171875, 0.064208984375, 0.06830596923828125, 0.0724029541015625, 0.07649993896484375, 0.080596923828125, 0.08469390869140625, 0.0887908935546875, 0.09288787841796875, 0.09698486328125, 0.10108184814453125, 0.1051788330078125, 0.10927581787109375, 0.113372802734375, 0.11746978759765625, 0.1215667724609375, 0.12566375732421875, 0.1297607421875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 0.0, 3.0, 2.0, 8.0, 5.0, 7.0, 7.0, 14.0, 17.0, 25.0, 20.0, 18.0, 34.0, 34.0, 41.0, 64.0, 52.0, 55.0, 58.0, 71.0, 65.0, 62.0, 51.0, 57.0, 48.0, 33.0, 28.0, 26.0, 27.0, 17.0, 9.0, 10.0, 9.0, 6.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.380390167236328, -11.037607192993164, -10.69482421875, -10.352042198181152, -10.009259223937988, -9.666476249694824, -9.323694229125977, -8.980911254882812, -8.638128280639648, -8.295345306396484, -7.9525628089904785, -7.609780311584473, -7.266997337341309, -6.9242143630981445, -6.581431865692139, -6.238649368286133, -5.895866394042969, -5.553083419799805, -5.210300922393799, -4.867518424987793, -4.524735450744629, -4.181952476501465, -3.839169979095459, -3.496387243270874, -3.153604507446289, -2.810821771621704, -2.468039035797119, -2.125256299972534, -1.7824735641479492, -1.4396908283233643, -1.0969080924987793, -0.7541253566741943, -0.4113435745239258, -0.06856083869934082, 0.27422189712524414, 0.6170046329498291, 0.9597873687744141, 1.302570104598999, 1.645352840423584, 1.988135576248169, 2.330918312072754, 2.673701047897339, 3.016483783721924, 3.359266519546509, 3.7020492553710938, 4.044832229614258, 4.387614727020264, 4.7303972244262695, 5.073180198669434, 5.415963172912598, 5.7587456703186035, 6.101528167724609, 6.444311141967773, 6.7870941162109375, 7.129876613616943, 7.472659111022949, 7.815442085266113, 8.158225059509277, 8.501007080078125, 8.843790054321289, 9.186573028564453, 9.529356002807617, 9.872138977050781, 10.214920997619629, 10.557703971862793]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 7.0, 10.0, 10.0, 14.0, 14.0, 14.0, 18.0, 15.0, 32.0, 29.0, 33.0, 31.0, 40.0, 48.0, 41.0, 36.0, 48.0, 40.0, 40.0, 58.0, 40.0, 50.0, 35.0, 38.0, 48.0, 28.0, 24.0, 22.0, 21.0, 21.0, 15.0, 11.0, 6.0, 12.0, 15.0, 9.0, 5.0, 4.0, 1.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.000344276428223, -6.800783157348633, -6.601221561431885, -6.401660442352295, -6.202099323272705, -6.002537727355957, -5.802976608276367, -5.603415489196777, -5.4038543701171875, -5.204293251037598, -5.00473165512085, -4.80517053604126, -4.60560941696167, -4.406047821044922, -4.206486701965332, -4.006925582885742, -3.807363986968994, -3.607802629470825, -3.4082415103912354, -3.2086801528930664, -3.0091190338134766, -2.8095576763153076, -2.6099963188171387, -2.410435199737549, -2.21087384223938, -2.011312484741211, -1.811751365661621, -1.6121900081634521, -1.4126287698745728, -1.2130675315856934, -1.0135061740875244, -0.813944935798645, -0.6143841743469238, -0.41482290625572205, -0.21526163816452026, -0.015700340270996094, 0.1838608980178833, 0.3834221363067627, 0.5829834938049316, 0.782544732093811, 0.9821059703826904, 1.1816672086715698, 1.3812284469604492, 1.5807898044586182, 1.7803510427474976, 1.979912281036377, 2.179473638534546, 2.379034996032715, 2.5785961151123047, 2.7781574726104736, 2.9777185916900635, 3.1772799491882324, 3.3768410682678223, 3.576402425765991, 3.77596378326416, 3.97552490234375, 4.17508602142334, 4.37464714050293, 4.574208736419678, 4.773769855499268, 4.973330974578857, 5.1728925704956055, 5.372453689575195, 5.572014808654785, 5.771576404571533]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 7.0, 6.0, 10.0, 16.0, 20.0, 20.0, 31.0, 42.0, 52.0, 74.0, 79.0, 132.0, 184.0, 261.0, 378.0, 571.0, 821.0, 1315.0, 2146.0, 3367.0, 5551.0, 9725.0, 16667.0, 28513.0, 48337.0, 76006.0, 110600.0, 142346.0, 154854.0, 141768.0, 110548.0, 75922.0, 47772.0, 28994.0, 16563.0, 9749.0, 5729.0, 3384.0, 2112.0, 1307.0, 802.0, 547.0, 338.0, 238.0, 188.0, 131.0, 78.0, 65.0, 53.0, 44.0, 19.0, 21.0, 24.0, 17.0, 8.0, 7.0, 4.0, 1.0, 0.0, 2.0], "bins": [-7.2578125, -7.03448486328125, -6.8111572265625, -6.58782958984375, -6.364501953125, -6.14117431640625, -5.9178466796875, -5.69451904296875, -5.47119140625, -5.24786376953125, -5.0245361328125, -4.80120849609375, -4.577880859375, -4.35455322265625, -4.1312255859375, -3.90789794921875, -3.6845703125, -3.46124267578125, -3.2379150390625, -3.01458740234375, -2.791259765625, -2.56793212890625, -2.3446044921875, -2.12127685546875, -1.89794921875, -1.67462158203125, -1.4512939453125, -1.22796630859375, -1.004638671875, -0.78131103515625, -0.5579833984375, -0.33465576171875, -0.111328125, 0.11199951171875, 0.3353271484375, 0.55865478515625, 0.781982421875, 1.00531005859375, 1.2286376953125, 1.45196533203125, 1.67529296875, 1.89862060546875, 2.1219482421875, 2.34527587890625, 2.568603515625, 2.79193115234375, 3.0152587890625, 3.23858642578125, 3.4619140625, 3.68524169921875, 3.9085693359375, 4.13189697265625, 4.355224609375, 4.57855224609375, 4.8018798828125, 5.02520751953125, 5.24853515625, 5.47186279296875, 5.6951904296875, 5.91851806640625, 6.141845703125, 6.36517333984375, 6.5885009765625, 6.81182861328125, 7.03515625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 9.0, 5.0, 9.0, 11.0, 16.0, 13.0, 19.0, 22.0, 23.0, 30.0, 29.0, 41.0, 39.0, 48.0, 42.0, 38.0, 41.0, 31.0, 35.0, 45.0, 44.0, 38.0, 38.0, 35.0, 38.0, 35.0, 35.0, 22.0, 19.0, 21.0, 17.0, 15.0, 13.0, 10.0, 11.0, 10.0, 4.0, 9.0, 4.0, 7.0, 8.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.06640625, -5.86773681640625, -5.6690673828125, -5.47039794921875, -5.271728515625, -5.07305908203125, -4.8743896484375, -4.67572021484375, -4.47705078125, -4.27838134765625, -4.0797119140625, -3.88104248046875, -3.682373046875, -3.48370361328125, -3.2850341796875, -3.08636474609375, -2.8876953125, -2.68902587890625, -2.4903564453125, -2.29168701171875, -2.093017578125, -1.89434814453125, -1.6956787109375, -1.49700927734375, -1.29833984375, -1.09967041015625, -0.9010009765625, -0.70233154296875, -0.503662109375, -0.30499267578125, -0.1063232421875, 0.09234619140625, 0.291015625, 0.48968505859375, 0.6883544921875, 0.88702392578125, 1.085693359375, 1.28436279296875, 1.4830322265625, 1.68170166015625, 1.88037109375, 2.07904052734375, 2.2777099609375, 2.47637939453125, 2.675048828125, 2.87371826171875, 3.0723876953125, 3.27105712890625, 3.4697265625, 3.66839599609375, 3.8670654296875, 4.06573486328125, 4.264404296875, 4.46307373046875, 4.6617431640625, 4.86041259765625, 5.05908203125, 5.25775146484375, 5.4564208984375, 5.65509033203125, 5.853759765625, 6.05242919921875, 6.2510986328125, 6.44976806640625, 6.6484375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 11.0, 8.0, 18.0, 23.0, 37.0, 48.0, 49.0, 73.0, 113.0, 175.0, 279.0, 499.0, 791.0, 1334.0, 2389.0, 4360.0, 8021.0, 15502.0, 28992.0, 52225.0, 88357.0, 132656.0, 168656.0, 172401.0, 142407.0, 97971.0, 59263.0, 33180.0, 17824.0, 9404.0, 5000.0, 2703.0, 1404.0, 848.0, 536.0, 323.0, 190.0, 146.0, 88.0, 68.0, 42.0, 36.0, 31.0, 16.0, 19.0, 5.0, 7.0, 7.0, 7.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.0703125, -7.8109130859375, -7.551513671875, -7.2921142578125, -7.03271484375, -6.7733154296875, -6.513916015625, -6.2545166015625, -5.9951171875, -5.7357177734375, -5.476318359375, -5.2169189453125, -4.95751953125, -4.6981201171875, -4.438720703125, -4.1793212890625, -3.919921875, -3.6605224609375, -3.401123046875, -3.1417236328125, -2.88232421875, -2.6229248046875, -2.363525390625, -2.1041259765625, -1.8447265625, -1.5853271484375, -1.325927734375, -1.0665283203125, -0.80712890625, -0.5477294921875, -0.288330078125, -0.0289306640625, 0.23046875, 0.4898681640625, 0.749267578125, 1.0086669921875, 1.26806640625, 1.5274658203125, 1.786865234375, 2.0462646484375, 2.3056640625, 2.5650634765625, 2.824462890625, 3.0838623046875, 3.34326171875, 3.6026611328125, 3.862060546875, 4.1214599609375, 4.380859375, 4.6402587890625, 4.899658203125, 5.1590576171875, 5.41845703125, 5.6778564453125, 5.937255859375, 6.1966552734375, 6.4560546875, 6.7154541015625, 6.974853515625, 7.2342529296875, 7.49365234375, 7.7530517578125, 8.012451171875, 8.2718505859375, 8.53125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 8.0, 11.0, 7.0, 5.0, 7.0, 12.0, 16.0, 20.0, 17.0, 26.0, 26.0, 27.0, 29.0, 35.0, 35.0, 38.0, 29.0, 36.0, 36.0, 55.0, 40.0, 50.0, 49.0, 41.0, 35.0, 37.0, 26.0, 38.0, 29.0, 24.0, 22.0, 28.0, 15.0, 12.0, 15.0, 11.0, 6.0, 10.0, 6.0, 12.0, 6.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6875, -3.56475830078125, -3.4420166015625, -3.31927490234375, -3.196533203125, -3.07379150390625, -2.9510498046875, -2.82830810546875, -2.70556640625, -2.58282470703125, -2.4600830078125, -2.33734130859375, -2.214599609375, -2.09185791015625, -1.9691162109375, -1.84637451171875, -1.7236328125, -1.60089111328125, -1.4781494140625, -1.35540771484375, -1.232666015625, -1.10992431640625, -0.9871826171875, -0.86444091796875, -0.74169921875, -0.61895751953125, -0.4962158203125, -0.37347412109375, -0.250732421875, -0.12799072265625, -0.0052490234375, 0.11749267578125, 0.240234375, 0.36297607421875, 0.4857177734375, 0.60845947265625, 0.731201171875, 0.85394287109375, 0.9766845703125, 1.09942626953125, 1.22216796875, 1.34490966796875, 1.4676513671875, 1.59039306640625, 1.713134765625, 1.83587646484375, 1.9586181640625, 2.08135986328125, 2.2041015625, 2.32684326171875, 2.4495849609375, 2.57232666015625, 2.695068359375, 2.81781005859375, 2.9405517578125, 3.06329345703125, 3.18603515625, 3.30877685546875, 3.4315185546875, 3.55426025390625, 3.677001953125, 3.79974365234375, 3.9224853515625, 4.04522705078125, 4.16796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 6.0, 8.0, 14.0, 15.0, 21.0, 36.0, 44.0, 56.0, 82.0, 139.0, 211.0, 366.0, 646.0, 1135.0, 2300.0, 5309.0, 14718.0, 55771.0, 246998.0, 482471.0, 178050.0, 40238.0, 11231.0, 4225.0, 1979.0, 991.0, 558.0, 324.0, 200.0, 155.0, 84.0, 55.0, 38.0, 22.0, 10.0, 24.0, 7.0, 10.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.09375, -15.5968017578125, -15.099853515625, -14.6029052734375, -14.10595703125, -13.6090087890625, -13.112060546875, -12.6151123046875, -12.1181640625, -11.6212158203125, -11.124267578125, -10.6273193359375, -10.13037109375, -9.6334228515625, -9.136474609375, -8.6395263671875, -8.142578125, -7.6456298828125, -7.148681640625, -6.6517333984375, -6.15478515625, -5.6578369140625, -5.160888671875, -4.6639404296875, -4.1669921875, -3.6700439453125, -3.173095703125, -2.6761474609375, -2.17919921875, -1.6822509765625, -1.185302734375, -0.6883544921875, -0.19140625, 0.3055419921875, 0.802490234375, 1.2994384765625, 1.79638671875, 2.2933349609375, 2.790283203125, 3.2872314453125, 3.7841796875, 4.2811279296875, 4.778076171875, 5.2750244140625, 5.77197265625, 6.2689208984375, 6.765869140625, 7.2628173828125, 7.759765625, 8.2567138671875, 8.753662109375, 9.2506103515625, 9.74755859375, 10.2445068359375, 10.741455078125, 11.2384033203125, 11.7353515625, 12.2322998046875, 12.729248046875, 13.2261962890625, 13.72314453125, 14.2200927734375, 14.717041015625, 15.2139892578125, 15.7109375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 5.0, 4.0, 13.0, 11.0, 9.0, 27.0, 48.0, 80.0, 90.0, 155.0, 138.0, 140.0, 100.0, 66.0, 31.0, 28.0, 11.0, 3.0, 10.0, 6.0, 1.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013055801391601562, -0.0012639909982681274, -0.0012224018573760986, -0.0011808127164840698, -0.001139223575592041, -0.0010976344347000122, -0.0010560452938079834, -0.0010144561529159546, -0.0009728670120239258, -0.000931277871131897, -0.0008896887302398682, -0.0008480995893478394, -0.0008065104484558105, -0.0007649213075637817, -0.0007233321666717529, -0.0006817430257797241, -0.0006401538848876953, -0.0005985647439956665, -0.0005569756031036377, -0.0005153864622116089, -0.0004737973213195801, -0.00043220818042755127, -0.00039061903953552246, -0.00034902989864349365, -0.00030744075775146484, -0.00026585161685943604, -0.00022426247596740723, -0.00018267333507537842, -0.0001410841941833496, -9.94950532913208e-05, -5.790591239929199e-05, -1.6316771507263184e-05, 2.5272369384765625e-05, 6.686151027679443e-05, 0.00010845065116882324, 0.00015003979206085205, 0.00019162893295288086, 0.00023321807384490967, 0.0002748072147369385, 0.0003163963556289673, 0.0003579854965209961, 0.0003995746374130249, 0.0004411637783050537, 0.0004827529191970825, 0.0005243420600891113, 0.0005659312009811401, 0.0006075203418731689, 0.0006491094827651978, 0.0006906986236572266, 0.0007322877645492554, 0.0007738769054412842, 0.000815466046333313, 0.0008570551872253418, 0.0008986443281173706, 0.0009402334690093994, 0.0009818226099014282, 0.001023411750793457, 0.0010650008916854858, 0.0011065900325775146, 0.0011481791734695435, 0.0011897683143615723, 0.001231357455253601, 0.0012729465961456299, 0.0013145357370376587, 0.0013561248779296875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 11.0, 14.0, 17.0, 28.0, 30.0, 45.0, 77.0, 112.0, 127.0, 238.0, 348.0, 498.0, 829.0, 1292.0, 2310.0, 3856.0, 6953.0, 13491.0, 26665.0, 54330.0, 107876.0, 186403.0, 232801.0, 187957.0, 109438.0, 55138.0, 27015.0, 13594.0, 7261.0, 3905.0, 2173.0, 1321.0, 837.0, 505.0, 319.0, 220.0, 139.0, 115.0, 69.0, 62.0, 34.0, 27.0, 28.0, 15.0, 10.0, 7.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.53515625, -6.3277587890625, -6.120361328125, -5.9129638671875, -5.70556640625, -5.4981689453125, -5.290771484375, -5.0833740234375, -4.8759765625, -4.6685791015625, -4.461181640625, -4.2537841796875, -4.04638671875, -3.8389892578125, -3.631591796875, -3.4241943359375, -3.216796875, -3.0093994140625, -2.802001953125, -2.5946044921875, -2.38720703125, -2.1798095703125, -1.972412109375, -1.7650146484375, -1.5576171875, -1.3502197265625, -1.142822265625, -0.9354248046875, -0.72802734375, -0.5206298828125, -0.313232421875, -0.1058349609375, 0.1015625, 0.3089599609375, 0.516357421875, 0.7237548828125, 0.93115234375, 1.1385498046875, 1.345947265625, 1.5533447265625, 1.7607421875, 1.9681396484375, 2.175537109375, 2.3829345703125, 2.59033203125, 2.7977294921875, 3.005126953125, 3.2125244140625, 3.419921875, 3.6273193359375, 3.834716796875, 4.0421142578125, 4.24951171875, 4.4569091796875, 4.664306640625, 4.8717041015625, 5.0791015625, 5.2864990234375, 5.493896484375, 5.7012939453125, 5.90869140625, 6.1160888671875, 6.323486328125, 6.5308837890625, 6.73828125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 12.0, 19.0, 21.0, 20.0, 34.0, 40.0, 61.0, 58.0, 73.0, 71.0, 88.0, 79.0, 78.0, 57.0, 66.0, 35.0, 46.0, 29.0, 21.0, 15.0, 11.0, 16.0, 2.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.029022216796875, -1.97406005859375, -1.919097900390625, -1.8641357421875, -1.809173583984375, -1.75421142578125, -1.699249267578125, -1.644287109375, -1.589324951171875, -1.53436279296875, -1.479400634765625, -1.4244384765625, -1.369476318359375, -1.31451416015625, -1.259552001953125, -1.20458984375, -1.149627685546875, -1.09466552734375, -1.039703369140625, -0.9847412109375, -0.929779052734375, -0.87481689453125, -0.819854736328125, -0.764892578125, -0.709930419921875, -0.65496826171875, -0.600006103515625, -0.5450439453125, -0.490081787109375, -0.43511962890625, -0.380157470703125, -0.3251953125, -0.270233154296875, -0.21527099609375, -0.160308837890625, -0.1053466796875, -0.050384521484375, 0.00457763671875, 0.059539794921875, 0.114501953125, 0.169464111328125, 0.22442626953125, 0.279388427734375, 0.3343505859375, 0.389312744140625, 0.44427490234375, 0.499237060546875, 0.55419921875, 0.609161376953125, 0.66412353515625, 0.719085693359375, 0.7740478515625, 0.829010009765625, 0.88397216796875, 0.938934326171875, 0.993896484375, 1.048858642578125, 1.10382080078125, 1.158782958984375, 1.2137451171875, 1.268707275390625, 1.32366943359375, 1.378631591796875, 1.43359375]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 9.0, 17.0, 14.0, 31.0, 20.0, 33.0, 34.0, 42.0, 53.0, 42.0, 55.0, 71.0, 72.0, 52.0, 87.0, 50.0, 54.0, 49.0, 39.0, 39.0, 29.0, 21.0, 12.0, 12.0, 7.0, 6.0, 6.0, 6.0, 2.0, 4.0, 2.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.46998119354248, -13.093667030334473, -12.717352867126465, -12.341038703918457, -11.96472454071045, -11.588410377502441, -11.21209716796875, -10.835783004760742, -10.459468841552734, -10.083154678344727, -9.706840515136719, -9.330526351928711, -8.954212188720703, -8.577898025512695, -8.201583862304688, -7.825270175933838, -7.448955535888672, -7.072641372680664, -6.696327209472656, -6.320013046264648, -5.943698883056641, -5.567384719848633, -5.191071033477783, -4.814756870269775, -4.438442707061768, -4.06212854385376, -3.685814380645752, -3.3095004558563232, -2.9331862926483154, -2.5568721294403076, -2.180558204650879, -1.804244041442871, -1.4279298782348633, -1.0516157150268555, -0.6753016710281372, -0.29898762702941895, 0.07732653617858887, 0.4536406993865967, 0.8299546241760254, 1.2062687873840332, 1.582582950592041, 1.9588971138000488, 2.3352112770080566, 2.7115252017974854, 3.087839365005493, 3.464153528213501, 3.8404674530029297, 4.2167816162109375, 4.593095779418945, 4.969409942626953, 5.345724105834961, 5.722038269042969, 6.098352432250977, 6.474666595458984, 6.850980281829834, 7.227294445037842, 7.60360860824585, 7.979922771453857, 8.356236457824707, 8.732550621032715, 9.108864784240723, 9.48517894744873, 9.861493110656738, 10.237807273864746, 10.614121437072754]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 8.0, 8.0, 5.0, 11.0, 14.0, 12.0, 16.0, 28.0, 20.0, 27.0, 37.0, 28.0, 36.0, 36.0, 36.0, 33.0, 37.0, 47.0, 38.0, 40.0, 42.0, 45.0, 47.0, 40.0, 36.0, 35.0, 34.0, 22.0, 28.0, 24.0, 21.0, 20.0, 13.0, 9.0, 12.0, 6.0, 6.0, 9.0, 6.0, 4.0, 1.0, 3.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.395371913909912, -6.201572418212891, -6.007773399353027, -5.813974380493164, -5.620174884796143, -5.426375389099121, -5.232576370239258, -5.0387773513793945, -4.844977855682373, -4.651178359985352, -4.457379341125488, -4.263580322265625, -4.0697808265686035, -3.875981569290161, -3.6821823120117188, -3.4883830547332764, -3.294583797454834, -3.1007845401763916, -2.906985282897949, -2.713186025619507, -2.5193867683410645, -2.325587511062622, -2.1317882537841797, -1.9379889965057373, -1.744189739227295, -1.5503904819488525, -1.3565912246704102, -1.1627919673919678, -0.9689927101135254, -0.775193452835083, -0.5813941955566406, -0.38759493827819824, -0.19379568099975586, 3.5762786865234375e-06, 0.1938028335571289, 0.3876020908355713, 0.5814013481140137, 0.775200605392456, 0.9689998626708984, 1.1627991199493408, 1.3565983772277832, 1.5503976345062256, 1.744196891784668, 1.9379961490631104, 2.1317954063415527, 2.325594663619995, 2.5193939208984375, 2.71319317817688, 2.9069924354553223, 3.1007916927337646, 3.294590950012207, 3.4883902072906494, 3.682189464569092, 3.875988721847534, 4.069787979125977, 4.26358699798584, 4.457386493682861, 4.651185989379883, 4.844985008239746, 5.038784027099609, 5.232583522796631, 5.426383018493652, 5.620182037353516, 5.813981056213379, 6.0077805519104]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 8.0, 19.0, 39.0, 48.0, 81.0, 114.0, 202.0, 352.0, 605.0, 917.0, 1634.0, 2801.0, 4818.0, 8628.0, 15238.0, 28245.0, 52414.0, 96955.0, 179684.0, 321895.0, 531025.0, 731048.0, 766105.0, 598742.0, 379170.0, 215462.0, 117955.0, 63631.0, 34038.0, 18474.0, 10315.0, 5711.0, 3293.0, 1888.0, 1102.0, 638.0, 394.0, 238.0, 136.0, 76.0, 59.0, 29.0, 24.0, 15.0, 4.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.8033447265625, -8.520751953125, -8.2381591796875, -7.95556640625, -7.6729736328125, -7.390380859375, -7.1077880859375, -6.8251953125, -6.5426025390625, -6.260009765625, -5.9774169921875, -5.69482421875, -5.4122314453125, -5.129638671875, -4.8470458984375, -4.564453125, -4.2818603515625, -3.999267578125, -3.7166748046875, -3.43408203125, -3.1514892578125, -2.868896484375, -2.5863037109375, -2.3037109375, -2.0211181640625, -1.738525390625, -1.4559326171875, -1.17333984375, -0.8907470703125, -0.608154296875, -0.3255615234375, -0.04296875, 0.2396240234375, 0.522216796875, 0.8048095703125, 1.08740234375, 1.3699951171875, 1.652587890625, 1.9351806640625, 2.2177734375, 2.5003662109375, 2.782958984375, 3.0655517578125, 3.34814453125, 3.6307373046875, 3.913330078125, 4.1959228515625, 4.478515625, 4.7611083984375, 5.043701171875, 5.3262939453125, 5.60888671875, 5.8914794921875, 6.174072265625, 6.4566650390625, 6.7392578125, 7.0218505859375, 7.304443359375, 7.5870361328125, 7.86962890625, 8.1522216796875, 8.434814453125, 8.7174072265625, 9.0]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 12.0, 6.0, 14.0, 20.0, 18.0, 17.0, 25.0, 23.0, 39.0, 40.0, 39.0, 44.0, 45.0, 56.0, 60.0, 51.0, 54.0, 52.0, 42.0, 45.0, 44.0, 39.0, 36.0, 28.0, 25.0, 21.0, 16.0, 23.0, 6.0, 8.0, 11.0, 6.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.34063720703125, -4.1578369140625, -3.97503662109375, -3.792236328125, -3.60943603515625, -3.4266357421875, -3.24383544921875, -3.06103515625, -2.87823486328125, -2.6954345703125, -2.51263427734375, -2.329833984375, -2.14703369140625, -1.9642333984375, -1.78143310546875, -1.5986328125, -1.41583251953125, -1.2330322265625, -1.05023193359375, -0.867431640625, -0.68463134765625, -0.5018310546875, -0.31903076171875, -0.13623046875, 0.04656982421875, 0.2293701171875, 0.41217041015625, 0.594970703125, 0.77777099609375, 0.9605712890625, 1.14337158203125, 1.326171875, 1.50897216796875, 1.6917724609375, 1.87457275390625, 2.057373046875, 2.24017333984375, 2.4229736328125, 2.60577392578125, 2.78857421875, 2.97137451171875, 3.1541748046875, 3.33697509765625, 3.519775390625, 3.70257568359375, 3.8853759765625, 4.06817626953125, 4.2509765625, 4.43377685546875, 4.6165771484375, 4.79937744140625, 4.982177734375, 5.16497802734375, 5.3477783203125, 5.53057861328125, 5.71337890625, 5.89617919921875, 6.0789794921875, 6.26177978515625, 6.444580078125, 6.62738037109375, 6.8101806640625, 6.99298095703125, 7.17578125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 10.0, 10.0, 20.0, 27.0, 36.0, 62.0, 112.0, 145.0, 229.0, 398.0, 609.0, 1070.0, 1637.0, 2696.0, 4408.0, 7061.0, 11971.0, 19492.0, 32706.0, 55406.0, 93004.0, 150746.0, 240166.0, 360079.0, 492079.0, 590032.0, 595163.0, 507247.0, 374278.0, 250910.0, 159749.0, 96566.0, 58400.0, 34843.0, 21028.0, 12509.0, 7609.0, 4530.0, 2687.0, 1788.0, 1049.0, 646.0, 387.0, 245.0, 168.0, 92.0, 66.0, 42.0, 33.0, 17.0, 14.0, 4.0, 3.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.37567138671875, -7.1302490234375, -6.88482666015625, -6.639404296875, -6.39398193359375, -6.1485595703125, -5.90313720703125, -5.65771484375, -5.41229248046875, -5.1668701171875, -4.92144775390625, -4.676025390625, -4.43060302734375, -4.1851806640625, -3.93975830078125, -3.6943359375, -3.44891357421875, -3.2034912109375, -2.95806884765625, -2.712646484375, -2.46722412109375, -2.2218017578125, -1.97637939453125, -1.73095703125, -1.48553466796875, -1.2401123046875, -0.99468994140625, -0.749267578125, -0.50384521484375, -0.2584228515625, -0.01300048828125, 0.232421875, 0.47784423828125, 0.7232666015625, 0.96868896484375, 1.214111328125, 1.45953369140625, 1.7049560546875, 1.95037841796875, 2.19580078125, 2.44122314453125, 2.6866455078125, 2.93206787109375, 3.177490234375, 3.42291259765625, 3.6683349609375, 3.91375732421875, 4.1591796875, 4.40460205078125, 4.6500244140625, 4.89544677734375, 5.140869140625, 5.38629150390625, 5.6317138671875, 5.87713623046875, 6.12255859375, 6.36798095703125, 6.6134033203125, 6.85882568359375, 7.104248046875, 7.34967041015625, 7.5950927734375, 7.84051513671875, 8.0859375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 14.0, 8.0, 21.0, 19.0, 34.0, 40.0, 41.0, 71.0, 66.0, 69.0, 129.0, 118.0, 163.0, 174.0, 211.0, 243.0, 211.0, 237.0, 241.0, 240.0, 220.0, 238.0, 203.0, 191.0, 160.0, 123.0, 117.0, 109.0, 76.0, 66.0, 44.0, 53.0, 32.0, 25.0, 19.0, 13.0, 11.0, 7.0, 3.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.376953125, -3.27960205078125, -3.1822509765625, -3.08489990234375, -2.987548828125, -2.89019775390625, -2.7928466796875, -2.69549560546875, -2.59814453125, -2.50079345703125, -2.4034423828125, -2.30609130859375, -2.208740234375, -2.11138916015625, -2.0140380859375, -1.91668701171875, -1.8193359375, -1.72198486328125, -1.6246337890625, -1.52728271484375, -1.429931640625, -1.33258056640625, -1.2352294921875, -1.13787841796875, -1.04052734375, -0.94317626953125, -0.8458251953125, -0.74847412109375, -0.651123046875, -0.55377197265625, -0.4564208984375, -0.35906982421875, -0.26171875, -0.16436767578125, -0.0670166015625, 0.03033447265625, 0.127685546875, 0.22503662109375, 0.3223876953125, 0.41973876953125, 0.51708984375, 0.61444091796875, 0.7117919921875, 0.80914306640625, 0.906494140625, 1.00384521484375, 1.1011962890625, 1.19854736328125, 1.2958984375, 1.39324951171875, 1.4906005859375, 1.58795166015625, 1.685302734375, 1.78265380859375, 1.8800048828125, 1.97735595703125, 2.07470703125, 2.17205810546875, 2.2694091796875, 2.36676025390625, 2.464111328125, 2.56146240234375, 2.6588134765625, 2.75616455078125, 2.853515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 1.0, 4.0, 6.0, 6.0, 6.0, 16.0, 8.0, 19.0, 19.0, 37.0, 34.0, 43.0, 37.0, 56.0, 55.0, 66.0, 76.0, 63.0, 67.0, 59.0, 60.0, 44.0, 43.0, 42.0, 23.0, 27.0, 15.0, 20.0, 9.0, 10.0, 5.0, 5.0, 7.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.141827583312988, -12.765663146972656, -12.38949966430664, -12.013335227966309, -11.637170791625977, -11.261007308959961, -10.884842872619629, -10.508678436279297, -10.132514953613281, -9.75635051727295, -9.380187034606934, -9.004022598266602, -8.627859115600586, -8.251694679260254, -7.875530242919922, -7.499366283416748, -7.123202323913574, -6.7470383644104, -6.370874404907227, -5.9947099685668945, -5.618546009063721, -5.242382049560547, -4.866217613220215, -4.490053653717041, -4.113889694213867, -3.7377257347106934, -3.3615615367889404, -2.9853973388671875, -2.6092333793640137, -2.23306941986084, -1.856905221939087, -1.480741024017334, -1.1045770645141602, -0.7284129858016968, -0.3522489070892334, 0.02391517162322998, 0.40007925033569336, 0.7762433290481567, 1.1524074077606201, 1.528571605682373, 1.9047355651855469, 2.2808995246887207, 2.6570637226104736, 3.0332279205322266, 3.4093918800354004, 3.785555839538574, 4.161720275878906, 4.53788423538208, 4.914048194885254, 5.290212154388428, 5.666376113891602, 6.042540550231934, 6.418704509735107, 6.794868469238281, 7.171032905578613, 7.547196865081787, 7.923360824584961, 8.299525260925293, 8.675688743591309, 9.05185317993164, 9.428016662597656, 9.804181098937988, 10.18034553527832, 10.556509017944336, 10.932673454284668]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 9.0, 7.0, 13.0, 17.0, 19.0, 17.0, 23.0, 19.0, 28.0, 29.0, 30.0, 38.0, 31.0, 50.0, 28.0, 37.0, 42.0, 39.0, 36.0, 46.0, 39.0, 33.0, 41.0, 44.0, 34.0, 31.0, 20.0, 23.0, 30.0, 30.0, 15.0, 16.0, 20.0, 10.0, 9.0, 11.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.733055114746094, -6.54025411605835, -6.3474531173706055, -6.154651641845703, -5.961850643157959, -5.769049644470215, -5.576248645782471, -5.383447647094727, -5.190646171569824, -4.99784517288208, -4.805044174194336, -4.612242698669434, -4.4194416999816895, -4.226640701293945, -4.033839702606201, -3.841038465499878, -3.648237466812134, -3.4554364681243896, -3.2626352310180664, -3.0698342323303223, -2.877032995223999, -2.684231996536255, -2.4914307594299316, -2.2986297607421875, -2.1058287620544434, -1.9130276441574097, -1.720226526260376, -1.5274255275726318, -1.3346242904663086, -1.1418232917785645, -0.9490221738815308, -0.7562210559844971, -0.5634198188781738, -0.37061870098114014, -0.17781761288642883, 0.01498347520828247, 0.20778459310531616, 0.40058571100234985, 0.5933867692947388, 0.7861878871917725, 0.9789890050888062, 1.1717901229858398, 1.3645912408828735, 1.5573923587799072, 1.7501933574676514, 1.9429945945739746, 2.1357955932617188, 2.328596591949463, 2.521397829055786, 2.7141988277435303, 2.9070000648498535, 3.0998010635375977, 3.292602300643921, 3.485403299331665, 3.6782045364379883, 3.8710055351257324, 4.063806533813477, 4.256607532501221, 4.449408531188965, 4.642210006713867, 4.835011005401611, 5.0278120040893555, 5.2206130027771, 5.413414001464844, 5.606215476989746]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 5.0, 8.0, 16.0, 20.0, 33.0, 29.0, 66.0, 76.0, 96.0, 131.0, 186.0, 285.0, 380.0, 538.0, 764.0, 1043.0, 1707.0, 2702.0, 4822.0, 10213.0, 25099.0, 69065.0, 184641.0, 334156.0, 246737.0, 100555.0, 35849.0, 13683.0, 6018.0, 3337.0, 1938.0, 1303.0, 948.0, 596.0, 444.0, 312.0, 214.0, 180.0, 104.0, 84.0, 50.0, 40.0, 25.0, 21.0, 15.0, 8.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.939453125, -3.81890869140625, -3.6983642578125, -3.57781982421875, -3.457275390625, -3.33673095703125, -3.2161865234375, -3.09564208984375, -2.97509765625, -2.85455322265625, -2.7340087890625, -2.61346435546875, -2.492919921875, -2.37237548828125, -2.2518310546875, -2.13128662109375, -2.0107421875, -1.89019775390625, -1.7696533203125, -1.64910888671875, -1.528564453125, -1.40802001953125, -1.2874755859375, -1.16693115234375, -1.04638671875, -0.92584228515625, -0.8052978515625, -0.68475341796875, -0.564208984375, -0.44366455078125, -0.3231201171875, -0.20257568359375, -0.08203125, 0.03851318359375, 0.1590576171875, 0.27960205078125, 0.400146484375, 0.52069091796875, 0.6412353515625, 0.76177978515625, 0.88232421875, 1.00286865234375, 1.1234130859375, 1.24395751953125, 1.364501953125, 1.48504638671875, 1.6055908203125, 1.72613525390625, 1.8466796875, 1.96722412109375, 2.0877685546875, 2.20831298828125, 2.328857421875, 2.44940185546875, 2.5699462890625, 2.69049072265625, 2.81103515625, 2.93157958984375, 3.0521240234375, 3.17266845703125, 3.293212890625, 3.41375732421875, 3.5343017578125, 3.65484619140625, 3.775390625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 5.0, 4.0, 12.0, 9.0, 16.0, 20.0, 26.0, 23.0, 22.0, 23.0, 33.0, 25.0, 19.0, 31.0, 29.0, 41.0, 49.0, 38.0, 34.0, 36.0, 42.0, 39.0, 26.0, 30.0, 31.0, 33.0, 37.0, 32.0, 26.0, 29.0, 20.0, 24.0, 28.0, 18.0, 14.0, 15.0, 7.0, 7.0, 7.0, 12.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.25, -6.0467529296875, -5.843505859375, -5.6402587890625, -5.43701171875, -5.2337646484375, -5.030517578125, -4.8272705078125, -4.6240234375, -4.4207763671875, -4.217529296875, -4.0142822265625, -3.81103515625, -3.6077880859375, -3.404541015625, -3.2012939453125, -2.998046875, -2.7947998046875, -2.591552734375, -2.3883056640625, -2.18505859375, -1.9818115234375, -1.778564453125, -1.5753173828125, -1.3720703125, -1.1688232421875, -0.965576171875, -0.7623291015625, -0.55908203125, -0.3558349609375, -0.152587890625, 0.0506591796875, 0.25390625, 0.4571533203125, 0.660400390625, 0.8636474609375, 1.06689453125, 1.2701416015625, 1.473388671875, 1.6766357421875, 1.8798828125, 2.0831298828125, 2.286376953125, 2.4896240234375, 2.69287109375, 2.8961181640625, 3.099365234375, 3.3026123046875, 3.505859375, 3.7091064453125, 3.912353515625, 4.1156005859375, 4.31884765625, 4.5220947265625, 4.725341796875, 4.9285888671875, 5.1318359375, 5.3350830078125, 5.538330078125, 5.7415771484375, 5.94482421875, 6.1480712890625, 6.351318359375, 6.5545654296875, 6.7578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 13.0, 21.0, 24.0, 31.0, 47.0, 55.0, 88.0, 124.0, 182.0, 283.0, 503.0, 931.0, 1884.0, 4863.0, 25716.0, 394808.0, 567779.0, 40563.0, 6043.0, 2169.0, 975.0, 512.0, 286.0, 194.0, 124.0, 91.0, 81.0, 39.0, 31.0, 28.0, 17.0, 11.0, 7.0, 4.0, 9.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.3125, -9.9580078125, -9.603515625, -9.2490234375, -8.89453125, -8.5400390625, -8.185546875, -7.8310546875, -7.4765625, -7.1220703125, -6.767578125, -6.4130859375, -6.05859375, -5.7041015625, -5.349609375, -4.9951171875, -4.640625, -4.2861328125, -3.931640625, -3.5771484375, -3.22265625, -2.8681640625, -2.513671875, -2.1591796875, -1.8046875, -1.4501953125, -1.095703125, -0.7412109375, -0.38671875, -0.0322265625, 0.322265625, 0.6767578125, 1.03125, 1.3857421875, 1.740234375, 2.0947265625, 2.44921875, 2.8037109375, 3.158203125, 3.5126953125, 3.8671875, 4.2216796875, 4.576171875, 4.9306640625, 5.28515625, 5.6396484375, 5.994140625, 6.3486328125, 6.703125, 7.0576171875, 7.412109375, 7.7666015625, 8.12109375, 8.4755859375, 8.830078125, 9.1845703125, 9.5390625, 9.8935546875, 10.248046875, 10.6025390625, 10.95703125, 11.3115234375, 11.666015625, 12.0205078125, 12.375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 8.0, 7.0, 10.0, 11.0, 11.0, 16.0, 27.0, 19.0, 17.0, 19.0, 19.0, 19.0, 24.0, 31.0, 36.0, 41.0, 48.0, 36.0, 39.0, 42.0, 30.0, 30.0, 27.0, 35.0, 34.0, 40.0, 32.0, 38.0, 36.0, 32.0, 24.0, 16.0, 20.0, 21.0, 15.0, 10.0, 10.0, 13.0, 6.0, 13.0, 9.0, 9.0, 4.0, 5.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.896484375, -3.773040771484375, -3.64959716796875, -3.526153564453125, -3.4027099609375, -3.279266357421875, -3.15582275390625, -3.032379150390625, -2.908935546875, -2.785491943359375, -2.66204833984375, -2.538604736328125, -2.4151611328125, -2.291717529296875, -2.16827392578125, -2.044830322265625, -1.92138671875, -1.797943115234375, -1.67449951171875, -1.551055908203125, -1.4276123046875, -1.304168701171875, -1.18072509765625, -1.057281494140625, -0.933837890625, -0.810394287109375, -0.68695068359375, -0.563507080078125, -0.4400634765625, -0.316619873046875, -0.19317626953125, -0.069732666015625, 0.0537109375, 0.177154541015625, 0.30059814453125, 0.424041748046875, 0.5474853515625, 0.670928955078125, 0.79437255859375, 0.917816162109375, 1.041259765625, 1.164703369140625, 1.28814697265625, 1.411590576171875, 1.5350341796875, 1.658477783203125, 1.78192138671875, 1.905364990234375, 2.02880859375, 2.152252197265625, 2.27569580078125, 2.399139404296875, 2.5225830078125, 2.646026611328125, 2.76947021484375, 2.892913818359375, 3.016357421875, 3.139801025390625, 3.26324462890625, 3.386688232421875, 3.5101318359375, 3.633575439453125, 3.75701904296875, 3.880462646484375, 4.00390625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 6.0, 8.0, 23.0, 16.0, 23.0, 43.0, 69.0, 71.0, 100.0, 163.0, 208.0, 297.0, 457.0, 742.0, 1151.0, 1790.0, 3024.0, 5777.0, 23215.0, 959705.0, 36336.0, 6409.0, 3353.0, 2011.0, 1197.0, 803.0, 477.0, 334.0, 233.0, 143.0, 107.0, 72.0, 59.0, 36.0, 19.0, 20.0, 8.0, 11.0, 9.0, 11.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.1480712890625, -5.925048828125, -5.7020263671875, -5.47900390625, -5.2559814453125, -5.032958984375, -4.8099365234375, -4.5869140625, -4.3638916015625, -4.140869140625, -3.9178466796875, -3.69482421875, -3.4718017578125, -3.248779296875, -3.0257568359375, -2.802734375, -2.5797119140625, -2.356689453125, -2.1336669921875, -1.91064453125, -1.6876220703125, -1.464599609375, -1.2415771484375, -1.0185546875, -0.7955322265625, -0.572509765625, -0.3494873046875, -0.12646484375, 0.0965576171875, 0.319580078125, 0.5426025390625, 0.765625, 0.9886474609375, 1.211669921875, 1.4346923828125, 1.65771484375, 1.8807373046875, 2.103759765625, 2.3267822265625, 2.5498046875, 2.7728271484375, 2.995849609375, 3.2188720703125, 3.44189453125, 3.6649169921875, 3.887939453125, 4.1109619140625, 4.333984375, 4.5570068359375, 4.780029296875, 5.0030517578125, 5.22607421875, 5.4490966796875, 5.672119140625, 5.8951416015625, 6.1181640625, 6.3411865234375, 6.564208984375, 6.7872314453125, 7.01025390625, 7.2332763671875, 7.456298828125, 7.6793212890625, 7.90234375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 23.0, 207.0, 560.0, 145.0, 22.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0005087852478027344, -0.0004939958453178406, -0.0004792064428329468, -0.000464417040348053, -0.0004496276378631592, -0.0004348382353782654, -0.0004200488328933716, -0.0004052594304084778, -0.000390470027923584, -0.0003756806254386902, -0.0003608912229537964, -0.0003461018204689026, -0.0003313124179840088, -0.000316523015499115, -0.0003017336130142212, -0.0002869442105293274, -0.0002721548080444336, -0.0002573654055595398, -0.000242576003074646, -0.0002277866005897522, -0.0002129971981048584, -0.0001982077956199646, -0.0001834183931350708, -0.000168628990650177, -0.0001538395881652832, -0.0001390501856803894, -0.0001242607831954956, -0.0001094713807106018, -9.468197822570801e-05, -7.989257574081421e-05, -6.510317325592041e-05, -5.031377077102661e-05, -3.552436828613281e-05, -2.0734965801239014e-05, -5.945563316345215e-06, 8.843839168548584e-06, 2.3633241653442383e-05, 3.842264413833618e-05, 5.321204662322998e-05, 6.800144910812378e-05, 8.279085159301758e-05, 9.758025407791138e-05, 0.00011236965656280518, 0.00012715905904769897, 0.00014194846153259277, 0.00015673786401748657, 0.00017152726650238037, 0.00018631666898727417, 0.00020110607147216797, 0.00021589547395706177, 0.00023068487644195557, 0.00024547427892684937, 0.00026026368141174316, 0.00027505308389663696, 0.00028984248638153076, 0.00030463188886642456, 0.00031942129135131836, 0.00033421069383621216, 0.00034900009632110596, 0.00036378949880599976, 0.00037857890129089355, 0.00039336830377578735, 0.00040815770626068115, 0.00042294710874557495, 0.00043773651123046875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 10.0, 4.0, 4.0, 12.0, 7.0, 11.0, 21.0, 32.0, 63.0, 62.0, 118.0, 161.0, 254.0, 330.0, 482.0, 593.0, 877.0, 1217.0, 1758.0, 2504.0, 3888.0, 6631.0, 16642.0, 74608.0, 493996.0, 362492.0, 51636.0, 12819.0, 5817.0, 3532.0, 2264.0, 1649.0, 1153.0, 827.0, 581.0, 429.0, 320.0, 206.0, 180.0, 94.0, 89.0, 60.0, 49.0, 22.0, 22.0, 12.0, 3.0, 13.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.658203125, -2.58203125, -2.505859375, -2.4296875, -2.353515625, -2.27734375, -2.201171875, -2.125, -2.048828125, -1.97265625, -1.896484375, -1.8203125, -1.744140625, -1.66796875, -1.591796875, -1.515625, -1.439453125, -1.36328125, -1.287109375, -1.2109375, -1.134765625, -1.05859375, -0.982421875, -0.90625, -0.830078125, -0.75390625, -0.677734375, -0.6015625, -0.525390625, -0.44921875, -0.373046875, -0.296875, -0.220703125, -0.14453125, -0.068359375, 0.0078125, 0.083984375, 0.16015625, 0.236328125, 0.3125, 0.388671875, 0.46484375, 0.541015625, 0.6171875, 0.693359375, 0.76953125, 0.845703125, 0.921875, 0.998046875, 1.07421875, 1.150390625, 1.2265625, 1.302734375, 1.37890625, 1.455078125, 1.53125, 1.607421875, 1.68359375, 1.759765625, 1.8359375, 1.912109375, 1.98828125, 2.064453125, 2.140625, 2.216796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 2.0, 13.0, 25.0, 57.0, 110.0, 147.0, 199.0, 192.0, 99.0, 64.0, 31.0, 11.0, 11.0, 6.0, 4.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61767578125, -0.599822998046875, -0.58197021484375, -0.564117431640625, -0.5462646484375, -0.528411865234375, -0.51055908203125, -0.492706298828125, -0.474853515625, -0.457000732421875, -0.43914794921875, -0.421295166015625, -0.4034423828125, -0.385589599609375, -0.36773681640625, -0.349884033203125, -0.33203125, -0.314178466796875, -0.29632568359375, -0.278472900390625, -0.2606201171875, -0.242767333984375, -0.22491455078125, -0.207061767578125, -0.189208984375, -0.171356201171875, -0.15350341796875, -0.135650634765625, -0.1177978515625, -0.099945068359375, -0.08209228515625, -0.064239501953125, -0.04638671875, -0.028533935546875, -0.01068115234375, 0.007171630859375, 0.0250244140625, 0.042877197265625, 0.06072998046875, 0.078582763671875, 0.096435546875, 0.114288330078125, 0.13214111328125, 0.149993896484375, 0.1678466796875, 0.185699462890625, 0.20355224609375, 0.221405029296875, 0.2392578125, 0.257110595703125, 0.27496337890625, 0.292816162109375, 0.3106689453125, 0.328521728515625, 0.34637451171875, 0.364227294921875, 0.382080078125, 0.399932861328125, 0.41778564453125, 0.435638427734375, 0.4534912109375, 0.471343994140625, 0.48919677734375, 0.507049560546875, 0.52490234375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 11.0, 18.0, 11.0, 24.0, 25.0, 34.0, 39.0, 37.0, 50.0, 57.0, 60.0, 66.0, 80.0, 58.0, 67.0, 56.0, 47.0, 47.0, 46.0, 28.0, 27.0, 17.0, 18.0, 14.0, 7.0, 10.0, 7.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.204133033752441, -12.830341339111328, -12.456550598144531, -12.082758903503418, -11.708967208862305, -11.335176467895508, -10.961384773254395, -10.587593078613281, -10.213802337646484, -9.840010643005371, -9.466219902038574, -9.092428207397461, -8.718636512756348, -8.344844818115234, -7.9710540771484375, -7.597262382507324, -7.223470687866211, -6.849679470062256, -6.475887775421143, -6.1020965576171875, -5.728304862976074, -5.354513645172119, -4.980722427368164, -4.606930732727051, -4.233139514923096, -3.8593480587005615, -3.4855566024780273, -3.1117653846740723, -2.737973928451538, -2.364182472229004, -1.9903912544250488, -1.6165997982025146, -1.242807388305664, -0.8690159916877747, -0.49522459506988525, -0.12143325805664062, 0.25235819816589355, 0.6261496543884277, 0.9999408721923828, 1.373732328414917, 1.7475237846374512, 2.1213152408599854, 2.4951066970825195, 2.8688979148864746, 3.242689371109009, 3.616480827331543, 3.990272045135498, 4.364063262939453, 4.737854957580566, 5.1116461753845215, 5.485437870025635, 5.85922908782959, 6.233020782470703, 6.606812000274658, 6.980603218078613, 7.354394912719727, 7.728186130523682, 8.101977348327637, 8.47576904296875, 8.849559783935547, 9.22335147857666, 9.597143173217773, 9.97093391418457, 10.344725608825684, 10.718517303466797]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 12.0, 6.0, 10.0, 15.0, 17.0, 17.0, 18.0, 24.0, 22.0, 28.0, 37.0, 24.0, 44.0, 34.0, 42.0, 32.0, 39.0, 44.0, 32.0, 47.0, 39.0, 38.0, 36.0, 50.0, 31.0, 37.0, 26.0, 19.0, 27.0, 28.0, 21.0, 22.0, 16.0, 15.0, 8.0, 7.0, 12.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.718294143676758, -6.523728847503662, -6.329163551330566, -6.134598255157471, -5.940032958984375, -5.745467662811279, -5.550902366638184, -5.356337070465088, -5.161771774291992, -4.9672064781188965, -4.772641181945801, -4.578075885772705, -4.383510589599609, -4.188945293426514, -3.994379997253418, -3.7998147010803223, -3.6052494049072266, -3.410684108734131, -3.216118812561035, -3.0215535163879395, -2.8269882202148438, -2.632422924041748, -2.4378576278686523, -2.2432923316955566, -2.048727035522461, -1.8541617393493652, -1.6595964431762695, -1.4650311470031738, -1.2704658508300781, -1.0759005546569824, -0.8813352584838867, -0.686769962310791, -0.4922051429748535, -0.2976398468017578, -0.10307455062866211, 0.0914907455444336, 0.2860560417175293, 0.480621337890625, 0.6751866340637207, 0.8697519302368164, 1.064317226409912, 1.2588825225830078, 1.4534478187561035, 1.6480131149291992, 1.842578411102295, 2.0371437072753906, 2.2317090034484863, 2.426274299621582, 2.6208395957946777, 2.8154048919677734, 3.009970188140869, 3.204535484313965, 3.3991007804870605, 3.5936660766601562, 3.788231372833252, 3.9827966690063477, 4.177361965179443, 4.371927261352539, 4.566492557525635, 4.7610578536987305, 4.955623149871826, 5.150188446044922, 5.344753742218018, 5.539319038391113, 5.733884334564209]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 6.0, 9.0, 13.0, 17.0, 26.0, 50.0, 60.0, 78.0, 115.0, 235.0, 369.0, 576.0, 1047.0, 1949.0, 4132.0, 8853.0, 19969.0, 44145.0, 92037.0, 165388.0, 223444.0, 210004.0, 139189.0, 73526.0, 34347.0, 15299.0, 6799.0, 3163.0, 1550.0, 877.0, 468.0, 298.0, 178.0, 99.0, 74.0, 36.0, 34.0, 34.0, 23.0, 14.0, 9.0, 4.0, 2.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3125, -10.9571533203125, -10.601806640625, -10.2464599609375, -9.89111328125, -9.5357666015625, -9.180419921875, -8.8250732421875, -8.4697265625, -8.1143798828125, -7.759033203125, -7.4036865234375, -7.04833984375, -6.6929931640625, -6.337646484375, -5.9822998046875, -5.626953125, -5.2716064453125, -4.916259765625, -4.5609130859375, -4.20556640625, -3.8502197265625, -3.494873046875, -3.1395263671875, -2.7841796875, -2.4288330078125, -2.073486328125, -1.7181396484375, -1.36279296875, -1.0074462890625, -0.652099609375, -0.2967529296875, 0.05859375, 0.4139404296875, 0.769287109375, 1.1246337890625, 1.47998046875, 1.8353271484375, 2.190673828125, 2.5460205078125, 2.9013671875, 3.2567138671875, 3.612060546875, 3.9674072265625, 4.32275390625, 4.6781005859375, 5.033447265625, 5.3887939453125, 5.744140625, 6.0994873046875, 6.454833984375, 6.8101806640625, 7.16552734375, 7.5208740234375, 7.876220703125, 8.2315673828125, 8.5869140625, 8.9422607421875, 9.297607421875, 9.6529541015625, 10.00830078125, 10.3636474609375, 10.718994140625, 11.0743408203125, 11.4296875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 7.0, 17.0, 19.0, 15.0, 31.0, 20.0, 37.0, 29.0, 31.0, 26.0, 44.0, 50.0, 37.0, 35.0, 42.0, 46.0, 31.0, 44.0, 49.0, 40.0, 37.0, 48.0, 29.0, 40.0, 23.0, 23.0, 17.0, 22.0, 18.0, 14.0, 10.0, 11.0, 10.0, 13.0, 6.0, 5.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0], "bins": [-8.4921875, -8.26715087890625, -8.0421142578125, -7.81707763671875, -7.592041015625, -7.36700439453125, -7.1419677734375, -6.91693115234375, -6.69189453125, -6.46685791015625, -6.2418212890625, -6.01678466796875, -5.791748046875, -5.56671142578125, -5.3416748046875, -5.11663818359375, -4.8916015625, -4.66656494140625, -4.4415283203125, -4.21649169921875, -3.991455078125, -3.76641845703125, -3.5413818359375, -3.31634521484375, -3.09130859375, -2.86627197265625, -2.6412353515625, -2.41619873046875, -2.191162109375, -1.96612548828125, -1.7410888671875, -1.51605224609375, -1.291015625, -1.06597900390625, -0.8409423828125, -0.61590576171875, -0.390869140625, -0.16583251953125, 0.0592041015625, 0.28424072265625, 0.50927734375, 0.73431396484375, 0.9593505859375, 1.18438720703125, 1.409423828125, 1.63446044921875, 1.8594970703125, 2.08453369140625, 2.3095703125, 2.53460693359375, 2.7596435546875, 2.98468017578125, 3.209716796875, 3.43475341796875, 3.6597900390625, 3.88482666015625, 4.10986328125, 4.33489990234375, 4.5599365234375, 4.78497314453125, 5.010009765625, 5.23504638671875, 5.4600830078125, 5.68511962890625, 5.91015625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 6.0, 12.0, 12.0, 18.0, 39.0, 53.0, 92.0, 112.0, 199.0, 300.0, 424.0, 776.0, 1217.0, 2093.0, 3458.0, 6111.0, 10417.0, 17163.0, 28747.0, 45408.0, 68925.0, 96808.0, 123376.0, 138664.0, 135994.0, 116469.0, 88505.0, 61812.0, 39741.0, 24532.0, 15149.0, 8917.0, 5280.0, 3046.0, 1785.0, 1121.0, 647.0, 425.0, 255.0, 175.0, 102.0, 52.0, 50.0, 30.0, 15.0, 9.0, 5.0, 9.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.7386474609375, -6.520263671875, -6.3018798828125, -6.08349609375, -5.8651123046875, -5.646728515625, -5.4283447265625, -5.2099609375, -4.9915771484375, -4.773193359375, -4.5548095703125, -4.33642578125, -4.1180419921875, -3.899658203125, -3.6812744140625, -3.462890625, -3.2445068359375, -3.026123046875, -2.8077392578125, -2.58935546875, -2.3709716796875, -2.152587890625, -1.9342041015625, -1.7158203125, -1.4974365234375, -1.279052734375, -1.0606689453125, -0.84228515625, -0.6239013671875, -0.405517578125, -0.1871337890625, 0.03125, 0.2496337890625, 0.468017578125, 0.6864013671875, 0.90478515625, 1.1231689453125, 1.341552734375, 1.5599365234375, 1.7783203125, 1.9967041015625, 2.215087890625, 2.4334716796875, 2.65185546875, 2.8702392578125, 3.088623046875, 3.3070068359375, 3.525390625, 3.7437744140625, 3.962158203125, 4.1805419921875, 4.39892578125, 4.6173095703125, 4.835693359375, 5.0540771484375, 5.2724609375, 5.4908447265625, 5.709228515625, 5.9276123046875, 6.14599609375, 6.3643798828125, 6.582763671875, 6.8011474609375, 7.01953125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 3.0, 11.0, 5.0, 2.0, 18.0, 12.0, 17.0, 14.0, 15.0, 13.0, 17.0, 23.0, 32.0, 30.0, 22.0, 34.0, 27.0, 27.0, 48.0, 35.0, 50.0, 34.0, 39.0, 39.0, 40.0, 35.0, 22.0, 34.0, 35.0, 29.0, 25.0, 29.0, 34.0, 21.0, 23.0, 17.0, 11.0, 12.0, 10.0, 7.0, 7.0, 7.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310546875, -3.192596435546875, -3.07464599609375, -2.956695556640625, -2.8387451171875, -2.720794677734375, -2.60284423828125, -2.484893798828125, -2.366943359375, -2.248992919921875, -2.13104248046875, -2.013092041015625, -1.8951416015625, -1.777191162109375, -1.65924072265625, -1.541290283203125, -1.42333984375, -1.305389404296875, -1.18743896484375, -1.069488525390625, -0.9515380859375, -0.833587646484375, -0.71563720703125, -0.597686767578125, -0.479736328125, -0.361785888671875, -0.24383544921875, -0.125885009765625, -0.0079345703125, 0.110015869140625, 0.22796630859375, 0.345916748046875, 0.4638671875, 0.581817626953125, 0.69976806640625, 0.817718505859375, 0.9356689453125, 1.053619384765625, 1.17156982421875, 1.289520263671875, 1.407470703125, 1.525421142578125, 1.64337158203125, 1.761322021484375, 1.8792724609375, 1.997222900390625, 2.11517333984375, 2.233123779296875, 2.35107421875, 2.469024658203125, 2.58697509765625, 2.704925537109375, 2.8228759765625, 2.940826416015625, 3.05877685546875, 3.176727294921875, 3.294677734375, 3.412628173828125, 3.53057861328125, 3.648529052734375, 3.7664794921875, 3.884429931640625, 4.00238037109375, 4.120330810546875, 4.23828125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 7.0, 7.0, 16.0, 19.0, 37.0, 48.0, 60.0, 84.0, 111.0, 155.0, 245.0, 337.0, 524.0, 735.0, 1221.0, 2040.0, 3607.0, 8013.0, 23412.0, 111976.0, 487378.0, 321239.0, 58931.0, 14878.0, 5826.0, 2901.0, 1628.0, 1026.0, 635.0, 446.0, 324.0, 202.0, 146.0, 77.0, 72.0, 53.0, 40.0, 24.0, 12.0, 28.0, 14.0, 2.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.734375, -16.153564453125, -15.57275390625, -14.991943359375, -14.4111328125, -13.830322265625, -13.24951171875, -12.668701171875, -12.087890625, -11.507080078125, -10.92626953125, -10.345458984375, -9.7646484375, -9.183837890625, -8.60302734375, -8.022216796875, -7.44140625, -6.860595703125, -6.27978515625, -5.698974609375, -5.1181640625, -4.537353515625, -3.95654296875, -3.375732421875, -2.794921875, -2.214111328125, -1.63330078125, -1.052490234375, -0.4716796875, 0.109130859375, 0.68994140625, 1.270751953125, 1.8515625, 2.432373046875, 3.01318359375, 3.593994140625, 4.1748046875, 4.755615234375, 5.33642578125, 5.917236328125, 6.498046875, 7.078857421875, 7.65966796875, 8.240478515625, 8.8212890625, 9.402099609375, 9.98291015625, 10.563720703125, 11.14453125, 11.725341796875, 12.30615234375, 12.886962890625, 13.4677734375, 14.048583984375, 14.62939453125, 15.210205078125, 15.791015625, 16.371826171875, 16.95263671875, 17.533447265625, 18.1142578125, 18.695068359375, 19.27587890625, 19.856689453125, 20.4375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 6.0, 5.0, 14.0, 12.0, 29.0, 36.0, 98.0, 138.0, 185.0, 161.0, 134.0, 77.0, 40.0, 25.0, 14.0, 13.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016937255859375, -0.0016478747129440308, -0.0016020238399505615, -0.0015561729669570923, -0.001510322093963623, -0.0014644712209701538, -0.0014186203479766846, -0.0013727694749832153, -0.001326918601989746, -0.0012810677289962769, -0.0012352168560028076, -0.0011893659830093384, -0.0011435151100158691, -0.0010976642370224, -0.0010518133640289307, -0.0010059624910354614, -0.0009601116180419922, -0.000914260745048523, -0.0008684098720550537, -0.0008225589990615845, -0.0007767081260681152, -0.000730857253074646, -0.0006850063800811768, -0.0006391555070877075, -0.0005933046340942383, -0.000547453761100769, -0.0005016028881072998, -0.00045575201511383057, -0.00040990114212036133, -0.0003640502691268921, -0.00031819939613342285, -0.0002723485231399536, -0.00022649765014648438, -0.00018064677715301514, -0.0001347959041595459, -8.894503116607666e-05, -4.309415817260742e-05, 2.7567148208618164e-06, 4.8607587814331055e-05, 9.445846080780029e-05, 0.00014030933380126953, 0.00018616020679473877, 0.000232011079788208, 0.00027786195278167725, 0.0003237128257751465, 0.0003695636987686157, 0.00041541457176208496, 0.0004612654447555542, 0.0005071163177490234, 0.0005529671907424927, 0.0005988180637359619, 0.0006446689367294312, 0.0006905198097229004, 0.0007363706827163696, 0.0007822215557098389, 0.0008280724287033081, 0.0008739233016967773, 0.0009197741746902466, 0.0009656250476837158, 0.001011475920677185, 0.0010573267936706543, 0.0011031776666641235, 0.0011490285396575928, 0.001194879412651062, 0.0012407302856445312]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 3.0, 4.0, 5.0, 6.0, 9.0, 18.0, 31.0, 50.0, 42.0, 73.0, 122.0, 165.0, 265.0, 338.0, 561.0, 871.0, 1302.0, 2042.0, 3399.0, 6049.0, 11858.0, 25766.0, 58971.0, 133261.0, 240420.0, 261288.0, 162024.0, 74686.0, 32503.0, 14532.0, 7344.0, 4034.0, 2313.0, 1404.0, 901.0, 609.0, 418.0, 280.0, 208.0, 109.0, 88.0, 55.0, 39.0, 29.0, 16.0, 21.0, 9.0, 11.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.140625, -7.8873291015625, -7.634033203125, -7.3807373046875, -7.12744140625, -6.8741455078125, -6.620849609375, -6.3675537109375, -6.1142578125, -5.8609619140625, -5.607666015625, -5.3543701171875, -5.10107421875, -4.8477783203125, -4.594482421875, -4.3411865234375, -4.087890625, -3.8345947265625, -3.581298828125, -3.3280029296875, -3.07470703125, -2.8214111328125, -2.568115234375, -2.3148193359375, -2.0615234375, -1.8082275390625, -1.554931640625, -1.3016357421875, -1.04833984375, -0.7950439453125, -0.541748046875, -0.2884521484375, -0.03515625, 0.2181396484375, 0.471435546875, 0.7247314453125, 0.97802734375, 1.2313232421875, 1.484619140625, 1.7379150390625, 1.9912109375, 2.2445068359375, 2.497802734375, 2.7510986328125, 3.00439453125, 3.2576904296875, 3.510986328125, 3.7642822265625, 4.017578125, 4.2708740234375, 4.524169921875, 4.7774658203125, 5.03076171875, 5.2840576171875, 5.537353515625, 5.7906494140625, 6.0439453125, 6.2972412109375, 6.550537109375, 6.8038330078125, 7.05712890625, 7.3104248046875, 7.563720703125, 7.8170166015625, 8.0703125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 1.0, 9.0, 10.0, 13.0, 15.0, 22.0, 44.0, 49.0, 50.0, 76.0, 99.0, 90.0, 91.0, 98.0, 82.0, 68.0, 50.0, 35.0, 27.0, 18.0, 11.0, 5.0, 10.0, 4.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8871307373046875, -1.822113037109375, -1.7570953369140625, -1.69207763671875, -1.6270599365234375, -1.562042236328125, -1.4970245361328125, -1.4320068359375, -1.3669891357421875, -1.301971435546875, -1.2369537353515625, -1.17193603515625, -1.1069183349609375, -1.041900634765625, -0.9768829345703125, -0.911865234375, -0.8468475341796875, -0.781829833984375, -0.7168121337890625, -0.65179443359375, -0.5867767333984375, -0.521759033203125, -0.4567413330078125, -0.3917236328125, -0.3267059326171875, -0.261688232421875, -0.1966705322265625, -0.13165283203125, -0.0666351318359375, -0.001617431640625, 0.0634002685546875, 0.12841796875, 0.1934356689453125, 0.258453369140625, 0.3234710693359375, 0.38848876953125, 0.4535064697265625, 0.518524169921875, 0.5835418701171875, 0.6485595703125, 0.7135772705078125, 0.778594970703125, 0.8436126708984375, 0.90863037109375, 0.9736480712890625, 1.038665771484375, 1.1036834716796875, 1.168701171875, 1.2337188720703125, 1.298736572265625, 1.3637542724609375, 1.42877197265625, 1.4937896728515625, 1.558807373046875, 1.6238250732421875, 1.6888427734375, 1.7538604736328125, 1.818878173828125, 1.8838958740234375, 1.94891357421875, 2.0139312744140625, 2.078948974609375, 2.1439666748046875, 2.208984375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 11.0, 5.0, 6.0, 10.0, 8.0, 16.0, 25.0, 27.0, 37.0, 42.0, 45.0, 58.0, 43.0, 60.0, 64.0, 58.0, 56.0, 64.0, 70.0, 46.0, 41.0, 34.0, 42.0, 23.0, 31.0, 10.0, 16.0, 6.0, 11.0, 1.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.284029960632324, -13.901891708374023, -13.519754409790039, -13.137616157531738, -12.755477905273438, -12.373340606689453, -11.991202354431152, -11.609064102172852, -11.226926803588867, -10.844788551330566, -10.462651252746582, -10.080513000488281, -9.69837474822998, -9.31623649597168, -8.934099197387695, -8.551960945129395, -8.169822692871094, -7.787684917449951, -7.40554666519165, -7.023408889770508, -6.641270637512207, -6.2591328620910645, -5.876995086669922, -5.494856834411621, -5.1127190589904785, -4.730581283569336, -4.348443031311035, -3.9663052558898926, -3.584167242050171, -3.202029228210449, -2.8198914527893066, -2.437753438949585, -2.055614471435547, -1.6734764575958252, -1.291338562965393, -0.9092006683349609, -0.5270626544952393, -0.14492464065551758, 0.237213134765625, 0.6193511486053467, 1.0014891624450684, 1.38362717628479, 1.7657650709152222, 2.1479029655456543, 2.530040979385376, 2.9121789932250977, 3.2943167686462402, 3.676454782485962, 4.058592796325684, 4.440730571746826, 4.822868824005127, 5.2050065994262695, 5.58714485168457, 5.969282627105713, 6.3514204025268555, 6.733558654785156, 7.115696430206299, 7.497834205627441, 7.879972457885742, 8.262109756469727, 8.644248008728027, 9.026386260986328, 9.408523559570312, 9.790661811828613, 10.172800064086914]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 9.0, 7.0, 11.0, 14.0, 19.0, 25.0, 23.0, 24.0, 40.0, 34.0, 40.0, 43.0, 36.0, 28.0, 50.0, 62.0, 42.0, 47.0, 41.0, 48.0, 44.0, 32.0, 40.0, 22.0, 32.0, 37.0, 27.0, 16.0, 20.0, 20.0, 20.0, 14.0, 3.0, 5.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.696415901184082, -7.469488143920898, -7.242560386657715, -7.0156331062316895, -6.788705348968506, -6.561777591705322, -6.334850311279297, -6.107922554016113, -5.88099479675293, -5.654067039489746, -5.4271392822265625, -5.200212001800537, -4.9732842445373535, -4.74635648727417, -4.5194292068481445, -4.292501449584961, -4.065573692321777, -3.8386459350585938, -3.6117184162139893, -3.3847908973693848, -3.157863140106201, -2.9309353828430176, -2.704007863998413, -2.4770803451538086, -2.250152587890625, -2.0232248306274414, -1.796297311782837, -1.5693696737289429, -1.3424420356750488, -1.1155143976211548, -0.8885867595672607, -0.6616591215133667, -0.43473100662231445, -0.2078033685684204, 0.019124269485473633, 0.24605190753936768, 0.4729795455932617, 0.6999071836471558, 0.9268348217010498, 1.1537624597549438, 1.380690097808838, 1.607617735862732, 1.834545373916626, 2.0614728927612305, 2.288400650024414, 2.5153284072875977, 2.742255926132202, 2.9691834449768066, 3.1961112022399902, 3.423038959503174, 3.6499664783477783, 3.876893997192383, 4.103821754455566, 4.33074951171875, 4.557677268981934, 4.784604549407959, 5.011532306671143, 5.238460063934326, 5.465387344360352, 5.692315101623535, 5.919242858886719, 6.146170616149902, 6.373098373413086, 6.600025653839111, 6.826953411102295]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 10.0, 14.0, 25.0, 32.0, 65.0, 67.0, 131.0, 218.0, 374.0, 573.0, 955.0, 1469.0, 2457.0, 3985.0, 6700.0, 11309.0, 19674.0, 34315.0, 60009.0, 105306.0, 182797.0, 305678.0, 472720.0, 639085.0, 695061.0, 593871.0, 420311.0, 265073.0, 157597.0, 90798.0, 52061.0, 29980.0, 16955.0, 9914.0, 5852.0, 3396.0, 2023.0, 1328.0, 780.0, 521.0, 275.0, 210.0, 129.0, 75.0, 38.0, 31.0, 13.0, 10.0, 4.0, 1.0, 6.0, 3.0, 1.0, 2.0], "bins": [-9.28125, -9.01123046875, -8.7412109375, -8.47119140625, -8.201171875, -7.93115234375, -7.6611328125, -7.39111328125, -7.12109375, -6.85107421875, -6.5810546875, -6.31103515625, -6.041015625, -5.77099609375, -5.5009765625, -5.23095703125, -4.9609375, -4.69091796875, -4.4208984375, -4.15087890625, -3.880859375, -3.61083984375, -3.3408203125, -3.07080078125, -2.80078125, -2.53076171875, -2.2607421875, -1.99072265625, -1.720703125, -1.45068359375, -1.1806640625, -0.91064453125, -0.640625, -0.37060546875, -0.1005859375, 0.16943359375, 0.439453125, 0.70947265625, 0.9794921875, 1.24951171875, 1.51953125, 1.78955078125, 2.0595703125, 2.32958984375, 2.599609375, 2.86962890625, 3.1396484375, 3.40966796875, 3.6796875, 3.94970703125, 4.2197265625, 4.48974609375, 4.759765625, 5.02978515625, 5.2998046875, 5.56982421875, 5.83984375, 6.10986328125, 6.3798828125, 6.64990234375, 6.919921875, 7.18994140625, 7.4599609375, 7.72998046875, 8.0]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 6.0, 12.0, 6.0, 12.0, 14.0, 8.0, 24.0, 19.0, 19.0, 27.0, 38.0, 31.0, 45.0, 27.0, 44.0, 33.0, 51.0, 53.0, 61.0, 31.0, 49.0, 33.0, 32.0, 31.0, 42.0, 37.0, 30.0, 21.0, 32.0, 23.0, 14.0, 12.0, 17.0, 20.0, 7.0, 7.0, 3.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.7921142578125, -4.631103515625, -4.4700927734375, -4.30908203125, -4.1480712890625, -3.987060546875, -3.8260498046875, -3.6650390625, -3.5040283203125, -3.343017578125, -3.1820068359375, -3.02099609375, -2.8599853515625, -2.698974609375, -2.5379638671875, -2.376953125, -2.2159423828125, -2.054931640625, -1.8939208984375, -1.73291015625, -1.5718994140625, -1.410888671875, -1.2498779296875, -1.0888671875, -0.9278564453125, -0.766845703125, -0.6058349609375, -0.44482421875, -0.2838134765625, -0.122802734375, 0.0382080078125, 0.19921875, 0.3602294921875, 0.521240234375, 0.6822509765625, 0.84326171875, 1.0042724609375, 1.165283203125, 1.3262939453125, 1.4873046875, 1.6483154296875, 1.809326171875, 1.9703369140625, 2.13134765625, 2.2923583984375, 2.453369140625, 2.6143798828125, 2.775390625, 2.9364013671875, 3.097412109375, 3.2584228515625, 3.41943359375, 3.5804443359375, 3.741455078125, 3.9024658203125, 4.0634765625, 4.2244873046875, 4.385498046875, 4.5465087890625, 4.70751953125, 4.8685302734375, 5.029541015625, 5.1905517578125, 5.3515625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 5.0, 8.0, 16.0, 24.0, 40.0, 61.0, 90.0, 126.0, 216.0, 366.0, 573.0, 1013.0, 1576.0, 2576.0, 4607.0, 7970.0, 13699.0, 23630.0, 41605.0, 71883.0, 123042.0, 203549.0, 320527.0, 464596.0, 592064.0, 632654.0, 559313.0, 421035.0, 282203.0, 175967.0, 104524.0, 61451.0, 35001.0, 20220.0, 11533.0, 6746.0, 3923.0, 2221.0, 1418.0, 880.0, 499.0, 297.0, 195.0, 129.0, 79.0, 53.0, 33.0, 21.0, 14.0, 9.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.0, -8.7218017578125, -8.443603515625, -8.1654052734375, -7.88720703125, -7.6090087890625, -7.330810546875, -7.0526123046875, -6.7744140625, -6.4962158203125, -6.218017578125, -5.9398193359375, -5.66162109375, -5.3834228515625, -5.105224609375, -4.8270263671875, -4.548828125, -4.2706298828125, -3.992431640625, -3.7142333984375, -3.43603515625, -3.1578369140625, -2.879638671875, -2.6014404296875, -2.3232421875, -2.0450439453125, -1.766845703125, -1.4886474609375, -1.21044921875, -0.9322509765625, -0.654052734375, -0.3758544921875, -0.09765625, 0.1805419921875, 0.458740234375, 0.7369384765625, 1.01513671875, 1.2933349609375, 1.571533203125, 1.8497314453125, 2.1279296875, 2.4061279296875, 2.684326171875, 2.9625244140625, 3.24072265625, 3.5189208984375, 3.797119140625, 4.0753173828125, 4.353515625, 4.6317138671875, 4.909912109375, 5.1881103515625, 5.46630859375, 5.7445068359375, 6.022705078125, 6.3009033203125, 6.5791015625, 6.8572998046875, 7.135498046875, 7.4136962890625, 7.69189453125, 7.9700927734375, 8.248291015625, 8.5264892578125, 8.8046875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 8.0, 13.0, 17.0, 24.0, 23.0, 34.0, 34.0, 59.0, 73.0, 89.0, 99.0, 111.0, 122.0, 154.0, 162.0, 201.0, 207.0, 203.0, 187.0, 254.0, 233.0, 237.0, 221.0, 186.0, 171.0, 170.0, 153.0, 117.0, 110.0, 69.0, 72.0, 56.0, 45.0, 29.0, 33.0, 15.0, 16.0, 20.0, 5.0, 10.0, 5.0, 5.0, 7.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.17352294921875, -3.0794677734375, -2.98541259765625, -2.891357421875, -2.79730224609375, -2.7032470703125, -2.60919189453125, -2.51513671875, -2.42108154296875, -2.3270263671875, -2.23297119140625, -2.138916015625, -2.04486083984375, -1.9508056640625, -1.85675048828125, -1.7626953125, -1.66864013671875, -1.5745849609375, -1.48052978515625, -1.386474609375, -1.29241943359375, -1.1983642578125, -1.10430908203125, -1.01025390625, -0.91619873046875, -0.8221435546875, -0.72808837890625, -0.634033203125, -0.53997802734375, -0.4459228515625, -0.35186767578125, -0.2578125, -0.16375732421875, -0.0697021484375, 0.02435302734375, 0.118408203125, 0.21246337890625, 0.3065185546875, 0.40057373046875, 0.49462890625, 0.58868408203125, 0.6827392578125, 0.77679443359375, 0.870849609375, 0.96490478515625, 1.0589599609375, 1.15301513671875, 1.2470703125, 1.34112548828125, 1.4351806640625, 1.52923583984375, 1.623291015625, 1.71734619140625, 1.8114013671875, 1.90545654296875, 1.99951171875, 2.09356689453125, 2.1876220703125, 2.28167724609375, 2.375732421875, 2.46978759765625, 2.5638427734375, 2.65789794921875, 2.751953125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 9.0, 4.0, 10.0, 8.0, 12.0, 14.0, 14.0, 21.0, 32.0, 41.0, 41.0, 42.0, 67.0, 66.0, 79.0, 79.0, 81.0, 72.0, 53.0, 49.0, 35.0, 39.0, 32.0, 25.0, 23.0, 13.0, 15.0, 5.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.268253326416016, -16.817340850830078, -16.36642837524414, -15.915514945983887, -15.464601516723633, -15.013689041137695, -14.562776565551758, -14.111863136291504, -13.66094970703125, -13.210037231445312, -12.759123802185059, -12.308211326599121, -11.857297897338867, -11.40638542175293, -10.955472946166992, -10.504559516906738, -10.0536470413208, -9.602734565734863, -9.15182113647461, -8.700908660888672, -8.249995231628418, -7.7990827560424805, -7.348169803619385, -6.897256851196289, -6.446343898773193, -5.995430946350098, -5.544517993927002, -5.093605041503906, -4.642692565917969, -4.191779136657715, -3.7408666610717773, -3.2899537086486816, -2.8390398025512695, -2.388126850128174, -1.9372140169143677, -1.4863011837005615, -1.0353882312774658, -0.5844752788543701, -0.13356256484985352, 0.3173503875732422, 0.7682633399963379, 1.2191762924194336, 1.6700891256332397, 2.121001958847046, 2.5719149112701416, 3.0228278636932373, 3.473740577697754, 3.9246535301208496, 4.375566482543945, 4.826479434967041, 5.277392387390137, 5.728304862976074, 6.179218292236328, 6.630130767822266, 7.081043720245361, 7.531956672668457, 7.982869625091553, 8.433782577514648, 8.884695053100586, 9.33560848236084, 9.786520957946777, 10.237434387207031, 10.688346862792969, 11.139259338378906, 11.59017276763916]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 10.0, 5.0, 4.0, 12.0, 12.0, 17.0, 28.0, 21.0, 34.0, 21.0, 32.0, 39.0, 43.0, 44.0, 45.0, 41.0, 44.0, 58.0, 56.0, 50.0, 49.0, 46.0, 46.0, 42.0, 27.0, 31.0, 26.0, 21.0, 15.0, 12.0, 18.0, 8.0, 13.0, 5.0, 4.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-8.761787414550781, -8.533682823181152, -8.305578231811523, -8.077473640441895, -7.849369049072266, -7.621264457702637, -7.393160343170166, -7.165055751800537, -6.936951160430908, -6.708846569061279, -6.48074197769165, -6.2526373863220215, -6.024533271789551, -5.796428680419922, -5.568324089050293, -5.340219497680664, -5.112114906311035, -4.884010314941406, -4.655905723571777, -4.427801132202148, -4.1996965408325195, -3.9715921878814697, -3.74348783493042, -3.515383243560791, -3.287278652191162, -3.059174060821533, -2.8310694694519043, -2.6029651165008545, -2.3748605251312256, -2.1467559337615967, -1.9186514616012573, -1.690546989440918, -1.462442398071289, -1.2343378067016602, -1.0062333345413208, -0.7781288027763367, -0.5500242710113525, -0.32191967964172363, -0.09381520748138428, 0.13428926467895508, 0.362393856048584, 0.5904983878135681, 0.8186029195785522, 1.0467073917388916, 1.2748119831085205, 1.5029165744781494, 1.7310210466384888, 1.9591255187988281, 2.187230110168457, 2.415334701538086, 2.643439292907715, 2.8715436458587646, 3.0996482372283936, 3.3277528285980225, 3.5558571815490723, 3.783961772918701, 4.01206636428833, 4.240170955657959, 4.468275547027588, 4.696380138397217, 4.9244842529296875, 5.152588844299316, 5.380693435668945, 5.608798027038574, 5.836902618408203]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 11.0, 22.0, 24.0, 50.0, 78.0, 159.0, 246.0, 419.0, 648.0, 1200.0, 1923.0, 3267.0, 5456.0, 9440.0, 16138.0, 27087.0, 45115.0, 73190.0, 113043.0, 156406.0, 175329.0, 147765.0, 104259.0, 67130.0, 40699.0, 24500.0, 14369.0, 8338.0, 4928.0, 2950.0, 1785.0, 990.0, 602.0, 381.0, 210.0, 162.0, 86.0, 49.0, 35.0, 21.0, 11.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5869140625, -1.5347137451171875, -1.482513427734375, -1.4303131103515625, -1.37811279296875, -1.3259124755859375, -1.273712158203125, -1.2215118408203125, -1.1693115234375, -1.1171112060546875, -1.064910888671875, -1.0127105712890625, -0.96051025390625, -0.9083099365234375, -0.856109619140625, -0.8039093017578125, -0.751708984375, -0.6995086669921875, -0.647308349609375, -0.5951080322265625, -0.54290771484375, -0.4907073974609375, -0.438507080078125, -0.3863067626953125, -0.3341064453125, -0.2819061279296875, -0.229705810546875, -0.1775054931640625, -0.12530517578125, -0.0731048583984375, -0.020904541015625, 0.0312957763671875, 0.08349609375, 0.1356964111328125, 0.187896728515625, 0.2400970458984375, 0.29229736328125, 0.3444976806640625, 0.396697998046875, 0.4488983154296875, 0.5010986328125, 0.5532989501953125, 0.605499267578125, 0.6576995849609375, 0.70989990234375, 0.7621002197265625, 0.814300537109375, 0.8665008544921875, 0.918701171875, 0.9709014892578125, 1.023101806640625, 1.0753021240234375, 1.12750244140625, 1.1797027587890625, 1.231903076171875, 1.2841033935546875, 1.3363037109375, 1.3885040283203125, 1.440704345703125, 1.4929046630859375, 1.54510498046875, 1.5973052978515625, 1.649505615234375, 1.7017059326171875, 1.75390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 6.0, 10.0, 14.0, 9.0, 21.0, 19.0, 23.0, 30.0, 17.0, 36.0, 34.0, 39.0, 44.0, 57.0, 41.0, 44.0, 50.0, 49.0, 57.0, 50.0, 46.0, 32.0, 45.0, 34.0, 35.0, 19.0, 29.0, 18.0, 17.0, 14.0, 10.0, 5.0, 6.0, 7.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-9.234375, -8.989501953125, -8.74462890625, -8.499755859375, -8.2548828125, -8.010009765625, -7.76513671875, -7.520263671875, -7.275390625, -7.030517578125, -6.78564453125, -6.540771484375, -6.2958984375, -6.051025390625, -5.80615234375, -5.561279296875, -5.31640625, -5.071533203125, -4.82666015625, -4.581787109375, -4.3369140625, -4.092041015625, -3.84716796875, -3.602294921875, -3.357421875, -3.112548828125, -2.86767578125, -2.622802734375, -2.3779296875, -2.133056640625, -1.88818359375, -1.643310546875, -1.3984375, -1.153564453125, -0.90869140625, -0.663818359375, -0.4189453125, -0.174072265625, 0.07080078125, 0.315673828125, 0.560546875, 0.805419921875, 1.05029296875, 1.295166015625, 1.5400390625, 1.784912109375, 2.02978515625, 2.274658203125, 2.51953125, 2.764404296875, 3.00927734375, 3.254150390625, 3.4990234375, 3.743896484375, 3.98876953125, 4.233642578125, 4.478515625, 4.723388671875, 4.96826171875, 5.213134765625, 5.4580078125, 5.702880859375, 5.94775390625, 6.192626953125, 6.4375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 9.0, 8.0, 10.0, 26.0, 37.0, 34.0, 56.0, 90.0, 137.0, 216.0, 385.0, 650.0, 1138.0, 1858.0, 3191.0, 5793.0, 10453.0, 19620.0, 36328.0, 68572.0, 121530.0, 185814.0, 210865.0, 162969.0, 100281.0, 54822.0, 28708.0, 15551.0, 8372.0, 4705.0, 2550.0, 1485.0, 894.0, 523.0, 307.0, 193.0, 121.0, 91.0, 46.0, 37.0, 33.0, 18.0, 11.0, 6.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.111328125, -2.04168701171875, -1.9720458984375, -1.90240478515625, -1.832763671875, -1.76312255859375, -1.6934814453125, -1.62384033203125, -1.55419921875, -1.48455810546875, -1.4149169921875, -1.34527587890625, -1.275634765625, -1.20599365234375, -1.1363525390625, -1.06671142578125, -0.9970703125, -0.92742919921875, -0.8577880859375, -0.78814697265625, -0.718505859375, -0.64886474609375, -0.5792236328125, -0.50958251953125, -0.43994140625, -0.37030029296875, -0.3006591796875, -0.23101806640625, -0.161376953125, -0.09173583984375, -0.0220947265625, 0.04754638671875, 0.1171875, 0.18682861328125, 0.2564697265625, 0.32611083984375, 0.395751953125, 0.46539306640625, 0.5350341796875, 0.60467529296875, 0.67431640625, 0.74395751953125, 0.8135986328125, 0.88323974609375, 0.952880859375, 1.02252197265625, 1.0921630859375, 1.16180419921875, 1.2314453125, 1.30108642578125, 1.3707275390625, 1.44036865234375, 1.510009765625, 1.57965087890625, 1.6492919921875, 1.71893310546875, 1.78857421875, 1.85821533203125, 1.9278564453125, 1.99749755859375, 2.067138671875, 2.13677978515625, 2.2064208984375, 2.27606201171875, 2.345703125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 10.0, 9.0, 15.0, 18.0, 22.0, 27.0, 29.0, 28.0, 34.0, 31.0, 28.0, 40.0, 28.0, 46.0, 33.0, 40.0, 42.0, 45.0, 37.0, 43.0, 31.0, 43.0, 29.0, 30.0, 31.0, 32.0, 16.0, 28.0, 17.0, 24.0, 18.0, 18.0, 14.0, 10.0, 8.0, 5.0, 3.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.07861328125, -3.9501953125, -3.82177734375, -3.693359375, -3.56494140625, -3.4365234375, -3.30810546875, -3.1796875, -3.05126953125, -2.9228515625, -2.79443359375, -2.666015625, -2.53759765625, -2.4091796875, -2.28076171875, -2.15234375, -2.02392578125, -1.8955078125, -1.76708984375, -1.638671875, -1.51025390625, -1.3818359375, -1.25341796875, -1.125, -0.99658203125, -0.8681640625, -0.73974609375, -0.611328125, -0.48291015625, -0.3544921875, -0.22607421875, -0.09765625, 0.03076171875, 0.1591796875, 0.28759765625, 0.416015625, 0.54443359375, 0.6728515625, 0.80126953125, 0.9296875, 1.05810546875, 1.1865234375, 1.31494140625, 1.443359375, 1.57177734375, 1.7001953125, 1.82861328125, 1.95703125, 2.08544921875, 2.2138671875, 2.34228515625, 2.470703125, 2.59912109375, 2.7275390625, 2.85595703125, 2.984375, 3.11279296875, 3.2412109375, 3.36962890625, 3.498046875, 3.62646484375, 3.7548828125, 3.88330078125, 4.01171875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 13.0, 12.0, 13.0, 34.0, 38.0, 60.0, 88.0, 169.0, 278.0, 443.0, 834.0, 1512.0, 3077.0, 6435.0, 14412.0, 33963.0, 84633.0, 198831.0, 316043.0, 221492.0, 96440.0, 39121.0, 16104.0, 7131.0, 3400.0, 1771.0, 931.0, 526.0, 265.0, 174.0, 101.0, 61.0, 45.0, 31.0, 25.0, 19.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.72314453125, -0.7002410888671875, -0.677337646484375, -0.6544342041015625, -0.63153076171875, -0.6086273193359375, -0.585723876953125, -0.5628204345703125, -0.5399169921875, -0.5170135498046875, -0.494110107421875, -0.4712066650390625, -0.44830322265625, -0.4253997802734375, -0.402496337890625, -0.3795928955078125, -0.356689453125, -0.3337860107421875, -0.310882568359375, -0.2879791259765625, -0.26507568359375, -0.2421722412109375, -0.219268798828125, -0.1963653564453125, -0.1734619140625, -0.1505584716796875, -0.127655029296875, -0.1047515869140625, -0.08184814453125, -0.0589447021484375, -0.036041259765625, -0.0131378173828125, 0.009765625, 0.0326690673828125, 0.055572509765625, 0.0784759521484375, 0.10137939453125, 0.1242828369140625, 0.147186279296875, 0.1700897216796875, 0.1929931640625, 0.2158966064453125, 0.238800048828125, 0.2617034912109375, 0.28460693359375, 0.3075103759765625, 0.330413818359375, 0.3533172607421875, 0.376220703125, 0.3991241455078125, 0.422027587890625, 0.4449310302734375, 0.46783447265625, 0.4907379150390625, 0.513641357421875, 0.5365447998046875, 0.5594482421875, 0.5823516845703125, 0.605255126953125, 0.6281585693359375, 0.65106201171875, 0.6739654541015625, 0.696868896484375, 0.7197723388671875, 0.74267578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 7.0, 8.0, 9.0, 9.0, 24.0, 19.0, 17.0, 29.0, 39.0, 35.0, 50.0, 42.0, 40.0, 49.0, 41.0, 53.0, 55.0, 50.0, 47.0, 58.0, 54.0, 46.0, 33.0, 31.0, 23.0, 16.0, 18.0, 18.0, 10.0, 11.0, 13.0, 9.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.075599670410156e-05, -2.9777176678180695e-05, -2.8798356652259827e-05, -2.781953662633896e-05, -2.684071660041809e-05, -2.5861896574497223e-05, -2.4883076548576355e-05, -2.3904256522655487e-05, -2.292543649673462e-05, -2.194661647081375e-05, -2.0967796444892883e-05, -1.9988976418972015e-05, -1.9010156393051147e-05, -1.803133636713028e-05, -1.705251634120941e-05, -1.6073696315288544e-05, -1.5094876289367676e-05, -1.4116056263446808e-05, -1.313723623752594e-05, -1.2158416211605072e-05, -1.1179596185684204e-05, -1.0200776159763336e-05, -9.221956133842468e-06, -8.2431361079216e-06, -7.264316082000732e-06, -6.2854960560798645e-06, -5.306676030158997e-06, -4.327856004238129e-06, -3.3490359783172607e-06, -2.370215952396393e-06, -1.391395926475525e-06, -4.12575900554657e-07, 5.662441253662109e-07, 1.5450641512870789e-06, 2.5238841772079468e-06, 3.5027042031288147e-06, 4.481524229049683e-06, 5.4603442549705505e-06, 6.4391642808914185e-06, 7.417984306812286e-06, 8.396804332733154e-06, 9.375624358654022e-06, 1.035444438457489e-05, 1.1333264410495758e-05, 1.2312084436416626e-05, 1.3290904462337494e-05, 1.4269724488258362e-05, 1.524854451417923e-05, 1.6227364540100098e-05, 1.7206184566020966e-05, 1.8185004591941833e-05, 1.91638246178627e-05, 2.014264464378357e-05, 2.1121464669704437e-05, 2.2100284695625305e-05, 2.3079104721546173e-05, 2.405792474746704e-05, 2.503674477338791e-05, 2.6015564799308777e-05, 2.6994384825229645e-05, 2.7973204851150513e-05, 2.895202487707138e-05, 2.993084490299225e-05, 3.0909664928913116e-05, 3.1888484954833984e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 10.0, 5.0, 12.0, 13.0, 24.0, 42.0, 64.0, 74.0, 107.0, 166.0, 273.0, 432.0, 706.0, 1039.0, 1727.0, 2741.0, 4268.0, 7107.0, 11576.0, 18975.0, 31872.0, 52899.0, 86655.0, 135535.0, 184730.0, 178245.0, 126829.0, 80053.0, 48063.0, 29315.0, 17307.0, 10511.0, 6319.0, 4057.0, 2400.0, 1584.0, 961.0, 658.0, 423.0, 244.0, 173.0, 126.0, 72.0, 66.0, 28.0, 17.0, 17.0, 11.0, 14.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.5302734375, -0.5136566162109375, -0.497039794921875, -0.4804229736328125, -0.46380615234375, -0.4471893310546875, -0.430572509765625, -0.4139556884765625, -0.3973388671875, -0.3807220458984375, -0.364105224609375, -0.3474884033203125, -0.33087158203125, -0.3142547607421875, -0.297637939453125, -0.2810211181640625, -0.264404296875, -0.2477874755859375, -0.231170654296875, -0.2145538330078125, -0.19793701171875, -0.1813201904296875, -0.164703369140625, -0.1480865478515625, -0.1314697265625, -0.1148529052734375, -0.098236083984375, -0.0816192626953125, -0.06500244140625, -0.0483856201171875, -0.031768798828125, -0.0151519775390625, 0.00146484375, 0.0180816650390625, 0.034698486328125, 0.0513153076171875, 0.06793212890625, 0.0845489501953125, 0.101165771484375, 0.1177825927734375, 0.1343994140625, 0.1510162353515625, 0.167633056640625, 0.1842498779296875, 0.20086669921875, 0.2174835205078125, 0.234100341796875, 0.2507171630859375, 0.267333984375, 0.2839508056640625, 0.300567626953125, 0.3171844482421875, 0.33380126953125, 0.3504180908203125, 0.367034912109375, 0.3836517333984375, 0.4002685546875, 0.4168853759765625, 0.433502197265625, 0.4501190185546875, 0.46673583984375, 0.4833526611328125, 0.499969482421875, 0.5165863037109375, 0.533203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 5.0, 13.0, 10.0, 10.0, 14.0, 19.0, 30.0, 38.0, 42.0, 48.0, 39.0, 63.0, 64.0, 79.0, 65.0, 69.0, 71.0, 55.0, 53.0, 45.0, 37.0, 27.0, 22.0, 13.0, 12.0, 15.0, 7.0, 11.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13671875, -0.1316852569580078, -0.12665176391601562, -0.12161827087402344, -0.11658477783203125, -0.11155128479003906, -0.10651779174804688, -0.10148429870605469, -0.0964508056640625, -0.09141731262207031, -0.08638381958007812, -0.08135032653808594, -0.07631683349609375, -0.07128334045410156, -0.06624984741210938, -0.06121635437011719, -0.056182861328125, -0.05114936828613281, -0.046115875244140625, -0.04108238220214844, -0.03604888916015625, -0.031015396118164062, -0.025981903076171875, -0.020948410034179688, -0.0159149169921875, -0.010881423950195312, -0.005847930908203125, -0.0008144378662109375, 0.00421905517578125, 0.009252548217773438, 0.014286041259765625, 0.019319534301757812, 0.02435302734375, 0.029386520385742188, 0.034420013427734375, 0.03945350646972656, 0.04448699951171875, 0.04952049255371094, 0.054553985595703125, 0.05958747863769531, 0.0646209716796875, 0.06965446472167969, 0.07468795776367188, 0.07972145080566406, 0.08475494384765625, 0.08978843688964844, 0.09482192993164062, 0.09985542297363281, 0.104888916015625, 0.10992240905761719, 0.11495590209960938, 0.11998939514160156, 0.12502288818359375, 0.13005638122558594, 0.13508987426757812, 0.1401233673095703, 0.1451568603515625, 0.1501903533935547, 0.15522384643554688, 0.16025733947753906, 0.16529083251953125, 0.17032432556152344, 0.17535781860351562, 0.1803913116455078, 0.1854248046875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 8.0, 2.0, 11.0, 7.0, 12.0, 12.0, 17.0, 24.0, 32.0, 43.0, 33.0, 52.0, 64.0, 76.0, 77.0, 73.0, 88.0, 70.0, 48.0, 44.0, 42.0, 33.0, 34.0, 27.0, 19.0, 15.0, 10.0, 5.0, 5.0, 10.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.290966033935547, -16.8377628326416, -16.384557723999023, -15.931354522705078, -15.478150367736816, -15.024946212768555, -14.57174301147461, -14.118538856506348, -13.665334701538086, -13.212130546569824, -12.758927345275879, -12.305723190307617, -11.852519035339355, -11.399314880371094, -10.946111679077148, -10.492907524108887, -10.039703369140625, -9.586499214172363, -9.133296012878418, -8.680091857910156, -8.226887702941895, -7.773684024810791, -7.3204803466796875, -6.867276191711426, -6.4140729904174805, -5.960869312286377, -5.507665157318115, -5.054461479187012, -4.60125732421875, -4.1480536460876465, -3.694849729537964, -3.2416458129882812, -2.7884416580200195, -2.335237741470337, -1.8820338249206543, -1.4288300275802612, -0.9756261110305786, -0.5224223136901855, -0.06921839714050293, 0.3839855194091797, 0.8371894359588623, 1.290393352508545, 1.7435972690582275, 2.19680118560791, 2.6500048637390137, 3.1032087802886963, 3.556412696838379, 4.009616851806641, 4.462820529937744, 4.916024208068848, 5.369228363037109, 5.822432041168213, 6.275636196136475, 6.728839874267578, 7.18204402923584, 7.635247707366943, 8.088451385498047, 8.541655540466309, 8.994858741760254, 9.448062896728516, 9.901267051696777, 10.354471206665039, 10.807674407958984, 11.260878562927246, 11.714082717895508]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 4.0, 5.0, 11.0, 13.0, 15.0, 28.0, 26.0, 29.0, 23.0, 30.0, 44.0, 36.0, 49.0, 40.0, 44.0, 41.0, 56.0, 62.0, 48.0, 50.0, 48.0, 46.0, 37.0, 28.0, 33.0, 28.0, 20.0, 10.0, 18.0, 15.0, 8.0, 13.0, 6.0, 4.0, 5.0, 6.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-8.719562530517578, -8.492415428161621, -8.265268325805664, -8.03812026977539, -7.810973644256592, -7.583826065063477, -7.3566789627075195, -7.1295318603515625, -6.9023847579956055, -6.675237655639648, -6.448090076446533, -6.220942974090576, -5.993795871734619, -5.766648292541504, -5.539501190185547, -5.31235408782959, -5.085206508636475, -4.858059406280518, -4.630911827087402, -4.403764724731445, -4.176617622375488, -3.949470281600952, -3.722322940826416, -3.495175838470459, -3.268028497695923, -3.0408811569213867, -2.8137340545654297, -2.5865867137908936, -2.3594393730163574, -2.1322922706604004, -1.9051449298858643, -1.6779977083206177, -1.4508509635925293, -1.2237037420272827, -0.9965564608573914, -0.7694091796875, -0.5422619581222534, -0.31511473655700684, -0.0879673957824707, 0.13917982578277588, 0.36632704734802246, 0.593474268913269, 0.8206215500831604, 1.0477688312530518, 1.2749160528182983, 1.502063274383545, 1.729210615158081, 1.9563578367233276, 2.183505058288574, 2.4106523990631104, 2.6377995014190674, 2.8649468421936035, 3.0920939445495605, 3.3192412853240967, 3.546388626098633, 3.77353572845459, 4.000682830810547, 4.227829933166504, 4.454977512359619, 4.682124614715576, 4.909271717071533, 5.136419296264648, 5.3635663986206055, 5.5907135009765625, 5.817861080169678]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 11.0, 17.0, 30.0, 30.0, 43.0, 84.0, 140.0, 171.0, 260.0, 430.0, 613.0, 1031.0, 1671.0, 2675.0, 4364.0, 7127.0, 12436.0, 21265.0, 36304.0, 60539.0, 93920.0, 130974.0, 157377.0, 155630.0, 128138.0, 90589.0, 57820.0, 34633.0, 20211.0, 11967.0, 7039.0, 4031.0, 2510.0, 1506.0, 1031.0, 639.0, 434.0, 270.0, 156.0, 128.0, 104.0, 54.0, 43.0, 32.0, 19.0, 15.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-8.1171875, -7.85498046875, -7.5927734375, -7.33056640625, -7.068359375, -6.80615234375, -6.5439453125, -6.28173828125, -6.01953125, -5.75732421875, -5.4951171875, -5.23291015625, -4.970703125, -4.70849609375, -4.4462890625, -4.18408203125, -3.921875, -3.65966796875, -3.3974609375, -3.13525390625, -2.873046875, -2.61083984375, -2.3486328125, -2.08642578125, -1.82421875, -1.56201171875, -1.2998046875, -1.03759765625, -0.775390625, -0.51318359375, -0.2509765625, 0.01123046875, 0.2734375, 0.53564453125, 0.7978515625, 1.06005859375, 1.322265625, 1.58447265625, 1.8466796875, 2.10888671875, 2.37109375, 2.63330078125, 2.8955078125, 3.15771484375, 3.419921875, 3.68212890625, 3.9443359375, 4.20654296875, 4.46875, 4.73095703125, 4.9931640625, 5.25537109375, 5.517578125, 5.77978515625, 6.0419921875, 6.30419921875, 6.56640625, 6.82861328125, 7.0908203125, 7.35302734375, 7.615234375, 7.87744140625, 8.1396484375, 8.40185546875, 8.6640625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 3.0, 7.0, 8.0, 12.0, 15.0, 12.0, 18.0, 27.0, 31.0, 18.0, 24.0, 14.0, 34.0, 49.0, 36.0, 43.0, 46.0, 45.0, 40.0, 62.0, 39.0, 40.0, 35.0, 56.0, 38.0, 34.0, 32.0, 30.0, 23.0, 21.0, 18.0, 16.0, 13.0, 13.0, 9.0, 9.0, 10.0, 4.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.52734375, -7.2984619140625, -7.069580078125, -6.8406982421875, -6.61181640625, -6.3829345703125, -6.154052734375, -5.9251708984375, -5.6962890625, -5.4674072265625, -5.238525390625, -5.0096435546875, -4.78076171875, -4.5518798828125, -4.322998046875, -4.0941162109375, -3.865234375, -3.6363525390625, -3.407470703125, -3.1785888671875, -2.94970703125, -2.7208251953125, -2.491943359375, -2.2630615234375, -2.0341796875, -1.8052978515625, -1.576416015625, -1.3475341796875, -1.11865234375, -0.8897705078125, -0.660888671875, -0.4320068359375, -0.203125, 0.0257568359375, 0.254638671875, 0.4835205078125, 0.71240234375, 0.9412841796875, 1.170166015625, 1.3990478515625, 1.6279296875, 1.8568115234375, 2.085693359375, 2.3145751953125, 2.54345703125, 2.7723388671875, 3.001220703125, 3.2301025390625, 3.458984375, 3.6878662109375, 3.916748046875, 4.1456298828125, 4.37451171875, 4.6033935546875, 4.832275390625, 5.0611572265625, 5.2900390625, 5.5189208984375, 5.747802734375, 5.9766845703125, 6.20556640625, 6.4344482421875, 6.663330078125, 6.8922119140625, 7.12109375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [7.0, 4.0, 2.0, 4.0, 11.0, 22.0, 34.0, 46.0, 62.0, 128.0, 177.0, 286.0, 442.0, 702.0, 1058.0, 1700.0, 2546.0, 4107.0, 6187.0, 9539.0, 14696.0, 22311.0, 33202.0, 48143.0, 66772.0, 87255.0, 106146.0, 118056.0, 118024.0, 106333.0, 87511.0, 67071.0, 48214.0, 33218.0, 22635.0, 14707.0, 9755.0, 6192.0, 3991.0, 2625.0, 1678.0, 1080.0, 710.0, 438.0, 264.0, 166.0, 119.0, 68.0, 54.0, 29.0, 14.0, 14.0, 10.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.53125, -5.333740234375, -5.13623046875, -4.938720703125, -4.7412109375, -4.543701171875, -4.34619140625, -4.148681640625, -3.951171875, -3.753662109375, -3.55615234375, -3.358642578125, -3.1611328125, -2.963623046875, -2.76611328125, -2.568603515625, -2.37109375, -2.173583984375, -1.97607421875, -1.778564453125, -1.5810546875, -1.383544921875, -1.18603515625, -0.988525390625, -0.791015625, -0.593505859375, -0.39599609375, -0.198486328125, -0.0009765625, 0.196533203125, 0.39404296875, 0.591552734375, 0.7890625, 0.986572265625, 1.18408203125, 1.381591796875, 1.5791015625, 1.776611328125, 1.97412109375, 2.171630859375, 2.369140625, 2.566650390625, 2.76416015625, 2.961669921875, 3.1591796875, 3.356689453125, 3.55419921875, 3.751708984375, 3.94921875, 4.146728515625, 4.34423828125, 4.541748046875, 4.7392578125, 4.936767578125, 5.13427734375, 5.331787109375, 5.529296875, 5.726806640625, 5.92431640625, 6.121826171875, 6.3193359375, 6.516845703125, 6.71435546875, 6.911865234375, 7.109375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 8.0, 14.0, 11.0, 10.0, 21.0, 30.0, 22.0, 28.0, 37.0, 44.0, 41.0, 36.0, 47.0, 38.0, 46.0, 34.0, 55.0, 33.0, 50.0, 37.0, 32.0, 46.0, 36.0, 30.0, 31.0, 24.0, 28.0, 29.0, 14.0, 10.0, 16.0, 10.0, 8.0, 3.0, 4.0, 7.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.39166259765625, -4.2442626953125, -4.09686279296875, -3.949462890625, -3.80206298828125, -3.6546630859375, -3.50726318359375, -3.35986328125, -3.21246337890625, -3.0650634765625, -2.91766357421875, -2.770263671875, -2.62286376953125, -2.4754638671875, -2.32806396484375, -2.1806640625, -2.03326416015625, -1.8858642578125, -1.73846435546875, -1.591064453125, -1.44366455078125, -1.2962646484375, -1.14886474609375, -1.00146484375, -0.85406494140625, -0.7066650390625, -0.55926513671875, -0.411865234375, -0.26446533203125, -0.1170654296875, 0.03033447265625, 0.177734375, 0.32513427734375, 0.4725341796875, 0.61993408203125, 0.767333984375, 0.91473388671875, 1.0621337890625, 1.20953369140625, 1.35693359375, 1.50433349609375, 1.6517333984375, 1.79913330078125, 1.946533203125, 2.09393310546875, 2.2413330078125, 2.38873291015625, 2.5361328125, 2.68353271484375, 2.8309326171875, 2.97833251953125, 3.125732421875, 3.27313232421875, 3.4205322265625, 3.56793212890625, 3.71533203125, 3.86273193359375, 4.0101318359375, 4.15753173828125, 4.304931640625, 4.45233154296875, 4.5997314453125, 4.74713134765625, 4.89453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 10.0, 9.0, 10.0, 15.0, 17.0, 31.0, 36.0, 40.0, 69.0, 100.0, 153.0, 272.0, 363.0, 633.0, 1197.0, 2343.0, 4596.0, 9938.0, 24586.0, 87251.0, 486838.0, 335710.0, 58914.0, 18983.0, 8038.0, 3882.0, 1902.0, 1024.0, 558.0, 317.0, 217.0, 139.0, 106.0, 62.0, 58.0, 34.0, 28.0, 19.0, 11.0, 16.0, 9.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-25.40625, -24.63330078125, -23.8603515625, -23.08740234375, -22.314453125, -21.54150390625, -20.7685546875, -19.99560546875, -19.22265625, -18.44970703125, -17.6767578125, -16.90380859375, -16.130859375, -15.35791015625, -14.5849609375, -13.81201171875, -13.0390625, -12.26611328125, -11.4931640625, -10.72021484375, -9.947265625, -9.17431640625, -8.4013671875, -7.62841796875, -6.85546875, -6.08251953125, -5.3095703125, -4.53662109375, -3.763671875, -2.99072265625, -2.2177734375, -1.44482421875, -0.671875, 0.10107421875, 0.8740234375, 1.64697265625, 2.419921875, 3.19287109375, 3.9658203125, 4.73876953125, 5.51171875, 6.28466796875, 7.0576171875, 7.83056640625, 8.603515625, 9.37646484375, 10.1494140625, 10.92236328125, 11.6953125, 12.46826171875, 13.2412109375, 14.01416015625, 14.787109375, 15.56005859375, 16.3330078125, 17.10595703125, 17.87890625, 18.65185546875, 19.4248046875, 20.19775390625, 20.970703125, 21.74365234375, 22.5166015625, 23.28955078125, 24.0625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 1.0, 4.0, 8.0, 11.0, 10.0, 14.0, 21.0, 26.0, 56.0, 86.0, 104.0, 127.0, 141.0, 110.0, 85.0, 47.0, 41.0, 27.0, 15.0, 14.0, 11.0, 6.0, 11.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0014247894287109375, -0.0013841241598129272, -0.001343458890914917, -0.0013027936220169067, -0.0012621283531188965, -0.0012214630842208862, -0.001180797815322876, -0.0011401325464248657, -0.0010994672775268555, -0.0010588020086288452, -0.001018136739730835, -0.0009774714708328247, -0.0009368062019348145, -0.0008961409330368042, -0.0008554756641387939, -0.0008148103952407837, -0.0007741451263427734, -0.0007334798574447632, -0.0006928145885467529, -0.0006521493196487427, -0.0006114840507507324, -0.0005708187818527222, -0.0005301535129547119, -0.0004894882440567017, -0.0004488229751586914, -0.00040815770626068115, -0.0003674924373626709, -0.00032682716846466064, -0.0002861618995666504, -0.00024549663066864014, -0.00020483136177062988, -0.00016416609287261963, -0.00012350082397460938, -8.283555507659912e-05, -4.217028617858887e-05, -1.5050172805786133e-06, 3.916025161743164e-05, 7.98255205154419e-05, 0.00012049078941345215, 0.0001611560583114624, 0.00020182132720947266, 0.0002424865961074829, 0.00028315186500549316, 0.0003238171339035034, 0.00036448240280151367, 0.0004051476716995239, 0.0004458129405975342, 0.00048647820949554443, 0.0005271434783935547, 0.0005678087472915649, 0.0006084740161895752, 0.0006491392850875854, 0.0006898045539855957, 0.000730469822883606, 0.0007711350917816162, 0.0008118003606796265, 0.0008524656295776367, 0.000893130898475647, 0.0009337961673736572, 0.0009744614362716675, 0.0010151267051696777, 0.001055791974067688, 0.0010964572429656982, 0.0011371225118637085, 0.0011777877807617188]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 5.0, 11.0, 18.0, 24.0, 40.0, 63.0, 68.0, 99.0, 164.0, 255.0, 416.0, 508.0, 833.0, 1184.0, 1856.0, 2713.0, 4356.0, 7138.0, 11728.0, 20075.0, 37048.0, 77321.0, 171492.0, 281777.0, 217384.0, 102336.0, 47785.0, 24495.0, 14333.0, 8429.0, 5075.0, 3242.0, 2100.0, 1304.0, 975.0, 543.0, 422.0, 300.0, 204.0, 134.0, 102.0, 57.0, 46.0, 35.0, 17.0, 13.0, 10.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5, -9.1903076171875, -8.880615234375, -8.5709228515625, -8.26123046875, -7.9515380859375, -7.641845703125, -7.3321533203125, -7.0224609375, -6.7127685546875, -6.403076171875, -6.0933837890625, -5.78369140625, -5.4739990234375, -5.164306640625, -4.8546142578125, -4.544921875, -4.2352294921875, -3.925537109375, -3.6158447265625, -3.30615234375, -2.9964599609375, -2.686767578125, -2.3770751953125, -2.0673828125, -1.7576904296875, -1.447998046875, -1.1383056640625, -0.82861328125, -0.5189208984375, -0.209228515625, 0.1004638671875, 0.41015625, 0.7198486328125, 1.029541015625, 1.3392333984375, 1.64892578125, 1.9586181640625, 2.268310546875, 2.5780029296875, 2.8876953125, 3.1973876953125, 3.507080078125, 3.8167724609375, 4.12646484375, 4.4361572265625, 4.745849609375, 5.0555419921875, 5.365234375, 5.6749267578125, 5.984619140625, 6.2943115234375, 6.60400390625, 6.9136962890625, 7.223388671875, 7.5330810546875, 7.8427734375, 8.1524658203125, 8.462158203125, 8.7718505859375, 9.08154296875, 9.3912353515625, 9.700927734375, 10.0106201171875, 10.3203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 3.0, 7.0, 12.0, 11.0, 18.0, 14.0, 24.0, 40.0, 51.0, 56.0, 82.0, 79.0, 116.0, 98.0, 90.0, 84.0, 42.0, 29.0, 27.0, 16.0, 19.0, 14.0, 8.0, 11.0, 8.0, 9.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.314453125, -2.22161865234375, -2.1287841796875, -2.03594970703125, -1.943115234375, -1.85028076171875, -1.7574462890625, -1.66461181640625, -1.57177734375, -1.47894287109375, -1.3861083984375, -1.29327392578125, -1.200439453125, -1.10760498046875, -1.0147705078125, -0.92193603515625, -0.8291015625, -0.73626708984375, -0.6434326171875, -0.55059814453125, -0.457763671875, -0.36492919921875, -0.2720947265625, -0.17926025390625, -0.08642578125, 0.00640869140625, 0.0992431640625, 0.19207763671875, 0.284912109375, 0.37774658203125, 0.4705810546875, 0.56341552734375, 0.65625, 0.74908447265625, 0.8419189453125, 0.93475341796875, 1.027587890625, 1.12042236328125, 1.2132568359375, 1.30609130859375, 1.39892578125, 1.49176025390625, 1.5845947265625, 1.67742919921875, 1.770263671875, 1.86309814453125, 1.9559326171875, 2.04876708984375, 2.1416015625, 2.23443603515625, 2.3272705078125, 2.42010498046875, 2.512939453125, 2.60577392578125, 2.6986083984375, 2.79144287109375, 2.88427734375, 2.97711181640625, 3.0699462890625, 3.16278076171875, 3.255615234375, 3.34844970703125, 3.4412841796875, 3.53411865234375, 3.626953125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 7.0, 3.0, 4.0, 5.0, 10.0, 11.0, 13.0, 10.0, 23.0, 23.0, 25.0, 33.0, 34.0, 37.0, 59.0, 55.0, 50.0, 70.0, 57.0, 62.0, 56.0, 57.0, 49.0, 37.0, 39.0, 35.0, 27.0, 17.0, 18.0, 18.0, 12.0, 7.0, 10.0, 6.0, 7.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0], "bins": [-15.952945709228516, -15.550568580627441, -15.14819049835205, -14.745813369750977, -14.343436241149902, -13.941058158874512, -13.538681030273438, -13.136302947998047, -12.733925819396973, -12.331548690795898, -11.929170608520508, -11.526793479919434, -11.12441635131836, -10.722038269042969, -10.319661140441895, -9.91728401184082, -9.51490592956543, -9.112528800964355, -8.710150718688965, -8.30777359008789, -7.905395984649658, -7.503018379211426, -7.100641250610352, -6.698263645172119, -6.295886993408203, -5.893509387969971, -5.4911322593688965, -5.088754653930664, -4.686377048492432, -4.283999443054199, -3.881622314453125, -3.4792447090148926, -3.07686710357666, -2.674489736557007, -2.2721121311187744, -1.869734764099121, -1.4673572778701782, -1.0649797916412354, -0.662602424621582, -0.2602248191833496, 0.1421525478363037, 0.5445300340652466, 0.9469074606895447, 1.3492848873138428, 1.7516623735427856, 2.1540398597717285, 2.556417226791382, 2.9587948322296143, 3.3611721992492676, 3.763549566268921, 4.165926933288574, 4.568304538726807, 4.970682144165039, 5.373059272766113, 5.775436878204346, 6.177814483642578, 6.580191612243652, 6.982569217681885, 7.384946346282959, 7.787323951721191, 8.189701080322266, 8.592079162597656, 8.99445629119873, 9.396833419799805, 9.799211502075195]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 1.0, 6.0, 5.0, 16.0, 7.0, 11.0, 14.0, 14.0, 25.0, 23.0, 23.0, 34.0, 38.0, 38.0, 42.0, 37.0, 49.0, 61.0, 53.0, 60.0, 54.0, 62.0, 56.0, 38.0, 34.0, 34.0, 34.0, 25.0, 25.0, 18.0, 10.0, 18.0, 11.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.369500160217285, -8.106168746948242, -7.842837333679199, -7.579505920410156, -7.316174507141113, -7.05284309387207, -6.7895121574401855, -6.526180744171143, -6.2628493309021, -5.999517917633057, -5.736186504364014, -5.472855091094971, -5.209524154663086, -4.946192741394043, -4.682861328125, -4.419529914855957, -4.156198501586914, -3.892867088317871, -3.629535675048828, -3.3662045001983643, -3.1028730869293213, -2.8395416736602783, -2.5762104988098145, -2.3128790855407715, -2.0495476722717285, -1.7862162590026855, -1.5228849649429321, -1.2595536708831787, -0.9962222576141357, -0.7328908443450928, -0.46955955028533936, -0.20622825622558594, 0.05710315704345703, 0.3204345107078552, 0.5837658643722534, 0.8470972180366516, 1.1104285717010498, 1.3737599849700928, 1.6370912790298462, 1.9004225730895996, 2.1637539863586426, 2.4270853996276855, 2.6904168128967285, 2.9537479877471924, 3.2170794010162354, 3.4804108142852783, 3.743741989135742, 4.007073402404785, 4.270404815673828, 4.533736228942871, 4.797067642211914, 5.060399055480957, 5.32373046875, 5.587061882019043, 5.850392818450928, 6.113724231719971, 6.377055644989014, 6.640387058258057, 6.9037184715271, 7.167049884796143, 7.430380821228027, 7.69371223449707, 7.957043647766113, 8.220375061035156, 8.4837064743042]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 11.0, 13.0, 19.0, 37.0, 66.0, 93.0, 143.0, 190.0, 353.0, 573.0, 957.0, 1491.0, 2368.0, 4185.0, 7030.0, 11522.0, 20614.0, 35740.0, 62054.0, 108281.0, 184324.0, 302436.0, 460631.0, 613390.0, 672406.0, 590699.0, 430915.0, 278699.0, 168628.0, 98853.0, 57152.0, 33053.0, 19266.0, 11166.0, 6695.0, 3973.0, 2424.0, 1409.0, 876.0, 563.0, 365.0, 213.0, 143.0, 92.0, 60.0, 48.0, 25.0, 8.0, 10.0, 14.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.5546875, -9.260009765625, -8.96533203125, -8.670654296875, -8.3759765625, -8.081298828125, -7.78662109375, -7.491943359375, -7.197265625, -6.902587890625, -6.60791015625, -6.313232421875, -6.0185546875, -5.723876953125, -5.42919921875, -5.134521484375, -4.83984375, -4.545166015625, -4.25048828125, -3.955810546875, -3.6611328125, -3.366455078125, -3.07177734375, -2.777099609375, -2.482421875, -2.187744140625, -1.89306640625, -1.598388671875, -1.3037109375, -1.009033203125, -0.71435546875, -0.419677734375, -0.125, 0.169677734375, 0.46435546875, 0.759033203125, 1.0537109375, 1.348388671875, 1.64306640625, 1.937744140625, 2.232421875, 2.527099609375, 2.82177734375, 3.116455078125, 3.4111328125, 3.705810546875, 4.00048828125, 4.295166015625, 4.58984375, 4.884521484375, 5.17919921875, 5.473876953125, 5.7685546875, 6.063232421875, 6.35791015625, 6.652587890625, 6.947265625, 7.241943359375, 7.53662109375, 7.831298828125, 8.1259765625, 8.420654296875, 8.71533203125, 9.010009765625, 9.3046875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 4.0, 10.0, 10.0, 10.0, 14.0, 30.0, 18.0, 26.0, 40.0, 23.0, 31.0, 35.0, 57.0, 70.0, 53.0, 61.0, 49.0, 52.0, 60.0, 49.0, 39.0, 49.0, 37.0, 26.0, 28.0, 18.0, 23.0, 15.0, 14.0, 10.0, 6.0, 7.0, 6.0, 6.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.05078125, -6.8372802734375, -6.623779296875, -6.4102783203125, -6.19677734375, -5.9832763671875, -5.769775390625, -5.5562744140625, -5.3427734375, -5.1292724609375, -4.915771484375, -4.7022705078125, -4.48876953125, -4.2752685546875, -4.061767578125, -3.8482666015625, -3.634765625, -3.4212646484375, -3.207763671875, -2.9942626953125, -2.78076171875, -2.5672607421875, -2.353759765625, -2.1402587890625, -1.9267578125, -1.7132568359375, -1.499755859375, -1.2862548828125, -1.07275390625, -0.8592529296875, -0.645751953125, -0.4322509765625, -0.21875, -0.0052490234375, 0.208251953125, 0.4217529296875, 0.63525390625, 0.8487548828125, 1.062255859375, 1.2757568359375, 1.4892578125, 1.7027587890625, 1.916259765625, 2.1297607421875, 2.34326171875, 2.5567626953125, 2.770263671875, 2.9837646484375, 3.197265625, 3.4107666015625, 3.624267578125, 3.8377685546875, 4.05126953125, 4.2647705078125, 4.478271484375, 4.6917724609375, 4.9052734375, 5.1187744140625, 5.332275390625, 5.5457763671875, 5.75927734375, 5.9727783203125, 6.186279296875, 6.3997802734375, 6.61328125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 1.0, 8.0, 9.0, 12.0, 24.0, 36.0, 50.0, 81.0, 127.0, 184.0, 265.0, 445.0, 716.0, 1118.0, 1864.0, 3110.0, 4901.0, 8012.0, 13277.0, 22615.0, 37356.0, 61736.0, 101153.0, 162097.0, 249387.0, 360926.0, 477778.0, 556425.0, 562271.0, 489254.0, 374130.0, 261501.0, 170963.0, 107460.0, 65281.0, 39632.0, 23778.0, 14159.0, 8514.0, 5167.0, 3202.0, 1969.0, 1211.0, 763.0, 506.0, 305.0, 177.0, 120.0, 86.0, 49.0, 33.0, 14.0, 16.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.5968017578125, -8.310791015625, -8.0247802734375, -7.73876953125, -7.4527587890625, -7.166748046875, -6.8807373046875, -6.5947265625, -6.3087158203125, -6.022705078125, -5.7366943359375, -5.45068359375, -5.1646728515625, -4.878662109375, -4.5926513671875, -4.306640625, -4.0206298828125, -3.734619140625, -3.4486083984375, -3.16259765625, -2.8765869140625, -2.590576171875, -2.3045654296875, -2.0185546875, -1.7325439453125, -1.446533203125, -1.1605224609375, -0.87451171875, -0.5885009765625, -0.302490234375, -0.0164794921875, 0.26953125, 0.5555419921875, 0.841552734375, 1.1275634765625, 1.41357421875, 1.6995849609375, 1.985595703125, 2.2716064453125, 2.5576171875, 2.8436279296875, 3.129638671875, 3.4156494140625, 3.70166015625, 3.9876708984375, 4.273681640625, 4.5596923828125, 4.845703125, 5.1317138671875, 5.417724609375, 5.7037353515625, 5.98974609375, 6.2757568359375, 6.561767578125, 6.8477783203125, 7.1337890625, 7.4197998046875, 7.705810546875, 7.9918212890625, 8.27783203125, 8.5638427734375, 8.849853515625, 9.1358642578125, 9.421875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 14.0, 21.0, 28.0, 30.0, 36.0, 46.0, 55.0, 59.0, 63.0, 82.0, 103.0, 137.0, 122.0, 135.0, 142.0, 150.0, 152.0, 185.0, 167.0, 197.0, 221.0, 187.0, 169.0, 168.0, 159.0, 168.0, 144.0, 127.0, 132.0, 96.0, 95.0, 93.0, 64.0, 76.0, 44.0, 39.0, 26.0, 29.0, 27.0, 13.0, 8.0, 12.0, 8.0, 4.0, 3.0, 1.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-3.099609375, -3.007904052734375, -2.91619873046875, -2.824493408203125, -2.7327880859375, -2.641082763671875, -2.54937744140625, -2.457672119140625, -2.365966796875, -2.274261474609375, -2.18255615234375, -2.090850830078125, -1.9991455078125, -1.907440185546875, -1.81573486328125, -1.724029541015625, -1.63232421875, -1.540618896484375, -1.44891357421875, -1.357208251953125, -1.2655029296875, -1.173797607421875, -1.08209228515625, -0.990386962890625, -0.898681640625, -0.806976318359375, -0.71527099609375, -0.623565673828125, -0.5318603515625, -0.440155029296875, -0.34844970703125, -0.256744384765625, -0.1650390625, -0.073333740234375, 0.01837158203125, 0.110076904296875, 0.2017822265625, 0.293487548828125, 0.38519287109375, 0.476898193359375, 0.568603515625, 0.660308837890625, 0.75201416015625, 0.843719482421875, 0.9354248046875, 1.027130126953125, 1.11883544921875, 1.210540771484375, 1.30224609375, 1.393951416015625, 1.48565673828125, 1.577362060546875, 1.6690673828125, 1.760772705078125, 1.85247802734375, 1.944183349609375, 2.035888671875, 2.127593994140625, 2.21929931640625, 2.311004638671875, 2.4027099609375, 2.494415283203125, 2.58612060546875, 2.677825927734375, 2.76953125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 7.0, 7.0, 9.0, 12.0, 8.0, 9.0, 24.0, 17.0, 39.0, 31.0, 36.0, 52.0, 47.0, 56.0, 54.0, 66.0, 84.0, 76.0, 56.0, 51.0, 37.0, 35.0, 35.0, 39.0, 25.0, 15.0, 23.0, 14.0, 10.0, 7.0, 4.0, 3.0, 4.0, 3.0, 5.0, 4.0, 2.0, 2.0], "bins": [-19.686586380004883, -19.21902847290039, -18.75147247314453, -18.28391456604004, -17.816356658935547, -17.348800659179688, -16.881242752075195, -16.413686752319336, -15.946128845214844, -15.478571891784668, -15.011014938354492, -14.54345703125, -14.075900077819824, -13.608343124389648, -13.140785217285156, -12.67322826385498, -12.205671310424805, -11.738114356994629, -11.270557403564453, -10.802999496459961, -10.335442543029785, -9.86788558959961, -9.400327682495117, -8.932770729064941, -8.465213775634766, -7.99765682220459, -7.530099391937256, -7.062541961669922, -6.594985008239746, -6.12742805480957, -5.659870624542236, -5.192313194274902, -4.724756240844727, -4.257199287414551, -3.789641857147217, -3.322084665298462, -2.854527473449707, -2.386970281600952, -1.9194130897521973, -1.4518558979034424, -0.9842987060546875, -0.5167415142059326, -0.049184322357177734, 0.41837286949157715, 0.885930061340332, 1.353487253189087, 1.8210444450378418, 2.2886016368865967, 2.7561588287353516, 3.2237160205841064, 3.6912732124328613, 4.158830642700195, 4.626387596130371, 5.093944549560547, 5.561501979827881, 6.029059410095215, 6.496616363525391, 6.964173316955566, 7.4317307472229, 7.899288177490234, 8.36684513092041, 8.834402084350586, 9.301959991455078, 9.769516944885254, 10.23707389831543]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 15.0, 7.0, 12.0, 17.0, 18.0, 28.0, 20.0, 25.0, 32.0, 48.0, 40.0, 50.0, 42.0, 45.0, 44.0, 57.0, 42.0, 50.0, 49.0, 47.0, 52.0, 53.0, 30.0, 25.0, 28.0, 29.0, 24.0, 15.0, 8.0, 15.0, 8.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.811206817626953, -8.54182243347168, -8.272438049316406, -8.00305461883545, -7.733670234680176, -7.464285850524902, -7.194901466369629, -6.925517559051514, -6.656133651733398, -6.386749267578125, -6.11736536026001, -5.847980976104736, -5.578597068786621, -5.309212684631348, -5.039828300476074, -4.770444393157959, -4.5010600090026855, -4.231675624847412, -3.962291717529297, -3.6929073333740234, -3.423523426055908, -3.1541390419006348, -2.8847548961639404, -2.615370750427246, -2.3459866046905518, -2.0766024589538574, -1.807218313217163, -1.5378340482711792, -1.2684499025344849, -0.9990657567977905, -0.7296814918518066, -0.4602973461151123, -0.19091320037841797, 0.07847097516059875, 0.3478551506996155, 0.6172393560409546, 0.8866235017776489, 1.1560076475143433, 1.4253919124603271, 1.6947760581970215, 1.9641602039337158, 2.23354434967041, 2.5029284954071045, 2.772312641143799, 3.0416970252990723, 3.3110809326171875, 3.580465316772461, 3.8498494625091553, 4.11923360824585, 4.388617992401123, 4.658001899719238, 4.927386283874512, 5.196770191192627, 5.4661545753479, 5.735538482666016, 6.004922866821289, 6.2743072509765625, 6.543691635131836, 6.813075542449951, 7.082459926605225, 7.35184383392334, 7.621228218078613, 7.890612602233887, 8.159996032714844, 8.429380416870117]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 7.0, 17.0, 12.0, 16.0, 20.0, 20.0, 39.0, 54.0, 76.0, 96.0, 129.0, 194.0, 312.0, 435.0, 601.0, 1036.0, 1733.0, 2938.0, 5354.0, 10076.0, 20347.0, 42304.0, 85948.0, 160316.0, 232012.0, 214377.0, 133010.0, 68776.0, 33304.0, 15974.0, 8202.0, 4307.0, 2390.0, 1443.0, 877.0, 554.0, 387.0, 239.0, 157.0, 128.0, 86.0, 81.0, 48.0, 36.0, 23.0, 22.0, 14.0, 13.0, 11.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.767578125, -2.677825927734375, -2.58807373046875, -2.498321533203125, -2.4085693359375, -2.318817138671875, -2.22906494140625, -2.139312744140625, -2.049560546875, -1.959808349609375, -1.87005615234375, -1.780303955078125, -1.6905517578125, -1.600799560546875, -1.51104736328125, -1.421295166015625, -1.33154296875, -1.241790771484375, -1.15203857421875, -1.062286376953125, -0.9725341796875, -0.882781982421875, -0.79302978515625, -0.703277587890625, -0.613525390625, -0.523773193359375, -0.43402099609375, -0.344268798828125, -0.2545166015625, -0.164764404296875, -0.07501220703125, 0.014739990234375, 0.1044921875, 0.194244384765625, 0.28399658203125, 0.373748779296875, 0.4635009765625, 0.553253173828125, 0.64300537109375, 0.732757568359375, 0.822509765625, 0.912261962890625, 1.00201416015625, 1.091766357421875, 1.1815185546875, 1.271270751953125, 1.36102294921875, 1.450775146484375, 1.54052734375, 1.630279541015625, 1.72003173828125, 1.809783935546875, 1.8995361328125, 1.989288330078125, 2.07904052734375, 2.168792724609375, 2.258544921875, 2.348297119140625, 2.43804931640625, 2.527801513671875, 2.6175537109375, 2.707305908203125, 2.79705810546875, 2.886810302734375, 2.9765625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 5.0, 6.0, 15.0, 10.0, 18.0, 18.0, 20.0, 17.0, 33.0, 29.0, 31.0, 38.0, 45.0, 44.0, 42.0, 42.0, 53.0, 47.0, 53.0, 37.0, 47.0, 36.0, 33.0, 39.0, 49.0, 40.0, 32.0, 23.0, 17.0, 17.0, 16.0, 14.0, 13.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.572021484375, -9.28466796875, -8.997314453125, -8.7099609375, -8.422607421875, -8.13525390625, -7.847900390625, -7.560546875, -7.273193359375, -6.98583984375, -6.698486328125, -6.4111328125, -6.123779296875, -5.83642578125, -5.549072265625, -5.26171875, -4.974365234375, -4.68701171875, -4.399658203125, -4.1123046875, -3.824951171875, -3.53759765625, -3.250244140625, -2.962890625, -2.675537109375, -2.38818359375, -2.100830078125, -1.8134765625, -1.526123046875, -1.23876953125, -0.951416015625, -0.6640625, -0.376708984375, -0.08935546875, 0.197998046875, 0.4853515625, 0.772705078125, 1.06005859375, 1.347412109375, 1.634765625, 1.922119140625, 2.20947265625, 2.496826171875, 2.7841796875, 3.071533203125, 3.35888671875, 3.646240234375, 3.93359375, 4.220947265625, 4.50830078125, 4.795654296875, 5.0830078125, 5.370361328125, 5.65771484375, 5.945068359375, 6.232421875, 6.519775390625, 6.80712890625, 7.094482421875, 7.3818359375, 7.669189453125, 7.95654296875, 8.243896484375, 8.53125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 20.0, 26.0, 43.0, 49.0, 93.0, 159.0, 317.0, 599.0, 1180.0, 2619.0, 5919.0, 15354.0, 41876.0, 120165.0, 285612.0, 327301.0, 157450.0, 56017.0, 19887.0, 7666.0, 3203.0, 1460.0, 689.0, 369.0, 173.0, 99.0, 74.0, 39.0, 28.0, 15.0, 11.0, 6.0, 9.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.904296875, -3.765533447265625, -3.62677001953125, -3.488006591796875, -3.3492431640625, -3.210479736328125, -3.07171630859375, -2.932952880859375, -2.794189453125, -2.655426025390625, -2.51666259765625, -2.377899169921875, -2.2391357421875, -2.100372314453125, -1.96160888671875, -1.822845458984375, -1.68408203125, -1.545318603515625, -1.40655517578125, -1.267791748046875, -1.1290283203125, -0.990264892578125, -0.85150146484375, -0.712738037109375, -0.573974609375, -0.435211181640625, -0.29644775390625, -0.157684326171875, -0.0189208984375, 0.119842529296875, 0.25860595703125, 0.397369384765625, 0.5361328125, 0.674896240234375, 0.81365966796875, 0.952423095703125, 1.0911865234375, 1.229949951171875, 1.36871337890625, 1.507476806640625, 1.646240234375, 1.785003662109375, 1.92376708984375, 2.062530517578125, 2.2012939453125, 2.340057373046875, 2.47882080078125, 2.617584228515625, 2.75634765625, 2.895111083984375, 3.03387451171875, 3.172637939453125, 3.3114013671875, 3.450164794921875, 3.58892822265625, 3.727691650390625, 3.866455078125, 4.005218505859375, 4.14398193359375, 4.282745361328125, 4.4215087890625, 4.560272216796875, 4.69903564453125, 4.837799072265625, 4.9765625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 10.0, 9.0, 9.0, 14.0, 12.0, 12.0, 15.0, 37.0, 27.0, 30.0, 38.0, 25.0, 36.0, 33.0, 44.0, 43.0, 43.0, 39.0, 43.0, 48.0, 49.0, 45.0, 34.0, 28.0, 41.0, 32.0, 26.0, 23.0, 28.0, 21.0, 15.0, 16.0, 16.0, 20.0, 8.0, 10.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.51953125, -5.3516845703125, -5.183837890625, -5.0159912109375, -4.84814453125, -4.6802978515625, -4.512451171875, -4.3446044921875, -4.1767578125, -4.0089111328125, -3.841064453125, -3.6732177734375, -3.50537109375, -3.3375244140625, -3.169677734375, -3.0018310546875, -2.833984375, -2.6661376953125, -2.498291015625, -2.3304443359375, -2.16259765625, -1.9947509765625, -1.826904296875, -1.6590576171875, -1.4912109375, -1.3233642578125, -1.155517578125, -0.9876708984375, -0.81982421875, -0.6519775390625, -0.484130859375, -0.3162841796875, -0.1484375, 0.0194091796875, 0.187255859375, 0.3551025390625, 0.52294921875, 0.6907958984375, 0.858642578125, 1.0264892578125, 1.1943359375, 1.3621826171875, 1.530029296875, 1.6978759765625, 1.86572265625, 2.0335693359375, 2.201416015625, 2.3692626953125, 2.537109375, 2.7049560546875, 2.872802734375, 3.0406494140625, 3.20849609375, 3.3763427734375, 3.544189453125, 3.7120361328125, 3.8798828125, 4.0477294921875, 4.215576171875, 4.3834228515625, 4.55126953125, 4.7191162109375, 4.886962890625, 5.0548095703125, 5.22265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 8.0, 14.0, 29.0, 28.0, 60.0, 63.0, 159.0, 266.0, 528.0, 1296.0, 3036.0, 10508.0, 52401.0, 373699.0, 507864.0, 77546.0, 14249.0, 3946.0, 1476.0, 645.0, 322.0, 159.0, 98.0, 57.0, 29.0, 15.0, 16.0, 10.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7919921875, -1.7233428955078125, -1.654693603515625, -1.5860443115234375, -1.51739501953125, -1.4487457275390625, -1.380096435546875, -1.3114471435546875, -1.2427978515625, -1.1741485595703125, -1.105499267578125, -1.0368499755859375, -0.96820068359375, -0.8995513916015625, -0.830902099609375, -0.7622528076171875, -0.693603515625, -0.6249542236328125, -0.556304931640625, -0.4876556396484375, -0.41900634765625, -0.3503570556640625, -0.281707763671875, -0.2130584716796875, -0.1444091796875, -0.0757598876953125, -0.007110595703125, 0.0615386962890625, 0.13018798828125, 0.1988372802734375, 0.267486572265625, 0.3361358642578125, 0.40478515625, 0.4734344482421875, 0.542083740234375, 0.6107330322265625, 0.67938232421875, 0.7480316162109375, 0.816680908203125, 0.8853302001953125, 0.9539794921875, 1.0226287841796875, 1.091278076171875, 1.1599273681640625, 1.22857666015625, 1.2972259521484375, 1.365875244140625, 1.4345245361328125, 1.503173828125, 1.5718231201171875, 1.640472412109375, 1.7091217041015625, 1.77777099609375, 1.8464202880859375, 1.915069580078125, 1.9837188720703125, 2.0523681640625, 2.1210174560546875, 2.189666748046875, 2.2583160400390625, 2.32696533203125, 2.3956146240234375, 2.464263916015625, 2.5329132080078125, 2.6015625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 9.0, 16.0, 17.0, 27.0, 69.0, 86.0, 137.0, 130.0, 139.0, 129.0, 86.0, 57.0, 25.0, 22.0, 18.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010657310485839844, -0.00010303501039743423, -9.949691593647003e-05, -9.595882147550583e-05, -9.242072701454163e-05, -8.888263255357742e-05, -8.534453809261322e-05, -8.180644363164902e-05, -7.826834917068481e-05, -7.473025470972061e-05, -7.119216024875641e-05, -6.76540657877922e-05, -6.4115971326828e-05, -6.05778768658638e-05, -5.70397824048996e-05, -5.3501687943935394e-05, -4.996359348297119e-05, -4.642549902200699e-05, -4.2887404561042786e-05, -3.934931010007858e-05, -3.581121563911438e-05, -3.227312117815018e-05, -2.8735026717185974e-05, -2.519693225622177e-05, -2.165883779525757e-05, -1.8120743334293365e-05, -1.4582648873329163e-05, -1.104455441236496e-05, -7.506459951400757e-06, -3.968365490436554e-06, -4.302710294723511e-07, 3.107823431491852e-06, 6.645917892456055e-06, 1.0184012353420258e-05, 1.372210681438446e-05, 1.7260201275348663e-05, 2.0798295736312866e-05, 2.433639019727707e-05, 2.7874484658241272e-05, 3.1412579119205475e-05, 3.495067358016968e-05, 3.848876804113388e-05, 4.2026862502098083e-05, 4.5564956963062286e-05, 4.910305142402649e-05, 5.264114588499069e-05, 5.6179240345954895e-05, 5.97173348069191e-05, 6.32554292678833e-05, 6.67935237288475e-05, 7.03316181898117e-05, 7.386971265077591e-05, 7.740780711174011e-05, 8.094590157270432e-05, 8.448399603366852e-05, 8.802209049463272e-05, 9.156018495559692e-05, 9.509827941656113e-05, 9.863637387752533e-05, 0.00010217446833848953, 0.00010571256279945374, 0.00010925065726041794, 0.00011278875172138214, 0.00011632684618234634, 0.00011986494064331055]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 8.0, 6.0, 5.0, 10.0, 13.0, 24.0, 17.0, 29.0, 37.0, 49.0, 72.0, 116.0, 138.0, 218.0, 269.0, 421.0, 650.0, 944.0, 1414.0, 2290.0, 3756.0, 6407.0, 11173.0, 21238.0, 42228.0, 87969.0, 174525.0, 264093.0, 208852.0, 109619.0, 52674.0, 26043.0, 13607.0, 7633.0, 4352.0, 2683.0, 1755.0, 1073.0, 627.0, 420.0, 309.0, 236.0, 153.0, 104.0, 87.0, 40.0, 44.0, 29.0, 30.0, 29.0, 16.0, 15.0, 6.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0, -0.967376708984375, -0.93475341796875, -0.902130126953125, -0.8695068359375, -0.836883544921875, -0.80426025390625, -0.771636962890625, -0.739013671875, -0.706390380859375, -0.67376708984375, -0.641143798828125, -0.6085205078125, -0.575897216796875, -0.54327392578125, -0.510650634765625, -0.47802734375, -0.445404052734375, -0.41278076171875, -0.380157470703125, -0.3475341796875, -0.314910888671875, -0.28228759765625, -0.249664306640625, -0.217041015625, -0.184417724609375, -0.15179443359375, -0.119171142578125, -0.0865478515625, -0.053924560546875, -0.02130126953125, 0.011322021484375, 0.0439453125, 0.076568603515625, 0.10919189453125, 0.141815185546875, 0.1744384765625, 0.207061767578125, 0.23968505859375, 0.272308349609375, 0.304931640625, 0.337554931640625, 0.37017822265625, 0.402801513671875, 0.4354248046875, 0.468048095703125, 0.50067138671875, 0.533294677734375, 0.56591796875, 0.598541259765625, 0.63116455078125, 0.663787841796875, 0.6964111328125, 0.729034423828125, 0.76165771484375, 0.794281005859375, 0.826904296875, 0.859527587890625, 0.89215087890625, 0.924774169921875, 0.9573974609375, 0.990020751953125, 1.02264404296875, 1.055267333984375, 1.087890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 8.0, 2.0, 2.0, 15.0, 8.0, 17.0, 7.0, 15.0, 26.0, 37.0, 24.0, 43.0, 36.0, 49.0, 52.0, 47.0, 61.0, 57.0, 59.0, 44.0, 56.0, 42.0, 50.0, 33.0, 39.0, 23.0, 32.0, 20.0, 17.0, 18.0, 8.0, 9.0, 13.0, 10.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18212890625, -0.17623329162597656, -0.17033767700195312, -0.1644420623779297, -0.15854644775390625, -0.1526508331298828, -0.14675521850585938, -0.14085960388183594, -0.1349639892578125, -0.12906837463378906, -0.12317276000976562, -0.11727714538574219, -0.11138153076171875, -0.10548591613769531, -0.09959030151367188, -0.09369468688964844, -0.087799072265625, -0.08190345764160156, -0.07600784301757812, -0.07011222839355469, -0.06421661376953125, -0.05832099914550781, -0.052425384521484375, -0.04652976989746094, -0.0406341552734375, -0.03473854064941406, -0.028842926025390625, -0.022947311401367188, -0.01705169677734375, -0.011156082153320312, -0.005260467529296875, 0.0006351470947265625, 0.00653076171875, 0.012426376342773438, 0.018321990966796875, 0.024217605590820312, 0.03011322021484375, 0.03600883483886719, 0.041904449462890625, 0.04780006408691406, 0.0536956787109375, 0.05959129333496094, 0.06548690795898438, 0.07138252258300781, 0.07727813720703125, 0.08317375183105469, 0.08906936645507812, 0.09496498107910156, 0.100860595703125, 0.10675621032714844, 0.11265182495117188, 0.11854743957519531, 0.12444305419921875, 0.1303386688232422, 0.13623428344726562, 0.14212989807128906, 0.1480255126953125, 0.15392112731933594, 0.15981674194335938, 0.1657123565673828, 0.17160797119140625, 0.1775035858154297, 0.18339920043945312, 0.18929481506347656, 0.1951904296875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 8.0, 4.0, 10.0, 6.0, 12.0, 9.0, 10.0, 20.0, 21.0, 33.0, 39.0, 32.0, 44.0, 49.0, 57.0, 50.0, 69.0, 79.0, 69.0, 62.0, 49.0, 39.0, 33.0, 38.0, 33.0, 34.0, 17.0, 22.0, 17.0, 10.0, 11.0, 4.0, 1.0, 6.0, 1.0, 5.0, 5.0, 2.0, 3.0, 1.0], "bins": [-18.87945556640625, -18.421875, -17.964292526245117, -17.506710052490234, -17.049129486083984, -16.591548919677734, -16.13396644592285, -15.676384925842285, -15.218803405761719, -14.761221885681152, -14.303640365600586, -13.84605884552002, -13.388477325439453, -12.930895805358887, -12.47331428527832, -12.015732765197754, -11.558151245117188, -11.100569725036621, -10.642988204956055, -10.185406684875488, -9.727825164794922, -9.270243644714355, -8.812662124633789, -8.355080604553223, -7.897499084472656, -7.43991756439209, -6.982336044311523, -6.524754524230957, -6.067173004150391, -5.609591484069824, -5.152009963989258, -4.694428443908691, -4.236846923828125, -3.7792654037475586, -3.321683883666992, -2.864102363586426, -2.4065208435058594, -1.948939323425293, -1.4913578033447266, -1.0337762832641602, -0.5761947631835938, -0.11861324310302734, 0.33896827697753906, 0.7965497970581055, 1.2541313171386719, 1.7117128372192383, 2.1692943572998047, 2.626875877380371, 3.0844573974609375, 3.542038917541504, 3.9996204376220703, 4.457201957702637, 4.914783477783203, 5.3723649978637695, 5.829946517944336, 6.287528038024902, 6.745109558105469, 7.202691078186035, 7.660272598266602, 8.117854118347168, 8.575435638427734, 9.0330171585083, 9.490598678588867, 9.948180198669434, 10.40576171875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 15.0, 9.0, 9.0, 19.0, 17.0, 30.0, 17.0, 24.0, 32.0, 43.0, 41.0, 56.0, 35.0, 49.0, 45.0, 56.0, 44.0, 52.0, 40.0, 51.0, 55.0, 52.0, 29.0, 25.0, 32.0, 31.0, 22.0, 16.0, 7.0, 16.0, 10.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.853988647460938, -8.5844144821167, -8.314840316772461, -8.045267105102539, -7.775692939758301, -7.5061187744140625, -7.236545085906982, -6.966971397399902, -6.697397232055664, -6.427823066711426, -6.158249378204346, -5.888675689697266, -5.619101524353027, -5.349527359008789, -5.079953670501709, -4.810379981994629, -4.540805816650391, -4.271231651306152, -4.001657962799072, -3.732084035873413, -3.462510108947754, -3.1929361820220947, -2.9233622550964355, -2.6537883281707764, -2.384214401245117, -2.114640474319458, -1.8450665473937988, -1.5754926204681396, -1.3059186935424805, -1.0363447666168213, -0.7667708396911621, -0.49719691276550293, -0.22762203216552734, 0.041951894760131836, 0.311525821685791, 0.5810997486114502, 0.8506736755371094, 1.1202476024627686, 1.3898215293884277, 1.659395456314087, 1.928969383239746, 2.1985433101654053, 2.4681172370910645, 2.7376911640167236, 3.007265090942383, 3.276839017868042, 3.546412944793701, 3.8159868717193604, 4.0855607986450195, 4.355134963989258, 4.624708652496338, 4.894282341003418, 5.163856506347656, 5.4334306716918945, 5.703004360198975, 5.972578048706055, 6.242152214050293, 6.511726379394531, 6.781300067901611, 7.050873756408691, 7.32044792175293, 7.590022087097168, 7.859595775604248, 8.129169464111328, 8.398743629455566]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 17.0, 26.0, 57.0, 76.0, 103.0, 192.0, 340.0, 462.0, 772.0, 1231.0, 2020.0, 3195.0, 5185.0, 8299.0, 12753.0, 19661.0, 29760.0, 42789.0, 60026.0, 78972.0, 96896.0, 110611.0, 115061.0, 109217.0, 95321.0, 76777.0, 57802.0, 41451.0, 28127.0, 18971.0, 11961.0, 7753.0, 4776.0, 2998.0, 1900.0, 1093.0, 714.0, 420.0, 282.0, 173.0, 106.0, 76.0, 49.0, 34.0, 16.0, 9.0, 11.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69921875, -5.505615234375, -5.31201171875, -5.118408203125, -4.9248046875, -4.731201171875, -4.53759765625, -4.343994140625, -4.150390625, -3.956787109375, -3.76318359375, -3.569580078125, -3.3759765625, -3.182373046875, -2.98876953125, -2.795166015625, -2.6015625, -2.407958984375, -2.21435546875, -2.020751953125, -1.8271484375, -1.633544921875, -1.43994140625, -1.246337890625, -1.052734375, -0.859130859375, -0.66552734375, -0.471923828125, -0.2783203125, -0.084716796875, 0.10888671875, 0.302490234375, 0.49609375, 0.689697265625, 0.88330078125, 1.076904296875, 1.2705078125, 1.464111328125, 1.65771484375, 1.851318359375, 2.044921875, 2.238525390625, 2.43212890625, 2.625732421875, 2.8193359375, 3.012939453125, 3.20654296875, 3.400146484375, 3.59375, 3.787353515625, 3.98095703125, 4.174560546875, 4.3681640625, 4.561767578125, 4.75537109375, 4.948974609375, 5.142578125, 5.336181640625, 5.52978515625, 5.723388671875, 5.9169921875, 6.110595703125, 6.30419921875, 6.497802734375, 6.69140625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 8.0, 7.0, 8.0, 14.0, 15.0, 17.0, 20.0, 23.0, 28.0, 29.0, 39.0, 41.0, 41.0, 51.0, 55.0, 44.0, 53.0, 56.0, 45.0, 42.0, 44.0, 37.0, 47.0, 31.0, 43.0, 35.0, 23.0, 22.0, 22.0, 14.0, 10.0, 7.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -9.021240234375, -8.72998046875, -8.438720703125, -8.1474609375, -7.856201171875, -7.56494140625, -7.273681640625, -6.982421875, -6.691162109375, -6.39990234375, -6.108642578125, -5.8173828125, -5.526123046875, -5.23486328125, -4.943603515625, -4.65234375, -4.361083984375, -4.06982421875, -3.778564453125, -3.4873046875, -3.196044921875, -2.90478515625, -2.613525390625, -2.322265625, -2.031005859375, -1.73974609375, -1.448486328125, -1.1572265625, -0.865966796875, -0.57470703125, -0.283447265625, 0.0078125, 0.299072265625, 0.59033203125, 0.881591796875, 1.1728515625, 1.464111328125, 1.75537109375, 2.046630859375, 2.337890625, 2.629150390625, 2.92041015625, 3.211669921875, 3.5029296875, 3.794189453125, 4.08544921875, 4.376708984375, 4.66796875, 4.959228515625, 5.25048828125, 5.541748046875, 5.8330078125, 6.124267578125, 6.41552734375, 6.706787109375, 6.998046875, 7.289306640625, 7.58056640625, 7.871826171875, 8.1630859375, 8.454345703125, 8.74560546875, 9.036865234375, 9.328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 3.0, 6.0, 22.0, 15.0, 38.0, 55.0, 90.0, 197.0, 274.0, 452.0, 737.0, 1140.0, 1849.0, 3043.0, 4901.0, 7184.0, 10725.0, 16275.0, 24228.0, 34574.0, 47504.0, 62780.0, 79100.0, 93947.0, 103871.0, 105697.0, 100176.0, 87733.0, 72024.0, 57339.0, 42034.0, 30296.0, 20743.0, 13880.0, 9352.0, 6016.0, 3765.0, 2480.0, 1587.0, 921.0, 555.0, 395.0, 207.0, 152.0, 89.0, 50.0, 30.0, 17.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.09344482421875, -4.9134521484375, -4.73345947265625, -4.553466796875, -4.37347412109375, -4.1934814453125, -4.01348876953125, -3.83349609375, -3.65350341796875, -3.4735107421875, -3.29351806640625, -3.113525390625, -2.93353271484375, -2.7535400390625, -2.57354736328125, -2.3935546875, -2.21356201171875, -2.0335693359375, -1.85357666015625, -1.673583984375, -1.49359130859375, -1.3135986328125, -1.13360595703125, -0.95361328125, -0.77362060546875, -0.5936279296875, -0.41363525390625, -0.233642578125, -0.05364990234375, 0.1263427734375, 0.30633544921875, 0.486328125, 0.66632080078125, 0.8463134765625, 1.02630615234375, 1.206298828125, 1.38629150390625, 1.5662841796875, 1.74627685546875, 1.92626953125, 2.10626220703125, 2.2862548828125, 2.46624755859375, 2.646240234375, 2.82623291015625, 3.0062255859375, 3.18621826171875, 3.3662109375, 3.54620361328125, 3.7261962890625, 3.90618896484375, 4.086181640625, 4.26617431640625, 4.4461669921875, 4.62615966796875, 4.80615234375, 4.98614501953125, 5.1661376953125, 5.34613037109375, 5.526123046875, 5.70611572265625, 5.8861083984375, 6.06610107421875, 6.24609375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 2.0, 5.0, 7.0, 7.0, 13.0, 11.0, 15.0, 8.0, 25.0, 19.0, 22.0, 20.0, 24.0, 38.0, 34.0, 34.0, 36.0, 32.0, 46.0, 40.0, 50.0, 48.0, 41.0, 45.0, 30.0, 32.0, 31.0, 30.0, 30.0, 30.0, 23.0, 25.0, 27.0, 14.0, 18.0, 15.0, 12.0, 6.0, 10.0, 10.0, 5.0, 7.0, 6.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.7374267578125, -4.592041015625, -4.4466552734375, -4.30126953125, -4.1558837890625, -4.010498046875, -3.8651123046875, -3.7197265625, -3.5743408203125, -3.428955078125, -3.2835693359375, -3.13818359375, -2.9927978515625, -2.847412109375, -2.7020263671875, -2.556640625, -2.4112548828125, -2.265869140625, -2.1204833984375, -1.97509765625, -1.8297119140625, -1.684326171875, -1.5389404296875, -1.3935546875, -1.2481689453125, -1.102783203125, -0.9573974609375, -0.81201171875, -0.6666259765625, -0.521240234375, -0.3758544921875, -0.23046875, -0.0850830078125, 0.060302734375, 0.2056884765625, 0.35107421875, 0.4964599609375, 0.641845703125, 0.7872314453125, 0.9326171875, 1.0780029296875, 1.223388671875, 1.3687744140625, 1.51416015625, 1.6595458984375, 1.804931640625, 1.9503173828125, 2.095703125, 2.2410888671875, 2.386474609375, 2.5318603515625, 2.67724609375, 2.8226318359375, 2.968017578125, 3.1134033203125, 3.2587890625, 3.4041748046875, 3.549560546875, 3.6949462890625, 3.84033203125, 3.9857177734375, 4.131103515625, 4.2764892578125, 4.421875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 13.0, 27.0, 19.0, 46.0, 62.0, 68.0, 115.0, 150.0, 213.0, 317.0, 468.0, 829.0, 1293.0, 2242.0, 4042.0, 7288.0, 13689.0, 26073.0, 49823.0, 93242.0, 156300.0, 206659.0, 193703.0, 131972.0, 74695.0, 39766.0, 20664.0, 10883.0, 5824.0, 3189.0, 1837.0, 1135.0, 643.0, 417.0, 262.0, 172.0, 108.0, 86.0, 53.0, 42.0, 44.0, 14.0, 13.0, 13.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.6015625, -7.36993408203125, -7.1383056640625, -6.90667724609375, -6.675048828125, -6.44342041015625, -6.2117919921875, -5.98016357421875, -5.74853515625, -5.51690673828125, -5.2852783203125, -5.05364990234375, -4.822021484375, -4.59039306640625, -4.3587646484375, -4.12713623046875, -3.8955078125, -3.66387939453125, -3.4322509765625, -3.20062255859375, -2.968994140625, -2.73736572265625, -2.5057373046875, -2.27410888671875, -2.04248046875, -1.81085205078125, -1.5792236328125, -1.34759521484375, -1.115966796875, -0.88433837890625, -0.6527099609375, -0.42108154296875, -0.189453125, 0.04217529296875, 0.2738037109375, 0.50543212890625, 0.737060546875, 0.96868896484375, 1.2003173828125, 1.43194580078125, 1.66357421875, 1.89520263671875, 2.1268310546875, 2.35845947265625, 2.590087890625, 2.82171630859375, 3.0533447265625, 3.28497314453125, 3.5166015625, 3.74822998046875, 3.9798583984375, 4.21148681640625, 4.443115234375, 4.67474365234375, 4.9063720703125, 5.13800048828125, 5.36962890625, 5.60125732421875, 5.8328857421875, 6.06451416015625, 6.296142578125, 6.52777099609375, 6.7593994140625, 6.99102783203125, 7.22265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 10.0, 4.0, 7.0, 8.0, 17.0, 21.0, 30.0, 32.0, 30.0, 36.0, 60.0, 51.0, 56.0, 66.0, 55.0, 66.0, 71.0, 63.0, 40.0, 54.0, 47.0, 36.0, 26.0, 21.0, 15.0, 15.0, 10.0, 8.0, 8.0, 8.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005731582641601562, -0.0005551949143409729, -0.0005372315645217896, -0.0005192682147026062, -0.0005013048648834229, -0.0004833415150642395, -0.00046537816524505615, -0.0004474148154258728, -0.00042945146560668945, -0.0004114881157875061, -0.00039352476596832275, -0.0003755614161491394, -0.00035759806632995605, -0.0003396347165107727, -0.00032167136669158936, -0.000303708016872406, -0.00028574466705322266, -0.0002677813172340393, -0.00024981796741485596, -0.0002318546175956726, -0.00021389126777648926, -0.0001959279179573059, -0.00017796456813812256, -0.0001600012183189392, -0.00014203786849975586, -0.0001240745186805725, -0.00010611116886138916, -8.814781904220581e-05, -7.018446922302246e-05, -5.222111940383911e-05, -3.425776958465576e-05, -1.6294419765472412e-05, 1.6689300537109375e-06, 1.9632279872894287e-05, 3.759562969207764e-05, 5.5558979511260986e-05, 7.352232933044434e-05, 9.148567914962769e-05, 0.00010944902896881104, 0.00012741237878799438, 0.00014537572860717773, 0.00016333907842636108, 0.00018130242824554443, 0.00019926577806472778, 0.00021722912788391113, 0.00023519247770309448, 0.00025315582752227783, 0.0002711191773414612, 0.00028908252716064453, 0.0003070458769798279, 0.00032500922679901123, 0.0003429725766181946, 0.00036093592643737793, 0.0003788992762565613, 0.00039686262607574463, 0.000414825975894928, 0.00043278932571411133, 0.0004507526755332947, 0.00046871602535247803, 0.0004866793751716614, 0.0005046427249908447, 0.0005226060748100281, 0.0005405694246292114, 0.0005585327744483948, 0.0005764961242675781]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 27.0, 21.0, 31.0, 42.0, 71.0, 122.0, 179.0, 295.0, 588.0, 1153.0, 2272.0, 4768.0, 9877.0, 21897.0, 48417.0, 103192.0, 187644.0, 245429.0, 202457.0, 116586.0, 55918.0, 25423.0, 11358.0, 5242.0, 2625.0, 1343.0, 633.0, 368.0, 210.0, 123.0, 77.0, 55.0, 25.0, 27.0, 14.0, 16.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0546875, -7.782470703125, -7.51025390625, -7.238037109375, -6.9658203125, -6.693603515625, -6.42138671875, -6.149169921875, -5.876953125, -5.604736328125, -5.33251953125, -5.060302734375, -4.7880859375, -4.515869140625, -4.24365234375, -3.971435546875, -3.69921875, -3.427001953125, -3.15478515625, -2.882568359375, -2.6103515625, -2.338134765625, -2.06591796875, -1.793701171875, -1.521484375, -1.249267578125, -0.97705078125, -0.704833984375, -0.4326171875, -0.160400390625, 0.11181640625, 0.384033203125, 0.65625, 0.928466796875, 1.20068359375, 1.472900390625, 1.7451171875, 2.017333984375, 2.28955078125, 2.561767578125, 2.833984375, 3.106201171875, 3.37841796875, 3.650634765625, 3.9228515625, 4.195068359375, 4.46728515625, 4.739501953125, 5.01171875, 5.283935546875, 5.55615234375, 5.828369140625, 6.1005859375, 6.372802734375, 6.64501953125, 6.917236328125, 7.189453125, 7.461669921875, 7.73388671875, 8.006103515625, 8.2783203125, 8.550537109375, 8.82275390625, 9.094970703125, 9.3671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 19.0, 13.0, 26.0, 21.0, 38.0, 42.0, 41.0, 51.0, 62.0, 62.0, 65.0, 68.0, 69.0, 61.0, 41.0, 63.0, 49.0, 42.0, 37.0, 28.0, 22.0, 14.0, 7.0, 11.0, 4.0, 5.0, 6.0, 2.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5234375, -1.467864990234375, -1.41229248046875, -1.356719970703125, -1.3011474609375, -1.245574951171875, -1.19000244140625, -1.134429931640625, -1.078857421875, -1.023284912109375, -0.96771240234375, -0.912139892578125, -0.8565673828125, -0.800994873046875, -0.74542236328125, -0.689849853515625, -0.63427734375, -0.578704833984375, -0.52313232421875, -0.467559814453125, -0.4119873046875, -0.356414794921875, -0.30084228515625, -0.245269775390625, -0.189697265625, -0.134124755859375, -0.07855224609375, -0.022979736328125, 0.0325927734375, 0.088165283203125, 0.14373779296875, 0.199310302734375, 0.2548828125, 0.310455322265625, 0.36602783203125, 0.421600341796875, 0.4771728515625, 0.532745361328125, 0.58831787109375, 0.643890380859375, 0.699462890625, 0.755035400390625, 0.81060791015625, 0.866180419921875, 0.9217529296875, 0.977325439453125, 1.03289794921875, 1.088470458984375, 1.14404296875, 1.199615478515625, 1.25518798828125, 1.310760498046875, 1.3663330078125, 1.421905517578125, 1.47747802734375, 1.533050537109375, 1.588623046875, 1.644195556640625, 1.69976806640625, 1.755340576171875, 1.8109130859375, 1.866485595703125, 1.92205810546875, 1.977630615234375, 2.033203125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 5.0, 8.0, 11.0, 16.0, 19.0, 24.0, 21.0, 35.0, 47.0, 34.0, 51.0, 64.0, 44.0, 59.0, 85.0, 79.0, 58.0, 65.0, 44.0, 41.0, 36.0, 36.0, 24.0, 26.0, 18.0, 10.0, 14.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-19.812416076660156, -19.31037139892578, -18.808324813842773, -18.3062801361084, -17.80423355102539, -17.302188873291016, -16.80014419555664, -16.298097610473633, -15.796052932739258, -15.294007301330566, -14.791961669921875, -14.2899169921875, -13.787871360778809, -13.285825729370117, -12.783781051635742, -12.28173542022705, -11.77968978881836, -11.277644157409668, -10.775598526000977, -10.273553848266602, -9.77150821685791, -9.269462585449219, -8.767417907714844, -8.265372276306152, -7.763326644897461, -7.2612810134887695, -6.759235858917236, -6.257190704345703, -5.755145072937012, -5.25309944152832, -4.751054286956787, -4.249009132385254, -3.7469654083251953, -3.244920015335083, -2.7428746223449707, -2.2408292293548584, -1.738783836364746, -1.2367384433746338, -0.7346930503845215, -0.23264765739440918, 0.2693977355957031, 0.7714431285858154, 1.2734885215759277, 1.77553391456604, 2.2775793075561523, 2.7796247005462646, 3.281670093536377, 3.7837154865264893, 4.285760879516602, 4.787806510925293, 5.289851665496826, 5.791896820068359, 6.293942451477051, 6.795988082885742, 7.298033237457275, 7.800078392028809, 8.3021240234375, 8.804169654846191, 9.306215286254883, 9.808259963989258, 10.31030559539795, 10.81235122680664, 11.314395904541016, 11.816441535949707, 12.318487167358398]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 9.0, 4.0, 7.0, 7.0, 4.0, 12.0, 15.0, 15.0, 21.0, 20.0, 20.0, 23.0, 31.0, 31.0, 30.0, 39.0, 40.0, 36.0, 46.0, 44.0, 48.0, 44.0, 36.0, 39.0, 43.0, 36.0, 44.0, 34.0, 39.0, 30.0, 24.0, 23.0, 23.0, 15.0, 9.0, 10.0, 11.0, 12.0, 8.0, 4.0, 7.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.02529239654541, -7.781941890716553, -7.538591384887695, -7.295241355895996, -7.051890850067139, -6.808540344238281, -6.565189838409424, -6.321839332580566, -6.078489303588867, -5.83513879776001, -5.591788291931152, -5.348438262939453, -5.105087757110596, -4.861737251281738, -4.618386745452881, -4.375036239624023, -4.131685733795166, -3.8883352279663086, -3.6449849605560303, -3.401634454727173, -3.1582841873168945, -2.914933681488037, -2.6715831756591797, -2.4282326698303223, -2.184882402420044, -1.941532015800476, -1.6981816291809082, -1.4548311233520508, -1.211480736732483, -0.968130350112915, -0.7247798442840576, -0.48142945766448975, -0.23807954788208008, 0.005270868539810181, 0.24862128496170044, 0.4919717311859131, 0.735322117805481, 0.9786725044250488, 1.2220230102539062, 1.4653733968734741, 1.708723783493042, 1.9520741701126099, 2.1954245567321777, 2.438775062561035, 2.6821255683898926, 2.925475835800171, 3.1688263416290283, 3.4121766090393066, 3.655527114868164, 3.8988776206970215, 4.142228126525879, 4.385578155517578, 4.6289286613464355, 4.872279167175293, 5.11562967300415, 5.358980178833008, 5.602330207824707, 5.8456807136535645, 6.089031219482422, 6.332381248474121, 6.5757317543029785, 6.819082260131836, 7.062432765960693, 7.305783271789551, 7.549133777618408]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 10.0, 11.0, 32.0, 42.0, 70.0, 104.0, 181.0, 333.0, 567.0, 951.0, 1540.0, 2696.0, 4460.0, 7692.0, 13133.0, 22447.0, 38760.0, 66378.0, 112712.0, 187095.0, 299944.0, 442803.0, 579221.0, 639988.0, 578579.0, 442726.0, 298639.0, 186166.0, 110875.0, 65112.0, 37987.0, 21852.0, 12813.0, 7441.0, 4358.0, 2582.0, 1608.0, 906.0, 570.0, 339.0, 231.0, 110.0, 91.0, 55.0, 25.0, 11.0, 20.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.01953125, -8.703125, -8.38671875, -8.0703125, -7.75390625, -7.4375, -7.12109375, -6.8046875, -6.48828125, -6.171875, -5.85546875, -5.5390625, -5.22265625, -4.90625, -4.58984375, -4.2734375, -3.95703125, -3.640625, -3.32421875, -3.0078125, -2.69140625, -2.375, -2.05859375, -1.7421875, -1.42578125, -1.109375, -0.79296875, -0.4765625, -0.16015625, 0.15625, 0.47265625, 0.7890625, 1.10546875, 1.421875, 1.73828125, 2.0546875, 2.37109375, 2.6875, 3.00390625, 3.3203125, 3.63671875, 3.953125, 4.26953125, 4.5859375, 4.90234375, 5.21875, 5.53515625, 5.8515625, 6.16796875, 6.484375, 6.80078125, 7.1171875, 7.43359375, 7.75, 8.06640625, 8.3828125, 8.69921875, 9.015625, 9.33203125, 9.6484375, 9.96484375, 10.28125, 10.59765625, 10.9140625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 5.0, 3.0, 5.0, 14.0, 9.0, 5.0, 7.0, 9.0, 22.0, 18.0, 18.0, 21.0, 34.0, 20.0, 34.0, 39.0, 33.0, 37.0, 38.0, 41.0, 42.0, 55.0, 46.0, 39.0, 37.0, 39.0, 28.0, 38.0, 35.0, 19.0, 34.0, 33.0, 21.0, 24.0, 14.0, 19.0, 11.0, 14.0, 8.0, 12.0, 5.0, 4.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84765625, -5.65966796875, -5.4716796875, -5.28369140625, -5.095703125, -4.90771484375, -4.7197265625, -4.53173828125, -4.34375, -4.15576171875, -3.9677734375, -3.77978515625, -3.591796875, -3.40380859375, -3.2158203125, -3.02783203125, -2.83984375, -2.65185546875, -2.4638671875, -2.27587890625, -2.087890625, -1.89990234375, -1.7119140625, -1.52392578125, -1.3359375, -1.14794921875, -0.9599609375, -0.77197265625, -0.583984375, -0.39599609375, -0.2080078125, -0.02001953125, 0.16796875, 0.35595703125, 0.5439453125, 0.73193359375, 0.919921875, 1.10791015625, 1.2958984375, 1.48388671875, 1.671875, 1.85986328125, 2.0478515625, 2.23583984375, 2.423828125, 2.61181640625, 2.7998046875, 2.98779296875, 3.17578125, 3.36376953125, 3.5517578125, 3.73974609375, 3.927734375, 4.11572265625, 4.3037109375, 4.49169921875, 4.6796875, 4.86767578125, 5.0556640625, 5.24365234375, 5.431640625, 5.61962890625, 5.8076171875, 5.99560546875, 6.18359375]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 9.0, 10.0, 13.0, 15.0, 32.0, 71.0, 83.0, 153.0, 260.0, 442.0, 709.0, 1167.0, 1926.0, 3273.0, 5520.0, 9455.0, 16186.0, 27149.0, 45365.0, 76046.0, 124120.0, 194248.0, 291176.0, 405577.0, 509456.0, 560102.0, 536801.0, 446846.0, 334401.0, 228021.0, 147352.0, 91588.0, 55598.0, 33142.0, 19664.0, 11623.0, 6713.0, 3970.0, 2351.0, 1422.0, 892.0, 543.0, 292.0, 197.0, 125.0, 56.0, 54.0, 33.0, 17.0, 16.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.464111328125, -8.14697265625, -7.829833984375, -7.5126953125, -7.195556640625, -6.87841796875, -6.561279296875, -6.244140625, -5.927001953125, -5.60986328125, -5.292724609375, -4.9755859375, -4.658447265625, -4.34130859375, -4.024169921875, -3.70703125, -3.389892578125, -3.07275390625, -2.755615234375, -2.4384765625, -2.121337890625, -1.80419921875, -1.487060546875, -1.169921875, -0.852783203125, -0.53564453125, -0.218505859375, 0.0986328125, 0.415771484375, 0.73291015625, 1.050048828125, 1.3671875, 1.684326171875, 2.00146484375, 2.318603515625, 2.6357421875, 2.952880859375, 3.27001953125, 3.587158203125, 3.904296875, 4.221435546875, 4.53857421875, 4.855712890625, 5.1728515625, 5.489990234375, 5.80712890625, 6.124267578125, 6.44140625, 6.758544921875, 7.07568359375, 7.392822265625, 7.7099609375, 8.027099609375, 8.34423828125, 8.661376953125, 8.978515625, 9.295654296875, 9.61279296875, 9.929931640625, 10.2470703125, 10.564208984375, 10.88134765625, 11.198486328125, 11.515625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 14.0, 12.0, 13.0, 19.0, 35.0, 32.0, 49.0, 51.0, 51.0, 79.0, 80.0, 109.0, 108.0, 145.0, 163.0, 155.0, 177.0, 192.0, 206.0, 219.0, 212.0, 197.0, 222.0, 199.0, 189.0, 181.0, 150.0, 145.0, 115.0, 97.0, 87.0, 89.0, 55.0, 43.0, 46.0, 28.0, 31.0, 23.0, 14.0, 8.0, 11.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-3.974609375, -3.86224365234375, -3.7498779296875, -3.63751220703125, -3.525146484375, -3.41278076171875, -3.3004150390625, -3.18804931640625, -3.07568359375, -2.96331787109375, -2.8509521484375, -2.73858642578125, -2.626220703125, -2.51385498046875, -2.4014892578125, -2.28912353515625, -2.1767578125, -2.06439208984375, -1.9520263671875, -1.83966064453125, -1.727294921875, -1.61492919921875, -1.5025634765625, -1.39019775390625, -1.27783203125, -1.16546630859375, -1.0531005859375, -0.94073486328125, -0.828369140625, -0.71600341796875, -0.6036376953125, -0.49127197265625, -0.37890625, -0.26654052734375, -0.1541748046875, -0.04180908203125, 0.070556640625, 0.18292236328125, 0.2952880859375, 0.40765380859375, 0.52001953125, 0.63238525390625, 0.7447509765625, 0.85711669921875, 0.969482421875, 1.08184814453125, 1.1942138671875, 1.30657958984375, 1.4189453125, 1.53131103515625, 1.6436767578125, 1.75604248046875, 1.868408203125, 1.98077392578125, 2.0931396484375, 2.20550537109375, 2.31787109375, 2.43023681640625, 2.5426025390625, 2.65496826171875, 2.767333984375, 2.87969970703125, 2.9920654296875, 3.10443115234375, 3.216796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 6.0, 8.0, 12.0, 18.0, 20.0, 19.0, 37.0, 28.0, 37.0, 45.0, 51.0, 69.0, 65.0, 62.0, 61.0, 63.0, 59.0, 56.0, 37.0, 45.0, 34.0, 30.0, 37.0, 16.0, 19.0, 16.0, 8.0, 10.0, 8.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-18.870746612548828, -18.36263656616211, -17.85452651977539, -17.346418380737305, -16.838308334350586, -16.330198287963867, -15.822088241577148, -15.31397819519043, -14.805869102478027, -14.297759056091309, -13.789649963378906, -13.281539916992188, -12.773429870605469, -12.265320777893066, -11.757210731506348, -11.249101638793945, -10.740991592407227, -10.232881546020508, -9.724772453308105, -9.216662406921387, -8.708553314208984, -8.200443267822266, -7.692333221435547, -7.184223651885986, -6.676114082336426, -6.168004512786865, -5.659894943237305, -5.151784896850586, -4.643675327301025, -4.135565757751465, -3.627455949783325, -3.1193461418151855, -2.6112356185913086, -2.103126049041748, -1.5950162410736084, -1.0869065523147583, -0.5787968635559082, -0.07068729400634766, 0.437422513961792, 0.9455323219299316, 1.4536418914794922, 1.9617515802383423, 2.4698612689971924, 2.977971076965332, 3.4860806465148926, 3.994190216064453, 4.502300262451172, 5.010409832000732, 5.518519401550293, 6.0266289710998535, 6.534738540649414, 7.042848587036133, 7.550958156585693, 8.059067726135254, 8.567177772521973, 9.075286865234375, 9.583396911621094, 10.091506958007812, 10.599616050720215, 11.107726097106934, 11.615835189819336, 12.123945236206055, 12.632055282592773, 13.140165328979492, 13.648274421691895]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 3.0, 4.0, 6.0, 14.0, 8.0, 16.0, 15.0, 19.0, 14.0, 23.0, 31.0, 24.0, 21.0, 37.0, 38.0, 52.0, 47.0, 39.0, 39.0, 31.0, 45.0, 50.0, 58.0, 35.0, 41.0, 39.0, 30.0, 32.0, 37.0, 31.0, 23.0, 17.0, 16.0, 10.0, 12.0, 8.0, 12.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.106224060058594, -7.842144012451172, -7.578064441680908, -7.313984394073486, -7.049904823303223, -6.785824775695801, -6.521744728088379, -6.257665157318115, -5.993585586547852, -5.72950553894043, -5.465425968170166, -5.201345920562744, -4.9372663497924805, -4.673186302185059, -4.409106254577637, -4.145026683807373, -3.880946636199951, -3.6168668270111084, -3.3527870178222656, -3.0887069702148438, -2.82462739944458, -2.560547351837158, -2.2964675426483154, -2.0323877334594727, -1.7683079242706299, -1.504228115081787, -1.2401483058929443, -0.976068377494812, -0.7119885683059692, -0.44790875911712646, -0.18382883071899414, 0.08025097846984863, 0.3443307876586914, 0.6084105968475342, 0.8724904656410217, 1.1365703344345093, 1.400650143623352, 1.6647299528121948, 1.9288098812103271, 2.19288969039917, 2.4569694995880127, 2.7210493087768555, 2.9851291179656982, 3.249208927154541, 3.513288974761963, 3.7773685455322266, 4.041448593139648, 4.30552864074707, 4.569608211517334, 4.833688259124756, 5.0977678298950195, 5.361847877502441, 5.625927448272705, 5.890007495880127, 6.154087066650391, 6.4181671142578125, 6.682247161865234, 6.946327209472656, 7.21040678024292, 7.474486827850342, 7.7385663986206055, 8.002646446228027, 8.26672649383545, 8.530805587768555, 8.794885635375977]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 8.0, 3.0, 6.0, 13.0, 13.0, 25.0, 32.0, 61.0, 106.0, 158.0, 254.0, 371.0, 545.0, 925.0, 1456.0, 2231.0, 3477.0, 5326.0, 8494.0, 13332.0, 20400.0, 31636.0, 48530.0, 71502.0, 100776.0, 129714.0, 144254.0, 133664.0, 106370.0, 76663.0, 52178.0, 34174.0, 22023.0, 14446.0, 9105.0, 5762.0, 3865.0, 2435.0, 1509.0, 945.0, 629.0, 432.0, 239.0, 178.0, 109.0, 72.0, 44.0, 26.0, 16.0, 10.0, 8.0, 4.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.724609375, -1.66632080078125, -1.6080322265625, -1.54974365234375, -1.491455078125, -1.43316650390625, -1.3748779296875, -1.31658935546875, -1.25830078125, -1.20001220703125, -1.1417236328125, -1.08343505859375, -1.025146484375, -0.96685791015625, -0.9085693359375, -0.85028076171875, -0.7919921875, -0.73370361328125, -0.6754150390625, -0.61712646484375, -0.558837890625, -0.50054931640625, -0.4422607421875, -0.38397216796875, -0.32568359375, -0.26739501953125, -0.2091064453125, -0.15081787109375, -0.092529296875, -0.03424072265625, 0.0240478515625, 0.08233642578125, 0.140625, 0.19891357421875, 0.2572021484375, 0.31549072265625, 0.373779296875, 0.43206787109375, 0.4903564453125, 0.54864501953125, 0.60693359375, 0.66522216796875, 0.7235107421875, 0.78179931640625, 0.840087890625, 0.89837646484375, 0.9566650390625, 1.01495361328125, 1.0732421875, 1.13153076171875, 1.1898193359375, 1.24810791015625, 1.306396484375, 1.36468505859375, 1.4229736328125, 1.48126220703125, 1.53955078125, 1.59783935546875, 1.6561279296875, 1.71441650390625, 1.772705078125, 1.83099365234375, 1.8892822265625, 1.94757080078125, 2.005859375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 8.0, 11.0, 15.0, 14.0, 22.0, 26.0, 20.0, 26.0, 23.0, 31.0, 28.0, 37.0, 39.0, 43.0, 46.0, 53.0, 38.0, 38.0, 44.0, 47.0, 35.0, 32.0, 26.0, 34.0, 31.0, 40.0, 22.0, 20.0, 19.0, 24.0, 17.0, 13.0, 8.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.852294921875, -7.57958984375, -7.306884765625, -7.0341796875, -6.761474609375, -6.48876953125, -6.216064453125, -5.943359375, -5.670654296875, -5.39794921875, -5.125244140625, -4.8525390625, -4.579833984375, -4.30712890625, -4.034423828125, -3.76171875, -3.489013671875, -3.21630859375, -2.943603515625, -2.6708984375, -2.398193359375, -2.12548828125, -1.852783203125, -1.580078125, -1.307373046875, -1.03466796875, -0.761962890625, -0.4892578125, -0.216552734375, 0.05615234375, 0.328857421875, 0.6015625, 0.874267578125, 1.14697265625, 1.419677734375, 1.6923828125, 1.965087890625, 2.23779296875, 2.510498046875, 2.783203125, 3.055908203125, 3.32861328125, 3.601318359375, 3.8740234375, 4.146728515625, 4.41943359375, 4.692138671875, 4.96484375, 5.237548828125, 5.51025390625, 5.782958984375, 6.0556640625, 6.328369140625, 6.60107421875, 6.873779296875, 7.146484375, 7.419189453125, 7.69189453125, 7.964599609375, 8.2373046875, 8.510009765625, 8.78271484375, 9.055419921875, 9.328125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 11.0, 17.0, 12.0, 37.0, 33.0, 41.0, 69.0, 116.0, 183.0, 266.0, 413.0, 708.0, 1181.0, 1840.0, 3211.0, 5327.0, 9218.0, 16257.0, 29672.0, 52649.0, 91296.0, 145971.0, 193331.0, 183820.0, 130070.0, 78942.0, 45172.0, 24971.0, 14140.0, 7874.0, 4626.0, 2728.0, 1644.0, 971.0, 654.0, 411.0, 210.0, 143.0, 98.0, 76.0, 37.0, 31.0, 20.0, 21.0, 11.0, 9.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.78515625, -2.702911376953125, -2.62066650390625, -2.538421630859375, -2.4561767578125, -2.373931884765625, -2.29168701171875, -2.209442138671875, -2.127197265625, -2.044952392578125, -1.96270751953125, -1.880462646484375, -1.7982177734375, -1.715972900390625, -1.63372802734375, -1.551483154296875, -1.46923828125, -1.386993408203125, -1.30474853515625, -1.222503662109375, -1.1402587890625, -1.058013916015625, -0.97576904296875, -0.893524169921875, -0.811279296875, -0.729034423828125, -0.64678955078125, -0.564544677734375, -0.4822998046875, -0.400054931640625, -0.31781005859375, -0.235565185546875, -0.1533203125, -0.071075439453125, 0.01116943359375, 0.093414306640625, 0.1756591796875, 0.257904052734375, 0.34014892578125, 0.422393798828125, 0.504638671875, 0.586883544921875, 0.66912841796875, 0.751373291015625, 0.8336181640625, 0.915863037109375, 0.99810791015625, 1.080352783203125, 1.16259765625, 1.244842529296875, 1.32708740234375, 1.409332275390625, 1.4915771484375, 1.573822021484375, 1.65606689453125, 1.738311767578125, 1.820556640625, 1.902801513671875, 1.98504638671875, 2.067291259765625, 2.1495361328125, 2.231781005859375, 2.31402587890625, 2.396270751953125, 2.478515625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 7.0, 7.0, 6.0, 6.0, 14.0, 13.0, 15.0, 8.0, 27.0, 15.0, 19.0, 22.0, 32.0, 27.0, 29.0, 33.0, 26.0, 40.0, 48.0, 44.0, 42.0, 41.0, 46.0, 45.0, 50.0, 32.0, 32.0, 43.0, 42.0, 28.0, 28.0, 27.0, 12.0, 14.0, 18.0, 10.0, 7.0, 12.0, 7.0, 8.0, 7.0, 5.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-6.01953125, -5.84869384765625, -5.6778564453125, -5.50701904296875, -5.336181640625, -5.16534423828125, -4.9945068359375, -4.82366943359375, -4.65283203125, -4.48199462890625, -4.3111572265625, -4.14031982421875, -3.969482421875, -3.79864501953125, -3.6278076171875, -3.45697021484375, -3.2861328125, -3.11529541015625, -2.9444580078125, -2.77362060546875, -2.602783203125, -2.43194580078125, -2.2611083984375, -2.09027099609375, -1.91943359375, -1.74859619140625, -1.5777587890625, -1.40692138671875, -1.236083984375, -1.06524658203125, -0.8944091796875, -0.72357177734375, -0.552734375, -0.38189697265625, -0.2110595703125, -0.04022216796875, 0.130615234375, 0.30145263671875, 0.4722900390625, 0.64312744140625, 0.81396484375, 0.98480224609375, 1.1556396484375, 1.32647705078125, 1.497314453125, 1.66815185546875, 1.8389892578125, 2.00982666015625, 2.1806640625, 2.35150146484375, 2.5223388671875, 2.69317626953125, 2.864013671875, 3.03485107421875, 3.2056884765625, 3.37652587890625, 3.54736328125, 3.71820068359375, 3.8890380859375, 4.05987548828125, 4.230712890625, 4.40155029296875, 4.5723876953125, 4.74322509765625, 4.9140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 12.0, 18.0, 18.0, 33.0, 45.0, 59.0, 122.0, 181.0, 251.0, 420.0, 714.0, 1172.0, 2175.0, 3755.0, 7233.0, 14819.0, 31654.0, 68889.0, 147283.0, 263185.0, 251216.0, 135409.0, 62772.0, 28640.0, 13404.0, 6713.0, 3565.0, 1896.0, 1158.0, 672.0, 359.0, 257.0, 160.0, 101.0, 67.0, 33.0, 31.0, 20.0, 19.0, 10.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8056640625, -0.7778244018554688, -0.7499847412109375, -0.7221450805664062, -0.694305419921875, -0.6664657592773438, -0.6386260986328125, -0.6107864379882812, -0.58294677734375, -0.5551071166992188, -0.5272674560546875, -0.49942779541015625, -0.471588134765625, -0.44374847412109375, -0.4159088134765625, -0.38806915283203125, -0.3602294921875, -0.33238983154296875, -0.3045501708984375, -0.27671051025390625, -0.248870849609375, -0.22103118896484375, -0.1931915283203125, -0.16535186767578125, -0.13751220703125, -0.10967254638671875, -0.0818328857421875, -0.05399322509765625, -0.026153564453125, 0.00168609619140625, 0.0295257568359375, 0.05736541748046875, 0.085205078125, 0.11304473876953125, 0.1408843994140625, 0.16872406005859375, 0.196563720703125, 0.22440338134765625, 0.2522430419921875, 0.28008270263671875, 0.30792236328125, 0.33576202392578125, 0.3636016845703125, 0.39144134521484375, 0.419281005859375, 0.44712066650390625, 0.4749603271484375, 0.5027999877929688, 0.5306396484375, 0.5584793090820312, 0.5863189697265625, 0.6141586303710938, 0.641998291015625, 0.6698379516601562, 0.6976776123046875, 0.7255172729492188, 0.75335693359375, 0.7811965942382812, 0.8090362548828125, 0.8368759155273438, 0.864715576171875, 0.8925552368164062, 0.9203948974609375, 0.9482345581054688, 0.97607421875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 11.0, 12.0, 8.0, 21.0, 22.0, 27.0, 34.0, 41.0, 38.0, 60.0, 62.0, 67.0, 62.0, 76.0, 74.0, 54.0, 60.0, 45.0, 40.0, 36.0, 28.0, 21.0, 24.0, 15.0, 14.0, 16.0, 8.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.210803985595703e-05, -6.0335732996463776e-05, -5.856342613697052e-05, -5.6791119277477264e-05, -5.501881241798401e-05, -5.324650555849075e-05, -5.14741986989975e-05, -4.970189183950424e-05, -4.7929584980010986e-05, -4.615727812051773e-05, -4.4384971261024475e-05, -4.261266440153122e-05, -4.0840357542037964e-05, -3.906805068254471e-05, -3.729574382305145e-05, -3.55234369635582e-05, -3.375113010406494e-05, -3.1978823244571686e-05, -3.020651638507843e-05, -2.8434209525585175e-05, -2.666190266609192e-05, -2.4889595806598663e-05, -2.3117288947105408e-05, -2.1344982087612152e-05, -1.9572675228118896e-05, -1.780036836862564e-05, -1.6028061509132385e-05, -1.425575464963913e-05, -1.2483447790145874e-05, -1.0711140930652618e-05, -8.938834071159363e-06, -7.166527211666107e-06, -5.3942203521728516e-06, -3.621913492679596e-06, -1.8496066331863403e-06, -7.729977369308472e-08, 1.695007085800171e-06, 3.4673139452934265e-06, 5.239620804786682e-06, 7.011927664279938e-06, 8.784234523773193e-06, 1.0556541383266449e-05, 1.2328848242759705e-05, 1.410115510225296e-05, 1.5873461961746216e-05, 1.764576882123947e-05, 1.9418075680732727e-05, 2.1190382540225983e-05, 2.2962689399719238e-05, 2.4734996259212494e-05, 2.650730311870575e-05, 2.8279609978199005e-05, 3.005191683769226e-05, 3.1824223697185516e-05, 3.359653055667877e-05, 3.536883741617203e-05, 3.714114427566528e-05, 3.891345113515854e-05, 4.0685757994651794e-05, 4.245806485414505e-05, 4.4230371713638306e-05, 4.600267857313156e-05, 4.777498543262482e-05, 4.954729229211807e-05, 5.131959915161133e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 11.0, 18.0, 25.0, 25.0, 37.0, 70.0, 115.0, 162.0, 249.0, 359.0, 603.0, 1041.0, 1647.0, 3033.0, 5453.0, 9577.0, 17851.0, 33902.0, 63657.0, 119365.0, 202476.0, 236053.0, 161045.0, 89052.0, 47389.0, 24815.0, 13160.0, 7256.0, 4215.0, 2337.0, 1360.0, 805.0, 519.0, 284.0, 202.0, 140.0, 70.0, 52.0, 33.0, 26.0, 17.0, 6.0, 10.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0], "bins": [-1.060546875, -1.0286636352539062, -0.9967803955078125, -0.9648971557617188, -0.933013916015625, -0.9011306762695312, -0.8692474365234375, -0.8373641967773438, -0.80548095703125, -0.7735977172851562, -0.7417144775390625, -0.7098312377929688, -0.677947998046875, -0.6460647583007812, -0.6141815185546875, -0.5822982788085938, -0.5504150390625, -0.5185317993164062, -0.4866485595703125, -0.45476531982421875, -0.422882080078125, -0.39099884033203125, -0.3591156005859375, -0.32723236083984375, -0.29534912109375, -0.26346588134765625, -0.2315826416015625, -0.19969940185546875, -0.167816162109375, -0.13593292236328125, -0.1040496826171875, -0.07216644287109375, -0.040283203125, -0.00839996337890625, 0.0234832763671875, 0.05536651611328125, 0.087249755859375, 0.11913299560546875, 0.1510162353515625, 0.18289947509765625, 0.21478271484375, 0.24666595458984375, 0.2785491943359375, 0.31043243408203125, 0.342315673828125, 0.37419891357421875, 0.4060821533203125, 0.43796539306640625, 0.4698486328125, 0.5017318725585938, 0.5336151123046875, 0.5654983520507812, 0.597381591796875, 0.6292648315429688, 0.6611480712890625, 0.6930313110351562, 0.72491455078125, 0.7567977905273438, 0.7886810302734375, 0.8205642700195312, 0.852447509765625, 0.8843307495117188, 0.9162139892578125, 0.9480972290039062, 0.97998046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 1.0, 5.0, 1.0, 4.0, 1.0, 6.0, 7.0, 8.0, 8.0, 10.0, 15.0, 14.0, 16.0, 24.0, 27.0, 20.0, 37.0, 42.0, 41.0, 64.0, 67.0, 72.0, 76.0, 86.0, 61.0, 40.0, 49.0, 28.0, 30.0, 24.0, 25.0, 16.0, 11.0, 17.0, 15.0, 11.0, 8.0, 3.0, 6.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2449951171875, -0.2368297576904297, -0.22866439819335938, -0.22049903869628906, -0.21233367919921875, -0.20416831970214844, -0.19600296020507812, -0.1878376007080078, -0.1796722412109375, -0.1715068817138672, -0.16334152221679688, -0.15517616271972656, -0.14701080322265625, -0.13884544372558594, -0.13068008422851562, -0.12251472473144531, -0.114349365234375, -0.10618400573730469, -0.09801864624023438, -0.08985328674316406, -0.08168792724609375, -0.07352256774902344, -0.06535720825195312, -0.05719184875488281, -0.0490264892578125, -0.04086112976074219, -0.032695770263671875, -0.024530410766601562, -0.01636505126953125, -0.008199691772460938, -3.4332275390625e-05, 0.008131027221679688, 0.01629638671875, 0.024461746215820312, 0.032627105712890625, 0.04079246520996094, 0.04895782470703125, 0.05712318420410156, 0.06528854370117188, 0.07345390319824219, 0.0816192626953125, 0.08978462219238281, 0.09794998168945312, 0.10611534118652344, 0.11428070068359375, 0.12244606018066406, 0.13061141967773438, 0.1387767791748047, 0.146942138671875, 0.1551074981689453, 0.16327285766601562, 0.17143821716308594, 0.17960357666015625, 0.18776893615722656, 0.19593429565429688, 0.2040996551513672, 0.2122650146484375, 0.2204303741455078, 0.22859573364257812, 0.23676109313964844, 0.24492645263671875, 0.25309181213378906, 0.2612571716308594, 0.2694225311279297, 0.277587890625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 5.0, 9.0, 8.0, 10.0, 15.0, 22.0, 24.0, 33.0, 34.0, 39.0, 44.0, 47.0, 73.0, 65.0, 55.0, 68.0, 65.0, 58.0, 60.0, 33.0, 42.0, 32.0, 32.0, 36.0, 16.0, 17.0, 17.0, 6.0, 12.0, 6.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-18.734418869018555, -18.22749137878418, -17.720563888549805, -17.213634490966797, -16.706707000732422, -16.199779510498047, -15.692852020263672, -15.185924530029297, -14.678996086120605, -14.17206859588623, -13.665140151977539, -13.158212661743164, -12.651285171508789, -12.144356727600098, -11.637429237365723, -11.130500793457031, -10.623573303222656, -10.116645812988281, -9.60971736907959, -9.102789878845215, -8.595861434936523, -8.088933944702148, -7.582006454467773, -7.07507848739624, -6.568150520324707, -6.061222553253174, -5.554294586181641, -5.047367095947266, -4.540439128875732, -4.033511161804199, -3.526583433151245, -3.019655704498291, -2.5127267837524414, -2.005798816680908, -1.498871088027954, -0.9919432401657104, -0.4850153923034668, 0.021912574768066406, 0.5288403034210205, 1.0357680320739746, 1.5426959991455078, 2.049623966217041, 2.556551694869995, 3.063479423522949, 3.5704073905944824, 4.077335357666016, 4.584262847900391, 5.091190814971924, 5.598118782043457, 6.10504674911499, 6.611974716186523, 7.118902206420898, 7.625830173492432, 8.132758140563965, 8.63968563079834, 9.146614074707031, 9.653541564941406, 10.160469055175781, 10.667397499084473, 11.174324989318848, 11.681253433227539, 12.188180923461914, 12.695108413696289, 13.202035903930664, 13.708964347839355]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 3.0, 5.0, 6.0, 9.0, 16.0, 15.0, 16.0, 17.0, 15.0, 24.0, 26.0, 28.0, 18.0, 38.0, 39.0, 51.0, 50.0, 39.0, 39.0, 30.0, 48.0, 50.0, 53.0, 37.0, 42.0, 38.0, 27.0, 31.0, 40.0, 28.0, 22.0, 23.0, 13.0, 10.0, 13.0, 10.0, 11.0, 7.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.095754623413086, -7.832189559936523, -7.568624973297119, -7.305059909820557, -7.041495323181152, -6.77793025970459, -6.514365196228027, -6.250800609588623, -5.987236022949219, -5.723670959472656, -5.460106372833252, -5.1965413093566895, -4.932976722717285, -4.669411659240723, -4.40584659576416, -4.142282009124756, -3.8787169456481934, -3.61515212059021, -3.3515872955322266, -3.088022232055664, -2.8244576454162598, -2.5608925819396973, -2.297327756881714, -2.0337629318237305, -1.770198106765747, -1.5066332817077637, -1.2430684566497803, -0.9795035123825073, -0.7159386873245239, -0.4523738622665405, -0.18880891799926758, 0.07475590705871582, 0.3383207321166992, 0.6018855571746826, 0.8654504418373108, 1.129015326499939, 1.3925801515579224, 1.6561449766159058, 1.9197099208831787, 2.183274745941162, 2.4468395709991455, 2.710404396057129, 2.9739692211151123, 3.2375340461730957, 3.501099109649658, 3.7646636962890625, 4.028228759765625, 4.2917938232421875, 4.555358409881592, 4.818923473358154, 5.082488059997559, 5.346053123474121, 5.609617710113525, 5.873182773590088, 6.136747360229492, 6.400312423706055, 6.663877487182617, 6.92744255065918, 7.191007137298584, 7.4545722007751465, 7.718136787414551, 7.981701850891113, 8.245266914367676, 8.508831024169922, 8.772396087646484]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 16.0, 28.0, 43.0, 67.0, 106.0, 176.0, 355.0, 575.0, 974.0, 1547.0, 2897.0, 4656.0, 7472.0, 12675.0, 19939.0, 31210.0, 46398.0, 66615.0, 88403.0, 109413.0, 121803.0, 122598.0, 111690.0, 91724.0, 69964.0, 49033.0, 32982.0, 21281.0, 13532.0, 8156.0, 4894.0, 2976.0, 1813.0, 1053.0, 596.0, 359.0, 216.0, 134.0, 57.0, 50.0, 25.0, 22.0, 11.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.96484375, -6.7476806640625, -6.530517578125, -6.3133544921875, -6.09619140625, -5.8790283203125, -5.661865234375, -5.4447021484375, -5.2275390625, -5.0103759765625, -4.793212890625, -4.5760498046875, -4.35888671875, -4.1417236328125, -3.924560546875, -3.7073974609375, -3.490234375, -3.2730712890625, -3.055908203125, -2.8387451171875, -2.62158203125, -2.4044189453125, -2.187255859375, -1.9700927734375, -1.7529296875, -1.5357666015625, -1.318603515625, -1.1014404296875, -0.88427734375, -0.6671142578125, -0.449951171875, -0.2327880859375, -0.015625, 0.2015380859375, 0.418701171875, 0.6358642578125, 0.85302734375, 1.0701904296875, 1.287353515625, 1.5045166015625, 1.7216796875, 1.9388427734375, 2.156005859375, 2.3731689453125, 2.59033203125, 2.8074951171875, 3.024658203125, 3.2418212890625, 3.458984375, 3.6761474609375, 3.893310546875, 4.1104736328125, 4.32763671875, 4.5447998046875, 4.761962890625, 4.9791259765625, 5.1962890625, 5.4134521484375, 5.630615234375, 5.8477783203125, 6.06494140625, 6.2821044921875, 6.499267578125, 6.7164306640625, 6.93359375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 10.0, 13.0, 14.0, 18.0, 14.0, 21.0, 22.0, 28.0, 28.0, 19.0, 47.0, 55.0, 37.0, 41.0, 34.0, 65.0, 53.0, 42.0, 46.0, 46.0, 38.0, 40.0, 43.0, 30.0, 33.0, 40.0, 21.0, 6.0, 24.0, 11.0, 8.0, 9.0, 6.0, 4.0, 5.0, 8.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.1663818359375, -8.871826171875, -8.5772705078125, -8.28271484375, -7.9881591796875, -7.693603515625, -7.3990478515625, -7.1044921875, -6.8099365234375, -6.515380859375, -6.2208251953125, -5.92626953125, -5.6317138671875, -5.337158203125, -5.0426025390625, -4.748046875, -4.4534912109375, -4.158935546875, -3.8643798828125, -3.56982421875, -3.2752685546875, -2.980712890625, -2.6861572265625, -2.3916015625, -2.0970458984375, -1.802490234375, -1.5079345703125, -1.21337890625, -0.9188232421875, -0.624267578125, -0.3297119140625, -0.03515625, 0.2593994140625, 0.553955078125, 0.8485107421875, 1.14306640625, 1.4376220703125, 1.732177734375, 2.0267333984375, 2.3212890625, 2.6158447265625, 2.910400390625, 3.2049560546875, 3.49951171875, 3.7940673828125, 4.088623046875, 4.3831787109375, 4.677734375, 4.9722900390625, 5.266845703125, 5.5614013671875, 5.85595703125, 6.1505126953125, 6.445068359375, 6.7396240234375, 7.0341796875, 7.3287353515625, 7.623291015625, 7.9178466796875, 8.21240234375, 8.5069580078125, 8.801513671875, 9.0960693359375, 9.390625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 9.0, 7.0, 14.0, 28.0, 26.0, 66.0, 85.0, 112.0, 214.0, 325.0, 478.0, 845.0, 1357.0, 2088.0, 3315.0, 5165.0, 7836.0, 12429.0, 18606.0, 26775.0, 38410.0, 52405.0, 68467.0, 85048.0, 98248.0, 106172.0, 105603.0, 97522.0, 83733.0, 67651.0, 51083.0, 37497.0, 25943.0, 17916.0, 11795.0, 7652.0, 5035.0, 3258.0, 1974.0, 1202.0, 791.0, 477.0, 341.0, 202.0, 130.0, 79.0, 56.0, 28.0, 30.0, 11.0, 6.0, 9.0, 4.0, 3.0, 1.0, 2.0], "bins": [-6.6015625, -6.40716552734375, -6.2127685546875, -6.01837158203125, -5.823974609375, -5.62957763671875, -5.4351806640625, -5.24078369140625, -5.04638671875, -4.85198974609375, -4.6575927734375, -4.46319580078125, -4.268798828125, -4.07440185546875, -3.8800048828125, -3.68560791015625, -3.4912109375, -3.29681396484375, -3.1024169921875, -2.90802001953125, -2.713623046875, -2.51922607421875, -2.3248291015625, -2.13043212890625, -1.93603515625, -1.74163818359375, -1.5472412109375, -1.35284423828125, -1.158447265625, -0.96405029296875, -0.7696533203125, -0.57525634765625, -0.380859375, -0.18646240234375, 0.0079345703125, 0.20233154296875, 0.396728515625, 0.59112548828125, 0.7855224609375, 0.97991943359375, 1.17431640625, 1.36871337890625, 1.5631103515625, 1.75750732421875, 1.951904296875, 2.14630126953125, 2.3406982421875, 2.53509521484375, 2.7294921875, 2.92388916015625, 3.1182861328125, 3.31268310546875, 3.507080078125, 3.70147705078125, 3.8958740234375, 4.09027099609375, 4.28466796875, 4.47906494140625, 4.6734619140625, 4.86785888671875, 5.062255859375, 5.25665283203125, 5.4510498046875, 5.64544677734375, 5.83984375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 12.0, 14.0, 15.0, 18.0, 24.0, 19.0, 25.0, 26.0, 26.0, 33.0, 43.0, 45.0, 38.0, 35.0, 35.0, 38.0, 54.0, 44.0, 39.0, 42.0, 30.0, 30.0, 49.0, 39.0, 27.0, 31.0, 24.0, 12.0, 21.0, 14.0, 17.0, 14.0, 9.0, 6.0, 11.0, 4.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.6055908203125, -4.437744140625, -4.2698974609375, -4.10205078125, -3.9342041015625, -3.766357421875, -3.5985107421875, -3.4306640625, -3.2628173828125, -3.094970703125, -2.9271240234375, -2.75927734375, -2.5914306640625, -2.423583984375, -2.2557373046875, -2.087890625, -1.9200439453125, -1.752197265625, -1.5843505859375, -1.41650390625, -1.2486572265625, -1.080810546875, -0.9129638671875, -0.7451171875, -0.5772705078125, -0.409423828125, -0.2415771484375, -0.07373046875, 0.0941162109375, 0.261962890625, 0.4298095703125, 0.59765625, 0.7655029296875, 0.933349609375, 1.1011962890625, 1.26904296875, 1.4368896484375, 1.604736328125, 1.7725830078125, 1.9404296875, 2.1082763671875, 2.276123046875, 2.4439697265625, 2.61181640625, 2.7796630859375, 2.947509765625, 3.1153564453125, 3.283203125, 3.4510498046875, 3.618896484375, 3.7867431640625, 3.95458984375, 4.1224365234375, 4.290283203125, 4.4581298828125, 4.6259765625, 4.7938232421875, 4.961669921875, 5.1295166015625, 5.29736328125, 5.4652099609375, 5.633056640625, 5.8009033203125, 5.96875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 3.0, 12.0, 14.0, 11.0, 23.0, 32.0, 44.0, 73.0, 96.0, 167.0, 192.0, 328.0, 496.0, 792.0, 1175.0, 1854.0, 3027.0, 5085.0, 8983.0, 16796.0, 32614.0, 63353.0, 113937.0, 177069.0, 207073.0, 173780.0, 110829.0, 60941.0, 31341.0, 16490.0, 8807.0, 4891.0, 2994.0, 1805.0, 1131.0, 763.0, 478.0, 309.0, 216.0, 155.0, 116.0, 80.0, 63.0, 52.0, 21.0, 15.0, 16.0, 10.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -7.0272216796875, -6.796630859375, -6.5660400390625, -6.33544921875, -6.1048583984375, -5.874267578125, -5.6436767578125, -5.4130859375, -5.1824951171875, -4.951904296875, -4.7213134765625, -4.49072265625, -4.2601318359375, -4.029541015625, -3.7989501953125, -3.568359375, -3.3377685546875, -3.107177734375, -2.8765869140625, -2.64599609375, -2.4154052734375, -2.184814453125, -1.9542236328125, -1.7236328125, -1.4930419921875, -1.262451171875, -1.0318603515625, -0.80126953125, -0.5706787109375, -0.340087890625, -0.1094970703125, 0.12109375, 0.3516845703125, 0.582275390625, 0.8128662109375, 1.04345703125, 1.2740478515625, 1.504638671875, 1.7352294921875, 1.9658203125, 2.1964111328125, 2.427001953125, 2.6575927734375, 2.88818359375, 3.1187744140625, 3.349365234375, 3.5799560546875, 3.810546875, 4.0411376953125, 4.271728515625, 4.5023193359375, 4.73291015625, 4.9635009765625, 5.194091796875, 5.4246826171875, 5.6552734375, 5.8858642578125, 6.116455078125, 6.3470458984375, 6.57763671875, 6.8082275390625, 7.038818359375, 7.2694091796875, 7.5]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 9.0, 7.0, 10.0, 6.0, 13.0, 18.0, 18.0, 16.0, 30.0, 34.0, 41.0, 48.0, 47.0, 62.0, 54.0, 65.0, 66.0, 47.0, 60.0, 57.0, 53.0, 57.0, 39.0, 32.0, 29.0, 17.0, 11.0, 18.0, 14.0, 11.0, 6.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044989585876464844, -0.00043143704533576965, -0.00041297823190689087, -0.0003945194184780121, -0.0003760606050491333, -0.0003576017916202545, -0.00033914297819137573, -0.00032068416476249695, -0.00030222535133361816, -0.0002837665379047394, -0.0002653077244758606, -0.0002468489110469818, -0.00022839009761810303, -0.00020993128418922424, -0.00019147247076034546, -0.00017301365733146667, -0.0001545548439025879, -0.0001360960304737091, -0.00011763721704483032, -9.917840361595154e-05, -8.071959018707275e-05, -6.226077675819397e-05, -4.3801963329315186e-05, -2.53431499004364e-05, -6.884336471557617e-06, 1.1574476957321167e-05, 3.003329038619995e-05, 4.8492103815078735e-05, 6.695091724395752e-05, 8.54097306728363e-05, 0.00010386854410171509, 0.00012232735753059387, 0.00014078617095947266, 0.00015924498438835144, 0.00017770379781723022, 0.000196162611246109, 0.0002146214246749878, 0.00023308023810386658, 0.00025153905153274536, 0.00026999786496162415, 0.00028845667839050293, 0.0003069154918193817, 0.0003253743052482605, 0.0003438331186771393, 0.00036229193210601807, 0.00038075074553489685, 0.00039920955896377563, 0.0004176683723926544, 0.0004361271858215332, 0.000454585999250412, 0.00047304481267929077, 0.0004915036261081696, 0.0005099624395370483, 0.0005284212529659271, 0.0005468800663948059, 0.0005653388798236847, 0.0005837976932525635, 0.0006022565066814423, 0.000620715320110321, 0.0006391741335391998, 0.0006576329469680786, 0.0006760917603969574, 0.0006945505738258362, 0.000713009387254715, 0.0007314682006835938]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 9.0, 14.0, 16.0, 14.0, 26.0, 38.0, 52.0, 73.0, 107.0, 144.0, 224.0, 336.0, 540.0, 856.0, 1379.0, 2186.0, 4204.0, 7881.0, 16512.0, 35121.0, 76231.0, 152595.0, 232672.0, 229223.0, 147600.0, 73282.0, 33754.0, 15675.0, 7762.0, 4085.0, 2301.0, 1264.0, 806.0, 557.0, 323.0, 215.0, 116.0, 120.0, 75.0, 48.0, 34.0, 20.0, 22.0, 16.0, 6.0, 6.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.72705078125, -8.4541015625, -8.18115234375, -7.908203125, -7.63525390625, -7.3623046875, -7.08935546875, -6.81640625, -6.54345703125, -6.2705078125, -5.99755859375, -5.724609375, -5.45166015625, -5.1787109375, -4.90576171875, -4.6328125, -4.35986328125, -4.0869140625, -3.81396484375, -3.541015625, -3.26806640625, -2.9951171875, -2.72216796875, -2.44921875, -2.17626953125, -1.9033203125, -1.63037109375, -1.357421875, -1.08447265625, -0.8115234375, -0.53857421875, -0.265625, 0.00732421875, 0.2802734375, 0.55322265625, 0.826171875, 1.09912109375, 1.3720703125, 1.64501953125, 1.91796875, 2.19091796875, 2.4638671875, 2.73681640625, 3.009765625, 3.28271484375, 3.5556640625, 3.82861328125, 4.1015625, 4.37451171875, 4.6474609375, 4.92041015625, 5.193359375, 5.46630859375, 5.7392578125, 6.01220703125, 6.28515625, 6.55810546875, 6.8310546875, 7.10400390625, 7.376953125, 7.64990234375, 7.9228515625, 8.19580078125, 8.46875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 3.0, 8.0, 16.0, 9.0, 21.0, 13.0, 26.0, 28.0, 31.0, 47.0, 46.0, 49.0, 51.0, 65.0, 47.0, 52.0, 54.0, 50.0, 55.0, 38.0, 50.0, 38.0, 36.0, 26.0, 18.0, 15.0, 15.0, 15.0, 13.0, 8.0, 10.0, 9.0, 7.0, 2.0, 5.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.53515625, -1.4865264892578125, -1.437896728515625, -1.3892669677734375, -1.34063720703125, -1.2920074462890625, -1.243377685546875, -1.1947479248046875, -1.1461181640625, -1.0974884033203125, -1.048858642578125, -1.0002288818359375, -0.95159912109375, -0.9029693603515625, -0.854339599609375, -0.8057098388671875, -0.757080078125, -0.7084503173828125, -0.659820556640625, -0.6111907958984375, -0.56256103515625, -0.5139312744140625, -0.465301513671875, -0.4166717529296875, -0.3680419921875, -0.3194122314453125, -0.270782470703125, -0.2221527099609375, -0.17352294921875, -0.1248931884765625, -0.076263427734375, -0.0276336669921875, 0.02099609375, 0.0696258544921875, 0.118255615234375, 0.1668853759765625, 0.21551513671875, 0.2641448974609375, 0.312774658203125, 0.3614044189453125, 0.4100341796875, 0.4586639404296875, 0.507293701171875, 0.5559234619140625, 0.60455322265625, 0.6531829833984375, 0.701812744140625, 0.7504425048828125, 0.799072265625, 0.8477020263671875, 0.896331787109375, 0.9449615478515625, 0.99359130859375, 1.0422210693359375, 1.090850830078125, 1.1394805908203125, 1.1881103515625, 1.2367401123046875, 1.285369873046875, 1.3339996337890625, 1.38262939453125, 1.4312591552734375, 1.479888916015625, 1.5285186767578125, 1.5771484375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 5.0, 10.0, 10.0, 12.0, 14.0, 17.0, 21.0, 34.0, 25.0, 28.0, 45.0, 42.0, 41.0, 57.0, 60.0, 70.0, 69.0, 40.0, 64.0, 51.0, 41.0, 44.0, 32.0, 32.0, 29.0, 27.0, 19.0, 16.0, 10.0, 7.0, 12.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.999459266662598, -15.514992713928223, -15.030526161193848, -14.546059608459473, -14.061593055725098, -13.577126502990723, -13.092659950256348, -12.608193397521973, -12.123726844787598, -11.639260292053223, -11.154793739318848, -10.670327186584473, -10.185860633850098, -9.701394081115723, -9.216927528381348, -8.732460975646973, -8.247994422912598, -7.763527870178223, -7.279061317443848, -6.794594764709473, -6.310128211975098, -5.825661659240723, -5.341195106506348, -4.856728553771973, -4.372262001037598, -3.8877954483032227, -3.4033288955688477, -2.9188623428344727, -2.4343957901000977, -1.9499292373657227, -1.4654626846313477, -0.9809961318969727, -0.49653053283691406, -0.012063980102539062, 0.47240257263183594, 0.9568691253662109, 1.441335678100586, 1.925802230834961, 2.410268783569336, 2.894735336303711, 3.379201889038086, 3.863668441772461, 4.348134994506836, 4.832601547241211, 5.317068099975586, 5.801534652709961, 6.286001205444336, 6.770467758178711, 7.254934310913086, 7.739400863647461, 8.223867416381836, 8.708333969116211, 9.192800521850586, 9.677267074584961, 10.161733627319336, 10.646200180053711, 11.130666732788086, 11.615133285522461, 12.099599838256836, 12.584066390991211, 13.068532943725586, 13.552999496459961, 14.037466049194336, 14.521932601928711, 15.006399154663086]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 0.0, 9.0, 6.0, 13.0, 13.0, 23.0, 13.0, 18.0, 34.0, 18.0, 37.0, 29.0, 30.0, 33.0, 32.0, 40.0, 51.0, 31.0, 43.0, 42.0, 38.0, 39.0, 34.0, 40.0, 36.0, 34.0, 31.0, 27.0, 22.0, 32.0, 21.0, 23.0, 14.0, 14.0, 12.0, 13.0, 8.0, 7.0, 6.0, 4.0, 1.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.057671546936035, -7.795970916748047, -7.534270286560059, -7.27256965637207, -7.010869026184082, -6.749168395996094, -6.487468242645264, -6.225767612457275, -5.964066982269287, -5.702366352081299, -5.4406657218933105, -5.178965091705322, -4.917264938354492, -4.655564308166504, -4.393863677978516, -4.132163047790527, -3.870462417602539, -3.608761787414551, -3.3470611572265625, -3.0853607654571533, -2.823660135269165, -2.5619595050811768, -2.3002591133117676, -2.0385584831237793, -1.776857852935791, -1.5151572227478027, -1.253456711769104, -0.9917561411857605, -0.730055570602417, -0.4683549404144287, -0.20665442943572998, 0.05504608154296875, 0.3167457580566406, 0.5784463286399841, 0.8401468992233276, 1.1018474102020264, 1.3635480403900146, 1.625248670578003, 1.8869491815567017, 2.1486496925354004, 2.4103503227233887, 2.672050952911377, 2.9337515830993652, 3.1954519748687744, 3.4571526050567627, 3.718853235244751, 3.98055362701416, 4.242254257202148, 4.503954887390137, 4.765655517578125, 5.027356147766113, 5.289056777954102, 5.55075740814209, 5.812458038330078, 6.074158191680908, 6.3358588218688965, 6.597559452056885, 6.859260082244873, 7.120960712432861, 7.38266134262085, 7.64436149597168, 7.906062126159668, 8.167762756347656, 8.429463386535645, 8.691164016723633]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 8.0, 12.0, 18.0, 24.0, 58.0, 53.0, 100.0, 188.0, 252.0, 375.0, 638.0, 1049.0, 1593.0, 2468.0, 3787.0, 6222.0, 9609.0, 15702.0, 25542.0, 40476.0, 64846.0, 101637.0, 156426.0, 234266.0, 329404.0, 427679.0, 503250.0, 526895.0, 481257.0, 392175.0, 291797.0, 203183.0, 135507.0, 87081.0, 55744.0, 34824.0, 21876.0, 13968.0, 8736.0, 5488.0, 3587.0, 2260.0, 1489.0, 981.0, 631.0, 348.0, 279.0, 162.0, 125.0, 72.0, 53.0, 26.0, 24.0, 20.0, 9.0, 7.0, 2.0, 2.0, 3.0, 4.0], "bins": [-9.5, -9.1966552734375, -8.893310546875, -8.5899658203125, -8.28662109375, -7.9832763671875, -7.679931640625, -7.3765869140625, -7.0732421875, -6.7698974609375, -6.466552734375, -6.1632080078125, -5.85986328125, -5.5565185546875, -5.253173828125, -4.9498291015625, -4.646484375, -4.3431396484375, -4.039794921875, -3.7364501953125, -3.43310546875, -3.1297607421875, -2.826416015625, -2.5230712890625, -2.2197265625, -1.9163818359375, -1.613037109375, -1.3096923828125, -1.00634765625, -0.7030029296875, -0.399658203125, -0.0963134765625, 0.20703125, 0.5103759765625, 0.813720703125, 1.1170654296875, 1.42041015625, 1.7237548828125, 2.027099609375, 2.3304443359375, 2.6337890625, 2.9371337890625, 3.240478515625, 3.5438232421875, 3.84716796875, 4.1505126953125, 4.453857421875, 4.7572021484375, 5.060546875, 5.3638916015625, 5.667236328125, 5.9705810546875, 6.27392578125, 6.5772705078125, 6.880615234375, 7.1839599609375, 7.4873046875, 7.7906494140625, 8.093994140625, 8.3973388671875, 8.70068359375, 9.0040283203125, 9.307373046875, 9.6107177734375, 9.9140625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 9.0, 5.0, 7.0, 12.0, 14.0, 9.0, 13.0, 14.0, 17.0, 25.0, 24.0, 19.0, 28.0, 26.0, 29.0, 33.0, 38.0, 35.0, 30.0, 44.0, 40.0, 33.0, 35.0, 33.0, 33.0, 40.0, 33.0, 41.0, 34.0, 21.0, 27.0, 36.0, 29.0, 23.0, 19.0, 21.0, 13.0, 10.0, 10.0, 3.0, 10.0, 2.0, 7.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.48046875, -6.27508544921875, -6.0697021484375, -5.86431884765625, -5.658935546875, -5.45355224609375, -5.2481689453125, -5.04278564453125, -4.83740234375, -4.63201904296875, -4.4266357421875, -4.22125244140625, -4.015869140625, -3.81048583984375, -3.6051025390625, -3.39971923828125, -3.1943359375, -2.98895263671875, -2.7835693359375, -2.57818603515625, -2.372802734375, -2.16741943359375, -1.9620361328125, -1.75665283203125, -1.55126953125, -1.34588623046875, -1.1405029296875, -0.93511962890625, -0.729736328125, -0.52435302734375, -0.3189697265625, -0.11358642578125, 0.091796875, 0.29718017578125, 0.5025634765625, 0.70794677734375, 0.913330078125, 1.11871337890625, 1.3240966796875, 1.52947998046875, 1.73486328125, 1.94024658203125, 2.1456298828125, 2.35101318359375, 2.556396484375, 2.76177978515625, 2.9671630859375, 3.17254638671875, 3.3779296875, 3.58331298828125, 3.7886962890625, 3.99407958984375, 4.199462890625, 4.40484619140625, 4.6102294921875, 4.81561279296875, 5.02099609375, 5.22637939453125, 5.4317626953125, 5.63714599609375, 5.842529296875, 6.04791259765625, 6.2532958984375, 6.45867919921875, 6.6640625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 19.0, 21.0, 33.0, 32.0, 87.0, 113.0, 183.0, 280.0, 456.0, 756.0, 1206.0, 1821.0, 3082.0, 5120.0, 8738.0, 14065.0, 23441.0, 38716.0, 62824.0, 101463.0, 156961.0, 233749.0, 327094.0, 422753.0, 496764.0, 519473.0, 482192.0, 401297.0, 303126.0, 212759.0, 142144.0, 90684.0, 56124.0, 34332.0, 20765.0, 12418.0, 7322.0, 4507.0, 2818.0, 1729.0, 1062.0, 635.0, 406.0, 247.0, 153.0, 107.0, 77.0, 41.0, 33.0, 15.0, 12.0, 10.0, 5.0, 3.0, 5.0, 4.0], "bins": [-11.734375, -11.3828125, -11.03125, -10.6796875, -10.328125, -9.9765625, -9.625, -9.2734375, -8.921875, -8.5703125, -8.21875, -7.8671875, -7.515625, -7.1640625, -6.8125, -6.4609375, -6.109375, -5.7578125, -5.40625, -5.0546875, -4.703125, -4.3515625, -4.0, -3.6484375, -3.296875, -2.9453125, -2.59375, -2.2421875, -1.890625, -1.5390625, -1.1875, -0.8359375, -0.484375, -0.1328125, 0.21875, 0.5703125, 0.921875, 1.2734375, 1.625, 1.9765625, 2.328125, 2.6796875, 3.03125, 3.3828125, 3.734375, 4.0859375, 4.4375, 4.7890625, 5.140625, 5.4921875, 5.84375, 6.1953125, 6.546875, 6.8984375, 7.25, 7.6015625, 7.953125, 8.3046875, 8.65625, 9.0078125, 9.359375, 9.7109375, 10.0625, 10.4140625, 10.765625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 8.0, 12.0, 7.0, 19.0, 22.0, 47.0, 39.0, 56.0, 61.0, 83.0, 79.0, 103.0, 104.0, 121.0, 122.0, 141.0, 172.0, 184.0, 192.0, 186.0, 211.0, 203.0, 199.0, 186.0, 184.0, 164.0, 169.0, 137.0, 130.0, 129.0, 111.0, 74.0, 95.0, 59.0, 47.0, 42.0, 25.0, 33.0, 20.0, 17.0, 16.0, 15.0, 9.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.791015625, -3.666961669921875, -3.54290771484375, -3.418853759765625, -3.2947998046875, -3.170745849609375, -3.04669189453125, -2.922637939453125, -2.798583984375, -2.674530029296875, -2.55047607421875, -2.426422119140625, -2.3023681640625, -2.178314208984375, -2.05426025390625, -1.930206298828125, -1.80615234375, -1.682098388671875, -1.55804443359375, -1.433990478515625, -1.3099365234375, -1.185882568359375, -1.06182861328125, -0.937774658203125, -0.813720703125, -0.689666748046875, -0.56561279296875, -0.441558837890625, -0.3175048828125, -0.193450927734375, -0.06939697265625, 0.054656982421875, 0.1787109375, 0.302764892578125, 0.42681884765625, 0.550872802734375, 0.6749267578125, 0.798980712890625, 0.92303466796875, 1.047088623046875, 1.171142578125, 1.295196533203125, 1.41925048828125, 1.543304443359375, 1.6673583984375, 1.791412353515625, 1.91546630859375, 2.039520263671875, 2.16357421875, 2.287628173828125, 2.41168212890625, 2.535736083984375, 2.6597900390625, 2.783843994140625, 2.90789794921875, 3.031951904296875, 3.156005859375, 3.280059814453125, 3.40411376953125, 3.528167724609375, 3.6522216796875, 3.776275634765625, 3.90032958984375, 4.024383544921875, 4.1484375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 15.0, 10.0, 23.0, 21.0, 23.0, 22.0, 41.0, 48.0, 55.0, 53.0, 56.0, 64.0, 60.0, 80.0, 59.0, 66.0, 54.0, 48.0, 40.0, 21.0, 27.0, 27.0, 21.0, 18.0, 10.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.157114028930664, -18.553369522094727, -17.949626922607422, -17.345882415771484, -16.74213981628418, -16.138395309448242, -15.534652709960938, -14.930908203125, -14.327165603637695, -13.723422050476074, -13.119678497314453, -12.515934944152832, -11.912191390991211, -11.30844783782959, -10.704704284667969, -10.100959777832031, -9.49721622467041, -8.893472671508789, -8.289729118347168, -7.685985565185547, -7.082242012023926, -6.478498458862305, -5.874754428863525, -5.271010875701904, -4.667267322540283, -4.063523769378662, -3.459780216217041, -2.856036424636841, -2.2522928714752197, -1.6485493183135986, -1.0448055267333984, -0.44106197357177734, 0.16268157958984375, 0.7664251923561096, 1.3701688051223755, 1.9739124774932861, 2.5776560306549072, 3.1813995838165283, 3.7851433753967285, 4.38888692855835, 4.992630481719971, 5.596374034881592, 6.200117588043213, 6.803861618041992, 7.407605171203613, 8.011348724365234, 8.615092277526855, 9.218835830688477, 9.822579383850098, 10.426322937011719, 11.03006649017334, 11.633810043334961, 12.237553596496582, 12.841297149658203, 13.44504165649414, 14.048784255981445, 14.652528762817383, 15.256272315979004, 15.860015869140625, 16.463760375976562, 17.067502975463867, 17.671247482299805, 18.27499008178711, 18.878734588623047, 19.48247718811035]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 5.0, 9.0, 15.0, 13.0, 14.0, 26.0, 27.0, 29.0, 40.0, 28.0, 36.0, 34.0, 32.0, 39.0, 40.0, 51.0, 43.0, 52.0, 42.0, 44.0, 34.0, 45.0, 22.0, 36.0, 27.0, 29.0, 27.0, 24.0, 28.0, 16.0, 13.0, 10.0, 14.0, 11.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59604263305664, -9.292692184448242, -8.989340782165527, -8.685989379882812, -8.382638931274414, -8.079288482666016, -7.775937080383301, -7.472586154937744, -7.1692352294921875, -6.865884304046631, -6.562533378601074, -6.259182453155518, -5.955831527709961, -5.652480602264404, -5.349129676818848, -5.045778751373291, -4.742427825927734, -4.439076900482178, -4.135725975036621, -3.8323750495910645, -3.529024124145508, -3.225673198699951, -2.9223222732543945, -2.618971347808838, -2.3156204223632812, -2.0122694969177246, -1.708918571472168, -1.4055676460266113, -1.1022167205810547, -0.798865795135498, -0.4955148696899414, -0.19216394424438477, 0.11118698120117188, 0.4145379066467285, 0.7178888320922852, 1.0212397575378418, 1.3245906829833984, 1.627941608428955, 1.9312925338745117, 2.2346434593200684, 2.537994384765625, 2.8413453102111816, 3.1446962356567383, 3.448047161102295, 3.7513980865478516, 4.054749011993408, 4.358099937438965, 4.6614508628845215, 4.964801788330078, 5.268152713775635, 5.571503639221191, 5.874854564666748, 6.178205490112305, 6.481556415557861, 6.784907341003418, 7.088258266448975, 7.391609191894531, 7.694960117340088, 7.9983110427856445, 8.30166244506836, 8.605012893676758, 8.908363342285156, 9.211714744567871, 9.515066146850586, 9.818416595458984]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 12.0, 11.0, 29.0, 20.0, 70.0, 80.0, 112.0, 182.0, 216.0, 338.0, 543.0, 831.0, 1239.0, 1890.0, 2818.0, 4350.0, 6704.0, 9991.0, 15186.0, 23090.0, 34234.0, 50779.0, 71796.0, 99015.0, 123461.0, 136267.0, 126442.0, 102692.0, 75443.0, 53355.0, 36368.0, 24018.0, 16218.0, 10634.0, 6798.0, 4461.0, 2999.0, 2003.0, 1287.0, 866.0, 559.0, 387.0, 257.0, 150.0, 115.0, 65.0, 47.0, 40.0, 31.0, 13.0, 18.0, 10.0, 4.0, 4.0, 1.0, 1.0, 6.0], "bins": [-2.078125, -2.014312744140625, -1.95050048828125, -1.886688232421875, -1.8228759765625, -1.759063720703125, -1.69525146484375, -1.631439208984375, -1.567626953125, -1.503814697265625, -1.44000244140625, -1.376190185546875, -1.3123779296875, -1.248565673828125, -1.18475341796875, -1.120941162109375, -1.05712890625, -0.993316650390625, -0.92950439453125, -0.865692138671875, -0.8018798828125, -0.738067626953125, -0.67425537109375, -0.610443115234375, -0.546630859375, -0.482818603515625, -0.41900634765625, -0.355194091796875, -0.2913818359375, -0.227569580078125, -0.16375732421875, -0.099945068359375, -0.0361328125, 0.027679443359375, 0.09149169921875, 0.155303955078125, 0.2191162109375, 0.282928466796875, 0.34674072265625, 0.410552978515625, 0.474365234375, 0.538177490234375, 0.60198974609375, 0.665802001953125, 0.7296142578125, 0.793426513671875, 0.85723876953125, 0.921051025390625, 0.98486328125, 1.048675537109375, 1.11248779296875, 1.176300048828125, 1.2401123046875, 1.303924560546875, 1.36773681640625, 1.431549072265625, 1.495361328125, 1.559173583984375, 1.62298583984375, 1.686798095703125, 1.7506103515625, 1.814422607421875, 1.87823486328125, 1.942047119140625, 2.005859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 7.0, 10.0, 9.0, 14.0, 20.0, 16.0, 24.0, 35.0, 25.0, 24.0, 34.0, 45.0, 34.0, 44.0, 49.0, 51.0, 55.0, 56.0, 55.0, 43.0, 40.0, 40.0, 39.0, 38.0, 21.0, 25.0, 22.0, 19.0, 18.0, 13.0, 17.0, 13.0, 8.0, 5.0, 7.0, 7.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.971435546875, -9.61474609375, -9.258056640625, -8.9013671875, -8.544677734375, -8.18798828125, -7.831298828125, -7.474609375, -7.117919921875, -6.76123046875, -6.404541015625, -6.0478515625, -5.691162109375, -5.33447265625, -4.977783203125, -4.62109375, -4.264404296875, -3.90771484375, -3.551025390625, -3.1943359375, -2.837646484375, -2.48095703125, -2.124267578125, -1.767578125, -1.410888671875, -1.05419921875, -0.697509765625, -0.3408203125, 0.015869140625, 0.37255859375, 0.729248046875, 1.0859375, 1.442626953125, 1.79931640625, 2.156005859375, 2.5126953125, 2.869384765625, 3.22607421875, 3.582763671875, 3.939453125, 4.296142578125, 4.65283203125, 5.009521484375, 5.3662109375, 5.722900390625, 6.07958984375, 6.436279296875, 6.79296875, 7.149658203125, 7.50634765625, 7.863037109375, 8.2197265625, 8.576416015625, 8.93310546875, 9.289794921875, 9.646484375, 10.003173828125, 10.35986328125, 10.716552734375, 11.0732421875, 11.429931640625, 11.78662109375, 12.143310546875, 12.5]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 10.0, 23.0, 41.0, 55.0, 82.0, 135.0, 199.0, 365.0, 619.0, 1007.0, 1693.0, 3083.0, 5613.0, 10436.0, 20072.0, 39431.0, 76995.0, 138809.0, 210999.0, 216635.0, 149121.0, 83204.0, 42768.0, 21847.0, 11544.0, 5996.0, 3347.0, 1785.0, 1058.0, 616.0, 352.0, 214.0, 131.0, 92.0, 62.0, 31.0, 21.0, 16.0, 11.0, 11.0, 8.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.689453125, -3.581146240234375, -3.47283935546875, -3.364532470703125, -3.2562255859375, -3.147918701171875, -3.03961181640625, -2.931304931640625, -2.822998046875, -2.714691162109375, -2.60638427734375, -2.498077392578125, -2.3897705078125, -2.281463623046875, -2.17315673828125, -2.064849853515625, -1.95654296875, -1.848236083984375, -1.73992919921875, -1.631622314453125, -1.5233154296875, -1.415008544921875, -1.30670166015625, -1.198394775390625, -1.090087890625, -0.981781005859375, -0.87347412109375, -0.765167236328125, -0.6568603515625, -0.548553466796875, -0.44024658203125, -0.331939697265625, -0.2236328125, -0.115325927734375, -0.00701904296875, 0.101287841796875, 0.2095947265625, 0.317901611328125, 0.42620849609375, 0.534515380859375, 0.642822265625, 0.751129150390625, 0.85943603515625, 0.967742919921875, 1.0760498046875, 1.184356689453125, 1.29266357421875, 1.400970458984375, 1.50927734375, 1.617584228515625, 1.72589111328125, 1.834197998046875, 1.9425048828125, 2.050811767578125, 2.15911865234375, 2.267425537109375, 2.375732421875, 2.484039306640625, 2.59234619140625, 2.700653076171875, 2.8089599609375, 2.917266845703125, 3.02557373046875, 3.133880615234375, 3.2421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 9.0, 16.0, 7.0, 8.0, 15.0, 16.0, 15.0, 21.0, 21.0, 24.0, 29.0, 29.0, 26.0, 38.0, 37.0, 27.0, 40.0, 44.0, 36.0, 25.0, 40.0, 40.0, 33.0, 34.0, 45.0, 42.0, 31.0, 24.0, 25.0, 26.0, 16.0, 19.0, 16.0, 13.0, 20.0, 21.0, 11.0, 14.0, 8.0, 7.0, 7.0, 7.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.5078125, -6.32342529296875, -6.1390380859375, -5.95465087890625, -5.770263671875, -5.58587646484375, -5.4014892578125, -5.21710205078125, -5.03271484375, -4.84832763671875, -4.6639404296875, -4.47955322265625, -4.295166015625, -4.11077880859375, -3.9263916015625, -3.74200439453125, -3.5576171875, -3.37322998046875, -3.1888427734375, -3.00445556640625, -2.820068359375, -2.63568115234375, -2.4512939453125, -2.26690673828125, -2.08251953125, -1.89813232421875, -1.7137451171875, -1.52935791015625, -1.344970703125, -1.16058349609375, -0.9761962890625, -0.79180908203125, -0.607421875, -0.42303466796875, -0.2386474609375, -0.05426025390625, 0.130126953125, 0.31451416015625, 0.4989013671875, 0.68328857421875, 0.86767578125, 1.05206298828125, 1.2364501953125, 1.42083740234375, 1.605224609375, 1.78961181640625, 1.9739990234375, 2.15838623046875, 2.3427734375, 2.52716064453125, 2.7115478515625, 2.89593505859375, 3.080322265625, 3.26470947265625, 3.4490966796875, 3.63348388671875, 3.81787109375, 4.00225830078125, 4.1866455078125, 4.37103271484375, 4.555419921875, 4.73980712890625, 4.9241943359375, 5.10858154296875, 5.29296875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 13.0, 12.0, 19.0, 24.0, 54.0, 79.0, 152.0, 217.0, 383.0, 645.0, 1230.0, 2187.0, 4624.0, 10085.0, 23403.0, 59732.0, 154378.0, 316461.0, 274447.0, 119865.0, 46044.0, 18622.0, 7867.0, 3673.0, 1934.0, 969.0, 551.0, 337.0, 197.0, 119.0, 81.0, 41.0, 36.0, 20.0, 13.0, 4.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3642578125, -1.323974609375, -1.28369140625, -1.243408203125, -1.203125, -1.162841796875, -1.12255859375, -1.082275390625, -1.0419921875, -1.001708984375, -0.96142578125, -0.921142578125, -0.880859375, -0.840576171875, -0.80029296875, -0.760009765625, -0.7197265625, -0.679443359375, -0.63916015625, -0.598876953125, -0.55859375, -0.518310546875, -0.47802734375, -0.437744140625, -0.3974609375, -0.357177734375, -0.31689453125, -0.276611328125, -0.236328125, -0.196044921875, -0.15576171875, -0.115478515625, -0.0751953125, -0.034912109375, 0.00537109375, 0.045654296875, 0.0859375, 0.126220703125, 0.16650390625, 0.206787109375, 0.2470703125, 0.287353515625, 0.32763671875, 0.367919921875, 0.408203125, 0.448486328125, 0.48876953125, 0.529052734375, 0.5693359375, 0.609619140625, 0.64990234375, 0.690185546875, 0.73046875, 0.770751953125, 0.81103515625, 0.851318359375, 0.8916015625, 0.931884765625, 0.97216796875, 1.012451171875, 1.052734375, 1.093017578125, 1.13330078125, 1.173583984375, 1.2138671875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 4.0, 7.0, 4.0, 8.0, 15.0, 18.0, 26.0, 28.0, 34.0, 34.0, 45.0, 40.0, 41.0, 54.0, 65.0, 66.0, 46.0, 67.0, 54.0, 50.0, 43.0, 51.0, 39.0, 20.0, 27.0, 30.0, 21.0, 13.0, 13.0, 8.0, 7.0, 10.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.97834587097168e-05, -5.78761100769043e-05, -5.59687614440918e-05, -5.40614128112793e-05, -5.21540641784668e-05, -5.02467155456543e-05, -4.83393669128418e-05, -4.64320182800293e-05, -4.45246696472168e-05, -4.26173210144043e-05, -4.07099723815918e-05, -3.88026237487793e-05, -3.68952751159668e-05, -3.49879264831543e-05, -3.30805778503418e-05, -3.11732292175293e-05, -2.9265880584716797e-05, -2.7358531951904297e-05, -2.5451183319091797e-05, -2.3543834686279297e-05, -2.1636486053466797e-05, -1.9729137420654297e-05, -1.7821788787841797e-05, -1.5914440155029297e-05, -1.4007091522216797e-05, -1.2099742889404297e-05, -1.0192394256591797e-05, -8.285045623779297e-06, -6.377696990966797e-06, -4.470348358154297e-06, -2.562999725341797e-06, -6.556510925292969e-07, 1.2516975402832031e-06, 3.159046173095703e-06, 5.066394805908203e-06, 6.973743438720703e-06, 8.881092071533203e-06, 1.0788440704345703e-05, 1.2695789337158203e-05, 1.4603137969970703e-05, 1.6510486602783203e-05, 1.8417835235595703e-05, 2.0325183868408203e-05, 2.2232532501220703e-05, 2.4139881134033203e-05, 2.6047229766845703e-05, 2.7954578399658203e-05, 2.9861927032470703e-05, 3.17692756652832e-05, 3.36766242980957e-05, 3.55839729309082e-05, 3.74913215637207e-05, 3.93986701965332e-05, 4.13060188293457e-05, 4.32133674621582e-05, 4.51207160949707e-05, 4.70280647277832e-05, 4.89354133605957e-05, 5.08427619934082e-05, 5.27501106262207e-05, 5.46574592590332e-05, 5.65648078918457e-05, 5.84721565246582e-05, 6.03795051574707e-05, 6.22868537902832e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 6.0, 8.0, 10.0, 15.0, 26.0, 36.0, 49.0, 125.0, 137.0, 223.0, 309.0, 492.0, 685.0, 990.0, 1581.0, 2379.0, 3538.0, 5601.0, 8873.0, 14249.0, 23150.0, 37342.0, 60822.0, 95998.0, 141436.0, 176679.0, 161734.0, 114460.0, 74515.0, 46379.0, 28529.0, 17469.0, 10874.0, 6890.0, 4435.0, 2913.0, 1895.0, 1247.0, 809.0, 546.0, 385.0, 284.0, 156.0, 97.0, 65.0, 39.0, 29.0, 20.0, 16.0, 11.0, 6.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.0390625, -1.0082473754882812, -0.9774322509765625, -0.9466171264648438, -0.915802001953125, -0.8849868774414062, -0.8541717529296875, -0.8233566284179688, -0.79254150390625, -0.7617263793945312, -0.7309112548828125, -0.7000961303710938, -0.669281005859375, -0.6384658813476562, -0.6076507568359375, -0.5768356323242188, -0.5460205078125, -0.5152053833007812, -0.4843902587890625, -0.45357513427734375, -0.422760009765625, -0.39194488525390625, -0.3611297607421875, -0.33031463623046875, -0.29949951171875, -0.26868438720703125, -0.2378692626953125, -0.20705413818359375, -0.176239013671875, -0.14542388916015625, -0.1146087646484375, -0.08379364013671875, -0.052978515625, -0.02216339111328125, 0.0086517333984375, 0.03946685791015625, 0.070281982421875, 0.10109710693359375, 0.1319122314453125, 0.16272735595703125, 0.19354248046875, 0.22435760498046875, 0.2551727294921875, 0.28598785400390625, 0.316802978515625, 0.34761810302734375, 0.3784332275390625, 0.40924835205078125, 0.4400634765625, 0.47087860107421875, 0.5016937255859375, 0.5325088500976562, 0.563323974609375, 0.5941390991210938, 0.6249542236328125, 0.6557693481445312, 0.68658447265625, 0.7173995971679688, 0.7482147216796875, 0.7790298461914062, 0.809844970703125, 0.8406600952148438, 0.8714752197265625, 0.9022903442382812, 0.93310546875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 12.0, 6.0, 11.0, 14.0, 13.0, 21.0, 32.0, 22.0, 39.0, 37.0, 50.0, 51.0, 63.0, 58.0, 62.0, 57.0, 67.0, 73.0, 51.0, 44.0, 41.0, 34.0, 25.0, 26.0, 15.0, 14.0, 7.0, 12.0, 6.0, 9.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.42626953125, -0.41493988037109375, -0.4036102294921875, -0.39228057861328125, -0.380950927734375, -0.36962127685546875, -0.3582916259765625, -0.34696197509765625, -0.33563232421875, -0.32430267333984375, -0.3129730224609375, -0.30164337158203125, -0.290313720703125, -0.27898406982421875, -0.2676544189453125, -0.25632476806640625, -0.2449951171875, -0.23366546630859375, -0.2223358154296875, -0.21100616455078125, -0.199676513671875, -0.18834686279296875, -0.1770172119140625, -0.16568756103515625, -0.15435791015625, -0.14302825927734375, -0.1316986083984375, -0.12036895751953125, -0.109039306640625, -0.09770965576171875, -0.0863800048828125, -0.07505035400390625, -0.063720703125, -0.05239105224609375, -0.0410614013671875, -0.02973175048828125, -0.018402099609375, -0.00707244873046875, 0.0042572021484375, 0.01558685302734375, 0.02691650390625, 0.03824615478515625, 0.0495758056640625, 0.06090545654296875, 0.072235107421875, 0.08356475830078125, 0.0948944091796875, 0.10622406005859375, 0.1175537109375, 0.12888336181640625, 0.1402130126953125, 0.15154266357421875, 0.162872314453125, 0.17420196533203125, 0.1855316162109375, 0.19686126708984375, 0.20819091796875, 0.21952056884765625, 0.2308502197265625, 0.24217987060546875, 0.253509521484375, 0.26483917236328125, 0.2761688232421875, 0.28749847412109375, 0.298828125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 15.0, 13.0, 18.0, 19.0, 25.0, 22.0, 41.0, 46.0, 46.0, 59.0, 55.0, 61.0, 67.0, 71.0, 64.0, 64.0, 56.0, 49.0, 42.0, 25.0, 30.0, 22.0, 24.0, 16.0, 14.0, 6.0, 9.0, 5.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.15614891052246, -18.554906845092773, -17.953664779663086, -17.3524227142334, -16.75118064880371, -16.149938583374023, -15.54869556427002, -14.947453498840332, -14.346211433410645, -13.744969367980957, -13.14372730255127, -12.542485237121582, -11.941242218017578, -11.34000015258789, -10.738758087158203, -10.137516021728516, -9.536273956298828, -8.93503189086914, -8.333789825439453, -7.732547283172607, -7.13130521774292, -6.530063152313232, -5.928820610046387, -5.327578544616699, -4.726336479187012, -4.125094413757324, -3.5238521099090576, -2.922609806060791, -2.3213677406311035, -1.720125675201416, -1.1188833713531494, -0.5176410675048828, 0.08359909057617188, 0.6848412752151489, 1.286083459854126, 1.887325644493103, 2.48856782913208, 3.0898098945617676, 3.691052198410034, 4.292294502258301, 4.893536567687988, 5.494778633117676, 6.096020698547363, 6.697263240814209, 7.2985053062438965, 7.899747371673584, 8.50098991394043, 9.102231979370117, 9.703474044799805, 10.304716110229492, 10.90595817565918, 11.507200241088867, 12.108442306518555, 12.709684371948242, 13.310927391052246, 13.912169456481934, 14.513411521911621, 15.114653587341309, 15.715895652770996, 16.317138671875, 16.918380737304688, 17.519622802734375, 18.120864868164062, 18.72210693359375, 19.323348999023438]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 5.0, 13.0, 14.0, 11.0, 15.0, 28.0, 23.0, 31.0, 36.0, 32.0, 34.0, 27.0, 35.0, 49.0, 35.0, 43.0, 43.0, 53.0, 49.0, 35.0, 40.0, 43.0, 22.0, 29.0, 35.0, 27.0, 29.0, 23.0, 24.0, 23.0, 12.0, 9.0, 14.0, 14.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.535992622375488, -9.236194610595703, -8.936395645141602, -8.636597633361816, -8.336799621582031, -8.03700065612793, -7.7372026443481445, -7.437404155731201, -7.137605667114258, -6.8378071784973145, -6.538008689880371, -6.238210678100586, -5.938412189483643, -5.638613700866699, -5.338815689086914, -5.039017200469971, -4.739218711853027, -4.439420223236084, -4.139621734619141, -3.8398237228393555, -3.540025234222412, -3.2402267456054688, -2.9404284954071045, -2.6406302452087402, -2.340831756591797, -2.0410332679748535, -1.7412350177764893, -1.4414366483688354, -1.1416382789611816, -0.8418399095535278, -0.542041540145874, -0.24224328994750977, 0.05755615234375, 0.3573545217514038, 0.6571528911590576, 0.9569512605667114, 1.2567496299743652, 1.556547999382019, 1.8563463687896729, 2.156144618988037, 2.4559431076049805, 2.755741596221924, 3.055539846420288, 3.3553380966186523, 3.6551365852355957, 3.954935073852539, 4.254733085632324, 4.554531574249268, 4.854330062866211, 5.154128551483154, 5.453927040100098, 5.753725051879883, 6.053523540496826, 6.3533220291137695, 6.653120040893555, 6.952918529510498, 7.252717018127441, 7.552515506744385, 7.852313995361328, 8.152112007141113, 8.451910018920898, 8.751708984375, 9.051506996154785, 9.35130500793457, 9.651103973388672]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 4.0, 11.0, 13.0, 15.0, 33.0, 56.0, 88.0, 138.0, 207.0, 392.0, 572.0, 911.0, 1456.0, 2196.0, 3570.0, 5439.0, 8601.0, 13214.0, 19416.0, 28758.0, 41176.0, 55934.0, 72959.0, 89410.0, 102147.0, 108620.0, 106156.0, 95348.0, 80253.0, 63297.0, 47706.0, 33548.0, 23081.0, 15527.0, 10178.0, 6672.0, 4170.0, 2610.0, 1795.0, 1052.0, 686.0, 415.0, 296.0, 181.0, 98.0, 65.0, 46.0, 20.0, 13.0, 2.0, 8.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2109375, -6.00189208984375, -5.7928466796875, -5.58380126953125, -5.374755859375, -5.16571044921875, -4.9566650390625, -4.74761962890625, -4.53857421875, -4.32952880859375, -4.1204833984375, -3.91143798828125, -3.702392578125, -3.49334716796875, -3.2843017578125, -3.07525634765625, -2.8662109375, -2.65716552734375, -2.4481201171875, -2.23907470703125, -2.030029296875, -1.82098388671875, -1.6119384765625, -1.40289306640625, -1.19384765625, -0.98480224609375, -0.7757568359375, -0.56671142578125, -0.357666015625, -0.14862060546875, 0.0604248046875, 0.26947021484375, 0.478515625, 0.68756103515625, 0.8966064453125, 1.10565185546875, 1.314697265625, 1.52374267578125, 1.7327880859375, 1.94183349609375, 2.15087890625, 2.35992431640625, 2.5689697265625, 2.77801513671875, 2.987060546875, 3.19610595703125, 3.4051513671875, 3.61419677734375, 3.8232421875, 4.03228759765625, 4.2413330078125, 4.45037841796875, 4.659423828125, 4.86846923828125, 5.0775146484375, 5.28656005859375, 5.49560546875, 5.70465087890625, 5.9136962890625, 6.12274169921875, 6.331787109375, 6.54083251953125, 6.7498779296875, 6.95892333984375, 7.16796875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 5.0, 9.0, 4.0, 6.0, 7.0, 5.0, 8.0, 15.0, 14.0, 16.0, 20.0, 13.0, 24.0, 29.0, 34.0, 37.0, 34.0, 40.0, 46.0, 38.0, 45.0, 43.0, 49.0, 49.0, 42.0, 38.0, 48.0, 41.0, 30.0, 20.0, 29.0, 25.0, 20.0, 19.0, 15.0, 20.0, 12.0, 9.0, 11.0, 11.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8203125, -10.4893798828125, -10.158447265625, -9.8275146484375, -9.49658203125, -9.1656494140625, -8.834716796875, -8.5037841796875, -8.1728515625, -7.8419189453125, -7.510986328125, -7.1800537109375, -6.84912109375, -6.5181884765625, -6.187255859375, -5.8563232421875, -5.525390625, -5.1944580078125, -4.863525390625, -4.5325927734375, -4.20166015625, -3.8707275390625, -3.539794921875, -3.2088623046875, -2.8779296875, -2.5469970703125, -2.216064453125, -1.8851318359375, -1.55419921875, -1.2232666015625, -0.892333984375, -0.5614013671875, -0.23046875, 0.1004638671875, 0.431396484375, 0.7623291015625, 1.09326171875, 1.4241943359375, 1.755126953125, 2.0860595703125, 2.4169921875, 2.7479248046875, 3.078857421875, 3.4097900390625, 3.74072265625, 4.0716552734375, 4.402587890625, 4.7335205078125, 5.064453125, 5.3953857421875, 5.726318359375, 6.0572509765625, 6.38818359375, 6.7191162109375, 7.050048828125, 7.3809814453125, 7.7119140625, 8.0428466796875, 8.373779296875, 8.7047119140625, 9.03564453125, 9.3665771484375, 9.697509765625, 10.0284423828125, 10.359375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 5.0, 3.0, 2.0, 5.0, 6.0, 8.0, 14.0, 28.0, 52.0, 93.0, 116.0, 216.0, 301.0, 541.0, 831.0, 1268.0, 2062.0, 3308.0, 5112.0, 7810.0, 11895.0, 17733.0, 25694.0, 36532.0, 50016.0, 64243.0, 80102.0, 93766.0, 101899.0, 103419.0, 97370.0, 85974.0, 70956.0, 55476.0, 41526.0, 29719.0, 20713.0, 13948.0, 9201.0, 6055.0, 3842.0, 2467.0, 1632.0, 995.0, 572.0, 414.0, 214.0, 164.0, 100.0, 60.0, 32.0, 24.0, 13.0, 9.0, 5.0, 4.0, 0.0, 3.0, 1.0, 2.0], "bins": [-6.875, -6.66790771484375, -6.4608154296875, -6.25372314453125, -6.046630859375, -5.83953857421875, -5.6324462890625, -5.42535400390625, -5.21826171875, -5.01116943359375, -4.8040771484375, -4.59698486328125, -4.389892578125, -4.18280029296875, -3.9757080078125, -3.76861572265625, -3.5615234375, -3.35443115234375, -3.1473388671875, -2.94024658203125, -2.733154296875, -2.52606201171875, -2.3189697265625, -2.11187744140625, -1.90478515625, -1.69769287109375, -1.4906005859375, -1.28350830078125, -1.076416015625, -0.86932373046875, -0.6622314453125, -0.45513916015625, -0.248046875, -0.04095458984375, 0.1661376953125, 0.37322998046875, 0.580322265625, 0.78741455078125, 0.9945068359375, 1.20159912109375, 1.40869140625, 1.61578369140625, 1.8228759765625, 2.02996826171875, 2.237060546875, 2.44415283203125, 2.6512451171875, 2.85833740234375, 3.0654296875, 3.27252197265625, 3.4796142578125, 3.68670654296875, 3.893798828125, 4.10089111328125, 4.3079833984375, 4.51507568359375, 4.72216796875, 4.92926025390625, 5.1363525390625, 5.34344482421875, 5.550537109375, 5.75762939453125, 5.9647216796875, 6.17181396484375, 6.37890625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 7.0, 6.0, 7.0, 12.0, 14.0, 19.0, 22.0, 28.0, 33.0, 23.0, 23.0, 35.0, 33.0, 32.0, 31.0, 40.0, 39.0, 32.0, 37.0, 41.0, 39.0, 34.0, 37.0, 33.0, 32.0, 28.0, 25.0, 26.0, 25.0, 21.0, 26.0, 17.0, 22.0, 12.0, 17.0, 12.0, 11.0, 10.0, 9.0, 8.0, 6.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.234375, -6.0472412109375, -5.860107421875, -5.6729736328125, -5.48583984375, -5.2987060546875, -5.111572265625, -4.9244384765625, -4.7373046875, -4.5501708984375, -4.363037109375, -4.1759033203125, -3.98876953125, -3.8016357421875, -3.614501953125, -3.4273681640625, -3.240234375, -3.0531005859375, -2.865966796875, -2.6788330078125, -2.49169921875, -2.3045654296875, -2.117431640625, -1.9302978515625, -1.7431640625, -1.5560302734375, -1.368896484375, -1.1817626953125, -0.99462890625, -0.8074951171875, -0.620361328125, -0.4332275390625, -0.24609375, -0.0589599609375, 0.128173828125, 0.3153076171875, 0.50244140625, 0.6895751953125, 0.876708984375, 1.0638427734375, 1.2509765625, 1.4381103515625, 1.625244140625, 1.8123779296875, 1.99951171875, 2.1866455078125, 2.373779296875, 2.5609130859375, 2.748046875, 2.9351806640625, 3.122314453125, 3.3094482421875, 3.49658203125, 3.6837158203125, 3.870849609375, 4.0579833984375, 4.2451171875, 4.4322509765625, 4.619384765625, 4.8065185546875, 4.99365234375, 5.1807861328125, 5.367919921875, 5.5550537109375, 5.7421875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 18.0, 25.0, 29.0, 44.0, 50.0, 83.0, 102.0, 182.0, 245.0, 375.0, 529.0, 765.0, 1093.0, 1609.0, 2428.0, 3663.0, 5535.0, 8484.0, 13132.0, 20544.0, 31759.0, 48456.0, 70666.0, 98125.0, 122331.0, 134959.0, 129700.0, 108251.0, 81796.0, 56419.0, 37636.0, 24221.0, 15699.0, 10010.0, 6419.0, 4329.0, 2764.0, 1914.0, 1328.0, 901.0, 589.0, 418.0, 282.0, 192.0, 137.0, 109.0, 62.0, 50.0, 45.0, 11.0, 15.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0], "bins": [-5.046875, -4.89251708984375, -4.7381591796875, -4.58380126953125, -4.429443359375, -4.27508544921875, -4.1207275390625, -3.96636962890625, -3.81201171875, -3.65765380859375, -3.5032958984375, -3.34893798828125, -3.194580078125, -3.04022216796875, -2.8858642578125, -2.73150634765625, -2.5771484375, -2.42279052734375, -2.2684326171875, -2.11407470703125, -1.959716796875, -1.80535888671875, -1.6510009765625, -1.49664306640625, -1.34228515625, -1.18792724609375, -1.0335693359375, -0.87921142578125, -0.724853515625, -0.57049560546875, -0.4161376953125, -0.26177978515625, -0.107421875, 0.04693603515625, 0.2012939453125, 0.35565185546875, 0.510009765625, 0.66436767578125, 0.8187255859375, 0.97308349609375, 1.12744140625, 1.28179931640625, 1.4361572265625, 1.59051513671875, 1.744873046875, 1.89923095703125, 2.0535888671875, 2.20794677734375, 2.3623046875, 2.51666259765625, 2.6710205078125, 2.82537841796875, 2.979736328125, 3.13409423828125, 3.2884521484375, 3.44281005859375, 3.59716796875, 3.75152587890625, 3.9058837890625, 4.06024169921875, 4.214599609375, 4.36895751953125, 4.5233154296875, 4.67767333984375, 4.83203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 9.0, 8.0, 7.0, 8.0, 13.0, 11.0, 21.0, 30.0, 25.0, 25.0, 41.0, 48.0, 52.0, 35.0, 51.0, 52.0, 51.0, 44.0, 55.0, 50.0, 43.0, 32.0, 28.0, 40.0, 32.0, 25.0, 29.0, 21.0, 19.0, 18.0, 18.0, 12.0, 8.0, 11.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0005507469177246094, -0.0005351752042770386, -0.0005196034908294678, -0.000504031777381897, -0.0004884600639343262, -0.00047288835048675537, -0.00045731663703918457, -0.00044174492359161377, -0.00042617321014404297, -0.00041060149669647217, -0.00039502978324890137, -0.00037945806980133057, -0.00036388635635375977, -0.00034831464290618896, -0.00033274292945861816, -0.00031717121601104736, -0.00030159950256347656, -0.00028602778911590576, -0.00027045607566833496, -0.00025488436222076416, -0.00023931264877319336, -0.00022374093532562256, -0.00020816922187805176, -0.00019259750843048096, -0.00017702579498291016, -0.00016145408153533936, -0.00014588236808776855, -0.00013031065464019775, -0.00011473894119262695, -9.916722774505615e-05, -8.359551429748535e-05, -6.802380084991455e-05, -5.245208740234375e-05, -3.688037395477295e-05, -2.130866050720215e-05, -5.736947059631348e-06, 9.834766387939453e-06, 2.5406479835510254e-05, 4.0978193283081055e-05, 5.6549906730651855e-05, 7.212162017822266e-05, 8.769333362579346e-05, 0.00010326504707336426, 0.00011883676052093506, 0.00013440847396850586, 0.00014998018741607666, 0.00016555190086364746, 0.00018112361431121826, 0.00019669532775878906, 0.00021226704120635986, 0.00022783875465393066, 0.00024341046810150146, 0.00025898218154907227, 0.00027455389499664307, 0.00029012560844421387, 0.00030569732189178467, 0.00032126903533935547, 0.00033684074878692627, 0.00035241246223449707, 0.00036798417568206787, 0.00038355588912963867, 0.00039912760257720947, 0.0004146993160247803, 0.0004302710294723511, 0.0004458427429199219]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 13.0, 17.0, 23.0, 33.0, 50.0, 94.0, 130.0, 229.0, 340.0, 588.0, 1082.0, 1762.0, 3332.0, 6296.0, 12396.0, 27239.0, 61164.0, 132458.0, 227393.0, 249234.0, 169664.0, 83378.0, 37167.0, 16635.0, 8134.0, 4175.0, 2278.0, 1285.0, 740.0, 423.0, 286.0, 169.0, 123.0, 66.0, 39.0, 31.0, 30.0, 9.0, 9.0, 8.0, 8.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6484375, -9.339111328125, -9.02978515625, -8.720458984375, -8.4111328125, -8.101806640625, -7.79248046875, -7.483154296875, -7.173828125, -6.864501953125, -6.55517578125, -6.245849609375, -5.9365234375, -5.627197265625, -5.31787109375, -5.008544921875, -4.69921875, -4.389892578125, -4.08056640625, -3.771240234375, -3.4619140625, -3.152587890625, -2.84326171875, -2.533935546875, -2.224609375, -1.915283203125, -1.60595703125, -1.296630859375, -0.9873046875, -0.677978515625, -0.36865234375, -0.059326171875, 0.25, 0.559326171875, 0.86865234375, 1.177978515625, 1.4873046875, 1.796630859375, 2.10595703125, 2.415283203125, 2.724609375, 3.033935546875, 3.34326171875, 3.652587890625, 3.9619140625, 4.271240234375, 4.58056640625, 4.889892578125, 5.19921875, 5.508544921875, 5.81787109375, 6.127197265625, 6.4365234375, 6.745849609375, 7.05517578125, 7.364501953125, 7.673828125, 7.983154296875, 8.29248046875, 8.601806640625, 8.9111328125, 9.220458984375, 9.52978515625, 9.839111328125, 10.1484375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 7.0, 12.0, 27.0, 24.0, 27.0, 33.0, 45.0, 36.0, 41.0, 49.0, 51.0, 65.0, 65.0, 68.0, 53.0, 60.0, 46.0, 51.0, 39.0, 27.0, 24.0, 24.0, 24.0, 20.0, 10.0, 8.0, 10.0, 10.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6875, -1.6324615478515625, -1.577423095703125, -1.5223846435546875, -1.46734619140625, -1.4123077392578125, -1.357269287109375, -1.3022308349609375, -1.2471923828125, -1.1921539306640625, -1.137115478515625, -1.0820770263671875, -1.02703857421875, -0.9720001220703125, -0.916961669921875, -0.8619232177734375, -0.806884765625, -0.7518463134765625, -0.696807861328125, -0.6417694091796875, -0.58673095703125, -0.5316925048828125, -0.476654052734375, -0.4216156005859375, -0.3665771484375, -0.3115386962890625, -0.256500244140625, -0.2014617919921875, -0.14642333984375, -0.0913848876953125, -0.036346435546875, 0.0186920166015625, 0.07373046875, 0.1287689208984375, 0.183807373046875, 0.2388458251953125, 0.29388427734375, 0.3489227294921875, 0.403961181640625, 0.4589996337890625, 0.5140380859375, 0.5690765380859375, 0.624114990234375, 0.6791534423828125, 0.73419189453125, 0.7892303466796875, 0.844268798828125, 0.8993072509765625, 0.954345703125, 1.0093841552734375, 1.064422607421875, 1.1194610595703125, 1.17449951171875, 1.2295379638671875, 1.284576416015625, 1.3396148681640625, 1.3946533203125, 1.4496917724609375, 1.504730224609375, 1.5597686767578125, 1.61480712890625, 1.6698455810546875, 1.724884033203125, 1.7799224853515625, 1.8349609375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 13.0, 9.0, 15.0, 16.0, 26.0, 31.0, 42.0, 48.0, 45.0, 45.0, 46.0, 69.0, 72.0, 62.0, 62.0, 60.0, 56.0, 50.0, 39.0, 43.0, 33.0, 23.0, 21.0, 15.0, 18.0, 9.0, 5.0, 6.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.22496795654297, -19.61767578125, -19.010385513305664, -18.403093338012695, -17.795801162719727, -17.18851089477539, -16.581218719482422, -15.973926544189453, -15.3666353225708, -14.759344100952148, -14.15205192565918, -13.544760704040527, -12.937469482421875, -12.330177307128906, -11.722886085510254, -11.115594863891602, -10.508302688598633, -9.90101146697998, -9.293719291687012, -8.68642807006836, -8.07913589477539, -7.471844673156738, -6.864553451538086, -6.257261753082275, -5.649970054626465, -5.042678356170654, -4.435386657714844, -3.8280954360961914, -3.220803737640381, -2.6135120391845703, -2.006220579147339, -1.3989291191101074, -0.7916393280029297, -0.1843477487564087, 0.4229438304901123, 1.0302354097366333, 1.6375269889831543, 2.244818687438965, 2.8521101474761963, 3.4594016075134277, 4.066693305969238, 4.673985004425049, 5.281276702880859, 5.888567924499512, 6.495859622955322, 7.103151321411133, 7.710442543029785, 8.317733764648438, 8.925025939941406, 9.532317161560059, 10.139609336853027, 10.74690055847168, 11.354192733764648, 11.9614839553833, 12.568775177001953, 13.176067352294922, 13.783358573913574, 14.390649795532227, 14.997941970825195, 15.605233192443848, 16.2125244140625, 16.81981658935547, 17.427108764648438, 18.034399032592773, 18.641691207885742]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 3.0, 4.0, 4.0, 11.0, 9.0, 18.0, 13.0, 20.0, 22.0, 27.0, 22.0, 27.0, 29.0, 28.0, 23.0, 24.0, 47.0, 37.0, 36.0, 41.0, 38.0, 40.0, 27.0, 42.0, 40.0, 33.0, 39.0, 32.0, 36.0, 27.0, 34.0, 20.0, 8.0, 16.0, 16.0, 20.0, 13.0, 12.0, 15.0, 12.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.019770622253418, -9.716050148010254, -9.41232967376709, -9.108609199523926, -8.804888725280762, -8.501168251037598, -8.197447776794434, -7.8937273025512695, -7.5900068283081055, -7.286286354064941, -6.982565879821777, -6.678845405578613, -6.375124931335449, -6.071404457092285, -5.767683982849121, -5.463963508605957, -5.160243034362793, -4.856522560119629, -4.552802085876465, -4.249081611633301, -3.9453611373901367, -3.6416406631469727, -3.3379201889038086, -3.0341997146606445, -2.7304792404174805, -2.4267587661743164, -2.1230382919311523, -1.8193178176879883, -1.5155973434448242, -1.2118768692016602, -0.9081563949584961, -0.604435920715332, -0.3007164001464844, 0.0030040740966796875, 0.30672454833984375, 0.6104450225830078, 0.9141654968261719, 1.217885971069336, 1.5216064453125, 1.825326919555664, 2.129047393798828, 2.432767868041992, 2.7364883422851562, 3.0402088165283203, 3.3439292907714844, 3.6476497650146484, 3.9513702392578125, 4.255090713500977, 4.558811187744141, 4.862531661987305, 5.166252136230469, 5.469972610473633, 5.773693084716797, 6.077413558959961, 6.381134033203125, 6.684854507446289, 6.988574981689453, 7.292295455932617, 7.596015930175781, 7.899736404418945, 8.20345687866211, 8.507177352905273, 8.810897827148438, 9.114618301391602, 9.418338775634766]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 12.0, 10.0, 32.0, 41.0, 74.0, 102.0, 188.0, 285.0, 494.0, 783.0, 1321.0, 2388.0, 3989.0, 7188.0, 12659.0, 22268.0, 38898.0, 68843.0, 118528.0, 197268.0, 307443.0, 445968.0, 564304.0, 613810.0, 562393.0, 440845.0, 306169.0, 196038.0, 118448.0, 68850.0, 40229.0, 23014.0, 13046.0, 7590.0, 4405.0, 2540.0, 1455.0, 890.0, 568.0, 367.0, 207.0, 124.0, 75.0, 43.0, 30.0, 25.0, 17.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0], "bins": [-14.296875, -13.8701171875, -13.443359375, -13.0166015625, -12.58984375, -12.1630859375, -11.736328125, -11.3095703125, -10.8828125, -10.4560546875, -10.029296875, -9.6025390625, -9.17578125, -8.7490234375, -8.322265625, -7.8955078125, -7.46875, -7.0419921875, -6.615234375, -6.1884765625, -5.76171875, -5.3349609375, -4.908203125, -4.4814453125, -4.0546875, -3.6279296875, -3.201171875, -2.7744140625, -2.34765625, -1.9208984375, -1.494140625, -1.0673828125, -0.640625, -0.2138671875, 0.212890625, 0.6396484375, 1.06640625, 1.4931640625, 1.919921875, 2.3466796875, 2.7734375, 3.2001953125, 3.626953125, 4.0537109375, 4.48046875, 4.9072265625, 5.333984375, 5.7607421875, 6.1875, 6.6142578125, 7.041015625, 7.4677734375, 7.89453125, 8.3212890625, 8.748046875, 9.1748046875, 9.6015625, 10.0283203125, 10.455078125, 10.8818359375, 11.30859375, 11.7353515625, 12.162109375, 12.5888671875, 13.015625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 6.0, 7.0, 10.0, 9.0, 21.0, 15.0, 18.0, 29.0, 28.0, 37.0, 31.0, 28.0, 42.0, 25.0, 30.0, 40.0, 49.0, 35.0, 42.0, 44.0, 34.0, 29.0, 26.0, 45.0, 33.0, 29.0, 27.0, 33.0, 16.0, 19.0, 18.0, 19.0, 22.0, 11.0, 5.0, 13.0, 11.0, 10.0, 9.0, 8.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.46875, -8.2076416015625, -7.946533203125, -7.6854248046875, -7.42431640625, -7.1632080078125, -6.902099609375, -6.6409912109375, -6.3798828125, -6.1187744140625, -5.857666015625, -5.5965576171875, -5.33544921875, -5.0743408203125, -4.813232421875, -4.5521240234375, -4.291015625, -4.0299072265625, -3.768798828125, -3.5076904296875, -3.24658203125, -2.9854736328125, -2.724365234375, -2.4632568359375, -2.2021484375, -1.9410400390625, -1.679931640625, -1.4188232421875, -1.15771484375, -0.8966064453125, -0.635498046875, -0.3743896484375, -0.11328125, 0.1478271484375, 0.408935546875, 0.6700439453125, 0.93115234375, 1.1922607421875, 1.453369140625, 1.7144775390625, 1.9755859375, 2.2366943359375, 2.497802734375, 2.7589111328125, 3.02001953125, 3.2811279296875, 3.542236328125, 3.8033447265625, 4.064453125, 4.3255615234375, 4.586669921875, 4.8477783203125, 5.10888671875, 5.3699951171875, 5.631103515625, 5.8922119140625, 6.1533203125, 6.4144287109375, 6.675537109375, 6.9366455078125, 7.19775390625, 7.4588623046875, 7.719970703125, 7.9810791015625, 8.2421875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 2.0, 8.0, 9.0, 9.0, 18.0, 33.0, 38.0, 75.0, 109.0, 204.0, 329.0, 502.0, 882.0, 1440.0, 2400.0, 4018.0, 6767.0, 11386.0, 19194.0, 32096.0, 52913.0, 85351.0, 133846.0, 201853.0, 289712.0, 385963.0, 467413.0, 510493.0, 500138.0, 435323.0, 343971.0, 249827.0, 171025.0, 110802.0, 69462.0, 42497.0, 26002.0, 15606.0, 9127.0, 5362.0, 3150.0, 1935.0, 1185.0, 683.0, 416.0, 268.0, 161.0, 120.0, 59.0, 36.0, 24.0, 21.0, 7.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-13.8984375, -13.461181640625, -13.02392578125, -12.586669921875, -12.1494140625, -11.712158203125, -11.27490234375, -10.837646484375, -10.400390625, -9.963134765625, -9.52587890625, -9.088623046875, -8.6513671875, -8.214111328125, -7.77685546875, -7.339599609375, -6.90234375, -6.465087890625, -6.02783203125, -5.590576171875, -5.1533203125, -4.716064453125, -4.27880859375, -3.841552734375, -3.404296875, -2.967041015625, -2.52978515625, -2.092529296875, -1.6552734375, -1.218017578125, -0.78076171875, -0.343505859375, 0.09375, 0.531005859375, 0.96826171875, 1.405517578125, 1.8427734375, 2.280029296875, 2.71728515625, 3.154541015625, 3.591796875, 4.029052734375, 4.46630859375, 4.903564453125, 5.3408203125, 5.778076171875, 6.21533203125, 6.652587890625, 7.08984375, 7.527099609375, 7.96435546875, 8.401611328125, 8.8388671875, 9.276123046875, 9.71337890625, 10.150634765625, 10.587890625, 11.025146484375, 11.46240234375, 11.899658203125, 12.3369140625, 12.774169921875, 13.21142578125, 13.648681640625, 14.0859375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 10.0, 13.0, 10.0, 16.0, 17.0, 19.0, 26.0, 29.0, 42.0, 43.0, 74.0, 63.0, 79.0, 104.0, 125.0, 143.0, 158.0, 172.0, 184.0, 192.0, 221.0, 196.0, 204.0, 212.0, 214.0, 185.0, 171.0, 166.0, 143.0, 150.0, 110.0, 114.0, 95.0, 65.0, 62.0, 54.0, 44.0, 34.0, 25.0, 27.0, 16.0, 8.0, 6.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.26171875, -5.09820556640625, -4.9346923828125, -4.77117919921875, -4.607666015625, -4.44415283203125, -4.2806396484375, -4.11712646484375, -3.95361328125, -3.79010009765625, -3.6265869140625, -3.46307373046875, -3.299560546875, -3.13604736328125, -2.9725341796875, -2.80902099609375, -2.6455078125, -2.48199462890625, -2.3184814453125, -2.15496826171875, -1.991455078125, -1.82794189453125, -1.6644287109375, -1.50091552734375, -1.33740234375, -1.17388916015625, -1.0103759765625, -0.84686279296875, -0.683349609375, -0.51983642578125, -0.3563232421875, -0.19281005859375, -0.029296875, 0.13421630859375, 0.2977294921875, 0.46124267578125, 0.624755859375, 0.78826904296875, 0.9517822265625, 1.11529541015625, 1.27880859375, 1.44232177734375, 1.6058349609375, 1.76934814453125, 1.932861328125, 2.09637451171875, 2.2598876953125, 2.42340087890625, 2.5869140625, 2.75042724609375, 2.9139404296875, 3.07745361328125, 3.240966796875, 3.40447998046875, 3.5679931640625, 3.73150634765625, 3.89501953125, 4.05853271484375, 4.2220458984375, 4.38555908203125, 4.549072265625, 4.71258544921875, 4.8760986328125, 5.03961181640625, 5.203125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 8.0, 4.0, 10.0, 13.0, 11.0, 15.0, 15.0, 23.0, 20.0, 37.0, 41.0, 29.0, 43.0, 44.0, 48.0, 46.0, 40.0, 58.0, 42.0, 59.0, 57.0, 41.0, 46.0, 34.0, 31.0, 26.0, 30.0, 15.0, 17.0, 18.0, 13.0, 16.0, 12.0, 6.0, 6.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-21.039783477783203, -20.453575134277344, -19.86736488342285, -19.281156539916992, -18.6949462890625, -18.10873794555664, -17.52252960205078, -16.936321258544922, -16.35011100769043, -15.763901710510254, -15.177692413330078, -14.591484069824219, -14.005274772644043, -13.419065475463867, -12.832857131958008, -12.246647834777832, -11.660438537597656, -11.07422924041748, -10.488019943237305, -9.901811599731445, -9.31560230255127, -8.729393005371094, -8.143184661865234, -7.556975364685059, -6.970766067504883, -6.384556770324707, -5.7983479499816895, -5.212139129638672, -4.625929832458496, -4.03972053527832, -3.4535117149353027, -2.867302894592285, -2.2810935974121094, -1.6948845386505127, -1.108675479888916, -0.5224664211273193, 0.06374263763427734, 0.649951696395874, 1.2361607551574707, 1.8223695755004883, 2.408578872680664, 2.9947879314422607, 3.5809969902038574, 4.167205810546875, 4.753415107727051, 5.339624404907227, 5.925833225250244, 6.512042045593262, 7.0982513427734375, 7.684460639953613, 8.270669937133789, 8.856878280639648, 9.443087577819824, 10.029296875, 10.61550521850586, 11.201714515686035, 11.787923812866211, 12.374133110046387, 12.960342407226562, 13.546550750732422, 14.132760047912598, 14.718969345092773, 15.305177688598633, 15.891386985778809, 16.477596282958984]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 3.0, 8.0, 11.0, 13.0, 13.0, 14.0, 13.0, 19.0, 20.0, 28.0, 25.0, 37.0, 38.0, 30.0, 33.0, 45.0, 50.0, 53.0, 46.0, 38.0, 37.0, 48.0, 36.0, 52.0, 46.0, 30.0, 33.0, 28.0, 20.0, 16.0, 22.0, 19.0, 16.0, 10.0, 11.0, 14.0, 9.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.202217102050781, -12.773894309997559, -12.345572471618652, -11.91724967956543, -11.488926887512207, -11.0606050491333, -10.632282257080078, -10.203960418701172, -9.77563762664795, -9.347314834594727, -8.91899299621582, -8.490670204162598, -8.062347412109375, -7.634025573730469, -7.205702781677246, -6.777380466461182, -6.349057674407959, -5.9207353591918945, -5.492412567138672, -5.064090251922607, -4.635767936706543, -4.20744514465332, -3.779122829437256, -3.3508005142211914, -2.922477960586548, -2.4941554069519043, -2.06583309173584, -1.6375105381011963, -1.2091881036758423, -0.7808656692504883, -0.3525431156158447, 0.07577919960021973, 0.5041017532348633, 0.9324241876602173, 1.3607466220855713, 1.7890691757202148, 2.2173914909362793, 2.645714044570923, 3.0740365982055664, 3.502358913421631, 3.9306814670562744, 4.359004020690918, 4.787326335906982, 5.215648651123047, 5.6439714431762695, 6.072293758392334, 6.500616073608398, 6.928938865661621, 7.3572611808776855, 7.78558349609375, 8.213906288146973, 8.642229080200195, 9.070550918579102, 9.498873710632324, 9.927196502685547, 10.355518341064453, 10.783841133117676, 11.212163925170898, 11.640485763549805, 12.068808555603027, 12.49713134765625, 12.925453186035156, 13.353775978088379, 13.782098770141602, 14.210420608520508]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 5.0, 11.0, 18.0, 19.0, 29.0, 37.0, 72.0, 118.0, 178.0, 262.0, 415.0, 689.0, 1070.0, 1673.0, 2586.0, 4268.0, 7029.0, 11442.0, 18426.0, 29477.0, 47022.0, 72661.0, 106616.0, 142223.0, 158687.0, 142219.0, 105747.0, 72181.0, 46524.0, 29222.0, 18245.0, 11141.0, 6918.0, 4232.0, 2605.0, 1646.0, 1012.0, 660.0, 419.0, 265.0, 192.0, 95.0, 67.0, 44.0, 38.0, 14.0, 20.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.16796875, -3.070465087890625, -2.97296142578125, -2.875457763671875, -2.7779541015625, -2.680450439453125, -2.58294677734375, -2.485443115234375, -2.387939453125, -2.290435791015625, -2.19293212890625, -2.095428466796875, -1.9979248046875, -1.900421142578125, -1.80291748046875, -1.705413818359375, -1.60791015625, -1.510406494140625, -1.41290283203125, -1.315399169921875, -1.2178955078125, -1.120391845703125, -1.02288818359375, -0.925384521484375, -0.827880859375, -0.730377197265625, -0.63287353515625, -0.535369873046875, -0.4378662109375, -0.340362548828125, -0.24285888671875, -0.145355224609375, -0.0478515625, 0.049652099609375, 0.14715576171875, 0.244659423828125, 0.3421630859375, 0.439666748046875, 0.53717041015625, 0.634674072265625, 0.732177734375, 0.829681396484375, 0.92718505859375, 1.024688720703125, 1.1221923828125, 1.219696044921875, 1.31719970703125, 1.414703369140625, 1.51220703125, 1.609710693359375, 1.70721435546875, 1.804718017578125, 1.9022216796875, 1.999725341796875, 2.09722900390625, 2.194732666015625, 2.292236328125, 2.389739990234375, 2.48724365234375, 2.584747314453125, 2.6822509765625, 2.779754638671875, 2.87725830078125, 2.974761962890625, 3.072265625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 7.0, 4.0, 3.0, 5.0, 13.0, 18.0, 14.0, 15.0, 21.0, 21.0, 13.0, 22.0, 42.0, 28.0, 48.0, 38.0, 44.0, 52.0, 45.0, 51.0, 44.0, 47.0, 48.0, 34.0, 43.0, 24.0, 22.0, 26.0, 18.0, 31.0, 31.0, 22.0, 20.0, 10.0, 16.0, 13.0, 11.0, 13.0, 3.0, 6.0, 3.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.203125, -14.7589111328125, -14.314697265625, -13.8704833984375, -13.42626953125, -12.9820556640625, -12.537841796875, -12.0936279296875, -11.6494140625, -11.2052001953125, -10.760986328125, -10.3167724609375, -9.87255859375, -9.4283447265625, -8.984130859375, -8.5399169921875, -8.095703125, -7.6514892578125, -7.207275390625, -6.7630615234375, -6.31884765625, -5.8746337890625, -5.430419921875, -4.9862060546875, -4.5419921875, -4.0977783203125, -3.653564453125, -3.2093505859375, -2.76513671875, -2.3209228515625, -1.876708984375, -1.4324951171875, -0.98828125, -0.5440673828125, -0.099853515625, 0.3443603515625, 0.78857421875, 1.2327880859375, 1.677001953125, 2.1212158203125, 2.5654296875, 3.0096435546875, 3.453857421875, 3.8980712890625, 4.34228515625, 4.7864990234375, 5.230712890625, 5.6749267578125, 6.119140625, 6.5633544921875, 7.007568359375, 7.4517822265625, 7.89599609375, 8.3402099609375, 8.784423828125, 9.2286376953125, 9.6728515625, 10.1170654296875, 10.561279296875, 11.0054931640625, 11.44970703125, 11.8939208984375, 12.338134765625, 12.7823486328125, 13.2265625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 0.0, 1.0, 2.0, 4.0, 12.0, 16.0, 12.0, 19.0, 24.0, 40.0, 56.0, 81.0, 102.0, 164.0, 222.0, 392.0, 687.0, 963.0, 1656.0, 2673.0, 4446.0, 7953.0, 13944.0, 24985.0, 44905.0, 79843.0, 132294.0, 186474.0, 193491.0, 145198.0, 90729.0, 50903.0, 28535.0, 15868.0, 8945.0, 5076.0, 3022.0, 1734.0, 1115.0, 674.0, 419.0, 288.0, 181.0, 127.0, 84.0, 65.0, 42.0, 29.0, 24.0, 13.0, 12.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.97265625, -3.84893798828125, -3.7252197265625, -3.60150146484375, -3.477783203125, -3.35406494140625, -3.2303466796875, -3.10662841796875, -2.98291015625, -2.85919189453125, -2.7354736328125, -2.61175537109375, -2.488037109375, -2.36431884765625, -2.2406005859375, -2.11688232421875, -1.9931640625, -1.86944580078125, -1.7457275390625, -1.62200927734375, -1.498291015625, -1.37457275390625, -1.2508544921875, -1.12713623046875, -1.00341796875, -0.87969970703125, -0.7559814453125, -0.63226318359375, -0.508544921875, -0.38482666015625, -0.2611083984375, -0.13739013671875, -0.013671875, 0.11004638671875, 0.2337646484375, 0.35748291015625, 0.481201171875, 0.60491943359375, 0.7286376953125, 0.85235595703125, 0.97607421875, 1.09979248046875, 1.2235107421875, 1.34722900390625, 1.470947265625, 1.59466552734375, 1.7183837890625, 1.84210205078125, 1.9658203125, 2.08953857421875, 2.2132568359375, 2.33697509765625, 2.460693359375, 2.58441162109375, 2.7081298828125, 2.83184814453125, 2.95556640625, 3.07928466796875, 3.2030029296875, 3.32672119140625, 3.450439453125, 3.57415771484375, 3.6978759765625, 3.82159423828125, 3.9453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 3.0, 6.0, 5.0, 16.0, 10.0, 14.0, 12.0, 20.0, 18.0, 24.0, 15.0, 26.0, 21.0, 36.0, 36.0, 33.0, 35.0, 33.0, 43.0, 51.0, 45.0, 42.0, 37.0, 36.0, 40.0, 26.0, 42.0, 45.0, 24.0, 41.0, 23.0, 18.0, 19.0, 15.0, 20.0, 16.0, 8.0, 7.0, 6.0, 4.0, 6.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7109375, -7.453857421875, -7.19677734375, -6.939697265625, -6.6826171875, -6.425537109375, -6.16845703125, -5.911376953125, -5.654296875, -5.397216796875, -5.14013671875, -4.883056640625, -4.6259765625, -4.368896484375, -4.11181640625, -3.854736328125, -3.59765625, -3.340576171875, -3.08349609375, -2.826416015625, -2.5693359375, -2.312255859375, -2.05517578125, -1.798095703125, -1.541015625, -1.283935546875, -1.02685546875, -0.769775390625, -0.5126953125, -0.255615234375, 0.00146484375, 0.258544921875, 0.515625, 0.772705078125, 1.02978515625, 1.286865234375, 1.5439453125, 1.801025390625, 2.05810546875, 2.315185546875, 2.572265625, 2.829345703125, 3.08642578125, 3.343505859375, 3.6005859375, 3.857666015625, 4.11474609375, 4.371826171875, 4.62890625, 4.885986328125, 5.14306640625, 5.400146484375, 5.6572265625, 5.914306640625, 6.17138671875, 6.428466796875, 6.685546875, 6.942626953125, 7.19970703125, 7.456787109375, 7.7138671875, 7.970947265625, 8.22802734375, 8.485107421875, 8.7421875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 18.0, 17.0, 33.0, 43.0, 66.0, 123.0, 177.0, 287.0, 537.0, 854.0, 1468.0, 2644.0, 4654.0, 8816.0, 17733.0, 37231.0, 81231.0, 168609.0, 267919.0, 226902.0, 119898.0, 55811.0, 25950.0, 12560.0, 6578.0, 3567.0, 1960.0, 1118.0, 647.0, 413.0, 251.0, 152.0, 79.0, 65.0, 39.0, 35.0, 18.0, 12.0, 4.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.4755859375, -1.433135986328125, -1.39068603515625, -1.348236083984375, -1.3057861328125, -1.263336181640625, -1.22088623046875, -1.178436279296875, -1.135986328125, -1.093536376953125, -1.05108642578125, -1.008636474609375, -0.9661865234375, -0.923736572265625, -0.88128662109375, -0.838836669921875, -0.79638671875, -0.753936767578125, -0.71148681640625, -0.669036865234375, -0.6265869140625, -0.584136962890625, -0.54168701171875, -0.499237060546875, -0.456787109375, -0.414337158203125, -0.37188720703125, -0.329437255859375, -0.2869873046875, -0.244537353515625, -0.20208740234375, -0.159637451171875, -0.1171875, -0.074737548828125, -0.03228759765625, 0.010162353515625, 0.0526123046875, 0.095062255859375, 0.13751220703125, 0.179962158203125, 0.222412109375, 0.264862060546875, 0.30731201171875, 0.349761962890625, 0.3922119140625, 0.434661865234375, 0.47711181640625, 0.519561767578125, 0.56201171875, 0.604461669921875, 0.64691162109375, 0.689361572265625, 0.7318115234375, 0.774261474609375, 0.81671142578125, 0.859161376953125, 0.901611328125, 0.944061279296875, 0.98651123046875, 1.028961181640625, 1.0714111328125, 1.113861083984375, 1.15631103515625, 1.198760986328125, 1.2412109375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 3.0, 12.0, 3.0, 12.0, 17.0, 11.0, 19.0, 13.0, 24.0, 27.0, 29.0, 34.0, 36.0, 46.0, 45.0, 46.0, 53.0, 47.0, 49.0, 49.0, 52.0, 47.0, 25.0, 39.0, 26.0, 34.0, 45.0, 31.0, 16.0, 22.0, 16.0, 13.0, 11.0, 12.0, 10.0, 2.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.561113357543945e-05, -5.3705647587776184e-05, -5.1800161600112915e-05, -4.9894675612449646e-05, -4.798918962478638e-05, -4.608370363712311e-05, -4.417821764945984e-05, -4.227273166179657e-05, -4.03672456741333e-05, -3.846175968647003e-05, -3.655627369880676e-05, -3.4650787711143494e-05, -3.2745301723480225e-05, -3.0839815735816956e-05, -2.8934329748153687e-05, -2.7028843760490417e-05, -2.512335777282715e-05, -2.321787178516388e-05, -2.131238579750061e-05, -1.940689980983734e-05, -1.7501413822174072e-05, -1.5595927834510803e-05, -1.3690441846847534e-05, -1.1784955859184265e-05, -9.879469871520996e-06, -7.973983883857727e-06, -6.068497896194458e-06, -4.163011908531189e-06, -2.25752592086792e-06, -3.520399332046509e-07, 1.5534460544586182e-06, 3.458932042121887e-06, 5.364418029785156e-06, 7.269904017448425e-06, 9.175390005111694e-06, 1.1080875992774963e-05, 1.2986361980438232e-05, 1.4891847968101501e-05, 1.679733395576477e-05, 1.870281994342804e-05, 2.060830593109131e-05, 2.2513791918754578e-05, 2.4419277906417847e-05, 2.6324763894081116e-05, 2.8230249881744385e-05, 3.0135735869407654e-05, 3.204122185707092e-05, 3.394670784473419e-05, 3.585219383239746e-05, 3.775767982006073e-05, 3.9663165807724e-05, 4.156865179538727e-05, 4.347413778305054e-05, 4.5379623770713806e-05, 4.7285109758377075e-05, 4.9190595746040344e-05, 5.109608173370361e-05, 5.300156772136688e-05, 5.490705370903015e-05, 5.681253969669342e-05, 5.871802568435669e-05, 6.062351167201996e-05, 6.252899765968323e-05, 6.44344836473465e-05, 6.633996963500977e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 6.0, 14.0, 11.0, 32.0, 24.0, 48.0, 81.0, 120.0, 207.0, 324.0, 601.0, 937.0, 1614.0, 2886.0, 4894.0, 8590.0, 15053.0, 27261.0, 49293.0, 89762.0, 156236.0, 221914.0, 195584.0, 121477.0, 66977.0, 36878.0, 20604.0, 11484.0, 6445.0, 3782.0, 2135.0, 1299.0, 767.0, 464.0, 288.0, 160.0, 95.0, 48.0, 39.0, 38.0, 18.0, 13.0, 13.0, 11.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.6826171875, -1.6279144287109375, -1.573211669921875, -1.5185089111328125, -1.46380615234375, -1.4091033935546875, -1.354400634765625, -1.2996978759765625, -1.2449951171875, -1.1902923583984375, -1.135589599609375, -1.0808868408203125, -1.02618408203125, -0.9714813232421875, -0.916778564453125, -0.8620758056640625, -0.807373046875, -0.7526702880859375, -0.697967529296875, -0.6432647705078125, -0.58856201171875, -0.5338592529296875, -0.479156494140625, -0.4244537353515625, -0.3697509765625, -0.3150482177734375, -0.260345458984375, -0.2056427001953125, -0.15093994140625, -0.0962371826171875, -0.041534423828125, 0.0131683349609375, 0.06787109375, 0.1225738525390625, 0.177276611328125, 0.2319793701171875, 0.28668212890625, 0.3413848876953125, 0.396087646484375, 0.4507904052734375, 0.5054931640625, 0.5601959228515625, 0.614898681640625, 0.6696014404296875, 0.72430419921875, 0.7790069580078125, 0.833709716796875, 0.8884124755859375, 0.943115234375, 0.9978179931640625, 1.052520751953125, 1.1072235107421875, 1.16192626953125, 1.2166290283203125, 1.271331787109375, 1.3260345458984375, 1.3807373046875, 1.4354400634765625, 1.490142822265625, 1.5448455810546875, 1.59954833984375, 1.6542510986328125, 1.708953857421875, 1.7636566162109375, 1.818359375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 8.0, 2.0, 14.0, 14.0, 17.0, 13.0, 15.0, 18.0, 25.0, 34.0, 38.0, 46.0, 64.0, 61.0, 73.0, 66.0, 74.0, 57.0, 60.0, 41.0, 40.0, 40.0, 28.0, 18.0, 16.0, 21.0, 19.0, 15.0, 9.0, 7.0, 7.0, 5.0, 4.0, 5.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.474853515625, -0.4608192443847656, -0.44678497314453125, -0.4327507019042969, -0.4187164306640625, -0.4046821594238281, -0.39064788818359375, -0.3766136169433594, -0.362579345703125, -0.3485450744628906, -0.33451080322265625, -0.3204765319824219, -0.3064422607421875, -0.2924079895019531, -0.27837371826171875, -0.2643394470214844, -0.25030517578125, -0.23627090454101562, -0.22223663330078125, -0.20820236206054688, -0.1941680908203125, -0.18013381958007812, -0.16609954833984375, -0.15206527709960938, -0.138031005859375, -0.12399673461914062, -0.10996246337890625, -0.09592819213867188, -0.0818939208984375, -0.06785964965820312, -0.05382537841796875, -0.039791107177734375, -0.0257568359375, -0.011722564697265625, 0.00231170654296875, 0.016345977783203125, 0.0303802490234375, 0.044414520263671875, 0.05844879150390625, 0.07248306274414062, 0.086517333984375, 0.10055160522460938, 0.11458587646484375, 0.12862014770507812, 0.1426544189453125, 0.15668869018554688, 0.17072296142578125, 0.18475723266601562, 0.19879150390625, 0.21282577514648438, 0.22686004638671875, 0.24089431762695312, 0.2549285888671875, 0.2689628601074219, 0.28299713134765625, 0.2970314025878906, 0.311065673828125, 0.3250999450683594, 0.33913421630859375, 0.3531684875488281, 0.3672027587890625, 0.3812370300292969, 0.39527130126953125, 0.4093055725097656, 0.42333984375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 10.0, 2.0, 9.0, 14.0, 13.0, 12.0, 17.0, 23.0, 28.0, 31.0, 36.0, 37.0, 37.0, 44.0, 55.0, 33.0, 51.0, 45.0, 43.0, 57.0, 54.0, 44.0, 40.0, 40.0, 26.0, 34.0, 25.0, 21.0, 19.0, 15.0, 15.0, 12.0, 14.0, 9.0, 5.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-19.99135398864746, -19.419038772583008, -18.846721649169922, -18.27440643310547, -17.702089309692383, -17.12977409362793, -16.557456970214844, -15.98514175415039, -15.412824630737305, -14.840508460998535, -14.268192291259766, -13.695876121520996, -13.123559951782227, -12.551243782043457, -11.978927612304688, -11.406612396240234, -10.834296226501465, -10.261980056762695, -9.689663887023926, -9.117347717285156, -8.545031547546387, -7.972715377807617, -7.400399684906006, -6.828083515167236, -6.255767345428467, -5.683451175689697, -5.111135005950928, -4.538819313049316, -3.9665029048919678, -3.3941867351531982, -2.821870803833008, -2.2495546340942383, -1.6772384643554688, -1.1049222946166992, -0.5326062440872192, 0.03970980644226074, 0.6120259761810303, 1.1843421459197998, 1.7566580772399902, 2.3289742469787598, 2.9012904167175293, 3.473606586456299, 4.045922756195068, 4.61823844909668, 5.190554618835449, 5.762870788574219, 6.335186958312988, 6.907503128051758, 7.479819297790527, 8.052135467529297, 8.624451637268066, 9.196767807006836, 9.769083976745605, 10.341400146484375, 10.913715362548828, 11.486032485961914, 12.058347702026367, 12.630663871765137, 13.202980041503906, 13.775296211242676, 14.347612380981445, 14.919928550720215, 15.492244720458984, 16.064559936523438, 16.636877059936523]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 10.0, 10.0, 12.0, 13.0, 16.0, 12.0, 19.0, 18.0, 29.0, 26.0, 35.0, 38.0, 30.0, 37.0, 47.0, 50.0, 51.0, 41.0, 47.0, 37.0, 42.0, 43.0, 47.0, 46.0, 30.0, 33.0, 28.0, 21.0, 21.0, 14.0, 22.0, 14.0, 10.0, 12.0, 14.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.306718826293945, -12.876669883728027, -12.44662094116211, -12.016571998596191, -11.586523056030273, -11.156474113464355, -10.726425170898438, -10.296377182006836, -9.866327285766602, -9.436278343200684, -9.006229400634766, -8.576180458068848, -8.14613151550293, -7.716082572937012, -7.286034107208252, -6.855985164642334, -6.425936698913574, -5.995887756347656, -5.565838813781738, -5.13578987121582, -4.705740928649902, -4.275691986083984, -3.8456435203552246, -3.4155945777893066, -2.9855456352233887, -2.5554966926574707, -2.1254477500915527, -1.6953990459442139, -1.265350103378296, -0.8353011608123779, -0.40525245666503906, 0.024796485900878906, 0.45484447479248047, 0.8848933577537537, 1.3149422407150269, 1.7449910640716553, 2.1750400066375732, 2.605088949203491, 3.03513765335083, 3.465186595916748, 3.895235538482666, 4.325284481048584, 4.755333423614502, 5.185381889343262, 5.61543083190918, 6.045479774475098, 6.475528717041016, 6.905577659606934, 7.335626602172852, 7.7656755447387695, 8.195724487304688, 8.625773429870605, 9.055822372436523, 9.485871315002441, 9.91592025756836, 10.345968246459961, 10.776018142700195, 11.206067085266113, 11.636116027832031, 12.06616497039795, 12.496213912963867, 12.926262855529785, 13.356311798095703, 13.786359786987305, 14.216408729553223]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 7.0, 7.0, 16.0, 27.0, 33.0, 53.0, 91.0, 159.0, 242.0, 408.0, 663.0, 1013.0, 1672.0, 2530.0, 3943.0, 6005.0, 9105.0, 13642.0, 19976.0, 28699.0, 40146.0, 53619.0, 69255.0, 84313.0, 96024.0, 103168.0, 101789.0, 94253.0, 81184.0, 66234.0, 50732.0, 37775.0, 26572.0, 18736.0, 12488.0, 8500.0, 5605.0, 3541.0, 2292.0, 1498.0, 908.0, 621.0, 337.0, 273.0, 157.0, 92.0, 59.0, 42.0, 22.0, 13.0, 10.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.2421875, -7.0078125, -6.7734375, -6.5390625, -6.3046875, -6.0703125, -5.8359375, -5.6015625, -5.3671875, -5.1328125, -4.8984375, -4.6640625, -4.4296875, -4.1953125, -3.9609375, -3.7265625, -3.4921875, -3.2578125, -3.0234375, -2.7890625, -2.5546875, -2.3203125, -2.0859375, -1.8515625, -1.6171875, -1.3828125, -1.1484375, -0.9140625, -0.6796875, -0.4453125, -0.2109375, 0.0234375, 0.2578125, 0.4921875, 0.7265625, 0.9609375, 1.1953125, 1.4296875, 1.6640625, 1.8984375, 2.1328125, 2.3671875, 2.6015625, 2.8359375, 3.0703125, 3.3046875, 3.5390625, 3.7734375, 4.0078125, 4.2421875, 4.4765625, 4.7109375, 4.9453125, 5.1796875, 5.4140625, 5.6484375, 5.8828125, 6.1171875, 6.3515625, 6.5859375, 6.8203125, 7.0546875, 7.2890625, 7.5234375, 7.7578125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 12.0, 10.0, 5.0, 9.0, 10.0, 24.0, 26.0, 25.0, 30.0, 29.0, 32.0, 39.0, 32.0, 34.0, 46.0, 48.0, 51.0, 55.0, 41.0, 40.0, 46.0, 29.0, 43.0, 44.0, 37.0, 36.0, 27.0, 28.0, 18.0, 12.0, 14.0, 14.0, 13.0, 10.0, 8.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8515625, -14.38623046875, -13.9208984375, -13.45556640625, -12.990234375, -12.52490234375, -12.0595703125, -11.59423828125, -11.12890625, -10.66357421875, -10.1982421875, -9.73291015625, -9.267578125, -8.80224609375, -8.3369140625, -7.87158203125, -7.40625, -6.94091796875, -6.4755859375, -6.01025390625, -5.544921875, -5.07958984375, -4.6142578125, -4.14892578125, -3.68359375, -3.21826171875, -2.7529296875, -2.28759765625, -1.822265625, -1.35693359375, -0.8916015625, -0.42626953125, 0.0390625, 0.50439453125, 0.9697265625, 1.43505859375, 1.900390625, 2.36572265625, 2.8310546875, 3.29638671875, 3.76171875, 4.22705078125, 4.6923828125, 5.15771484375, 5.623046875, 6.08837890625, 6.5537109375, 7.01904296875, 7.484375, 7.94970703125, 8.4150390625, 8.88037109375, 9.345703125, 9.81103515625, 10.2763671875, 10.74169921875, 11.20703125, 11.67236328125, 12.1376953125, 12.60302734375, 13.068359375, 13.53369140625, 13.9990234375, 14.46435546875, 14.9296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 16.0, 23.0, 31.0, 47.0, 99.0, 159.0, 215.0, 349.0, 594.0, 910.0, 1395.0, 2166.0, 3515.0, 5103.0, 7558.0, 11222.0, 16602.0, 23403.0, 32113.0, 43692.0, 56547.0, 69937.0, 82181.0, 92010.0, 96422.0, 94962.0, 88279.0, 76773.0, 63749.0, 50404.0, 38557.0, 28075.0, 20066.0, 13811.0, 9331.0, 6262.0, 4142.0, 2794.0, 1810.0, 1163.0, 730.0, 471.0, 310.0, 196.0, 128.0, 80.0, 56.0, 42.0, 17.0, 21.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.3515625, -7.12017822265625, -6.8887939453125, -6.65740966796875, -6.426025390625, -6.19464111328125, -5.9632568359375, -5.73187255859375, -5.50048828125, -5.26910400390625, -5.0377197265625, -4.80633544921875, -4.574951171875, -4.34356689453125, -4.1121826171875, -3.88079833984375, -3.6494140625, -3.41802978515625, -3.1866455078125, -2.95526123046875, -2.723876953125, -2.49249267578125, -2.2611083984375, -2.02972412109375, -1.79833984375, -1.56695556640625, -1.3355712890625, -1.10418701171875, -0.872802734375, -0.64141845703125, -0.4100341796875, -0.17864990234375, 0.052734375, 0.28411865234375, 0.5155029296875, 0.74688720703125, 0.978271484375, 1.20965576171875, 1.4410400390625, 1.67242431640625, 1.90380859375, 2.13519287109375, 2.3665771484375, 2.59796142578125, 2.829345703125, 3.06072998046875, 3.2921142578125, 3.52349853515625, 3.7548828125, 3.98626708984375, 4.2176513671875, 4.44903564453125, 4.680419921875, 4.91180419921875, 5.1431884765625, 5.37457275390625, 5.60595703125, 5.83734130859375, 6.0687255859375, 6.30010986328125, 6.531494140625, 6.76287841796875, 6.9942626953125, 7.22564697265625, 7.45703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 10.0, 11.0, 3.0, 7.0, 11.0, 15.0, 20.0, 13.0, 23.0, 23.0, 32.0, 23.0, 24.0, 29.0, 31.0, 35.0, 32.0, 43.0, 33.0, 42.0, 47.0, 43.0, 36.0, 33.0, 30.0, 38.0, 37.0, 26.0, 36.0, 32.0, 25.0, 20.0, 25.0, 19.0, 16.0, 21.0, 9.0, 11.0, 6.0, 4.0, 7.0, 7.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.42852783203125, -7.1734619140625, -6.91839599609375, -6.663330078125, -6.40826416015625, -6.1531982421875, -5.89813232421875, -5.64306640625, -5.38800048828125, -5.1329345703125, -4.87786865234375, -4.622802734375, -4.36773681640625, -4.1126708984375, -3.85760498046875, -3.6025390625, -3.34747314453125, -3.0924072265625, -2.83734130859375, -2.582275390625, -2.32720947265625, -2.0721435546875, -1.81707763671875, -1.56201171875, -1.30694580078125, -1.0518798828125, -0.79681396484375, -0.541748046875, -0.28668212890625, -0.0316162109375, 0.22344970703125, 0.478515625, 0.73358154296875, 0.9886474609375, 1.24371337890625, 1.498779296875, 1.75384521484375, 2.0089111328125, 2.26397705078125, 2.51904296875, 2.77410888671875, 3.0291748046875, 3.28424072265625, 3.539306640625, 3.79437255859375, 4.0494384765625, 4.30450439453125, 4.5595703125, 4.81463623046875, 5.0697021484375, 5.32476806640625, 5.579833984375, 5.83489990234375, 6.0899658203125, 6.34503173828125, 6.60009765625, 6.85516357421875, 7.1102294921875, 7.36529541015625, 7.620361328125, 7.87542724609375, 8.1304931640625, 8.38555908203125, 8.640625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 3.0, 10.0, 11.0, 8.0, 20.0, 15.0, 23.0, 37.0, 51.0, 53.0, 86.0, 98.0, 121.0, 186.0, 274.0, 363.0, 556.0, 832.0, 1312.0, 1983.0, 3264.0, 5337.0, 9034.0, 15475.0, 27363.0, 47677.0, 78871.0, 119514.0, 154715.0, 165872.0, 145139.0, 106380.0, 67567.0, 40144.0, 22811.0, 13126.0, 7637.0, 4467.0, 2809.0, 1781.0, 1068.0, 743.0, 492.0, 340.0, 257.0, 160.0, 125.0, 93.0, 67.0, 63.0, 35.0, 29.0, 20.0, 13.0, 14.0, 9.0, 8.0, 3.0, 0.0, 2.0, 2.0], "bins": [-6.86328125, -6.65106201171875, -6.4388427734375, -6.22662353515625, -6.014404296875, -5.80218505859375, -5.5899658203125, -5.37774658203125, -5.16552734375, -4.95330810546875, -4.7410888671875, -4.52886962890625, -4.316650390625, -4.10443115234375, -3.8922119140625, -3.67999267578125, -3.4677734375, -3.25555419921875, -3.0433349609375, -2.83111572265625, -2.618896484375, -2.40667724609375, -2.1944580078125, -1.98223876953125, -1.77001953125, -1.55780029296875, -1.3455810546875, -1.13336181640625, -0.921142578125, -0.70892333984375, -0.4967041015625, -0.28448486328125, -0.072265625, 0.13995361328125, 0.3521728515625, 0.56439208984375, 0.776611328125, 0.98883056640625, 1.2010498046875, 1.41326904296875, 1.62548828125, 1.83770751953125, 2.0499267578125, 2.26214599609375, 2.474365234375, 2.68658447265625, 2.8988037109375, 3.11102294921875, 3.3232421875, 3.53546142578125, 3.7476806640625, 3.95989990234375, 4.172119140625, 4.38433837890625, 4.5965576171875, 4.80877685546875, 5.02099609375, 5.23321533203125, 5.4454345703125, 5.65765380859375, 5.869873046875, 6.08209228515625, 6.2943115234375, 6.50653076171875, 6.71875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 10.0, 4.0, 3.0, 3.0, 7.0, 8.0, 9.0, 12.0, 21.0, 25.0, 22.0, 38.0, 44.0, 49.0, 51.0, 62.0, 73.0, 67.0, 77.0, 59.0, 57.0, 61.0, 45.0, 33.0, 32.0, 23.0, 28.0, 22.0, 15.0, 10.0, 10.0, 5.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007205009460449219, -0.0006961226463317871, -0.0006717443466186523, -0.0006473660469055176, -0.0006229877471923828, -0.000598609447479248, -0.0005742311477661133, -0.0005498528480529785, -0.0005254745483398438, -0.000501096248626709, -0.0004767179489135742, -0.00045233964920043945, -0.0004279613494873047, -0.0004035830497741699, -0.00037920475006103516, -0.0003548264503479004, -0.0003304481506347656, -0.00030606985092163086, -0.0002816915512084961, -0.00025731325149536133, -0.00023293495178222656, -0.0002085566520690918, -0.00018417835235595703, -0.00015980005264282227, -0.0001354217529296875, -0.00011104345321655273, -8.666515350341797e-05, -6.22868537902832e-05, -3.790855407714844e-05, -1.3530254364013672e-05, 1.0848045349121094e-05, 3.522634506225586e-05, 5.9604644775390625e-05, 8.398294448852539e-05, 0.00010836124420166016, 0.00013273954391479492, 0.0001571178436279297, 0.00018149614334106445, 0.00020587444305419922, 0.00023025274276733398, 0.00025463104248046875, 0.0002790093421936035, 0.0003033876419067383, 0.00032776594161987305, 0.0003521442413330078, 0.0003765225410461426, 0.00040090084075927734, 0.0004252791404724121, 0.0004496574401855469, 0.00047403573989868164, 0.0004984140396118164, 0.0005227923393249512, 0.0005471706390380859, 0.0005715489387512207, 0.0005959272384643555, 0.0006203055381774902, 0.000644683837890625, 0.0006690621376037598, 0.0006934404373168945, 0.0007178187370300293, 0.0007421970367431641, 0.0007665753364562988, 0.0007909536361694336, 0.0008153319358825684, 0.0008397102355957031]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 12.0, 17.0, 21.0, 11.0, 24.0, 34.0, 54.0, 87.0, 86.0, 150.0, 185.0, 286.0, 441.0, 711.0, 1102.0, 1764.0, 3034.0, 5308.0, 9978.0, 19103.0, 38266.0, 74215.0, 132423.0, 191161.0, 205803.0, 160317.0, 97022.0, 50953.0, 25980.0, 13187.0, 6915.0, 3759.0, 2198.0, 1305.0, 900.0, 527.0, 360.0, 262.0, 174.0, 127.0, 86.0, 60.0, 41.0, 34.0, 20.0, 17.0, 11.0, 7.0, 8.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-9.3046875, -9.015869140625, -8.72705078125, -8.438232421875, -8.1494140625, -7.860595703125, -7.57177734375, -7.282958984375, -6.994140625, -6.705322265625, -6.41650390625, -6.127685546875, -5.8388671875, -5.550048828125, -5.26123046875, -4.972412109375, -4.68359375, -4.394775390625, -4.10595703125, -3.817138671875, -3.5283203125, -3.239501953125, -2.95068359375, -2.661865234375, -2.373046875, -2.084228515625, -1.79541015625, -1.506591796875, -1.2177734375, -0.928955078125, -0.64013671875, -0.351318359375, -0.0625, 0.226318359375, 0.51513671875, 0.803955078125, 1.0927734375, 1.381591796875, 1.67041015625, 1.959228515625, 2.248046875, 2.536865234375, 2.82568359375, 3.114501953125, 3.4033203125, 3.692138671875, 3.98095703125, 4.269775390625, 4.55859375, 4.847412109375, 5.13623046875, 5.425048828125, 5.7138671875, 6.002685546875, 6.29150390625, 6.580322265625, 6.869140625, 7.157958984375, 7.44677734375, 7.735595703125, 8.0244140625, 8.313232421875, 8.60205078125, 8.890869140625, 9.1796875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 0.0, 11.0, 12.0, 9.0, 4.0, 25.0, 27.0, 39.0, 52.0, 56.0, 80.0, 77.0, 88.0, 89.0, 72.0, 76.0, 60.0, 62.0, 40.0, 29.0, 30.0, 25.0, 8.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.322418212890625, -3.22491455078125, -3.127410888671875, -3.0299072265625, -2.932403564453125, -2.83489990234375, -2.737396240234375, -2.639892578125, -2.542388916015625, -2.44488525390625, -2.347381591796875, -2.2498779296875, -2.152374267578125, -2.05487060546875, -1.957366943359375, -1.85986328125, -1.762359619140625, -1.66485595703125, -1.567352294921875, -1.4698486328125, -1.372344970703125, -1.27484130859375, -1.177337646484375, -1.079833984375, -0.982330322265625, -0.88482666015625, -0.787322998046875, -0.6898193359375, -0.592315673828125, -0.49481201171875, -0.397308349609375, -0.2998046875, -0.202301025390625, -0.10479736328125, -0.007293701171875, 0.0902099609375, 0.187713623046875, 0.28521728515625, 0.382720947265625, 0.480224609375, 0.577728271484375, 0.67523193359375, 0.772735595703125, 0.8702392578125, 0.967742919921875, 1.06524658203125, 1.162750244140625, 1.26025390625, 1.357757568359375, 1.45526123046875, 1.552764892578125, 1.6502685546875, 1.747772216796875, 1.84527587890625, 1.942779541015625, 2.040283203125, 2.137786865234375, 2.23529052734375, 2.332794189453125, 2.4302978515625, 2.527801513671875, 2.62530517578125, 2.722808837890625, 2.8203125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 4.0, 4.0, 9.0, 10.0, 12.0, 11.0, 14.0, 16.0, 16.0, 25.0, 31.0, 34.0, 32.0, 37.0, 49.0, 40.0, 55.0, 50.0, 53.0, 46.0, 41.0, 52.0, 39.0, 49.0, 33.0, 34.0, 23.0, 30.0, 24.0, 20.0, 25.0, 16.0, 17.0, 10.0, 7.0, 8.0, 4.0, 4.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-20.702268600463867, -20.11518669128418, -19.52810287475586, -18.941020965576172, -18.353939056396484, -17.766857147216797, -17.17977523803711, -16.59269142150879, -16.0056095123291, -15.418527603149414, -14.83144474029541, -14.244361877441406, -13.657279968261719, -13.070198059082031, -12.483115196228027, -11.896032333374023, -11.308950424194336, -10.721868515014648, -10.134785652160645, -9.54770278930664, -8.960620880126953, -8.373538970947266, -7.786456108093262, -7.199373722076416, -6.61229133605957, -6.025208950042725, -5.438126564025879, -4.851044178009033, -4.2639617919921875, -3.676879405975342, -3.089797019958496, -2.5027146339416504, -1.9156322479248047, -1.328549861907959, -0.7414674758911133, -0.15438508987426758, 0.4326972961425781, 1.0197796821594238, 1.6068620681762695, 2.1939444541931152, 2.781026840209961, 3.3681092262268066, 3.9551916122436523, 4.542273998260498, 5.129356384277344, 5.7164387702941895, 6.303521156311035, 6.890603542327881, 7.477685928344727, 8.064767837524414, 8.651850700378418, 9.238933563232422, 9.82601547241211, 10.413097381591797, 11.0001802444458, 11.587263107299805, 12.174345016479492, 12.76142692565918, 13.348509788513184, 13.935592651367188, 14.522674560546875, 15.109756469726562, 15.696839332580566, 16.28392219543457, 16.871004104614258]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 3.0, 7.0, 7.0, 9.0, 6.0, 10.0, 12.0, 13.0, 8.0, 15.0, 13.0, 17.0, 20.0, 28.0, 27.0, 23.0, 30.0, 35.0, 36.0, 44.0, 41.0, 35.0, 42.0, 45.0, 39.0, 36.0, 43.0, 44.0, 35.0, 32.0, 23.0, 37.0, 26.0, 18.0, 23.0, 16.0, 17.0, 8.0, 18.0, 11.0, 11.0, 7.0, 6.0, 6.0, 6.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.249616622924805, -11.82735824584961, -11.40510082244873, -10.982843399047852, -10.560585021972656, -10.138326644897461, -9.716069221496582, -9.293811798095703, -8.871553421020508, -8.449295043945312, -8.027037620544434, -7.6047797203063965, -7.182521820068359, -6.760263919830322, -6.338006019592285, -5.915748119354248, -5.493490219116211, -5.071232318878174, -4.648974418640137, -4.2267165184021, -3.8044586181640625, -3.3822007179260254, -2.9599428176879883, -2.537684917449951, -2.115427017211914, -1.693169116973877, -1.2709112167358398, -0.8486533164978027, -0.4263954162597656, -0.004137516021728516, 0.4181203842163086, 0.8403782844543457, 1.2626371383666992, 1.6848950386047363, 2.1071529388427734, 2.5294108390808105, 2.9516687393188477, 3.3739266395568848, 3.796184539794922, 4.218442440032959, 4.640700340270996, 5.062958240509033, 5.48521614074707, 5.907474040985107, 6.3297319412231445, 6.751989841461182, 7.174247741699219, 7.596505641937256, 8.018763542175293, 8.441020965576172, 8.863279342651367, 9.285537719726562, 9.707795143127441, 10.13005256652832, 10.552310943603516, 10.974569320678711, 11.39682674407959, 11.819084167480469, 12.241342544555664, 12.66360092163086, 13.085858345031738, 13.508115768432617, 13.930374145507812, 14.352632522583008, 14.774889945983887]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 18.0, 32.0, 38.0, 60.0, 127.0, 170.0, 250.0, 371.0, 688.0, 1019.0, 1673.0, 2733.0, 4578.0, 7211.0, 12225.0, 19672.0, 32494.0, 53195.0, 84870.0, 134621.0, 207058.0, 300152.0, 405461.0, 495480.0, 538616.0, 511199.0, 428991.0, 324512.0, 226828.0, 149620.0, 95718.0, 59509.0, 36627.0, 22554.0, 13655.0, 8446.0, 5191.0, 3193.0, 2019.0, 1245.0, 755.0, 509.0, 306.0, 216.0, 124.0, 90.0, 65.0, 32.0, 25.0, 11.0, 16.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.8359375, -14.3514404296875, -13.866943359375, -13.3824462890625, -12.89794921875, -12.4134521484375, -11.928955078125, -11.4444580078125, -10.9599609375, -10.4754638671875, -9.990966796875, -9.5064697265625, -9.02197265625, -8.5374755859375, -8.052978515625, -7.5684814453125, -7.083984375, -6.5994873046875, -6.114990234375, -5.6304931640625, -5.14599609375, -4.6614990234375, -4.177001953125, -3.6925048828125, -3.2080078125, -2.7235107421875, -2.239013671875, -1.7545166015625, -1.27001953125, -0.7855224609375, -0.301025390625, 0.1834716796875, 0.66796875, 1.1524658203125, 1.636962890625, 2.1214599609375, 2.60595703125, 3.0904541015625, 3.574951171875, 4.0594482421875, 4.5439453125, 5.0284423828125, 5.512939453125, 5.9974365234375, 6.48193359375, 6.9664306640625, 7.450927734375, 7.9354248046875, 8.419921875, 8.9044189453125, 9.388916015625, 9.8734130859375, 10.35791015625, 10.8424072265625, 11.326904296875, 11.8114013671875, 12.2958984375, 12.7803955078125, 13.264892578125, 13.7493896484375, 14.23388671875, 14.7183837890625, 15.202880859375, 15.6873779296875, 16.171875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 11.0, 6.0, 9.0, 15.0, 16.0, 17.0, 17.0, 21.0, 28.0, 23.0, 26.0, 31.0, 37.0, 34.0, 51.0, 37.0, 50.0, 49.0, 35.0, 44.0, 38.0, 45.0, 47.0, 34.0, 43.0, 30.0, 32.0, 20.0, 24.0, 15.0, 26.0, 12.0, 15.0, 9.0, 11.0, 5.0, 10.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6640625, -12.2454833984375, -11.826904296875, -11.4083251953125, -10.98974609375, -10.5711669921875, -10.152587890625, -9.7340087890625, -9.3154296875, -8.8968505859375, -8.478271484375, -8.0596923828125, -7.64111328125, -7.2225341796875, -6.803955078125, -6.3853759765625, -5.966796875, -5.5482177734375, -5.129638671875, -4.7110595703125, -4.29248046875, -3.8739013671875, -3.455322265625, -3.0367431640625, -2.6181640625, -2.1995849609375, -1.781005859375, -1.3624267578125, -0.94384765625, -0.5252685546875, -0.106689453125, 0.3118896484375, 0.73046875, 1.1490478515625, 1.567626953125, 1.9862060546875, 2.40478515625, 2.8233642578125, 3.241943359375, 3.6605224609375, 4.0791015625, 4.4976806640625, 4.916259765625, 5.3348388671875, 5.75341796875, 6.1719970703125, 6.590576171875, 7.0091552734375, 7.427734375, 7.8463134765625, 8.264892578125, 8.6834716796875, 9.10205078125, 9.5206298828125, 9.939208984375, 10.3577880859375, 10.7763671875, 11.1949462890625, 11.613525390625, 12.0321044921875, 12.45068359375, 12.8692626953125, 13.287841796875, 13.7064208984375, 14.125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 11.0, 20.0, 39.0, 70.0, 119.0, 189.0, 307.0, 559.0, 853.0, 1347.0, 2182.0, 3524.0, 5552.0, 9270.0, 14992.0, 23853.0, 37936.0, 59791.0, 91848.0, 137972.0, 199389.0, 274775.0, 357073.0, 430484.0, 472370.0, 468613.0, 422821.0, 348211.0, 266559.0, 192370.0, 131304.0, 87617.0, 56378.0, 36377.0, 22659.0, 14257.0, 8664.0, 5448.0, 3255.0, 1948.0, 1274.0, 789.0, 493.0, 277.0, 176.0, 119.0, 59.0, 40.0, 21.0, 10.0, 7.0, 10.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.4375, -16.8916015625, -16.345703125, -15.7998046875, -15.25390625, -14.7080078125, -14.162109375, -13.6162109375, -13.0703125, -12.5244140625, -11.978515625, -11.4326171875, -10.88671875, -10.3408203125, -9.794921875, -9.2490234375, -8.703125, -8.1572265625, -7.611328125, -7.0654296875, -6.51953125, -5.9736328125, -5.427734375, -4.8818359375, -4.3359375, -3.7900390625, -3.244140625, -2.6982421875, -2.15234375, -1.6064453125, -1.060546875, -0.5146484375, 0.03125, 0.5771484375, 1.123046875, 1.6689453125, 2.21484375, 2.7607421875, 3.306640625, 3.8525390625, 4.3984375, 4.9443359375, 5.490234375, 6.0361328125, 6.58203125, 7.1279296875, 7.673828125, 8.2197265625, 8.765625, 9.3115234375, 9.857421875, 10.4033203125, 10.94921875, 11.4951171875, 12.041015625, 12.5869140625, 13.1328125, 13.6787109375, 14.224609375, 14.7705078125, 15.31640625, 15.8623046875, 16.408203125, 16.9541015625, 17.5]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 9.0, 3.0, 5.0, 13.0, 7.0, 18.0, 24.0, 30.0, 36.0, 41.0, 43.0, 50.0, 71.0, 82.0, 79.0, 100.0, 119.0, 128.0, 143.0, 149.0, 168.0, 198.0, 182.0, 182.0, 195.0, 198.0, 134.0, 173.0, 188.0, 160.0, 167.0, 132.0, 127.0, 103.0, 98.0, 74.0, 66.0, 72.0, 59.0, 50.0, 30.0, 37.0, 42.0, 24.0, 15.0, 16.0, 5.0, 6.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-6.5625, -6.35693359375, -6.1513671875, -5.94580078125, -5.740234375, -5.53466796875, -5.3291015625, -5.12353515625, -4.91796875, -4.71240234375, -4.5068359375, -4.30126953125, -4.095703125, -3.89013671875, -3.6845703125, -3.47900390625, -3.2734375, -3.06787109375, -2.8623046875, -2.65673828125, -2.451171875, -2.24560546875, -2.0400390625, -1.83447265625, -1.62890625, -1.42333984375, -1.2177734375, -1.01220703125, -0.806640625, -0.60107421875, -0.3955078125, -0.18994140625, 0.015625, 0.22119140625, 0.4267578125, 0.63232421875, 0.837890625, 1.04345703125, 1.2490234375, 1.45458984375, 1.66015625, 1.86572265625, 2.0712890625, 2.27685546875, 2.482421875, 2.68798828125, 2.8935546875, 3.09912109375, 3.3046875, 3.51025390625, 3.7158203125, 3.92138671875, 4.126953125, 4.33251953125, 4.5380859375, 4.74365234375, 4.94921875, 5.15478515625, 5.3603515625, 5.56591796875, 5.771484375, 5.97705078125, 6.1826171875, 6.38818359375, 6.59375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 9.0, 9.0, 5.0, 12.0, 10.0, 13.0, 12.0, 23.0, 18.0, 21.0, 34.0, 32.0, 37.0, 44.0, 47.0, 44.0, 50.0, 62.0, 40.0, 58.0, 50.0, 44.0, 38.0, 35.0, 32.0, 26.0, 18.0, 36.0, 17.0, 26.0, 14.0, 13.0, 16.0, 13.0, 6.0, 4.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-24.797061920166016, -24.032432556152344, -23.267803192138672, -22.503173828125, -21.738544464111328, -20.97391700744629, -20.209287643432617, -19.444658279418945, -18.680028915405273, -17.9153995513916, -17.15077018737793, -16.386140823364258, -15.621512413024902, -14.85688304901123, -14.092254638671875, -13.327625274658203, -12.562995910644531, -11.79836654663086, -11.033737182617188, -10.269108772277832, -9.50447940826416, -8.739850044250488, -7.975221157073975, -7.210592269897461, -6.445962905883789, -5.681333541870117, -4.9167046546936035, -4.15207576751709, -3.387446403503418, -2.622817277908325, -1.8581881523132324, -1.0935592651367188, -0.3289299011230469, 0.4356992244720459, 1.2003283500671387, 1.9649574756622314, 2.729586601257324, 3.494215726852417, 4.25884485244751, 5.023473739624023, 5.788103103637695, 6.552732467651367, 7.317361354827881, 8.081990242004395, 8.846619606018066, 9.611248970031738, 10.375877380371094, 11.140506744384766, 11.905136108398438, 12.66976547241211, 13.434394836425781, 14.199023246765137, 14.963652610778809, 15.72828197479248, 16.492910385131836, 17.257539749145508, 18.02216911315918, 18.78679847717285, 19.551427841186523, 20.316057205200195, 21.080684661865234, 21.845314025878906, 22.609943389892578, 23.37457275390625, 24.139202117919922]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 2.0, 5.0, 4.0, 2.0, 4.0, 10.0, 7.0, 10.0, 15.0, 11.0, 14.0, 16.0, 24.0, 19.0, 22.0, 39.0, 34.0, 38.0, 28.0, 37.0, 36.0, 40.0, 51.0, 35.0, 46.0, 41.0, 39.0, 42.0, 37.0, 29.0, 26.0, 35.0, 27.0, 17.0, 25.0, 21.0, 19.0, 10.0, 23.0, 15.0, 9.0, 11.0, 7.0, 8.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.51991844177246, -16.984806060791016, -16.44969367980957, -15.914581298828125, -15.37946891784668, -14.844356536865234, -14.309244155883789, -13.774131774902344, -13.239019393920898, -12.703907012939453, -12.168794631958008, -11.633682250976562, -11.098569869995117, -10.563457489013672, -10.028345108032227, -9.493232727050781, -8.958121299743652, -8.423008918762207, -7.887896537780762, -7.352784156799316, -6.817671775817871, -6.282559394836426, -5.747447490692139, -5.212335109710693, -4.677222728729248, -4.142110347747803, -3.6069979667663574, -3.071885824203491, -2.536773443222046, -2.0016610622406006, -1.4665489196777344, -0.9314365386962891, -0.39632415771484375, 0.1387881636619568, 0.6739004850387573, 1.209012746810913, 1.7441251277923584, 2.2792375087738037, 2.81434965133667, 3.3494620323181152, 3.8845744132995605, 4.419686794281006, 4.954799175262451, 5.489911079406738, 6.025023460388184, 6.560135841369629, 7.095248222351074, 7.6303606033325195, 8.165472984313965, 8.70058536529541, 9.235697746276855, 9.7708101272583, 10.305922508239746, 10.841034889221191, 11.37614631652832, 11.911258697509766, 12.446371078491211, 12.981483459472656, 13.516595840454102, 14.051708221435547, 14.586820602416992, 15.121932983398438, 15.657045364379883, 16.192157745361328, 16.727270126342773]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 9.0, 12.0, 25.0, 32.0, 54.0, 92.0, 113.0, 177.0, 273.0, 396.0, 616.0, 918.0, 1456.0, 2364.0, 3780.0, 6042.0, 10079.0, 16262.0, 26835.0, 43903.0, 70554.0, 107695.0, 147878.0, 167887.0, 148140.0, 107903.0, 71022.0, 44337.0, 26741.0, 16269.0, 10050.0, 6095.0, 3867.0, 2419.0, 1495.0, 956.0, 651.0, 374.0, 249.0, 185.0, 125.0, 73.0, 53.0, 34.0, 18.0, 13.0, 10.0, 9.0, 2.0, 3.0, 2.0, 6.0, 0.0, 1.0], "bins": [-4.78125, -4.6385498046875, -4.495849609375, -4.3531494140625, -4.21044921875, -4.0677490234375, -3.925048828125, -3.7823486328125, -3.6396484375, -3.4969482421875, -3.354248046875, -3.2115478515625, -3.06884765625, -2.9261474609375, -2.783447265625, -2.6407470703125, -2.498046875, -2.3553466796875, -2.212646484375, -2.0699462890625, -1.92724609375, -1.7845458984375, -1.641845703125, -1.4991455078125, -1.3564453125, -1.2137451171875, -1.071044921875, -0.9283447265625, -0.78564453125, -0.6429443359375, -0.500244140625, -0.3575439453125, -0.21484375, -0.0721435546875, 0.070556640625, 0.2132568359375, 0.35595703125, 0.4986572265625, 0.641357421875, 0.7840576171875, 0.9267578125, 1.0694580078125, 1.212158203125, 1.3548583984375, 1.49755859375, 1.6402587890625, 1.782958984375, 1.9256591796875, 2.068359375, 2.2110595703125, 2.353759765625, 2.4964599609375, 2.63916015625, 2.7818603515625, 2.924560546875, 3.0672607421875, 3.2099609375, 3.3526611328125, 3.495361328125, 3.6380615234375, 3.78076171875, 3.9234619140625, 4.066162109375, 4.2088623046875, 4.3515625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 9.0, 8.0, 11.0, 9.0, 15.0, 15.0, 21.0, 13.0, 20.0, 20.0, 29.0, 24.0, 32.0, 32.0, 32.0, 39.0, 37.0, 29.0, 45.0, 33.0, 42.0, 33.0, 39.0, 45.0, 44.0, 32.0, 40.0, 26.0, 31.0, 24.0, 25.0, 17.0, 14.0, 11.0, 10.0, 13.0, 21.0, 7.0, 9.0, 8.0, 13.0, 7.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.78759765625, -16.2158203125, -15.64404296875, -15.072265625, -14.50048828125, -13.9287109375, -13.35693359375, -12.78515625, -12.21337890625, -11.6416015625, -11.06982421875, -10.498046875, -9.92626953125, -9.3544921875, -8.78271484375, -8.2109375, -7.63916015625, -7.0673828125, -6.49560546875, -5.923828125, -5.35205078125, -4.7802734375, -4.20849609375, -3.63671875, -3.06494140625, -2.4931640625, -1.92138671875, -1.349609375, -0.77783203125, -0.2060546875, 0.36572265625, 0.9375, 1.50927734375, 2.0810546875, 2.65283203125, 3.224609375, 3.79638671875, 4.3681640625, 4.93994140625, 5.51171875, 6.08349609375, 6.6552734375, 7.22705078125, 7.798828125, 8.37060546875, 8.9423828125, 9.51416015625, 10.0859375, 10.65771484375, 11.2294921875, 11.80126953125, 12.373046875, 12.94482421875, 13.5166015625, 14.08837890625, 14.66015625, 15.23193359375, 15.8037109375, 16.37548828125, 16.947265625, 17.51904296875, 18.0908203125, 18.66259765625, 19.234375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 16.0, 19.0, 20.0, 30.0, 26.0, 61.0, 106.0, 130.0, 233.0, 321.0, 565.0, 1000.0, 1802.0, 3233.0, 5964.0, 11424.0, 22234.0, 44320.0, 87195.0, 158422.0, 226584.0, 209923.0, 132064.0, 69499.0, 35163.0, 18069.0, 9038.0, 4849.0, 2596.0, 1450.0, 847.0, 504.0, 278.0, 199.0, 123.0, 78.0, 64.0, 38.0, 24.0, 16.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-6.77734375, -6.5770263671875, -6.376708984375, -6.1763916015625, -5.97607421875, -5.7757568359375, -5.575439453125, -5.3751220703125, -5.1748046875, -4.9744873046875, -4.774169921875, -4.5738525390625, -4.37353515625, -4.1732177734375, -3.972900390625, -3.7725830078125, -3.572265625, -3.3719482421875, -3.171630859375, -2.9713134765625, -2.77099609375, -2.5706787109375, -2.370361328125, -2.1700439453125, -1.9697265625, -1.7694091796875, -1.569091796875, -1.3687744140625, -1.16845703125, -0.9681396484375, -0.767822265625, -0.5675048828125, -0.3671875, -0.1668701171875, 0.033447265625, 0.2337646484375, 0.43408203125, 0.6343994140625, 0.834716796875, 1.0350341796875, 1.2353515625, 1.4356689453125, 1.635986328125, 1.8363037109375, 2.03662109375, 2.2369384765625, 2.437255859375, 2.6375732421875, 2.837890625, 3.0382080078125, 3.238525390625, 3.4388427734375, 3.63916015625, 3.8394775390625, 4.039794921875, 4.2401123046875, 4.4404296875, 4.6407470703125, 4.841064453125, 5.0413818359375, 5.24169921875, 5.4420166015625, 5.642333984375, 5.8426513671875, 6.04296875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 16.0, 9.0, 15.0, 21.0, 17.0, 23.0, 22.0, 31.0, 26.0, 35.0, 37.0, 52.0, 36.0, 46.0, 40.0, 58.0, 46.0, 49.0, 36.0, 38.0, 46.0, 37.0, 29.0, 37.0, 35.0, 23.0, 24.0, 14.0, 22.0, 16.0, 9.0, 9.0, 11.0, 6.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.734375, -13.326171875, -12.91796875, -12.509765625, -12.1015625, -11.693359375, -11.28515625, -10.876953125, -10.46875, -10.060546875, -9.65234375, -9.244140625, -8.8359375, -8.427734375, -8.01953125, -7.611328125, -7.203125, -6.794921875, -6.38671875, -5.978515625, -5.5703125, -5.162109375, -4.75390625, -4.345703125, -3.9375, -3.529296875, -3.12109375, -2.712890625, -2.3046875, -1.896484375, -1.48828125, -1.080078125, -0.671875, -0.263671875, 0.14453125, 0.552734375, 0.9609375, 1.369140625, 1.77734375, 2.185546875, 2.59375, 3.001953125, 3.41015625, 3.818359375, 4.2265625, 4.634765625, 5.04296875, 5.451171875, 5.859375, 6.267578125, 6.67578125, 7.083984375, 7.4921875, 7.900390625, 8.30859375, 8.716796875, 9.125, 9.533203125, 9.94140625, 10.349609375, 10.7578125, 11.166015625, 11.57421875, 11.982421875, 12.390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 10.0, 12.0, 16.0, 26.0, 27.0, 37.0, 61.0, 70.0, 140.0, 215.0, 323.0, 518.0, 823.0, 1421.0, 2592.0, 4671.0, 9413.0, 19950.0, 45887.0, 111410.0, 244727.0, 305300.0, 170260.0, 71875.0, 30357.0, 13623.0, 6563.0, 3426.0, 1840.0, 1079.0, 691.0, 398.0, 269.0, 174.0, 109.0, 75.0, 50.0, 26.0, 29.0, 21.0, 12.0, 4.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.109375, -2.043975830078125, -1.97857666015625, -1.913177490234375, -1.8477783203125, -1.782379150390625, -1.71697998046875, -1.651580810546875, -1.586181640625, -1.520782470703125, -1.45538330078125, -1.389984130859375, -1.3245849609375, -1.259185791015625, -1.19378662109375, -1.128387451171875, -1.06298828125, -0.997589111328125, -0.93218994140625, -0.866790771484375, -0.8013916015625, -0.735992431640625, -0.67059326171875, -0.605194091796875, -0.539794921875, -0.474395751953125, -0.40899658203125, -0.343597412109375, -0.2781982421875, -0.212799072265625, -0.14739990234375, -0.082000732421875, -0.0166015625, 0.048797607421875, 0.11419677734375, 0.179595947265625, 0.2449951171875, 0.310394287109375, 0.37579345703125, 0.441192626953125, 0.506591796875, 0.571990966796875, 0.63739013671875, 0.702789306640625, 0.7681884765625, 0.833587646484375, 0.89898681640625, 0.964385986328125, 1.02978515625, 1.095184326171875, 1.16058349609375, 1.225982666015625, 1.2913818359375, 1.356781005859375, 1.42218017578125, 1.487579345703125, 1.552978515625, 1.618377685546875, 1.68377685546875, 1.749176025390625, 1.8145751953125, 1.879974365234375, 1.94537353515625, 2.010772705078125, 2.076171875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 10.0, 7.0, 8.0, 12.0, 18.0, 28.0, 44.0, 38.0, 40.0, 64.0, 70.0, 64.0, 77.0, 72.0, 72.0, 75.0, 68.0, 46.0, 46.0, 39.0, 25.0, 14.0, 23.0, 19.0, 10.0, 3.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014197826385498047, -0.00013795215636491776, -0.00013392604887485504, -0.00012989994138479233, -0.00012587383389472961, -0.0001218477264046669, -0.00011782161891460419, -0.00011379551142454147, -0.00010976940393447876, -0.00010574329644441605, -0.00010171718895435333, -9.769108146429062e-05, -9.36649739742279e-05, -8.963886648416519e-05, -8.561275899410248e-05, -8.158665150403976e-05, -7.756054401397705e-05, -7.353443652391434e-05, -6.950832903385162e-05, -6.548222154378891e-05, -6.14561140537262e-05, -5.743000656366348e-05, -5.340389907360077e-05, -4.9377791583538055e-05, -4.535168409347534e-05, -4.132557660341263e-05, -3.7299469113349915e-05, -3.32733616232872e-05, -2.9247254133224487e-05, -2.5221146643161774e-05, -2.119503915309906e-05, -1.7168931663036346e-05, -1.3142824172973633e-05, -9.11671668291092e-06, -5.0906091928482056e-06, -1.064501702785492e-06, 2.9616057872772217e-06, 6.987713277339935e-06, 1.1013820767402649e-05, 1.5039928257465363e-05, 1.9066035747528076e-05, 2.309214323759079e-05, 2.7118250727653503e-05, 3.114435821771622e-05, 3.517046570777893e-05, 3.9196573197841644e-05, 4.322268068790436e-05, 4.724878817796707e-05, 5.1274895668029785e-05, 5.53010031580925e-05, 5.932711064815521e-05, 6.335321813821793e-05, 6.737932562828064e-05, 7.140543311834335e-05, 7.543154060840607e-05, 7.945764809846878e-05, 8.34837555885315e-05, 8.750986307859421e-05, 9.153597056865692e-05, 9.556207805871964e-05, 9.958818554878235e-05, 0.00010361429303884506, 0.00010764040052890778, 0.00011166650801897049, 0.0001156926155090332]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 12.0, 11.0, 14.0, 37.0, 55.0, 66.0, 109.0, 183.0, 312.0, 548.0, 956.0, 1617.0, 2859.0, 5402.0, 9965.0, 20034.0, 40926.0, 86313.0, 178506.0, 279908.0, 212896.0, 106646.0, 50256.0, 24381.0, 12211.0, 6382.0, 3363.0, 1890.0, 1154.0, 613.0, 342.0, 198.0, 139.0, 89.0, 48.0, 37.0, 22.0, 20.0, 8.0, 7.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.08984375, -2.9921875, -2.89453125, -2.796875, -2.69921875, -2.6015625, -2.50390625, -2.40625, -2.30859375, -2.2109375, -2.11328125, -2.015625, -1.91796875, -1.8203125, -1.72265625, -1.625, -1.52734375, -1.4296875, -1.33203125, -1.234375, -1.13671875, -1.0390625, -0.94140625, -0.84375, -0.74609375, -0.6484375, -0.55078125, -0.453125, -0.35546875, -0.2578125, -0.16015625, -0.0625, 0.03515625, 0.1328125, 0.23046875, 0.328125, 0.42578125, 0.5234375, 0.62109375, 0.71875, 0.81640625, 0.9140625, 1.01171875, 1.109375, 1.20703125, 1.3046875, 1.40234375, 1.5, 1.59765625, 1.6953125, 1.79296875, 1.890625, 1.98828125, 2.0859375, 2.18359375, 2.28125, 2.37890625, 2.4765625, 2.57421875, 2.671875, 2.76953125, 2.8671875, 2.96484375, 3.0625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 7.0, 11.0, 13.0, 15.0, 13.0, 19.0, 24.0, 32.0, 44.0, 37.0, 64.0, 49.0, 71.0, 76.0, 74.0, 60.0, 42.0, 55.0, 57.0, 49.0, 29.0, 24.0, 25.0, 25.0, 18.0, 6.0, 11.0, 12.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6728515625, -0.6500320434570312, -0.6272125244140625, -0.6043930053710938, -0.581573486328125, -0.5587539672851562, -0.5359344482421875, -0.5131149291992188, -0.49029541015625, -0.46747589111328125, -0.4446563720703125, -0.42183685302734375, -0.399017333984375, -0.37619781494140625, -0.3533782958984375, -0.33055877685546875, -0.3077392578125, -0.28491973876953125, -0.2621002197265625, -0.23928070068359375, -0.216461181640625, -0.19364166259765625, -0.1708221435546875, -0.14800262451171875, -0.12518310546875, -0.10236358642578125, -0.0795440673828125, -0.05672454833984375, -0.033905029296875, -0.01108551025390625, 0.0117340087890625, 0.03455352783203125, 0.057373046875, 0.08019256591796875, 0.1030120849609375, 0.12583160400390625, 0.148651123046875, 0.17147064208984375, 0.1942901611328125, 0.21710968017578125, 0.23992919921875, 0.26274871826171875, 0.2855682373046875, 0.30838775634765625, 0.331207275390625, 0.35402679443359375, 0.3768463134765625, 0.39966583251953125, 0.4224853515625, 0.44530487060546875, 0.4681243896484375, 0.49094390869140625, 0.513763427734375, 0.5365829467773438, 0.5594024658203125, 0.5822219848632812, 0.60504150390625, 0.6278610229492188, 0.6506805419921875, 0.6735000610351562, 0.696319580078125, 0.7191390991210938, 0.7419586181640625, 0.7647781372070312, 0.78759765625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 11.0, 6.0, 6.0, 8.0, 14.0, 8.0, 14.0, 22.0, 15.0, 19.0, 34.0, 30.0, 34.0, 45.0, 53.0, 44.0, 44.0, 51.0, 53.0, 50.0, 54.0, 47.0, 42.0, 30.0, 33.0, 33.0, 17.0, 34.0, 22.0, 20.0, 21.0, 7.0, 18.0, 15.0, 9.0, 4.0, 5.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-25.067045211791992, -24.301271438598633, -23.535497665405273, -22.769723892211914, -22.003950119018555, -21.238176345825195, -20.472400665283203, -19.706626892089844, -18.940853118896484, -18.175079345703125, -17.409305572509766, -16.643531799316406, -15.877758026123047, -15.111984252929688, -14.346209526062012, -13.580435752868652, -12.81466293334961, -12.04888916015625, -11.28311538696289, -10.517341613769531, -9.751567840576172, -8.985794067382812, -8.220019340515137, -7.454245567321777, -6.688471794128418, -5.922698020935059, -5.156924247741699, -4.391149997711182, -3.6253762245178223, -2.859602451324463, -2.0938282012939453, -1.328054428100586, -0.5622787475585938, 0.20349514484405518, 0.9692690372467041, 1.7350430488586426, 2.500816822052002, 3.2665905952453613, 4.032364845275879, 4.798138618469238, 5.563912391662598, 6.329686164855957, 7.095459938049316, 7.861234188079834, 8.627008438110352, 9.392782211303711, 10.15855598449707, 10.92432975769043, 11.690103530883789, 12.455877304077148, 13.221651077270508, 13.987424850463867, 14.753198623657227, 15.518972396850586, 16.284748077392578, 17.050521850585938, 17.816295623779297, 18.582069396972656, 19.347843170166016, 20.113616943359375, 20.879390716552734, 21.645164489746094, 22.410938262939453, 23.176712036132812, 23.942485809326172]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 4.0, 2.0, 8.0, 8.0, 6.0, 12.0, 16.0, 11.0, 17.0, 11.0, 26.0, 19.0, 28.0, 35.0, 36.0, 35.0, 30.0, 33.0, 40.0, 43.0, 45.0, 39.0, 43.0, 42.0, 36.0, 44.0, 37.0, 30.0, 20.0, 36.0, 29.0, 17.0, 21.0, 23.0, 19.0, 12.0, 21.0, 16.0, 9.0, 9.0, 8.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.38416290283203, -16.852876663208008, -16.321590423583984, -15.790303230285645, -15.259016036987305, -14.727729797363281, -14.196443557739258, -13.665157318115234, -13.133870124816895, -12.602583885192871, -12.071296691894531, -11.540010452270508, -11.008724212646484, -10.477437019348145, -9.946150779724121, -9.414863586425781, -8.883577346801758, -8.352291107177734, -7.8210039138793945, -7.289717674255371, -6.7584309577941895, -6.227144241333008, -5.695858001708984, -5.164571285247803, -4.633284568786621, -4.1019978523254395, -3.570711374282837, -3.0394248962402344, -2.5081381797790527, -1.976851463317871, -1.4455649852752686, -0.914278507232666, -0.3829936981201172, 0.1482928991317749, 0.679579496383667, 1.210866093635559, 1.7421526908874512, 2.273439407348633, 2.8047258853912354, 3.336012363433838, 3.8672990798950195, 4.398585796356201, 4.929872512817383, 5.461158752441406, 5.992445468902588, 6.5237321853637695, 7.055018424987793, 7.586305141448975, 8.117591857910156, 8.64887809753418, 9.18016529083252, 9.711451530456543, 10.242738723754883, 10.774024963378906, 11.30531120300293, 11.836597442626953, 12.367884635925293, 12.899170875549316, 13.430458068847656, 13.96174430847168, 14.493030548095703, 15.024317741394043, 15.555603981018066, 16.086891174316406, 16.61817741394043]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 7.0, 17.0, 12.0, 21.0, 32.0, 71.0, 80.0, 116.0, 194.0, 267.0, 411.0, 662.0, 1064.0, 1601.0, 2342.0, 3806.0, 5929.0, 9224.0, 14135.0, 21302.0, 32096.0, 46222.0, 64819.0, 84158.0, 102683.0, 114638.0, 116287.0, 107433.0, 90206.0, 70486.0, 51770.0, 36169.0, 24579.0, 16101.0, 10358.0, 6808.0, 4441.0, 2846.0, 1753.0, 1200.0, 788.0, 532.0, 308.0, 204.0, 148.0, 80.0, 58.0, 37.0, 24.0, 19.0, 12.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6171875, -10.26513671875, -9.9130859375, -9.56103515625, -9.208984375, -8.85693359375, -8.5048828125, -8.15283203125, -7.80078125, -7.44873046875, -7.0966796875, -6.74462890625, -6.392578125, -6.04052734375, -5.6884765625, -5.33642578125, -4.984375, -4.63232421875, -4.2802734375, -3.92822265625, -3.576171875, -3.22412109375, -2.8720703125, -2.52001953125, -2.16796875, -1.81591796875, -1.4638671875, -1.11181640625, -0.759765625, -0.40771484375, -0.0556640625, 0.29638671875, 0.6484375, 1.00048828125, 1.3525390625, 1.70458984375, 2.056640625, 2.40869140625, 2.7607421875, 3.11279296875, 3.46484375, 3.81689453125, 4.1689453125, 4.52099609375, 4.873046875, 5.22509765625, 5.5771484375, 5.92919921875, 6.28125, 6.63330078125, 6.9853515625, 7.33740234375, 7.689453125, 8.04150390625, 8.3935546875, 8.74560546875, 9.09765625, 9.44970703125, 9.8017578125, 10.15380859375, 10.505859375, 10.85791015625, 11.2099609375, 11.56201171875, 11.9140625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 2.0, 3.0, 6.0, 1.0, 2.0, 11.0, 7.0, 14.0, 10.0, 10.0, 23.0, 21.0, 17.0, 28.0, 28.0, 23.0, 42.0, 32.0, 40.0, 36.0, 37.0, 34.0, 39.0, 53.0, 40.0, 35.0, 33.0, 35.0, 39.0, 50.0, 31.0, 31.0, 22.0, 23.0, 25.0, 17.0, 8.0, 12.0, 15.0, 8.0, 16.0, 15.0, 7.0, 5.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.03125, -16.45263671875, -15.8740234375, -15.29541015625, -14.716796875, -14.13818359375, -13.5595703125, -12.98095703125, -12.40234375, -11.82373046875, -11.2451171875, -10.66650390625, -10.087890625, -9.50927734375, -8.9306640625, -8.35205078125, -7.7734375, -7.19482421875, -6.6162109375, -6.03759765625, -5.458984375, -4.88037109375, -4.3017578125, -3.72314453125, -3.14453125, -2.56591796875, -1.9873046875, -1.40869140625, -0.830078125, -0.25146484375, 0.3271484375, 0.90576171875, 1.484375, 2.06298828125, 2.6416015625, 3.22021484375, 3.798828125, 4.37744140625, 4.9560546875, 5.53466796875, 6.11328125, 6.69189453125, 7.2705078125, 7.84912109375, 8.427734375, 9.00634765625, 9.5849609375, 10.16357421875, 10.7421875, 11.32080078125, 11.8994140625, 12.47802734375, 13.056640625, 13.63525390625, 14.2138671875, 14.79248046875, 15.37109375, 15.94970703125, 16.5283203125, 17.10693359375, 17.685546875, 18.26416015625, 18.8427734375, 19.42138671875, 20.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 11.0, 16.0, 30.0, 53.0, 69.0, 117.0, 160.0, 287.0, 429.0, 732.0, 1240.0, 2097.0, 3613.0, 6234.0, 10833.0, 18929.0, 31773.0, 53081.0, 81981.0, 114212.0, 141283.0, 150101.0, 136988.0, 106831.0, 73566.0, 47190.0, 27943.0, 16393.0, 9269.0, 5456.0, 3085.0, 1771.0, 1051.0, 653.0, 384.0, 251.0, 171.0, 97.0, 58.0, 48.0, 15.0, 20.0, 11.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.875, -13.385986328125, -12.89697265625, -12.407958984375, -11.9189453125, -11.429931640625, -10.94091796875, -10.451904296875, -9.962890625, -9.473876953125, -8.98486328125, -8.495849609375, -8.0068359375, -7.517822265625, -7.02880859375, -6.539794921875, -6.05078125, -5.561767578125, -5.07275390625, -4.583740234375, -4.0947265625, -3.605712890625, -3.11669921875, -2.627685546875, -2.138671875, -1.649658203125, -1.16064453125, -0.671630859375, -0.1826171875, 0.306396484375, 0.79541015625, 1.284423828125, 1.7734375, 2.262451171875, 2.75146484375, 3.240478515625, 3.7294921875, 4.218505859375, 4.70751953125, 5.196533203125, 5.685546875, 6.174560546875, 6.66357421875, 7.152587890625, 7.6416015625, 8.130615234375, 8.61962890625, 9.108642578125, 9.59765625, 10.086669921875, 10.57568359375, 11.064697265625, 11.5537109375, 12.042724609375, 12.53173828125, 13.020751953125, 13.509765625, 13.998779296875, 14.48779296875, 14.976806640625, 15.4658203125, 15.954833984375, 16.44384765625, 16.932861328125, 17.421875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 15.0, 14.0, 13.0, 17.0, 18.0, 24.0, 24.0, 27.0, 39.0, 46.0, 39.0, 42.0, 51.0, 46.0, 47.0, 32.0, 46.0, 43.0, 50.0, 38.0, 32.0, 39.0, 36.0, 35.0, 26.0, 29.0, 16.0, 27.0, 18.0, 16.0, 15.0, 8.0, 4.0, 11.0, 6.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0625, -12.6561279296875, -12.249755859375, -11.8433837890625, -11.43701171875, -11.0306396484375, -10.624267578125, -10.2178955078125, -9.8115234375, -9.4051513671875, -8.998779296875, -8.5924072265625, -8.18603515625, -7.7796630859375, -7.373291015625, -6.9669189453125, -6.560546875, -6.1541748046875, -5.747802734375, -5.3414306640625, -4.93505859375, -4.5286865234375, -4.122314453125, -3.7159423828125, -3.3095703125, -2.9031982421875, -2.496826171875, -2.0904541015625, -1.68408203125, -1.2777099609375, -0.871337890625, -0.4649658203125, -0.05859375, 0.3477783203125, 0.754150390625, 1.1605224609375, 1.56689453125, 1.9732666015625, 2.379638671875, 2.7860107421875, 3.1923828125, 3.5987548828125, 4.005126953125, 4.4114990234375, 4.81787109375, 5.2242431640625, 5.630615234375, 6.0369873046875, 6.443359375, 6.8497314453125, 7.256103515625, 7.6624755859375, 8.06884765625, 8.4752197265625, 8.881591796875, 9.2879638671875, 9.6943359375, 10.1007080078125, 10.507080078125, 10.9134521484375, 11.31982421875, 11.7261962890625, 12.132568359375, 12.5389404296875, 12.9453125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 6.0, 16.0, 11.0, 12.0, 24.0, 34.0, 44.0, 62.0, 64.0, 106.0, 134.0, 218.0, 301.0, 371.0, 563.0, 816.0, 1084.0, 1573.0, 2503.0, 3884.0, 7234.0, 18136.0, 64685.0, 213089.0, 362244.0, 247064.0, 81103.0, 22201.0, 8109.0, 4291.0, 2668.0, 1718.0, 1214.0, 863.0, 567.0, 470.0, 297.0, 204.0, 162.0, 121.0, 73.0, 64.0, 41.0, 25.0, 25.0, 21.0, 12.0, 11.0, 8.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.828125, -17.263671875, -16.69921875, -16.134765625, -15.5703125, -15.005859375, -14.44140625, -13.876953125, -13.3125, -12.748046875, -12.18359375, -11.619140625, -11.0546875, -10.490234375, -9.92578125, -9.361328125, -8.796875, -8.232421875, -7.66796875, -7.103515625, -6.5390625, -5.974609375, -5.41015625, -4.845703125, -4.28125, -3.716796875, -3.15234375, -2.587890625, -2.0234375, -1.458984375, -0.89453125, -0.330078125, 0.234375, 0.798828125, 1.36328125, 1.927734375, 2.4921875, 3.056640625, 3.62109375, 4.185546875, 4.75, 5.314453125, 5.87890625, 6.443359375, 7.0078125, 7.572265625, 8.13671875, 8.701171875, 9.265625, 9.830078125, 10.39453125, 10.958984375, 11.5234375, 12.087890625, 12.65234375, 13.216796875, 13.78125, 14.345703125, 14.91015625, 15.474609375, 16.0390625, 16.603515625, 17.16796875, 17.732421875, 18.296875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 3.0, 13.0, 14.0, 26.0, 46.0, 50.0, 65.0, 110.0, 100.0, 115.0, 113.0, 84.0, 82.0, 56.0, 38.0, 24.0, 18.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0014505386352539062, -0.0014026165008544922, -0.0013546943664550781, -0.001306772232055664, -0.00125885009765625, -0.001210927963256836, -0.0011630058288574219, -0.0011150836944580078, -0.0010671615600585938, -0.0010192394256591797, -0.0009713172912597656, -0.0009233951568603516, -0.0008754730224609375, -0.0008275508880615234, -0.0007796287536621094, -0.0007317066192626953, -0.0006837844848632812, -0.0006358623504638672, -0.0005879402160644531, -0.0005400180816650391, -0.000492095947265625, -0.00044417381286621094, -0.0003962516784667969, -0.0003483295440673828, -0.00030040740966796875, -0.0002524852752685547, -0.00020456314086914062, -0.00015664100646972656, -0.0001087188720703125, -6.079673767089844e-05, -1.2874603271484375e-05, 3.504753112792969e-05, 8.296966552734375e-05, 0.0001308917999267578, 0.00017881393432617188, 0.00022673606872558594, 0.000274658203125, 0.00032258033752441406, 0.0003705024719238281, 0.0004184246063232422, 0.00046634674072265625, 0.0005142688751220703, 0.0005621910095214844, 0.0006101131439208984, 0.0006580352783203125, 0.0007059574127197266, 0.0007538795471191406, 0.0008018016815185547, 0.0008497238159179688, 0.0008976459503173828, 0.0009455680847167969, 0.000993490219116211, 0.001041412353515625, 0.001089334487915039, 0.0011372566223144531, 0.0011851787567138672, 0.0012331008911132812, 0.0012810230255126953, 0.0013289451599121094, 0.0013768672943115234, 0.0014247894287109375, 0.0014727115631103516, 0.0015206336975097656, 0.0015685558319091797, 0.0016164779663085938]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 13.0, 16.0, 34.0, 33.0, 40.0, 83.0, 74.0, 134.0, 154.0, 220.0, 311.0, 413.0, 613.0, 886.0, 1273.0, 1820.0, 2770.0, 4629.0, 8967.0, 22128.0, 68421.0, 183058.0, 303686.0, 258430.0, 119130.0, 39715.0, 14046.0, 6240.0, 3628.0, 2312.0, 1561.0, 1066.0, 737.0, 529.0, 370.0, 278.0, 219.0, 143.0, 112.0, 70.0, 59.0, 41.0, 19.0, 27.0, 13.0, 9.0, 10.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-16.53125, -16.0416259765625, -15.552001953125, -15.0623779296875, -14.57275390625, -14.0831298828125, -13.593505859375, -13.1038818359375, -12.6142578125, -12.1246337890625, -11.635009765625, -11.1453857421875, -10.65576171875, -10.1661376953125, -9.676513671875, -9.1868896484375, -8.697265625, -8.2076416015625, -7.718017578125, -7.2283935546875, -6.73876953125, -6.2491455078125, -5.759521484375, -5.2698974609375, -4.7802734375, -4.2906494140625, -3.801025390625, -3.3114013671875, -2.82177734375, -2.3321533203125, -1.842529296875, -1.3529052734375, -0.86328125, -0.3736572265625, 0.115966796875, 0.6055908203125, 1.09521484375, 1.5848388671875, 2.074462890625, 2.5640869140625, 3.0537109375, 3.5433349609375, 4.032958984375, 4.5225830078125, 5.01220703125, 5.5018310546875, 5.991455078125, 6.4810791015625, 6.970703125, 7.4603271484375, 7.949951171875, 8.4395751953125, 8.92919921875, 9.4188232421875, 9.908447265625, 10.3980712890625, 10.8876953125, 11.3773193359375, 11.866943359375, 12.3565673828125, 12.84619140625, 13.3358154296875, 13.825439453125, 14.3150634765625, 14.8046875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 11.0, 3.0, 10.0, 12.0, 12.0, 29.0, 34.0, 46.0, 61.0, 62.0, 74.0, 94.0, 88.0, 76.0, 83.0, 70.0, 62.0, 54.0, 34.0, 35.0, 12.0, 9.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.24609375, -4.122711181640625, -3.99932861328125, -3.875946044921875, -3.7525634765625, -3.629180908203125, -3.50579833984375, -3.382415771484375, -3.259033203125, -3.135650634765625, -3.01226806640625, -2.888885498046875, -2.7655029296875, -2.642120361328125, -2.51873779296875, -2.395355224609375, -2.27197265625, -2.148590087890625, -2.02520751953125, -1.901824951171875, -1.7784423828125, -1.655059814453125, -1.53167724609375, -1.408294677734375, -1.284912109375, -1.161529541015625, -1.03814697265625, -0.914764404296875, -0.7913818359375, -0.667999267578125, -0.54461669921875, -0.421234130859375, -0.2978515625, -0.174468994140625, -0.05108642578125, 0.072296142578125, 0.1956787109375, 0.319061279296875, 0.44244384765625, 0.565826416015625, 0.689208984375, 0.812591552734375, 0.93597412109375, 1.059356689453125, 1.1827392578125, 1.306121826171875, 1.42950439453125, 1.552886962890625, 1.67626953125, 1.799652099609375, 1.92303466796875, 2.046417236328125, 2.1697998046875, 2.293182373046875, 2.41656494140625, 2.539947509765625, 2.663330078125, 2.786712646484375, 2.91009521484375, 3.033477783203125, 3.1568603515625, 3.280242919921875, 3.40362548828125, 3.527008056640625, 3.650390625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 6.0, 6.0, 6.0, 11.0, 14.0, 14.0, 12.0, 18.0, 18.0, 22.0, 23.0, 42.0, 43.0, 36.0, 39.0, 56.0, 52.0, 53.0, 57.0, 50.0, 58.0, 47.0, 44.0, 34.0, 32.0, 33.0, 27.0, 23.0, 24.0, 12.0, 22.0, 14.0, 13.0, 7.0, 5.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.366357803344727, -27.522932052612305, -26.679508209228516, -25.836082458496094, -24.992658615112305, -24.149232864379883, -23.305809020996094, -22.462383270263672, -21.61895751953125, -20.775531768798828, -19.93210792541504, -19.088682174682617, -18.245258331298828, -17.401832580566406, -16.558406829833984, -15.714982986450195, -14.871559143066406, -14.0281343460083, -13.184709548950195, -12.341283798217773, -11.497859954833984, -10.654434204101562, -9.811009407043457, -8.967584609985352, -8.124159812927246, -7.280735015869141, -6.437310218811035, -5.5938849449157715, -4.750460147857666, -3.9070353507995605, -3.063610076904297, -2.2201852798461914, -1.3767623901367188, -0.5333374738693237, 0.3100874423980713, 1.1535124778747559, 1.9969372749328613, 2.840362071990967, 3.6837873458862305, 4.527212142944336, 5.370636940002441, 6.214061737060547, 7.057486534118652, 7.900911808013916, 8.74433708190918, 9.587760925292969, 10.43118667602539, 11.274611473083496, 12.118036270141602, 12.961461067199707, 13.804885864257812, 14.648311614990234, 15.491735458374023, 16.335161209106445, 17.178585052490234, 18.022010803222656, 18.865436553955078, 19.7088623046875, 20.55228614807129, 21.39571189880371, 22.2391357421875, 23.082561492919922, 23.925987243652344, 24.769411087036133, 25.612834930419922]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 7.0, 2.0, 5.0, 8.0, 8.0, 6.0, 10.0, 12.0, 13.0, 11.0, 12.0, 21.0, 24.0, 23.0, 30.0, 23.0, 27.0, 33.0, 35.0, 34.0, 34.0, 41.0, 41.0, 46.0, 41.0, 40.0, 45.0, 36.0, 27.0, 41.0, 29.0, 28.0, 27.0, 18.0, 25.0, 19.0, 19.0, 18.0, 9.0, 13.0, 10.0, 15.0, 6.0, 6.0, 6.0, 8.0, 2.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.357778549194336, -18.75189971923828, -18.146018981933594, -17.54014015197754, -16.934261322021484, -16.328380584716797, -15.722501754760742, -15.116621971130371, -14.5107421875, -13.904862403869629, -13.298982620239258, -12.693103790283203, -12.087224006652832, -11.481344223022461, -10.875465393066406, -10.269585609436035, -9.663705825805664, -9.057826042175293, -8.451946258544922, -7.846067428588867, -7.240187644958496, -6.634307861328125, -6.028428554534912, -5.422549247741699, -4.816669464111328, -4.210789680480957, -3.604910373687744, -2.999030828475952, -2.39315128326416, -1.7872717380523682, -1.1813921928405762, -0.5755128860473633, 0.030366897583007812, 0.6362464427947998, 1.2421259880065918, 1.8480055332183838, 2.453885078430176, 3.0597646236419678, 3.6656441688537598, 4.271523475646973, 4.877403259277344, 5.483283042907715, 6.089162349700928, 6.695041656494141, 7.300921440124512, 7.906801223754883, 8.512680053710938, 9.118559837341309, 9.72443962097168, 10.33031940460205, 10.936199188232422, 11.542078018188477, 12.147957801818848, 12.753837585449219, 13.359716415405273, 13.965596199035645, 14.571475982666016, 15.177355766296387, 15.783235549926758, 16.389114379882812, 16.9949951171875, 17.600873947143555, 18.20675277709961, 18.812633514404297, 19.41851234436035]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 7.0, 11.0, 14.0, 19.0, 35.0, 47.0, 81.0, 119.0, 170.0, 297.0, 426.0, 623.0, 938.0, 1572.0, 2311.0, 3472.0, 5474.0, 8551.0, 13782.0, 21510.0, 34685.0, 55324.0, 88428.0, 141368.0, 223719.0, 341382.0, 484296.0, 601465.0, 614538.0, 516468.0, 371393.0, 245296.0, 156162.0, 96914.0, 60645.0, 37733.0, 23608.0, 14937.0, 9365.0, 6064.0, 3817.0, 2513.0, 1622.0, 1100.0, 715.0, 429.0, 267.0, 190.0, 132.0, 76.0, 57.0, 44.0, 30.0, 18.0, 11.0, 12.0, 6.0, 5.0, 2.0, 3.0], "bins": [-24.5625, -23.797607421875, -23.03271484375, -22.267822265625, -21.5029296875, -20.738037109375, -19.97314453125, -19.208251953125, -18.443359375, -17.678466796875, -16.91357421875, -16.148681640625, -15.3837890625, -14.618896484375, -13.85400390625, -13.089111328125, -12.32421875, -11.559326171875, -10.79443359375, -10.029541015625, -9.2646484375, -8.499755859375, -7.73486328125, -6.969970703125, -6.205078125, -5.440185546875, -4.67529296875, -3.910400390625, -3.1455078125, -2.380615234375, -1.61572265625, -0.850830078125, -0.0859375, 0.678955078125, 1.44384765625, 2.208740234375, 2.9736328125, 3.738525390625, 4.50341796875, 5.268310546875, 6.033203125, 6.798095703125, 7.56298828125, 8.327880859375, 9.0927734375, 9.857666015625, 10.62255859375, 11.387451171875, 12.15234375, 12.917236328125, 13.68212890625, 14.447021484375, 15.2119140625, 15.976806640625, 16.74169921875, 17.506591796875, 18.271484375, 19.036376953125, 19.80126953125, 20.566162109375, 21.3310546875, 22.095947265625, 22.86083984375, 23.625732421875, 24.390625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 9.0, 14.0, 14.0, 15.0, 23.0, 21.0, 24.0, 28.0, 29.0, 20.0, 28.0, 38.0, 47.0, 39.0, 57.0, 42.0, 55.0, 61.0, 39.0, 48.0, 43.0, 38.0, 50.0, 22.0, 22.0, 21.0, 25.0, 25.0, 20.0, 25.0, 12.0, 7.0, 3.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.953125, -22.201904296875, -21.45068359375, -20.699462890625, -19.9482421875, -19.197021484375, -18.44580078125, -17.694580078125, -16.943359375, -16.192138671875, -15.44091796875, -14.689697265625, -13.9384765625, -13.187255859375, -12.43603515625, -11.684814453125, -10.93359375, -10.182373046875, -9.43115234375, -8.679931640625, -7.9287109375, -7.177490234375, -6.42626953125, -5.675048828125, -4.923828125, -4.172607421875, -3.42138671875, -2.670166015625, -1.9189453125, -1.167724609375, -0.41650390625, 0.334716796875, 1.0859375, 1.837158203125, 2.58837890625, 3.339599609375, 4.0908203125, 4.842041015625, 5.59326171875, 6.344482421875, 7.095703125, 7.846923828125, 8.59814453125, 9.349365234375, 10.1005859375, 10.851806640625, 11.60302734375, 12.354248046875, 13.10546875, 13.856689453125, 14.60791015625, 15.359130859375, 16.1103515625, 16.861572265625, 17.61279296875, 18.364013671875, 19.115234375, 19.866455078125, 20.61767578125, 21.368896484375, 22.1201171875, 22.871337890625, 23.62255859375, 24.373779296875, 25.125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 6.0, 10.0, 11.0, 14.0, 22.0, 27.0, 57.0, 96.0, 140.0, 195.0, 299.0, 487.0, 769.0, 1203.0, 2046.0, 3198.0, 4941.0, 7870.0, 12607.0, 19934.0, 32042.0, 51914.0, 81793.0, 128815.0, 197220.0, 293557.0, 408202.0, 517807.0, 571639.0, 533195.0, 427061.0, 311535.0, 210995.0, 137969.0, 88221.0, 55237.0, 34956.0, 21769.0, 13350.0, 8656.0, 5331.0, 3378.0, 2075.0, 1326.0, 829.0, 532.0, 360.0, 236.0, 118.0, 91.0, 48.0, 40.0, 28.0, 13.0, 10.0, 8.0, 4.0, 3.0, 1.0, 1.0], "bins": [-32.0, -31.017822265625, -30.03564453125, -29.053466796875, -28.0712890625, -27.089111328125, -26.10693359375, -25.124755859375, -24.142578125, -23.160400390625, -22.17822265625, -21.196044921875, -20.2138671875, -19.231689453125, -18.24951171875, -17.267333984375, -16.28515625, -15.302978515625, -14.32080078125, -13.338623046875, -12.3564453125, -11.374267578125, -10.39208984375, -9.409912109375, -8.427734375, -7.445556640625, -6.46337890625, -5.481201171875, -4.4990234375, -3.516845703125, -2.53466796875, -1.552490234375, -0.5703125, 0.411865234375, 1.39404296875, 2.376220703125, 3.3583984375, 4.340576171875, 5.32275390625, 6.304931640625, 7.287109375, 8.269287109375, 9.25146484375, 10.233642578125, 11.2158203125, 12.197998046875, 13.18017578125, 14.162353515625, 15.14453125, 16.126708984375, 17.10888671875, 18.091064453125, 19.0732421875, 20.055419921875, 21.03759765625, 22.019775390625, 23.001953125, 23.984130859375, 24.96630859375, 25.948486328125, 26.9306640625, 27.912841796875, 28.89501953125, 29.877197265625, 30.859375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 6.0, 6.0, 1.0, 6.0, 4.0, 13.0, 16.0, 17.0, 23.0, 39.0, 39.0, 45.0, 40.0, 78.0, 86.0, 94.0, 131.0, 143.0, 140.0, 161.0, 188.0, 229.0, 261.0, 212.0, 227.0, 213.0, 240.0, 207.0, 195.0, 185.0, 153.0, 123.0, 102.0, 88.0, 78.0, 46.0, 59.0, 40.0, 38.0, 33.0, 20.0, 12.0, 7.0, 12.0, 10.0, 8.0, 2.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.625, -12.2335205078125, -11.842041015625, -11.4505615234375, -11.05908203125, -10.6676025390625, -10.276123046875, -9.8846435546875, -9.4931640625, -9.1016845703125, -8.710205078125, -8.3187255859375, -7.92724609375, -7.5357666015625, -7.144287109375, -6.7528076171875, -6.361328125, -5.9698486328125, -5.578369140625, -5.1868896484375, -4.79541015625, -4.4039306640625, -4.012451171875, -3.6209716796875, -3.2294921875, -2.8380126953125, -2.446533203125, -2.0550537109375, -1.66357421875, -1.2720947265625, -0.880615234375, -0.4891357421875, -0.09765625, 0.2938232421875, 0.685302734375, 1.0767822265625, 1.46826171875, 1.8597412109375, 2.251220703125, 2.6427001953125, 3.0341796875, 3.4256591796875, 3.817138671875, 4.2086181640625, 4.60009765625, 4.9915771484375, 5.383056640625, 5.7745361328125, 6.166015625, 6.5574951171875, 6.948974609375, 7.3404541015625, 7.73193359375, 8.1234130859375, 8.514892578125, 8.9063720703125, 9.2978515625, 9.6893310546875, 10.080810546875, 10.4722900390625, 10.86376953125, 11.2552490234375, 11.646728515625, 12.0382080078125, 12.4296875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 4.0, 6.0, 4.0, 7.0, 3.0, 5.0, 14.0, 24.0, 11.0, 26.0, 23.0, 33.0, 36.0, 42.0, 32.0, 60.0, 49.0, 60.0, 55.0, 53.0, 48.0, 43.0, 59.0, 35.0, 53.0, 31.0, 23.0, 23.0, 30.0, 28.0, 17.0, 9.0, 18.0, 4.0, 6.0, 5.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.580814361572266, -38.063297271728516, -36.5457763671875, -35.02825927734375, -33.5107421875, -31.993223190307617, -30.475704193115234, -28.958187103271484, -27.4406681060791, -25.92314910888672, -24.40563201904297, -22.888113021850586, -21.370594024658203, -19.853076934814453, -18.33555793762207, -16.818038940429688, -15.300521850585938, -13.783003807067871, -12.265485763549805, -10.747966766357422, -9.230448722839355, -7.712930679321289, -6.195411682128906, -4.67789363861084, -3.1603755950927734, -1.642857313156128, -0.12533903121948242, 1.3921794891357422, 2.9096975326538086, 4.427215576171875, 5.944734573364258, 7.462252616882324, 8.979766845703125, 10.497284889221191, 12.014802932739258, 13.53232192993164, 15.049839973449707, 16.567358016967773, 18.084877014160156, 19.602394104003906, 21.11991310119629, 22.637432098388672, 24.154949188232422, 25.672468185424805, 27.189987182617188, 28.707504272460938, 30.22502326965332, 31.742542266845703, 33.26005935668945, 34.7775764465332, 36.29509735107422, 37.81261444091797, 39.33013153076172, 40.84764862060547, 42.365169525146484, 43.882686614990234, 45.40020751953125, 46.917724609375, 48.435245513916016, 49.952762603759766, 51.470279693603516, 52.98780059814453, 54.50531768798828, 56.02283477783203, 57.54035186767578]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 2.0, 6.0, 12.0, 12.0, 6.0, 18.0, 10.0, 16.0, 26.0, 21.0, 35.0, 27.0, 23.0, 28.0, 22.0, 27.0, 28.0, 35.0, 30.0, 38.0, 37.0, 43.0, 27.0, 29.0, 42.0, 27.0, 39.0, 40.0, 36.0, 25.0, 28.0, 20.0, 19.0, 22.0, 19.0, 23.0, 11.0, 15.0, 15.0, 10.0, 3.0, 10.0, 5.0, 4.0, 3.0, 2.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.241344451904297, -24.418441772460938, -23.59554100036621, -22.77263832092285, -21.949735641479492, -21.126834869384766, -20.303932189941406, -19.481029510498047, -18.65812873840332, -17.83522605895996, -17.012325286865234, -16.189422607421875, -15.366520881652832, -14.543619155883789, -13.72071647644043, -12.897814750671387, -12.074912071228027, -11.252010345458984, -10.429107666015625, -9.606205940246582, -8.783304214477539, -7.960402011871338, -7.137499809265137, -6.314598083496094, -5.491695880889893, -4.668793678283691, -3.8458919525146484, -3.0229897499084473, -2.200087785720825, -1.3771858215332031, -0.554283618927002, 0.268618106842041, 1.0915203094482422, 1.9144222736358643, 2.7373242378234863, 3.5602264404296875, 4.3831281661987305, 5.206030368804932, 6.028932571411133, 6.851834297180176, 7.674736499786377, 8.497638702392578, 9.320540428161621, 10.143442153930664, 10.966344833374023, 11.789246559143066, 12.61214828491211, 13.435050964355469, 14.257952690124512, 15.080854415893555, 15.903757095336914, 16.72665786743164, 17.549560546875, 18.37246322631836, 19.19536590576172, 20.018266677856445, 20.841169357299805, 21.664072036743164, 22.48697280883789, 23.30987548828125, 24.13277816772461, 24.955678939819336, 25.778581619262695, 26.601482391357422, 27.42438507080078]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 6.0, 26.0, 28.0, 50.0, 74.0, 123.0, 212.0, 331.0, 501.0, 821.0, 1317.0, 2156.0, 3393.0, 5530.0, 9268.0, 15683.0, 26970.0, 45953.0, 78790.0, 129977.0, 188352.0, 193714.0, 138193.0, 84886.0, 50069.0, 29084.0, 17128.0, 10202.0, 5988.0, 3743.0, 2214.0, 1379.0, 863.0, 554.0, 367.0, 205.0, 152.0, 92.0, 48.0, 39.0, 21.0, 14.0, 9.0, 10.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.8515625, -9.5706787109375, -9.289794921875, -9.0089111328125, -8.72802734375, -8.4471435546875, -8.166259765625, -7.8853759765625, -7.6044921875, -7.3236083984375, -7.042724609375, -6.7618408203125, -6.48095703125, -6.2000732421875, -5.919189453125, -5.6383056640625, -5.357421875, -5.0765380859375, -4.795654296875, -4.5147705078125, -4.23388671875, -3.9530029296875, -3.672119140625, -3.3912353515625, -3.1103515625, -2.8294677734375, -2.548583984375, -2.2677001953125, -1.98681640625, -1.7059326171875, -1.425048828125, -1.1441650390625, -0.86328125, -0.5823974609375, -0.301513671875, -0.0206298828125, 0.26025390625, 0.5411376953125, 0.822021484375, 1.1029052734375, 1.3837890625, 1.6646728515625, 1.945556640625, 2.2264404296875, 2.50732421875, 2.7882080078125, 3.069091796875, 3.3499755859375, 3.630859375, 3.9117431640625, 4.192626953125, 4.4735107421875, 4.75439453125, 5.0352783203125, 5.316162109375, 5.5970458984375, 5.8779296875, 6.1588134765625, 6.439697265625, 6.7205810546875, 7.00146484375, 7.2823486328125, 7.563232421875, 7.8441162109375, 8.125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 4.0, 6.0, 10.0, 13.0, 21.0, 11.0, 18.0, 19.0, 24.0, 29.0, 27.0, 31.0, 30.0, 39.0, 23.0, 27.0, 36.0, 45.0, 34.0, 50.0, 37.0, 46.0, 39.0, 36.0, 25.0, 46.0, 32.0, 36.0, 24.0, 28.0, 20.0, 18.0, 17.0, 13.0, 11.0, 10.0, 7.0, 12.0, 9.0, 7.0, 3.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.578125, -30.547607421875, -29.51708984375, -28.486572265625, -27.4560546875, -26.425537109375, -25.39501953125, -24.364501953125, -23.333984375, -22.303466796875, -21.27294921875, -20.242431640625, -19.2119140625, -18.181396484375, -17.15087890625, -16.120361328125, -15.08984375, -14.059326171875, -13.02880859375, -11.998291015625, -10.9677734375, -9.937255859375, -8.90673828125, -7.876220703125, -6.845703125, -5.815185546875, -4.78466796875, -3.754150390625, -2.7236328125, -1.693115234375, -0.66259765625, 0.367919921875, 1.3984375, 2.428955078125, 3.45947265625, 4.489990234375, 5.5205078125, 6.551025390625, 7.58154296875, 8.612060546875, 9.642578125, 10.673095703125, 11.70361328125, 12.734130859375, 13.7646484375, 14.795166015625, 15.82568359375, 16.856201171875, 17.88671875, 18.917236328125, 19.94775390625, 20.978271484375, 22.0087890625, 23.039306640625, 24.06982421875, 25.100341796875, 26.130859375, 27.161376953125, 28.19189453125, 29.222412109375, 30.2529296875, 31.283447265625, 32.31396484375, 33.344482421875, 34.375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 13.0, 15.0, 19.0, 31.0, 41.0, 58.0, 80.0, 117.0, 157.0, 267.0, 411.0, 620.0, 947.0, 1559.0, 2556.0, 4578.0, 8171.0, 15179.0, 28274.0, 53397.0, 96614.0, 159712.0, 209131.0, 188790.0, 124221.0, 70527.0, 37560.0, 20036.0, 10775.0, 5869.0, 3442.0, 2036.0, 1215.0, 710.0, 464.0, 308.0, 203.0, 143.0, 90.0, 55.0, 40.0, 37.0, 27.0, 13.0, 11.0, 5.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0], "bins": [-9.6015625, -9.2989501953125, -8.996337890625, -8.6937255859375, -8.39111328125, -8.0885009765625, -7.785888671875, -7.4832763671875, -7.1806640625, -6.8780517578125, -6.575439453125, -6.2728271484375, -5.97021484375, -5.6676025390625, -5.364990234375, -5.0623779296875, -4.759765625, -4.4571533203125, -4.154541015625, -3.8519287109375, -3.54931640625, -3.2467041015625, -2.944091796875, -2.6414794921875, -2.3388671875, -2.0362548828125, -1.733642578125, -1.4310302734375, -1.12841796875, -0.8258056640625, -0.523193359375, -0.2205810546875, 0.08203125, 0.3846435546875, 0.687255859375, 0.9898681640625, 1.29248046875, 1.5950927734375, 1.897705078125, 2.2003173828125, 2.5029296875, 2.8055419921875, 3.108154296875, 3.4107666015625, 3.71337890625, 4.0159912109375, 4.318603515625, 4.6212158203125, 4.923828125, 5.2264404296875, 5.529052734375, 5.8316650390625, 6.13427734375, 6.4368896484375, 6.739501953125, 7.0421142578125, 7.3447265625, 7.6473388671875, 7.949951171875, 8.2525634765625, 8.55517578125, 8.8577880859375, 9.160400390625, 9.4630126953125, 9.765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 4.0, 10.0, 11.0, 12.0, 18.0, 22.0, 27.0, 28.0, 33.0, 24.0, 33.0, 40.0, 35.0, 34.0, 38.0, 43.0, 43.0, 51.0, 57.0, 41.0, 45.0, 47.0, 36.0, 37.0, 37.0, 27.0, 23.0, 27.0, 23.0, 24.0, 22.0, 7.0, 4.0, 6.0, 6.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.11279296875, -20.3818359375, -19.65087890625, -18.919921875, -18.18896484375, -17.4580078125, -16.72705078125, -15.99609375, -15.26513671875, -14.5341796875, -13.80322265625, -13.072265625, -12.34130859375, -11.6103515625, -10.87939453125, -10.1484375, -9.41748046875, -8.6865234375, -7.95556640625, -7.224609375, -6.49365234375, -5.7626953125, -5.03173828125, -4.30078125, -3.56982421875, -2.8388671875, -2.10791015625, -1.376953125, -0.64599609375, 0.0849609375, 0.81591796875, 1.546875, 2.27783203125, 3.0087890625, 3.73974609375, 4.470703125, 5.20166015625, 5.9326171875, 6.66357421875, 7.39453125, 8.12548828125, 8.8564453125, 9.58740234375, 10.318359375, 11.04931640625, 11.7802734375, 12.51123046875, 13.2421875, 13.97314453125, 14.7041015625, 15.43505859375, 16.166015625, 16.89697265625, 17.6279296875, 18.35888671875, 19.08984375, 19.82080078125, 20.5517578125, 21.28271484375, 22.013671875, 22.74462890625, 23.4755859375, 24.20654296875, 24.9375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 11.0, 12.0, 18.0, 8.0, 20.0, 37.0, 42.0, 55.0, 99.0, 181.0, 274.0, 391.0, 724.0, 1592.0, 3757.0, 9814.0, 29016.0, 97532.0, 313590.0, 388642.0, 140136.0, 40579.0, 12950.0, 4812.0, 2023.0, 901.0, 496.0, 304.0, 156.0, 101.0, 70.0, 52.0, 50.0, 27.0, 25.0, 13.0, 6.0, 10.0, 3.0, 6.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-4.63671875, -4.504791259765625, -4.37286376953125, -4.240936279296875, -4.1090087890625, -3.977081298828125, -3.84515380859375, -3.713226318359375, -3.581298828125, -3.449371337890625, -3.31744384765625, -3.185516357421875, -3.0535888671875, -2.921661376953125, -2.78973388671875, -2.657806396484375, -2.52587890625, -2.393951416015625, -2.26202392578125, -2.130096435546875, -1.9981689453125, -1.866241455078125, -1.73431396484375, -1.602386474609375, -1.470458984375, -1.338531494140625, -1.20660400390625, -1.074676513671875, -0.9427490234375, -0.810821533203125, -0.67889404296875, -0.546966552734375, -0.4150390625, -0.283111572265625, -0.15118408203125, -0.019256591796875, 0.1126708984375, 0.244598388671875, 0.37652587890625, 0.508453369140625, 0.640380859375, 0.772308349609375, 0.90423583984375, 1.036163330078125, 1.1680908203125, 1.300018310546875, 1.43194580078125, 1.563873291015625, 1.69580078125, 1.827728271484375, 1.95965576171875, 2.091583251953125, 2.2235107421875, 2.355438232421875, 2.48736572265625, 2.619293212890625, 2.751220703125, 2.883148193359375, 3.01507568359375, 3.147003173828125, 3.2789306640625, 3.410858154296875, 3.54278564453125, 3.674713134765625, 3.806640625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 1.0, 4.0, 13.0, 10.0, 13.0, 14.0, 15.0, 26.0, 22.0, 26.0, 39.0, 32.0, 26.0, 40.0, 49.0, 46.0, 50.0, 49.0, 58.0, 59.0, 51.0, 41.0, 42.0, 51.0, 31.0, 36.0, 31.0, 20.0, 16.0, 24.0, 14.0, 6.0, 8.0, 5.0, 8.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00013375282287597656, -0.0001295916736125946, -0.00012543052434921265, -0.00012126937508583069, -0.00011710822582244873, -0.00011294707655906677, -0.00010878592729568481, -0.00010462477803230286, -0.0001004636287689209, -9.630247950553894e-05, -9.214133024215698e-05, -8.798018097877502e-05, -8.381903171539307e-05, -7.965788245201111e-05, -7.549673318862915e-05, -7.133558392524719e-05, -6.717443466186523e-05, -6.301328539848328e-05, -5.885213613510132e-05, -5.469098687171936e-05, -5.05298376083374e-05, -4.6368688344955444e-05, -4.2207539081573486e-05, -3.804638981819153e-05, -3.388524055480957e-05, -2.9724091291427612e-05, -2.5562942028045654e-05, -2.1401792764663696e-05, -1.7240643501281738e-05, -1.307949423789978e-05, -8.918344974517822e-06, -4.757195711135864e-06, -5.960464477539062e-07, 3.5651028156280518e-06, 7.72625207901001e-06, 1.1887401342391968e-05, 1.6048550605773926e-05, 2.0209699869155884e-05, 2.4370849132537842e-05, 2.85319983959198e-05, 3.269314765930176e-05, 3.6854296922683716e-05, 4.1015446186065674e-05, 4.517659544944763e-05, 4.933774471282959e-05, 5.349889397621155e-05, 5.7660043239593506e-05, 6.182119250297546e-05, 6.598234176635742e-05, 7.014349102973938e-05, 7.430464029312134e-05, 7.84657895565033e-05, 8.262693881988525e-05, 8.678808808326721e-05, 9.094923734664917e-05, 9.511038661003113e-05, 9.927153587341309e-05, 0.00010343268513679504, 0.000107593834400177, 0.00011175498366355896, 0.00011591613292694092, 0.00012007728219032288, 0.00012423843145370483, 0.0001283995807170868, 0.00013256072998046875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 0.0, 3.0, 2.0, 8.0, 10.0, 11.0, 23.0, 24.0, 44.0, 61.0, 100.0, 117.0, 167.0, 259.0, 350.0, 437.0, 627.0, 964.0, 1504.0, 2570.0, 4612.0, 9430.0, 20022.0, 45594.0, 109991.0, 259794.0, 320764.0, 154483.0, 62705.0, 26955.0, 12238.0, 5895.0, 3284.0, 1802.0, 1144.0, 806.0, 507.0, 366.0, 275.0, 196.0, 115.0, 107.0, 54.0, 40.0, 35.0, 21.0, 13.0, 13.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.30078125, -5.14105224609375, -4.9813232421875, -4.82159423828125, -4.661865234375, -4.50213623046875, -4.3424072265625, -4.18267822265625, -4.02294921875, -3.86322021484375, -3.7034912109375, -3.54376220703125, -3.384033203125, -3.22430419921875, -3.0645751953125, -2.90484619140625, -2.7451171875, -2.58538818359375, -2.4256591796875, -2.26593017578125, -2.106201171875, -1.94647216796875, -1.7867431640625, -1.62701416015625, -1.46728515625, -1.30755615234375, -1.1478271484375, -0.98809814453125, -0.828369140625, -0.66864013671875, -0.5089111328125, -0.34918212890625, -0.189453125, -0.02972412109375, 0.1300048828125, 0.28973388671875, 0.449462890625, 0.60919189453125, 0.7689208984375, 0.92864990234375, 1.08837890625, 1.24810791015625, 1.4078369140625, 1.56756591796875, 1.727294921875, 1.88702392578125, 2.0467529296875, 2.20648193359375, 2.3662109375, 2.52593994140625, 2.6856689453125, 2.84539794921875, 3.005126953125, 3.16485595703125, 3.3245849609375, 3.48431396484375, 3.64404296875, 3.80377197265625, 3.9635009765625, 4.12322998046875, 4.282958984375, 4.44268798828125, 4.6024169921875, 4.76214599609375, 4.921875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 11.0, 4.0, 6.0, 9.0, 17.0, 23.0, 24.0, 23.0, 30.0, 45.0, 35.0, 46.0, 63.0, 87.0, 87.0, 86.0, 73.0, 73.0, 49.0, 50.0, 41.0, 25.0, 20.0, 16.0, 8.0, 12.0, 3.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.150390625, -1.1121673583984375, -1.073944091796875, -1.0357208251953125, -0.99749755859375, -0.9592742919921875, -0.921051025390625, -0.8828277587890625, -0.8446044921875, -0.8063812255859375, -0.768157958984375, -0.7299346923828125, -0.69171142578125, -0.6534881591796875, -0.615264892578125, -0.5770416259765625, -0.538818359375, -0.5005950927734375, -0.462371826171875, -0.4241485595703125, -0.38592529296875, -0.3477020263671875, -0.309478759765625, -0.2712554931640625, -0.2330322265625, -0.1948089599609375, -0.156585693359375, -0.1183624267578125, -0.08013916015625, -0.0419158935546875, -0.003692626953125, 0.0345306396484375, 0.07275390625, 0.1109771728515625, 0.149200439453125, 0.1874237060546875, 0.22564697265625, 0.2638702392578125, 0.302093505859375, 0.3403167724609375, 0.3785400390625, 0.4167633056640625, 0.454986572265625, 0.4932098388671875, 0.53143310546875, 0.5696563720703125, 0.607879638671875, 0.6461029052734375, 0.684326171875, 0.7225494384765625, 0.760772705078125, 0.7989959716796875, 0.83721923828125, 0.8754425048828125, 0.913665771484375, 0.9518890380859375, 0.9901123046875, 1.0283355712890625, 1.066558837890625, 1.1047821044921875, 1.14300537109375, 1.1812286376953125, 1.219451904296875, 1.2576751708984375, 1.2958984375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 7.0, 3.0, 9.0, 3.0, 4.0, 7.0, 8.0, 13.0, 18.0, 20.0, 23.0, 28.0, 41.0, 32.0, 43.0, 40.0, 54.0, 57.0, 56.0, 56.0, 50.0, 49.0, 57.0, 43.0, 42.0, 45.0, 25.0, 24.0, 25.0, 36.0, 18.0, 12.0, 10.0, 12.0, 7.0, 5.0, 4.0, 2.0, 6.0, 1.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.25777816772461, -39.71240997314453, -38.16703796386719, -36.621665954589844, -35.076297760009766, -33.53092956542969, -31.985557556152344, -30.440187454223633, -28.894817352294922, -27.34944725036621, -25.8040771484375, -24.25870704650879, -22.713336944580078, -21.167966842651367, -19.622596740722656, -18.077226638793945, -16.531856536865234, -14.986486434936523, -13.441116333007812, -11.895746231079102, -10.35037612915039, -8.80500602722168, -7.259635925292969, -5.714265823364258, -4.168895721435547, -2.623525619506836, -1.078155517578125, 0.46721458435058594, 2.012584686279297, 3.557954788208008, 5.103324890136719, 6.64869499206543, 8.19406509399414, 9.739435195922852, 11.284805297851562, 12.830175399780273, 14.375545501708984, 15.920915603637695, 17.466285705566406, 19.011655807495117, 20.557025909423828, 22.10239601135254, 23.64776611328125, 25.19313621520996, 26.738506317138672, 28.283876419067383, 29.829246520996094, 31.374616622924805, 32.919986724853516, 34.465354919433594, 36.01072692871094, 37.55609893798828, 39.10146713256836, 40.64683532714844, 42.19220733642578, 43.737579345703125, 45.2829475402832, 46.82831573486328, 48.373687744140625, 49.91905975341797, 51.46442794799805, 53.009796142578125, 54.55516815185547, 56.10054016113281, 57.64590835571289]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 3.0, 5.0, 10.0, 13.0, 7.0, 18.0, 15.0, 12.0, 26.0, 23.0, 33.0, 23.0, 28.0, 18.0, 32.0, 22.0, 34.0, 30.0, 32.0, 37.0, 39.0, 39.0, 32.0, 27.0, 41.0, 30.0, 41.0, 40.0, 31.0, 28.0, 25.0, 22.0, 21.0, 18.0, 21.0, 25.0, 11.0, 17.0, 12.0, 8.0, 5.0, 8.0, 5.0, 5.0, 2.0, 3.0, 8.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-25.646669387817383, -24.813852310180664, -23.981035232543945, -23.148218154907227, -22.315401077270508, -21.482582092285156, -20.649765014648438, -19.81694793701172, -18.984130859375, -18.15131378173828, -17.318496704101562, -16.485679626464844, -15.652861595153809, -14.82004451751709, -13.987227439880371, -13.154409408569336, -12.321593284606934, -11.488776206970215, -10.655959129333496, -9.823141098022461, -8.990324020385742, -8.157506942749023, -7.324689865112305, -6.491872310638428, -5.659055233001709, -4.82623815536499, -3.9934206008911133, -3.1606035232543945, -2.3277862071990967, -1.4949688911437988, -0.6621518135070801, 0.17066574096679688, 1.0034828186035156, 1.8363001346588135, 2.6691174507141113, 3.50193452835083, 4.334752082824707, 5.167569160461426, 6.0003862380981445, 6.8332037925720215, 7.66602087020874, 8.498838424682617, 9.331655502319336, 10.164472579956055, 10.997289657592773, 11.830106735229492, 12.662923812866211, 13.495741844177246, 14.328558921813965, 15.161375999450684, 15.994193077087402, 16.827011108398438, 17.659828186035156, 18.492645263671875, 19.325462341308594, 20.158279418945312, 20.99109649658203, 21.82391357421875, 22.65673065185547, 23.489547729492188, 24.322364807128906, 25.155181884765625, 25.987998962402344, 26.820817947387695, 27.653635025024414]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 7.0, 12.0, 15.0, 11.0, 33.0, 35.0, 52.0, 92.0, 100.0, 189.0, 248.0, 350.0, 590.0, 872.0, 1451.0, 2056.0, 3393.0, 5286.0, 8390.0, 13652.0, 22094.0, 35968.0, 57559.0, 88617.0, 123873.0, 150779.0, 152204.0, 127327.0, 91987.0, 60791.0, 38222.0, 23271.0, 14460.0, 8861.0, 5635.0, 3442.0, 2306.0, 1512.0, 962.0, 605.0, 418.0, 276.0, 184.0, 106.0, 75.0, 63.0, 36.0, 32.0, 31.0, 13.0, 6.0, 6.0, 2.0, 3.0, 2.0], "bins": [-29.03125, -28.203125, -27.375, -26.546875, -25.71875, -24.890625, -24.0625, -23.234375, -22.40625, -21.578125, -20.75, -19.921875, -19.09375, -18.265625, -17.4375, -16.609375, -15.78125, -14.953125, -14.125, -13.296875, -12.46875, -11.640625, -10.8125, -9.984375, -9.15625, -8.328125, -7.5, -6.671875, -5.84375, -5.015625, -4.1875, -3.359375, -2.53125, -1.703125, -0.875, -0.046875, 0.78125, 1.609375, 2.4375, 3.265625, 4.09375, 4.921875, 5.75, 6.578125, 7.40625, 8.234375, 9.0625, 9.890625, 10.71875, 11.546875, 12.375, 13.203125, 14.03125, 14.859375, 15.6875, 16.515625, 17.34375, 18.171875, 19.0, 19.828125, 20.65625, 21.484375, 22.3125, 23.140625, 23.96875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 5.0, 2.0, 5.0, 7.0, 8.0, 10.0, 12.0, 21.0, 22.0, 21.0, 21.0, 29.0, 31.0, 34.0, 33.0, 39.0, 37.0, 30.0, 43.0, 41.0, 51.0, 44.0, 47.0, 41.0, 43.0, 39.0, 44.0, 41.0, 29.0, 31.0, 21.0, 21.0, 15.0, 14.0, 9.0, 12.0, 12.0, 11.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-35.40625, -34.32763671875, -33.2490234375, -32.17041015625, -31.091796875, -30.01318359375, -28.9345703125, -27.85595703125, -26.77734375, -25.69873046875, -24.6201171875, -23.54150390625, -22.462890625, -21.38427734375, -20.3056640625, -19.22705078125, -18.1484375, -17.06982421875, -15.9912109375, -14.91259765625, -13.833984375, -12.75537109375, -11.6767578125, -10.59814453125, -9.51953125, -8.44091796875, -7.3623046875, -6.28369140625, -5.205078125, -4.12646484375, -3.0478515625, -1.96923828125, -0.890625, 0.18798828125, 1.2666015625, 2.34521484375, 3.423828125, 4.50244140625, 5.5810546875, 6.65966796875, 7.73828125, 8.81689453125, 9.8955078125, 10.97412109375, 12.052734375, 13.13134765625, 14.2099609375, 15.28857421875, 16.3671875, 17.44580078125, 18.5244140625, 19.60302734375, 20.681640625, 21.76025390625, 22.8388671875, 23.91748046875, 24.99609375, 26.07470703125, 27.1533203125, 28.23193359375, 29.310546875, 30.38916015625, 31.4677734375, 32.54638671875, 33.625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 6.0, 16.0, 24.0, 27.0, 42.0, 71.0, 103.0, 116.0, 207.0, 319.0, 446.0, 644.0, 969.0, 1432.0, 2011.0, 3250.0, 4857.0, 7611.0, 12095.0, 19903.0, 33086.0, 55142.0, 90673.0, 137888.0, 175594.0, 169790.0, 125937.0, 80155.0, 48473.0, 28998.0, 17880.0, 10938.0, 6785.0, 4429.0, 2851.0, 1852.0, 1247.0, 862.0, 554.0, 405.0, 283.0, 195.0, 115.0, 82.0, 60.0, 50.0, 25.0, 22.0, 9.0, 12.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.40625, -39.138671875, -37.87109375, -36.603515625, -35.3359375, -34.068359375, -32.80078125, -31.533203125, -30.265625, -28.998046875, -27.73046875, -26.462890625, -25.1953125, -23.927734375, -22.66015625, -21.392578125, -20.125, -18.857421875, -17.58984375, -16.322265625, -15.0546875, -13.787109375, -12.51953125, -11.251953125, -9.984375, -8.716796875, -7.44921875, -6.181640625, -4.9140625, -3.646484375, -2.37890625, -1.111328125, 0.15625, 1.423828125, 2.69140625, 3.958984375, 5.2265625, 6.494140625, 7.76171875, 9.029296875, 10.296875, 11.564453125, 12.83203125, 14.099609375, 15.3671875, 16.634765625, 17.90234375, 19.169921875, 20.4375, 21.705078125, 22.97265625, 24.240234375, 25.5078125, 26.775390625, 28.04296875, 29.310546875, 30.578125, 31.845703125, 33.11328125, 34.380859375, 35.6484375, 36.916015625, 38.18359375, 39.451171875, 40.71875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 7.0, 14.0, 5.0, 10.0, 15.0, 9.0, 29.0, 22.0, 20.0, 23.0, 20.0, 27.0, 34.0, 49.0, 39.0, 37.0, 43.0, 41.0, 46.0, 42.0, 39.0, 36.0, 33.0, 42.0, 31.0, 32.0, 36.0, 26.0, 30.0, 31.0, 15.0, 20.0, 16.0, 11.0, 9.0, 13.0, 6.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-22.09375, -21.464111328125, -20.83447265625, -20.204833984375, -19.5751953125, -18.945556640625, -18.31591796875, -17.686279296875, -17.056640625, -16.427001953125, -15.79736328125, -15.167724609375, -14.5380859375, -13.908447265625, -13.27880859375, -12.649169921875, -12.01953125, -11.389892578125, -10.76025390625, -10.130615234375, -9.5009765625, -8.871337890625, -8.24169921875, -7.612060546875, -6.982421875, -6.352783203125, -5.72314453125, -5.093505859375, -4.4638671875, -3.834228515625, -3.20458984375, -2.574951171875, -1.9453125, -1.315673828125, -0.68603515625, -0.056396484375, 0.5732421875, 1.202880859375, 1.83251953125, 2.462158203125, 3.091796875, 3.721435546875, 4.35107421875, 4.980712890625, 5.6103515625, 6.239990234375, 6.86962890625, 7.499267578125, 8.12890625, 8.758544921875, 9.38818359375, 10.017822265625, 10.6474609375, 11.277099609375, 11.90673828125, 12.536376953125, 13.166015625, 13.795654296875, 14.42529296875, 15.054931640625, 15.6845703125, 16.314208984375, 16.94384765625, 17.573486328125, 18.203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 5.0, 11.0, 14.0, 17.0, 26.0, 37.0, 50.0, 61.0, 93.0, 111.0, 165.0, 199.0, 348.0, 461.0, 711.0, 1088.0, 1752.0, 2945.0, 5250.0, 9819.0, 19477.0, 40314.0, 81826.0, 146594.0, 208170.0, 209168.0, 150196.0, 83960.0, 41660.0, 20058.0, 10198.0, 5454.0, 2991.0, 1783.0, 1167.0, 782.0, 492.0, 312.0, 215.0, 156.0, 110.0, 90.0, 47.0, 48.0, 40.0, 30.0, 23.0, 10.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.859375, -16.31591796875, -15.7724609375, -15.22900390625, -14.685546875, -14.14208984375, -13.5986328125, -13.05517578125, -12.51171875, -11.96826171875, -11.4248046875, -10.88134765625, -10.337890625, -9.79443359375, -9.2509765625, -8.70751953125, -8.1640625, -7.62060546875, -7.0771484375, -6.53369140625, -5.990234375, -5.44677734375, -4.9033203125, -4.35986328125, -3.81640625, -3.27294921875, -2.7294921875, -2.18603515625, -1.642578125, -1.09912109375, -0.5556640625, -0.01220703125, 0.53125, 1.07470703125, 1.6181640625, 2.16162109375, 2.705078125, 3.24853515625, 3.7919921875, 4.33544921875, 4.87890625, 5.42236328125, 5.9658203125, 6.50927734375, 7.052734375, 7.59619140625, 8.1396484375, 8.68310546875, 9.2265625, 9.77001953125, 10.3134765625, 10.85693359375, 11.400390625, 11.94384765625, 12.4873046875, 13.03076171875, 13.57421875, 14.11767578125, 14.6611328125, 15.20458984375, 15.748046875, 16.29150390625, 16.8349609375, 17.37841796875, 17.921875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 11.0, 7.0, 7.0, 12.0, 16.0, 28.0, 17.0, 20.0, 30.0, 40.0, 63.0, 60.0, 68.0, 59.0, 78.0, 65.0, 69.0, 71.0, 52.0, 52.0, 35.0, 36.0, 26.0, 19.0, 16.0, 9.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023193359375, -0.0022589415311813354, -0.002198547124862671, -0.0021381527185440063, -0.002077758312225342, -0.0020173639059066772, -0.0019569694995880127, -0.0018965750932693481, -0.0018361806869506836, -0.001775786280632019, -0.0017153918743133545, -0.00165499746799469, -0.0015946030616760254, -0.0015342086553573608, -0.0014738142490386963, -0.0014134198427200317, -0.0013530254364013672, -0.0012926310300827026, -0.001232236623764038, -0.0011718422174453735, -0.001111447811126709, -0.0010510534048080444, -0.0009906589984893799, -0.0009302645921707153, -0.0008698701858520508, -0.0008094757795333862, -0.0007490813732147217, -0.0006886869668960571, -0.0006282925605773926, -0.000567898154258728, -0.0005075037479400635, -0.0004471093416213989, -0.0003867149353027344, -0.0003263205289840698, -0.0002659261226654053, -0.00020553171634674072, -0.00014513731002807617, -8.474290370941162e-05, -2.434849739074707e-05, 3.604590892791748e-05, 9.644031524658203e-05, 0.00015683472156524658, 0.00021722912788391113, 0.0002776235342025757, 0.00033801794052124023, 0.0003984123468399048, 0.00045880675315856934, 0.0005192011594772339, 0.0005795955657958984, 0.000639989972114563, 0.0007003843784332275, 0.0007607787847518921, 0.0008211731910705566, 0.0008815675973892212, 0.0009419620037078857, 0.0010023564100265503, 0.0010627508163452148, 0.0011231452226638794, 0.001183539628982544, 0.0012439340353012085, 0.001304328441619873, 0.0013647228479385376, 0.0014251172542572021, 0.0014855116605758667, 0.0015459060668945312]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 3.0, 7.0, 14.0, 12.0, 22.0, 32.0, 33.0, 53.0, 65.0, 119.0, 208.0, 304.0, 529.0, 949.0, 1796.0, 3689.0, 8077.0, 20085.0, 53871.0, 136749.0, 254920.0, 278078.0, 171198.0, 71247.0, 26370.0, 10345.0, 4665.0, 2259.0, 1134.0, 666.0, 386.0, 232.0, 143.0, 80.0, 75.0, 37.0, 22.0, 20.0, 27.0, 10.0, 2.0, 9.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.83642578125, -22.1259765625, -21.41552734375, -20.705078125, -19.99462890625, -19.2841796875, -18.57373046875, -17.86328125, -17.15283203125, -16.4423828125, -15.73193359375, -15.021484375, -14.31103515625, -13.6005859375, -12.89013671875, -12.1796875, -11.46923828125, -10.7587890625, -10.04833984375, -9.337890625, -8.62744140625, -7.9169921875, -7.20654296875, -6.49609375, -5.78564453125, -5.0751953125, -4.36474609375, -3.654296875, -2.94384765625, -2.2333984375, -1.52294921875, -0.8125, -0.10205078125, 0.6083984375, 1.31884765625, 2.029296875, 2.73974609375, 3.4501953125, 4.16064453125, 4.87109375, 5.58154296875, 6.2919921875, 7.00244140625, 7.712890625, 8.42333984375, 9.1337890625, 9.84423828125, 10.5546875, 11.26513671875, 11.9755859375, 12.68603515625, 13.396484375, 14.10693359375, 14.8173828125, 15.52783203125, 16.23828125, 16.94873046875, 17.6591796875, 18.36962890625, 19.080078125, 19.79052734375, 20.5009765625, 21.21142578125, 21.921875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 2.0, 2.0, 2.0, 10.0, 8.0, 8.0, 11.0, 19.0, 25.0, 35.0, 49.0, 44.0, 41.0, 41.0, 55.0, 61.0, 52.0, 60.0, 74.0, 67.0, 44.0, 26.0, 44.0, 41.0, 29.0, 27.0, 23.0, 26.0, 20.0, 14.0, 9.0, 7.0, 5.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.15625, -5.019775390625, -4.88330078125, -4.746826171875, -4.6103515625, -4.473876953125, -4.33740234375, -4.200927734375, -4.064453125, -3.927978515625, -3.79150390625, -3.655029296875, -3.5185546875, -3.382080078125, -3.24560546875, -3.109130859375, -2.97265625, -2.836181640625, -2.69970703125, -2.563232421875, -2.4267578125, -2.290283203125, -2.15380859375, -2.017333984375, -1.880859375, -1.744384765625, -1.60791015625, -1.471435546875, -1.3349609375, -1.198486328125, -1.06201171875, -0.925537109375, -0.7890625, -0.652587890625, -0.51611328125, -0.379638671875, -0.2431640625, -0.106689453125, 0.02978515625, 0.166259765625, 0.302734375, 0.439208984375, 0.57568359375, 0.712158203125, 0.8486328125, 0.985107421875, 1.12158203125, 1.258056640625, 1.39453125, 1.531005859375, 1.66748046875, 1.803955078125, 1.9404296875, 2.076904296875, 2.21337890625, 2.349853515625, 2.486328125, 2.622802734375, 2.75927734375, 2.895751953125, 3.0322265625, 3.168701171875, 3.30517578125, 3.441650390625, 3.578125]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 6.0, 3.0, 4.0, 3.0, 3.0, 7.0, 10.0, 3.0, 6.0, 12.0, 16.0, 18.0, 24.0, 22.0, 34.0, 22.0, 39.0, 32.0, 39.0, 43.0, 41.0, 48.0, 49.0, 52.0, 42.0, 44.0, 49.0, 44.0, 30.0, 32.0, 36.0, 28.0, 26.0, 31.0, 24.0, 14.0, 14.0, 11.0, 5.0, 8.0, 4.0, 6.0, 9.0, 4.0, 1.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.27381896972656, -36.83565902709961, -35.39749526977539, -33.95933532714844, -32.52117156982422, -31.083009719848633, -29.644847869873047, -28.206687927246094, -26.768524169921875, -25.33036231994629, -23.892200469970703, -22.454038619995117, -21.01587677001953, -19.577714920043945, -18.13955307006836, -16.701393127441406, -15.26323127746582, -13.825069427490234, -12.386907577514648, -10.948745727539062, -9.510583877563477, -8.07242202758789, -6.634261131286621, -5.196099281311035, -3.757937431335449, -2.3197755813598633, -0.8816139698028564, 0.5565476417541504, 1.9947094917297363, 3.4328713417053223, 4.87103271484375, 6.309194564819336, 7.747356414794922, 9.185518264770508, 10.623680114746094, 12.06184196472168, 13.500003814697266, 14.938165664672852, 16.376327514648438, 17.81448745727539, 19.25265121459961, 20.690813064575195, 22.12897491455078, 23.567136764526367, 25.005298614501953, 26.44346046447754, 27.881622314453125, 29.319782257080078, 30.757944107055664, 32.19610595703125, 33.6342658996582, 35.07242965698242, 36.510589599609375, 37.948753356933594, 39.38691329956055, 40.825077056884766, 42.26323699951172, 43.70139694213867, 45.13956069946289, 46.577720642089844, 48.01588439941406, 49.454044342041016, 50.892208099365234, 52.33036804199219, 53.768531799316406]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 11.0, 5.0, 7.0, 10.0, 12.0, 18.0, 19.0, 22.0, 19.0, 20.0, 28.0, 24.0, 27.0, 39.0, 33.0, 45.0, 36.0, 27.0, 49.0, 53.0, 45.0, 37.0, 41.0, 30.0, 37.0, 44.0, 32.0, 21.0, 23.0, 29.0, 19.0, 19.0, 21.0, 17.0, 13.0, 7.0, 16.0, 9.0, 5.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.30934143066406, -40.074867248535156, -38.840389251708984, -37.60591506958008, -36.371437072753906, -35.136962890625, -33.90248489379883, -32.66801071166992, -31.433534622192383, -30.199058532714844, -28.964582443237305, -27.730106353759766, -26.49563217163086, -25.261154174804688, -24.02667999267578, -22.792203903198242, -21.557727813720703, -20.323251724243164, -19.088775634765625, -17.854299545288086, -16.619823455810547, -15.385348320007324, -14.150873184204102, -12.916397094726562, -11.681921005249023, -10.447444915771484, -9.212968826293945, -7.978493690490723, -6.744017601013184, -5.5095415115356445, -4.275065898895264, -3.040590286254883, -1.8061103820800781, -0.5716345310211182, 0.6628413200378418, 1.8973171710968018, 3.1317930221557617, 4.366269111633301, 5.600744724273682, 6.8352203369140625, 8.069696426391602, 9.30417251586914, 10.53864860534668, 11.773123741149902, 13.007599830627441, 14.24207592010498, 15.476551055908203, 16.711027145385742, 17.94550323486328, 19.17997932434082, 20.41445541381836, 21.6489315032959, 22.883407592773438, 24.117881774902344, 25.352357864379883, 26.586833953857422, 27.82131004333496, 29.0557861328125, 30.29026222229004, 31.524738311767578, 32.759212493896484, 33.993690490722656, 35.22816467285156, 36.46263885498047, 37.69711685180664]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 9.0, 14.0, 12.0, 16.0, 20.0, 34.0, 48.0, 53.0, 85.0, 111.0, 177.0, 247.0, 433.0, 601.0, 959.0, 1485.0, 2162.0, 3544.0, 5398.0, 10746.0, 479210.0, 6755.0, 4244.0, 2696.0, 1769.0, 1176.0, 710.0, 485.0, 319.0, 225.0, 165.0, 91.0, 76.0, 48.0, 30.0, 26.0, 30.0, 17.0, 8.0, 10.0, 8.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-622.2182006835938, -603.4912719726562, -584.7643432617188, -566.0374145507812, -547.3104858398438, -528.5835571289062, -509.85662841796875, -491.12969970703125, -472.40277099609375, -453.67584228515625, -434.94891357421875, -416.22198486328125, -397.49505615234375, -378.76812744140625, -360.04119873046875, -341.31427001953125, -322.5873718261719, -303.8604431152344, -285.1335144042969, -266.4065856933594, -247.67965698242188, -228.95272827148438, -210.22581481933594, -191.49888610839844, -172.77195739746094, -154.04502868652344, -135.31809997558594, -116.59117889404297, -97.86425018310547, -79.13732147216797, -60.410400390625, -41.6834716796875, -22.95654296875, -4.229616165161133, 14.497310638427734, 33.22423553466797, 51.95116424560547, 70.67809295654297, 89.40501403808594, 108.13194274902344, 126.85887145996094, 145.58580017089844, 164.31272888183594, 183.03964233398438, 201.76657104492188, 220.49349975585938, 239.22042846679688, 257.9473571777344, 276.6742858886719, 295.4012145996094, 314.1281433105469, 332.8550720214844, 351.5820007324219, 370.3089294433594, 389.03582763671875, 407.76275634765625, 426.48968505859375, 445.21661376953125, 463.94354248046875, 482.67047119140625, 501.39739990234375, 520.1243286132812, 538.8512573242188, 557.5781860351562, 576.3051147460938]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 7.0, 6.0, 15.0, 17.0, 17.0, 20.0, 20.0, 21.0, 19.0, 33.0, 23.0, 39.0, 33.0, 38.0, 45.0, 27.0, 46.0, 56.0, 1068.0, 40.0, 33.0, 36.0, 39.0, 37.0, 41.0, 22.0, 24.0, 27.0, 21.0, 17.0, 22.0, 16.0, 14.0, 10.0, 17.0, 8.0, 5.0, 6.0, 6.0, 5.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1273.25439453125, -1235.2457275390625, -1197.237060546875, -1159.2283935546875, -1121.2197265625, -1083.211181640625, -1045.202392578125, -1007.19384765625, -969.1851806640625, -931.176513671875, -893.1678466796875, -855.1591796875, -817.1505737304688, -779.1419067382812, -741.1332397460938, -703.1246337890625, -665.1159057617188, -627.1072387695312, -589.0985717773438, -551.0899658203125, -513.081298828125, -475.0726318359375, -437.06396484375, -399.0553283691406, -361.0466613769531, -323.0379943847656, -285.02935791015625, -247.02069091796875, -209.0120391845703, -171.00338745117188, -132.99472045898438, -94.986083984375, -56.9774169921875, -18.968761444091797, 19.039894104003906, 57.048553466796875, 95.05720520019531, 133.06585693359375, 171.07452392578125, 209.08316040039062, 247.09182739257812, 285.1004943847656, 323.109130859375, 361.1177978515625, 399.12646484375, 437.1351013183594, 475.1437683105469, 513.1524047851562, 551.1610717773438, 589.1697387695312, 627.1784057617188, 665.18701171875, 703.1956787109375, 741.204345703125, 779.2130126953125, 817.2216796875, 855.2303466796875, 893.239013671875, 931.2476806640625, 969.25634765625, 1007.2649536132812, 1045.273681640625, 1083.2822265625, 1121.2908935546875, 1159.299560546875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 5.0, 5.0, 11.0, 18.0, 35.0, 39.0, 45.0, 76.0, 92.0, 126.0, 160.0, 223.0, 322.0, 467.0, 688.0, 959.0, 1447.0, 2471.0, 4062.0, 6660.0, 10132.0, 15119.0, 24952.0, 98833.0, 30977132.0, 59118.0, 27198.0, 10693.0, 5428.0, 3138.0, 1965.0, 1131.0, 651.0, 359.0, 222.0, 141.0, 107.0, 80.0, 55.0, 41.0, 35.0, 21.0, 17.0, 15.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-809.2265625, -786.8597412109375, -764.492919921875, -742.1261596679688, -719.7593383789062, -697.3925170898438, -675.0256958007812, -652.658935546875, -630.2921142578125, -607.92529296875, -585.5584716796875, -563.1917114257812, -540.8248901367188, -518.4580688476562, -496.09124755859375, -473.7244567871094, -451.3576354980469, -428.9908142089844, -406.6240234375, -384.2572021484375, -361.8904113769531, -339.5235900878906, -317.15679931640625, -294.78997802734375, -272.42315673828125, -250.0563507080078, -227.68954467773438, -205.32272338867188, -182.9559326171875, -160.589111328125, -138.22230529785156, -115.85549926757812, -93.48870849609375, -71.12190246582031, -48.75509262084961, -26.388282775878906, -4.021476745605469, 18.34532928466797, 40.71214294433594, 63.078948974609375, 85.44575500488281, 107.81256103515625, 130.1793670654297, 152.54617309570312, 174.91299438476562, 197.27978515625, 219.6466064453125, 242.01341247558594, 264.3802185058594, 286.7470397949219, 309.11383056640625, 331.48065185546875, 353.8474426269531, 376.2142639160156, 398.5810546875, 420.9478759765625, 443.314697265625, 465.6815185546875, 488.0483093261719, 510.4151306152344, 532.7819213867188, 555.1487426757812, 577.5155639648438, 599.88232421875, 622.2491455078125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 4.0, 9.0, 12.0, 10.0, 16.0, 36.0, 25.0, 49.0, 77.0, 120.0, 166.0, 240.0, 377.0, 648.0, 975.0, 1618.0, 2589.0, 4691.0, 8487.0, 15924.0, 32405.0, 69739.0, 163217.0, 406408.0, 1192295.0, 2715443.0, 1041216.0, 363575.0, 145991.0, 63750.0, 29142.0, 14370.0, 7470.0, 4109.0, 2388.0, 1418.0, 915.0, 533.0, 321.0, 206.0, 166.0, 97.0, 62.0, 45.0, 31.0, 23.0, 6.0, 11.0, 5.0, 6.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-24.640625, -23.803955078125, -22.96728515625, -22.130615234375, -21.2939453125, -20.457275390625, -19.62060546875, -18.783935546875, -17.947265625, -17.110595703125, -16.27392578125, -15.437255859375, -14.6005859375, -13.763916015625, -12.92724609375, -12.090576171875, -11.25390625, -10.417236328125, -9.58056640625, -8.743896484375, -7.9072265625, -7.070556640625, -6.23388671875, -5.397216796875, -4.560546875, -3.723876953125, -2.88720703125, -2.050537109375, -1.2138671875, -0.377197265625, 0.45947265625, 1.296142578125, 2.1328125, 2.969482421875, 3.80615234375, 4.642822265625, 5.4794921875, 6.316162109375, 7.15283203125, 7.989501953125, 8.826171875, 9.662841796875, 10.49951171875, 11.336181640625, 12.1728515625, 13.009521484375, 13.84619140625, 14.682861328125, 15.51953125, 16.356201171875, 17.19287109375, 18.029541015625, 18.8662109375, 19.702880859375, 20.53955078125, 21.376220703125, 22.212890625, 23.049560546875, 23.88623046875, 24.722900390625, 25.5595703125, 26.396240234375, 27.23291015625, 28.069580078125, 28.90625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 4.0, 6.0, 4.0, 7.0, 17.0, 14.0, 24.0, 23.0, 31.0, 37.0, 31.0, 48.0, 63.0, 97.0, 166.0, 314.0, 364.0, 253.0, 113.0, 66.0, 52.0, 42.0, 41.0, 39.0, 23.0, 29.0, 14.0, 15.0, 16.0, 13.0, 17.0, 6.0, 6.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0], "bins": [-52.90625, -51.5263671875, -50.146484375, -48.7666015625, -47.38671875, -46.0068359375, -44.626953125, -43.2470703125, -41.8671875, -40.4873046875, -39.107421875, -37.7275390625, -36.34765625, -34.9677734375, -33.587890625, -32.2080078125, -30.828125, -29.4482421875, -28.068359375, -26.6884765625, -25.30859375, -23.9287109375, -22.548828125, -21.1689453125, -19.7890625, -18.4091796875, -17.029296875, -15.6494140625, -14.26953125, -12.8896484375, -11.509765625, -10.1298828125, -8.75, -7.3701171875, -5.990234375, -4.6103515625, -3.23046875, -1.8505859375, -0.470703125, 0.9091796875, 2.2890625, 3.6689453125, 5.048828125, 6.4287109375, 7.80859375, 9.1884765625, 10.568359375, 11.9482421875, 13.328125, 14.7080078125, 16.087890625, 17.4677734375, 18.84765625, 20.2275390625, 21.607421875, 22.9873046875, 24.3671875, 25.7470703125, 27.126953125, 28.5068359375, 29.88671875, 31.2666015625, 32.646484375, 34.0263671875, 35.40625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 3.0, 6.0, 7.0, 8.0, 17.0, 31.0, 36.0, 72.0, 91.0, 165.0, 226.0, 366.0, 519.0, 809.0, 1255.0, 1813.0, 2670.0, 4207.0, 6542.0, 10284.0, 16426.0, 26341.0, 43257.0, 70795.0, 116552.0, 195338.0, 341602.0, 689042.0, 2151123.0, 1405097.0, 517228.0, 276484.0, 160728.0, 97055.0, 58645.0, 35823.0, 21915.0, 13734.0, 8631.0, 5488.0, 3718.0, 2466.0, 1657.0, 1070.0, 681.0, 471.0, 335.0, 229.0, 121.0, 109.0, 75.0, 45.0, 23.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.8359375, -13.3719482421875, -12.907958984375, -12.4439697265625, -11.97998046875, -11.5159912109375, -11.052001953125, -10.5880126953125, -10.1240234375, -9.6600341796875, -9.196044921875, -8.7320556640625, -8.26806640625, -7.8040771484375, -7.340087890625, -6.8760986328125, -6.412109375, -5.9481201171875, -5.484130859375, -5.0201416015625, -4.55615234375, -4.0921630859375, -3.628173828125, -3.1641845703125, -2.7001953125, -2.2362060546875, -1.772216796875, -1.3082275390625, -0.84423828125, -0.3802490234375, 0.083740234375, 0.5477294921875, 1.01171875, 1.4757080078125, 1.939697265625, 2.4036865234375, 2.86767578125, 3.3316650390625, 3.795654296875, 4.2596435546875, 4.7236328125, 5.1876220703125, 5.651611328125, 6.1156005859375, 6.57958984375, 7.0435791015625, 7.507568359375, 7.9715576171875, 8.435546875, 8.8995361328125, 9.363525390625, 9.8275146484375, 10.29150390625, 10.7554931640625, 11.219482421875, 11.6834716796875, 12.1474609375, 12.6114501953125, 13.075439453125, 13.5394287109375, 14.00341796875, 14.4674072265625, 14.931396484375, 15.3953857421875, 15.859375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 8.0, 6.0, 6.0, 13.0, 9.0, 17.0, 16.0, 25.0, 23.0, 26.0, 34.0, 40.0, 30.0, 29.0, 44.0, 78.0, 100.0, 243.0, 432.0, 281.0, 108.0, 60.0, 45.0, 36.0, 43.0, 40.0, 21.0, 38.0, 21.0, 23.0, 18.0, 16.0, 13.0, 19.0, 12.0, 6.0, 7.0, 4.0, 9.0, 8.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.3125, -49.7451171875, -48.177734375, -46.6103515625, -45.04296875, -43.4755859375, -41.908203125, -40.3408203125, -38.7734375, -37.2060546875, -35.638671875, -34.0712890625, -32.50390625, -30.9365234375, -29.369140625, -27.8017578125, -26.234375, -24.6669921875, -23.099609375, -21.5322265625, -19.96484375, -18.3974609375, -16.830078125, -15.2626953125, -13.6953125, -12.1279296875, -10.560546875, -8.9931640625, -7.42578125, -5.8583984375, -4.291015625, -2.7236328125, -1.15625, 0.4111328125, 1.978515625, 3.5458984375, 5.11328125, 6.6806640625, 8.248046875, 9.8154296875, 11.3828125, 12.9501953125, 14.517578125, 16.0849609375, 17.65234375, 19.2197265625, 20.787109375, 22.3544921875, 23.921875, 25.4892578125, 27.056640625, 28.6240234375, 30.19140625, 31.7587890625, 33.326171875, 34.8935546875, 36.4609375, 38.0283203125, 39.595703125, 41.1630859375, 42.73046875, 44.2978515625, 45.865234375, 47.4326171875, 49.0]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 6.0, 5.0, 5.0, 9.0, 7.0, 11.0, 14.0, 33.0, 27.0, 37.0, 48.0, 97.0, 159.0, 201.0, 222.0, 384.0, 657.0, 928.0, 1487.0, 2707.0, 5047.0, 10130.0, 21466.0, 55437.0, 258570.0, 5766522.0, 104203.0, 32741.0, 13774.0, 7159.0, 3814.0, 2109.0, 1217.0, 826.0, 448.0, 267.0, 202.0, 149.0, 102.0, 53.0, 55.0, 32.0, 9.0, 18.0, 11.0, 7.0, 13.0, 5.0, 0.0, 2.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-100.0625, -96.75390625, -93.4453125, -90.13671875, -86.828125, -83.51953125, -80.2109375, -76.90234375, -73.59375, -70.28515625, -66.9765625, -63.66796875, -60.359375, -57.05078125, -53.7421875, -50.43359375, -47.125, -43.81640625, -40.5078125, -37.19921875, -33.890625, -30.58203125, -27.2734375, -23.96484375, -20.65625, -17.34765625, -14.0390625, -10.73046875, -7.421875, -4.11328125, -0.8046875, 2.50390625, 5.8125, 9.12109375, 12.4296875, 15.73828125, 19.046875, 22.35546875, 25.6640625, 28.97265625, 32.28125, 35.58984375, 38.8984375, 42.20703125, 45.515625, 48.82421875, 52.1328125, 55.44140625, 58.75, 62.05859375, 65.3671875, 68.67578125, 71.984375, 75.29296875, 78.6015625, 81.91015625, 85.21875, 88.52734375, 91.8359375, 95.14453125, 98.453125, 101.76171875, 105.0703125, 108.37890625, 111.6875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 14.0, 13.0, 15.0, 24.0, 39.0, 28.0, 35.0, 37.0, 45.0, 66.0, 60.0, 99.0, 317.0, 679.0, 133.0, 65.0, 60.0, 47.0, 42.0, 42.0, 31.0, 22.0, 21.0, 12.0, 18.0, 17.0, 15.0, 7.0, 7.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.3125, -111.9560546875, -108.599609375, -105.2431640625, -101.88671875, -98.5302734375, -95.173828125, -91.8173828125, -88.4609375, -85.1044921875, -81.748046875, -78.3916015625, -75.03515625, -71.6787109375, -68.322265625, -64.9658203125, -61.609375, -58.2529296875, -54.896484375, -51.5400390625, -48.18359375, -44.8271484375, -41.470703125, -38.1142578125, -34.7578125, -31.4013671875, -28.044921875, -24.6884765625, -21.33203125, -17.9755859375, -14.619140625, -11.2626953125, -7.90625, -4.5498046875, -1.193359375, 2.1630859375, 5.51953125, 8.8759765625, 12.232421875, 15.5888671875, 18.9453125, 22.3017578125, 25.658203125, 29.0146484375, 32.37109375, 35.7275390625, 39.083984375, 42.4404296875, 45.796875, 49.1533203125, 52.509765625, 55.8662109375, 59.22265625, 62.5791015625, 65.935546875, 69.2919921875, 72.6484375, 76.0048828125, 79.361328125, 82.7177734375, 86.07421875, 89.4306640625, 92.787109375, 96.1435546875, 99.5]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 5.0, 12.0, 17.0, 35.0, 85.0, 624.0, 133.0, 33.0, 19.0, 13.0, 6.0, 7.0, 3.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2823.115966796875, -2749.9716796875, -2676.8271484375, -2603.682861328125, -2530.53857421875, -2457.39404296875, -2384.249755859375, -2311.10546875, -2237.9609375, -2164.816650390625, -2091.672119140625, -2018.52783203125, -1945.3834228515625, -1872.239013671875, -1799.0947265625, -1725.9503173828125, -1652.8060302734375, -1579.66162109375, -1506.517333984375, -1433.3729248046875, -1360.228515625, -1287.084228515625, -1213.9398193359375, -1140.79541015625, -1067.651123046875, -994.5067749023438, -921.3623657226562, -848.218017578125, -775.0736083984375, -701.9292602539062, -628.784912109375, -555.6405029296875, -482.4962158203125, -409.3518371582031, -336.20745849609375, -263.0631103515625, -189.91873168945312, -116.77435302734375, -43.6300048828125, 29.514404296875, 102.65875244140625, 175.80313110351562, 248.94749450683594, 322.09185791015625, 395.2362365722656, 468.380615234375, 541.5249633789062, 614.6693725585938, 687.813720703125, 760.9580688476562, 834.1024780273438, 907.246826171875, 980.3912353515625, 1053.53564453125, 1126.679931640625, 1199.8243408203125, 1272.96875, 1346.1131591796875, 1419.2574462890625, 1492.40185546875, 1565.5462646484375, 1638.690673828125, 1711.8349609375, 1784.9793701171875, 1858.1236572265625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 6.0, 4.0, 6.0, 6.0, 8.0, 9.0, 14.0, 17.0, 34.0, 54.0, 86.0, 403.0, 114.0, 71.0, 37.0, 28.0, 9.0, 13.0, 11.0, 8.0, 5.0, 4.0, 8.0, 7.0, 3.0, 3.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2070.414794921875, -2012.2484130859375, -1954.0819091796875, -1895.91552734375, -1837.7490234375, -1779.5826416015625, -1721.416259765625, -1663.249755859375, -1605.083251953125, -1546.9168701171875, -1488.7503662109375, -1430.583984375, -1372.41748046875, -1314.2510986328125, -1256.084716796875, -1197.918212890625, -1139.7518310546875, -1081.58544921875, -1023.4189453125, -965.2525634765625, -907.0860595703125, -848.919677734375, -790.7532348632812, -732.5867919921875, -674.4203491210938, -616.25390625, -558.0874633789062, -499.9210510253906, -441.7546081542969, -383.5881652832031, -325.4217529296875, -267.25531005859375, -209.0888671875, -150.92242431640625, -92.75599670410156, -34.589569091796875, 23.576873779296875, 81.74331665039062, 139.90972900390625, 198.076171875, 256.24261474609375, 314.4090576171875, 372.57550048828125, 430.7419128417969, 488.9083557128906, 547.0748291015625, 605.2412109375, 663.4076538085938, 721.5740966796875, 779.7405395507812, 837.906982421875, 896.0733642578125, 954.2398681640625, 1012.40625, 1070.57275390625, 1128.7391357421875, 1186.905517578125, 1245.0718994140625, 1303.2384033203125, 1361.40478515625, 1419.5712890625, 1477.7376708984375, 1535.904052734375, 1594.070556640625, 1652.237060546875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 10.0, 29.0, 53.0, 74.0, 72.0, 169.0, 299.0, 448.0, 799.0, 1505.0, 3013.0, 6443.0, 14957.0, 42468.0, 294132.0, 3707890.0, 76675.0, 24771.0, 10582.0, 4964.0, 2338.0, 1244.0, 616.0, 325.0, 156.0, 91.0, 63.0, 27.0, 18.0, 15.0, 8.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-29.859375, -29.09814453125, -28.3369140625, -27.57568359375, -26.814453125, -26.05322265625, -25.2919921875, -24.53076171875, -23.76953125, -23.00830078125, -22.2470703125, -21.48583984375, -20.724609375, -19.96337890625, -19.2021484375, -18.44091796875, -17.6796875, -16.91845703125, -16.1572265625, -15.39599609375, -14.634765625, -13.87353515625, -13.1123046875, -12.35107421875, -11.58984375, -10.82861328125, -10.0673828125, -9.30615234375, -8.544921875, -7.78369140625, -7.0224609375, -6.26123046875, -5.5, -4.73876953125, -3.9775390625, -3.21630859375, -2.455078125, -1.69384765625, -0.9326171875, -0.17138671875, 0.58984375, 1.35107421875, 2.1123046875, 2.87353515625, 3.634765625, 4.39599609375, 5.1572265625, 5.91845703125, 6.6796875, 7.44091796875, 8.2021484375, 8.96337890625, 9.724609375, 10.48583984375, 11.2470703125, 12.00830078125, 12.76953125, 13.53076171875, 14.2919921875, 15.05322265625, 15.814453125, 16.57568359375, 17.3369140625, 18.09814453125, 18.859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 9.0, 1.0, 6.0, 6.0, 9.0, 8.0, 5.0, 13.0, 13.0, 9.0, 25.0, 101.0, 485.0, 188.0, 28.0, 19.0, 23.0, 6.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 8.0, 3.0, 4.0, 1.0, 4.0, 2.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.453125, -2.3758544921875, -2.298583984375, -2.2213134765625, -2.14404296875, -2.0667724609375, -1.989501953125, -1.9122314453125, -1.8349609375, -1.7576904296875, -1.680419921875, -1.6031494140625, -1.52587890625, -1.4486083984375, -1.371337890625, -1.2940673828125, -1.216796875, -1.1395263671875, -1.062255859375, -0.9849853515625, -0.90771484375, -0.8304443359375, -0.753173828125, -0.6759033203125, -0.5986328125, -0.5213623046875, -0.444091796875, -0.3668212890625, -0.28955078125, -0.2122802734375, -0.135009765625, -0.0577392578125, 0.01953125, 0.0968017578125, 0.174072265625, 0.2513427734375, 0.32861328125, 0.4058837890625, 0.483154296875, 0.5604248046875, 0.6376953125, 0.7149658203125, 0.792236328125, 0.8695068359375, 0.94677734375, 1.0240478515625, 1.101318359375, 1.1785888671875, 1.255859375, 1.3331298828125, 1.410400390625, 1.4876708984375, 1.56494140625, 1.6422119140625, 1.719482421875, 1.7967529296875, 1.8740234375, 1.9512939453125, 2.028564453125, 2.1058349609375, 2.18310546875, 2.2603759765625, 2.337646484375, 2.4149169921875, 2.4921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 16.0, 18.0, 25.0, 35.0, 55.0, 66.0, 111.0, 161.0, 279.0, 452.0, 800.0, 1600.0, 3476.0, 9680.0, 34726.0, 219723.0, 3197548.0, 635525.0, 66256.0, 14977.0, 4800.0, 1955.0, 884.0, 446.0, 251.0, 142.0, 86.0, 57.0, 39.0, 23.0, 18.0, 15.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.53125, -20.85205078125, -20.1728515625, -19.49365234375, -18.814453125, -18.13525390625, -17.4560546875, -16.77685546875, -16.09765625, -15.41845703125, -14.7392578125, -14.06005859375, -13.380859375, -12.70166015625, -12.0224609375, -11.34326171875, -10.6640625, -9.98486328125, -9.3056640625, -8.62646484375, -7.947265625, -7.26806640625, -6.5888671875, -5.90966796875, -5.23046875, -4.55126953125, -3.8720703125, -3.19287109375, -2.513671875, -1.83447265625, -1.1552734375, -0.47607421875, 0.203125, 0.88232421875, 1.5615234375, 2.24072265625, 2.919921875, 3.59912109375, 4.2783203125, 4.95751953125, 5.63671875, 6.31591796875, 6.9951171875, 7.67431640625, 8.353515625, 9.03271484375, 9.7119140625, 10.39111328125, 11.0703125, 11.74951171875, 12.4287109375, 13.10791015625, 13.787109375, 14.46630859375, 15.1455078125, 15.82470703125, 16.50390625, 17.18310546875, 17.8623046875, 18.54150390625, 19.220703125, 19.89990234375, 20.5791015625, 21.25830078125, 21.9375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 12.0, 19.0, 29.0, 38.0, 57.0, 68.0, 101.0, 155.0, 225.0, 317.0, 629.0, 984.0, 502.0, 286.0, 177.0, 147.0, 89.0, 58.0, 50.0, 35.0, 21.0, 14.0, 11.0, 11.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0], "bins": [-10.0625, -9.83551025390625, -9.6085205078125, -9.38153076171875, -9.154541015625, -8.92755126953125, -8.7005615234375, -8.47357177734375, -8.24658203125, -8.01959228515625, -7.7926025390625, -7.56561279296875, -7.338623046875, -7.11163330078125, -6.8846435546875, -6.65765380859375, -6.4306640625, -6.20367431640625, -5.9766845703125, -5.74969482421875, -5.522705078125, -5.29571533203125, -5.0687255859375, -4.84173583984375, -4.61474609375, -4.38775634765625, -4.1607666015625, -3.93377685546875, -3.706787109375, -3.47979736328125, -3.2528076171875, -3.02581787109375, -2.798828125, -2.57183837890625, -2.3448486328125, -2.11785888671875, -1.890869140625, -1.66387939453125, -1.4368896484375, -1.20989990234375, -0.98291015625, -0.75592041015625, -0.5289306640625, -0.30194091796875, -0.074951171875, 0.15203857421875, 0.3790283203125, 0.60601806640625, 0.8330078125, 1.05999755859375, 1.2869873046875, 1.51397705078125, 1.740966796875, 1.96795654296875, 2.1949462890625, 2.42193603515625, 2.64892578125, 2.87591552734375, 3.1029052734375, 3.32989501953125, 3.556884765625, 3.78387451171875, 4.0108642578125, 4.23785400390625, 4.46484375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 10.0, 11.0, 19.0, 21.0, 37.0, 54.0, 107.0, 137.0, 227.0, 173.0, 93.0, 54.0, 20.0, 13.0, 6.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.80792236328125, -78.6084213256836, -76.4089126586914, -74.20941162109375, -72.00990295410156, -69.8104019165039, -67.61090087890625, -65.41139221191406, -63.211891174316406, -61.012386322021484, -58.81288146972656, -56.613380432128906, -54.413875579833984, -52.21437072753906, -50.01486587524414, -47.81536102294922, -45.6158561706543, -43.416351318359375, -41.21684646606445, -39.01734161376953, -36.817840576171875, -34.61833572387695, -32.41883087158203, -30.21932601928711, -28.01982307434082, -25.8203182220459, -23.62081527709961, -21.421310424804688, -19.221805572509766, -17.022302627563477, -14.822797775268555, -12.62329387664795, -10.423786163330078, -8.224282264709473, -6.024777889251709, -3.8252735137939453, -1.6257696151733398, 0.5737342834472656, 2.7732391357421875, 4.972743034362793, 7.172246932983398, 9.371750831604004, 11.57125473022461, 13.770759582519531, 15.970263481140137, 18.169767379760742, 20.369272232055664, 22.568775177001953, 24.768280029296875, 26.967784881591797, 29.167287826538086, 31.366792678833008, 33.5662956237793, 35.76580047607422, 37.96530532836914, 40.16481018066406, 42.36431121826172, 44.56381607055664, 46.76332092285156, 48.96282196044922, 51.16232681274414, 53.36183166503906, 55.561336517333984, 57.760841369628906, 59.96034622192383]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 9.0, 10.0, 12.0, 18.0, 14.0, 19.0, 16.0, 26.0, 36.0, 26.0, 36.0, 41.0, 33.0, 53.0, 48.0, 52.0, 40.0, 39.0, 38.0, 36.0, 33.0, 44.0, 48.0, 32.0, 30.0, 29.0, 36.0, 19.0, 18.0, 22.0, 15.0, 11.0, 10.0, 6.0, 6.0, 3.0, 1.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.407119750976562, -30.233205795288086, -29.059289932250977, -27.8853759765625, -26.711462020874023, -25.537548065185547, -24.363632202148438, -23.18971824645996, -22.015804290771484, -20.841890335083008, -19.6679744720459, -18.494060516357422, -17.320146560668945, -16.14623260498047, -14.97231674194336, -13.798402786254883, -12.624486923217773, -11.45057201385498, -10.276658058166504, -9.102743148803711, -7.928828716278076, -6.754914283752441, -5.580999374389648, -4.407085418701172, -3.233170509338379, -2.059256076812744, -0.8853414058685303, 0.2885732650756836, 1.4624876976013184, 2.636402130126953, 3.810317039489746, 4.984230995178223, 6.158145904541016, 7.33206033706665, 8.505974769592285, 9.679889678955078, 10.853803634643555, 12.027718544006348, 13.20163345336914, 14.375547409057617, 15.54946231842041, 16.723377227783203, 17.89729118347168, 19.071205139160156, 20.245121002197266, 21.419034957885742, 22.59294891357422, 23.766864776611328, 24.940778732299805, 26.11469268798828, 27.28860855102539, 28.462522506713867, 29.636436462402344, 30.810352325439453, 31.98426628112793, 33.158180236816406, 34.332096099853516, 35.506011962890625, 36.67992401123047, 37.85383987426758, 39.02775573730469, 40.20166778564453, 41.37558364868164, 42.54949951171875, 43.723411560058594]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 5.0, 12.0, 17.0, 19.0, 20.0, 35.0, 54.0, 72.0, 109.0, 152.0, 194.0, 289.0, 398.0, 558.0, 810.0, 1250.0, 1875.0, 2881.0, 4746.0, 8539.0, 18111.0, 48292.0, 214751.0, 580417.0, 103654.0, 30597.0, 12667.0, 6532.0, 3989.0, 2400.0, 1579.0, 1072.0, 784.0, 495.0, 338.0, 251.0, 172.0, 127.0, 78.0, 60.0, 49.0, 24.0, 18.0, 18.0, 23.0, 8.0, 9.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-10.6875, -10.366455078125, -10.04541015625, -9.724365234375, -9.4033203125, -9.082275390625, -8.76123046875, -8.440185546875, -8.119140625, -7.798095703125, -7.47705078125, -7.156005859375, -6.8349609375, -6.513916015625, -6.19287109375, -5.871826171875, -5.55078125, -5.229736328125, -4.90869140625, -4.587646484375, -4.2666015625, -3.945556640625, -3.62451171875, -3.303466796875, -2.982421875, -2.661376953125, -2.34033203125, -2.019287109375, -1.6982421875, -1.377197265625, -1.05615234375, -0.735107421875, -0.4140625, -0.093017578125, 0.22802734375, 0.549072265625, 0.8701171875, 1.191162109375, 1.51220703125, 1.833251953125, 2.154296875, 2.475341796875, 2.79638671875, 3.117431640625, 3.4384765625, 3.759521484375, 4.08056640625, 4.401611328125, 4.72265625, 5.043701171875, 5.36474609375, 5.685791015625, 6.0068359375, 6.327880859375, 6.64892578125, 6.969970703125, 7.291015625, 7.612060546875, 7.93310546875, 8.254150390625, 8.5751953125, 8.896240234375, 9.21728515625, 9.538330078125, 9.859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 0.0, 6.0, 5.0, 7.0, 11.0, 11.0, 20.0, 21.0, 39.0, 42.0, 61.0, 97.0, 117.0, 120.0, 105.0, 90.0, 63.0, 49.0, 28.0, 23.0, 12.0, 14.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 6.0, 1.0, 0.0, 3.0, 3.0, 2.0], "bins": [-2.71875, -2.6480865478515625, -2.577423095703125, -2.5067596435546875, -2.43609619140625, -2.3654327392578125, -2.294769287109375, -2.2241058349609375, -2.1534423828125, -2.0827789306640625, -2.012115478515625, -1.9414520263671875, -1.87078857421875, -1.8001251220703125, -1.729461669921875, -1.6587982177734375, -1.588134765625, -1.5174713134765625, -1.446807861328125, -1.3761444091796875, -1.30548095703125, -1.2348175048828125, -1.164154052734375, -1.0934906005859375, -1.0228271484375, -0.9521636962890625, -0.881500244140625, -0.8108367919921875, -0.74017333984375, -0.6695098876953125, -0.598846435546875, -0.5281829833984375, -0.45751953125, -0.3868560791015625, -0.316192626953125, -0.2455291748046875, -0.17486572265625, -0.1042022705078125, -0.033538818359375, 0.0371246337890625, 0.1077880859375, 0.1784515380859375, 0.249114990234375, 0.3197784423828125, 0.39044189453125, 0.4611053466796875, 0.531768798828125, 0.6024322509765625, 0.673095703125, 0.7437591552734375, 0.814422607421875, 0.8850860595703125, 0.95574951171875, 1.0264129638671875, 1.097076416015625, 1.1677398681640625, 1.2384033203125, 1.3090667724609375, 1.379730224609375, 1.4503936767578125, 1.52105712890625, 1.5917205810546875, 1.662384033203125, 1.7330474853515625, 1.8037109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 6.0, 6.0, 11.0, 20.0, 27.0, 41.0, 51.0, 81.0, 106.0, 153.0, 262.0, 426.0, 744.0, 1326.0, 2500.0, 4674.0, 9676.0, 21545.0, 53968.0, 181025.0, 510862.0, 169226.0, 51811.0, 20522.0, 9479.0, 4495.0, 2349.0, 1300.0, 691.0, 413.0, 252.0, 156.0, 107.0, 77.0, 47.0, 25.0, 24.0, 14.0, 17.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-11.2421875, -10.885009765625, -10.52783203125, -10.170654296875, -9.8134765625, -9.456298828125, -9.09912109375, -8.741943359375, -8.384765625, -8.027587890625, -7.67041015625, -7.313232421875, -6.9560546875, -6.598876953125, -6.24169921875, -5.884521484375, -5.52734375, -5.170166015625, -4.81298828125, -4.455810546875, -4.0986328125, -3.741455078125, -3.38427734375, -3.027099609375, -2.669921875, -2.312744140625, -1.95556640625, -1.598388671875, -1.2412109375, -0.884033203125, -0.52685546875, -0.169677734375, 0.1875, 0.544677734375, 0.90185546875, 1.259033203125, 1.6162109375, 1.973388671875, 2.33056640625, 2.687744140625, 3.044921875, 3.402099609375, 3.75927734375, 4.116455078125, 4.4736328125, 4.830810546875, 5.18798828125, 5.545166015625, 5.90234375, 6.259521484375, 6.61669921875, 6.973876953125, 7.3310546875, 7.688232421875, 8.04541015625, 8.402587890625, 8.759765625, 9.116943359375, 9.47412109375, 9.831298828125, 10.1884765625, 10.545654296875, 10.90283203125, 11.260009765625, 11.6171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 3.0, 6.0, 5.0, 11.0, 8.0, 15.0, 7.0, 14.0, 17.0, 13.0, 21.0, 33.0, 19.0, 15.0, 28.0, 26.0, 34.0, 36.0, 42.0, 47.0, 37.0, 39.0, 37.0, 36.0, 35.0, 43.0, 44.0, 39.0, 37.0, 19.0, 38.0, 28.0, 26.0, 23.0, 22.0, 20.0, 14.0, 15.0, 9.0, 8.0, 11.0, 1.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.296875, -10.931884765625, -10.56689453125, -10.201904296875, -9.8369140625, -9.471923828125, -9.10693359375, -8.741943359375, -8.376953125, -8.011962890625, -7.64697265625, -7.281982421875, -6.9169921875, -6.552001953125, -6.18701171875, -5.822021484375, -5.45703125, -5.092041015625, -4.72705078125, -4.362060546875, -3.9970703125, -3.632080078125, -3.26708984375, -2.902099609375, -2.537109375, -2.172119140625, -1.80712890625, -1.442138671875, -1.0771484375, -0.712158203125, -0.34716796875, 0.017822265625, 0.3828125, 0.747802734375, 1.11279296875, 1.477783203125, 1.8427734375, 2.207763671875, 2.57275390625, 2.937744140625, 3.302734375, 3.667724609375, 4.03271484375, 4.397705078125, 4.7626953125, 5.127685546875, 5.49267578125, 5.857666015625, 6.22265625, 6.587646484375, 6.95263671875, 7.317626953125, 7.6826171875, 8.047607421875, 8.41259765625, 8.777587890625, 9.142578125, 9.507568359375, 9.87255859375, 10.237548828125, 10.6025390625, 10.967529296875, 11.33251953125, 11.697509765625, 12.0625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 12.0, 14.0, 39.0, 44.0, 76.0, 128.0, 265.0, 732.0, 2396.0, 17013.0, 984316.0, 38487.0, 3294.0, 996.0, 328.0, 178.0, 82.0, 40.0, 27.0, 27.0, 14.0, 9.0, 7.0, 3.0, 1.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.21875, -34.9072265625, -33.595703125, -32.2841796875, -30.97265625, -29.6611328125, -28.349609375, -27.0380859375, -25.7265625, -24.4150390625, -23.103515625, -21.7919921875, -20.48046875, -19.1689453125, -17.857421875, -16.5458984375, -15.234375, -13.9228515625, -12.611328125, -11.2998046875, -9.98828125, -8.6767578125, -7.365234375, -6.0537109375, -4.7421875, -3.4306640625, -2.119140625, -0.8076171875, 0.50390625, 1.8154296875, 3.126953125, 4.4384765625, 5.75, 7.0615234375, 8.373046875, 9.6845703125, 10.99609375, 12.3076171875, 13.619140625, 14.9306640625, 16.2421875, 17.5537109375, 18.865234375, 20.1767578125, 21.48828125, 22.7998046875, 24.111328125, 25.4228515625, 26.734375, 28.0458984375, 29.357421875, 30.6689453125, 31.98046875, 33.2919921875, 34.603515625, 35.9150390625, 37.2265625, 38.5380859375, 39.849609375, 41.1611328125, 42.47265625, 43.7841796875, 45.095703125, 46.4072265625, 47.71875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 10.0, 41.0, 48.0, 118.0, 260.0, 268.0, 122.0, 46.0, 31.0, 12.0, 4.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012350082397460938, -0.0011965036392211914, -0.001157999038696289, -0.0011194944381713867, -0.0010809898376464844, -0.001042485237121582, -0.0010039806365966797, -0.0009654760360717773, -0.000926971435546875, -0.0008884668350219727, -0.0008499622344970703, -0.000811457633972168, -0.0007729530334472656, -0.0007344484329223633, -0.0006959438323974609, -0.0006574392318725586, -0.0006189346313476562, -0.0005804300308227539, -0.0005419254302978516, -0.0005034208297729492, -0.0004649162292480469, -0.00042641162872314453, -0.0003879070281982422, -0.00034940242767333984, -0.0003108978271484375, -0.00027239322662353516, -0.0002338886260986328, -0.00019538402557373047, -0.00015687942504882812, -0.00011837482452392578, -7.987022399902344e-05, -4.1365623474121094e-05, -2.86102294921875e-06, 3.5643577575683594e-05, 7.414817810058594e-05, 0.00011265277862548828, 0.00015115737915039062, 0.00018966197967529297, 0.0002281665802001953, 0.00026667118072509766, 0.00030517578125, 0.00034368038177490234, 0.0003821849822998047, 0.00042068958282470703, 0.0004591941833496094, 0.0004976987838745117, 0.0005362033843994141, 0.0005747079849243164, 0.0006132125854492188, 0.0006517171859741211, 0.0006902217864990234, 0.0007287263870239258, 0.0007672309875488281, 0.0008057355880737305, 0.0008442401885986328, 0.0008827447891235352, 0.0009212493896484375, 0.0009597539901733398, 0.0009982585906982422, 0.0010367631912231445, 0.0010752677917480469, 0.0011137723922729492, 0.0011522769927978516, 0.001190781593322754, 0.0012292861938476562]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 3.0, 10.0, 16.0, 15.0, 34.0, 37.0, 50.0, 90.0, 151.0, 204.0, 394.0, 665.0, 1244.0, 2663.0, 6212.0, 18860.0, 99515.0, 747473.0, 134931.0, 22769.0, 7128.0, 2931.0, 1359.0, 696.0, 390.0, 245.0, 147.0, 92.0, 62.0, 46.0, 33.0, 21.0, 15.0, 11.0, 14.0, 12.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.171875, -15.7296142578125, -15.287353515625, -14.8450927734375, -14.40283203125, -13.9605712890625, -13.518310546875, -13.0760498046875, -12.6337890625, -12.1915283203125, -11.749267578125, -11.3070068359375, -10.86474609375, -10.4224853515625, -9.980224609375, -9.5379638671875, -9.095703125, -8.6534423828125, -8.211181640625, -7.7689208984375, -7.32666015625, -6.8843994140625, -6.442138671875, -5.9998779296875, -5.5576171875, -5.1153564453125, -4.673095703125, -4.2308349609375, -3.78857421875, -3.3463134765625, -2.904052734375, -2.4617919921875, -2.01953125, -1.5772705078125, -1.135009765625, -0.6927490234375, -0.25048828125, 0.1917724609375, 0.634033203125, 1.0762939453125, 1.5185546875, 1.9608154296875, 2.403076171875, 2.8453369140625, 3.28759765625, 3.7298583984375, 4.172119140625, 4.6143798828125, 5.056640625, 5.4989013671875, 5.941162109375, 6.3834228515625, 6.82568359375, 7.2679443359375, 7.710205078125, 8.1524658203125, 8.5947265625, 9.0369873046875, 9.479248046875, 9.9215087890625, 10.36376953125, 10.8060302734375, 11.248291015625, 11.6905517578125, 12.1328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 7.0, 8.0, 17.0, 24.0, 38.0, 62.0, 82.0, 142.0, 159.0, 168.0, 100.0, 58.0, 31.0, 20.0, 23.0, 16.0, 10.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.515625, -15.994140625, -15.47265625, -14.951171875, -14.4296875, -13.908203125, -13.38671875, -12.865234375, -12.34375, -11.822265625, -11.30078125, -10.779296875, -10.2578125, -9.736328125, -9.21484375, -8.693359375, -8.171875, -7.650390625, -7.12890625, -6.607421875, -6.0859375, -5.564453125, -5.04296875, -4.521484375, -4.0, -3.478515625, -2.95703125, -2.435546875, -1.9140625, -1.392578125, -0.87109375, -0.349609375, 0.171875, 0.693359375, 1.21484375, 1.736328125, 2.2578125, 2.779296875, 3.30078125, 3.822265625, 4.34375, 4.865234375, 5.38671875, 5.908203125, 6.4296875, 6.951171875, 7.47265625, 7.994140625, 8.515625, 9.037109375, 9.55859375, 10.080078125, 10.6015625, 11.123046875, 11.64453125, 12.166015625, 12.6875, 13.208984375, 13.73046875, 14.251953125, 14.7734375, 15.294921875, 15.81640625, 16.337890625, 16.859375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 9.0, 17.0, 39.0, 70.0, 170.0, 344.0, 172.0, 73.0, 46.0, 21.0, 14.0, 8.0, 9.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-210.56649780273438, -204.6480255126953, -198.7295684814453, -192.81109619140625, -186.89263916015625, -180.9741668701172, -175.05569458007812, -169.13723754882812, -163.21876525878906, -157.30029296875, -151.3818359375, -145.46336364746094, -139.54489135742188, -133.62643432617188, -127.70796203613281, -121.78949737548828, -115.87103271484375, -109.95256805419922, -104.03410339355469, -98.11563110351562, -92.1971664428711, -86.27870178222656, -80.3602294921875, -74.44176483154297, -68.52330017089844, -62.604835510253906, -56.68636703491211, -50.76789855957031, -44.84943389892578, -38.93096923828125, -33.01250076293945, -27.094032287597656, -21.175582885742188, -15.257116317749023, -9.33864974975586, -3.4201831817626953, 2.4982833862304688, 8.416749954223633, 14.335216522216797, 20.253684997558594, 26.172149658203125, 32.090614318847656, 38.00908279418945, 43.92755126953125, 49.84601593017578, 55.76448059082031, 61.68294906616211, 67.6014175415039, 73.51988220214844, 79.43834686279297, 85.3568115234375, 91.27528381347656, 97.1937484741211, 103.11221313476562, 109.03068542480469, 114.94915008544922, 120.86761474609375, 126.78607940673828, 132.7045440673828, 138.62301635742188, 144.54147338867188, 150.45994567871094, 156.37841796875, 162.296875, 168.21534729003906]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 5.0, 7.0, 8.0, 6.0, 11.0, 20.0, 40.0, 63.0, 97.0, 143.0, 139.0, 145.0, 93.0, 76.0, 36.0, 21.0, 17.0, 16.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.62356567382812, -210.2628631591797, -202.90216064453125, -195.5414581298828, -188.18075561523438, -180.82005310058594, -173.4593505859375, -166.09864807128906, -158.73794555664062, -151.3772430419922, -144.01654052734375, -136.6558380126953, -129.29513549804688, -121.93443298339844, -114.57373046875, -107.21302795410156, -99.85232543945312, -92.49162292480469, -85.13092041015625, -77.77021789550781, -70.40951538085938, -63.04881286621094, -55.6881103515625, -48.32740783691406, -40.966705322265625, -33.60600280761719, -26.24530029296875, -18.884597778320312, -11.523895263671875, -4.1631927490234375, 3.197509765625, 10.558212280273438, 17.918899536132812, 25.27960205078125, 32.64030456542969, 40.001007080078125, 47.36170959472656, 54.722412109375, 62.08311462402344, 69.44381713867188, 76.80451965332031, 84.16522216796875, 91.52592468261719, 98.88662719726562, 106.24732971191406, 113.6080322265625, 120.96873474121094, 128.32943725585938, 135.6901397705078, 143.05084228515625, 150.4115447998047, 157.77224731445312, 165.13294982910156, 172.49365234375, 179.85435485839844, 187.21505737304688, 194.5757598876953, 201.93646240234375, 209.2971649169922, 216.65786743164062, 224.01856994628906, 231.3792724609375, 238.73997497558594, 246.10067749023438, 253.4613800048828]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 5.0, 4.0, 8.0, 7.0, 3.0, 19.0, 26.0, 30.0, 52.0, 99.0, 150.0, 262.0, 418.0, 948.0, 1820.0, 3993.0, 12023.0, 63849.0, 3911829.0, 172988.0, 17227.0, 4723.0, 1847.0, 840.0, 467.0, 246.0, 143.0, 93.0, 59.0, 22.0, 29.0, 17.0, 11.0, 7.0, 5.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.125, -48.5419921875, -46.958984375, -45.3759765625, -43.79296875, -42.2099609375, -40.626953125, -39.0439453125, -37.4609375, -35.8779296875, -34.294921875, -32.7119140625, -31.12890625, -29.5458984375, -27.962890625, -26.3798828125, -24.796875, -23.2138671875, -21.630859375, -20.0478515625, -18.46484375, -16.8818359375, -15.298828125, -13.7158203125, -12.1328125, -10.5498046875, -8.966796875, -7.3837890625, -5.80078125, -4.2177734375, -2.634765625, -1.0517578125, 0.53125, 2.1142578125, 3.697265625, 5.2802734375, 6.86328125, 8.4462890625, 10.029296875, 11.6123046875, 13.1953125, 14.7783203125, 16.361328125, 17.9443359375, 19.52734375, 21.1103515625, 22.693359375, 24.2763671875, 25.859375, 27.4423828125, 29.025390625, 30.6083984375, 32.19140625, 33.7744140625, 35.357421875, 36.9404296875, 38.5234375, 40.1064453125, 41.689453125, 43.2724609375, 44.85546875, 46.4384765625, 48.021484375, 49.6044921875, 51.1875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 2.0, 4.0, 5.0, 7.0, 14.0, 17.0, 31.0, 47.0, 64.0, 107.0, 142.0, 151.0, 121.0, 89.0, 61.0, 34.0, 25.0, 13.0, 9.0, 9.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.376953125, -3.271697998046875, -3.16644287109375, -3.061187744140625, -2.9559326171875, -2.850677490234375, -2.74542236328125, -2.640167236328125, -2.534912109375, -2.429656982421875, -2.32440185546875, -2.219146728515625, -2.1138916015625, -2.008636474609375, -1.90338134765625, -1.798126220703125, -1.69287109375, -1.587615966796875, -1.48236083984375, -1.377105712890625, -1.2718505859375, -1.166595458984375, -1.06134033203125, -0.956085205078125, -0.850830078125, -0.745574951171875, -0.64031982421875, -0.535064697265625, -0.4298095703125, -0.324554443359375, -0.21929931640625, -0.114044189453125, -0.0087890625, 0.096466064453125, 0.20172119140625, 0.306976318359375, 0.4122314453125, 0.517486572265625, 0.62274169921875, 0.727996826171875, 0.833251953125, 0.938507080078125, 1.04376220703125, 1.149017333984375, 1.2542724609375, 1.359527587890625, 1.46478271484375, 1.570037841796875, 1.67529296875, 1.780548095703125, 1.88580322265625, 1.991058349609375, 2.0963134765625, 2.201568603515625, 2.30682373046875, 2.412078857421875, 2.517333984375, 2.622589111328125, 2.72784423828125, 2.833099365234375, 2.9383544921875, 3.043609619140625, 3.14886474609375, 3.254119873046875, 3.359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 8.0, 13.0, 15.0, 16.0, 21.0, 26.0, 40.0, 61.0, 89.0, 120.0, 172.0, 254.0, 407.0, 701.0, 1206.0, 2115.0, 4188.0, 10305.0, 34413.0, 225931.0, 3649192.0, 212012.0, 33063.0, 10088.0, 4352.0, 2099.0, 1213.0, 754.0, 483.0, 260.0, 218.0, 152.0, 80.0, 70.0, 37.0, 31.0, 25.0, 15.0, 12.0, 4.0, 7.0, 4.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.984375, -30.00048828125, -29.0166015625, -28.03271484375, -27.048828125, -26.06494140625, -25.0810546875, -24.09716796875, -23.11328125, -22.12939453125, -21.1455078125, -20.16162109375, -19.177734375, -18.19384765625, -17.2099609375, -16.22607421875, -15.2421875, -14.25830078125, -13.2744140625, -12.29052734375, -11.306640625, -10.32275390625, -9.3388671875, -8.35498046875, -7.37109375, -6.38720703125, -5.4033203125, -4.41943359375, -3.435546875, -2.45166015625, -1.4677734375, -0.48388671875, 0.5, 1.48388671875, 2.4677734375, 3.45166015625, 4.435546875, 5.41943359375, 6.4033203125, 7.38720703125, 8.37109375, 9.35498046875, 10.3388671875, 11.32275390625, 12.306640625, 13.29052734375, 14.2744140625, 15.25830078125, 16.2421875, 17.22607421875, 18.2099609375, 19.19384765625, 20.177734375, 21.16162109375, 22.1455078125, 23.12939453125, 24.11328125, 25.09716796875, 26.0810546875, 27.06494140625, 28.048828125, 29.03271484375, 30.0166015625, 31.00048828125, 31.984375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 9.0, 18.0, 23.0, 51.0, 93.0, 161.0, 372.0, 2078.0, 770.0, 213.0, 98.0, 47.0, 39.0, 23.0, 13.0, 9.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.765625, -5.5333251953125, -5.301025390625, -5.0687255859375, -4.83642578125, -4.6041259765625, -4.371826171875, -4.1395263671875, -3.9072265625, -3.6749267578125, -3.442626953125, -3.2103271484375, -2.97802734375, -2.7457275390625, -2.513427734375, -2.2811279296875, -2.048828125, -1.8165283203125, -1.584228515625, -1.3519287109375, -1.11962890625, -0.8873291015625, -0.655029296875, -0.4227294921875, -0.1904296875, 0.0418701171875, 0.274169921875, 0.5064697265625, 0.73876953125, 0.9710693359375, 1.203369140625, 1.4356689453125, 1.66796875, 1.9002685546875, 2.132568359375, 2.3648681640625, 2.59716796875, 2.8294677734375, 3.061767578125, 3.2940673828125, 3.5263671875, 3.7586669921875, 3.990966796875, 4.2232666015625, 4.45556640625, 4.6878662109375, 4.920166015625, 5.1524658203125, 5.384765625, 5.6170654296875, 5.849365234375, 6.0816650390625, 6.31396484375, 6.5462646484375, 6.778564453125, 7.0108642578125, 7.2431640625, 7.4754638671875, 7.707763671875, 7.9400634765625, 8.17236328125, 8.4046630859375, 8.636962890625, 8.8692626953125, 9.1015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 14.0, 13.0, 20.0, 37.0, 55.0, 111.0, 206.0, 229.0, 156.0, 69.0, 42.0, 25.0, 16.0, 4.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-63.78923797607422, -62.49596405029297, -61.20268630981445, -59.9094123840332, -58.61613845825195, -57.32286071777344, -56.02958679199219, -54.73631286621094, -53.44303894042969, -52.14976501464844, -50.85648727416992, -49.56321334838867, -48.26993942260742, -46.976661682128906, -45.683387756347656, -44.390113830566406, -43.09683609008789, -41.80356216430664, -40.510284423828125, -39.217010498046875, -37.923736572265625, -36.630462646484375, -35.33718490600586, -34.04391098022461, -32.750633239746094, -31.45735740661621, -30.16408348083496, -28.870807647705078, -27.577533721923828, -26.284257888793945, -24.990982055664062, -23.697708129882812, -22.404430389404297, -21.111154556274414, -19.817880630493164, -18.52460479736328, -17.23133087158203, -15.938055038452148, -14.644779205322266, -13.3515043258667, -12.058229446411133, -10.764954566955566, -9.4716796875, -8.178403854370117, -6.885128974914551, -5.591854095458984, -4.29857873916626, -3.005303382873535, -1.7120285034179688, -0.41875338554382324, 0.8745217323303223, 2.1677968502044678, 3.4610719680786133, 4.75434684753418, 6.047622203826904, 7.340897560119629, 8.634172439575195, 9.927447319030762, 11.220722198486328, 12.513998031616211, 13.807272911071777, 15.100547790527344, 16.393823623657227, 17.68709945678711, 18.98037338256836]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 20.0, 22.0, 32.0, 47.0, 45.0, 53.0, 64.0, 72.0, 91.0, 77.0, 70.0, 73.0, 51.0, 40.0, 47.0, 29.0, 33.0, 20.0, 16.0, 7.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 6.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.85426902770996, -28.979158401489258, -28.104049682617188, -27.228939056396484, -26.353830337524414, -25.47871971130371, -24.60361099243164, -23.728500366210938, -22.853389739990234, -21.97827911376953, -21.10317039489746, -20.228059768676758, -19.352951049804688, -18.477840423583984, -17.60272979736328, -16.72762107849121, -15.852511405944824, -14.977401733398438, -14.10229206085205, -13.227182388305664, -12.352071762084961, -11.476962089538574, -10.601852416992188, -9.726741790771484, -8.851633071899414, -7.976523399353027, -7.101413249969482, -6.226303577423096, -5.351193428039551, -4.476083755493164, -3.6009740829467773, -2.7258639335632324, -1.8507537841796875, -0.9756439328193665, -0.10053408145904541, 0.7745757102966309, 1.6496856212615967, 2.5247955322265625, 3.399905204772949, 4.275015354156494, 5.150125026702881, 6.025234699249268, 6.9003448486328125, 7.775454521179199, 8.650564193725586, 9.525674819946289, 10.40078353881836, 11.275894165039062, 12.15100383758545, 13.026113510131836, 13.901223182678223, 14.77633285522461, 15.651443481445312, 16.526554107666016, 17.401662826538086, 18.27677345275879, 19.15188217163086, 20.026992797851562, 20.902101516723633, 21.777212142944336, 22.652320861816406, 23.52743148803711, 24.402542114257812, 25.277650833129883, 26.152761459350586]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 8.0, 18.0, 26.0, 85.0, 214.0, 444.0, 1653.0, 9258.0, 137160.0, 859055.0, 34939.0, 4213.0, 899.0, 296.0, 114.0, 65.0, 28.0, 18.0, 8.0, 6.0, 3.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.3125, -41.92822265625, -40.5439453125, -39.15966796875, -37.775390625, -36.39111328125, -35.0068359375, -33.62255859375, -32.23828125, -30.85400390625, -29.4697265625, -28.08544921875, -26.701171875, -25.31689453125, -23.9326171875, -22.54833984375, -21.1640625, -19.77978515625, -18.3955078125, -17.01123046875, -15.626953125, -14.24267578125, -12.8583984375, -11.47412109375, -10.08984375, -8.70556640625, -7.3212890625, -5.93701171875, -4.552734375, -3.16845703125, -1.7841796875, -0.39990234375, 0.984375, 2.36865234375, 3.7529296875, 5.13720703125, 6.521484375, 7.90576171875, 9.2900390625, 10.67431640625, 12.05859375, 13.44287109375, 14.8271484375, 16.21142578125, 17.595703125, 18.97998046875, 20.3642578125, 21.74853515625, 23.1328125, 24.51708984375, 25.9013671875, 27.28564453125, 28.669921875, 30.05419921875, 31.4384765625, 32.82275390625, 34.20703125, 35.59130859375, 36.9755859375, 38.35986328125, 39.744140625, 41.12841796875, 42.5126953125, 43.89697265625, 45.28125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 3.0, 9.0, 10.0, 14.0, 30.0, 28.0, 37.0, 50.0, 65.0, 91.0, 88.0, 102.0, 86.0, 72.0, 69.0, 44.0, 48.0, 39.0, 31.0, 19.0, 9.0, 10.0, 4.0, 6.0, 9.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.478912353515625, -2.41290283203125, -2.346893310546875, -2.2808837890625, -2.214874267578125, -2.14886474609375, -2.082855224609375, -2.016845703125, -1.950836181640625, -1.88482666015625, -1.818817138671875, -1.7528076171875, -1.686798095703125, -1.62078857421875, -1.554779052734375, -1.48876953125, -1.422760009765625, -1.35675048828125, -1.290740966796875, -1.2247314453125, -1.158721923828125, -1.09271240234375, -1.026702880859375, -0.960693359375, -0.894683837890625, -0.82867431640625, -0.762664794921875, -0.6966552734375, -0.630645751953125, -0.56463623046875, -0.498626708984375, -0.4326171875, -0.366607666015625, -0.30059814453125, -0.234588623046875, -0.1685791015625, -0.102569580078125, -0.03656005859375, 0.029449462890625, 0.095458984375, 0.161468505859375, 0.22747802734375, 0.293487548828125, 0.3594970703125, 0.425506591796875, 0.49151611328125, 0.557525634765625, 0.62353515625, 0.689544677734375, 0.75555419921875, 0.821563720703125, 0.8875732421875, 0.953582763671875, 1.01959228515625, 1.085601806640625, 1.151611328125, 1.217620849609375, 1.28363037109375, 1.349639892578125, 1.4156494140625, 1.481658935546875, 1.54766845703125, 1.613677978515625, 1.6796875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 7.0, 4.0, 8.0, 9.0, 52.0, 433.0, 5235.0, 150086.0, 866268.0, 24935.0, 1311.0, 141.0, 20.0, 7.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0, -53.52392578125, -52.0478515625, -50.57177734375, -49.095703125, -47.61962890625, -46.1435546875, -44.66748046875, -43.19140625, -41.71533203125, -40.2392578125, -38.76318359375, -37.287109375, -35.81103515625, -34.3349609375, -32.85888671875, -31.3828125, -29.90673828125, -28.4306640625, -26.95458984375, -25.478515625, -24.00244140625, -22.5263671875, -21.05029296875, -19.57421875, -18.09814453125, -16.6220703125, -15.14599609375, -13.669921875, -12.19384765625, -10.7177734375, -9.24169921875, -7.765625, -6.28955078125, -4.8134765625, -3.33740234375, -1.861328125, -0.38525390625, 1.0908203125, 2.56689453125, 4.04296875, 5.51904296875, 6.9951171875, 8.47119140625, 9.947265625, 11.42333984375, 12.8994140625, 14.37548828125, 15.8515625, 17.32763671875, 18.8037109375, 20.27978515625, 21.755859375, 23.23193359375, 24.7080078125, 26.18408203125, 27.66015625, 29.13623046875, 30.6123046875, 32.08837890625, 33.564453125, 35.04052734375, 36.5166015625, 37.99267578125, 39.46875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 13.0, 14.0, 5.0, 15.0, 8.0, 17.0, 8.0, 12.0, 24.0, 25.0, 27.0, 22.0, 33.0, 30.0, 44.0, 36.0, 35.0, 38.0, 33.0, 41.0, 47.0, 40.0, 42.0, 42.0, 31.0, 38.0, 45.0, 25.0, 31.0, 20.0, 28.0, 9.0, 20.0, 16.0, 10.0, 7.0, 5.0, 9.0, 6.0, 6.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.34375, -7.11773681640625, -6.8917236328125, -6.66571044921875, -6.439697265625, -6.21368408203125, -5.9876708984375, -5.76165771484375, -5.53564453125, -5.30963134765625, -5.0836181640625, -4.85760498046875, -4.631591796875, -4.40557861328125, -4.1795654296875, -3.95355224609375, -3.7275390625, -3.50152587890625, -3.2755126953125, -3.04949951171875, -2.823486328125, -2.59747314453125, -2.3714599609375, -2.14544677734375, -1.91943359375, -1.69342041015625, -1.4674072265625, -1.24139404296875, -1.015380859375, -0.78936767578125, -0.5633544921875, -0.33734130859375, -0.111328125, 0.11468505859375, 0.3406982421875, 0.56671142578125, 0.792724609375, 1.01873779296875, 1.2447509765625, 1.47076416015625, 1.69677734375, 1.92279052734375, 2.1488037109375, 2.37481689453125, 2.600830078125, 2.82684326171875, 3.0528564453125, 3.27886962890625, 3.5048828125, 3.73089599609375, 3.9569091796875, 4.18292236328125, 4.408935546875, 4.63494873046875, 4.8609619140625, 5.08697509765625, 5.31298828125, 5.53900146484375, 5.7650146484375, 5.99102783203125, 6.217041015625, 6.44305419921875, 6.6690673828125, 6.89508056640625, 7.12109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 19.0, 14.0, 21.0, 37.0, 54.0, 92.0, 138.0, 260.0, 512.0, 1721.0, 9735.0, 625812.0, 398812.0, 8629.0, 1556.0, 506.0, 230.0, 125.0, 84.0, 43.0, 30.0, 33.0, 14.0, 15.0, 8.0, 9.0, 11.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.59375, -53.60595703125, -51.6181640625, -49.63037109375, -47.642578125, -45.65478515625, -43.6669921875, -41.67919921875, -39.69140625, -37.70361328125, -35.7158203125, -33.72802734375, -31.740234375, -29.75244140625, -27.7646484375, -25.77685546875, -23.7890625, -21.80126953125, -19.8134765625, -17.82568359375, -15.837890625, -13.85009765625, -11.8623046875, -9.87451171875, -7.88671875, -5.89892578125, -3.9111328125, -1.92333984375, 0.064453125, 2.05224609375, 4.0400390625, 6.02783203125, 8.015625, 10.00341796875, 11.9912109375, 13.97900390625, 15.966796875, 17.95458984375, 19.9423828125, 21.93017578125, 23.91796875, 25.90576171875, 27.8935546875, 29.88134765625, 31.869140625, 33.85693359375, 35.8447265625, 37.83251953125, 39.8203125, 41.80810546875, 43.7958984375, 45.78369140625, 47.771484375, 49.75927734375, 51.7470703125, 53.73486328125, 55.72265625, 57.71044921875, 59.6982421875, 61.68603515625, 63.673828125, 65.66162109375, 67.6494140625, 69.63720703125, 71.625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 12.0, 16.0, 16.0, 29.0, 53.0, 83.0, 126.0, 188.0, 175.0, 109.0, 56.0, 39.0, 27.0, 19.0, 9.0, 8.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0020923614501953125, -0.0020446032285690308, -0.001996845006942749, -0.0019490867853164673, -0.0019013285636901855, -0.0018535703420639038, -0.001805812120437622, -0.0017580538988113403, -0.0017102956771850586, -0.0016625374555587769, -0.0016147792339324951, -0.0015670210123062134, -0.0015192627906799316, -0.00147150456905365, -0.0014237463474273682, -0.0013759881258010864, -0.0013282299041748047, -0.001280471682548523, -0.0012327134609222412, -0.0011849552392959595, -0.0011371970176696777, -0.001089438796043396, -0.0010416805744171143, -0.0009939223527908325, -0.0009461641311645508, -0.000898405909538269, -0.0008506476879119873, -0.0008028894662857056, -0.0007551312446594238, -0.0007073730230331421, -0.0006596148014068604, -0.0006118565797805786, -0.0005640983581542969, -0.0005163401365280151, -0.0004685819149017334, -0.00042082369327545166, -0.0003730654716491699, -0.0003253072500228882, -0.00027754902839660645, -0.0002297908067703247, -0.00018203258514404297, -0.00013427436351776123, -8.651614189147949e-05, -3.8757920265197754e-05, 9.000301361083984e-06, 5.675852298736572e-05, 0.00010451674461364746, 0.0001522749662399292, 0.00020003318786621094, 0.0002477914094924927, 0.0002955496311187744, 0.00034330785274505615, 0.0003910660743713379, 0.00043882429599761963, 0.00048658251762390137, 0.0005343407392501831, 0.0005820989608764648, 0.0006298571825027466, 0.0006776154041290283, 0.0007253736257553101, 0.0007731318473815918, 0.0008208900690078735, 0.0008686482906341553, 0.000916406512260437, 0.0009641647338867188]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 0.0, 4.0, 3.0, 4.0, 9.0, 7.0, 14.0, 13.0, 12.0, 23.0, 36.0, 70.0, 64.0, 126.0, 210.0, 244.0, 412.0, 752.0, 1396.0, 2852.0, 7017.0, 25781.0, 231640.0, 695497.0, 62161.0, 12098.0, 3993.0, 1804.0, 902.0, 545.0, 315.0, 204.0, 109.0, 77.0, 39.0, 35.0, 33.0, 14.0, 13.0, 14.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.15625, -23.330078125, -22.50390625, -21.677734375, -20.8515625, -20.025390625, -19.19921875, -18.373046875, -17.546875, -16.720703125, -15.89453125, -15.068359375, -14.2421875, -13.416015625, -12.58984375, -11.763671875, -10.9375, -10.111328125, -9.28515625, -8.458984375, -7.6328125, -6.806640625, -5.98046875, -5.154296875, -4.328125, -3.501953125, -2.67578125, -1.849609375, -1.0234375, -0.197265625, 0.62890625, 1.455078125, 2.28125, 3.107421875, 3.93359375, 4.759765625, 5.5859375, 6.412109375, 7.23828125, 8.064453125, 8.890625, 9.716796875, 10.54296875, 11.369140625, 12.1953125, 13.021484375, 13.84765625, 14.673828125, 15.5, 16.326171875, 17.15234375, 17.978515625, 18.8046875, 19.630859375, 20.45703125, 21.283203125, 22.109375, 22.935546875, 23.76171875, 24.587890625, 25.4140625, 26.240234375, 27.06640625, 27.892578125, 28.71875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 18.0, 17.0, 17.0, 48.0, 121.0, 191.0, 250.0, 159.0, 72.0, 44.0, 19.0, 17.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9375, -34.02392578125, -33.1103515625, -32.19677734375, -31.283203125, -30.36962890625, -29.4560546875, -28.54248046875, -27.62890625, -26.71533203125, -25.8017578125, -24.88818359375, -23.974609375, -23.06103515625, -22.1474609375, -21.23388671875, -20.3203125, -19.40673828125, -18.4931640625, -17.57958984375, -16.666015625, -15.75244140625, -14.8388671875, -13.92529296875, -13.01171875, -12.09814453125, -11.1845703125, -10.27099609375, -9.357421875, -8.44384765625, -7.5302734375, -6.61669921875, -5.703125, -4.78955078125, -3.8759765625, -2.96240234375, -2.048828125, -1.13525390625, -0.2216796875, 0.69189453125, 1.60546875, 2.51904296875, 3.4326171875, 4.34619140625, 5.259765625, 6.17333984375, 7.0869140625, 8.00048828125, 8.9140625, 9.82763671875, 10.7412109375, 11.65478515625, 12.568359375, 13.48193359375, 14.3955078125, 15.30908203125, 16.22265625, 17.13623046875, 18.0498046875, 18.96337890625, 19.876953125, 20.79052734375, 21.7041015625, 22.61767578125, 23.53125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 17.0, 35.0, 54.0, 138.0, 226.0, 233.0, 144.0, 64.0, 40.0, 19.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-170.86727905273438, -165.98602294921875, -161.10476684570312, -156.22352600097656, -151.34226989746094, -146.4610137939453, -141.5797576904297, -136.69850158691406, -131.8172607421875, -126.93600463867188, -122.05475616455078, -117.17350006103516, -112.29225158691406, -107.41099548339844, -102.52973937988281, -97.64848327636719, -92.76722717285156, -87.88597106933594, -83.00472259521484, -78.12346649169922, -73.24221801757812, -68.3609619140625, -63.479705810546875, -58.598453521728516, -53.717201232910156, -48.8359489440918, -43.95469665527344, -39.07344055175781, -34.19218826293945, -29.310935974121094, -24.4296817779541, -19.54842758178711, -14.66717529296875, -9.785922050476074, -4.904668807983398, -0.023415565490722656, 4.857837677001953, 9.739089965820312, 14.620344161987305, 19.501598358154297, 24.382850646972656, 29.264102935791016, 34.145355224609375, 39.026611328125, 43.90786361694336, 48.78911590576172, 53.670372009277344, 58.5516242980957, 63.43287658691406, 68.31413269042969, 73.19538116455078, 78.0766372680664, 82.9578857421875, 87.83914184570312, 92.72039794921875, 97.60165405273438, 102.48290252685547, 107.3641586303711, 112.24540710449219, 117.12666320800781, 122.00791931152344, 126.88916778564453, 131.77041625976562, 136.65167236328125, 141.53292846679688]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 6.0, 12.0, 17.0, 31.0, 39.0, 43.0, 61.0, 85.0, 87.0, 119.0, 120.0, 90.0, 72.0, 60.0, 54.0, 28.0, 20.0, 12.0, 13.0, 9.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-156.28732299804688, -151.85324096679688, -147.41915893554688, -142.98509216308594, -138.55101013183594, -134.11692810058594, -129.682861328125, -125.248779296875, -120.814697265625, -116.380615234375, -111.94654083251953, -107.51246643066406, -103.07838439941406, -98.64430236816406, -94.2102279663086, -89.77615356445312, -85.34207153320312, -80.90798950195312, -76.47391510009766, -72.03984069824219, -67.60575866699219, -63.17168045043945, -58.73760223388672, -54.303524017333984, -49.86944580078125, -45.435367584228516, -41.00128936767578, -36.56721115112305, -32.13313293457031, -27.699054718017578, -23.264976501464844, -18.83089828491211, -14.396812438964844, -9.96273422241211, -5.528656005859375, -1.0945777893066406, 3.3395004272460938, 7.773578643798828, 12.207656860351562, 16.641735076904297, 21.07581329345703, 25.509891510009766, 29.9439697265625, 34.378047943115234, 38.81212615966797, 43.2462043762207, 47.68028259277344, 52.11436080932617, 56.548439025878906, 60.98251724243164, 65.41659545898438, 69.85067749023438, 74.28475189208984, 78.71882629394531, 83.15290832519531, 87.58699035644531, 92.02106475830078, 96.45513916015625, 100.88922119140625, 105.32330322265625, 109.75737762451172, 114.19145202636719, 118.62553405761719, 123.05961608886719, 127.49369049072266]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 7.0, 3.0, 6.0, 8.0, 10.0, 9.0, 6.0, 7.0, 10.0, 13.0, 14.0, 19.0, 17.0, 36.0, 45.0, 60.0, 93.0, 129.0, 220.0, 382.0, 728.0, 1692.0, 4401.0, 17273.0, 225991.0, 3891800.0, 40795.0, 7033.0, 2100.0, 736.0, 329.0, 149.0, 65.0, 48.0, 25.0, 8.0, 6.0, 4.0], "bins": [-125.9375, -123.478515625, -121.01953125, -118.560546875, -116.1015625, -113.642578125, -111.18359375, -108.724609375, -106.265625, -103.806640625, -101.34765625, -98.888671875, -96.4296875, -93.970703125, -91.51171875, -89.052734375, -86.59375, -84.134765625, -81.67578125, -79.216796875, -76.7578125, -74.298828125, -71.83984375, -69.380859375, -66.921875, -64.462890625, -62.00390625, -59.544921875, -57.0859375, -54.626953125, -52.16796875, -49.708984375, -47.25, -44.791015625, -42.33203125, -39.873046875, -37.4140625, -34.955078125, -32.49609375, -30.037109375, -27.578125, -25.119140625, -22.66015625, -20.201171875, -17.7421875, -15.283203125, -12.82421875, -10.365234375, -7.90625, -5.447265625, -2.98828125, -0.529296875, 1.9296875, 4.388671875, 6.84765625, 9.306640625, 11.765625, 14.224609375, 16.68359375, 19.142578125, 21.6015625, 24.060546875, 26.51953125, 28.978515625, 31.4375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 8.0, 2.0, 8.0, 5.0, 11.0, 8.0, 38.0, 39.0, 74.0, 100.0, 146.0, 143.0, 130.0, 112.0, 69.0, 50.0, 33.0, 11.0, 6.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.74609375, -5.62725830078125, -5.5084228515625, -5.38958740234375, -5.270751953125, -5.15191650390625, -5.0330810546875, -4.91424560546875, -4.79541015625, -4.67657470703125, -4.5577392578125, -4.43890380859375, -4.320068359375, -4.20123291015625, -4.0823974609375, -3.96356201171875, -3.8447265625, -3.72589111328125, -3.6070556640625, -3.48822021484375, -3.369384765625, -3.25054931640625, -3.1317138671875, -3.01287841796875, -2.89404296875, -2.77520751953125, -2.6563720703125, -2.53753662109375, -2.418701171875, -2.29986572265625, -2.1810302734375, -2.06219482421875, -1.943359375, -1.82452392578125, -1.7056884765625, -1.58685302734375, -1.468017578125, -1.34918212890625, -1.2303466796875, -1.11151123046875, -0.99267578125, -0.87384033203125, -0.7550048828125, -0.63616943359375, -0.517333984375, -0.39849853515625, -0.2796630859375, -0.16082763671875, -0.0419921875, 0.07684326171875, 0.1956787109375, 0.31451416015625, 0.433349609375, 0.55218505859375, 0.6710205078125, 0.78985595703125, 0.90869140625, 1.02752685546875, 1.1463623046875, 1.26519775390625, 1.384033203125, 1.50286865234375, 1.6217041015625, 1.74053955078125, 1.859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 11.0, 7.0, 12.0, 25.0, 44.0, 47.0, 106.0, 238.0, 1802.0, 3800395.0, 389952.0, 1304.0, 181.0, 58.0, 29.0, 21.0, 7.0, 13.0, 5.0, 4.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.375, -191.962890625, -185.55078125, -179.138671875, -172.7265625, -166.314453125, -159.90234375, -153.490234375, -147.078125, -140.666015625, -134.25390625, -127.841796875, -121.4296875, -115.017578125, -108.60546875, -102.193359375, -95.78125, -89.369140625, -82.95703125, -76.544921875, -70.1328125, -63.720703125, -57.30859375, -50.896484375, -44.484375, -38.072265625, -31.66015625, -25.248046875, -18.8359375, -12.423828125, -6.01171875, 0.400390625, 6.8125, 13.224609375, 19.63671875, 26.048828125, 32.4609375, 38.873046875, 45.28515625, 51.697265625, 58.109375, 64.521484375, 70.93359375, 77.345703125, 83.7578125, 90.169921875, 96.58203125, 102.994140625, 109.40625, 115.818359375, 122.23046875, 128.642578125, 135.0546875, 141.466796875, 147.87890625, 154.291015625, 160.703125, 167.115234375, 173.52734375, 179.939453125, 186.3515625, 192.763671875, 199.17578125, 205.587890625, 212.0]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 7.0, 6.0, 5.0, 5.0, 10.0, 8.0, 16.0, 34.0, 44.0, 89.0, 169.0, 465.0, 2108.0, 576.0, 211.0, 119.0, 64.0, 46.0, 37.0, 18.0, 17.0, 6.0, 10.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.9931640625, -6.771484375, -6.5498046875, -6.328125, -6.1064453125, -5.884765625, -5.6630859375, -5.44140625, -5.2197265625, -4.998046875, -4.7763671875, -4.5546875, -4.3330078125, -4.111328125, -3.8896484375, -3.66796875, -3.4462890625, -3.224609375, -3.0029296875, -2.78125, -2.5595703125, -2.337890625, -2.1162109375, -1.89453125, -1.6728515625, -1.451171875, -1.2294921875, -1.0078125, -0.7861328125, -0.564453125, -0.3427734375, -0.12109375, 0.1005859375, 0.322265625, 0.5439453125, 0.765625, 0.9873046875, 1.208984375, 1.4306640625, 1.65234375, 1.8740234375, 2.095703125, 2.3173828125, 2.5390625, 2.7607421875, 2.982421875, 3.2041015625, 3.42578125, 3.6474609375, 3.869140625, 4.0908203125, 4.3125, 4.5341796875, 4.755859375, 4.9775390625, 5.19921875, 5.4208984375, 5.642578125, 5.8642578125, 6.0859375, 6.3076171875, 6.529296875, 6.7509765625, 6.97265625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 10.0, 7.0, 38.0, 146.0, 339.0, 286.0, 117.0, 38.0, 20.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.94429588317871, -28.530942916870117, -26.117589950561523, -23.704235076904297, -21.290882110595703, -18.87752914428711, -16.464176177978516, -14.050823211669922, -11.637470245361328, -9.224117279052734, -6.810763835906982, -4.3974103927612305, -1.9840574264526367, 0.42929553985595703, 2.842649459838867, 5.256002426147461, 7.669355392456055, 10.082708358764648, 12.496061325073242, 14.909415245056152, 17.322769165039062, 19.736122131347656, 22.14947509765625, 24.562828063964844, 26.976181030273438, 29.38953399658203, 31.802886962890625, 34.21623992919922, 36.62959289550781, 39.042945861816406, 41.456298828125, 43.869651794433594, 46.28300476074219, 48.69635772705078, 51.109710693359375, 53.52306365966797, 55.93641662597656, 58.349769592285156, 60.76312255859375, 63.176475524902344, 65.58982849121094, 68.00318145751953, 70.41653442382812, 72.82988739013672, 75.24324035644531, 77.6565933227539, 80.0699462890625, 82.4832992553711, 84.89665222167969, 87.31000518798828, 89.72335815429688, 92.13671112060547, 94.55006408691406, 96.96341705322266, 99.37677001953125, 101.79012298583984, 104.20348358154297, 106.61683654785156, 109.03018951416016, 111.44354248046875, 113.85689544677734, 116.27024841308594, 118.68360137939453, 121.09695434570312, 123.51030731201172]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 18.0, 30.0, 59.0, 76.0, 126.0, 106.0, 136.0, 127.0, 103.0, 73.0, 58.0, 28.0, 23.0, 12.0, 10.0, 1.0, 1.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.632495880126953, -29.067413330078125, -27.502330780029297, -25.937246322631836, -24.372163772583008, -22.80708122253418, -21.24199676513672, -19.67691421508789, -18.111831665039062, -16.546749114990234, -14.98166561126709, -13.416582107543945, -11.851499557495117, -10.286417007446289, -8.721333503723145, -7.15625, -5.591167449951172, -4.0260844230651855, -2.461001396179199, -0.8959183692932129, 0.6691646575927734, 2.2342476844787598, 3.799330711364746, 5.364414215087891, 6.929496765136719, 8.494579315185547, 10.059662818908691, 11.624746322631836, 13.189828872680664, 14.754911422729492, 16.319995880126953, 17.88507843017578, 19.450164794921875, 21.015247344970703, 22.58032989501953, 24.145414352416992, 25.71049690246582, 27.27557945251465, 28.84066390991211, 30.405746459960938, 31.970829010009766, 33.535911560058594, 35.10099411010742, 36.66607666015625, 38.231163024902344, 39.79624557495117, 41.361328125, 42.92641067504883, 44.491493225097656, 46.056575775146484, 47.62165832519531, 49.18674087524414, 50.75182342529297, 52.31690979003906, 53.88199234008789, 55.44707489013672, 57.01215744018555, 58.577239990234375, 60.1423225402832, 61.70740509033203, 63.272491455078125, 64.83757019042969, 66.40265655517578, 67.96774291992188, 69.53282165527344]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 1.0, 10.0, 19.0, 25.0, 53.0, 71.0, 108.0, 152.0, 309.0, 518.0, 973.0, 1958.0, 3919.0, 7971.0, 17873.0, 41680.0, 101249.0, 230365.0, 316331.0, 186329.0, 78814.0, 32628.0, 14059.0, 6584.0, 3088.0, 1550.0, 817.0, 468.0, 259.0, 142.0, 80.0, 52.0, 37.0, 18.0, 10.0, 9.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7578125, -10.4034423828125, -10.049072265625, -9.6947021484375, -9.34033203125, -8.9859619140625, -8.631591796875, -8.2772216796875, -7.9228515625, -7.5684814453125, -7.214111328125, -6.8597412109375, -6.50537109375, -6.1510009765625, -5.796630859375, -5.4422607421875, -5.087890625, -4.7335205078125, -4.379150390625, -4.0247802734375, -3.67041015625, -3.3160400390625, -2.961669921875, -2.6072998046875, -2.2529296875, -1.8985595703125, -1.544189453125, -1.1898193359375, -0.83544921875, -0.4810791015625, -0.126708984375, 0.2276611328125, 0.58203125, 0.9364013671875, 1.290771484375, 1.6451416015625, 1.99951171875, 2.3538818359375, 2.708251953125, 3.0626220703125, 3.4169921875, 3.7713623046875, 4.125732421875, 4.4801025390625, 4.83447265625, 5.1888427734375, 5.543212890625, 5.8975830078125, 6.251953125, 6.6063232421875, 6.960693359375, 7.3150634765625, 7.66943359375, 8.0238037109375, 8.378173828125, 8.7325439453125, 9.0869140625, 9.4412841796875, 9.795654296875, 10.1500244140625, 10.50439453125, 10.8587646484375, 11.213134765625, 11.5675048828125, 11.921875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 5.0, 4.0, 8.0, 10.0, 8.0, 15.0, 10.0, 16.0, 22.0, 30.0, 27.0, 31.0, 32.0, 37.0, 33.0, 42.0, 42.0, 49.0, 45.0, 46.0, 52.0, 53.0, 47.0, 45.0, 31.0, 32.0, 27.0, 26.0, 32.0, 20.0, 34.0, 21.0, 13.0, 15.0, 11.0, 8.0, 5.0, 6.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.193359375, -1.15155029296875, -1.1097412109375, -1.06793212890625, -1.026123046875, -0.98431396484375, -0.9425048828125, -0.90069580078125, -0.85888671875, -0.81707763671875, -0.7752685546875, -0.73345947265625, -0.691650390625, -0.64984130859375, -0.6080322265625, -0.56622314453125, -0.5244140625, -0.48260498046875, -0.4407958984375, -0.39898681640625, -0.357177734375, -0.31536865234375, -0.2735595703125, -0.23175048828125, -0.18994140625, -0.14813232421875, -0.1063232421875, -0.06451416015625, -0.022705078125, 0.01910400390625, 0.0609130859375, 0.10272216796875, 0.14453125, 0.18634033203125, 0.2281494140625, 0.26995849609375, 0.311767578125, 0.35357666015625, 0.3953857421875, 0.43719482421875, 0.47900390625, 0.52081298828125, 0.5626220703125, 0.60443115234375, 0.646240234375, 0.68804931640625, 0.7298583984375, 0.77166748046875, 0.8134765625, 0.85528564453125, 0.8970947265625, 0.93890380859375, 0.980712890625, 1.02252197265625, 1.0643310546875, 1.10614013671875, 1.14794921875, 1.18975830078125, 1.2315673828125, 1.27337646484375, 1.315185546875, 1.35699462890625, 1.3988037109375, 1.44061279296875, 1.482421875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 14.0, 9.0, 27.0, 34.0, 55.0, 75.0, 125.0, 184.0, 312.0, 523.0, 1018.0, 1813.0, 3997.0, 9232.0, 24464.0, 73920.0, 229858.0, 399665.0, 202885.0, 63465.0, 21574.0, 8043.0, 3549.0, 1603.0, 856.0, 486.0, 264.0, 175.0, 121.0, 68.0, 43.0, 40.0, 26.0, 10.0, 8.0, 7.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.828125, -14.3709716796875, -13.913818359375, -13.4566650390625, -12.99951171875, -12.5423583984375, -12.085205078125, -11.6280517578125, -11.1708984375, -10.7137451171875, -10.256591796875, -9.7994384765625, -9.34228515625, -8.8851318359375, -8.427978515625, -7.9708251953125, -7.513671875, -7.0565185546875, -6.599365234375, -6.1422119140625, -5.68505859375, -5.2279052734375, -4.770751953125, -4.3135986328125, -3.8564453125, -3.3992919921875, -2.942138671875, -2.4849853515625, -2.02783203125, -1.5706787109375, -1.113525390625, -0.6563720703125, -0.19921875, 0.2579345703125, 0.715087890625, 1.1722412109375, 1.62939453125, 2.0865478515625, 2.543701171875, 3.0008544921875, 3.4580078125, 3.9151611328125, 4.372314453125, 4.8294677734375, 5.28662109375, 5.7437744140625, 6.200927734375, 6.6580810546875, 7.115234375, 7.5723876953125, 8.029541015625, 8.4866943359375, 8.94384765625, 9.4010009765625, 9.858154296875, 10.3153076171875, 10.7724609375, 11.2296142578125, 11.686767578125, 12.1439208984375, 12.60107421875, 13.0582275390625, 13.515380859375, 13.9725341796875, 14.4296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 5.0, 13.0, 18.0, 15.0, 14.0, 18.0, 30.0, 15.0, 26.0, 42.0, 45.0, 39.0, 34.0, 53.0, 43.0, 42.0, 41.0, 40.0, 39.0, 50.0, 56.0, 44.0, 48.0, 29.0, 31.0, 30.0, 25.0, 20.0, 17.0, 11.0, 10.0, 8.0, 5.0, 6.0, 5.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.094970703125, -8.82275390625, -8.550537109375, -8.2783203125, -8.006103515625, -7.73388671875, -7.461669921875, -7.189453125, -6.917236328125, -6.64501953125, -6.372802734375, -6.1005859375, -5.828369140625, -5.55615234375, -5.283935546875, -5.01171875, -4.739501953125, -4.46728515625, -4.195068359375, -3.9228515625, -3.650634765625, -3.37841796875, -3.106201171875, -2.833984375, -2.561767578125, -2.28955078125, -2.017333984375, -1.7451171875, -1.472900390625, -1.20068359375, -0.928466796875, -0.65625, -0.384033203125, -0.11181640625, 0.160400390625, 0.4326171875, 0.704833984375, 0.97705078125, 1.249267578125, 1.521484375, 1.793701171875, 2.06591796875, 2.338134765625, 2.6103515625, 2.882568359375, 3.15478515625, 3.427001953125, 3.69921875, 3.971435546875, 4.24365234375, 4.515869140625, 4.7880859375, 5.060302734375, 5.33251953125, 5.604736328125, 5.876953125, 6.149169921875, 6.42138671875, 6.693603515625, 6.9658203125, 7.238037109375, 7.51025390625, 7.782470703125, 8.0546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 5.0, 19.0, 16.0, 30.0, 47.0, 58.0, 106.0, 193.0, 315.0, 555.0, 1062.0, 2209.0, 5027.0, 11994.0, 36057.0, 130817.0, 411692.0, 319445.0, 86851.0, 25320.0, 9133.0, 3834.0, 1740.0, 893.0, 464.0, 249.0, 150.0, 92.0, 61.0, 35.0, 23.0, 14.0, 13.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.015625, -11.66064453125, -11.3056640625, -10.95068359375, -10.595703125, -10.24072265625, -9.8857421875, -9.53076171875, -9.17578125, -8.82080078125, -8.4658203125, -8.11083984375, -7.755859375, -7.40087890625, -7.0458984375, -6.69091796875, -6.3359375, -5.98095703125, -5.6259765625, -5.27099609375, -4.916015625, -4.56103515625, -4.2060546875, -3.85107421875, -3.49609375, -3.14111328125, -2.7861328125, -2.43115234375, -2.076171875, -1.72119140625, -1.3662109375, -1.01123046875, -0.65625, -0.30126953125, 0.0537109375, 0.40869140625, 0.763671875, 1.11865234375, 1.4736328125, 1.82861328125, 2.18359375, 2.53857421875, 2.8935546875, 3.24853515625, 3.603515625, 3.95849609375, 4.3134765625, 4.66845703125, 5.0234375, 5.37841796875, 5.7333984375, 6.08837890625, 6.443359375, 6.79833984375, 7.1533203125, 7.50830078125, 7.86328125, 8.21826171875, 8.5732421875, 8.92822265625, 9.283203125, 9.63818359375, 9.9931640625, 10.34814453125, 10.703125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 1.0, 4.0, 7.0, 9.0, 19.0, 15.0, 22.0, 16.0, 35.0, 46.0, 38.0, 41.0, 71.0, 68.0, 71.0, 66.0, 79.0, 63.0, 55.0, 71.0, 29.0, 30.0, 24.0, 19.0, 22.0, 15.0, 15.0, 11.0, 3.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009045600891113281, -0.0008744075894355774, -0.0008442550897598267, -0.0008141025900840759, -0.0007839500904083252, -0.0007537975907325745, -0.0007236450910568237, -0.000693492591381073, -0.0006633400917053223, -0.0006331875920295715, -0.0006030350923538208, -0.0005728825926780701, -0.0005427300930023193, -0.0005125775933265686, -0.00048242509365081787, -0.00045227259397506714, -0.0004221200942993164, -0.0003919675946235657, -0.00036181509494781494, -0.0003316625952720642, -0.0003015100955963135, -0.00027135759592056274, -0.000241205096244812, -0.00021105259656906128, -0.00018090009689331055, -0.00015074759721755981, -0.00012059509754180908, -9.044259786605835e-05, -6.029009819030762e-05, -3.0137598514556885e-05, 1.4901161193847656e-08, 3.016740083694458e-05, 6.031990051269531e-05, 9.047240018844604e-05, 0.00012062489986419678, 0.0001507773995399475, 0.00018092989921569824, 0.00021108239889144897, 0.0002412348985671997, 0.00027138739824295044, 0.00030153989791870117, 0.0003316923975944519, 0.00036184489727020264, 0.00039199739694595337, 0.0004221498966217041, 0.00045230239629745483, 0.00048245489597320557, 0.0005126073956489563, 0.000542759895324707, 0.0005729123950004578, 0.0006030648946762085, 0.0006332173943519592, 0.00066336989402771, 0.0006935223937034607, 0.0007236748933792114, 0.0007538273930549622, 0.0007839798927307129, 0.0008141323924064636, 0.0008442848920822144, 0.0008744373917579651, 0.0009045898914337158, 0.0009347423911094666, 0.0009648948907852173, 0.000995047390460968, 0.0010251998901367188]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 4.0, 4.0, 12.0, 11.0, 19.0, 20.0, 46.0, 43.0, 76.0, 92.0, 144.0, 249.0, 341.0, 583.0, 933.0, 1552.0, 2872.0, 5637.0, 11429.0, 28419.0, 77852.0, 228288.0, 376598.0, 199784.0, 67176.0, 24557.0, 10358.0, 4968.0, 2551.0, 1404.0, 899.0, 561.0, 336.0, 254.0, 151.0, 100.0, 47.0, 42.0, 32.0, 36.0, 18.0, 8.0, 9.0, 12.0, 9.0, 3.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-8.5234375, -8.2606201171875, -7.997802734375, -7.7349853515625, -7.47216796875, -7.2093505859375, -6.946533203125, -6.6837158203125, -6.4208984375, -6.1580810546875, -5.895263671875, -5.6324462890625, -5.36962890625, -5.1068115234375, -4.843994140625, -4.5811767578125, -4.318359375, -4.0555419921875, -3.792724609375, -3.5299072265625, -3.26708984375, -3.0042724609375, -2.741455078125, -2.4786376953125, -2.2158203125, -1.9530029296875, -1.690185546875, -1.4273681640625, -1.16455078125, -0.9017333984375, -0.638916015625, -0.3760986328125, -0.11328125, 0.1495361328125, 0.412353515625, 0.6751708984375, 0.93798828125, 1.2008056640625, 1.463623046875, 1.7264404296875, 1.9892578125, 2.2520751953125, 2.514892578125, 2.7777099609375, 3.04052734375, 3.3033447265625, 3.566162109375, 3.8289794921875, 4.091796875, 4.3546142578125, 4.617431640625, 4.8802490234375, 5.14306640625, 5.4058837890625, 5.668701171875, 5.9315185546875, 6.1943359375, 6.4571533203125, 6.719970703125, 6.9827880859375, 7.24560546875, 7.5084228515625, 7.771240234375, 8.0340576171875, 8.296875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 8.0, 4.0, 8.0, 10.0, 18.0, 19.0, 27.0, 37.0, 35.0, 44.0, 66.0, 85.0, 85.0, 78.0, 91.0, 72.0, 78.0, 51.0, 44.0, 28.0, 29.0, 25.0, 21.0, 5.0, 1.0, 5.0, 9.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8359375, -6.611572265625, -6.38720703125, -6.162841796875, -5.9384765625, -5.714111328125, -5.48974609375, -5.265380859375, -5.041015625, -4.816650390625, -4.59228515625, -4.367919921875, -4.1435546875, -3.919189453125, -3.69482421875, -3.470458984375, -3.24609375, -3.021728515625, -2.79736328125, -2.572998046875, -2.3486328125, -2.124267578125, -1.89990234375, -1.675537109375, -1.451171875, -1.226806640625, -1.00244140625, -0.778076171875, -0.5537109375, -0.329345703125, -0.10498046875, 0.119384765625, 0.34375, 0.568115234375, 0.79248046875, 1.016845703125, 1.2412109375, 1.465576171875, 1.68994140625, 1.914306640625, 2.138671875, 2.363037109375, 2.58740234375, 2.811767578125, 3.0361328125, 3.260498046875, 3.48486328125, 3.709228515625, 3.93359375, 4.157958984375, 4.38232421875, 4.606689453125, 4.8310546875, 5.055419921875, 5.27978515625, 5.504150390625, 5.728515625, 5.952880859375, 6.17724609375, 6.401611328125, 6.6259765625, 6.850341796875, 7.07470703125, 7.299072265625, 7.5234375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 7.0, 14.0, 27.0, 45.0, 97.0, 138.0, 170.0, 188.0, 123.0, 74.0, 38.0, 25.0, 18.0, 14.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.03781127929688, -68.00983428955078, -63.98186492919922, -59.953887939453125, -55.9259147644043, -51.89794158935547, -47.869964599609375, -43.84199142456055, -39.81401824951172, -35.78604507446289, -31.75806999206543, -27.73009490966797, -23.70212173461914, -19.674148559570312, -15.646173477172852, -11.61819839477539, -7.5902252197265625, -3.562251091003418, 0.46572303771972656, 4.493697166442871, 8.521671295166016, 12.549644470214844, 16.577619552612305, 20.605594635009766, 24.633567810058594, 28.661540985107422, 32.68951416015625, 36.717491149902344, 40.74546432495117, 44.7734375, 48.801414489746094, 52.82938766479492, 56.85737609863281, 60.88534927368164, 64.91332244873047, 68.94129943847656, 72.96926879882812, 76.99724578857422, 81.02522277832031, 85.05319213867188, 89.08116912841797, 93.10914611816406, 97.13711547851562, 101.16509246826172, 105.19306945800781, 109.22103881835938, 113.24901580810547, 117.27699279785156, 121.30496215820312, 125.33293914794922, 129.3609161376953, 133.38888549804688, 137.41685485839844, 141.44482421875, 145.47280883789062, 149.5007781982422, 153.52874755859375, 157.5567169189453, 161.58470153808594, 165.6126708984375, 169.64064025878906, 173.66860961914062, 177.69659423828125, 181.7245635986328, 185.75254821777344]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 10.0, 8.0, 17.0, 23.0, 22.0, 26.0, 35.0, 39.0, 40.0, 57.0, 26.0, 57.0, 46.0, 59.0, 64.0, 61.0, 57.0, 50.0, 45.0, 38.0, 32.0, 39.0, 32.0, 23.0, 16.0, 17.0, 12.0, 12.0, 10.0, 5.0, 0.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.27465057373047, -73.8612060546875, -71.44775390625, -69.03430938720703, -66.62086486816406, -64.20741271972656, -61.793968200683594, -59.380523681640625, -56.96707534790039, -54.553627014160156, -52.14018249511719, -49.72673416137695, -47.31328582763672, -44.89984130859375, -42.486392974853516, -40.07294464111328, -37.65950012207031, -35.24605178833008, -32.83260726928711, -30.419158935546875, -28.005712509155273, -25.592266082763672, -23.178817749023438, -20.765371322631836, -18.351924896240234, -15.938478469848633, -13.525031089782715, -11.111583709716797, -8.698137283325195, -6.284690856933594, -3.871243476867676, -1.4577960968017578, 0.9556427001953125, 3.3690896034240723, 5.782536506652832, 8.19598388671875, 10.609430313110352, 13.022876739501953, 15.436324119567871, 17.84977149963379, 20.26321792602539, 22.676664352416992, 25.090110778808594, 27.503559112548828, 29.91700553894043, 32.33045196533203, 34.743900299072266, 37.1573486328125, 39.57079315185547, 41.9842414855957, 44.39768600463867, 46.811134338378906, 49.224578857421875, 51.63802719116211, 54.051475524902344, 56.46492004394531, 58.87836837768555, 61.29181671142578, 63.70526123046875, 66.11870574951172, 68.53215789794922, 70.94560241699219, 73.35904693603516, 75.77249908447266, 78.18594360351562]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 1.0, 9.0, 10.0, 25.0, 10.0, 18.0, 29.0, 32.0, 53.0, 79.0, 236.0, 816.0, 3805.0, 24552.0, 892691.0, 3236081.0, 29072.0, 4841.0, 1169.0, 350.0, 142.0, 74.0, 52.0, 36.0, 24.0, 14.0, 16.0, 6.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -70.7880859375, -68.263671875, -65.7392578125, -63.21484375, -60.6904296875, -58.166015625, -55.6416015625, -53.1171875, -50.5927734375, -48.068359375, -45.5439453125, -43.01953125, -40.4951171875, -37.970703125, -35.4462890625, -32.921875, -30.3974609375, -27.873046875, -25.3486328125, -22.82421875, -20.2998046875, -17.775390625, -15.2509765625, -12.7265625, -10.2021484375, -7.677734375, -5.1533203125, -2.62890625, -0.1044921875, 2.419921875, 4.9443359375, 7.46875, 9.9931640625, 12.517578125, 15.0419921875, 17.56640625, 20.0908203125, 22.615234375, 25.1396484375, 27.6640625, 30.1884765625, 32.712890625, 35.2373046875, 37.76171875, 40.2861328125, 42.810546875, 45.3349609375, 47.859375, 50.3837890625, 52.908203125, 55.4326171875, 57.95703125, 60.4814453125, 63.005859375, 65.5302734375, 68.0546875, 70.5791015625, 73.103515625, 75.6279296875, 78.15234375, 80.6767578125, 83.201171875, 85.7255859375, 88.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 7.0, 10.0, 17.0, 11.0, 16.0, 26.0, 29.0, 39.0, 44.0, 31.0, 53.0, 54.0, 49.0, 69.0, 71.0, 61.0, 53.0, 59.0, 44.0, 56.0, 38.0, 29.0, 31.0, 21.0, 17.0, 11.0, 12.0, 10.0, 8.0, 5.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.969757080078125, -1.89849853515625, -1.827239990234375, -1.7559814453125, -1.684722900390625, -1.61346435546875, -1.542205810546875, -1.470947265625, -1.399688720703125, -1.32843017578125, -1.257171630859375, -1.1859130859375, -1.114654541015625, -1.04339599609375, -0.972137451171875, -0.90087890625, -0.829620361328125, -0.75836181640625, -0.687103271484375, -0.6158447265625, -0.544586181640625, -0.47332763671875, -0.402069091796875, -0.330810546875, -0.259552001953125, -0.18829345703125, -0.117034912109375, -0.0457763671875, 0.025482177734375, 0.09674072265625, 0.167999267578125, 0.2392578125, 0.310516357421875, 0.38177490234375, 0.453033447265625, 0.5242919921875, 0.595550537109375, 0.66680908203125, 0.738067626953125, 0.809326171875, 0.880584716796875, 0.95184326171875, 1.023101806640625, 1.0943603515625, 1.165618896484375, 1.23687744140625, 1.308135986328125, 1.37939453125, 1.450653076171875, 1.52191162109375, 1.593170166015625, 1.6644287109375, 1.735687255859375, 1.80694580078125, 1.878204345703125, 1.949462890625, 2.020721435546875, 2.09197998046875, 2.163238525390625, 2.2344970703125, 2.305755615234375, 2.37701416015625, 2.448272705078125, 2.51953125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 4.0, 7.0, 6.0, 10.0, 9.0, 13.0, 14.0, 25.0, 18.0, 37.0, 40.0, 44.0, 75.0, 136.0, 317.0, 847.0, 2888.0, 14894.0, 144263.0, 3834495.0, 173201.0, 17792.0, 3569.0, 949.0, 265.0, 127.0, 77.0, 36.0, 29.0, 22.0, 18.0, 15.0, 12.0, 7.0, 8.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.125, -43.64697265625, -42.1689453125, -40.69091796875, -39.212890625, -37.73486328125, -36.2568359375, -34.77880859375, -33.30078125, -31.82275390625, -30.3447265625, -28.86669921875, -27.388671875, -25.91064453125, -24.4326171875, -22.95458984375, -21.4765625, -19.99853515625, -18.5205078125, -17.04248046875, -15.564453125, -14.08642578125, -12.6083984375, -11.13037109375, -9.65234375, -8.17431640625, -6.6962890625, -5.21826171875, -3.740234375, -2.26220703125, -0.7841796875, 0.69384765625, 2.171875, 3.64990234375, 5.1279296875, 6.60595703125, 8.083984375, 9.56201171875, 11.0400390625, 12.51806640625, 13.99609375, 15.47412109375, 16.9521484375, 18.43017578125, 19.908203125, 21.38623046875, 22.8642578125, 24.34228515625, 25.8203125, 27.29833984375, 28.7763671875, 30.25439453125, 31.732421875, 33.21044921875, 34.6884765625, 36.16650390625, 37.64453125, 39.12255859375, 40.6005859375, 42.07861328125, 43.556640625, 45.03466796875, 46.5126953125, 47.99072265625, 49.46875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 10.0, 17.0, 21.0, 36.0, 48.0, 99.0, 195.0, 595.0, 2172.0, 468.0, 172.0, 91.0, 52.0, 32.0, 16.0, 14.0, 10.0, 11.0, 7.0, 3.0, 7.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.875, -13.58258056640625, -13.2901611328125, -12.99774169921875, -12.705322265625, -12.41290283203125, -12.1204833984375, -11.82806396484375, -11.53564453125, -11.24322509765625, -10.9508056640625, -10.65838623046875, -10.365966796875, -10.07354736328125, -9.7811279296875, -9.48870849609375, -9.1962890625, -8.90386962890625, -8.6114501953125, -8.31903076171875, -8.026611328125, -7.73419189453125, -7.4417724609375, -7.14935302734375, -6.85693359375, -6.56451416015625, -6.2720947265625, -5.97967529296875, -5.687255859375, -5.39483642578125, -5.1024169921875, -4.80999755859375, -4.517578125, -4.22515869140625, -3.9327392578125, -3.64031982421875, -3.347900390625, -3.05548095703125, -2.7630615234375, -2.47064208984375, -2.17822265625, -1.88580322265625, -1.5933837890625, -1.30096435546875, -1.008544921875, -0.71612548828125, -0.4237060546875, -0.13128662109375, 0.1611328125, 0.45355224609375, 0.7459716796875, 1.03839111328125, 1.330810546875, 1.62322998046875, 1.9156494140625, 2.20806884765625, 2.50048828125, 2.79290771484375, 3.0853271484375, 3.37774658203125, 3.670166015625, 3.96258544921875, 4.2550048828125, 4.54742431640625, 4.83984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 20.0, 117.0, 467.0, 341.0, 53.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.976234436035156, -31.376708984375, -26.777183532714844, -22.17765998840332, -17.578134536743164, -12.978609085083008, -8.379085540771484, -3.779560089111328, 0.8199653625488281, 5.419490337371826, 10.019015312194824, 14.618539810180664, 19.21806526184082, 23.817590713500977, 28.4171142578125, 33.016639709472656, 37.61616516113281, 42.21569061279297, 46.815216064453125, 51.41474151611328, 56.01426696777344, 60.613792419433594, 65.21331787109375, 69.81283569335938, 74.41236877441406, 79.01189422607422, 83.61141967773438, 88.21094512939453, 92.81047058105469, 97.40999603271484, 102.009521484375, 106.60903930664062, 111.20857238769531, 115.80809783935547, 120.40762329101562, 125.00714874267578, 129.60667419433594, 134.20619201660156, 138.80572509765625, 143.40524291992188, 148.00477600097656, 152.6042938232422, 157.20382690429688, 161.8033447265625, 166.4028778076172, 171.0023956298828, 175.6019287109375, 180.20144653320312, 184.80096435546875, 189.40048217773438, 194.00001525878906, 198.5995330810547, 203.19906616210938, 207.798583984375, 212.3981170654297, 216.9976348876953, 221.59716796875, 226.19668579101562, 230.7962188720703, 235.39573669433594, 239.99526977539062, 244.59478759765625, 249.19432067871094, 253.79383850097656, 258.39337158203125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 4.0, 6.0, 8.0, 9.0, 18.0, 13.0, 28.0, 29.0, 29.0, 34.0, 44.0, 41.0, 43.0, 62.0, 50.0, 72.0, 69.0, 50.0, 60.0, 61.0, 50.0, 41.0, 45.0, 40.0, 25.0, 23.0, 11.0, 14.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-39.434852600097656, -38.488773345947266, -37.542694091796875, -36.596614837646484, -35.650535583496094, -34.70445251464844, -33.75837326049805, -32.812294006347656, -31.866214752197266, -30.920135498046875, -29.974056243896484, -29.02797508239746, -28.08189582824707, -27.13581657409668, -26.189735412597656, -25.243656158447266, -24.297576904296875, -23.351497650146484, -22.405418395996094, -21.45933723449707, -20.51325798034668, -19.56717872619629, -18.621097564697266, -17.675018310546875, -16.728939056396484, -15.782859802246094, -14.836779594421387, -13.89069938659668, -12.944620132446289, -11.998540878295898, -11.052460670471191, -10.106380462646484, -9.160301208496094, -8.214221954345703, -7.268141746520996, -6.322062015533447, -5.375982284545898, -4.42990255355835, -3.483822822570801, -2.537743091583252, -1.5916633605957031, -0.6455836296081543, 0.30049610137939453, 1.2465758323669434, 2.192655563354492, 3.138735294342041, 4.08481502532959, 5.030894756317139, 5.9769744873046875, 6.923054218292236, 7.869133949279785, 8.815214157104492, 9.761293411254883, 10.707372665405273, 11.65345287322998, 12.599533081054688, 13.545612335205078, 14.491691589355469, 15.437771797180176, 16.383852005004883, 17.329931259155273, 18.276010513305664, 19.222091674804688, 20.168170928955078, 21.11425018310547]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 6.0, 10.0, 4.0, 20.0, 17.0, 37.0, 68.0, 73.0, 118.0, 232.0, 341.0, 609.0, 1150.0, 2401.0, 5689.0, 17304.0, 62855.0, 235696.0, 432023.0, 209877.0, 55151.0, 15130.0, 5082.0, 2128.0, 1103.0, 572.0, 305.0, 192.0, 119.0, 84.0, 55.0, 40.0, 27.0, 15.0, 11.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.990478515625, -15.46533203125, -14.940185546875, -14.4150390625, -13.889892578125, -13.36474609375, -12.839599609375, -12.314453125, -11.789306640625, -11.26416015625, -10.739013671875, -10.2138671875, -9.688720703125, -9.16357421875, -8.638427734375, -8.11328125, -7.588134765625, -7.06298828125, -6.537841796875, -6.0126953125, -5.487548828125, -4.96240234375, -4.437255859375, -3.912109375, -3.386962890625, -2.86181640625, -2.336669921875, -1.8115234375, -1.286376953125, -0.76123046875, -0.236083984375, 0.2890625, 0.814208984375, 1.33935546875, 1.864501953125, 2.3896484375, 2.914794921875, 3.43994140625, 3.965087890625, 4.490234375, 5.015380859375, 5.54052734375, 6.065673828125, 6.5908203125, 7.115966796875, 7.64111328125, 8.166259765625, 8.69140625, 9.216552734375, 9.74169921875, 10.266845703125, 10.7919921875, 11.317138671875, 11.84228515625, 12.367431640625, 12.892578125, 13.417724609375, 13.94287109375, 14.468017578125, 14.9931640625, 15.518310546875, 16.04345703125, 16.568603515625, 17.09375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 8.0, 4.0, 9.0, 8.0, 18.0, 24.0, 41.0, 48.0, 52.0, 69.0, 81.0, 84.0, 90.0, 86.0, 69.0, 74.0, 54.0, 47.0, 40.0, 26.0, 21.0, 21.0, 14.0, 9.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123046875, -3.030670166015625, -2.93829345703125, -2.845916748046875, -2.7535400390625, -2.661163330078125, -2.56878662109375, -2.476409912109375, -2.384033203125, -2.291656494140625, -2.19927978515625, -2.106903076171875, -2.0145263671875, -1.922149658203125, -1.82977294921875, -1.737396240234375, -1.64501953125, -1.552642822265625, -1.46026611328125, -1.367889404296875, -1.2755126953125, -1.183135986328125, -1.09075927734375, -0.998382568359375, -0.906005859375, -0.813629150390625, -0.72125244140625, -0.628875732421875, -0.5364990234375, -0.444122314453125, -0.35174560546875, -0.259368896484375, -0.1669921875, -0.074615478515625, 0.01776123046875, 0.110137939453125, 0.2025146484375, 0.294891357421875, 0.38726806640625, 0.479644775390625, 0.572021484375, 0.664398193359375, 0.75677490234375, 0.849151611328125, 0.9415283203125, 1.033905029296875, 1.12628173828125, 1.218658447265625, 1.31103515625, 1.403411865234375, 1.49578857421875, 1.588165283203125, 1.6805419921875, 1.772918701171875, 1.86529541015625, 1.957672119140625, 2.050048828125, 2.142425537109375, 2.23480224609375, 2.327178955078125, 2.4195556640625, 2.511932373046875, 2.60430908203125, 2.696685791015625, 2.7890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 6.0, 5.0, 13.0, 23.0, 25.0, 33.0, 54.0, 64.0, 89.0, 170.0, 205.0, 373.0, 626.0, 1181.0, 2583.0, 5912.0, 16227.0, 56631.0, 236010.0, 471596.0, 187585.0, 45403.0, 13651.0, 5120.0, 2196.0, 1068.0, 645.0, 375.0, 219.0, 156.0, 103.0, 70.0, 47.0, 24.0, 19.0, 18.0, 9.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-18.96875, -18.4478759765625, -17.927001953125, -17.4061279296875, -16.88525390625, -16.3643798828125, -15.843505859375, -15.3226318359375, -14.8017578125, -14.2808837890625, -13.760009765625, -13.2391357421875, -12.71826171875, -12.1973876953125, -11.676513671875, -11.1556396484375, -10.634765625, -10.1138916015625, -9.593017578125, -9.0721435546875, -8.55126953125, -8.0303955078125, -7.509521484375, -6.9886474609375, -6.4677734375, -5.9468994140625, -5.426025390625, -4.9051513671875, -4.38427734375, -3.8634033203125, -3.342529296875, -2.8216552734375, -2.30078125, -1.7799072265625, -1.259033203125, -0.7381591796875, -0.21728515625, 0.3035888671875, 0.824462890625, 1.3453369140625, 1.8662109375, 2.3870849609375, 2.907958984375, 3.4288330078125, 3.94970703125, 4.4705810546875, 4.991455078125, 5.5123291015625, 6.033203125, 6.5540771484375, 7.074951171875, 7.5958251953125, 8.11669921875, 8.6375732421875, 9.158447265625, 9.6793212890625, 10.2001953125, 10.7210693359375, 11.241943359375, 11.7628173828125, 12.28369140625, 12.8045654296875, 13.325439453125, 13.8463134765625, 14.3671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 2.0, 11.0, 4.0, 2.0, 8.0, 9.0, 14.0, 12.0, 17.0, 15.0, 23.0, 31.0, 42.0, 42.0, 42.0, 59.0, 43.0, 57.0, 62.0, 63.0, 56.0, 46.0, 58.0, 45.0, 35.0, 35.0, 42.0, 27.0, 19.0, 24.0, 7.0, 12.0, 7.0, 12.0, 6.0, 5.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.9609375, -8.57373046875, -8.1865234375, -7.79931640625, -7.412109375, -7.02490234375, -6.6376953125, -6.25048828125, -5.86328125, -5.47607421875, -5.0888671875, -4.70166015625, -4.314453125, -3.92724609375, -3.5400390625, -3.15283203125, -2.765625, -2.37841796875, -1.9912109375, -1.60400390625, -1.216796875, -0.82958984375, -0.4423828125, -0.05517578125, 0.33203125, 0.71923828125, 1.1064453125, 1.49365234375, 1.880859375, 2.26806640625, 2.6552734375, 3.04248046875, 3.4296875, 3.81689453125, 4.2041015625, 4.59130859375, 4.978515625, 5.36572265625, 5.7529296875, 6.14013671875, 6.52734375, 6.91455078125, 7.3017578125, 7.68896484375, 8.076171875, 8.46337890625, 8.8505859375, 9.23779296875, 9.625, 10.01220703125, 10.3994140625, 10.78662109375, 11.173828125, 11.56103515625, 11.9482421875, 12.33544921875, 12.72265625, 13.10986328125, 13.4970703125, 13.88427734375, 14.271484375, 14.65869140625, 15.0458984375, 15.43310546875, 15.8203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 10.0, 16.0, 23.0, 35.0, 79.0, 108.0, 211.0, 427.0, 986.0, 3188.0, 16164.0, 157535.0, 700695.0, 148629.0, 15457.0, 3110.0, 963.0, 415.0, 227.0, 112.0, 62.0, 31.0, 20.0, 17.0, 9.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.4296875, -11.9005126953125, -11.371337890625, -10.8421630859375, -10.31298828125, -9.7838134765625, -9.254638671875, -8.7254638671875, -8.1962890625, -7.6671142578125, -7.137939453125, -6.6087646484375, -6.07958984375, -5.5504150390625, -5.021240234375, -4.4920654296875, -3.962890625, -3.4337158203125, -2.904541015625, -2.3753662109375, -1.84619140625, -1.3170166015625, -0.787841796875, -0.2586669921875, 0.2705078125, 0.7996826171875, 1.328857421875, 1.8580322265625, 2.38720703125, 2.9163818359375, 3.445556640625, 3.9747314453125, 4.50390625, 5.0330810546875, 5.562255859375, 6.0914306640625, 6.62060546875, 7.1497802734375, 7.678955078125, 8.2081298828125, 8.7373046875, 9.2664794921875, 9.795654296875, 10.3248291015625, 10.85400390625, 11.3831787109375, 11.912353515625, 12.4415283203125, 12.970703125, 13.4998779296875, 14.029052734375, 14.5582275390625, 15.08740234375, 15.6165771484375, 16.145751953125, 16.6749267578125, 17.2041015625, 17.7332763671875, 18.262451171875, 18.7916259765625, 19.32080078125, 19.8499755859375, 20.379150390625, 20.9083251953125, 21.4375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 14.0, 4.0, 16.0, 21.0, 37.0, 37.0, 42.0, 53.0, 71.0, 107.0, 98.0, 110.0, 80.0, 78.0, 56.0, 51.0, 29.0, 27.0, 21.0, 15.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001506805419921875, -0.0014635473489761353, -0.0014202892780303955, -0.0013770312070846558, -0.001333773136138916, -0.0012905150651931763, -0.0012472569942474365, -0.0012039989233016968, -0.001160740852355957, -0.0011174827814102173, -0.0010742247104644775, -0.0010309666395187378, -0.000987708568572998, -0.0009444504976272583, -0.0009011924266815186, -0.0008579343557357788, -0.0008146762847900391, -0.0007714182138442993, -0.0007281601428985596, -0.0006849020719528198, -0.0006416440010070801, -0.0005983859300613403, -0.0005551278591156006, -0.0005118697881698608, -0.0004686117172241211, -0.00042535364627838135, -0.0003820955753326416, -0.00033883750438690186, -0.0002955794334411621, -0.00025232136249542236, -0.00020906329154968262, -0.00016580522060394287, -0.00012254714965820312, -7.928907871246338e-05, -3.603100776672363e-05, 7.227063179016113e-06, 5.048513412475586e-05, 9.37432050704956e-05, 0.00013700127601623535, 0.0001802593469619751, 0.00022351741790771484, 0.0002667754888534546, 0.00031003355979919434, 0.0003532916307449341, 0.00039654970169067383, 0.0004398077726364136, 0.0004830658435821533, 0.0005263239145278931, 0.0005695819854736328, 0.0006128400564193726, 0.0006560981273651123, 0.000699356198310852, 0.0007426142692565918, 0.0007858723402023315, 0.0008291304111480713, 0.000872388482093811, 0.0009156465530395508, 0.0009589046239852905, 0.0010021626949310303, 0.00104542076587677, 0.0010886788368225098, 0.0011319369077682495, 0.0011751949787139893, 0.001218453049659729, 0.0012617111206054688]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 9.0, 9.0, 16.0, 30.0, 47.0, 57.0, 103.0, 210.0, 384.0, 741.0, 1682.0, 4455.0, 15109.0, 71849.0, 385379.0, 450422.0, 90649.0, 18357.0, 5182.0, 1934.0, 898.0, 415.0, 251.0, 161.0, 88.0, 43.0, 28.0, 14.0, 6.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8515625, -10.4649658203125, -10.078369140625, -9.6917724609375, -9.30517578125, -8.9185791015625, -8.531982421875, -8.1453857421875, -7.7587890625, -7.3721923828125, -6.985595703125, -6.5989990234375, -6.21240234375, -5.8258056640625, -5.439208984375, -5.0526123046875, -4.666015625, -4.2794189453125, -3.892822265625, -3.5062255859375, -3.11962890625, -2.7330322265625, -2.346435546875, -1.9598388671875, -1.5732421875, -1.1866455078125, -0.800048828125, -0.4134521484375, -0.02685546875, 0.3597412109375, 0.746337890625, 1.1329345703125, 1.51953125, 1.9061279296875, 2.292724609375, 2.6793212890625, 3.06591796875, 3.4525146484375, 3.839111328125, 4.2257080078125, 4.6123046875, 4.9989013671875, 5.385498046875, 5.7720947265625, 6.15869140625, 6.5452880859375, 6.931884765625, 7.3184814453125, 7.705078125, 8.0916748046875, 8.478271484375, 8.8648681640625, 9.25146484375, 9.6380615234375, 10.024658203125, 10.4112548828125, 10.7978515625, 11.1844482421875, 11.571044921875, 11.9576416015625, 12.34423828125, 12.7308349609375, 13.117431640625, 13.5040283203125, 13.890625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 6.0, 5.0, 7.0, 13.0, 11.0, 19.0, 38.0, 40.0, 41.0, 41.0, 64.0, 73.0, 89.0, 85.0, 73.0, 50.0, 64.0, 69.0, 47.0, 44.0, 27.0, 22.0, 17.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.796875, -4.6173095703125, -4.437744140625, -4.2581787109375, -4.07861328125, -3.8990478515625, -3.719482421875, -3.5399169921875, -3.3603515625, -3.1807861328125, -3.001220703125, -2.8216552734375, -2.64208984375, -2.4625244140625, -2.282958984375, -2.1033935546875, -1.923828125, -1.7442626953125, -1.564697265625, -1.3851318359375, -1.20556640625, -1.0260009765625, -0.846435546875, -0.6668701171875, -0.4873046875, -0.3077392578125, -0.128173828125, 0.0513916015625, 0.23095703125, 0.4105224609375, 0.590087890625, 0.7696533203125, 0.94921875, 1.1287841796875, 1.308349609375, 1.4879150390625, 1.66748046875, 1.8470458984375, 2.026611328125, 2.2061767578125, 2.3857421875, 2.5653076171875, 2.744873046875, 2.9244384765625, 3.10400390625, 3.2835693359375, 3.463134765625, 3.6427001953125, 3.822265625, 4.0018310546875, 4.181396484375, 4.3609619140625, 4.54052734375, 4.7200927734375, 4.899658203125, 5.0792236328125, 5.2587890625, 5.4383544921875, 5.617919921875, 5.7974853515625, 5.97705078125, 6.1566162109375, 6.336181640625, 6.5157470703125, 6.6953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 15.0, 22.0, 35.0, 72.0, 109.0, 215.0, 213.0, 134.0, 97.0, 38.0, 14.0, 15.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.81781005859375, -111.219482421875, -106.62115478515625, -102.0228271484375, -97.42449951171875, -92.826171875, -88.22785186767578, -83.62952423095703, -79.03119659423828, -74.43286895751953, -69.83454132080078, -65.23621368408203, -60.63788986206055, -56.0395622253418, -51.44123840332031, -46.84291076660156, -42.24458312988281, -37.64625549316406, -33.04792785644531, -28.449604034423828, -23.851276397705078, -19.252948760986328, -14.654623031616211, -10.056297302246094, -5.457969665527344, -0.8596429824829102, 3.7386837005615234, 8.337010383605957, 12.93533706665039, 17.53366470336914, 22.131990432739258, 26.730316162109375, 31.328643798828125, 35.926971435546875, 40.525299072265625, 45.12362289428711, 49.72195053100586, 54.32027816772461, 58.918601989746094, 63.516929626464844, 68.1152572631836, 72.71358489990234, 77.3119125366211, 81.91024017333984, 86.50856018066406, 91.10688781738281, 95.70521545410156, 100.30354309082031, 104.90187072753906, 109.50019836425781, 114.09852600097656, 118.69685363769531, 123.29518127441406, 127.89350891113281, 132.49183654785156, 137.09014892578125, 141.6884765625, 146.28680419921875, 150.8851318359375, 155.48345947265625, 160.081787109375, 164.68011474609375, 169.2784423828125, 173.87677001953125, 178.47509765625]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 8.0, 10.0, 10.0, 18.0, 12.0, 19.0, 28.0, 26.0, 40.0, 28.0, 51.0, 48.0, 41.0, 55.0, 60.0, 71.0, 58.0, 46.0, 52.0, 49.0, 40.0, 33.0, 28.0, 32.0, 22.0, 25.0, 11.0, 17.0, 12.0, 11.0, 11.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-100.55101013183594, -97.74528503417969, -94.93956756591797, -92.13384246826172, -89.32811737060547, -86.52239990234375, -83.7166748046875, -80.91094970703125, -78.105224609375, -75.29949951171875, -72.49378204345703, -69.68805694580078, -66.88233184814453, -64.07661437988281, -61.27088928222656, -58.46516418457031, -55.659446716308594, -52.85372543334961, -50.04800033569336, -47.242279052734375, -44.436553955078125, -41.63083267211914, -38.825111389160156, -36.019386291503906, -33.21366500854492, -30.407941818237305, -27.602218627929688, -24.796497344970703, -21.990774154663086, -19.18505096435547, -16.379329681396484, -13.573606491088867, -10.767875671386719, -7.96215295791626, -5.156430244445801, -2.3507080078125, 0.4550151824951172, 3.2607383728027344, 6.066459655761719, 8.872182846069336, 11.677906036376953, 14.48362922668457, 17.289352416992188, 20.095073699951172, 22.90079689025879, 25.706520080566406, 28.51224136352539, 31.317964553833008, 34.123687744140625, 36.92940902709961, 39.73513412475586, 42.540855407714844, 45.346580505371094, 48.15230178833008, 50.95802307128906, 53.76374816894531, 56.5694694519043, 59.37519073486328, 62.18091583251953, 64.98663330078125, 67.7923583984375, 70.59808349609375, 73.40380859375, 76.20952606201172, 79.01525115966797]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 10.0, 3.0, 14.0, 9.0, 34.0, 38.0, 78.0, 124.0, 245.0, 473.0, 1177.0, 3952.0, 21130.0, 695403.0, 3434501.0, 29789.0, 5049.0, 1324.0, 493.0, 181.0, 92.0, 61.0, 31.0, 21.0, 17.0, 14.0, 11.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-71.5625, -69.86181640625, -68.1611328125, -66.46044921875, -64.759765625, -63.05908203125, -61.3583984375, -59.65771484375, -57.95703125, -56.25634765625, -54.5556640625, -52.85498046875, -51.154296875, -49.45361328125, -47.7529296875, -46.05224609375, -44.3515625, -42.65087890625, -40.9501953125, -39.24951171875, -37.548828125, -35.84814453125, -34.1474609375, -32.44677734375, -30.74609375, -29.04541015625, -27.3447265625, -25.64404296875, -23.943359375, -22.24267578125, -20.5419921875, -18.84130859375, -17.140625, -15.43994140625, -13.7392578125, -12.03857421875, -10.337890625, -8.63720703125, -6.9365234375, -5.23583984375, -3.53515625, -1.83447265625, -0.1337890625, 1.56689453125, 3.267578125, 4.96826171875, 6.6689453125, 8.36962890625, 10.0703125, 11.77099609375, 13.4716796875, 15.17236328125, 16.873046875, 18.57373046875, 20.2744140625, 21.97509765625, 23.67578125, 25.37646484375, 27.0771484375, 28.77783203125, 30.478515625, 32.17919921875, 33.8798828125, 35.58056640625, 37.28125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 26.0, 23.0, 27.0, 32.0, 46.0, 56.0, 64.0, 76.0, 84.0, 67.0, 71.0, 84.0, 64.0, 64.0, 48.0, 34.0, 22.0, 32.0, 10.0, 17.0, 11.0, 15.0, 6.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.23150634765625, -4.1192626953125, -4.00701904296875, -3.894775390625, -3.78253173828125, -3.6702880859375, -3.55804443359375, -3.44580078125, -3.33355712890625, -3.2213134765625, -3.10906982421875, -2.996826171875, -2.88458251953125, -2.7723388671875, -2.66009521484375, -2.5478515625, -2.43560791015625, -2.3233642578125, -2.21112060546875, -2.098876953125, -1.98663330078125, -1.8743896484375, -1.76214599609375, -1.64990234375, -1.53765869140625, -1.4254150390625, -1.31317138671875, -1.200927734375, -1.08868408203125, -0.9764404296875, -0.86419677734375, -0.751953125, -0.63970947265625, -0.5274658203125, -0.41522216796875, -0.302978515625, -0.19073486328125, -0.0784912109375, 0.03375244140625, 0.14599609375, 0.25823974609375, 0.3704833984375, 0.48272705078125, 0.594970703125, 0.70721435546875, 0.8194580078125, 0.93170166015625, 1.0439453125, 1.15618896484375, 1.2684326171875, 1.38067626953125, 1.492919921875, 1.60516357421875, 1.7174072265625, 1.82965087890625, 1.94189453125, 2.05413818359375, 2.1663818359375, 2.27862548828125, 2.390869140625, 2.50311279296875, 2.6153564453125, 2.72760009765625, 2.83984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 4.0, 9.0, 5.0, 10.0, 18.0, 24.0, 46.0, 93.0, 157.0, 303.0, 432.0, 907.0, 2083.0, 5417.0, 19422.0, 158395.0, 3749263.0, 226805.0, 22070.0, 5281.0, 1860.0, 766.0, 406.0, 210.0, 120.0, 68.0, 40.0, 22.0, 13.0, 8.0, 8.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.8125, -26.87158203125, -25.9306640625, -24.98974609375, -24.048828125, -23.10791015625, -22.1669921875, -21.22607421875, -20.28515625, -19.34423828125, -18.4033203125, -17.46240234375, -16.521484375, -15.58056640625, -14.6396484375, -13.69873046875, -12.7578125, -11.81689453125, -10.8759765625, -9.93505859375, -8.994140625, -8.05322265625, -7.1123046875, -6.17138671875, -5.23046875, -4.28955078125, -3.3486328125, -2.40771484375, -1.466796875, -0.52587890625, 0.4150390625, 1.35595703125, 2.296875, 3.23779296875, 4.1787109375, 5.11962890625, 6.060546875, 7.00146484375, 7.9423828125, 8.88330078125, 9.82421875, 10.76513671875, 11.7060546875, 12.64697265625, 13.587890625, 14.52880859375, 15.4697265625, 16.41064453125, 17.3515625, 18.29248046875, 19.2333984375, 20.17431640625, 21.115234375, 22.05615234375, 22.9970703125, 23.93798828125, 24.87890625, 25.81982421875, 26.7607421875, 27.70166015625, 28.642578125, 29.58349609375, 30.5244140625, 31.46533203125, 32.40625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 6.0, 10.0, 8.0, 10.0, 22.0, 29.0, 57.0, 85.0, 169.0, 383.0, 1552.0, 1041.0, 343.0, 146.0, 71.0, 40.0, 32.0, 22.0, 8.0, 6.0, 5.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.98828125, -7.7655029296875, -7.542724609375, -7.3199462890625, -7.09716796875, -6.8743896484375, -6.651611328125, -6.4288330078125, -6.2060546875, -5.9832763671875, -5.760498046875, -5.5377197265625, -5.31494140625, -5.0921630859375, -4.869384765625, -4.6466064453125, -4.423828125, -4.2010498046875, -3.978271484375, -3.7554931640625, -3.53271484375, -3.3099365234375, -3.087158203125, -2.8643798828125, -2.6416015625, -2.4188232421875, -2.196044921875, -1.9732666015625, -1.75048828125, -1.5277099609375, -1.304931640625, -1.0821533203125, -0.859375, -0.6365966796875, -0.413818359375, -0.1910400390625, 0.03173828125, 0.2545166015625, 0.477294921875, 0.7000732421875, 0.9228515625, 1.1456298828125, 1.368408203125, 1.5911865234375, 1.81396484375, 2.0367431640625, 2.259521484375, 2.4822998046875, 2.705078125, 2.9278564453125, 3.150634765625, 3.3734130859375, 3.59619140625, 3.8189697265625, 4.041748046875, 4.2645263671875, 4.4873046875, 4.7100830078125, 4.932861328125, 5.1556396484375, 5.37841796875, 5.6011962890625, 5.823974609375, 6.0467529296875, 6.26953125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 12.0, 21.0, 62.0, 111.0, 190.0, 224.0, 173.0, 97.0, 50.0, 26.0, 7.0, 8.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.49845504760742, -58.023921966552734, -56.54938888549805, -55.074851989746094, -53.600318908691406, -52.12578582763672, -50.65125274658203, -49.176719665527344, -47.702186584472656, -46.22765350341797, -44.75312042236328, -43.278587341308594, -41.80405044555664, -40.32951736450195, -38.854984283447266, -37.38045120239258, -35.905914306640625, -34.43138122558594, -32.95684814453125, -31.48231315612793, -30.00777816772461, -28.533245086669922, -27.058712005615234, -25.584178924560547, -24.109643936157227, -22.63511085510254, -21.16057586669922, -19.68604278564453, -18.211509704589844, -16.736974716186523, -15.262441635131836, -13.787907600402832, -12.313369750976562, -10.838835716247559, -9.364301681518555, -7.889768600463867, -6.415234565734863, -4.940700531005859, -3.466167449951172, -1.991633415222168, -0.5170993804931641, 0.9574344158172607, 2.4319682121276855, 3.9065017700195312, 5.381035804748535, 6.855569839477539, 8.330102920532227, 9.80463695526123, 11.279170989990234, 12.753705024719238, 14.228239059448242, 15.70277214050293, 17.17730712890625, 18.651840209960938, 20.126373291015625, 21.600906372070312, 23.075441360473633, 24.54997444152832, 26.02450942993164, 27.499042510986328, 28.973575592041016, 30.448110580444336, 31.922643661499023, 33.397178649902344, 34.87171173095703]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 9.0, 9.0, 8.0, 17.0, 20.0, 29.0, 35.0, 30.0, 38.0, 41.0, 46.0, 56.0, 65.0, 50.0, 64.0, 48.0, 58.0, 52.0, 40.0, 46.0, 25.0, 38.0, 32.0, 26.0, 27.0, 16.0, 15.0, 13.0, 12.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.93990707397461, -22.23623275756836, -21.532556533813477, -20.828880310058594, -20.125205993652344, -19.421531677246094, -18.71785545349121, -18.014179229736328, -17.310504913330078, -16.606830596923828, -15.903154373168945, -15.199479103088379, -14.495803833007812, -13.792128562927246, -13.08845329284668, -12.384778022766113, -11.681102752685547, -10.97742748260498, -10.273752212524414, -9.570076942443848, -8.866401672363281, -8.162726402282715, -7.459051132202148, -6.755375862121582, -6.051700592041016, -5.348025321960449, -4.644350051879883, -3.9406747817993164, -3.23699951171875, -2.5333242416381836, -1.8296489715576172, -1.1259737014770508, -0.4222984313964844, 0.28137683868408203, 0.9850521087646484, 1.6887273788452148, 2.3924026489257812, 3.0960779190063477, 3.799753189086914, 4.5034284591674805, 5.207103729248047, 5.910778999328613, 6.61445426940918, 7.318129539489746, 8.021804809570312, 8.725480079650879, 9.429155349731445, 10.132830619812012, 10.836505889892578, 11.540181159973145, 12.243856430053711, 12.947531700134277, 13.651206970214844, 14.35488224029541, 15.058557510375977, 15.762232780456543, 16.46590805053711, 17.16958236694336, 17.873258590698242, 18.576934814453125, 19.280609130859375, 19.984283447265625, 20.687959671020508, 21.39163589477539, 22.09531021118164]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 13.0, 13.0, 8.0, 14.0, 9.0, 21.0, 27.0, 40.0, 43.0, 94.0, 135.0, 165.0, 272.0, 494.0, 855.0, 1562.0, 3263.0, 7454.0, 18776.0, 54919.0, 166831.0, 357299.0, 278119.0, 102376.0, 33179.0, 12224.0, 5026.0, 2366.0, 1194.0, 654.0, 405.0, 214.0, 134.0, 92.0, 62.0, 47.0, 42.0, 33.0, 16.0, 12.0, 7.0, 9.0, 4.0, 9.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-12.5546875, -12.171630859375, -11.78857421875, -11.405517578125, -11.0224609375, -10.639404296875, -10.25634765625, -9.873291015625, -9.490234375, -9.107177734375, -8.72412109375, -8.341064453125, -7.9580078125, -7.574951171875, -7.19189453125, -6.808837890625, -6.42578125, -6.042724609375, -5.65966796875, -5.276611328125, -4.8935546875, -4.510498046875, -4.12744140625, -3.744384765625, -3.361328125, -2.978271484375, -2.59521484375, -2.212158203125, -1.8291015625, -1.446044921875, -1.06298828125, -0.679931640625, -0.296875, 0.086181640625, 0.46923828125, 0.852294921875, 1.2353515625, 1.618408203125, 2.00146484375, 2.384521484375, 2.767578125, 3.150634765625, 3.53369140625, 3.916748046875, 4.2998046875, 4.682861328125, 5.06591796875, 5.448974609375, 5.83203125, 6.215087890625, 6.59814453125, 6.981201171875, 7.3642578125, 7.747314453125, 8.13037109375, 8.513427734375, 8.896484375, 9.279541015625, 9.66259765625, 10.045654296875, 10.4287109375, 10.811767578125, 11.19482421875, 11.577880859375, 11.9609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 13.0, 23.0, 41.0, 43.0, 53.0, 61.0, 75.0, 80.0, 91.0, 80.0, 71.0, 80.0, 60.0, 51.0, 35.0, 29.0, 21.0, 28.0, 12.0, 11.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15234375, -4.0372314453125, -3.922119140625, -3.8070068359375, -3.69189453125, -3.5767822265625, -3.461669921875, -3.3465576171875, -3.2314453125, -3.1163330078125, -3.001220703125, -2.8861083984375, -2.77099609375, -2.6558837890625, -2.540771484375, -2.4256591796875, -2.310546875, -2.1954345703125, -2.080322265625, -1.9652099609375, -1.85009765625, -1.7349853515625, -1.619873046875, -1.5047607421875, -1.3896484375, -1.2745361328125, -1.159423828125, -1.0443115234375, -0.92919921875, -0.8140869140625, -0.698974609375, -0.5838623046875, -0.46875, -0.3536376953125, -0.238525390625, -0.1234130859375, -0.00830078125, 0.1068115234375, 0.221923828125, 0.3370361328125, 0.4521484375, 0.5672607421875, 0.682373046875, 0.7974853515625, 0.91259765625, 1.0277099609375, 1.142822265625, 1.2579345703125, 1.373046875, 1.4881591796875, 1.603271484375, 1.7183837890625, 1.83349609375, 1.9486083984375, 2.063720703125, 2.1788330078125, 2.2939453125, 2.4090576171875, 2.524169921875, 2.6392822265625, 2.75439453125, 2.8695068359375, 2.984619140625, 3.0997314453125, 3.21484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 9.0, 9.0, 19.0, 23.0, 29.0, 60.0, 70.0, 71.0, 89.0, 144.0, 236.0, 328.0, 542.0, 901.0, 1575.0, 2985.0, 6524.0, 15845.0, 39846.0, 107347.0, 255755.0, 326182.0, 176843.0, 67237.0, 25493.0, 10420.0, 4595.0, 2222.0, 1136.0, 657.0, 429.0, 265.0, 162.0, 135.0, 97.0, 63.0, 58.0, 47.0, 33.0, 24.0, 13.0, 11.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.9296875, -10.6107177734375, -10.291748046875, -9.9727783203125, -9.65380859375, -9.3348388671875, -9.015869140625, -8.6968994140625, -8.3779296875, -8.0589599609375, -7.739990234375, -7.4210205078125, -7.10205078125, -6.7830810546875, -6.464111328125, -6.1451416015625, -5.826171875, -5.5072021484375, -5.188232421875, -4.8692626953125, -4.55029296875, -4.2313232421875, -3.912353515625, -3.5933837890625, -3.2744140625, -2.9554443359375, -2.636474609375, -2.3175048828125, -1.99853515625, -1.6795654296875, -1.360595703125, -1.0416259765625, -0.72265625, -0.4036865234375, -0.084716796875, 0.2342529296875, 0.55322265625, 0.8721923828125, 1.191162109375, 1.5101318359375, 1.8291015625, 2.1480712890625, 2.467041015625, 2.7860107421875, 3.10498046875, 3.4239501953125, 3.742919921875, 4.0618896484375, 4.380859375, 4.6998291015625, 5.018798828125, 5.3377685546875, 5.65673828125, 5.9757080078125, 6.294677734375, 6.6136474609375, 6.9326171875, 7.2515869140625, 7.570556640625, 7.8895263671875, 8.20849609375, 8.5274658203125, 8.846435546875, 9.1654052734375, 9.484375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 7.0, 12.0, 9.0, 7.0, 8.0, 17.0, 12.0, 21.0, 24.0, 35.0, 24.0, 33.0, 40.0, 49.0, 38.0, 45.0, 49.0, 44.0, 41.0, 53.0, 31.0, 57.0, 44.0, 32.0, 27.0, 29.0, 34.0, 21.0, 18.0, 24.0, 16.0, 12.0, 14.0, 14.0, 13.0, 11.0, 4.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.5338134765625, -9.184814453125, -8.8358154296875, -8.48681640625, -8.1378173828125, -7.788818359375, -7.4398193359375, -7.0908203125, -6.7418212890625, -6.392822265625, -6.0438232421875, -5.69482421875, -5.3458251953125, -4.996826171875, -4.6478271484375, -4.298828125, -3.9498291015625, -3.600830078125, -3.2518310546875, -2.90283203125, -2.5538330078125, -2.204833984375, -1.8558349609375, -1.5068359375, -1.1578369140625, -0.808837890625, -0.4598388671875, -0.11083984375, 0.2381591796875, 0.587158203125, 0.9361572265625, 1.28515625, 1.6341552734375, 1.983154296875, 2.3321533203125, 2.68115234375, 3.0301513671875, 3.379150390625, 3.7281494140625, 4.0771484375, 4.4261474609375, 4.775146484375, 5.1241455078125, 5.47314453125, 5.8221435546875, 6.171142578125, 6.5201416015625, 6.869140625, 7.2181396484375, 7.567138671875, 7.9161376953125, 8.26513671875, 8.6141357421875, 8.963134765625, 9.3121337890625, 9.6611328125, 10.0101318359375, 10.359130859375, 10.7081298828125, 11.05712890625, 11.4061279296875, 11.755126953125, 12.1041259765625, 12.453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 23.0, 42.0, 55.0, 95.0, 187.0, 592.0, 2072.0, 14850.0, 248945.0, 715982.0, 58519.0, 5410.0, 1130.0, 360.0, 125.0, 64.0, 32.0, 25.0, 11.0, 12.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.09375, -14.677490234375, -14.26123046875, -13.844970703125, -13.4287109375, -13.012451171875, -12.59619140625, -12.179931640625, -11.763671875, -11.347412109375, -10.93115234375, -10.514892578125, -10.0986328125, -9.682373046875, -9.26611328125, -8.849853515625, -8.43359375, -8.017333984375, -7.60107421875, -7.184814453125, -6.7685546875, -6.352294921875, -5.93603515625, -5.519775390625, -5.103515625, -4.687255859375, -4.27099609375, -3.854736328125, -3.4384765625, -3.022216796875, -2.60595703125, -2.189697265625, -1.7734375, -1.357177734375, -0.94091796875, -0.524658203125, -0.1083984375, 0.307861328125, 0.72412109375, 1.140380859375, 1.556640625, 1.972900390625, 2.38916015625, 2.805419921875, 3.2216796875, 3.637939453125, 4.05419921875, 4.470458984375, 4.88671875, 5.302978515625, 5.71923828125, 6.135498046875, 6.5517578125, 6.968017578125, 7.38427734375, 7.800537109375, 8.216796875, 8.633056640625, 9.04931640625, 9.465576171875, 9.8818359375, 10.298095703125, 10.71435546875, 11.130615234375, 11.546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 6.0, 13.0, 16.0, 5.0, 15.0, 11.0, 25.0, 30.0, 46.0, 51.0, 62.0, 80.0, 89.0, 104.0, 87.0, 70.0, 65.0, 47.0, 44.0, 36.0, 20.0, 23.0, 17.0, 10.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007205009460449219, -0.0006960928440093994, -0.000671684741973877, -0.0006472766399383545, -0.000622868537902832, -0.0005984604358673096, -0.0005740523338317871, -0.0005496442317962646, -0.0005252361297607422, -0.0005008280277252197, -0.00047641992568969727, -0.0004520118236541748, -0.00042760372161865234, -0.0004031956195831299, -0.0003787875175476074, -0.00035437941551208496, -0.0003299713134765625, -0.00030556321144104004, -0.0002811551094055176, -0.0002567470073699951, -0.00023233890533447266, -0.0002079308032989502, -0.00018352270126342773, -0.00015911459922790527, -0.0001347064971923828, -0.00011029839515686035, -8.589029312133789e-05, -6.148219108581543e-05, -3.707408905029297e-05, -1.2665987014770508e-05, 1.1742115020751953e-05, 3.6150217056274414e-05, 6.0558319091796875e-05, 8.496642112731934e-05, 0.0001093745231628418, 0.00013378262519836426, 0.00015819072723388672, 0.00018259882926940918, 0.00020700693130493164, 0.0002314150333404541, 0.00025582313537597656, 0.000280231237411499, 0.0003046393394470215, 0.00032904744148254395, 0.0003534555435180664, 0.00037786364555358887, 0.00040227174758911133, 0.0004266798496246338, 0.00045108795166015625, 0.0004754960536956787, 0.0004999041557312012, 0.0005243122577667236, 0.0005487203598022461, 0.0005731284618377686, 0.000597536563873291, 0.0006219446659088135, 0.0006463527679443359, 0.0006707608699798584, 0.0006951689720153809, 0.0007195770740509033, 0.0007439851760864258, 0.0007683932781219482, 0.0007928013801574707, 0.0008172094821929932, 0.0008416175842285156]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 17.0, 22.0, 36.0, 55.0, 80.0, 149.0, 329.0, 669.0, 1889.0, 6523.0, 35431.0, 338078.0, 577703.0, 72201.0, 10894.0, 2716.0, 893.0, 418.0, 163.0, 114.0, 52.0, 44.0, 24.0, 15.0, 17.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.193359375, -9.85546875, -9.517578125, -9.1796875, -8.841796875, -8.50390625, -8.166015625, -7.828125, -7.490234375, -7.15234375, -6.814453125, -6.4765625, -6.138671875, -5.80078125, -5.462890625, -5.125, -4.787109375, -4.44921875, -4.111328125, -3.7734375, -3.435546875, -3.09765625, -2.759765625, -2.421875, -2.083984375, -1.74609375, -1.408203125, -1.0703125, -0.732421875, -0.39453125, -0.056640625, 0.28125, 0.619140625, 0.95703125, 1.294921875, 1.6328125, 1.970703125, 2.30859375, 2.646484375, 2.984375, 3.322265625, 3.66015625, 3.998046875, 4.3359375, 4.673828125, 5.01171875, 5.349609375, 5.6875, 6.025390625, 6.36328125, 6.701171875, 7.0390625, 7.376953125, 7.71484375, 8.052734375, 8.390625, 8.728515625, 9.06640625, 9.404296875, 9.7421875, 10.080078125, 10.41796875, 10.755859375, 11.09375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 4.0, 6.0, 9.0, 13.0, 17.0, 30.0, 46.0, 74.0, 120.0, 133.0, 150.0, 137.0, 90.0, 68.0, 37.0, 34.0, 16.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.765625, -6.44921875, -6.1328125, -5.81640625, -5.5, -5.18359375, -4.8671875, -4.55078125, -4.234375, -3.91796875, -3.6015625, -3.28515625, -2.96875, -2.65234375, -2.3359375, -2.01953125, -1.703125, -1.38671875, -1.0703125, -0.75390625, -0.4375, -0.12109375, 0.1953125, 0.51171875, 0.828125, 1.14453125, 1.4609375, 1.77734375, 2.09375, 2.41015625, 2.7265625, 3.04296875, 3.359375, 3.67578125, 3.9921875, 4.30859375, 4.625, 4.94140625, 5.2578125, 5.57421875, 5.890625, 6.20703125, 6.5234375, 6.83984375, 7.15625, 7.47265625, 7.7890625, 8.10546875, 8.421875, 8.73828125, 9.0546875, 9.37109375, 9.6875, 10.00390625, 10.3203125, 10.63671875, 10.953125, 11.26953125, 11.5859375, 11.90234375, 12.21875, 12.53515625, 12.8515625, 13.16796875, 13.484375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 8.0, 24.0, 45.0, 83.0, 157.0, 219.0, 214.0, 138.0, 62.0, 26.0, 12.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-200.93515014648438, -196.45555114746094, -191.9759521484375, -187.49635314941406, -183.01675415039062, -178.5371551513672, -174.05755615234375, -169.57797241210938, -165.09835815429688, -160.61875915527344, -156.13916015625, -151.65956115722656, -147.17996215820312, -142.7003631591797, -138.22076416015625, -133.74118041992188, -129.26158142089844, -124.781982421875, -120.30238342285156, -115.82278442382812, -111.34318542480469, -106.86358642578125, -102.38399505615234, -97.9043960571289, -93.42479705810547, -88.94519805908203, -84.4655990600586, -79.98600006103516, -75.50640869140625, -71.02680969238281, -66.54721069335938, -62.06761169433594, -57.58802795410156, -53.108428955078125, -48.62882995605469, -44.149234771728516, -39.66963577270508, -35.19003677368164, -30.710439682006836, -26.23084259033203, -21.751243591308594, -17.271644592285156, -12.792047500610352, -8.31244945526123, -3.8328514099121094, 0.6467475891113281, 5.126344680786133, 9.605941772460938, 14.085540771484375, 18.565139770507812, 23.044736862182617, 27.524333953857422, 32.00393295288086, 36.4835319519043, 40.96312713623047, 45.442726135253906, 49.922325134277344, 54.40192413330078, 58.88152313232422, 63.36111831665039, 67.84071350097656, 72.3203125, 76.79991149902344, 81.27951049804688, 85.75910949707031]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 0.0, 4.0, 2.0, 7.0, 7.0, 8.0, 6.0, 22.0, 20.0, 10.0, 20.0, 30.0, 39.0, 43.0, 44.0, 35.0, 37.0, 50.0, 44.0, 61.0, 45.0, 51.0, 44.0, 37.0, 51.0, 46.0, 39.0, 35.0, 29.0, 20.0, 23.0, 21.0, 20.0, 14.0, 18.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.02713775634766, -65.70094299316406, -63.37474060058594, -61.04854202270508, -58.72234344482422, -56.39614486694336, -54.0699462890625, -51.74374771118164, -49.41754913330078, -47.09135055541992, -44.76515197753906, -42.4389533996582, -40.112754821777344, -37.786556243896484, -35.460357666015625, -33.134159088134766, -30.807960510253906, -28.481761932373047, -26.155563354492188, -23.829364776611328, -21.50316619873047, -19.17696762084961, -16.85076904296875, -14.52457046508789, -12.198371887207031, -9.872173309326172, -7.5459747314453125, -5.219776153564453, -2.8935775756835938, -0.5673789978027344, 1.758819580078125, 4.085018157958984, 6.411224365234375, 8.737422943115234, 11.063621520996094, 13.389820098876953, 15.716018676757812, 18.042217254638672, 20.36841583251953, 22.69461441040039, 25.02081298828125, 27.34701156616211, 29.67321014404297, 31.999408721923828, 34.32560729980469, 36.65180587768555, 38.978004455566406, 41.304203033447266, 43.630401611328125, 45.956600189208984, 48.282798767089844, 50.6089973449707, 52.93519592285156, 55.26139450073242, 57.58759307861328, 59.91379165649414, 62.239990234375, 64.56619262695312, 66.89238739013672, 69.21858215332031, 71.54478454589844, 73.87098693847656, 76.19718170166016, 78.52337646484375, 80.84957885742188]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 4.0, 1.0, 8.0, 10.0, 6.0, 22.0, 27.0, 33.0, 50.0, 48.0, 62.0, 100.0, 134.0, 221.0, 382.0, 674.0, 1329.0, 2845.0, 7238.0, 23367.0, 159111.0, 3735837.0, 220640.0, 27730.0, 8293.0, 3131.0, 1416.0, 676.0, 382.0, 200.0, 115.0, 65.0, 44.0, 30.0, 10.0, 11.0, 13.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.390625, -20.805419921875, -20.22021484375, -19.635009765625, -19.0498046875, -18.464599609375, -17.87939453125, -17.294189453125, -16.708984375, -16.123779296875, -15.53857421875, -14.953369140625, -14.3681640625, -13.782958984375, -13.19775390625, -12.612548828125, -12.02734375, -11.442138671875, -10.85693359375, -10.271728515625, -9.6865234375, -9.101318359375, -8.51611328125, -7.930908203125, -7.345703125, -6.760498046875, -6.17529296875, -5.590087890625, -5.0048828125, -4.419677734375, -3.83447265625, -3.249267578125, -2.6640625, -2.078857421875, -1.49365234375, -0.908447265625, -0.3232421875, 0.261962890625, 0.84716796875, 1.432373046875, 2.017578125, 2.602783203125, 3.18798828125, 3.773193359375, 4.3583984375, 4.943603515625, 5.52880859375, 6.114013671875, 6.69921875, 7.284423828125, 7.86962890625, 8.454833984375, 9.0400390625, 9.625244140625, 10.21044921875, 10.795654296875, 11.380859375, 11.966064453125, 12.55126953125, 13.136474609375, 13.7216796875, 14.306884765625, 14.89208984375, 15.477294921875, 16.0625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 15.0, 11.0, 29.0, 37.0, 56.0, 60.0, 95.0, 78.0, 88.0, 89.0, 84.0, 66.0, 78.0, 63.0, 47.0, 34.0, 23.0, 15.0, 16.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.69525146484375, -4.5584716796875, -4.42169189453125, -4.284912109375, -4.14813232421875, -4.0113525390625, -3.87457275390625, -3.73779296875, -3.60101318359375, -3.4642333984375, -3.32745361328125, -3.190673828125, -3.05389404296875, -2.9171142578125, -2.78033447265625, -2.6435546875, -2.50677490234375, -2.3699951171875, -2.23321533203125, -2.096435546875, -1.95965576171875, -1.8228759765625, -1.68609619140625, -1.54931640625, -1.41253662109375, -1.2757568359375, -1.13897705078125, -1.002197265625, -0.86541748046875, -0.7286376953125, -0.59185791015625, -0.455078125, -0.31829833984375, -0.1815185546875, -0.04473876953125, 0.092041015625, 0.22882080078125, 0.3656005859375, 0.50238037109375, 0.63916015625, 0.77593994140625, 0.9127197265625, 1.04949951171875, 1.186279296875, 1.32305908203125, 1.4598388671875, 1.59661865234375, 1.7333984375, 1.87017822265625, 2.0069580078125, 2.14373779296875, 2.280517578125, 2.41729736328125, 2.5540771484375, 2.69085693359375, 2.82763671875, 2.96441650390625, 3.1011962890625, 3.23797607421875, 3.374755859375, 3.51153564453125, 3.6483154296875, 3.78509521484375, 3.921875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 10.0, 14.0, 12.0, 21.0, 51.0, 91.0, 135.0, 228.0, 455.0, 967.0, 3053.0, 16683.0, 384327.0, 3724232.0, 54677.0, 6224.0, 1601.0, 682.0, 357.0, 214.0, 103.0, 61.0, 37.0, 26.0, 13.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-37.5625, -36.713623046875, -35.86474609375, -35.015869140625, -34.1669921875, -33.318115234375, -32.46923828125, -31.620361328125, -30.771484375, -29.922607421875, -29.07373046875, -28.224853515625, -27.3759765625, -26.527099609375, -25.67822265625, -24.829345703125, -23.98046875, -23.131591796875, -22.28271484375, -21.433837890625, -20.5849609375, -19.736083984375, -18.88720703125, -18.038330078125, -17.189453125, -16.340576171875, -15.49169921875, -14.642822265625, -13.7939453125, -12.945068359375, -12.09619140625, -11.247314453125, -10.3984375, -9.549560546875, -8.70068359375, -7.851806640625, -7.0029296875, -6.154052734375, -5.30517578125, -4.456298828125, -3.607421875, -2.758544921875, -1.90966796875, -1.060791015625, -0.2119140625, 0.636962890625, 1.48583984375, 2.334716796875, 3.18359375, 4.032470703125, 4.88134765625, 5.730224609375, 6.5791015625, 7.427978515625, 8.27685546875, 9.125732421875, 9.974609375, 10.823486328125, 11.67236328125, 12.521240234375, 13.3701171875, 14.218994140625, 15.06787109375, 15.916748046875, 16.765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 7.0, 7.0, 11.0, 11.0, 18.0, 45.0, 99.0, 178.0, 425.0, 1593.0, 1121.0, 315.0, 136.0, 54.0, 21.0, 13.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-7.984375, -7.7841796875, -7.583984375, -7.3837890625, -7.18359375, -6.9833984375, -6.783203125, -6.5830078125, -6.3828125, -6.1826171875, -5.982421875, -5.7822265625, -5.58203125, -5.3818359375, -5.181640625, -4.9814453125, -4.78125, -4.5810546875, -4.380859375, -4.1806640625, -3.98046875, -3.7802734375, -3.580078125, -3.3798828125, -3.1796875, -2.9794921875, -2.779296875, -2.5791015625, -2.37890625, -2.1787109375, -1.978515625, -1.7783203125, -1.578125, -1.3779296875, -1.177734375, -0.9775390625, -0.77734375, -0.5771484375, -0.376953125, -0.1767578125, 0.0234375, 0.2236328125, 0.423828125, 0.6240234375, 0.82421875, 1.0244140625, 1.224609375, 1.4248046875, 1.625, 1.8251953125, 2.025390625, 2.2255859375, 2.42578125, 2.6259765625, 2.826171875, 3.0263671875, 3.2265625, 3.4267578125, 3.626953125, 3.8271484375, 4.02734375, 4.2275390625, 4.427734375, 4.6279296875, 4.828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 12.0, 7.0, 27.0, 42.0, 74.0, 95.0, 164.0, 197.0, 147.0, 107.0, 53.0, 35.0, 14.0, 10.0, 10.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.935333251953125, -36.9786262512207, -36.02191925048828, -35.06521224975586, -34.10850524902344, -33.151798248291016, -32.195091247558594, -31.238384246826172, -30.28167724609375, -29.324970245361328, -28.368263244628906, -27.411556243896484, -26.454849243164062, -25.49814224243164, -24.54143524169922, -23.584728240966797, -22.628021240234375, -21.671314239501953, -20.71460723876953, -19.75790023803711, -18.801193237304688, -17.844486236572266, -16.887779235839844, -15.931072235107422, -14.974365234375, -14.017658233642578, -13.060951232910156, -12.104244232177734, -11.147537231445312, -10.19083023071289, -9.234123229980469, -8.277416229248047, -7.320711135864258, -6.364004135131836, -5.407297134399414, -4.450590133666992, -3.4938831329345703, -2.5371761322021484, -1.5804691314697266, -0.6237621307373047, 0.3329448699951172, 1.289651870727539, 2.246358871459961, 3.203065872192383, 4.159772872924805, 5.116479873657227, 6.073186874389648, 7.02989387512207, 7.986600875854492, 8.943307876586914, 9.900014877319336, 10.856721878051758, 11.81342887878418, 12.770135879516602, 13.726842880249023, 14.683549880981445, 15.640256881713867, 16.59696388244629, 17.55367088317871, 18.510377883911133, 19.467084884643555, 20.423791885375977, 21.3804988861084, 22.33720588684082, 23.293912887573242]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 17.0, 20.0, 36.0, 48.0, 51.0, 70.0, 79.0, 88.0, 103.0, 99.0, 104.0, 74.0, 55.0, 49.0, 31.0, 23.0, 20.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.465911865234375, -33.55241012573242, -32.6389045715332, -31.725400924682617, -30.81189727783203, -29.898393630981445, -28.98488998413086, -28.071388244628906, -27.157882690429688, -26.2443790435791, -25.330875396728516, -24.41737174987793, -23.503868103027344, -22.590364456176758, -21.676860809326172, -20.76335906982422, -19.849855422973633, -18.936351776123047, -18.02284812927246, -17.109344482421875, -16.19584083557129, -15.282337188720703, -14.368834495544434, -13.455330848693848, -12.541827201843262, -11.628323554992676, -10.71481990814209, -9.80131721496582, -8.887813568115234, -7.97430944442749, -7.0608062744140625, -6.147302627563477, -5.233800888061523, -4.3202972412109375, -3.4067938327789307, -2.493290424346924, -1.579786777496338, -0.666283130645752, 0.24722003936767578, 1.1607236862182617, 2.0742273330688477, 2.9877309799194336, 3.9012343883514404, 4.814737796783447, 5.728241443634033, 6.641745090484619, 7.555248260498047, 8.468751907348633, 9.382255554199219, 10.295759201049805, 11.20926284790039, 12.122766494750977, 13.036270141601562, 13.949773788452148, 14.863276481628418, 15.776780128479004, 16.690284729003906, 17.603788375854492, 18.517292022705078, 19.430795669555664, 20.34429931640625, 21.257802963256836, 22.171306610107422, 23.084808349609375, 23.99831199645996]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 7.0, 10.0, 8.0, 5.0, 21.0, 17.0, 29.0, 45.0, 52.0, 86.0, 104.0, 181.0, 256.0, 380.0, 672.0, 1229.0, 2574.0, 6527.0, 20084.0, 74180.0, 259430.0, 415838.0, 191361.0, 51225.0, 14371.0, 4977.0, 2199.0, 1059.0, 593.0, 325.0, 221.0, 121.0, 99.0, 59.0, 43.0, 35.0, 30.0, 25.0, 13.0, 25.0, 9.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-13.671875, -13.2359619140625, -12.800048828125, -12.3641357421875, -11.92822265625, -11.4923095703125, -11.056396484375, -10.6204833984375, -10.1845703125, -9.7486572265625, -9.312744140625, -8.8768310546875, -8.44091796875, -8.0050048828125, -7.569091796875, -7.1331787109375, -6.697265625, -6.2613525390625, -5.825439453125, -5.3895263671875, -4.95361328125, -4.5177001953125, -4.081787109375, -3.6458740234375, -3.2099609375, -2.7740478515625, -2.338134765625, -1.9022216796875, -1.46630859375, -1.0303955078125, -0.594482421875, -0.1585693359375, 0.27734375, 0.7132568359375, 1.149169921875, 1.5850830078125, 2.02099609375, 2.4569091796875, 2.892822265625, 3.3287353515625, 3.7646484375, 4.2005615234375, 4.636474609375, 5.0723876953125, 5.50830078125, 5.9442138671875, 6.380126953125, 6.8160400390625, 7.251953125, 7.6878662109375, 8.123779296875, 8.5596923828125, 8.99560546875, 9.4315185546875, 9.867431640625, 10.3033447265625, 10.7392578125, 11.1751708984375, 11.611083984375, 12.0469970703125, 12.48291015625, 12.9188232421875, 13.354736328125, 13.7906494140625, 14.2265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 10.0, 15.0, 18.0, 49.0, 57.0, 62.0, 97.0, 80.0, 80.0, 100.0, 84.0, 92.0, 70.0, 55.0, 50.0, 27.0, 20.0, 15.0, 8.0, 8.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.375, -5.2305908203125, -5.086181640625, -4.9417724609375, -4.79736328125, -4.6529541015625, -4.508544921875, -4.3641357421875, -4.2197265625, -4.0753173828125, -3.930908203125, -3.7864990234375, -3.64208984375, -3.4976806640625, -3.353271484375, -3.2088623046875, -3.064453125, -2.9200439453125, -2.775634765625, -2.6312255859375, -2.48681640625, -2.3424072265625, -2.197998046875, -2.0535888671875, -1.9091796875, -1.7647705078125, -1.620361328125, -1.4759521484375, -1.33154296875, -1.1871337890625, -1.042724609375, -0.8983154296875, -0.75390625, -0.6094970703125, -0.465087890625, -0.3206787109375, -0.17626953125, -0.0318603515625, 0.112548828125, 0.2569580078125, 0.4013671875, 0.5457763671875, 0.690185546875, 0.8345947265625, 0.97900390625, 1.1234130859375, 1.267822265625, 1.4122314453125, 1.556640625, 1.7010498046875, 1.845458984375, 1.9898681640625, 2.13427734375, 2.2786865234375, 2.423095703125, 2.5675048828125, 2.7119140625, 2.8563232421875, 3.000732421875, 3.1451416015625, 3.28955078125, 3.4339599609375, 3.578369140625, 3.7227783203125, 3.8671875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 9.0, 10.0, 13.0, 30.0, 31.0, 46.0, 72.0, 99.0, 164.0, 227.0, 340.0, 516.0, 893.0, 1791.0, 3646.0, 8764.0, 24606.0, 76150.0, 225990.0, 373168.0, 218748.0, 73034.0, 23986.0, 8691.0, 3584.0, 1628.0, 938.0, 477.0, 292.0, 186.0, 132.0, 98.0, 60.0, 38.0, 23.0, 24.0, 17.0, 10.0, 9.0, 1.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4921875, -10.158935546875, -9.82568359375, -9.492431640625, -9.1591796875, -8.825927734375, -8.49267578125, -8.159423828125, -7.826171875, -7.492919921875, -7.15966796875, -6.826416015625, -6.4931640625, -6.159912109375, -5.82666015625, -5.493408203125, -5.16015625, -4.826904296875, -4.49365234375, -4.160400390625, -3.8271484375, -3.493896484375, -3.16064453125, -2.827392578125, -2.494140625, -2.160888671875, -1.82763671875, -1.494384765625, -1.1611328125, -0.827880859375, -0.49462890625, -0.161376953125, 0.171875, 0.505126953125, 0.83837890625, 1.171630859375, 1.5048828125, 1.838134765625, 2.17138671875, 2.504638671875, 2.837890625, 3.171142578125, 3.50439453125, 3.837646484375, 4.1708984375, 4.504150390625, 4.83740234375, 5.170654296875, 5.50390625, 5.837158203125, 6.17041015625, 6.503662109375, 6.8369140625, 7.170166015625, 7.50341796875, 7.836669921875, 8.169921875, 8.503173828125, 8.83642578125, 9.169677734375, 9.5029296875, 9.836181640625, 10.16943359375, 10.502685546875, 10.8359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 8.0, 7.0, 6.0, 16.0, 14.0, 21.0, 13.0, 20.0, 31.0, 24.0, 42.0, 45.0, 36.0, 46.0, 35.0, 42.0, 45.0, 44.0, 45.0, 54.0, 41.0, 37.0, 41.0, 43.0, 32.0, 31.0, 26.0, 27.0, 14.0, 19.0, 14.0, 16.0, 7.0, 14.0, 8.0, 3.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.03759765625, -9.7001953125, -9.36279296875, -9.025390625, -8.68798828125, -8.3505859375, -8.01318359375, -7.67578125, -7.33837890625, -7.0009765625, -6.66357421875, -6.326171875, -5.98876953125, -5.6513671875, -5.31396484375, -4.9765625, -4.63916015625, -4.3017578125, -3.96435546875, -3.626953125, -3.28955078125, -2.9521484375, -2.61474609375, -2.27734375, -1.93994140625, -1.6025390625, -1.26513671875, -0.927734375, -0.59033203125, -0.2529296875, 0.08447265625, 0.421875, 0.75927734375, 1.0966796875, 1.43408203125, 1.771484375, 2.10888671875, 2.4462890625, 2.78369140625, 3.12109375, 3.45849609375, 3.7958984375, 4.13330078125, 4.470703125, 4.80810546875, 5.1455078125, 5.48291015625, 5.8203125, 6.15771484375, 6.4951171875, 6.83251953125, 7.169921875, 7.50732421875, 7.8447265625, 8.18212890625, 8.51953125, 8.85693359375, 9.1943359375, 9.53173828125, 9.869140625, 10.20654296875, 10.5439453125, 10.88134765625, 11.21875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 21.0, 29.0, 66.0, 118.0, 251.0, 506.0, 1319.0, 3644.0, 13915.0, 80910.0, 472257.0, 396831.0, 62274.0, 11369.0, 3032.0, 1109.0, 448.0, 211.0, 93.0, 53.0, 35.0, 13.0, 14.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.671875, -7.43890380859375, -7.2059326171875, -6.97296142578125, -6.739990234375, -6.50701904296875, -6.2740478515625, -6.04107666015625, -5.80810546875, -5.57513427734375, -5.3421630859375, -5.10919189453125, -4.876220703125, -4.64324951171875, -4.4102783203125, -4.17730712890625, -3.9443359375, -3.71136474609375, -3.4783935546875, -3.24542236328125, -3.012451171875, -2.77947998046875, -2.5465087890625, -2.31353759765625, -2.08056640625, -1.84759521484375, -1.6146240234375, -1.38165283203125, -1.148681640625, -0.91571044921875, -0.6827392578125, -0.44976806640625, -0.216796875, 0.01617431640625, 0.2491455078125, 0.48211669921875, 0.715087890625, 0.94805908203125, 1.1810302734375, 1.41400146484375, 1.64697265625, 1.87994384765625, 2.1129150390625, 2.34588623046875, 2.578857421875, 2.81182861328125, 3.0447998046875, 3.27777099609375, 3.5107421875, 3.74371337890625, 3.9766845703125, 4.20965576171875, 4.442626953125, 4.67559814453125, 4.9085693359375, 5.14154052734375, 5.37451171875, 5.60748291015625, 5.8404541015625, 6.07342529296875, 6.306396484375, 6.53936767578125, 6.7723388671875, 7.00531005859375, 7.23828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 12.0, 11.0, 12.0, 11.0, 17.0, 21.0, 11.0, 28.0, 20.0, 43.0, 41.0, 50.0, 63.0, 54.0, 72.0, 85.0, 62.0, 75.0, 56.0, 49.0, 36.0, 24.0, 22.0, 28.0, 17.0, 16.0, 14.0, 12.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0007157325744628906, -0.0006958842277526855, -0.0006760358810424805, -0.0006561875343322754, -0.0006363391876220703, -0.0006164908409118652, -0.0005966424942016602, -0.0005767941474914551, -0.00055694580078125, -0.0005370974540710449, -0.0005172491073608398, -0.0004974007606506348, -0.0004775524139404297, -0.0004577040672302246, -0.00043785572052001953, -0.00041800737380981445, -0.0003981590270996094, -0.0003783106803894043, -0.0003584623336791992, -0.00033861398696899414, -0.00031876564025878906, -0.000298917293548584, -0.0002790689468383789, -0.00025922060012817383, -0.00023937225341796875, -0.00021952390670776367, -0.0001996755599975586, -0.00017982721328735352, -0.00015997886657714844, -0.00014013051986694336, -0.00012028217315673828, -0.0001004338264465332, -8.058547973632812e-05, -6.073713302612305e-05, -4.088878631591797e-05, -2.104043960571289e-05, -1.1920928955078125e-06, 1.8656253814697266e-05, 3.8504600524902344e-05, 5.835294723510742e-05, 7.82012939453125e-05, 9.804964065551758e-05, 0.00011789798736572266, 0.00013774633407592773, 0.0001575946807861328, 0.0001774430274963379, 0.00019729137420654297, 0.00021713972091674805, 0.00023698806762695312, 0.0002568364143371582, 0.0002766847610473633, 0.00029653310775756836, 0.00031638145446777344, 0.0003362298011779785, 0.0003560781478881836, 0.00037592649459838867, 0.00039577484130859375, 0.00041562318801879883, 0.0004354715347290039, 0.000455319881439209, 0.00047516822814941406, 0.0004950165748596191, 0.0005148649215698242, 0.0005347132682800293, 0.0005545616149902344]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 4.0, 6.0, 9.0, 18.0, 19.0, 36.0, 37.0, 65.0, 74.0, 131.0, 187.0, 341.0, 602.0, 1104.0, 2258.0, 5233.0, 14524.0, 47749.0, 172436.0, 439400.0, 258729.0, 71450.0, 20800.0, 7248.0, 2915.0, 1370.0, 672.0, 467.0, 253.0, 135.0, 88.0, 54.0, 59.0, 26.0, 17.0, 10.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.09765625, -4.94158935546875, -4.7855224609375, -4.62945556640625, -4.473388671875, -4.31732177734375, -4.1612548828125, -4.00518798828125, -3.84912109375, -3.69305419921875, -3.5369873046875, -3.38092041015625, -3.224853515625, -3.06878662109375, -2.9127197265625, -2.75665283203125, -2.6005859375, -2.44451904296875, -2.2884521484375, -2.13238525390625, -1.976318359375, -1.82025146484375, -1.6641845703125, -1.50811767578125, -1.35205078125, -1.19598388671875, -1.0399169921875, -0.88385009765625, -0.727783203125, -0.57171630859375, -0.4156494140625, -0.25958251953125, -0.103515625, 0.05255126953125, 0.2086181640625, 0.36468505859375, 0.520751953125, 0.67681884765625, 0.8328857421875, 0.98895263671875, 1.14501953125, 1.30108642578125, 1.4571533203125, 1.61322021484375, 1.769287109375, 1.92535400390625, 2.0814208984375, 2.23748779296875, 2.3935546875, 2.54962158203125, 2.7056884765625, 2.86175537109375, 3.017822265625, 3.17388916015625, 3.3299560546875, 3.48602294921875, 3.64208984375, 3.79815673828125, 3.9542236328125, 4.11029052734375, 4.266357421875, 4.42242431640625, 4.5784912109375, 4.73455810546875, 4.890625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 7.0, 12.0, 13.0, 18.0, 15.0, 33.0, 35.0, 27.0, 48.0, 52.0, 56.0, 73.0, 86.0, 77.0, 74.0, 72.0, 61.0, 38.0, 38.0, 41.0, 35.0, 22.0, 17.0, 12.0, 19.0, 7.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.483306884765625, -4.34942626953125, -4.215545654296875, -4.0816650390625, -3.947784423828125, -3.81390380859375, -3.680023193359375, -3.546142578125, -3.412261962890625, -3.27838134765625, -3.144500732421875, -3.0106201171875, -2.876739501953125, -2.74285888671875, -2.608978271484375, -2.47509765625, -2.341217041015625, -2.20733642578125, -2.073455810546875, -1.9395751953125, -1.805694580078125, -1.67181396484375, -1.537933349609375, -1.404052734375, -1.270172119140625, -1.13629150390625, -1.002410888671875, -0.8685302734375, -0.734649658203125, -0.60076904296875, -0.466888427734375, -0.3330078125, -0.199127197265625, -0.06524658203125, 0.068634033203125, 0.2025146484375, 0.336395263671875, 0.47027587890625, 0.604156494140625, 0.738037109375, 0.871917724609375, 1.00579833984375, 1.139678955078125, 1.2735595703125, 1.407440185546875, 1.54132080078125, 1.675201416015625, 1.80908203125, 1.942962646484375, 2.07684326171875, 2.210723876953125, 2.3446044921875, 2.478485107421875, 2.61236572265625, 2.746246337890625, 2.880126953125, 3.014007568359375, 3.14788818359375, 3.281768798828125, 3.4156494140625, 3.549530029296875, 3.68341064453125, 3.817291259765625, 3.951171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 6.0, 15.0, 15.0, 31.0, 36.0, 99.0, 124.0, 138.0, 143.0, 134.0, 97.0, 68.0, 36.0, 28.0, 5.0, 6.0, 7.0, 6.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-116.56721496582031, -113.68026733398438, -110.79332733154297, -107.90637969970703, -105.01943969726562, -102.13249206542969, -99.24554443359375, -96.35859680175781, -93.4716567993164, -90.58470916748047, -87.69776916503906, -84.81082153320312, -81.92387390136719, -79.03693389892578, -76.14998626708984, -73.26304626464844, -70.3760986328125, -67.48915100097656, -64.60221099853516, -61.71526336669922, -58.82831954956055, -55.941375732421875, -53.05442810058594, -50.167484283447266, -47.280540466308594, -44.39359664916992, -41.50665283203125, -38.61970520019531, -35.73276138305664, -32.84581756591797, -29.958871841430664, -27.07192611694336, -24.184982299804688, -21.298038482666016, -18.41109275817871, -15.524147987365723, -12.637203216552734, -9.750258445739746, -6.863313674926758, -3.976367950439453, -1.0894241333007812, 1.797520637512207, 4.684465408325195, 7.571410179138184, 10.458354949951172, 13.34529972076416, 16.23224449157715, 19.119190216064453, 22.006134033203125, 24.893077850341797, 27.7800235748291, 30.666969299316406, 33.55391311645508, 36.44085693359375, 39.32780456542969, 42.21474838256836, 45.10169219970703, 47.9886360168457, 50.875579833984375, 53.76252746582031, 56.649471282958984, 59.536415100097656, 62.423362731933594, 65.310302734375, 68.19725036621094]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 1.0, 4.0, 8.0, 5.0, 7.0, 9.0, 17.0, 21.0, 21.0, 25.0, 27.0, 36.0, 41.0, 70.0, 47.0, 52.0, 54.0, 54.0, 55.0, 42.0, 44.0, 52.0, 38.0, 42.0, 40.0, 21.0, 24.0, 31.0, 21.0, 19.0, 14.0, 11.0, 13.0, 7.0, 7.0, 3.0, 6.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.50252914428711, -61.2485237121582, -58.9945182800293, -56.74051284790039, -54.486507415771484, -52.23250198364258, -49.978492736816406, -47.7244873046875, -45.470481872558594, -43.21647644042969, -40.96247100830078, -38.708465576171875, -36.45446014404297, -34.20045471191406, -31.946447372436523, -29.692441940307617, -27.438438415527344, -25.184432983398438, -22.93042755126953, -20.676422119140625, -18.42241668701172, -16.168411254882812, -13.914403915405273, -11.660398483276367, -9.406393051147461, -7.152387619018555, -4.89838171005249, -2.644375801086426, -0.39037036895751953, 1.8636350631713867, 4.117641448974609, 6.371646881103516, 8.625648498535156, 10.879653930664062, 13.133659362792969, 15.387665748596191, 17.64167022705078, 19.895675659179688, 22.149682998657227, 24.403688430786133, 26.65769386291504, 28.911699295043945, 31.16570472717285, 33.41971206665039, 35.6737174987793, 37.9277229309082, 40.18172836303711, 42.435733795166016, 44.68973922729492, 46.94374465942383, 49.197750091552734, 51.45175552368164, 53.70576095581055, 55.95976638793945, 58.213775634765625, 60.46778106689453, 62.72178649902344, 64.97579193115234, 67.22979736328125, 69.48380279541016, 71.73780822753906, 73.99181365966797, 76.24581909179688, 78.49982452392578, 80.75382995605469]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 8.0, 4.0, 5.0, 5.0, 11.0, 11.0, 21.0, 35.0, 39.0, 61.0, 85.0, 127.0, 204.0, 321.0, 570.0, 1051.0, 2436.0, 6404.0, 22228.0, 142615.0, 3618634.0, 347891.0, 36411.0, 9063.0, 3150.0, 1421.0, 658.0, 361.0, 182.0, 87.0, 73.0, 35.0, 34.0, 8.0, 12.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-27.59375, -26.9312744140625, -26.268798828125, -25.6063232421875, -24.94384765625, -24.2813720703125, -23.618896484375, -22.9564208984375, -22.2939453125, -21.6314697265625, -20.968994140625, -20.3065185546875, -19.64404296875, -18.9815673828125, -18.319091796875, -17.6566162109375, -16.994140625, -16.3316650390625, -15.669189453125, -15.0067138671875, -14.34423828125, -13.6817626953125, -13.019287109375, -12.3568115234375, -11.6943359375, -11.0318603515625, -10.369384765625, -9.7069091796875, -9.04443359375, -8.3819580078125, -7.719482421875, -7.0570068359375, -6.39453125, -5.7320556640625, -5.069580078125, -4.4071044921875, -3.74462890625, -3.0821533203125, -2.419677734375, -1.7572021484375, -1.0947265625, -0.4322509765625, 0.230224609375, 0.8927001953125, 1.55517578125, 2.2176513671875, 2.880126953125, 3.5426025390625, 4.205078125, 4.8675537109375, 5.530029296875, 6.1925048828125, 6.85498046875, 7.5174560546875, 8.179931640625, 8.8424072265625, 9.5048828125, 10.1673583984375, 10.829833984375, 11.4923095703125, 12.15478515625, 12.8172607421875, 13.479736328125, 14.1422119140625, 14.8046875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 12.0, 19.0, 22.0, 37.0, 46.0, 39.0, 56.0, 71.0, 51.0, 87.0, 81.0, 82.0, 73.0, 58.0, 46.0, 57.0, 32.0, 30.0, 31.0, 21.0, 15.0, 10.0, 5.0, 5.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.6328125, -4.5130615234375, -4.393310546875, -4.2735595703125, -4.15380859375, -4.0340576171875, -3.914306640625, -3.7945556640625, -3.6748046875, -3.5550537109375, -3.435302734375, -3.3155517578125, -3.19580078125, -3.0760498046875, -2.956298828125, -2.8365478515625, -2.716796875, -2.5970458984375, -2.477294921875, -2.3575439453125, -2.23779296875, -2.1180419921875, -1.998291015625, -1.8785400390625, -1.7587890625, -1.6390380859375, -1.519287109375, -1.3995361328125, -1.27978515625, -1.1600341796875, -1.040283203125, -0.9205322265625, -0.80078125, -0.6810302734375, -0.561279296875, -0.4415283203125, -0.32177734375, -0.2020263671875, -0.082275390625, 0.0374755859375, 0.1572265625, 0.2769775390625, 0.396728515625, 0.5164794921875, 0.63623046875, 0.7559814453125, 0.875732421875, 0.9954833984375, 1.115234375, 1.2349853515625, 1.354736328125, 1.4744873046875, 1.59423828125, 1.7139892578125, 1.833740234375, 1.9534912109375, 2.0732421875, 2.1929931640625, 2.312744140625, 2.4324951171875, 2.55224609375, 2.6719970703125, 2.791748046875, 2.9114990234375, 3.03125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 9.0, 13.0, 32.0, 41.0, 62.0, 94.0, 175.0, 264.0, 526.0, 1052.0, 2262.0, 6671.0, 33916.0, 1330080.0, 2762985.0, 43675.0, 7611.0, 2554.0, 1033.0, 496.0, 293.0, 155.0, 106.0, 62.0, 34.0, 29.0, 15.0, 12.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.640625, -30.83056640625, -30.0205078125, -29.21044921875, -28.400390625, -27.59033203125, -26.7802734375, -25.97021484375, -25.16015625, -24.35009765625, -23.5400390625, -22.72998046875, -21.919921875, -21.10986328125, -20.2998046875, -19.48974609375, -18.6796875, -17.86962890625, -17.0595703125, -16.24951171875, -15.439453125, -14.62939453125, -13.8193359375, -13.00927734375, -12.19921875, -11.38916015625, -10.5791015625, -9.76904296875, -8.958984375, -8.14892578125, -7.3388671875, -6.52880859375, -5.71875, -4.90869140625, -4.0986328125, -3.28857421875, -2.478515625, -1.66845703125, -0.8583984375, -0.04833984375, 0.76171875, 1.57177734375, 2.3818359375, 3.19189453125, 4.001953125, 4.81201171875, 5.6220703125, 6.43212890625, 7.2421875, 8.05224609375, 8.8623046875, 9.67236328125, 10.482421875, 11.29248046875, 12.1025390625, 12.91259765625, 13.72265625, 14.53271484375, 15.3427734375, 16.15283203125, 16.962890625, 17.77294921875, 18.5830078125, 19.39306640625, 20.203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 9.0, 9.0, 24.0, 48.0, 81.0, 163.0, 407.0, 1549.0, 1162.0, 332.0, 150.0, 54.0, 18.0, 19.0, 13.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1171875, -10.807373046875, -10.49755859375, -10.187744140625, -9.8779296875, -9.568115234375, -9.25830078125, -8.948486328125, -8.638671875, -8.328857421875, -8.01904296875, -7.709228515625, -7.3994140625, -7.089599609375, -6.77978515625, -6.469970703125, -6.16015625, -5.850341796875, -5.54052734375, -5.230712890625, -4.9208984375, -4.611083984375, -4.30126953125, -3.991455078125, -3.681640625, -3.371826171875, -3.06201171875, -2.752197265625, -2.4423828125, -2.132568359375, -1.82275390625, -1.512939453125, -1.203125, -0.893310546875, -0.58349609375, -0.273681640625, 0.0361328125, 0.345947265625, 0.65576171875, 0.965576171875, 1.275390625, 1.585205078125, 1.89501953125, 2.204833984375, 2.5146484375, 2.824462890625, 3.13427734375, 3.444091796875, 3.75390625, 4.063720703125, 4.37353515625, 4.683349609375, 4.9931640625, 5.302978515625, 5.61279296875, 5.922607421875, 6.232421875, 6.542236328125, 6.85205078125, 7.161865234375, 7.4716796875, 7.781494140625, 8.09130859375, 8.401123046875, 8.7109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 7.0, 7.0, 7.0, 20.0, 31.0, 60.0, 111.0, 160.0, 178.0, 169.0, 111.0, 63.0, 29.0, 16.0, 13.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.343994140625, -50.74131393432617, -49.138633728027344, -47.535953521728516, -45.93327331542969, -44.330589294433594, -42.72791290283203, -41.12522888183594, -39.52254867553711, -37.91986846923828, -36.31718826293945, -34.714508056640625, -33.1118278503418, -31.509145736694336, -29.906465530395508, -28.303783416748047, -26.70110511779785, -25.098424911499023, -23.495744705200195, -21.893062591552734, -20.290382385253906, -18.687702178955078, -17.08502197265625, -15.482340812683105, -13.879660606384277, -12.27698040008545, -10.674299240112305, -9.071619033813477, -7.46893835067749, -5.866257667541504, -4.263577461242676, -2.6608963012695312, -1.0582160949707031, 0.5444644689559937, 2.1471450328826904, 3.7498254776000977, 5.352506160736084, 6.95518684387207, 8.557867050170898, 10.160548210144043, 11.763228416442871, 13.3659086227417, 14.968589782714844, 16.571269989013672, 18.1739501953125, 19.776630401611328, 21.379310607910156, 22.981992721557617, 24.584672927856445, 26.187353134155273, 27.7900333404541, 29.392715454101562, 30.99539566040039, 32.59807586669922, 34.20075607299805, 35.803436279296875, 37.4061164855957, 39.00879669189453, 40.61147689819336, 42.21415710449219, 43.816837310791016, 45.419517517089844, 47.02220153808594, 48.624881744384766, 50.227561950683594]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 22.0, 21.0, 25.0, 36.0, 38.0, 58.0, 69.0, 69.0, 82.0, 76.0, 83.0, 71.0, 75.0, 58.0, 46.0, 41.0, 27.0, 28.0, 17.0, 13.0, 14.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.47153854370117, -36.41571807861328, -35.359893798828125, -34.304073333740234, -33.248252868652344, -32.19242858886719, -31.136608123779297, -30.080785751342773, -29.02496337890625, -27.969141006469727, -26.913318634033203, -25.857498168945312, -24.80167579650879, -23.745853424072266, -22.690032958984375, -21.63421058654785, -20.578388214111328, -19.522565841674805, -18.46674346923828, -17.41092300415039, -16.355100631713867, -15.299278259277344, -14.243456840515137, -13.18763542175293, -12.131813049316406, -11.075990676879883, -10.020169258117676, -8.964347839355469, -7.908525466918945, -6.85270357131958, -5.796881675720215, -4.74105978012085, -3.68524169921875, -2.6294198036193848, -1.5735979080200195, -0.5177760124206543, 0.5380458831787109, 1.5938677787780762, 2.6496896743774414, 3.7055115699768066, 4.761333465576172, 5.817155361175537, 6.872977256774902, 7.928799152374268, 8.984621047973633, 10.040443420410156, 11.096264839172363, 12.15208625793457, 13.207908630371094, 14.263731002807617, 15.319552421569824, 16.37537384033203, 17.431196212768555, 18.487018585205078, 19.54283905029297, 20.598661422729492, 21.654483795166016, 22.71030616760254, 23.766128540039062, 24.821949005126953, 25.877771377563477, 26.93359375, 27.98941421508789, 29.045236587524414, 30.101058959960938]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 13.0, 13.0, 18.0, 35.0, 60.0, 94.0, 139.0, 270.0, 484.0, 934.0, 2057.0, 5877.0, 23537.0, 157048.0, 604695.0, 211342.0, 30552.0, 6822.0, 2302.0, 991.0, 539.0, 289.0, 157.0, 101.0, 59.0, 33.0, 34.0, 10.0, 9.0, 11.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0], "bins": [-28.53125, -27.810302734375, -27.08935546875, -26.368408203125, -25.6474609375, -24.926513671875, -24.20556640625, -23.484619140625, -22.763671875, -22.042724609375, -21.32177734375, -20.600830078125, -19.8798828125, -19.158935546875, -18.43798828125, -17.717041015625, -16.99609375, -16.275146484375, -15.55419921875, -14.833251953125, -14.1123046875, -13.391357421875, -12.67041015625, -11.949462890625, -11.228515625, -10.507568359375, -9.78662109375, -9.065673828125, -8.3447265625, -7.623779296875, -6.90283203125, -6.181884765625, -5.4609375, -4.739990234375, -4.01904296875, -3.298095703125, -2.5771484375, -1.856201171875, -1.13525390625, -0.414306640625, 0.306640625, 1.027587890625, 1.74853515625, 2.469482421875, 3.1904296875, 3.911376953125, 4.63232421875, 5.353271484375, 6.07421875, 6.795166015625, 7.51611328125, 8.237060546875, 8.9580078125, 9.678955078125, 10.39990234375, 11.120849609375, 11.841796875, 12.562744140625, 13.28369140625, 14.004638671875, 14.7255859375, 15.446533203125, 16.16748046875, 16.888427734375, 17.609375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 10.0, 18.0, 41.0, 51.0, 56.0, 60.0, 88.0, 95.0, 112.0, 90.0, 84.0, 72.0, 53.0, 45.0, 46.0, 23.0, 15.0, 11.0, 7.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.71875, -5.567108154296875, -5.41546630859375, -5.263824462890625, -5.1121826171875, -4.960540771484375, -4.80889892578125, -4.657257080078125, -4.505615234375, -4.353973388671875, -4.20233154296875, -4.050689697265625, -3.8990478515625, -3.747406005859375, -3.59576416015625, -3.444122314453125, -3.29248046875, -3.140838623046875, -2.98919677734375, -2.837554931640625, -2.6859130859375, -2.534271240234375, -2.38262939453125, -2.230987548828125, -2.079345703125, -1.927703857421875, -1.77606201171875, -1.624420166015625, -1.4727783203125, -1.321136474609375, -1.16949462890625, -1.017852783203125, -0.8662109375, -0.714569091796875, -0.56292724609375, -0.411285400390625, -0.2596435546875, -0.108001708984375, 0.04364013671875, 0.195281982421875, 0.346923828125, 0.498565673828125, 0.65020751953125, 0.801849365234375, 0.9534912109375, 1.105133056640625, 1.25677490234375, 1.408416748046875, 1.56005859375, 1.711700439453125, 1.86334228515625, 2.014984130859375, 2.1666259765625, 2.318267822265625, 2.46990966796875, 2.621551513671875, 2.773193359375, 2.924835205078125, 3.07647705078125, 3.228118896484375, 3.3797607421875, 3.531402587890625, 3.68304443359375, 3.834686279296875, 3.986328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 1.0, 6.0, 5.0, 8.0, 9.0, 20.0, 30.0, 27.0, 43.0, 81.0, 88.0, 188.0, 251.0, 393.0, 586.0, 1170.0, 2069.0, 4308.0, 9216.0, 21779.0, 54928.0, 137983.0, 283557.0, 288974.0, 144021.0, 57180.0, 22576.0, 9619.0, 4315.0, 2124.0, 1164.0, 648.0, 400.0, 251.0, 179.0, 94.0, 74.0, 60.0, 34.0, 27.0, 17.0, 13.0, 3.0, 5.0, 7.0, 7.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-8.6875, -8.4244384765625, -8.161376953125, -7.8983154296875, -7.63525390625, -7.3721923828125, -7.109130859375, -6.8460693359375, -6.5830078125, -6.3199462890625, -6.056884765625, -5.7938232421875, -5.53076171875, -5.2677001953125, -5.004638671875, -4.7415771484375, -4.478515625, -4.2154541015625, -3.952392578125, -3.6893310546875, -3.42626953125, -3.1632080078125, -2.900146484375, -2.6370849609375, -2.3740234375, -2.1109619140625, -1.847900390625, -1.5848388671875, -1.32177734375, -1.0587158203125, -0.795654296875, -0.5325927734375, -0.26953125, -0.0064697265625, 0.256591796875, 0.5196533203125, 0.78271484375, 1.0457763671875, 1.308837890625, 1.5718994140625, 1.8349609375, 2.0980224609375, 2.361083984375, 2.6241455078125, 2.88720703125, 3.1502685546875, 3.413330078125, 3.6763916015625, 3.939453125, 4.2025146484375, 4.465576171875, 4.7286376953125, 4.99169921875, 5.2547607421875, 5.517822265625, 5.7808837890625, 6.0439453125, 6.3070068359375, 6.570068359375, 6.8331298828125, 7.09619140625, 7.3592529296875, 7.622314453125, 7.8853759765625, 8.1484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 6.0, 9.0, 12.0, 13.0, 16.0, 18.0, 18.0, 26.0, 41.0, 36.0, 24.0, 36.0, 49.0, 44.0, 58.0, 49.0, 47.0, 49.0, 56.0, 42.0, 52.0, 40.0, 34.0, 35.0, 35.0, 36.0, 24.0, 22.0, 6.0, 18.0, 11.0, 13.0, 6.0, 3.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4140625, -12.06298828125, -11.7119140625, -11.36083984375, -11.009765625, -10.65869140625, -10.3076171875, -9.95654296875, -9.60546875, -9.25439453125, -8.9033203125, -8.55224609375, -8.201171875, -7.85009765625, -7.4990234375, -7.14794921875, -6.796875, -6.44580078125, -6.0947265625, -5.74365234375, -5.392578125, -5.04150390625, -4.6904296875, -4.33935546875, -3.98828125, -3.63720703125, -3.2861328125, -2.93505859375, -2.583984375, -2.23291015625, -1.8818359375, -1.53076171875, -1.1796875, -0.82861328125, -0.4775390625, -0.12646484375, 0.224609375, 0.57568359375, 0.9267578125, 1.27783203125, 1.62890625, 1.97998046875, 2.3310546875, 2.68212890625, 3.033203125, 3.38427734375, 3.7353515625, 4.08642578125, 4.4375, 4.78857421875, 5.1396484375, 5.49072265625, 5.841796875, 6.19287109375, 6.5439453125, 6.89501953125, 7.24609375, 7.59716796875, 7.9482421875, 8.29931640625, 8.650390625, 9.00146484375, 9.3525390625, 9.70361328125, 10.0546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 2.0, 5.0, 11.0, 12.0, 14.0, 24.0, 41.0, 68.0, 112.0, 193.0, 404.0, 838.0, 1875.0, 4346.0, 11966.0, 55523.0, 474684.0, 430006.0, 49753.0, 11226.0, 4044.0, 1769.0, 794.0, 362.0, 182.0, 110.0, 75.0, 38.0, 28.0, 20.0, 15.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.890625, -7.5867919921875, -7.282958984375, -6.9791259765625, -6.67529296875, -6.3714599609375, -6.067626953125, -5.7637939453125, -5.4599609375, -5.1561279296875, -4.852294921875, -4.5484619140625, -4.24462890625, -3.9407958984375, -3.636962890625, -3.3331298828125, -3.029296875, -2.7254638671875, -2.421630859375, -2.1177978515625, -1.81396484375, -1.5101318359375, -1.206298828125, -0.9024658203125, -0.5986328125, -0.2947998046875, 0.009033203125, 0.3128662109375, 0.61669921875, 0.9205322265625, 1.224365234375, 1.5281982421875, 1.83203125, 2.1358642578125, 2.439697265625, 2.7435302734375, 3.04736328125, 3.3511962890625, 3.655029296875, 3.9588623046875, 4.2626953125, 4.5665283203125, 4.870361328125, 5.1741943359375, 5.47802734375, 5.7818603515625, 6.085693359375, 6.3895263671875, 6.693359375, 6.9971923828125, 7.301025390625, 7.6048583984375, 7.90869140625, 8.2125244140625, 8.516357421875, 8.8201904296875, 9.1240234375, 9.4278564453125, 9.731689453125, 10.0355224609375, 10.33935546875, 10.6431884765625, 10.947021484375, 11.2508544921875, 11.5546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 1.0, 4.0, 6.0, 18.0, 12.0, 22.0, 20.0, 38.0, 32.0, 35.0, 58.0, 72.0, 113.0, 105.0, 109.0, 93.0, 46.0, 35.0, 42.0, 35.0, 28.0, 15.0, 13.0, 5.0, 13.0, 5.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0], "bins": [-0.001068115234375, -0.0010423734784126282, -0.0010166317224502563, -0.0009908899664878845, -0.0009651482105255127, -0.0009394064545631409, -0.000913664698600769, -0.0008879229426383972, -0.0008621811866760254, -0.0008364394307136536, -0.0008106976747512817, -0.0007849559187889099, -0.0007592141628265381, -0.0007334724068641663, -0.0007077306509017944, -0.0006819888949394226, -0.0006562471389770508, -0.000630505383014679, -0.0006047636270523071, -0.0005790218710899353, -0.0005532801151275635, -0.0005275383591651917, -0.0005017966032028198, -0.000476054847240448, -0.00045031309127807617, -0.00042457133531570435, -0.0003988295793533325, -0.0003730878233909607, -0.00034734606742858887, -0.00032160431146621704, -0.0002958625555038452, -0.0002701207995414734, -0.00024437904357910156, -0.00021863728761672974, -0.0001928955316543579, -0.00016715377569198608, -0.00014141201972961426, -0.00011567026376724243, -8.99285078048706e-05, -6.418675184249878e-05, -3.844499588012695e-05, -1.2703239917755127e-05, 1.30385160446167e-05, 3.8780272006988525e-05, 6.452202796936035e-05, 9.026378393173218e-05, 0.000116005539894104, 0.00014174729585647583, 0.00016748905181884766, 0.00019323080778121948, 0.0002189725637435913, 0.00024471431970596313, 0.00027045607566833496, 0.0002961978316307068, 0.0003219395875930786, 0.00034768134355545044, 0.00037342309951782227, 0.0003991648554801941, 0.0004249066114425659, 0.00045064836740493774, 0.00047639012336730957, 0.0005021318793296814, 0.0005278736352920532, 0.000553615391254425, 0.0005793571472167969]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 16.0, 21.0, 28.0, 28.0, 62.0, 66.0, 122.0, 191.0, 300.0, 539.0, 1067.0, 2290.0, 5597.0, 17446.0, 96758.0, 669542.0, 213274.0, 27386.0, 7875.0, 2982.0, 1310.0, 665.0, 351.0, 219.0, 134.0, 82.0, 68.0, 35.0, 22.0, 21.0, 17.0, 13.0, 12.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.515625, -11.1927490234375, -10.869873046875, -10.5469970703125, -10.22412109375, -9.9012451171875, -9.578369140625, -9.2554931640625, -8.9326171875, -8.6097412109375, -8.286865234375, -7.9639892578125, -7.64111328125, -7.3182373046875, -6.995361328125, -6.6724853515625, -6.349609375, -6.0267333984375, -5.703857421875, -5.3809814453125, -5.05810546875, -4.7352294921875, -4.412353515625, -4.0894775390625, -3.7666015625, -3.4437255859375, -3.120849609375, -2.7979736328125, -2.47509765625, -2.1522216796875, -1.829345703125, -1.5064697265625, -1.18359375, -0.8607177734375, -0.537841796875, -0.2149658203125, 0.10791015625, 0.4307861328125, 0.753662109375, 1.0765380859375, 1.3994140625, 1.7222900390625, 2.045166015625, 2.3680419921875, 2.69091796875, 3.0137939453125, 3.336669921875, 3.6595458984375, 3.982421875, 4.3052978515625, 4.628173828125, 4.9510498046875, 5.27392578125, 5.5968017578125, 5.919677734375, 6.2425537109375, 6.5654296875, 6.8883056640625, 7.211181640625, 7.5340576171875, 7.85693359375, 8.1798095703125, 8.502685546875, 8.8255615234375, 9.1484375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 1.0, 5.0, 8.0, 11.0, 26.0, 33.0, 64.0, 128.0, 198.0, 206.0, 127.0, 91.0, 36.0, 23.0, 13.0, 12.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.34423828125, -8.9853515625, -8.62646484375, -8.267578125, -7.90869140625, -7.5498046875, -7.19091796875, -6.83203125, -6.47314453125, -6.1142578125, -5.75537109375, -5.396484375, -5.03759765625, -4.6787109375, -4.31982421875, -3.9609375, -3.60205078125, -3.2431640625, -2.88427734375, -2.525390625, -2.16650390625, -1.8076171875, -1.44873046875, -1.08984375, -0.73095703125, -0.3720703125, -0.01318359375, 0.345703125, 0.70458984375, 1.0634765625, 1.42236328125, 1.78125, 2.14013671875, 2.4990234375, 2.85791015625, 3.216796875, 3.57568359375, 3.9345703125, 4.29345703125, 4.65234375, 5.01123046875, 5.3701171875, 5.72900390625, 6.087890625, 6.44677734375, 6.8056640625, 7.16455078125, 7.5234375, 7.88232421875, 8.2412109375, 8.60009765625, 8.958984375, 9.31787109375, 9.6767578125, 10.03564453125, 10.39453125, 10.75341796875, 11.1123046875, 11.47119140625, 11.830078125, 12.18896484375, 12.5478515625, 12.90673828125, 13.265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 12.0, 28.0, 57.0, 60.0, 107.0, 90.0, 146.0, 134.0, 102.0, 95.0, 56.0, 36.0, 17.0, 17.0, 6.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0], "bins": [-117.36639404296875, -114.90416717529297, -112.44194793701172, -109.97972106933594, -107.51750183105469, -105.0552749633789, -102.59304809570312, -100.13082885742188, -97.6686019897461, -95.20637512207031, -92.74415588378906, -90.28192901611328, -87.8197021484375, -85.35748291015625, -82.89525604248047, -80.43302917480469, -77.97080993652344, -75.50858306884766, -73.0463638305664, -70.58413696289062, -68.12191772460938, -65.6596908569336, -63.19746398925781, -60.7352409362793, -58.27301788330078, -55.810794830322266, -53.34857177734375, -50.88634490966797, -48.42412185668945, -45.96189880371094, -43.499671936035156, -41.03744888305664, -38.575225830078125, -36.11300277709961, -33.650779724121094, -31.188552856445312, -28.726329803466797, -26.26410675048828, -23.801881790161133, -21.339656829833984, -18.87743377685547, -16.415210723876953, -13.952985763549805, -11.490761756896973, -9.02853775024414, -6.566313743591309, -4.104089736938477, -1.6418647766113281, 0.8203582763671875, 3.2825822830200195, 5.744806289672852, 8.207030296325684, 10.669254302978516, 13.131478309631348, 15.59370231628418, 18.055927276611328, 20.518150329589844, 22.98037338256836, 25.442598342895508, 27.904823303222656, 30.367046356201172, 32.82926940917969, 35.29149627685547, 37.753719329833984, 40.2159423828125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 9.0, 7.0, 14.0, 15.0, 18.0, 19.0, 27.0, 32.0, 37.0, 34.0, 62.0, 67.0, 64.0, 62.0, 53.0, 72.0, 61.0, 58.0, 55.0, 45.0, 29.0, 36.0, 33.0, 24.0, 18.0, 13.0, 14.0, 12.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-96.25404357910156, -93.81359100341797, -91.37313842773438, -88.93269348144531, -86.49224090576172, -84.05178833007812, -81.61133575439453, -79.17088317871094, -76.73043060302734, -74.28997802734375, -71.84952545166016, -69.40907287597656, -66.9686279296875, -64.5281753540039, -62.08772277832031, -59.64727020263672, -57.20682144165039, -54.7663688659668, -52.32592010498047, -49.885467529296875, -47.44501495361328, -45.00456237792969, -42.56411361694336, -40.123661041259766, -37.68321228027344, -35.242759704589844, -32.802310943603516, -30.361858367919922, -27.921405792236328, -25.480955123901367, -23.040504455566406, -20.600051879882812, -18.159595489501953, -15.719143867492676, -13.278692245483398, -10.838241577148438, -8.39778995513916, -5.957338333129883, -3.516887664794922, -1.0764350891113281, 1.3640155792236328, 3.804466962814331, 6.244918346405029, 8.685369491577148, 11.125821113586426, 13.566272735595703, 16.006723403930664, 18.447175979614258, 20.88762664794922, 23.32807731628418, 25.768529891967773, 28.208980560302734, 30.649433135986328, 33.089881896972656, 35.53033447265625, 37.970787048339844, 40.41123962402344, 42.85169219970703, 45.29214096069336, 47.73259353637695, 50.17304611206055, 52.613494873046875, 55.05394744873047, 57.49440002441406, 59.93484878540039]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 5.0, 6.0, 12.0, 19.0, 17.0, 40.0, 34.0, 41.0, 55.0, 110.0, 145.0, 277.0, 435.0, 913.0, 1804.0, 4134.0, 13398.0, 79463.0, 3786805.0, 271297.0, 24448.0, 6137.0, 2354.0, 1034.0, 552.0, 291.0, 158.0, 111.0, 56.0, 30.0, 23.0, 22.0, 14.0, 11.0, 4.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-25.578125, -24.933837890625, -24.28955078125, -23.645263671875, -23.0009765625, -22.356689453125, -21.71240234375, -21.068115234375, -20.423828125, -19.779541015625, -19.13525390625, -18.490966796875, -17.8466796875, -17.202392578125, -16.55810546875, -15.913818359375, -15.26953125, -14.625244140625, -13.98095703125, -13.336669921875, -12.6923828125, -12.048095703125, -11.40380859375, -10.759521484375, -10.115234375, -9.470947265625, -8.82666015625, -8.182373046875, -7.5380859375, -6.893798828125, -6.24951171875, -5.605224609375, -4.9609375, -4.316650390625, -3.67236328125, -3.028076171875, -2.3837890625, -1.739501953125, -1.09521484375, -0.450927734375, 0.193359375, 0.837646484375, 1.48193359375, 2.126220703125, 2.7705078125, 3.414794921875, 4.05908203125, 4.703369140625, 5.34765625, 5.991943359375, 6.63623046875, 7.280517578125, 7.9248046875, 8.569091796875, 9.21337890625, 9.857666015625, 10.501953125, 11.146240234375, 11.79052734375, 12.434814453125, 13.0791015625, 13.723388671875, 14.36767578125, 15.011962890625, 15.65625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 12.0, 13.0, 33.0, 27.0, 42.0, 53.0, 48.0, 54.0, 72.0, 82.0, 93.0, 80.0, 68.0, 72.0, 71.0, 42.0, 34.0, 26.0, 25.0, 10.0, 11.0, 6.0, 9.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.890625, -4.75653076171875, -4.6224365234375, -4.48834228515625, -4.354248046875, -4.22015380859375, -4.0860595703125, -3.95196533203125, -3.81787109375, -3.68377685546875, -3.5496826171875, -3.41558837890625, -3.281494140625, -3.14739990234375, -3.0133056640625, -2.87921142578125, -2.7451171875, -2.61102294921875, -2.4769287109375, -2.34283447265625, -2.208740234375, -2.07464599609375, -1.9405517578125, -1.80645751953125, -1.67236328125, -1.53826904296875, -1.4041748046875, -1.27008056640625, -1.135986328125, -1.00189208984375, -0.8677978515625, -0.73370361328125, -0.599609375, -0.46551513671875, -0.3314208984375, -0.19732666015625, -0.063232421875, 0.07086181640625, 0.2049560546875, 0.33905029296875, 0.47314453125, 0.60723876953125, 0.7413330078125, 0.87542724609375, 1.009521484375, 1.14361572265625, 1.2777099609375, 1.41180419921875, 1.5458984375, 1.67999267578125, 1.8140869140625, 1.94818115234375, 2.082275390625, 2.21636962890625, 2.3504638671875, 2.48455810546875, 2.61865234375, 2.75274658203125, 2.8868408203125, 3.02093505859375, 3.155029296875, 3.28912353515625, 3.4232177734375, 3.55731201171875, 3.69140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 12.0, 9.0, 9.0, 14.0, 18.0, 24.0, 38.0, 44.0, 54.0, 79.0, 123.0, 334.0, 1257.0, 8887.0, 165660.0, 3941468.0, 69224.0, 5273.0, 964.0, 311.0, 124.0, 84.0, 63.0, 50.0, 35.0, 19.0, 29.0, 20.0, 15.0, 14.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.53125, -23.6669921875, -22.802734375, -21.9384765625, -21.07421875, -20.2099609375, -19.345703125, -18.4814453125, -17.6171875, -16.7529296875, -15.888671875, -15.0244140625, -14.16015625, -13.2958984375, -12.431640625, -11.5673828125, -10.703125, -9.8388671875, -8.974609375, -8.1103515625, -7.24609375, -6.3818359375, -5.517578125, -4.6533203125, -3.7890625, -2.9248046875, -2.060546875, -1.1962890625, -0.33203125, 0.5322265625, 1.396484375, 2.2607421875, 3.125, 3.9892578125, 4.853515625, 5.7177734375, 6.58203125, 7.4462890625, 8.310546875, 9.1748046875, 10.0390625, 10.9033203125, 11.767578125, 12.6318359375, 13.49609375, 14.3603515625, 15.224609375, 16.0888671875, 16.953125, 17.8173828125, 18.681640625, 19.5458984375, 20.41015625, 21.2744140625, 22.138671875, 23.0029296875, 23.8671875, 24.7314453125, 25.595703125, 26.4599609375, 27.32421875, 28.1884765625, 29.052734375, 29.9169921875, 30.78125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 8.0, 20.0, 31.0, 65.0, 193.0, 750.0, 2319.0, 458.0, 142.0, 53.0, 15.0, 9.0, 4.0, 2.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -3.97100830078125, -3.6490478515625, -3.32708740234375, -3.005126953125, -2.68316650390625, -2.3612060546875, -2.03924560546875, -1.71728515625, -1.39532470703125, -1.0733642578125, -0.75140380859375, -0.429443359375, -0.10748291015625, 0.2144775390625, 0.53643798828125, 0.8583984375, 1.18035888671875, 1.5023193359375, 1.82427978515625, 2.146240234375, 2.46820068359375, 2.7901611328125, 3.11212158203125, 3.43408203125, 3.75604248046875, 4.0780029296875, 4.39996337890625, 4.721923828125, 5.04388427734375, 5.3658447265625, 5.68780517578125, 6.009765625, 6.33172607421875, 6.6536865234375, 6.97564697265625, 7.297607421875, 7.61956787109375, 7.9415283203125, 8.26348876953125, 8.58544921875, 8.90740966796875, 9.2293701171875, 9.55133056640625, 9.873291015625, 10.19525146484375, 10.5172119140625, 10.83917236328125, 11.1611328125, 11.48309326171875, 11.8050537109375, 12.12701416015625, 12.448974609375, 12.77093505859375, 13.0928955078125, 13.41485595703125, 13.73681640625, 14.05877685546875, 14.3807373046875, 14.70269775390625, 15.024658203125, 15.34661865234375, 15.6685791015625, 15.99053955078125, 16.3125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 16.0, 16.0, 35.0, 62.0, 103.0, 158.0, 166.0, 146.0, 102.0, 91.0, 42.0, 20.0, 12.0, 14.0, 7.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.249961853027344, -37.10892868041992, -35.967899322509766, -34.826866149902344, -33.68583297729492, -32.5447998046875, -31.403770446777344, -30.262737274169922, -29.121706008911133, -27.980674743652344, -26.839641571044922, -25.698610305786133, -24.557579040527344, -23.416545867919922, -22.275514602661133, -21.134483337402344, -19.993450164794922, -18.852418899536133, -17.71138572692871, -16.570354461669922, -15.429322242736816, -14.288290023803711, -13.147258758544922, -12.006226539611816, -10.865194320678711, -9.724162101745605, -8.5831298828125, -7.442098617553711, -6.3010663986206055, -5.1600341796875, -4.019002437591553, -2.8779706954956055, -1.7369384765625, -0.5959064960479736, 0.5451254844665527, 1.686157464981079, 2.8271894454956055, 3.968221664428711, 5.109253406524658, 6.2502851486206055, 7.391317367553711, 8.532349586486816, 9.673381805419922, 10.814413070678711, 11.955445289611816, 13.096477508544922, 14.237508773803711, 15.378540992736816, 16.519573211669922, 17.66060447692871, 18.801637649536133, 19.942668914794922, 21.083702087402344, 22.224733352661133, 23.365764617919922, 24.506797790527344, 25.647829055786133, 26.788860321044922, 27.929893493652344, 29.070924758911133, 30.211956024169922, 31.352989196777344, 32.494022369384766, 33.63505172729492, 34.776084899902344]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 11.0, 20.0, 17.0, 22.0, 28.0, 38.0, 37.0, 39.0, 59.0, 71.0, 79.0, 67.0, 87.0, 65.0, 67.0, 57.0, 40.0, 48.0, 33.0, 40.0, 18.0, 14.0, 10.0, 8.0, 4.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.549388885498047, -26.734928131103516, -25.920467376708984, -25.106006622314453, -24.291545867919922, -23.47708511352539, -22.662622451782227, -21.848161697387695, -21.033700942993164, -20.219240188598633, -19.4047794342041, -18.59031867980957, -17.775856018066406, -16.961395263671875, -16.146934509277344, -15.332473754882812, -14.518013000488281, -13.70355224609375, -12.889091491699219, -12.074629783630371, -11.26016902923584, -10.445708274841309, -9.631246566772461, -8.81678581237793, -8.002325057983398, -7.187864303588867, -6.373403072357178, -5.558941841125488, -4.744481086730957, -3.930020332336426, -3.1155591011047363, -2.301097869873047, -1.4866371154785156, -0.6721761226654053, 0.14228487014770508, 0.9567458629608154, 1.7712068557739258, 2.585667610168457, 3.4001288414001465, 4.214590072631836, 5.029050827026367, 5.843511581420898, 6.657972812652588, 7.472434043884277, 8.286894798278809, 9.10135555267334, 9.915817260742188, 10.730278015136719, 11.54473876953125, 12.359199523925781, 13.173660278320312, 13.98812198638916, 14.802582740783691, 15.617043495178223, 16.43150520324707, 17.2459659576416, 18.060426712036133, 18.874887466430664, 19.689348220825195, 20.503808975219727, 21.31827163696289, 22.132732391357422, 22.947193145751953, 23.761653900146484, 24.576114654541016]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 6.0, 7.0, 16.0, 23.0, 24.0, 37.0, 51.0, 65.0, 91.0, 130.0, 198.0, 354.0, 563.0, 825.0, 1562.0, 3325.0, 7522.0, 21549.0, 71292.0, 252567.0, 438310.0, 174939.0, 48328.0, 15053.0, 5778.0, 2455.0, 1301.0, 751.0, 479.0, 328.0, 201.0, 125.0, 90.0, 58.0, 46.0, 30.0, 27.0, 11.0, 12.0, 11.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9296875, -15.4215087890625, -14.913330078125, -14.4051513671875, -13.89697265625, -13.3887939453125, -12.880615234375, -12.3724365234375, -11.8642578125, -11.3560791015625, -10.847900390625, -10.3397216796875, -9.83154296875, -9.3233642578125, -8.815185546875, -8.3070068359375, -7.798828125, -7.2906494140625, -6.782470703125, -6.2742919921875, -5.76611328125, -5.2579345703125, -4.749755859375, -4.2415771484375, -3.7333984375, -3.2252197265625, -2.717041015625, -2.2088623046875, -1.70068359375, -1.1925048828125, -0.684326171875, -0.1761474609375, 0.33203125, 0.8402099609375, 1.348388671875, 1.8565673828125, 2.36474609375, 2.8729248046875, 3.381103515625, 3.8892822265625, 4.3974609375, 4.9056396484375, 5.413818359375, 5.9219970703125, 6.43017578125, 6.9383544921875, 7.446533203125, 7.9547119140625, 8.462890625, 8.9710693359375, 9.479248046875, 9.9874267578125, 10.49560546875, 11.0037841796875, 11.511962890625, 12.0201416015625, 12.5283203125, 13.0364990234375, 13.544677734375, 14.0528564453125, 14.56103515625, 15.0692138671875, 15.577392578125, 16.0855712890625, 16.59375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 13.0, 8.0, 9.0, 13.0, 37.0, 44.0, 47.0, 55.0, 56.0, 78.0, 91.0, 92.0, 79.0, 87.0, 65.0, 53.0, 46.0, 31.0, 33.0, 19.0, 16.0, 11.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.984375, -4.844085693359375, -4.70379638671875, -4.563507080078125, -4.4232177734375, -4.282928466796875, -4.14263916015625, -4.002349853515625, -3.862060546875, -3.721771240234375, -3.58148193359375, -3.441192626953125, -3.3009033203125, -3.160614013671875, -3.02032470703125, -2.880035400390625, -2.73974609375, -2.599456787109375, -2.45916748046875, -2.318878173828125, -2.1785888671875, -2.038299560546875, -1.89801025390625, -1.757720947265625, -1.617431640625, -1.477142333984375, -1.33685302734375, -1.196563720703125, -1.0562744140625, -0.915985107421875, -0.77569580078125, -0.635406494140625, -0.4951171875, -0.354827880859375, -0.21453857421875, -0.074249267578125, 0.0660400390625, 0.206329345703125, 0.34661865234375, 0.486907958984375, 0.627197265625, 0.767486572265625, 0.90777587890625, 1.048065185546875, 1.1883544921875, 1.328643798828125, 1.46893310546875, 1.609222412109375, 1.74951171875, 1.889801025390625, 2.03009033203125, 2.170379638671875, 2.3106689453125, 2.450958251953125, 2.59124755859375, 2.731536865234375, 2.871826171875, 3.012115478515625, 3.15240478515625, 3.292694091796875, 3.4329833984375, 3.573272705078125, 3.71356201171875, 3.853851318359375, 3.994140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 9.0, 13.0, 15.0, 11.0, 28.0, 27.0, 46.0, 59.0, 70.0, 94.0, 118.0, 172.0, 236.0, 320.0, 432.0, 632.0, 977.0, 1682.0, 3186.0, 6347.0, 13981.0, 32808.0, 77879.0, 171472.0, 284299.0, 238306.0, 120639.0, 51947.0, 21951.0, 9682.0, 4662.0, 2405.0, 1370.0, 815.0, 522.0, 351.0, 249.0, 187.0, 123.0, 91.0, 76.0, 63.0, 38.0, 45.0, 28.0, 24.0, 15.0, 15.0, 13.0, 9.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.76171875, -7.52484130859375, -7.2879638671875, -7.05108642578125, -6.814208984375, -6.57733154296875, -6.3404541015625, -6.10357666015625, -5.86669921875, -5.62982177734375, -5.3929443359375, -5.15606689453125, -4.919189453125, -4.68231201171875, -4.4454345703125, -4.20855712890625, -3.9716796875, -3.73480224609375, -3.4979248046875, -3.26104736328125, -3.024169921875, -2.78729248046875, -2.5504150390625, -2.31353759765625, -2.07666015625, -1.83978271484375, -1.6029052734375, -1.36602783203125, -1.129150390625, -0.89227294921875, -0.6553955078125, -0.41851806640625, -0.181640625, 0.05523681640625, 0.2921142578125, 0.52899169921875, 0.765869140625, 1.00274658203125, 1.2396240234375, 1.47650146484375, 1.71337890625, 1.95025634765625, 2.1871337890625, 2.42401123046875, 2.660888671875, 2.89776611328125, 3.1346435546875, 3.37152099609375, 3.6083984375, 3.84527587890625, 4.0821533203125, 4.31903076171875, 4.555908203125, 4.79278564453125, 5.0296630859375, 5.26654052734375, 5.50341796875, 5.74029541015625, 5.9771728515625, 6.21405029296875, 6.450927734375, 6.68780517578125, 6.9246826171875, 7.16156005859375, 7.3984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 6.0, 9.0, 8.0, 12.0, 15.0, 13.0, 17.0, 21.0, 25.0, 35.0, 39.0, 33.0, 40.0, 42.0, 52.0, 48.0, 41.0, 34.0, 41.0, 37.0, 49.0, 36.0, 30.0, 43.0, 35.0, 36.0, 36.0, 18.0, 22.0, 19.0, 22.0, 15.0, 14.0, 6.0, 11.0, 6.0, 3.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.300048828125, -8.99072265625, -8.681396484375, -8.3720703125, -8.062744140625, -7.75341796875, -7.444091796875, -7.134765625, -6.825439453125, -6.51611328125, -6.206787109375, -5.8974609375, -5.588134765625, -5.27880859375, -4.969482421875, -4.66015625, -4.350830078125, -4.04150390625, -3.732177734375, -3.4228515625, -3.113525390625, -2.80419921875, -2.494873046875, -2.185546875, -1.876220703125, -1.56689453125, -1.257568359375, -0.9482421875, -0.638916015625, -0.32958984375, -0.020263671875, 0.2890625, 0.598388671875, 0.90771484375, 1.217041015625, 1.5263671875, 1.835693359375, 2.14501953125, 2.454345703125, 2.763671875, 3.072998046875, 3.38232421875, 3.691650390625, 4.0009765625, 4.310302734375, 4.61962890625, 4.928955078125, 5.23828125, 5.547607421875, 5.85693359375, 6.166259765625, 6.4755859375, 6.784912109375, 7.09423828125, 7.403564453125, 7.712890625, 8.022216796875, 8.33154296875, 8.640869140625, 8.9501953125, 9.259521484375, 9.56884765625, 9.878173828125, 10.1875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 14.0, 14.0, 22.0, 51.0, 62.0, 119.0, 189.0, 375.0, 677.0, 1481.0, 3292.0, 7837.0, 23077.0, 103488.0, 562820.0, 277090.0, 45573.0, 13197.0, 4926.0, 2191.0, 938.0, 493.0, 264.0, 133.0, 98.0, 48.0, 21.0, 18.0, 16.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1953125, -6.9158935546875, -6.636474609375, -6.3570556640625, -6.07763671875, -5.7982177734375, -5.518798828125, -5.2393798828125, -4.9599609375, -4.6805419921875, -4.401123046875, -4.1217041015625, -3.84228515625, -3.5628662109375, -3.283447265625, -3.0040283203125, -2.724609375, -2.4451904296875, -2.165771484375, -1.8863525390625, -1.60693359375, -1.3275146484375, -1.048095703125, -0.7686767578125, -0.4892578125, -0.2098388671875, 0.069580078125, 0.3489990234375, 0.62841796875, 0.9078369140625, 1.187255859375, 1.4666748046875, 1.74609375, 2.0255126953125, 2.304931640625, 2.5843505859375, 2.86376953125, 3.1431884765625, 3.422607421875, 3.7020263671875, 3.9814453125, 4.2608642578125, 4.540283203125, 4.8197021484375, 5.09912109375, 5.3785400390625, 5.657958984375, 5.9373779296875, 6.216796875, 6.4962158203125, 6.775634765625, 7.0550537109375, 7.33447265625, 7.6138916015625, 7.893310546875, 8.1727294921875, 8.4521484375, 8.7315673828125, 9.010986328125, 9.2904052734375, 9.56982421875, 9.8492431640625, 10.128662109375, 10.4080810546875, 10.6875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 11.0, 15.0, 14.0, 20.0, 41.0, 47.0, 70.0, 108.0, 149.0, 150.0, 126.0, 78.0, 52.0, 40.0, 19.0, 16.0, 16.0, 9.0, 4.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017404556274414062, -0.0016923248767852783, -0.0016441941261291504, -0.0015960633754730225, -0.0015479326248168945, -0.0014998018741607666, -0.0014516711235046387, -0.0014035403728485107, -0.0013554096221923828, -0.0013072788715362549, -0.001259148120880127, -0.001211017370223999, -0.001162886619567871, -0.0011147558689117432, -0.0010666251182556152, -0.0010184943675994873, -0.0009703636169433594, -0.0009222328662872314, -0.0008741021156311035, -0.0008259713649749756, -0.0007778406143188477, -0.0007297098636627197, -0.0006815791130065918, -0.0006334483623504639, -0.0005853176116943359, -0.000537186861038208, -0.0004890561103820801, -0.00044092535972595215, -0.0003927946090698242, -0.0003446638584136963, -0.00029653310775756836, -0.00024840235710144043, -0.0002002716064453125, -0.00015214085578918457, -0.00010401010513305664, -5.587935447692871e-05, -7.748603820800781e-06, 4.038214683532715e-05, 8.851289749145508e-05, 0.000136643648147583, 0.00018477439880371094, 0.00023290514945983887, 0.0002810359001159668, 0.0003291666507720947, 0.00037729740142822266, 0.0004254281520843506, 0.0004735589027404785, 0.0005216896533966064, 0.0005698204040527344, 0.0006179511547088623, 0.0006660819053649902, 0.0007142126560211182, 0.0007623434066772461, 0.000810474157333374, 0.000858604907989502, 0.0009067356586456299, 0.0009548664093017578, 0.0010029971599578857, 0.0010511279106140137, 0.0010992586612701416, 0.0011473894119262695, 0.0011955201625823975, 0.0012436509132385254, 0.0012917816638946533, 0.0013399124145507812]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 15.0, 25.0, 38.0, 74.0, 139.0, 230.0, 418.0, 908.0, 2265.0, 7718.0, 33817.0, 314179.0, 610826.0, 60367.0, 11673.0, 3355.0, 1289.0, 552.0, 274.0, 140.0, 78.0, 34.0, 34.0, 17.0, 10.0, 16.0, 7.0, 2.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.875, -11.5057373046875, -11.136474609375, -10.7672119140625, -10.39794921875, -10.0286865234375, -9.659423828125, -9.2901611328125, -8.9208984375, -8.5516357421875, -8.182373046875, -7.8131103515625, -7.44384765625, -7.0745849609375, -6.705322265625, -6.3360595703125, -5.966796875, -5.5975341796875, -5.228271484375, -4.8590087890625, -4.48974609375, -4.1204833984375, -3.751220703125, -3.3819580078125, -3.0126953125, -2.6434326171875, -2.274169921875, -1.9049072265625, -1.53564453125, -1.1663818359375, -0.797119140625, -0.4278564453125, -0.05859375, 0.3106689453125, 0.679931640625, 1.0491943359375, 1.41845703125, 1.7877197265625, 2.156982421875, 2.5262451171875, 2.8955078125, 3.2647705078125, 3.634033203125, 4.0032958984375, 4.37255859375, 4.7418212890625, 5.111083984375, 5.4803466796875, 5.849609375, 6.2188720703125, 6.588134765625, 6.9573974609375, 7.32666015625, 7.6959228515625, 8.065185546875, 8.4344482421875, 8.8037109375, 9.1729736328125, 9.542236328125, 9.9114990234375, 10.28076171875, 10.6500244140625, 11.019287109375, 11.3885498046875, 11.7578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 9.0, 13.0, 8.0, 13.0, 18.0, 29.0, 28.0, 48.0, 65.0, 68.0, 68.0, 93.0, 89.0, 90.0, 66.0, 70.0, 48.0, 33.0, 27.0, 22.0, 10.0, 17.0, 11.0, 10.0, 7.0, 5.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.890625, -5.722412109375, -5.55419921875, -5.385986328125, -5.2177734375, -5.049560546875, -4.88134765625, -4.713134765625, -4.544921875, -4.376708984375, -4.20849609375, -4.040283203125, -3.8720703125, -3.703857421875, -3.53564453125, -3.367431640625, -3.19921875, -3.031005859375, -2.86279296875, -2.694580078125, -2.5263671875, -2.358154296875, -2.18994140625, -2.021728515625, -1.853515625, -1.685302734375, -1.51708984375, -1.348876953125, -1.1806640625, -1.012451171875, -0.84423828125, -0.676025390625, -0.5078125, -0.339599609375, -0.17138671875, -0.003173828125, 0.1650390625, 0.333251953125, 0.50146484375, 0.669677734375, 0.837890625, 1.006103515625, 1.17431640625, 1.342529296875, 1.5107421875, 1.678955078125, 1.84716796875, 2.015380859375, 2.18359375, 2.351806640625, 2.52001953125, 2.688232421875, 2.8564453125, 3.024658203125, 3.19287109375, 3.361083984375, 3.529296875, 3.697509765625, 3.86572265625, 4.033935546875, 4.2021484375, 4.370361328125, 4.53857421875, 4.706787109375, 4.875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 8.0, 9.0, 13.0, 27.0, 33.0, 86.0, 106.0, 154.0, 157.0, 144.0, 96.0, 66.0, 48.0, 19.0, 10.0, 9.0, 8.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.79270935058594, -106.68901062011719, -103.58531188964844, -100.48162078857422, -97.37792205810547, -94.27422332763672, -91.17052459716797, -88.06683349609375, -84.963134765625, -81.85943603515625, -78.7557373046875, -75.65204620361328, -72.54834747314453, -69.44464874267578, -66.34095001220703, -63.23725509643555, -60.1335563659668, -57.02985763549805, -53.92616271972656, -50.82246398925781, -47.71876907348633, -44.61507034301758, -41.511375427246094, -38.407676696777344, -35.303977966308594, -32.200279235839844, -29.09658432006836, -25.99288558959961, -22.889190673828125, -19.785491943359375, -16.681795120239258, -13.57809829711914, -10.474403381347656, -7.370706558227539, -4.267009258270264, -1.1633119583129883, 1.940384864807129, 5.044081687927246, 8.14777946472168, 11.251476287841797, 14.355173110961914, 17.45886993408203, 20.56256675720215, 23.666263580322266, 26.769962310791016, 29.8736572265625, 32.97735595703125, 36.0810546875, 39.184749603271484, 42.288448333740234, 45.39214324951172, 48.49584197998047, 51.59953689575195, 54.7032356262207, 57.80693054199219, 60.91062927246094, 64.01432800292969, 67.11802673339844, 70.22172546386719, 73.3254165649414, 76.42911529541016, 79.5328140258789, 82.63651275634766, 85.74020385742188, 88.84390258789062]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 2.0, 3.0, 10.0, 9.0, 4.0, 20.0, 19.0, 13.0, 18.0, 18.0, 26.0, 36.0, 34.0, 42.0, 45.0, 42.0, 53.0, 54.0, 50.0, 44.0, 55.0, 48.0, 33.0, 44.0, 40.0, 31.0, 35.0, 29.0, 35.0, 19.0, 21.0, 15.0, 17.0, 8.0, 12.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.80413055419922, -48.85121154785156, -46.898292541503906, -44.945377349853516, -42.99245834350586, -41.0395393371582, -39.08662414550781, -37.133705139160156, -35.1807861328125, -33.227867126464844, -31.27495002746582, -29.322032928466797, -27.36911392211914, -25.416194915771484, -23.46327781677246, -21.510360717773438, -19.55744171142578, -17.604522705078125, -15.651605606079102, -13.698687553405762, -11.745769500732422, -9.792851448059082, -7.839933395385742, -5.887015342712402, -3.9340972900390625, -1.9811792373657227, -0.028261184692382812, 1.924656867980957, 3.877574920654297, 5.830492973327637, 7.783411026000977, 9.736329078674316, 11.689247131347656, 13.642165184020996, 15.595083236694336, 17.54800033569336, 19.500919342041016, 21.453838348388672, 23.406755447387695, 25.35967254638672, 27.312591552734375, 29.26551055908203, 31.218427658081055, 33.17134475708008, 35.124263763427734, 37.07718276977539, 39.03009796142578, 40.98301696777344, 42.935935974121094, 44.88885498046875, 46.841773986816406, 48.7946891784668, 50.74760818481445, 52.70052719116211, 54.6534423828125, 56.606361389160156, 58.55928039550781, 60.51219940185547, 62.465118408203125, 64.41803741455078, 66.37095642089844, 68.32386779785156, 70.27678680419922, 72.22970581054688, 74.18262481689453]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 2.0, 3.0, 9.0, 10.0, 32.0, 29.0, 50.0, 75.0, 119.0, 205.0, 406.0, 843.0, 1984.0, 5584.0, 25799.0, 399540.0, 3683225.0, 61564.0, 10021.0, 2785.0, 1047.0, 429.0, 213.0, 135.0, 54.0, 37.0, 26.0, 12.0, 9.0, 11.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.375, -33.540771484375, -32.70654296875, -31.872314453125, -31.0380859375, -30.203857421875, -29.36962890625, -28.535400390625, -27.701171875, -26.866943359375, -26.03271484375, -25.198486328125, -24.3642578125, -23.530029296875, -22.69580078125, -21.861572265625, -21.02734375, -20.193115234375, -19.35888671875, -18.524658203125, -17.6904296875, -16.856201171875, -16.02197265625, -15.187744140625, -14.353515625, -13.519287109375, -12.68505859375, -11.850830078125, -11.0166015625, -10.182373046875, -9.34814453125, -8.513916015625, -7.6796875, -6.845458984375, -6.01123046875, -5.177001953125, -4.3427734375, -3.508544921875, -2.67431640625, -1.840087890625, -1.005859375, -0.171630859375, 0.66259765625, 1.496826171875, 2.3310546875, 3.165283203125, 3.99951171875, 4.833740234375, 5.66796875, 6.502197265625, 7.33642578125, 8.170654296875, 9.0048828125, 9.839111328125, 10.67333984375, 11.507568359375, 12.341796875, 13.176025390625, 14.01025390625, 14.844482421875, 15.6787109375, 16.512939453125, 17.34716796875, 18.181396484375, 19.015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 9.0, 21.0, 15.0, 38.0, 36.0, 50.0, 56.0, 66.0, 71.0, 84.0, 95.0, 81.0, 72.0, 69.0, 37.0, 53.0, 36.0, 23.0, 19.0, 16.0, 10.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.0859375, -4.945953369140625, -4.80596923828125, -4.665985107421875, -4.5260009765625, -4.386016845703125, -4.24603271484375, -4.106048583984375, -3.966064453125, -3.826080322265625, -3.68609619140625, -3.546112060546875, -3.4061279296875, -3.266143798828125, -3.12615966796875, -2.986175537109375, -2.84619140625, -2.706207275390625, -2.56622314453125, -2.426239013671875, -2.2862548828125, -2.146270751953125, -2.00628662109375, -1.866302490234375, -1.726318359375, -1.586334228515625, -1.44635009765625, -1.306365966796875, -1.1663818359375, -1.026397705078125, -0.88641357421875, -0.746429443359375, -0.6064453125, -0.466461181640625, -0.32647705078125, -0.186492919921875, -0.0465087890625, 0.093475341796875, 0.23345947265625, 0.373443603515625, 0.513427734375, 0.653411865234375, 0.79339599609375, 0.933380126953125, 1.0733642578125, 1.213348388671875, 1.35333251953125, 1.493316650390625, 1.63330078125, 1.773284912109375, 1.91326904296875, 2.053253173828125, 2.1932373046875, 2.333221435546875, 2.47320556640625, 2.613189697265625, 2.753173828125, 2.893157958984375, 3.03314208984375, 3.173126220703125, 3.3131103515625, 3.453094482421875, 3.59307861328125, 3.733062744140625, 3.873046875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 10.0, 15.0, 20.0, 23.0, 32.0, 29.0, 57.0, 74.0, 124.0, 167.0, 307.0, 546.0, 1171.0, 3316.0, 13112.0, 99851.0, 3577925.0, 457692.0, 30259.0, 5948.0, 1814.0, 711.0, 373.0, 226.0, 137.0, 95.0, 76.0, 57.0, 30.0, 25.0, 22.0, 14.0, 11.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.484375, -18.870361328125, -18.25634765625, -17.642333984375, -17.0283203125, -16.414306640625, -15.80029296875, -15.186279296875, -14.572265625, -13.958251953125, -13.34423828125, -12.730224609375, -12.1162109375, -11.502197265625, -10.88818359375, -10.274169921875, -9.66015625, -9.046142578125, -8.43212890625, -7.818115234375, -7.2041015625, -6.590087890625, -5.97607421875, -5.362060546875, -4.748046875, -4.134033203125, -3.52001953125, -2.906005859375, -2.2919921875, -1.677978515625, -1.06396484375, -0.449951171875, 0.1640625, 0.778076171875, 1.39208984375, 2.006103515625, 2.6201171875, 3.234130859375, 3.84814453125, 4.462158203125, 5.076171875, 5.690185546875, 6.30419921875, 6.918212890625, 7.5322265625, 8.146240234375, 8.76025390625, 9.374267578125, 9.98828125, 10.602294921875, 11.21630859375, 11.830322265625, 12.4443359375, 13.058349609375, 13.67236328125, 14.286376953125, 14.900390625, 15.514404296875, 16.12841796875, 16.742431640625, 17.3564453125, 17.970458984375, 18.58447265625, 19.198486328125, 19.8125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 7.0, 20.0, 29.0, 76.0, 211.0, 960.0, 2162.0, 407.0, 111.0, 43.0, 22.0, 10.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.3240966796875, -11.929443359375, -11.5347900390625, -11.14013671875, -10.7454833984375, -10.350830078125, -9.9561767578125, -9.5615234375, -9.1668701171875, -8.772216796875, -8.3775634765625, -7.98291015625, -7.5882568359375, -7.193603515625, -6.7989501953125, -6.404296875, -6.0096435546875, -5.614990234375, -5.2203369140625, -4.82568359375, -4.4310302734375, -4.036376953125, -3.6417236328125, -3.2470703125, -2.8524169921875, -2.457763671875, -2.0631103515625, -1.66845703125, -1.2738037109375, -0.879150390625, -0.4844970703125, -0.08984375, 0.3048095703125, 0.699462890625, 1.0941162109375, 1.48876953125, 1.8834228515625, 2.278076171875, 2.6727294921875, 3.0673828125, 3.4620361328125, 3.856689453125, 4.2513427734375, 4.64599609375, 5.0406494140625, 5.435302734375, 5.8299560546875, 6.224609375, 6.6192626953125, 7.013916015625, 7.4085693359375, 7.80322265625, 8.1978759765625, 8.592529296875, 8.9871826171875, 9.3818359375, 9.7764892578125, 10.171142578125, 10.5657958984375, 10.96044921875, 11.3551025390625, 11.749755859375, 12.1444091796875, 12.5390625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 13.0, 21.0, 24.0, 42.0, 74.0, 88.0, 129.0, 136.0, 143.0, 92.0, 84.0, 52.0, 37.0, 22.0, 14.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.876502990722656, -36.7429313659668, -35.60935974121094, -34.47578430175781, -33.34221267700195, -32.208641052246094, -31.0750675201416, -29.94149398803711, -28.80792236328125, -27.67435073852539, -26.5407772064209, -25.407203674316406, -24.273632049560547, -23.140060424804688, -22.006486892700195, -20.872913360595703, -19.739341735839844, -18.605770111083984, -17.472196578979492, -16.338623046875, -15.20505142211914, -14.071478843688965, -12.937906265258789, -11.804333686828613, -10.670761108398438, -9.537188529968262, -8.403615951538086, -7.27004337310791, -6.136470794677734, -5.002898216247559, -3.869325637817383, -2.735753059387207, -1.6021766662597656, -0.46860408782958984, 0.6649684906005859, 1.7985410690307617, 2.9321136474609375, 4.065686225891113, 5.199258804321289, 6.332831382751465, 7.466403961181641, 8.599976539611816, 9.733549118041992, 10.867121696472168, 12.000694274902344, 13.13426685333252, 14.267839431762695, 15.401412010192871, 16.534984588623047, 17.668556213378906, 18.8021297454834, 19.93570327758789, 21.06927490234375, 22.20284652709961, 23.3364200592041, 24.469993591308594, 25.603565216064453, 26.737136840820312, 27.870710372924805, 29.004283905029297, 30.137855529785156, 31.271427154541016, 32.404998779296875, 33.53857421875, 34.67214584350586]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 3.0, 10.0, 16.0, 14.0, 29.0, 27.0, 25.0, 39.0, 59.0, 43.0, 55.0, 56.0, 65.0, 68.0, 61.0, 63.0, 67.0, 47.0, 44.0, 40.0, 37.0, 27.0, 26.0, 16.0, 20.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.943836212158203, -28.079345703125, -27.214855194091797, -26.350366592407227, -25.485876083374023, -24.62138557434082, -23.756895065307617, -22.892406463623047, -22.027915954589844, -21.16342544555664, -20.298934936523438, -19.434446334838867, -18.569955825805664, -17.70546531677246, -16.840974807739258, -15.976485252380371, -15.111994743347168, -14.247504234313965, -13.383014678955078, -12.518524169921875, -11.654034614562988, -10.789544105529785, -9.925054550170898, -9.060564041137695, -8.196073532104492, -7.331583499908447, -6.467093467712402, -5.602602958679199, -4.7381134033203125, -3.8736228942871094, -3.0091328620910645, -2.1446428298950195, -1.2801532745361328, -0.4156631827354431, 0.4488269090652466, 1.313317060470581, 2.177807092666626, 3.04229736328125, 3.906787395477295, 4.77127742767334, 5.635767459869385, 6.50025749206543, 7.364747524261475, 8.22923755645752, 9.093728065490723, 9.95821762084961, 10.822708129882812, 11.687198638916016, 12.551688194274902, 13.416178703308105, 14.280668258666992, 15.145158767700195, 16.0096492767334, 16.87413787841797, 17.738628387451172, 18.603118896484375, 19.467609405517578, 20.33209991455078, 21.196590423583984, 22.061079025268555, 22.925569534301758, 23.79006004333496, 24.654550552368164, 25.519039154052734, 26.383529663085938]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 7.0, 11.0, 9.0, 16.0, 21.0, 21.0, 42.0, 65.0, 91.0, 101.0, 193.0, 300.0, 526.0, 888.0, 1536.0, 3202.0, 7173.0, 19711.0, 65548.0, 263408.0, 489151.0, 137331.0, 36894.0, 12133.0, 4839.0, 2287.0, 1134.0, 717.0, 391.0, 267.0, 156.0, 122.0, 65.0, 45.0, 31.0, 23.0, 23.0, 17.0, 14.0, 4.0, 4.0, 4.0, 4.0, 5.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.15625, -15.6556396484375, -15.155029296875, -14.6544189453125, -14.15380859375, -13.6531982421875, -13.152587890625, -12.6519775390625, -12.1513671875, -11.6507568359375, -11.150146484375, -10.6495361328125, -10.14892578125, -9.6483154296875, -9.147705078125, -8.6470947265625, -8.146484375, -7.6458740234375, -7.145263671875, -6.6446533203125, -6.14404296875, -5.6434326171875, -5.142822265625, -4.6422119140625, -4.1416015625, -3.6409912109375, -3.140380859375, -2.6397705078125, -2.13916015625, -1.6385498046875, -1.137939453125, -0.6373291015625, -0.13671875, 0.3638916015625, 0.864501953125, 1.3651123046875, 1.86572265625, 2.3663330078125, 2.866943359375, 3.3675537109375, 3.8681640625, 4.3687744140625, 4.869384765625, 5.3699951171875, 5.87060546875, 6.3712158203125, 6.871826171875, 7.3724365234375, 7.873046875, 8.3736572265625, 8.874267578125, 9.3748779296875, 9.87548828125, 10.3760986328125, 10.876708984375, 11.3773193359375, 11.8779296875, 12.3785400390625, 12.879150390625, 13.3797607421875, 13.88037109375, 14.3809814453125, 14.881591796875, 15.3822021484375, 15.8828125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 13.0, 25.0, 26.0, 34.0, 50.0, 70.0, 53.0, 72.0, 104.0, 105.0, 83.0, 81.0, 56.0, 48.0, 39.0, 28.0, 30.0, 27.0, 15.0, 3.0, 5.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.421875, -5.2685546875, -5.115234375, -4.9619140625, -4.80859375, -4.6552734375, -4.501953125, -4.3486328125, -4.1953125, -4.0419921875, -3.888671875, -3.7353515625, -3.58203125, -3.4287109375, -3.275390625, -3.1220703125, -2.96875, -2.8154296875, -2.662109375, -2.5087890625, -2.35546875, -2.2021484375, -2.048828125, -1.8955078125, -1.7421875, -1.5888671875, -1.435546875, -1.2822265625, -1.12890625, -0.9755859375, -0.822265625, -0.6689453125, -0.515625, -0.3623046875, -0.208984375, -0.0556640625, 0.09765625, 0.2509765625, 0.404296875, 0.5576171875, 0.7109375, 0.8642578125, 1.017578125, 1.1708984375, 1.32421875, 1.4775390625, 1.630859375, 1.7841796875, 1.9375, 2.0908203125, 2.244140625, 2.3974609375, 2.55078125, 2.7041015625, 2.857421875, 3.0107421875, 3.1640625, 3.3173828125, 3.470703125, 3.6240234375, 3.77734375, 3.9306640625, 4.083984375, 4.2373046875, 4.390625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 8.0, 14.0, 13.0, 22.0, 29.0, 38.0, 51.0, 54.0, 72.0, 107.0, 151.0, 194.0, 278.0, 440.0, 699.0, 1201.0, 2562.0, 5798.0, 15567.0, 44455.0, 136730.0, 393054.0, 299618.0, 95250.0, 31494.0, 11267.0, 4461.0, 1993.0, 986.0, 611.0, 346.0, 260.0, 214.0, 122.0, 105.0, 65.0, 37.0, 46.0, 25.0, 21.0, 14.0, 16.0, 15.0, 16.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.0234375, -10.67724609375, -10.3310546875, -9.98486328125, -9.638671875, -9.29248046875, -8.9462890625, -8.60009765625, -8.25390625, -7.90771484375, -7.5615234375, -7.21533203125, -6.869140625, -6.52294921875, -6.1767578125, -5.83056640625, -5.484375, -5.13818359375, -4.7919921875, -4.44580078125, -4.099609375, -3.75341796875, -3.4072265625, -3.06103515625, -2.71484375, -2.36865234375, -2.0224609375, -1.67626953125, -1.330078125, -0.98388671875, -0.6376953125, -0.29150390625, 0.0546875, 0.40087890625, 0.7470703125, 1.09326171875, 1.439453125, 1.78564453125, 2.1318359375, 2.47802734375, 2.82421875, 3.17041015625, 3.5166015625, 3.86279296875, 4.208984375, 4.55517578125, 4.9013671875, 5.24755859375, 5.59375, 5.93994140625, 6.2861328125, 6.63232421875, 6.978515625, 7.32470703125, 7.6708984375, 8.01708984375, 8.36328125, 8.70947265625, 9.0556640625, 9.40185546875, 9.748046875, 10.09423828125, 10.4404296875, 10.78662109375, 11.1328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 8.0, 10.0, 12.0, 10.0, 19.0, 19.0, 22.0, 23.0, 35.0, 30.0, 35.0, 27.0, 42.0, 39.0, 53.0, 51.0, 44.0, 36.0, 41.0, 46.0, 53.0, 46.0, 48.0, 32.0, 26.0, 26.0, 23.0, 29.0, 25.0, 17.0, 15.0, 14.0, 6.0, 10.0, 3.0, 5.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.659912109375, -10.29638671875, -9.932861328125, -9.5693359375, -9.205810546875, -8.84228515625, -8.478759765625, -8.115234375, -7.751708984375, -7.38818359375, -7.024658203125, -6.6611328125, -6.297607421875, -5.93408203125, -5.570556640625, -5.20703125, -4.843505859375, -4.47998046875, -4.116455078125, -3.7529296875, -3.389404296875, -3.02587890625, -2.662353515625, -2.298828125, -1.935302734375, -1.57177734375, -1.208251953125, -0.8447265625, -0.481201171875, -0.11767578125, 0.245849609375, 0.609375, 0.972900390625, 1.33642578125, 1.699951171875, 2.0634765625, 2.427001953125, 2.79052734375, 3.154052734375, 3.517578125, 3.881103515625, 4.24462890625, 4.608154296875, 4.9716796875, 5.335205078125, 5.69873046875, 6.062255859375, 6.42578125, 6.789306640625, 7.15283203125, 7.516357421875, 7.8798828125, 8.243408203125, 8.60693359375, 8.970458984375, 9.333984375, 9.697509765625, 10.06103515625, 10.424560546875, 10.7880859375, 11.151611328125, 11.51513671875, 11.878662109375, 12.2421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 13.0, 19.0, 25.0, 47.0, 104.0, 241.0, 792.0, 4272.0, 75003.0, 933832.0, 30613.0, 2645.0, 565.0, 197.0, 87.0, 34.0, 25.0, 17.0, 9.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.578125, -18.91162109375, -18.2451171875, -17.57861328125, -16.912109375, -16.24560546875, -15.5791015625, -14.91259765625, -14.24609375, -13.57958984375, -12.9130859375, -12.24658203125, -11.580078125, -10.91357421875, -10.2470703125, -9.58056640625, -8.9140625, -8.24755859375, -7.5810546875, -6.91455078125, -6.248046875, -5.58154296875, -4.9150390625, -4.24853515625, -3.58203125, -2.91552734375, -2.2490234375, -1.58251953125, -0.916015625, -0.24951171875, 0.4169921875, 1.08349609375, 1.75, 2.41650390625, 3.0830078125, 3.74951171875, 4.416015625, 5.08251953125, 5.7490234375, 6.41552734375, 7.08203125, 7.74853515625, 8.4150390625, 9.08154296875, 9.748046875, 10.41455078125, 11.0810546875, 11.74755859375, 12.4140625, 13.08056640625, 13.7470703125, 14.41357421875, 15.080078125, 15.74658203125, 16.4130859375, 17.07958984375, 17.74609375, 18.41259765625, 19.0791015625, 19.74560546875, 20.412109375, 21.07861328125, 21.7451171875, 22.41162109375, 23.078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 7.0, 9.0, 8.0, 14.0, 18.0, 28.0, 28.0, 41.0, 68.0, 125.0, 262.0, 159.0, 78.0, 33.0, 32.0, 33.0, 13.0, 10.0, 15.0, 10.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001438140869140625, -0.001399993896484375, -0.001361846923828125, -0.001323699951171875, -0.001285552978515625, -0.001247406005859375, -0.001209259033203125, -0.001171112060546875, -0.001132965087890625, -0.001094818115234375, -0.001056671142578125, -0.001018524169921875, -0.000980377197265625, -0.000942230224609375, -0.000904083251953125, -0.000865936279296875, -0.000827789306640625, -0.000789642333984375, -0.000751495361328125, -0.000713348388671875, -0.000675201416015625, -0.000637054443359375, -0.000598907470703125, -0.000560760498046875, -0.000522613525390625, -0.000484466552734375, -0.000446319580078125, -0.000408172607421875, -0.000370025634765625, -0.000331878662109375, -0.000293731689453125, -0.000255584716796875, -0.000217437744140625, -0.000179290771484375, -0.000141143798828125, -0.000102996826171875, -6.4849853515625e-05, -2.6702880859375e-05, 1.1444091796875e-05, 4.9591064453125e-05, 8.7738037109375e-05, 0.000125885009765625, 0.000164031982421875, 0.000202178955078125, 0.000240325927734375, 0.000278472900390625, 0.000316619873046875, 0.000354766845703125, 0.000392913818359375, 0.000431060791015625, 0.000469207763671875, 0.000507354736328125, 0.000545501708984375, 0.000583648681640625, 0.000621795654296875, 0.000659942626953125, 0.000698089599609375, 0.000736236572265625, 0.000774383544921875, 0.000812530517578125, 0.000850677490234375, 0.000888824462890625, 0.000926971435546875, 0.000965118408203125, 0.001003265380859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 11.0, 10.0, 28.0, 53.0, 112.0, 204.0, 638.0, 2836.0, 24447.0, 915999.0, 96439.0, 6069.0, 1078.0, 350.0, 123.0, 61.0, 38.0, 20.0, 16.0, 8.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.410400390625, -16.75830078125, -16.106201171875, -15.4541015625, -14.802001953125, -14.14990234375, -13.497802734375, -12.845703125, -12.193603515625, -11.54150390625, -10.889404296875, -10.2373046875, -9.585205078125, -8.93310546875, -8.281005859375, -7.62890625, -6.976806640625, -6.32470703125, -5.672607421875, -5.0205078125, -4.368408203125, -3.71630859375, -3.064208984375, -2.412109375, -1.760009765625, -1.10791015625, -0.455810546875, 0.1962890625, 0.848388671875, 1.50048828125, 2.152587890625, 2.8046875, 3.456787109375, 4.10888671875, 4.760986328125, 5.4130859375, 6.065185546875, 6.71728515625, 7.369384765625, 8.021484375, 8.673583984375, 9.32568359375, 9.977783203125, 10.6298828125, 11.281982421875, 11.93408203125, 12.586181640625, 13.23828125, 13.890380859375, 14.54248046875, 15.194580078125, 15.8466796875, 16.498779296875, 17.15087890625, 17.802978515625, 18.455078125, 19.107177734375, 19.75927734375, 20.411376953125, 21.0634765625, 21.715576171875, 22.36767578125, 23.019775390625, 23.671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 2.0, 10.0, 9.0, 18.0, 12.0, 23.0, 29.0, 57.0, 72.0, 115.0, 145.0, 131.0, 125.0, 67.0, 55.0, 27.0, 22.0, 16.0, 14.0, 10.0, 9.0, 5.0, 1.0, 5.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.97265625, -5.75213623046875, -5.5316162109375, -5.31109619140625, -5.090576171875, -4.87005615234375, -4.6495361328125, -4.42901611328125, -4.20849609375, -3.98797607421875, -3.7674560546875, -3.54693603515625, -3.326416015625, -3.10589599609375, -2.8853759765625, -2.66485595703125, -2.4443359375, -2.22381591796875, -2.0032958984375, -1.78277587890625, -1.562255859375, -1.34173583984375, -1.1212158203125, -0.90069580078125, -0.68017578125, -0.45965576171875, -0.2391357421875, -0.01861572265625, 0.201904296875, 0.42242431640625, 0.6429443359375, 0.86346435546875, 1.083984375, 1.30450439453125, 1.5250244140625, 1.74554443359375, 1.966064453125, 2.18658447265625, 2.4071044921875, 2.62762451171875, 2.84814453125, 3.06866455078125, 3.2891845703125, 3.50970458984375, 3.730224609375, 3.95074462890625, 4.1712646484375, 4.39178466796875, 4.6123046875, 4.83282470703125, 5.0533447265625, 5.27386474609375, 5.494384765625, 5.71490478515625, 5.9354248046875, 6.15594482421875, 6.37646484375, 6.59698486328125, 6.8175048828125, 7.03802490234375, 7.258544921875, 7.47906494140625, 7.6995849609375, 7.92010498046875, 8.140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 14.0, 45.0, 79.0, 130.0, 213.0, 215.0, 158.0, 68.0, 37.0, 23.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.75274658203125, -156.89144897460938, -152.0301513671875, -147.16885375976562, -142.3075408935547, -137.4462432861328, -132.58494567871094, -127.72364807128906, -122.86235046386719, -118.00105285644531, -113.1397476196289, -108.27845001220703, -103.41715240478516, -98.55584716796875, -93.69454956054688, -88.833251953125, -83.9719467163086, -79.11064910888672, -74.24934387207031, -69.38804626464844, -64.52674865722656, -59.66544723510742, -54.80414581298828, -49.942848205566406, -45.081546783447266, -40.220245361328125, -35.35894775390625, -30.49764633178711, -25.6363468170166, -20.775047302246094, -15.913745880126953, -11.052448272705078, -6.1911468505859375, -1.3298468589782715, 3.5314531326293945, 8.392753601074219, 13.254053115844727, 18.115352630615234, 22.976654052734375, 27.83795166015625, 32.69925308227539, 37.56055450439453, 42.421852111816406, 47.28315353393555, 52.14445495605469, 57.00575256347656, 61.8670539855957, 66.72834777832031, 71.58965301513672, 76.4509506225586, 81.312255859375, 86.17355346679688, 91.03485107421875, 95.89614868164062, 100.75745391845703, 105.6187515258789, 110.48005676269531, 115.34135437011719, 120.2026596069336, 125.06395721435547, 129.92526245117188, 134.78656005859375, 139.64785766601562, 144.5091552734375, 149.37045288085938]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 5.0, 14.0, 13.0, 7.0, 9.0, 9.0, 15.0, 19.0, 22.0, 17.0, 16.0, 29.0, 23.0, 26.0, 29.0, 32.0, 45.0, 41.0, 33.0, 45.0, 46.0, 27.0, 47.0, 41.0, 50.0, 42.0, 40.0, 24.0, 35.0, 34.0, 20.0, 21.0, 20.0, 16.0, 12.0, 12.0, 17.0, 6.0, 5.0, 8.0, 2.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-61.12358093261719, -59.36177062988281, -57.59996032714844, -55.83815002441406, -54.07633972167969, -52.31452941894531, -50.55271530151367, -48.7909049987793, -47.02909469604492, -45.26728439331055, -43.50547409057617, -41.7436637878418, -39.981849670410156, -38.22003936767578, -36.458229064941406, -34.69641876220703, -32.934608459472656, -31.17279815673828, -29.410987854003906, -27.6491756439209, -25.887365341186523, -24.12555503845215, -22.36374282836914, -20.601932525634766, -18.84012222290039, -17.078311920166016, -15.316500663757324, -13.554689407348633, -11.792879104614258, -10.031068801879883, -8.269257545471191, -6.5074462890625, -4.745632171630859, -2.983821392059326, -1.222010612487793, 0.5398001670837402, 2.3016109466552734, 4.063421249389648, 5.82523250579834, 7.587043762207031, 9.348854064941406, 11.110664367675781, 12.872475624084473, 14.634286880493164, 16.39609718322754, 18.157907485961914, 19.919719696044922, 21.681529998779297, 23.443340301513672, 25.205150604248047, 26.966960906982422, 28.72877311706543, 30.490583419799805, 32.25239562988281, 34.01420593261719, 35.77601623535156, 37.53782653808594, 39.29963684082031, 41.06144714355469, 42.82325744628906, 44.58506774902344, 46.34687805175781, 48.10869216918945, 49.87050247192383, 51.6323127746582]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 10.0, 11.0, 19.0, 18.0, 25.0, 36.0, 51.0, 78.0, 131.0, 168.0, 280.0, 480.0, 907.0, 1631.0, 3596.0, 9446.0, 32492.0, 230865.0, 3732367.0, 142943.0, 25213.0, 7527.0, 2972.0, 1354.0, 692.0, 365.0, 214.0, 127.0, 78.0, 47.0, 43.0, 26.0, 15.0, 7.0, 11.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.21875, -22.56298828125, -21.9072265625, -21.25146484375, -20.595703125, -19.93994140625, -19.2841796875, -18.62841796875, -17.97265625, -17.31689453125, -16.6611328125, -16.00537109375, -15.349609375, -14.69384765625, -14.0380859375, -13.38232421875, -12.7265625, -12.07080078125, -11.4150390625, -10.75927734375, -10.103515625, -9.44775390625, -8.7919921875, -8.13623046875, -7.48046875, -6.82470703125, -6.1689453125, -5.51318359375, -4.857421875, -4.20166015625, -3.5458984375, -2.89013671875, -2.234375, -1.57861328125, -0.9228515625, -0.26708984375, 0.388671875, 1.04443359375, 1.7001953125, 2.35595703125, 3.01171875, 3.66748046875, 4.3232421875, 4.97900390625, 5.634765625, 6.29052734375, 6.9462890625, 7.60205078125, 8.2578125, 8.91357421875, 9.5693359375, 10.22509765625, 10.880859375, 11.53662109375, 12.1923828125, 12.84814453125, 13.50390625, 14.15966796875, 14.8154296875, 15.47119140625, 16.126953125, 16.78271484375, 17.4384765625, 18.09423828125, 18.75]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 10.0, 14.0, 20.0, 24.0, 30.0, 36.0, 49.0, 60.0, 77.0, 81.0, 79.0, 102.0, 82.0, 70.0, 65.0, 48.0, 28.0, 30.0, 23.0, 20.0, 9.0, 9.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6953125, -5.536376953125, -5.37744140625, -5.218505859375, -5.0595703125, -4.900634765625, -4.74169921875, -4.582763671875, -4.423828125, -4.264892578125, -4.10595703125, -3.947021484375, -3.7880859375, -3.629150390625, -3.47021484375, -3.311279296875, -3.15234375, -2.993408203125, -2.83447265625, -2.675537109375, -2.5166015625, -2.357666015625, -2.19873046875, -2.039794921875, -1.880859375, -1.721923828125, -1.56298828125, -1.404052734375, -1.2451171875, -1.086181640625, -0.92724609375, -0.768310546875, -0.609375, -0.450439453125, -0.29150390625, -0.132568359375, 0.0263671875, 0.185302734375, 0.34423828125, 0.503173828125, 0.662109375, 0.821044921875, 0.97998046875, 1.138916015625, 1.2978515625, 1.456787109375, 1.61572265625, 1.774658203125, 1.93359375, 2.092529296875, 2.25146484375, 2.410400390625, 2.5693359375, 2.728271484375, 2.88720703125, 3.046142578125, 3.205078125, 3.364013671875, 3.52294921875, 3.681884765625, 3.8408203125, 3.999755859375, 4.15869140625, 4.317626953125, 4.4765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 9.0, 6.0, 11.0, 23.0, 25.0, 33.0, 38.0, 52.0, 89.0, 94.0, 145.0, 199.0, 299.0, 437.0, 750.0, 1479.0, 4026.0, 16271.0, 158616.0, 3845697.0, 143020.0, 15370.0, 3869.0, 1433.0, 751.0, 418.0, 303.0, 201.0, 146.0, 123.0, 88.0, 71.0, 46.0, 43.0, 24.0, 16.0, 15.0, 10.0, 10.0, 5.0, 4.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.04638671875, -18.3271484375, -17.60791015625, -16.888671875, -16.16943359375, -15.4501953125, -14.73095703125, -14.01171875, -13.29248046875, -12.5732421875, -11.85400390625, -11.134765625, -10.41552734375, -9.6962890625, -8.97705078125, -8.2578125, -7.53857421875, -6.8193359375, -6.10009765625, -5.380859375, -4.66162109375, -3.9423828125, -3.22314453125, -2.50390625, -1.78466796875, -1.0654296875, -0.34619140625, 0.373046875, 1.09228515625, 1.8115234375, 2.53076171875, 3.25, 3.96923828125, 4.6884765625, 5.40771484375, 6.126953125, 6.84619140625, 7.5654296875, 8.28466796875, 9.00390625, 9.72314453125, 10.4423828125, 11.16162109375, 11.880859375, 12.60009765625, 13.3193359375, 14.03857421875, 14.7578125, 15.47705078125, 16.1962890625, 16.91552734375, 17.634765625, 18.35400390625, 19.0732421875, 19.79248046875, 20.51171875, 21.23095703125, 21.9501953125, 22.66943359375, 23.388671875, 24.10791015625, 24.8271484375, 25.54638671875, 26.265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 7.0, 6.0, 4.0, 17.0, 30.0, 43.0, 115.0, 376.0, 2166.0, 901.0, 217.0, 83.0, 43.0, 23.0, 15.0, 6.0, 11.0, 7.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.859375, -6.5438232421875, -6.228271484375, -5.9127197265625, -5.59716796875, -5.2816162109375, -4.966064453125, -4.6505126953125, -4.3349609375, -4.0194091796875, -3.703857421875, -3.3883056640625, -3.07275390625, -2.7572021484375, -2.441650390625, -2.1260986328125, -1.810546875, -1.4949951171875, -1.179443359375, -0.8638916015625, -0.54833984375, -0.2327880859375, 0.082763671875, 0.3983154296875, 0.7138671875, 1.0294189453125, 1.344970703125, 1.6605224609375, 1.97607421875, 2.2916259765625, 2.607177734375, 2.9227294921875, 3.23828125, 3.5538330078125, 3.869384765625, 4.1849365234375, 4.50048828125, 4.8160400390625, 5.131591796875, 5.4471435546875, 5.7626953125, 6.0782470703125, 6.393798828125, 6.7093505859375, 7.02490234375, 7.3404541015625, 7.656005859375, 7.9715576171875, 8.287109375, 8.6026611328125, 8.918212890625, 9.2337646484375, 9.54931640625, 9.8648681640625, 10.180419921875, 10.4959716796875, 10.8115234375, 11.1270751953125, 11.442626953125, 11.7581787109375, 12.07373046875, 12.3892822265625, 12.704833984375, 13.0203857421875, 13.3359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 14.0, 24.0, 45.0, 101.0, 141.0, 180.0, 147.0, 118.0, 77.0, 67.0, 30.0, 13.0, 12.0, 9.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.63143539428711, -34.150794982910156, -32.67015075683594, -31.189510345458984, -29.7088680267334, -28.228225708007812, -26.747583389282227, -25.26694107055664, -23.786300659179688, -22.3056583404541, -20.825016021728516, -19.344375610351562, -17.863733291625977, -16.38309097290039, -14.902448654174805, -13.421807289123535, -11.941164016723633, -10.460521697998047, -8.979880332946777, -7.499238014221191, -6.018596172332764, -4.537954330444336, -3.05731201171875, -1.5766706466674805, -0.09602832794189453, 1.3846136331558228, 2.86525559425354, 4.345897674560547, 5.826539516448975, 7.307181358337402, 8.787823677062988, 10.268465042114258, 11.749107360839844, 13.22974967956543, 14.7103910446167, 16.19103240966797, 17.671674728393555, 19.15231704711914, 20.632959365844727, 22.113601684570312, 23.594242095947266, 25.07488441467285, 26.555526733398438, 28.03616714477539, 29.516809463500977, 30.997451782226562, 32.47809600830078, 33.958736419677734, 35.43937683105469, 36.92001724243164, 38.40066146850586, 39.88130187988281, 41.36194610595703, 42.842586517333984, 44.32322692871094, 45.803871154785156, 47.284515380859375, 48.76515579223633, 50.24580001831055, 51.7264404296875, 53.20708465576172, 54.68772506713867, 56.168365478515625, 57.649009704589844, 59.1296501159668]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 18.0, 14.0, 25.0, 35.0, 48.0, 57.0, 71.0, 65.0, 78.0, 78.0, 87.0, 68.0, 72.0, 53.0, 55.0, 48.0, 38.0, 34.0, 15.0, 13.0, 14.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.2933349609375, -48.07403564453125, -46.854736328125, -45.63543701171875, -44.4161376953125, -43.19683837890625, -41.9775390625, -40.75823974609375, -39.5389404296875, -38.31964111328125, -37.100341796875, -35.88104248046875, -34.6617431640625, -33.44244384765625, -32.22314453125, -31.00384521484375, -29.7845458984375, -28.56524658203125, -27.345947265625, -26.12664794921875, -24.9073486328125, -23.68804931640625, -22.46875, -21.24945068359375, -20.0301513671875, -18.81085205078125, -17.591552734375, -16.37225341796875, -15.1529541015625, -13.93365478515625, -12.71435546875, -11.49505615234375, -10.2757568359375, -9.05645751953125, -7.837158203125, -6.61785888671875, -5.3985595703125, -4.17926025390625, -2.9599609375, -1.74066162109375, -0.5213623046875, 0.69793701171875, 1.917236328125, 3.13653564453125, 4.3558349609375, 5.57513427734375, 6.79443359375, 8.01373291015625, 9.2330322265625, 10.45233154296875, 11.671630859375, 12.89093017578125, 14.1102294921875, 15.32952880859375, 16.548828125, 17.76812744140625, 18.9874267578125, 20.20672607421875, 21.426025390625, 22.64532470703125, 23.8646240234375, 25.08392333984375, 26.30322265625, 27.52252197265625, 28.7418212890625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 10.0, 13.0, 25.0, 38.0, 63.0, 84.0, 164.0, 326.0, 613.0, 1370.0, 3521.0, 13468.0, 76418.0, 590267.0, 309261.0, 40111.0, 8274.0, 2418.0, 1036.0, 474.0, 272.0, 118.0, 77.0, 47.0, 28.0, 9.0, 12.0, 9.0, 6.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.609375, -25.82275390625, -25.0361328125, -24.24951171875, -23.462890625, -22.67626953125, -21.8896484375, -21.10302734375, -20.31640625, -19.52978515625, -18.7431640625, -17.95654296875, -17.169921875, -16.38330078125, -15.5966796875, -14.81005859375, -14.0234375, -13.23681640625, -12.4501953125, -11.66357421875, -10.876953125, -10.09033203125, -9.3037109375, -8.51708984375, -7.73046875, -6.94384765625, -6.1572265625, -5.37060546875, -4.583984375, -3.79736328125, -3.0107421875, -2.22412109375, -1.4375, -0.65087890625, 0.1357421875, 0.92236328125, 1.708984375, 2.49560546875, 3.2822265625, 4.06884765625, 4.85546875, 5.64208984375, 6.4287109375, 7.21533203125, 8.001953125, 8.78857421875, 9.5751953125, 10.36181640625, 11.1484375, 11.93505859375, 12.7216796875, 13.50830078125, 14.294921875, 15.08154296875, 15.8681640625, 16.65478515625, 17.44140625, 18.22802734375, 19.0146484375, 19.80126953125, 20.587890625, 21.37451171875, 22.1611328125, 22.94775390625, 23.734375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 6.0, 4.0, 0.0, 9.0, 11.0, 20.0, 30.0, 26.0, 30.0, 31.0, 61.0, 68.0, 81.0, 73.0, 99.0, 70.0, 80.0, 83.0, 53.0, 42.0, 33.0, 19.0, 22.0, 17.0, 8.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6171875, -5.45367431640625, -5.2901611328125, -5.12664794921875, -4.963134765625, -4.79962158203125, -4.6361083984375, -4.47259521484375, -4.30908203125, -4.14556884765625, -3.9820556640625, -3.81854248046875, -3.655029296875, -3.49151611328125, -3.3280029296875, -3.16448974609375, -3.0009765625, -2.83746337890625, -2.6739501953125, -2.51043701171875, -2.346923828125, -2.18341064453125, -2.0198974609375, -1.85638427734375, -1.69287109375, -1.52935791015625, -1.3658447265625, -1.20233154296875, -1.038818359375, -0.87530517578125, -0.7117919921875, -0.54827880859375, -0.384765625, -0.22125244140625, -0.0577392578125, 0.10577392578125, 0.269287109375, 0.43280029296875, 0.5963134765625, 0.75982666015625, 0.92333984375, 1.08685302734375, 1.2503662109375, 1.41387939453125, 1.577392578125, 1.74090576171875, 1.9044189453125, 2.06793212890625, 2.2314453125, 2.39495849609375, 2.5584716796875, 2.72198486328125, 2.885498046875, 3.04901123046875, 3.2125244140625, 3.37603759765625, 3.53955078125, 3.70306396484375, 3.8665771484375, 4.03009033203125, 4.193603515625, 4.35711669921875, 4.5206298828125, 4.68414306640625, 4.84765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 5.0, 9.0, 12.0, 19.0, 19.0, 36.0, 45.0, 54.0, 99.0, 136.0, 222.0, 366.0, 665.0, 1322.0, 2975.0, 8393.0, 25723.0, 90516.0, 350820.0, 410501.0, 109460.0, 30604.0, 9741.0, 3573.0, 1454.0, 665.0, 403.0, 204.0, 140.0, 98.0, 69.0, 51.0, 36.0, 25.0, 15.0, 15.0, 12.0, 9.0, 7.0, 6.0, 1.0, 2.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.39453125, -11.015625, -10.63671875, -10.2578125, -9.87890625, -9.5, -9.12109375, -8.7421875, -8.36328125, -7.984375, -7.60546875, -7.2265625, -6.84765625, -6.46875, -6.08984375, -5.7109375, -5.33203125, -4.953125, -4.57421875, -4.1953125, -3.81640625, -3.4375, -3.05859375, -2.6796875, -2.30078125, -1.921875, -1.54296875, -1.1640625, -0.78515625, -0.40625, -0.02734375, 0.3515625, 0.73046875, 1.109375, 1.48828125, 1.8671875, 2.24609375, 2.625, 3.00390625, 3.3828125, 3.76171875, 4.140625, 4.51953125, 4.8984375, 5.27734375, 5.65625, 6.03515625, 6.4140625, 6.79296875, 7.171875, 7.55078125, 7.9296875, 8.30859375, 8.6875, 9.06640625, 9.4453125, 9.82421875, 10.203125, 10.58203125, 10.9609375, 11.33984375, 11.71875, 12.09765625, 12.4765625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 7.0, 5.0, 3.0, 6.0, 10.0, 12.0, 9.0, 15.0, 30.0, 28.0, 33.0, 35.0, 32.0, 45.0, 59.0, 52.0, 55.0, 54.0, 49.0, 63.0, 62.0, 45.0, 42.0, 42.0, 32.0, 30.0, 30.0, 21.0, 16.0, 18.0, 10.0, 12.0, 6.0, 7.0, 6.0, 7.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.234375, -12.79296875, -12.3515625, -11.91015625, -11.46875, -11.02734375, -10.5859375, -10.14453125, -9.703125, -9.26171875, -8.8203125, -8.37890625, -7.9375, -7.49609375, -7.0546875, -6.61328125, -6.171875, -5.73046875, -5.2890625, -4.84765625, -4.40625, -3.96484375, -3.5234375, -3.08203125, -2.640625, -2.19921875, -1.7578125, -1.31640625, -0.875, -0.43359375, 0.0078125, 0.44921875, 0.890625, 1.33203125, 1.7734375, 2.21484375, 2.65625, 3.09765625, 3.5390625, 3.98046875, 4.421875, 4.86328125, 5.3046875, 5.74609375, 6.1875, 6.62890625, 7.0703125, 7.51171875, 7.953125, 8.39453125, 8.8359375, 9.27734375, 9.71875, 10.16015625, 10.6015625, 11.04296875, 11.484375, 11.92578125, 12.3671875, 12.80859375, 13.25, 13.69140625, 14.1328125, 14.57421875, 15.015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 13.0, 13.0, 22.0, 54.0, 138.0, 347.0, 1376.0, 14108.0, 447417.0, 566076.0, 16820.0, 1564.0, 355.0, 150.0, 56.0, 20.0, 14.0, 9.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.296875, -12.9278564453125, -12.558837890625, -12.1898193359375, -11.82080078125, -11.4517822265625, -11.082763671875, -10.7137451171875, -10.3447265625, -9.9757080078125, -9.606689453125, -9.2376708984375, -8.86865234375, -8.4996337890625, -8.130615234375, -7.7615966796875, -7.392578125, -7.0235595703125, -6.654541015625, -6.2855224609375, -5.91650390625, -5.5474853515625, -5.178466796875, -4.8094482421875, -4.4404296875, -4.0714111328125, -3.702392578125, -3.3333740234375, -2.96435546875, -2.5953369140625, -2.226318359375, -1.8572998046875, -1.48828125, -1.1192626953125, -0.750244140625, -0.3812255859375, -0.01220703125, 0.3568115234375, 0.725830078125, 1.0948486328125, 1.4638671875, 1.8328857421875, 2.201904296875, 2.5709228515625, 2.93994140625, 3.3089599609375, 3.677978515625, 4.0469970703125, 4.416015625, 4.7850341796875, 5.154052734375, 5.5230712890625, 5.89208984375, 6.2611083984375, 6.630126953125, 6.9991455078125, 7.3681640625, 7.7371826171875, 8.106201171875, 8.4752197265625, 8.84423828125, 9.2132568359375, 9.582275390625, 9.9512939453125, 10.3203125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 4.0, 13.0, 8.0, 12.0, 11.0, 15.0, 14.0, 32.0, 45.0, 64.0, 155.0, 180.0, 130.0, 80.0, 54.0, 34.0, 26.0, 14.0, 17.0, 14.0, 10.0, 6.0, 12.0, 6.0, 6.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006442070007324219, -0.0006216391921043396, -0.0005990713834762573, -0.000576503574848175, -0.0005539357662200928, -0.0005313679575920105, -0.0005088001489639282, -0.00048623234033584595, -0.00046366453170776367, -0.0004410967230796814, -0.0004185289144515991, -0.00039596110582351685, -0.00037339329719543457, -0.0003508254885673523, -0.00032825767993927, -0.00030568987131118774, -0.00028312206268310547, -0.0002605542540550232, -0.00023798644542694092, -0.00021541863679885864, -0.00019285082817077637, -0.0001702830195426941, -0.00014771521091461182, -0.00012514740228652954, -0.00010257959365844727, -8.001178503036499e-05, -5.7443976402282715e-05, -3.487616777420044e-05, -1.2308359146118164e-05, 1.0259449481964111e-05, 3.282725811004639e-05, 5.539506673812866e-05, 7.796287536621094e-05, 0.00010053068399429321, 0.0001230984926223755, 0.00014566630125045776, 0.00016823410987854004, 0.00019080191850662231, 0.0002133697271347046, 0.00023593753576278687, 0.00025850534439086914, 0.0002810731530189514, 0.0003036409616470337, 0.00032620877027511597, 0.00034877657890319824, 0.0003713443875312805, 0.0003939121961593628, 0.00041648000478744507, 0.00043904781341552734, 0.0004616156220436096, 0.0004841834306716919, 0.0005067512392997742, 0.0005293190479278564, 0.0005518868565559387, 0.000574454665184021, 0.0005970224738121033, 0.0006195902824401855, 0.0006421580910682678, 0.0006647258996963501, 0.0006872937083244324, 0.0007098615169525146, 0.0007324293255805969, 0.0007549971342086792, 0.0007775649428367615, 0.0008001327514648438]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 8.0, 15.0, 12.0, 22.0, 31.0, 45.0, 82.0, 155.0, 342.0, 981.0, 4998.0, 41729.0, 765922.0, 215949.0, 14861.0, 2281.0, 572.0, 226.0, 129.0, 81.0, 48.0, 35.0, 16.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.65625, -8.375, -8.09375, -7.8125, -7.53125, -7.25, -6.96875, -6.6875, -6.40625, -6.125, -5.84375, -5.5625, -5.28125, -5.0, -4.71875, -4.4375, -4.15625, -3.875, -3.59375, -3.3125, -3.03125, -2.75, -2.46875, -2.1875, -1.90625, -1.625, -1.34375, -1.0625, -0.78125, -0.5, -0.21875, 0.0625, 0.34375, 0.625, 0.90625, 1.1875, 1.46875, 1.75, 2.03125, 2.3125, 2.59375, 2.875, 3.15625, 3.4375, 3.71875, 4.0, 4.28125, 4.5625, 4.84375, 5.125, 5.40625, 5.6875, 5.96875, 6.25, 6.53125, 6.8125, 7.09375, 7.375, 7.65625, 7.9375, 8.21875, 8.5, 8.78125, 9.0625, 9.34375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 11.0, 24.0, 54.0, 122.0, 258.0, 257.0, 132.0, 75.0, 27.0, 15.0, 6.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.3978271484375, -11.053466796875, -10.7091064453125, -10.36474609375, -10.0203857421875, -9.676025390625, -9.3316650390625, -8.9873046875, -8.6429443359375, -8.298583984375, -7.9542236328125, -7.60986328125, -7.2655029296875, -6.921142578125, -6.5767822265625, -6.232421875, -5.8880615234375, -5.543701171875, -5.1993408203125, -4.85498046875, -4.5106201171875, -4.166259765625, -3.8218994140625, -3.4775390625, -3.1331787109375, -2.788818359375, -2.4444580078125, -2.10009765625, -1.7557373046875, -1.411376953125, -1.0670166015625, -0.72265625, -0.3782958984375, -0.033935546875, 0.3104248046875, 0.65478515625, 0.9991455078125, 1.343505859375, 1.6878662109375, 2.0322265625, 2.3765869140625, 2.720947265625, 3.0653076171875, 3.40966796875, 3.7540283203125, 4.098388671875, 4.4427490234375, 4.787109375, 5.1314697265625, 5.475830078125, 5.8201904296875, 6.16455078125, 6.5089111328125, 6.853271484375, 7.1976318359375, 7.5419921875, 7.8863525390625, 8.230712890625, 8.5750732421875, 8.91943359375, 9.2637939453125, 9.608154296875, 9.9525146484375, 10.296875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 24.0, 66.0, 130.0, 212.0, 228.0, 175.0, 93.0, 43.0, 20.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-236.34735107421875, -231.90211486816406, -227.4568634033203, -223.01162719726562, -218.56639099121094, -214.12115478515625, -209.6759033203125, -205.2306671142578, -200.78543090820312, -196.34019470214844, -191.8949432373047, -187.44970703125, -183.0044708251953, -178.55923461914062, -174.11398315429688, -169.6687469482422, -165.2235107421875, -160.7782745361328, -156.33302307128906, -151.88778686523438, -147.4425506591797, -142.997314453125, -138.55206298828125, -134.10682678222656, -129.6615753173828, -125.2163314819336, -120.7710952758789, -116.32585144042969, -111.880615234375, -107.43537139892578, -102.99012756347656, -98.54489135742188, -94.09964752197266, -89.65440368652344, -85.20916748046875, -80.76392364501953, -76.31868743896484, -71.87344360351562, -67.42820739746094, -62.98296356201172, -58.537723541259766, -54.09248352050781, -49.64724349975586, -45.202003479003906, -40.75675964355469, -36.3115234375, -31.86627960205078, -27.421039581298828, -22.975799560546875, -18.530559539794922, -14.085318565368652, -9.640077590942383, -5.19483757019043, -0.7495975494384766, 3.6956443786621094, 8.140884399414062, 12.586124420166016, 17.03136444091797, 21.476604461669922, 25.921846389770508, 30.36708641052246, 34.81232452392578, 39.257568359375, 43.70280838012695, 48.148048400878906]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 9.0, 5.0, 13.0, 11.0, 15.0, 12.0, 20.0, 24.0, 21.0, 23.0, 37.0, 20.0, 26.0, 33.0, 38.0, 34.0, 37.0, 48.0, 50.0, 41.0, 47.0, 40.0, 39.0, 40.0, 29.0, 34.0, 35.0, 25.0, 32.0, 17.0, 25.0, 14.0, 19.0, 18.0, 8.0, 13.0, 11.0, 6.0, 5.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-50.81325149536133, -49.17613220214844, -47.53900909423828, -45.90188980102539, -44.2647705078125, -42.62765121459961, -40.99053192138672, -39.35340881347656, -37.71628952026367, -36.07917022705078, -34.442047119140625, -32.804927825927734, -31.167808532714844, -29.530689239501953, -27.89356803894043, -26.256446838378906, -24.619327545166016, -22.982208251953125, -21.3450870513916, -19.707965850830078, -18.070846557617188, -16.433727264404297, -14.796606063842773, -13.159485816955566, -11.52236557006836, -9.885245323181152, -8.248125076293945, -6.611004829406738, -4.973884582519531, -3.336764335632324, -1.6996440887451172, -0.06252384185791016, 1.5745964050292969, 3.211716651916504, 4.848836898803711, 6.485957145690918, 8.123077392578125, 9.760197639465332, 11.397317886352539, 13.034438133239746, 14.671558380126953, 16.308677673339844, 17.945798873901367, 19.58292007446289, 21.22003936767578, 22.857158660888672, 24.494279861450195, 26.13140106201172, 27.76852035522461, 29.4056396484375, 31.042760848999023, 32.67988204956055, 34.31700134277344, 35.95412063598633, 37.59123992919922, 39.228363037109375, 40.865482330322266, 42.502601623535156, 44.13972473144531, 45.7768440246582, 47.413963317871094, 49.051082611083984, 50.688201904296875, 52.32532501220703, 53.96244430541992]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 18.0, 20.0, 15.0, 22.0, 40.0, 64.0, 99.0, 125.0, 227.0, 419.0, 749.0, 1430.0, 3247.0, 8929.0, 36846.0, 1076760.0, 3008133.0, 41495.0, 9358.0, 3283.0, 1423.0, 660.0, 351.0, 205.0, 140.0, 64.0, 47.0, 30.0, 11.0, 13.0, 8.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.65625, -39.587158203125, -38.51806640625, -37.448974609375, -36.3798828125, -35.310791015625, -34.24169921875, -33.172607421875, -32.103515625, -31.034423828125, -29.96533203125, -28.896240234375, -27.8271484375, -26.758056640625, -25.68896484375, -24.619873046875, -23.55078125, -22.481689453125, -21.41259765625, -20.343505859375, -19.2744140625, -18.205322265625, -17.13623046875, -16.067138671875, -14.998046875, -13.928955078125, -12.85986328125, -11.790771484375, -10.7216796875, -9.652587890625, -8.58349609375, -7.514404296875, -6.4453125, -5.376220703125, -4.30712890625, -3.238037109375, -2.1689453125, -1.099853515625, -0.03076171875, 1.038330078125, 2.107421875, 3.176513671875, 4.24560546875, 5.314697265625, 6.3837890625, 7.452880859375, 8.52197265625, 9.591064453125, 10.66015625, 11.729248046875, 12.79833984375, 13.867431640625, 14.9365234375, 16.005615234375, 17.07470703125, 18.143798828125, 19.212890625, 20.281982421875, 21.35107421875, 22.420166015625, 23.4892578125, 24.558349609375, 25.62744140625, 26.696533203125, 27.765625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 17.0, 22.0, 20.0, 28.0, 40.0, 47.0, 65.0, 70.0, 72.0, 90.0, 88.0, 80.0, 81.0, 63.0, 41.0, 45.0, 26.0, 25.0, 12.0, 16.0, 9.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9609375, -5.7900390625, -5.619140625, -5.4482421875, -5.27734375, -5.1064453125, -4.935546875, -4.7646484375, -4.59375, -4.4228515625, -4.251953125, -4.0810546875, -3.91015625, -3.7392578125, -3.568359375, -3.3974609375, -3.2265625, -3.0556640625, -2.884765625, -2.7138671875, -2.54296875, -2.3720703125, -2.201171875, -2.0302734375, -1.859375, -1.6884765625, -1.517578125, -1.3466796875, -1.17578125, -1.0048828125, -0.833984375, -0.6630859375, -0.4921875, -0.3212890625, -0.150390625, 0.0205078125, 0.19140625, 0.3623046875, 0.533203125, 0.7041015625, 0.875, 1.0458984375, 1.216796875, 1.3876953125, 1.55859375, 1.7294921875, 1.900390625, 2.0712890625, 2.2421875, 2.4130859375, 2.583984375, 2.7548828125, 2.92578125, 3.0966796875, 3.267578125, 3.4384765625, 3.609375, 3.7802734375, 3.951171875, 4.1220703125, 4.29296875, 4.4638671875, 4.634765625, 4.8056640625, 4.9765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 6.0, 5.0, 9.0, 12.0, 12.0, 23.0, 19.0, 26.0, 38.0, 35.0, 66.0, 85.0, 143.0, 248.0, 456.0, 712.0, 1379.0, 2862.0, 6199.0, 15002.0, 43784.0, 208172.0, 3494761.0, 332116.0, 56108.0, 17937.0, 7141.0, 3209.0, 1565.0, 855.0, 444.0, 299.0, 140.0, 113.0, 70.0, 51.0, 46.0, 23.0, 27.0, 12.0, 8.0, 17.0, 14.0, 7.0, 10.0, 4.0, 4.0, 6.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-14.4453125, -13.9881591796875, -13.531005859375, -13.0738525390625, -12.61669921875, -12.1595458984375, -11.702392578125, -11.2452392578125, -10.7880859375, -10.3309326171875, -9.873779296875, -9.4166259765625, -8.95947265625, -8.5023193359375, -8.045166015625, -7.5880126953125, -7.130859375, -6.6737060546875, -6.216552734375, -5.7593994140625, -5.30224609375, -4.8450927734375, -4.387939453125, -3.9307861328125, -3.4736328125, -3.0164794921875, -2.559326171875, -2.1021728515625, -1.64501953125, -1.1878662109375, -0.730712890625, -0.2735595703125, 0.18359375, 0.6407470703125, 1.097900390625, 1.5550537109375, 2.01220703125, 2.4693603515625, 2.926513671875, 3.3836669921875, 3.8408203125, 4.2979736328125, 4.755126953125, 5.2122802734375, 5.66943359375, 6.1265869140625, 6.583740234375, 7.0408935546875, 7.498046875, 7.9552001953125, 8.412353515625, 8.8695068359375, 9.32666015625, 9.7838134765625, 10.240966796875, 10.6981201171875, 11.1552734375, 11.6124267578125, 12.069580078125, 12.5267333984375, 12.98388671875, 13.4410400390625, 13.898193359375, 14.3553466796875, 14.8125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 8.0, 6.0, 12.0, 14.0, 14.0, 29.0, 50.0, 82.0, 167.0, 461.0, 2386.0, 481.0, 154.0, 70.0, 45.0, 30.0, 11.0, 13.0, 8.0, 10.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34375, -6.061767578125, -5.77978515625, -5.497802734375, -5.2158203125, -4.933837890625, -4.65185546875, -4.369873046875, -4.087890625, -3.805908203125, -3.52392578125, -3.241943359375, -2.9599609375, -2.677978515625, -2.39599609375, -2.114013671875, -1.83203125, -1.550048828125, -1.26806640625, -0.986083984375, -0.7041015625, -0.422119140625, -0.14013671875, 0.141845703125, 0.423828125, 0.705810546875, 0.98779296875, 1.269775390625, 1.5517578125, 1.833740234375, 2.11572265625, 2.397705078125, 2.6796875, 2.961669921875, 3.24365234375, 3.525634765625, 3.8076171875, 4.089599609375, 4.37158203125, 4.653564453125, 4.935546875, 5.217529296875, 5.49951171875, 5.781494140625, 6.0634765625, 6.345458984375, 6.62744140625, 6.909423828125, 7.19140625, 7.473388671875, 7.75537109375, 8.037353515625, 8.3193359375, 8.601318359375, 8.88330078125, 9.165283203125, 9.447265625, 9.729248046875, 10.01123046875, 10.293212890625, 10.5751953125, 10.857177734375, 11.13916015625, 11.421142578125, 11.703125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 15.0, 28.0, 59.0, 98.0, 179.0, 193.0, 162.0, 98.0, 69.0, 33.0, 16.0, 11.0, 11.0, 7.0, 5.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.06459426879883, -41.681396484375, -40.29819869995117, -38.915000915527344, -37.531803131103516, -36.14860534667969, -34.765403747558594, -33.38220977783203, -31.99901008605957, -30.615812301635742, -29.232614517211914, -27.849414825439453, -26.466217041015625, -25.083019256591797, -23.69982147216797, -22.31662368774414, -20.933425903320312, -19.550228118896484, -18.167030334472656, -16.783832550048828, -15.400633811950684, -14.017436027526855, -12.634237289428711, -11.251039505004883, -9.867841720581055, -8.484643936157227, -7.10144567489624, -5.718247413635254, -4.335049629211426, -2.9518518447875977, -1.5686531066894531, -0.185455322265625, 1.1977386474609375, 2.5809366703033447, 3.964134693145752, 5.347332954406738, 6.730530738830566, 8.113728523254395, 9.496927261352539, 10.880125045776367, 12.263322830200195, 13.646520614624023, 15.029718399047852, 16.412918090820312, 17.79611587524414, 19.17931365966797, 20.562511444091797, 21.945709228515625, 23.328907012939453, 24.71210479736328, 26.09530258178711, 27.478500366210938, 28.861698150634766, 30.244895935058594, 31.628095626831055, 33.01129150390625, 34.394493103027344, 35.77769088745117, 37.160888671875, 38.54408645629883, 39.927284240722656, 41.310482025146484, 42.69367980957031, 44.076881408691406, 45.46007537841797]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 6.0, 5.0, 3.0, 6.0, 9.0, 17.0, 10.0, 19.0, 20.0, 26.0, 38.0, 29.0, 31.0, 42.0, 34.0, 33.0, 54.0, 36.0, 44.0, 45.0, 49.0, 55.0, 41.0, 39.0, 47.0, 32.0, 29.0, 34.0, 27.0, 24.0, 16.0, 22.0, 17.0, 12.0, 8.0, 8.0, 9.0, 5.0, 1.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.48480224609375, -16.882612228393555, -16.28042221069336, -15.67823314666748, -15.076044082641602, -14.473854064941406, -13.871664047241211, -13.269474029541016, -12.667284965515137, -12.065094947814941, -11.462905883789062, -10.860715866088867, -10.258525848388672, -9.656336784362793, -9.054146766662598, -8.451957702636719, -7.849767684936523, -7.247578144073486, -6.645388603210449, -6.043198585510254, -5.441009044647217, -4.83881950378418, -4.236629486083984, -3.6344399452209473, -3.03225040435791, -2.430060863494873, -1.8278710842132568, -1.2256814241409302, -0.6234917640686035, -0.021302223205566406, 0.5808875560760498, 1.183077335357666, 1.7852668762207031, 2.3874564170837402, 2.9896461963653564, 3.5918359756469727, 4.19402551651001, 4.796215057373047, 5.398405075073242, 6.000594615936279, 6.602784156799316, 7.2049736976623535, 7.807163238525391, 8.409353256225586, 9.011543273925781, 9.61373233795166, 10.215922355651855, 10.818111419677734, 11.42030143737793, 12.022491455078125, 12.624680519104004, 13.2268705368042, 13.829059600830078, 14.431249618530273, 15.033439636230469, 15.635629653930664, 16.23781967163086, 16.840009689331055, 17.44219970703125, 18.044387817382812, 18.646577835083008, 19.248767852783203, 19.8509578704834, 20.453147888183594, 21.055335998535156]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 10.0, 11.0, 24.0, 22.0, 33.0, 49.0, 87.0, 133.0, 230.0, 368.0, 666.0, 1287.0, 2579.0, 5851.0, 16476.0, 58241.0, 222479.0, 488649.0, 180636.0, 46833.0, 13860.0, 5103.0, 2285.0, 1098.0, 602.0, 345.0, 234.0, 125.0, 74.0, 50.0, 30.0, 20.0, 12.0, 20.0, 8.0, 9.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.625, -18.0322265625, -17.439453125, -16.8466796875, -16.25390625, -15.6611328125, -15.068359375, -14.4755859375, -13.8828125, -13.2900390625, -12.697265625, -12.1044921875, -11.51171875, -10.9189453125, -10.326171875, -9.7333984375, -9.140625, -8.5478515625, -7.955078125, -7.3623046875, -6.76953125, -6.1767578125, -5.583984375, -4.9912109375, -4.3984375, -3.8056640625, -3.212890625, -2.6201171875, -2.02734375, -1.4345703125, -0.841796875, -0.2490234375, 0.34375, 0.9365234375, 1.529296875, 2.1220703125, 2.71484375, 3.3076171875, 3.900390625, 4.4931640625, 5.0859375, 5.6787109375, 6.271484375, 6.8642578125, 7.45703125, 8.0498046875, 8.642578125, 9.2353515625, 9.828125, 10.4208984375, 11.013671875, 11.6064453125, 12.19921875, 12.7919921875, 13.384765625, 13.9775390625, 14.5703125, 15.1630859375, 15.755859375, 16.3486328125, 16.94140625, 17.5341796875, 18.126953125, 18.7197265625, 19.3125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 10.0, 14.0, 16.0, 31.0, 34.0, 36.0, 52.0, 56.0, 76.0, 95.0, 81.0, 85.0, 92.0, 71.0, 52.0, 47.0, 36.0, 31.0, 24.0, 15.0, 9.0, 8.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.06640625, -5.8868408203125, -5.707275390625, -5.5277099609375, -5.34814453125, -5.1685791015625, -4.989013671875, -4.8094482421875, -4.6298828125, -4.4503173828125, -4.270751953125, -4.0911865234375, -3.91162109375, -3.7320556640625, -3.552490234375, -3.3729248046875, -3.193359375, -3.0137939453125, -2.834228515625, -2.6546630859375, -2.47509765625, -2.2955322265625, -2.115966796875, -1.9364013671875, -1.7568359375, -1.5772705078125, -1.397705078125, -1.2181396484375, -1.03857421875, -0.8590087890625, -0.679443359375, -0.4998779296875, -0.3203125, -0.1407470703125, 0.038818359375, 0.2183837890625, 0.39794921875, 0.5775146484375, 0.757080078125, 0.9366455078125, 1.1162109375, 1.2957763671875, 1.475341796875, 1.6549072265625, 1.83447265625, 2.0140380859375, 2.193603515625, 2.3731689453125, 2.552734375, 2.7322998046875, 2.911865234375, 3.0914306640625, 3.27099609375, 3.4505615234375, 3.630126953125, 3.8096923828125, 3.9892578125, 4.1688232421875, 4.348388671875, 4.5279541015625, 4.70751953125, 4.8870849609375, 5.066650390625, 5.2462158203125, 5.42578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 15.0, 19.0, 24.0, 33.0, 43.0, 66.0, 115.0, 140.0, 204.0, 331.0, 506.0, 951.0, 2034.0, 5228.0, 16797.0, 68549.0, 291642.0, 482401.0, 132946.0, 31557.0, 8528.0, 3043.0, 1414.0, 714.0, 382.0, 290.0, 183.0, 112.0, 82.0, 50.0, 48.0, 34.0, 23.0, 19.0, 9.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.4453125, -13.9970703125, -13.548828125, -13.1005859375, -12.65234375, -12.2041015625, -11.755859375, -11.3076171875, -10.859375, -10.4111328125, -9.962890625, -9.5146484375, -9.06640625, -8.6181640625, -8.169921875, -7.7216796875, -7.2734375, -6.8251953125, -6.376953125, -5.9287109375, -5.48046875, -5.0322265625, -4.583984375, -4.1357421875, -3.6875, -3.2392578125, -2.791015625, -2.3427734375, -1.89453125, -1.4462890625, -0.998046875, -0.5498046875, -0.1015625, 0.3466796875, 0.794921875, 1.2431640625, 1.69140625, 2.1396484375, 2.587890625, 3.0361328125, 3.484375, 3.9326171875, 4.380859375, 4.8291015625, 5.27734375, 5.7255859375, 6.173828125, 6.6220703125, 7.0703125, 7.5185546875, 7.966796875, 8.4150390625, 8.86328125, 9.3115234375, 9.759765625, 10.2080078125, 10.65625, 11.1044921875, 11.552734375, 12.0009765625, 12.44921875, 12.8974609375, 13.345703125, 13.7939453125, 14.2421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 6.0, 10.0, 9.0, 10.0, 16.0, 15.0, 26.0, 32.0, 36.0, 32.0, 32.0, 54.0, 52.0, 52.0, 50.0, 43.0, 65.0, 58.0, 51.0, 62.0, 37.0, 51.0, 33.0, 22.0, 26.0, 17.0, 13.0, 16.0, 15.0, 11.0, 4.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.703125, -17.1785888671875, -16.654052734375, -16.1295166015625, -15.60498046875, -15.0804443359375, -14.555908203125, -14.0313720703125, -13.5068359375, -12.9822998046875, -12.457763671875, -11.9332275390625, -11.40869140625, -10.8841552734375, -10.359619140625, -9.8350830078125, -9.310546875, -8.7860107421875, -8.261474609375, -7.7369384765625, -7.21240234375, -6.6878662109375, -6.163330078125, -5.6387939453125, -5.1142578125, -4.5897216796875, -4.065185546875, -3.5406494140625, -3.01611328125, -2.4915771484375, -1.967041015625, -1.4425048828125, -0.91796875, -0.3934326171875, 0.131103515625, 0.6556396484375, 1.18017578125, 1.7047119140625, 2.229248046875, 2.7537841796875, 3.2783203125, 3.8028564453125, 4.327392578125, 4.8519287109375, 5.37646484375, 5.9010009765625, 6.425537109375, 6.9500732421875, 7.474609375, 7.9991455078125, 8.523681640625, 9.0482177734375, 9.57275390625, 10.0972900390625, 10.621826171875, 11.1463623046875, 11.6708984375, 12.1954345703125, 12.719970703125, 13.2445068359375, 13.76904296875, 14.2935791015625, 14.818115234375, 15.3426513671875, 15.8671875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 6.0, 4.0, 10.0, 10.0, 18.0, 30.0, 45.0, 71.0, 103.0, 194.0, 340.0, 624.0, 1260.0, 2883.0, 8335.0, 31600.0, 177677.0, 691549.0, 102529.0, 20804.0, 5984.0, 2215.0, 1013.0, 487.0, 287.0, 147.0, 112.0, 64.0, 44.0, 25.0, 28.0, 10.0, 10.0, 12.0, 5.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.6171875, -12.2794189453125, -11.941650390625, -11.6038818359375, -11.26611328125, -10.9283447265625, -10.590576171875, -10.2528076171875, -9.9150390625, -9.5772705078125, -9.239501953125, -8.9017333984375, -8.56396484375, -8.2261962890625, -7.888427734375, -7.5506591796875, -7.212890625, -6.8751220703125, -6.537353515625, -6.1995849609375, -5.86181640625, -5.5240478515625, -5.186279296875, -4.8485107421875, -4.5107421875, -4.1729736328125, -3.835205078125, -3.4974365234375, -3.15966796875, -2.8218994140625, -2.484130859375, -2.1463623046875, -1.80859375, -1.4708251953125, -1.133056640625, -0.7952880859375, -0.45751953125, -0.1197509765625, 0.218017578125, 0.5557861328125, 0.8935546875, 1.2313232421875, 1.569091796875, 1.9068603515625, 2.24462890625, 2.5823974609375, 2.920166015625, 3.2579345703125, 3.595703125, 3.9334716796875, 4.271240234375, 4.6090087890625, 4.94677734375, 5.2845458984375, 5.622314453125, 5.9600830078125, 6.2978515625, 6.6356201171875, 6.973388671875, 7.3111572265625, 7.64892578125, 7.9866943359375, 8.324462890625, 8.6622314453125, 9.0]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 8.0, 4.0, 4.0, 3.0, 12.0, 13.0, 16.0, 22.0, 34.0, 40.0, 35.0, 57.0, 75.0, 121.0, 204.0, 80.0, 56.0, 46.0, 35.0, 33.0, 35.0, 19.0, 16.0, 12.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008978843688964844, -0.0008607879281044006, -0.0008236914873123169, -0.0007865950465202332, -0.0007494986057281494, -0.0007124021649360657, -0.0006753057241439819, -0.0006382092833518982, -0.0006011128425598145, -0.0005640164017677307, -0.000526919960975647, -0.0004898235201835632, -0.0004527270793914795, -0.00041563063859939575, -0.000378534197807312, -0.00034143775701522827, -0.00030434131622314453, -0.0002672448754310608, -0.00023014843463897705, -0.0001930519938468933, -0.00015595555305480957, -0.00011885911226272583, -8.176267147064209e-05, -4.466623067855835e-05, -7.569789886474609e-06, 2.952665090560913e-05, 6.662309169769287e-05, 0.00010371953248977661, 0.00014081597328186035, 0.0001779124140739441, 0.00021500885486602783, 0.00025210529565811157, 0.0002892017364501953, 0.00032629817724227905, 0.0003633946180343628, 0.00040049105882644653, 0.0004375874996185303, 0.000474683940410614, 0.0005117803812026978, 0.0005488768219947815, 0.0005859732627868652, 0.000623069703578949, 0.0006601661443710327, 0.0006972625851631165, 0.0007343590259552002, 0.0007714554667472839, 0.0008085519075393677, 0.0008456483483314514, 0.0008827447891235352, 0.0009198412299156189, 0.0009569376707077026, 0.0009940341114997864, 0.0010311305522918701, 0.0010682269930839539, 0.0011053234338760376, 0.0011424198746681213, 0.001179516315460205, 0.0012166127562522888, 0.0012537091970443726, 0.0012908056378364563, 0.00132790207862854, 0.0013649985194206238, 0.0014020949602127075, 0.0014391914010047913, 0.001476287841796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 17.0, 16.0, 52.0, 107.0, 323.0, 1265.0, 12126.0, 865292.0, 164023.0, 4370.0, 685.0, 170.0, 53.0, 31.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.46875, -31.508544921875, -30.54833984375, -29.588134765625, -28.6279296875, -27.667724609375, -26.70751953125, -25.747314453125, -24.787109375, -23.826904296875, -22.86669921875, -21.906494140625, -20.9462890625, -19.986083984375, -19.02587890625, -18.065673828125, -17.10546875, -16.145263671875, -15.18505859375, -14.224853515625, -13.2646484375, -12.304443359375, -11.34423828125, -10.384033203125, -9.423828125, -8.463623046875, -7.50341796875, -6.543212890625, -5.5830078125, -4.622802734375, -3.66259765625, -2.702392578125, -1.7421875, -0.781982421875, 0.17822265625, 1.138427734375, 2.0986328125, 3.058837890625, 4.01904296875, 4.979248046875, 5.939453125, 6.899658203125, 7.85986328125, 8.820068359375, 9.7802734375, 10.740478515625, 11.70068359375, 12.660888671875, 13.62109375, 14.581298828125, 15.54150390625, 16.501708984375, 17.4619140625, 18.422119140625, 19.38232421875, 20.342529296875, 21.302734375, 22.262939453125, 23.22314453125, 24.183349609375, 25.1435546875, 26.103759765625, 27.06396484375, 28.024169921875, 28.984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 4.0, 3.0, 6.0, 18.0, 15.0, 33.0, 26.0, 42.0, 85.0, 121.0, 251.0, 154.0, 82.0, 55.0, 43.0, 12.0, 16.0, 11.0, 5.0, 9.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3125, -13.8291015625, -13.345703125, -12.8623046875, -12.37890625, -11.8955078125, -11.412109375, -10.9287109375, -10.4453125, -9.9619140625, -9.478515625, -8.9951171875, -8.51171875, -8.0283203125, -7.544921875, -7.0615234375, -6.578125, -6.0947265625, -5.611328125, -5.1279296875, -4.64453125, -4.1611328125, -3.677734375, -3.1943359375, -2.7109375, -2.2275390625, -1.744140625, -1.2607421875, -0.77734375, -0.2939453125, 0.189453125, 0.6728515625, 1.15625, 1.6396484375, 2.123046875, 2.6064453125, 3.08984375, 3.5732421875, 4.056640625, 4.5400390625, 5.0234375, 5.5068359375, 5.990234375, 6.4736328125, 6.95703125, 7.4404296875, 7.923828125, 8.4072265625, 8.890625, 9.3740234375, 9.857421875, 10.3408203125, 10.82421875, 11.3076171875, 11.791015625, 12.2744140625, 12.7578125, 13.2412109375, 13.724609375, 14.2080078125, 14.69140625, 15.1748046875, 15.658203125, 16.1416015625, 16.625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 12.0, 34.0, 39.0, 78.0, 119.0, 156.0, 154.0, 139.0, 94.0, 66.0, 40.0, 27.0, 12.0, 10.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.95598602294922, -112.48455047607422, -108.01312255859375, -103.54168701171875, -99.07025146484375, -94.59881591796875, -90.12738037109375, -85.65595245361328, -81.18451690673828, -76.71308135986328, -72.24165344238281, -67.77021789550781, -63.29878234863281, -58.82734680175781, -54.35591506958008, -49.884483337402344, -45.413047790527344, -40.941612243652344, -36.47018051147461, -31.998746871948242, -27.527313232421875, -23.055879592895508, -18.58444595336914, -14.113012313842773, -9.641578674316406, -5.170145034790039, -0.6987113952636719, 3.7727222442626953, 8.244155883789062, 12.71558952331543, 17.187023162841797, 21.658456802368164, 26.1298828125, 30.601316452026367, 35.072750091552734, 39.54418182373047, 44.01561737060547, 48.48705291748047, 52.9584846496582, 57.42991638183594, 61.90135192871094, 66.37278747558594, 70.84422302246094, 75.3156509399414, 79.7870864868164, 84.2585220336914, 88.72994995117188, 93.20138549804688, 97.67282104492188, 102.14425659179688, 106.61569213867188, 111.08712005615234, 115.55855560302734, 120.02999114990234, 124.50141906738281, 128.9728546142578, 133.4442901611328, 137.9157257080078, 142.3871612548828, 146.8585968017578, 151.33001708984375, 155.80145263671875, 160.27288818359375, 164.74432373046875, 169.21575927734375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 9.0, 4.0, 5.0, 6.0, 12.0, 9.0, 14.0, 20.0, 22.0, 15.0, 19.0, 32.0, 41.0, 29.0, 27.0, 22.0, 30.0, 45.0, 40.0, 47.0, 40.0, 50.0, 43.0, 51.0, 36.0, 38.0, 40.0, 34.0, 29.0, 29.0, 19.0, 17.0, 16.0, 19.0, 11.0, 20.0, 11.0, 9.0, 8.0, 6.0, 7.0, 0.0, 4.0, 6.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-78.79454040527344, -76.16157531738281, -73.52861022949219, -70.8956527709961, -68.26268768310547, -65.62972259521484, -62.99675750732422, -60.363792419433594, -57.730831146240234, -55.09786605834961, -52.46490478515625, -49.831939697265625, -47.198974609375, -44.56601333618164, -41.933048248291016, -39.300086975097656, -36.66712188720703, -34.034156799316406, -31.401195526123047, -28.768230438232422, -26.13526725769043, -23.502304077148438, -20.869338989257812, -18.23637580871582, -15.603412628173828, -12.970449447631836, -10.337485313415527, -7.704521656036377, -5.071557998657227, -2.4385948181152344, 0.19436931610107422, 2.827333450317383, 5.460289001464844, 8.093252182006836, 10.726216316223145, 13.359180450439453, 15.992143630981445, 18.625106811523438, 21.258071899414062, 23.891035079956055, 26.523998260498047, 29.15696144104004, 31.78992462158203, 34.422889709472656, 37.05585479736328, 39.68881607055664, 42.321781158447266, 44.954742431640625, 47.58770751953125, 50.220672607421875, 52.853633880615234, 55.48659896850586, 58.11956024169922, 60.752525329589844, 63.38549041748047, 66.0184555053711, 68.65141296386719, 71.28437805175781, 73.91734313964844, 76.55030059814453, 79.18326568603516, 81.81623077392578, 84.4491958618164, 87.08216094970703, 89.71512603759766]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 10.0, 5.0, 12.0, 16.0, 25.0, 40.0, 75.0, 118.0, 214.0, 348.0, 615.0, 1195.0, 2786.0, 7593.0, 26600.0, 167331.0, 3731645.0, 211548.0, 30302.0, 8372.0, 3032.0, 1194.0, 552.0, 288.0, 142.0, 88.0, 64.0, 29.0, 18.0, 11.0, 12.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9375, -34.053955078125, -33.17041015625, -32.286865234375, -31.4033203125, -30.519775390625, -29.63623046875, -28.752685546875, -27.869140625, -26.985595703125, -26.10205078125, -25.218505859375, -24.3349609375, -23.451416015625, -22.56787109375, -21.684326171875, -20.80078125, -19.917236328125, -19.03369140625, -18.150146484375, -17.2666015625, -16.383056640625, -15.49951171875, -14.615966796875, -13.732421875, -12.848876953125, -11.96533203125, -11.081787109375, -10.1982421875, -9.314697265625, -8.43115234375, -7.547607421875, -6.6640625, -5.780517578125, -4.89697265625, -4.013427734375, -3.1298828125, -2.246337890625, -1.36279296875, -0.479248046875, 0.404296875, 1.287841796875, 2.17138671875, 3.054931640625, 3.9384765625, 4.822021484375, 5.70556640625, 6.589111328125, 7.47265625, 8.356201171875, 9.23974609375, 10.123291015625, 11.0068359375, 11.890380859375, 12.77392578125, 13.657470703125, 14.541015625, 15.424560546875, 16.30810546875, 17.191650390625, 18.0751953125, 18.958740234375, 19.84228515625, 20.725830078125, 21.609375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 8.0, 18.0, 23.0, 28.0, 32.0, 59.0, 52.0, 60.0, 59.0, 65.0, 75.0, 81.0, 58.0, 61.0, 64.0, 43.0, 54.0, 25.0, 25.0, 22.0, 19.0, 19.0, 8.0, 6.0, 1.0, 9.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.359375, -6.17718505859375, -5.9949951171875, -5.81280517578125, -5.630615234375, -5.44842529296875, -5.2662353515625, -5.08404541015625, -4.90185546875, -4.71966552734375, -4.5374755859375, -4.35528564453125, -4.173095703125, -3.99090576171875, -3.8087158203125, -3.62652587890625, -3.4443359375, -3.26214599609375, -3.0799560546875, -2.89776611328125, -2.715576171875, -2.53338623046875, -2.3511962890625, -2.16900634765625, -1.98681640625, -1.80462646484375, -1.6224365234375, -1.44024658203125, -1.258056640625, -1.07586669921875, -0.8936767578125, -0.71148681640625, -0.529296875, -0.34710693359375, -0.1649169921875, 0.01727294921875, 0.199462890625, 0.38165283203125, 0.5638427734375, 0.74603271484375, 0.92822265625, 1.11041259765625, 1.2926025390625, 1.47479248046875, 1.656982421875, 1.83917236328125, 2.0213623046875, 2.20355224609375, 2.3857421875, 2.56793212890625, 2.7501220703125, 2.93231201171875, 3.114501953125, 3.29669189453125, 3.4788818359375, 3.66107177734375, 3.84326171875, 4.02545166015625, 4.2076416015625, 4.38983154296875, 4.572021484375, 4.75421142578125, 4.9364013671875, 5.11859130859375, 5.30078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 5.0, 0.0, 10.0, 11.0, 13.0, 32.0, 42.0, 50.0, 59.0, 109.0, 195.0, 262.0, 442.0, 874.0, 1949.0, 4702.0, 15168.0, 70050.0, 1129623.0, 2847098.0, 95217.0, 18408.0, 5475.0, 2183.0, 932.0, 477.0, 324.0, 171.0, 105.0, 72.0, 68.0, 40.0, 20.0, 28.0, 20.0, 10.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.5, -18.87255859375, -18.2451171875, -17.61767578125, -16.990234375, -16.36279296875, -15.7353515625, -15.10791015625, -14.48046875, -13.85302734375, -13.2255859375, -12.59814453125, -11.970703125, -11.34326171875, -10.7158203125, -10.08837890625, -9.4609375, -8.83349609375, -8.2060546875, -7.57861328125, -6.951171875, -6.32373046875, -5.6962890625, -5.06884765625, -4.44140625, -3.81396484375, -3.1865234375, -2.55908203125, -1.931640625, -1.30419921875, -0.6767578125, -0.04931640625, 0.578125, 1.20556640625, 1.8330078125, 2.46044921875, 3.087890625, 3.71533203125, 4.3427734375, 4.97021484375, 5.59765625, 6.22509765625, 6.8525390625, 7.47998046875, 8.107421875, 8.73486328125, 9.3623046875, 9.98974609375, 10.6171875, 11.24462890625, 11.8720703125, 12.49951171875, 13.126953125, 13.75439453125, 14.3818359375, 15.00927734375, 15.63671875, 16.26416015625, 16.8916015625, 17.51904296875, 18.146484375, 18.77392578125, 19.4013671875, 20.02880859375, 20.65625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 15.0, 13.0, 54.0, 106.0, 234.0, 1730.0, 1449.0, 252.0, 103.0, 49.0, 31.0, 8.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.390625, -20.8419189453125, -20.293212890625, -19.7445068359375, -19.19580078125, -18.6470947265625, -18.098388671875, -17.5496826171875, -17.0009765625, -16.4522705078125, -15.903564453125, -15.3548583984375, -14.80615234375, -14.2574462890625, -13.708740234375, -13.1600341796875, -12.611328125, -12.0626220703125, -11.513916015625, -10.9652099609375, -10.41650390625, -9.8677978515625, -9.319091796875, -8.7703857421875, -8.2216796875, -7.6729736328125, -7.124267578125, -6.5755615234375, -6.02685546875, -5.4781494140625, -4.929443359375, -4.3807373046875, -3.83203125, -3.2833251953125, -2.734619140625, -2.1859130859375, -1.63720703125, -1.0885009765625, -0.539794921875, 0.0089111328125, 0.5576171875, 1.1063232421875, 1.655029296875, 2.2037353515625, 2.75244140625, 3.3011474609375, 3.849853515625, 4.3985595703125, 4.947265625, 5.4959716796875, 6.044677734375, 6.5933837890625, 7.14208984375, 7.6907958984375, 8.239501953125, 8.7882080078125, 9.3369140625, 9.8856201171875, 10.434326171875, 10.9830322265625, 11.53173828125, 12.0804443359375, 12.629150390625, 13.1778564453125, 13.7265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 17.0, 59.0, 135.0, 226.0, 258.0, 173.0, 78.0, 33.0, 9.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.23035430908203, -114.17701721191406, -111.12368774414062, -108.07035064697266, -105.01701354980469, -101.96368408203125, -98.91034698486328, -95.85700988769531, -92.80368041992188, -89.7503433227539, -86.69701385498047, -83.6436767578125, -80.59033966064453, -77.53700256347656, -74.48367309570312, -71.43033599853516, -68.37699890136719, -65.32366180419922, -62.270328521728516, -59.21699523925781, -56.163658142089844, -53.11032485961914, -50.05699157714844, -47.00365447998047, -43.950321197509766, -40.89698791503906, -37.843650817871094, -34.79031753540039, -31.736982345581055, -28.68364715576172, -25.630313873291016, -22.57697868347168, -19.523635864257812, -16.470300674438477, -13.416966438293457, -10.363632202148438, -7.310297012329102, -4.256961822509766, -1.2036285400390625, 1.8497066497802734, 4.903041839599609, 7.956376552581787, 11.009711265563965, 14.063045501708984, 17.11638069152832, 20.169715881347656, 23.22304916381836, 26.276384353637695, 29.32971954345703, 32.383052825927734, 35.4363899230957, 38.489723205566406, 41.543060302734375, 44.59639358520508, 47.64972686767578, 50.70306396484375, 53.75639724731445, 56.809730529785156, 59.863067626953125, 62.91640090942383, 65.96973419189453, 69.0230712890625, 72.07640075683594, 75.1297378540039, 78.18307495117188]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 9.0, 6.0, 7.0, 4.0, 4.0, 9.0, 13.0, 19.0, 15.0, 32.0, 33.0, 63.0, 48.0, 54.0, 59.0, 49.0, 67.0, 65.0, 66.0, 52.0, 60.0, 60.0, 42.0, 41.0, 28.0, 21.0, 25.0, 14.0, 10.0, 12.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.80608367919922, -40.597007751464844, -39.387935638427734, -38.17885971069336, -36.96978759765625, -35.760711669921875, -34.5516357421875, -33.342559814453125, -32.133487701416016, -30.924413681030273, -29.71533966064453, -28.506263732910156, -27.297189712524414, -26.088115692138672, -24.879039764404297, -23.669965744018555, -22.460891723632812, -21.25181770324707, -20.042743682861328, -18.833667755126953, -17.62459373474121, -16.41551971435547, -15.20644474029541, -13.997369766235352, -12.78829574584961, -11.579221725463867, -10.370146751403809, -9.16107177734375, -7.951997756958008, -6.742923259735107, -5.533848762512207, -4.324773788452148, -3.1156959533691406, -1.9066214561462402, -0.6975469589233398, 0.5115275382995605, 1.720602035522461, 2.9296765327453613, 4.138751029968262, 5.34782600402832, 6.5569000244140625, 7.765974521636963, 8.975049018859863, 10.184123992919922, 11.393198013305664, 12.602272033691406, 13.811347007751465, 15.020421981811523, 16.229496002197266, 17.438570022583008, 18.64764404296875, 19.856719970703125, 21.065793991088867, 22.27486801147461, 23.483943939208984, 24.693017959594727, 25.90209197998047, 27.11116600036621, 28.320240020751953, 29.529315948486328, 30.73838996887207, 31.947463989257812, 33.15653991699219, 34.36561584472656, 35.57468795776367]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 8.0, 8.0, 14.0, 21.0, 27.0, 43.0, 73.0, 89.0, 148.0, 287.0, 425.0, 797.0, 1512.0, 3241.0, 8300.0, 25443.0, 96595.0, 347989.0, 393418.0, 121942.0, 30829.0, 9737.0, 3793.0, 1686.0, 902.0, 449.0, 296.0, 173.0, 100.0, 58.0, 48.0, 25.0, 24.0, 11.0, 6.0, 8.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.392578125, -17.80078125, -17.208984375, -16.6171875, -16.025390625, -15.43359375, -14.841796875, -14.25, -13.658203125, -13.06640625, -12.474609375, -11.8828125, -11.291015625, -10.69921875, -10.107421875, -9.515625, -8.923828125, -8.33203125, -7.740234375, -7.1484375, -6.556640625, -5.96484375, -5.373046875, -4.78125, -4.189453125, -3.59765625, -3.005859375, -2.4140625, -1.822265625, -1.23046875, -0.638671875, -0.046875, 0.544921875, 1.13671875, 1.728515625, 2.3203125, 2.912109375, 3.50390625, 4.095703125, 4.6875, 5.279296875, 5.87109375, 6.462890625, 7.0546875, 7.646484375, 8.23828125, 8.830078125, 9.421875, 10.013671875, 10.60546875, 11.197265625, 11.7890625, 12.380859375, 12.97265625, 13.564453125, 14.15625, 14.748046875, 15.33984375, 15.931640625, 16.5234375, 17.115234375, 17.70703125, 18.298828125, 18.890625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 9.0, 8.0, 23.0, 24.0, 50.0, 53.0, 69.0, 59.0, 73.0, 83.0, 80.0, 83.0, 87.0, 68.0, 48.0, 43.0, 30.0, 25.0, 19.0, 19.0, 11.0, 7.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4453125, -7.2398681640625, -7.034423828125, -6.8289794921875, -6.62353515625, -6.4180908203125, -6.212646484375, -6.0072021484375, -5.8017578125, -5.5963134765625, -5.390869140625, -5.1854248046875, -4.97998046875, -4.7745361328125, -4.569091796875, -4.3636474609375, -4.158203125, -3.9527587890625, -3.747314453125, -3.5418701171875, -3.33642578125, -3.1309814453125, -2.925537109375, -2.7200927734375, -2.5146484375, -2.3092041015625, -2.103759765625, -1.8983154296875, -1.69287109375, -1.4874267578125, -1.281982421875, -1.0765380859375, -0.87109375, -0.6656494140625, -0.460205078125, -0.2547607421875, -0.04931640625, 0.1561279296875, 0.361572265625, 0.5670166015625, 0.7724609375, 0.9779052734375, 1.183349609375, 1.3887939453125, 1.59423828125, 1.7996826171875, 2.005126953125, 2.2105712890625, 2.416015625, 2.6214599609375, 2.826904296875, 3.0323486328125, 3.23779296875, 3.4432373046875, 3.648681640625, 3.8541259765625, 4.0595703125, 4.2650146484375, 4.470458984375, 4.6759033203125, 4.88134765625, 5.0867919921875, 5.292236328125, 5.4976806640625, 5.703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 8.0, 10.0, 14.0, 18.0, 29.0, 41.0, 52.0, 76.0, 108.0, 157.0, 216.0, 334.0, 548.0, 1005.0, 1921.0, 4707.0, 13490.0, 50960.0, 216340.0, 479301.0, 208127.0, 49189.0, 13147.0, 4341.0, 1804.0, 939.0, 531.0, 338.0, 229.0, 167.0, 106.0, 88.0, 60.0, 46.0, 34.0, 24.0, 16.0, 14.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4296875, -14.9547119140625, -14.479736328125, -14.0047607421875, -13.52978515625, -13.0548095703125, -12.579833984375, -12.1048583984375, -11.6298828125, -11.1549072265625, -10.679931640625, -10.2049560546875, -9.72998046875, -9.2550048828125, -8.780029296875, -8.3050537109375, -7.830078125, -7.3551025390625, -6.880126953125, -6.4051513671875, -5.93017578125, -5.4552001953125, -4.980224609375, -4.5052490234375, -4.0302734375, -3.5552978515625, -3.080322265625, -2.6053466796875, -2.13037109375, -1.6553955078125, -1.180419921875, -0.7054443359375, -0.23046875, 0.2445068359375, 0.719482421875, 1.1944580078125, 1.66943359375, 2.1444091796875, 2.619384765625, 3.0943603515625, 3.5693359375, 4.0443115234375, 4.519287109375, 4.9942626953125, 5.46923828125, 5.9442138671875, 6.419189453125, 6.8941650390625, 7.369140625, 7.8441162109375, 8.319091796875, 8.7940673828125, 9.26904296875, 9.7440185546875, 10.218994140625, 10.6939697265625, 11.1689453125, 11.6439208984375, 12.118896484375, 12.5938720703125, 13.06884765625, 13.5438232421875, 14.018798828125, 14.4937744140625, 14.96875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 7.0, 3.0, 6.0, 0.0, 9.0, 19.0, 15.0, 32.0, 18.0, 17.0, 34.0, 30.0, 40.0, 29.0, 27.0, 28.0, 47.0, 48.0, 49.0, 49.0, 39.0, 41.0, 43.0, 32.0, 41.0, 34.0, 36.0, 25.0, 38.0, 28.0, 20.0, 15.0, 10.0, 13.0, 14.0, 13.0, 9.0, 5.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.859375, -16.33642578125, -15.8134765625, -15.29052734375, -14.767578125, -14.24462890625, -13.7216796875, -13.19873046875, -12.67578125, -12.15283203125, -11.6298828125, -11.10693359375, -10.583984375, -10.06103515625, -9.5380859375, -9.01513671875, -8.4921875, -7.96923828125, -7.4462890625, -6.92333984375, -6.400390625, -5.87744140625, -5.3544921875, -4.83154296875, -4.30859375, -3.78564453125, -3.2626953125, -2.73974609375, -2.216796875, -1.69384765625, -1.1708984375, -0.64794921875, -0.125, 0.39794921875, 0.9208984375, 1.44384765625, 1.966796875, 2.48974609375, 3.0126953125, 3.53564453125, 4.05859375, 4.58154296875, 5.1044921875, 5.62744140625, 6.150390625, 6.67333984375, 7.1962890625, 7.71923828125, 8.2421875, 8.76513671875, 9.2880859375, 9.81103515625, 10.333984375, 10.85693359375, 11.3798828125, 11.90283203125, 12.42578125, 12.94873046875, 13.4716796875, 13.99462890625, 14.517578125, 15.04052734375, 15.5634765625, 16.08642578125, 16.609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 5.0, 10.0, 9.0, 10.0, 7.0, 19.0, 34.0, 39.0, 74.0, 111.0, 180.0, 296.0, 488.0, 908.0, 1819.0, 4095.0, 10551.0, 34122.0, 150718.0, 514850.0, 250341.0, 54351.0, 15031.0, 5341.0, 2401.0, 1176.0, 617.0, 361.0, 194.0, 115.0, 83.0, 61.0, 37.0, 29.0, 18.0, 12.0, 10.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.3984375, -9.1192626953125, -8.840087890625, -8.5609130859375, -8.28173828125, -8.0025634765625, -7.723388671875, -7.4442138671875, -7.1650390625, -6.8858642578125, -6.606689453125, -6.3275146484375, -6.04833984375, -5.7691650390625, -5.489990234375, -5.2108154296875, -4.931640625, -4.6524658203125, -4.373291015625, -4.0941162109375, -3.81494140625, -3.5357666015625, -3.256591796875, -2.9774169921875, -2.6982421875, -2.4190673828125, -2.139892578125, -1.8607177734375, -1.58154296875, -1.3023681640625, -1.023193359375, -0.7440185546875, -0.46484375, -0.1856689453125, 0.093505859375, 0.3726806640625, 0.65185546875, 0.9310302734375, 1.210205078125, 1.4893798828125, 1.7685546875, 2.0477294921875, 2.326904296875, 2.6060791015625, 2.88525390625, 3.1644287109375, 3.443603515625, 3.7227783203125, 4.001953125, 4.2811279296875, 4.560302734375, 4.8394775390625, 5.11865234375, 5.3978271484375, 5.677001953125, 5.9561767578125, 6.2353515625, 6.5145263671875, 6.793701171875, 7.0728759765625, 7.35205078125, 7.6312255859375, 7.910400390625, 8.1895751953125, 8.46875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 10.0, 12.0, 8.0, 15.0, 15.0, 20.0, 28.0, 33.0, 36.0, 55.0, 59.0, 86.0, 87.0, 89.0, 75.0, 80.0, 65.0, 54.0, 39.0, 21.0, 19.0, 14.0, 14.0, 11.0, 7.0, 6.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011081695556640625, -0.0010747462511062622, -0.001041322946548462, -0.0010078996419906616, -0.0009744763374328613, -0.000941053032875061, -0.0009076297283172607, -0.0008742064237594604, -0.0008407831192016602, -0.0008073598146438599, -0.0007739365100860596, -0.0007405132055282593, -0.000707089900970459, -0.0006736665964126587, -0.0006402432918548584, -0.0006068199872970581, -0.0005733966827392578, -0.0005399733781814575, -0.0005065500736236572, -0.00047312676906585693, -0.00043970346450805664, -0.00040628015995025635, -0.00037285685539245605, -0.00033943355083465576, -0.00030601024627685547, -0.0002725869417190552, -0.00023916363716125488, -0.0002057403326034546, -0.0001723170280456543, -0.000138893723487854, -0.00010547041893005371, -7.204711437225342e-05, -3.8623809814453125e-05, -5.200505256652832e-06, 2.822279930114746e-05, 6.164610385894775e-05, 9.506940841674805e-05, 0.00012849271297454834, 0.00016191601753234863, 0.00019533932209014893, 0.00022876262664794922, 0.0002621859312057495, 0.0002956092357635498, 0.0003290325403213501, 0.0003624558448791504, 0.0003958791494369507, 0.000429302453994751, 0.00046272575855255127, 0.0004961490631103516, 0.0005295723676681519, 0.0005629956722259521, 0.0005964189767837524, 0.0006298422813415527, 0.000663265585899353, 0.0006966888904571533, 0.0007301121950149536, 0.0007635354995727539, 0.0007969588041305542, 0.0008303821086883545, 0.0008638054132461548, 0.0008972287178039551, 0.0009306520223617554, 0.0009640753269195557, 0.000997498631477356, 0.0010309219360351562]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 7.0, 4.0, 7.0, 13.0, 13.0, 19.0, 30.0, 47.0, 82.0, 88.0, 156.0, 384.0, 764.0, 1959.0, 6448.0, 35011.0, 392061.0, 549439.0, 49685.0, 8265.0, 2338.0, 847.0, 398.0, 184.0, 113.0, 59.0, 31.0, 34.0, 21.0, 18.0, 7.0, 5.0, 5.0, 1.0, 5.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0390625, -13.5562744140625, -13.073486328125, -12.5906982421875, -12.10791015625, -11.6251220703125, -11.142333984375, -10.6595458984375, -10.1767578125, -9.6939697265625, -9.211181640625, -8.7283935546875, -8.24560546875, -7.7628173828125, -7.280029296875, -6.7972412109375, -6.314453125, -5.8316650390625, -5.348876953125, -4.8660888671875, -4.38330078125, -3.9005126953125, -3.417724609375, -2.9349365234375, -2.4521484375, -1.9693603515625, -1.486572265625, -1.0037841796875, -0.52099609375, -0.0382080078125, 0.444580078125, 0.9273681640625, 1.41015625, 1.8929443359375, 2.375732421875, 2.8585205078125, 3.34130859375, 3.8240966796875, 4.306884765625, 4.7896728515625, 5.2724609375, 5.7552490234375, 6.238037109375, 6.7208251953125, 7.20361328125, 7.6864013671875, 8.169189453125, 8.6519775390625, 9.134765625, 9.6175537109375, 10.100341796875, 10.5831298828125, 11.06591796875, 11.5487060546875, 12.031494140625, 12.5142822265625, 12.9970703125, 13.4798583984375, 13.962646484375, 14.4454345703125, 14.92822265625, 15.4110107421875, 15.893798828125, 16.3765869140625, 16.859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 4.0, 2.0, 6.0, 11.0, 7.0, 16.0, 14.0, 19.0, 34.0, 47.0, 58.0, 77.0, 73.0, 112.0, 100.0, 79.0, 77.0, 66.0, 49.0, 33.0, 40.0, 19.0, 11.0, 8.0, 10.0, 3.0, 4.0, 6.0, 4.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3671875, -11.052734375, -10.73828125, -10.423828125, -10.109375, -9.794921875, -9.48046875, -9.166015625, -8.8515625, -8.537109375, -8.22265625, -7.908203125, -7.59375, -7.279296875, -6.96484375, -6.650390625, -6.3359375, -6.021484375, -5.70703125, -5.392578125, -5.078125, -4.763671875, -4.44921875, -4.134765625, -3.8203125, -3.505859375, -3.19140625, -2.876953125, -2.5625, -2.248046875, -1.93359375, -1.619140625, -1.3046875, -0.990234375, -0.67578125, -0.361328125, -0.046875, 0.267578125, 0.58203125, 0.896484375, 1.2109375, 1.525390625, 1.83984375, 2.154296875, 2.46875, 2.783203125, 3.09765625, 3.412109375, 3.7265625, 4.041015625, 4.35546875, 4.669921875, 4.984375, 5.298828125, 5.61328125, 5.927734375, 6.2421875, 6.556640625, 6.87109375, 7.185546875, 7.5, 7.814453125, 8.12890625, 8.443359375, 8.7578125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 7.0, 22.0, 92.0, 307.0, 373.0, 160.0, 33.0, 13.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.18074035644531, -87.08976745605469, -74.99879455566406, -62.907814025878906, -50.81684112548828, -38.725868225097656, -26.6348876953125, -14.543914794921875, -2.45294189453125, 9.638032913208008, 21.729007720947266, 33.819984436035156, 45.91095733642578, 58.001930236816406, 70.09291076660156, 82.18388366699219, 94.27485656738281, 106.36582946777344, 118.45680236816406, 130.54779052734375, 142.63876342773438, 154.729736328125, 166.82070922851562, 178.91168212890625, 191.00265502929688, 203.0936279296875, 215.18460083007812, 227.27557373046875, 239.36654663085938, 251.45751953125, 263.54852294921875, 275.63946533203125, 287.73046875, 299.8214416503906, 311.91241455078125, 324.0033874511719, 336.0943603515625, 348.1853332519531, 360.27630615234375, 372.3673095703125, 384.458251953125, 396.5492248535156, 408.64019775390625, 420.7311706542969, 432.8221435546875, 444.9131164550781, 457.00408935546875, 469.0950927734375, 481.1860656738281, 493.27703857421875, 505.3680114746094, 517.458984375, 529.5499877929688, 541.6409301757812, 553.73193359375, 565.8228759765625, 577.9138793945312, 590.0048828125, 602.0958251953125, 614.1868286132812, 626.2777709960938, 638.3687744140625, 650.459716796875, 662.5507202148438, 674.6416625976562]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 5.0, 10.0, 8.0, 12.0, 28.0, 15.0, 20.0, 29.0, 31.0, 22.0, 48.0, 33.0, 42.0, 48.0, 46.0, 50.0, 51.0, 46.0, 58.0, 34.0, 34.0, 53.0, 36.0, 34.0, 28.0, 32.0, 21.0, 24.0, 19.0, 16.0, 16.0, 12.0, 7.0, 4.0, 5.0, 4.0, 2.0, 7.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.18205261230469, -78.10600280761719, -75.02994537353516, -71.95389556884766, -68.87784576416016, -65.80178833007812, -62.725738525390625, -59.649688720703125, -56.57363510131836, -53.497581481933594, -50.421531677246094, -47.34547805786133, -44.26942443847656, -41.19337463378906, -38.1173210144043, -35.04126739501953, -31.96521759033203, -28.8891658782959, -25.813114166259766, -22.737060546875, -19.661008834838867, -16.584957122802734, -13.508903503417969, -10.432851791381836, -7.356800079345703, -4.280747890472412, -1.204695701599121, 1.8713569641113281, 4.947408676147461, 8.023460388183594, 11.09951400756836, 14.175565719604492, 17.251617431640625, 20.327669143676758, 23.40372085571289, 26.479774475097656, 29.55582618713379, 32.63187789916992, 35.70793151855469, 38.78398132324219, 41.86003494262695, 44.93608856201172, 48.01213836669922, 51.088191986083984, 54.16424560546875, 57.24029541015625, 60.316349029541016, 63.39240264892578, 66.46845245361328, 69.54450225830078, 72.62055969238281, 75.69660949707031, 78.77265930175781, 81.84870910644531, 84.92476654052734, 88.00081634521484, 91.07687377929688, 94.15292358398438, 97.2289810180664, 100.3050308227539, 103.3810806274414, 106.45713806152344, 109.53318786621094, 112.60923767089844, 115.68528747558594]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 8.0, 20.0, 24.0, 45.0, 75.0, 203.0, 420.0, 1382.0, 7001.0, 232126.0, 3939441.0, 10820.0, 1728.0, 536.0, 221.0, 101.0, 51.0, 32.0, 14.0, 9.0, 11.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.5625, -70.87890625, -69.1953125, -67.51171875, -65.828125, -64.14453125, -62.4609375, -60.77734375, -59.09375, -57.41015625, -55.7265625, -54.04296875, -52.359375, -50.67578125, -48.9921875, -47.30859375, -45.625, -43.94140625, -42.2578125, -40.57421875, -38.890625, -37.20703125, -35.5234375, -33.83984375, -32.15625, -30.47265625, -28.7890625, -27.10546875, -25.421875, -23.73828125, -22.0546875, -20.37109375, -18.6875, -17.00390625, -15.3203125, -13.63671875, -11.953125, -10.26953125, -8.5859375, -6.90234375, -5.21875, -3.53515625, -1.8515625, -0.16796875, 1.515625, 3.19921875, 4.8828125, 6.56640625, 8.25, 9.93359375, 11.6171875, 13.30078125, 14.984375, 16.66796875, 18.3515625, 20.03515625, 21.71875, 23.40234375, 25.0859375, 26.76953125, 28.453125, 30.13671875, 31.8203125, 33.50390625, 35.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 7.0, 10.0, 17.0, 18.0, 18.0, 25.0, 40.0, 42.0, 52.0, 66.0, 54.0, 76.0, 72.0, 87.0, 66.0, 62.0, 63.0, 48.0, 39.0, 30.0, 28.0, 15.0, 14.0, 11.0, 8.0, 10.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-7.7890625, -7.577880859375, -7.36669921875, -7.155517578125, -6.9443359375, -6.733154296875, -6.52197265625, -6.310791015625, -6.099609375, -5.888427734375, -5.67724609375, -5.466064453125, -5.2548828125, -5.043701171875, -4.83251953125, -4.621337890625, -4.41015625, -4.198974609375, -3.98779296875, -3.776611328125, -3.5654296875, -3.354248046875, -3.14306640625, -2.931884765625, -2.720703125, -2.509521484375, -2.29833984375, -2.087158203125, -1.8759765625, -1.664794921875, -1.45361328125, -1.242431640625, -1.03125, -0.820068359375, -0.60888671875, -0.397705078125, -0.1865234375, 0.024658203125, 0.23583984375, 0.447021484375, 0.658203125, 0.869384765625, 1.08056640625, 1.291748046875, 1.5029296875, 1.714111328125, 1.92529296875, 2.136474609375, 2.34765625, 2.558837890625, 2.77001953125, 2.981201171875, 3.1923828125, 3.403564453125, 3.61474609375, 3.825927734375, 4.037109375, 4.248291015625, 4.45947265625, 4.670654296875, 4.8818359375, 5.093017578125, 5.30419921875, 5.515380859375, 5.7265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 13.0, 15.0, 12.0, 27.0, 41.0, 43.0, 74.0, 106.0, 114.0, 185.0, 253.0, 353.0, 571.0, 896.0, 1424.0, 2679.0, 5288.0, 12662.0, 37901.0, 186580.0, 3731125.0, 156780.0, 34077.0, 11627.0, 4969.0, 2477.0, 1391.0, 846.0, 487.0, 381.0, 273.0, 171.0, 112.0, 84.0, 54.0, 43.0, 33.0, 27.0, 11.0, 13.0, 14.0, 12.0, 7.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.28515625, -10.9375, -10.58984375, -10.2421875, -9.89453125, -9.546875, -9.19921875, -8.8515625, -8.50390625, -8.15625, -7.80859375, -7.4609375, -7.11328125, -6.765625, -6.41796875, -6.0703125, -5.72265625, -5.375, -5.02734375, -4.6796875, -4.33203125, -3.984375, -3.63671875, -3.2890625, -2.94140625, -2.59375, -2.24609375, -1.8984375, -1.55078125, -1.203125, -0.85546875, -0.5078125, -0.16015625, 0.1875, 0.53515625, 0.8828125, 1.23046875, 1.578125, 1.92578125, 2.2734375, 2.62109375, 2.96875, 3.31640625, 3.6640625, 4.01171875, 4.359375, 4.70703125, 5.0546875, 5.40234375, 5.75, 6.09765625, 6.4453125, 6.79296875, 7.140625, 7.48828125, 7.8359375, 8.18359375, 8.53125, 8.87890625, 9.2265625, 9.57421875, 9.921875, 10.26953125, 10.6171875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 13.0, 15.0, 31.0, 51.0, 87.0, 185.0, 2995.0, 439.0, 112.0, 58.0, 44.0, 16.0, 6.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.139190673828125, -4.01666259765625, -3.894134521484375, -3.7716064453125, -3.649078369140625, -3.52655029296875, -3.404022216796875, -3.281494140625, -3.158966064453125, -3.03643798828125, -2.913909912109375, -2.7913818359375, -2.668853759765625, -2.54632568359375, -2.423797607421875, -2.30126953125, -2.178741455078125, -2.05621337890625, -1.933685302734375, -1.8111572265625, -1.688629150390625, -1.56610107421875, -1.443572998046875, -1.321044921875, -1.198516845703125, -1.07598876953125, -0.953460693359375, -0.8309326171875, -0.708404541015625, -0.58587646484375, -0.463348388671875, -0.3408203125, -0.218292236328125, -0.09576416015625, 0.026763916015625, 0.1492919921875, 0.271820068359375, 0.39434814453125, 0.516876220703125, 0.639404296875, 0.761932373046875, 0.88446044921875, 1.006988525390625, 1.1295166015625, 1.252044677734375, 1.37457275390625, 1.497100830078125, 1.61962890625, 1.742156982421875, 1.86468505859375, 1.987213134765625, 2.1097412109375, 2.232269287109375, 2.35479736328125, 2.477325439453125, 2.599853515625, 2.722381591796875, 2.84490966796875, 2.967437744140625, 3.0899658203125, 3.212493896484375, 3.33502197265625, 3.457550048828125, 3.580078125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 3.0, 5.0, 5.0, 12.0, 19.0, 38.0, 45.0, 59.0, 69.0, 85.0, 91.0, 108.0, 92.0, 92.0, 62.0, 55.0, 44.0, 35.0, 26.0, 16.0, 14.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.232965469360352, -7.911106109619141, -7.58924674987793, -7.2673869132995605, -6.94552755355835, -6.623668193817139, -6.3018083572387695, -5.979948997497559, -5.658089637756348, -5.336230278015137, -5.014370918273926, -4.692511081695557, -4.370651721954346, -4.048792362213135, -3.7269327640533447, -3.4050731658935547, -3.0832138061523438, -2.761354446411133, -2.4394948482513428, -2.1176352500915527, -1.7957758903503418, -1.4739164113998413, -1.1520569324493408, -0.8301973342895508, -0.5083379745483398, -0.18647849559783936, 0.13538098335266113, 0.4572404623031616, 0.7790999412536621, 1.1009594202041626, 1.422818899154663, 1.7446784973144531, 2.0665369033813477, 2.3883962631225586, 2.7102558612823486, 3.0321154594421387, 3.3539748191833496, 3.6758341789245605, 3.9976937770843506, 4.319553375244141, 4.641412734985352, 4.9632720947265625, 5.285131454467773, 5.606991291046143, 5.9288506507873535, 6.2507100105285645, 6.572569847106934, 6.8944292068481445, 7.2162885665893555, 7.538147926330566, 7.860007286071777, 8.181866645812988, 8.503726959228516, 8.825586318969727, 9.147445678710938, 9.469305038452148, 9.79116439819336, 10.11302375793457, 10.434883117675781, 10.756742477416992, 11.078601837158203, 11.40046215057373, 11.722321510314941, 12.044180870056152, 12.366040229797363]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 6.0, 13.0, 4.0, 14.0, 14.0, 20.0, 28.0, 27.0, 31.0, 32.0, 38.0, 31.0, 40.0, 52.0, 48.0, 47.0, 54.0, 43.0, 49.0, 48.0, 40.0, 40.0, 40.0, 32.0, 35.0, 24.0, 19.0, 19.0, 17.0, 19.0, 13.0, 6.0, 16.0, 5.0, 12.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0], "bins": [-8.973464012145996, -8.739679336547852, -8.50589370727539, -8.272109031677246, -8.038324356079102, -7.804539203643799, -7.570754051208496, -7.336969375610352, -7.103184223175049, -6.869399070739746, -6.635614395141602, -6.401829242706299, -6.168044090270996, -5.934259414672852, -5.700474262237549, -5.466689109802246, -5.232904434204102, -4.999119281768799, -4.765334606170654, -4.531549453735352, -4.297764778137207, -4.063979625701904, -3.8301944732666016, -3.596409559249878, -3.3626246452331543, -3.1288397312164307, -2.895054817199707, -2.6612696647644043, -2.4274847507476807, -2.193699836730957, -1.9599148035049438, -1.7261297702789307, -1.492344856262207, -1.2585599422454834, -1.0247749090194702, -0.7909899353981018, -0.5572049617767334, -0.32342004776000977, -0.08963501453399658, 0.1441500186920166, 0.37793493270874023, 0.6117199063301086, 0.845504879951477, 1.0792899131774902, 1.3130748271942139, 1.5468597412109375, 1.7806447744369507, 2.014429807662964, 2.2482147216796875, 2.481999635696411, 2.7157845497131348, 2.9495697021484375, 3.183354616165161, 3.4171395301818848, 3.6509246826171875, 3.884709596633911, 4.118494510650635, 4.3522796630859375, 4.586064338684082, 4.819849491119385, 5.0536346435546875, 5.287419319152832, 5.521204471588135, 5.7549896240234375, 5.988774299621582]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 8.0, 7.0, 22.0, 27.0, 28.0, 60.0, 113.0, 134.0, 302.0, 610.0, 1354.0, 3290.0, 10005.0, 36056.0, 150374.0, 438715.0, 300833.0, 77571.0, 19005.0, 5924.0, 2124.0, 958.0, 430.0, 260.0, 123.0, 81.0, 34.0, 42.0, 18.0, 12.0, 10.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.234375, -18.68115234375, -18.1279296875, -17.57470703125, -17.021484375, -16.46826171875, -15.9150390625, -15.36181640625, -14.80859375, -14.25537109375, -13.7021484375, -13.14892578125, -12.595703125, -12.04248046875, -11.4892578125, -10.93603515625, -10.3828125, -9.82958984375, -9.2763671875, -8.72314453125, -8.169921875, -7.61669921875, -7.0634765625, -6.51025390625, -5.95703125, -5.40380859375, -4.8505859375, -4.29736328125, -3.744140625, -3.19091796875, -2.6376953125, -2.08447265625, -1.53125, -0.97802734375, -0.4248046875, 0.12841796875, 0.681640625, 1.23486328125, 1.7880859375, 2.34130859375, 2.89453125, 3.44775390625, 4.0009765625, 4.55419921875, 5.107421875, 5.66064453125, 6.2138671875, 6.76708984375, 7.3203125, 7.87353515625, 8.4267578125, 8.97998046875, 9.533203125, 10.08642578125, 10.6396484375, 11.19287109375, 11.74609375, 12.29931640625, 12.8525390625, 13.40576171875, 13.958984375, 14.51220703125, 15.0654296875, 15.61865234375, 16.171875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 8.0, 6.0, 6.0, 9.0, 9.0, 18.0, 23.0, 28.0, 35.0, 49.0, 56.0, 64.0, 58.0, 75.0, 75.0, 67.0, 72.0, 60.0, 60.0, 46.0, 38.0, 35.0, 26.0, 14.0, 18.0, 10.0, 11.0, 12.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.84765625, -7.63507080078125, -7.4224853515625, -7.20989990234375, -6.997314453125, -6.78472900390625, -6.5721435546875, -6.35955810546875, -6.14697265625, -5.93438720703125, -5.7218017578125, -5.50921630859375, -5.296630859375, -5.08404541015625, -4.8714599609375, -4.65887451171875, -4.4462890625, -4.23370361328125, -4.0211181640625, -3.80853271484375, -3.595947265625, -3.38336181640625, -3.1707763671875, -2.95819091796875, -2.74560546875, -2.53302001953125, -2.3204345703125, -2.10784912109375, -1.895263671875, -1.68267822265625, -1.4700927734375, -1.25750732421875, -1.044921875, -0.83233642578125, -0.6197509765625, -0.40716552734375, -0.194580078125, 0.01800537109375, 0.2305908203125, 0.44317626953125, 0.65576171875, 0.86834716796875, 1.0809326171875, 1.29351806640625, 1.506103515625, 1.71868896484375, 1.9312744140625, 2.14385986328125, 2.3564453125, 2.56903076171875, 2.7816162109375, 2.99420166015625, 3.206787109375, 3.41937255859375, 3.6319580078125, 3.84454345703125, 4.05712890625, 4.26971435546875, 4.4822998046875, 4.69488525390625, 4.907470703125, 5.12005615234375, 5.3326416015625, 5.54522705078125, 5.7578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 7.0, 10.0, 11.0, 26.0, 31.0, 54.0, 83.0, 96.0, 182.0, 251.0, 395.0, 751.0, 1536.0, 4275.0, 19430.0, 145438.0, 676819.0, 169082.0, 21711.0, 4761.0, 1639.0, 681.0, 449.0, 267.0, 157.0, 115.0, 88.0, 57.0, 33.0, 28.0, 21.0, 15.0, 9.0, 5.0, 9.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.921875, -23.20849609375, -22.4951171875, -21.78173828125, -21.068359375, -20.35498046875, -19.6416015625, -18.92822265625, -18.21484375, -17.50146484375, -16.7880859375, -16.07470703125, -15.361328125, -14.64794921875, -13.9345703125, -13.22119140625, -12.5078125, -11.79443359375, -11.0810546875, -10.36767578125, -9.654296875, -8.94091796875, -8.2275390625, -7.51416015625, -6.80078125, -6.08740234375, -5.3740234375, -4.66064453125, -3.947265625, -3.23388671875, -2.5205078125, -1.80712890625, -1.09375, -0.38037109375, 0.3330078125, 1.04638671875, 1.759765625, 2.47314453125, 3.1865234375, 3.89990234375, 4.61328125, 5.32666015625, 6.0400390625, 6.75341796875, 7.466796875, 8.18017578125, 8.8935546875, 9.60693359375, 10.3203125, 11.03369140625, 11.7470703125, 12.46044921875, 13.173828125, 13.88720703125, 14.6005859375, 15.31396484375, 16.02734375, 16.74072265625, 17.4541015625, 18.16748046875, 18.880859375, 19.59423828125, 20.3076171875, 21.02099609375, 21.734375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 9.0, 4.0, 7.0, 4.0, 7.0, 10.0, 14.0, 10.0, 13.0, 12.0, 20.0, 24.0, 25.0, 34.0, 53.0, 44.0, 37.0, 45.0, 43.0, 59.0, 51.0, 44.0, 47.0, 41.0, 55.0, 45.0, 26.0, 39.0, 32.0, 20.0, 27.0, 16.0, 16.0, 23.0, 13.0, 6.0, 7.0, 5.0, 7.0, 3.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.59375, -20.88330078125, -20.1728515625, -19.46240234375, -18.751953125, -18.04150390625, -17.3310546875, -16.62060546875, -15.91015625, -15.19970703125, -14.4892578125, -13.77880859375, -13.068359375, -12.35791015625, -11.6474609375, -10.93701171875, -10.2265625, -9.51611328125, -8.8056640625, -8.09521484375, -7.384765625, -6.67431640625, -5.9638671875, -5.25341796875, -4.54296875, -3.83251953125, -3.1220703125, -2.41162109375, -1.701171875, -0.99072265625, -0.2802734375, 0.43017578125, 1.140625, 1.85107421875, 2.5615234375, 3.27197265625, 3.982421875, 4.69287109375, 5.4033203125, 6.11376953125, 6.82421875, 7.53466796875, 8.2451171875, 8.95556640625, 9.666015625, 10.37646484375, 11.0869140625, 11.79736328125, 12.5078125, 13.21826171875, 13.9287109375, 14.63916015625, 15.349609375, 16.06005859375, 16.7705078125, 17.48095703125, 18.19140625, 18.90185546875, 19.6123046875, 20.32275390625, 21.033203125, 21.74365234375, 22.4541015625, 23.16455078125, 23.875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 7.0, 10.0, 9.0, 12.0, 23.0, 52.0, 54.0, 124.0, 198.0, 389.0, 881.0, 2224.0, 7652.0, 37963.0, 239022.0, 592942.0, 136218.0, 22681.0, 5060.0, 1595.0, 649.0, 315.0, 186.0, 103.0, 69.0, 38.0, 25.0, 14.0, 7.0, 10.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.18109130859375, -6.9364013671875, -6.69171142578125, -6.447021484375, -6.20233154296875, -5.9576416015625, -5.71295166015625, -5.46826171875, -5.22357177734375, -4.9788818359375, -4.73419189453125, -4.489501953125, -4.24481201171875, -4.0001220703125, -3.75543212890625, -3.5107421875, -3.26605224609375, -3.0213623046875, -2.77667236328125, -2.531982421875, -2.28729248046875, -2.0426025390625, -1.79791259765625, -1.55322265625, -1.30853271484375, -1.0638427734375, -0.81915283203125, -0.574462890625, -0.32977294921875, -0.0850830078125, 0.15960693359375, 0.404296875, 0.64898681640625, 0.8936767578125, 1.13836669921875, 1.383056640625, 1.62774658203125, 1.8724365234375, 2.11712646484375, 2.36181640625, 2.60650634765625, 2.8511962890625, 3.09588623046875, 3.340576171875, 3.58526611328125, 3.8299560546875, 4.07464599609375, 4.3193359375, 4.56402587890625, 4.8087158203125, 5.05340576171875, 5.298095703125, 5.54278564453125, 5.7874755859375, 6.03216552734375, 6.27685546875, 6.52154541015625, 6.7662353515625, 7.01092529296875, 7.255615234375, 7.50030517578125, 7.7449951171875, 7.98968505859375, 8.234375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 7.0, 7.0, 8.0, 10.0, 16.0, 34.0, 30.0, 35.0, 64.0, 57.0, 73.0, 92.0, 96.0, 85.0, 69.0, 79.0, 59.0, 43.0, 25.0, 24.0, 19.0, 12.0, 14.0, 9.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012607574462890625, -0.0012288987636566162, -0.00119704008102417, -0.0011651813983917236, -0.0011333227157592773, -0.001101464033126831, -0.0010696053504943848, -0.0010377466678619385, -0.0010058879852294922, -0.0009740293025970459, -0.0009421706199645996, -0.0009103119373321533, -0.000878453254699707, -0.0008465945720672607, -0.0008147358894348145, -0.0007828772068023682, -0.0007510185241699219, -0.0007191598415374756, -0.0006873011589050293, -0.000655442476272583, -0.0006235837936401367, -0.0005917251110076904, -0.0005598664283752441, -0.0005280077457427979, -0.0004961490631103516, -0.0004642903804779053, -0.000432431697845459, -0.0004005730152130127, -0.0003687143325805664, -0.0003368556499481201, -0.00030499696731567383, -0.00027313828468322754, -0.00024127960205078125, -0.00020942091941833496, -0.00017756223678588867, -0.00014570355415344238, -0.0001138448715209961, -8.19861888885498e-05, -5.0127506256103516e-05, -1.8268823623657227e-05, 1.3589859008789062e-05, 4.544854164123535e-05, 7.730722427368164e-05, 0.00010916590690612793, 0.00014102458953857422, 0.0001728832721710205, 0.0002047419548034668, 0.00023660063743591309, 0.0002684593200683594, 0.00030031800270080566, 0.00033217668533325195, 0.00036403536796569824, 0.00039589405059814453, 0.0004277527332305908, 0.0004596114158630371, 0.0004914700984954834, 0.0005233287811279297, 0.000555187463760376, 0.0005870461463928223, 0.0006189048290252686, 0.0006507635116577148, 0.0006826221942901611, 0.0007144808769226074, 0.0007463395595550537, 0.0007781982421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 22.0, 23.0, 44.0, 55.0, 96.0, 168.0, 291.0, 518.0, 1043.0, 2223.0, 6359.0, 25783.0, 164888.0, 631705.0, 177061.0, 27223.0, 6389.0, 2349.0, 1039.0, 537.0, 267.0, 153.0, 112.0, 55.0, 50.0, 23.0, 11.0, 10.0, 11.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.31640625, -6.05877685546875, -5.8011474609375, -5.54351806640625, -5.285888671875, -5.02825927734375, -4.7706298828125, -4.51300048828125, -4.25537109375, -3.99774169921875, -3.7401123046875, -3.48248291015625, -3.224853515625, -2.96722412109375, -2.7095947265625, -2.45196533203125, -2.1943359375, -1.93670654296875, -1.6790771484375, -1.42144775390625, -1.163818359375, -0.90618896484375, -0.6485595703125, -0.39093017578125, -0.13330078125, 0.12432861328125, 0.3819580078125, 0.63958740234375, 0.897216796875, 1.15484619140625, 1.4124755859375, 1.67010498046875, 1.927734375, 2.18536376953125, 2.4429931640625, 2.70062255859375, 2.958251953125, 3.21588134765625, 3.4735107421875, 3.73114013671875, 3.98876953125, 4.24639892578125, 4.5040283203125, 4.76165771484375, 5.019287109375, 5.27691650390625, 5.5345458984375, 5.79217529296875, 6.0498046875, 6.30743408203125, 6.5650634765625, 6.82269287109375, 7.080322265625, 7.33795166015625, 7.5955810546875, 7.85321044921875, 8.11083984375, 8.36846923828125, 8.6260986328125, 8.88372802734375, 9.141357421875, 9.39898681640625, 9.6566162109375, 9.91424560546875, 10.171875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 5.0, 10.0, 12.0, 14.0, 24.0, 30.0, 42.0, 63.0, 90.0, 102.0, 109.0, 131.0, 109.0, 68.0, 55.0, 42.0, 28.0, 19.0, 22.0, 16.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.8358154296875, -7.507568359375, -7.1793212890625, -6.85107421875, -6.5228271484375, -6.194580078125, -5.8663330078125, -5.5380859375, -5.2098388671875, -4.881591796875, -4.5533447265625, -4.22509765625, -3.8968505859375, -3.568603515625, -3.2403564453125, -2.912109375, -2.5838623046875, -2.255615234375, -1.9273681640625, -1.59912109375, -1.2708740234375, -0.942626953125, -0.6143798828125, -0.2861328125, 0.0421142578125, 0.370361328125, 0.6986083984375, 1.02685546875, 1.3551025390625, 1.683349609375, 2.0115966796875, 2.33984375, 2.6680908203125, 2.996337890625, 3.3245849609375, 3.65283203125, 3.9810791015625, 4.309326171875, 4.6375732421875, 4.9658203125, 5.2940673828125, 5.622314453125, 5.9505615234375, 6.27880859375, 6.6070556640625, 6.935302734375, 7.2635498046875, 7.591796875, 7.9200439453125, 8.248291015625, 8.5765380859375, 8.90478515625, 9.2330322265625, 9.561279296875, 9.8895263671875, 10.2177734375, 10.5460205078125, 10.874267578125, 11.2025146484375, 11.53076171875, 11.8590087890625, 12.187255859375, 12.5155029296875, 12.84375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 10.0, 29.0, 94.0, 214.0, 314.0, 207.0, 85.0, 31.0, 12.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.9600372314453, -163.55899047851562, -155.15794372558594, -146.75689697265625, -138.3558349609375, -129.95480346679688, -121.55374145507812, -113.15269470214844, -104.75164794921875, -96.35060119628906, -87.94955444335938, -79.54850006103516, -71.14745330810547, -62.74640655517578, -54.34535598754883, -45.944305419921875, -37.54325866699219, -29.142210006713867, -20.741161346435547, -12.340112686157227, -3.9390640258789062, 4.461982727050781, 12.863033294677734, 21.264083862304688, 29.665130615234375, 38.06617736816406, 46.467227935791016, 54.86827850341797, 63.269325256347656, 71.67037200927734, 80.07142639160156, 88.47247314453125, 96.87350463867188, 105.27455139160156, 113.67559814453125, 122.07665252685547, 130.47769165039062, 138.87875366210938, 147.27980041503906, 155.68084716796875, 164.08189392089844, 172.48294067382812, 180.8839874267578, 189.2850341796875, 197.68609619140625, 206.08712768554688, 214.48818969726562, 222.8892364501953, 231.290283203125, 239.6913299560547, 248.09237670898438, 256.4934387207031, 264.89447021484375, 273.2955322265625, 281.6965637207031, 290.0976257324219, 298.4986572265625, 306.89971923828125, 315.3007507324219, 323.7018127441406, 332.10284423828125, 340.50390625, 348.9049377441406, 357.3059997558594, 365.7070617675781]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 12.0, 18.0, 8.0, 14.0, 24.0, 19.0, 29.0, 31.0, 35.0, 39.0, 39.0, 45.0, 58.0, 58.0, 58.0, 53.0, 52.0, 51.0, 45.0, 44.0, 42.0, 40.0, 27.0, 25.0, 29.0, 19.0, 16.0, 16.0, 14.0, 5.0, 11.0, 3.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.18243408203125, -95.78191375732422, -92.38139343261719, -88.98087310791016, -85.58035278320312, -82.1798324584961, -78.77931213378906, -75.37879943847656, -71.978271484375, -68.57775115966797, -65.17723083496094, -61.776710510253906, -58.376190185546875, -54.975669860839844, -51.57515335083008, -48.17463302612305, -44.77411651611328, -41.37359619140625, -37.97307586669922, -34.57255554199219, -31.17203712463379, -27.771516799926758, -24.37099838256836, -20.970478057861328, -17.569957733154297, -14.169437408447266, -10.76891803741455, -7.368398666381836, -3.9678783416748047, -0.5673580169677734, 2.833160400390625, 6.233680725097656, 9.634201049804688, 13.034721374511719, 16.43524169921875, 19.83576011657715, 23.23628044128418, 26.63680076599121, 30.03731918334961, 33.43783950805664, 36.83835983276367, 40.2388801574707, 43.639400482177734, 47.0399169921875, 50.44043731689453, 53.84095764160156, 57.241477966308594, 60.641998291015625, 64.04251861572266, 67.44303894042969, 70.84355926513672, 74.24407958984375, 77.64459991455078, 81.04512023925781, 84.44563293457031, 87.84616088867188, 91.24667358398438, 94.6471939086914, 98.04771423339844, 101.44823455810547, 104.8487548828125, 108.24927520751953, 111.64979553222656, 115.05030822753906, 118.45083618164062]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 8.0, 17.0, 40.0, 88.0, 153.0, 469.0, 1753.0, 15185.0, 4111527.0, 60271.0, 3580.0, 714.0, 232.0, 109.0, 44.0, 33.0, 12.0, 14.0, 7.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-61.1875, -59.787109375, -58.38671875, -56.986328125, -55.5859375, -54.185546875, -52.78515625, -51.384765625, -49.984375, -48.583984375, -47.18359375, -45.783203125, -44.3828125, -42.982421875, -41.58203125, -40.181640625, -38.78125, -37.380859375, -35.98046875, -34.580078125, -33.1796875, -31.779296875, -30.37890625, -28.978515625, -27.578125, -26.177734375, -24.77734375, -23.376953125, -21.9765625, -20.576171875, -19.17578125, -17.775390625, -16.375, -14.974609375, -13.57421875, -12.173828125, -10.7734375, -9.373046875, -7.97265625, -6.572265625, -5.171875, -3.771484375, -2.37109375, -0.970703125, 0.4296875, 1.830078125, 3.23046875, 4.630859375, 6.03125, 7.431640625, 8.83203125, 10.232421875, 11.6328125, 13.033203125, 14.43359375, 15.833984375, 17.234375, 18.634765625, 20.03515625, 21.435546875, 22.8359375, 24.236328125, 25.63671875, 27.037109375, 28.4375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 7.0, 8.0, 25.0, 21.0, 22.0, 24.0, 33.0, 39.0, 49.0, 47.0, 71.0, 66.0, 75.0, 69.0, 83.0, 60.0, 47.0, 48.0, 42.0, 27.0, 24.0, 21.0, 14.0, 18.0, 12.0, 12.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-7.359375, -7.15484619140625, -6.9503173828125, -6.74578857421875, -6.541259765625, -6.33673095703125, -6.1322021484375, -5.92767333984375, -5.72314453125, -5.51861572265625, -5.3140869140625, -5.10955810546875, -4.905029296875, -4.70050048828125, -4.4959716796875, -4.29144287109375, -4.0869140625, -3.88238525390625, -3.6778564453125, -3.47332763671875, -3.268798828125, -3.06427001953125, -2.8597412109375, -2.65521240234375, -2.45068359375, -2.24615478515625, -2.0416259765625, -1.83709716796875, -1.632568359375, -1.42803955078125, -1.2235107421875, -1.01898193359375, -0.814453125, -0.60992431640625, -0.4053955078125, -0.20086669921875, 0.003662109375, 0.20819091796875, 0.4127197265625, 0.61724853515625, 0.82177734375, 1.02630615234375, 1.2308349609375, 1.43536376953125, 1.639892578125, 1.84442138671875, 2.0489501953125, 2.25347900390625, 2.4580078125, 2.66253662109375, 2.8670654296875, 3.07159423828125, 3.276123046875, 3.48065185546875, 3.6851806640625, 3.88970947265625, 4.09423828125, 4.29876708984375, 4.5032958984375, 4.70782470703125, 4.912353515625, 5.11688232421875, 5.3214111328125, 5.52593994140625, 5.73046875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 9.0, 12.0, 19.0, 28.0, 41.0, 41.0, 76.0, 76.0, 131.0, 168.0, 217.0, 344.0, 519.0, 695.0, 1128.0, 1741.0, 2840.0, 4776.0, 9359.0, 19914.0, 52624.0, 233712.0, 3602835.0, 179732.0, 45081.0, 17541.0, 8476.0, 4467.0, 2683.0, 1674.0, 1003.0, 677.0, 497.0, 329.0, 241.0, 152.0, 129.0, 78.0, 58.0, 37.0, 31.0, 30.0, 17.0, 12.0, 11.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.05078125, -6.8333740234375, -6.615966796875, -6.3985595703125, -6.18115234375, -5.9637451171875, -5.746337890625, -5.5289306640625, -5.3115234375, -5.0941162109375, -4.876708984375, -4.6593017578125, -4.44189453125, -4.2244873046875, -4.007080078125, -3.7896728515625, -3.572265625, -3.3548583984375, -3.137451171875, -2.9200439453125, -2.70263671875, -2.4852294921875, -2.267822265625, -2.0504150390625, -1.8330078125, -1.6156005859375, -1.398193359375, -1.1807861328125, -0.96337890625, -0.7459716796875, -0.528564453125, -0.3111572265625, -0.09375, 0.1236572265625, 0.341064453125, 0.5584716796875, 0.77587890625, 0.9932861328125, 1.210693359375, 1.4281005859375, 1.6455078125, 1.8629150390625, 2.080322265625, 2.2977294921875, 2.51513671875, 2.7325439453125, 2.949951171875, 3.1673583984375, 3.384765625, 3.6021728515625, 3.819580078125, 4.0369873046875, 4.25439453125, 4.4718017578125, 4.689208984375, 4.9066162109375, 5.1240234375, 5.3414306640625, 5.558837890625, 5.7762451171875, 5.99365234375, 6.2110595703125, 6.428466796875, 6.6458740234375, 6.86328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 9.0, 12.0, 14.0, 17.0, 31.0, 49.0, 106.0, 205.0, 2712.0, 494.0, 174.0, 84.0, 54.0, 28.0, 14.0, 18.0, 11.0, 9.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.620086669921875, -2.53509521484375, -2.450103759765625, -2.3651123046875, -2.280120849609375, -2.19512939453125, -2.110137939453125, -2.025146484375, -1.940155029296875, -1.85516357421875, -1.770172119140625, -1.6851806640625, -1.600189208984375, -1.51519775390625, -1.430206298828125, -1.34521484375, -1.260223388671875, -1.17523193359375, -1.090240478515625, -1.0052490234375, -0.920257568359375, -0.83526611328125, -0.750274658203125, -0.665283203125, -0.580291748046875, -0.49530029296875, -0.410308837890625, -0.3253173828125, -0.240325927734375, -0.15533447265625, -0.070343017578125, 0.0146484375, 0.099639892578125, 0.18463134765625, 0.269622802734375, 0.3546142578125, 0.439605712890625, 0.52459716796875, 0.609588623046875, 0.694580078125, 0.779571533203125, 0.86456298828125, 0.949554443359375, 1.0345458984375, 1.119537353515625, 1.20452880859375, 1.289520263671875, 1.37451171875, 1.459503173828125, 1.54449462890625, 1.629486083984375, 1.7144775390625, 1.799468994140625, 1.88446044921875, 1.969451904296875, 2.054443359375, 2.139434814453125, 2.22442626953125, 2.309417724609375, 2.3944091796875, 2.479400634765625, 2.56439208984375, 2.649383544921875, 2.734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 15.0, 52.0, 230.0, 384.0, 234.0, 81.0, 10.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.331368446350098, -8.077461242675781, -6.823554992675781, -5.569647789001465, -4.315741062164307, -3.0618343353271484, -1.807927131652832, -0.554020881652832, 0.6998863220214844, 1.9537931680679321, 3.20770001411438, 4.461606979370117, 5.715513706207275, 6.969420433044434, 8.22332763671875, 9.47723388671875, 10.731141090393066, 11.985048294067383, 13.238954544067383, 14.4928617477417, 15.746768951416016, 17.000675201416016, 18.254581451416016, 19.508487701416016, 20.76239585876465, 22.01630210876465, 23.27021026611328, 24.52411651611328, 25.77802276611328, 27.03192901611328, 28.285837173461914, 29.539743423461914, 30.793651580810547, 32.04755783081055, 33.30146408081055, 34.55537414550781, 35.80928039550781, 37.06318664550781, 38.31709289550781, 39.57099914550781, 40.82490539550781, 42.07881164550781, 43.33271789550781, 44.58662414550781, 45.84053421020508, 47.09444046020508, 48.34834671020508, 49.60225296020508, 50.856163024902344, 52.110069274902344, 53.363975524902344, 54.617881774902344, 55.87179183959961, 57.12569808959961, 58.37960433959961, 59.63351058959961, 60.88741683959961, 62.14132308959961, 63.39522933959961, 64.64913940429688, 65.90304565429688, 67.15695190429688, 68.41085815429688, 69.66476440429688, 70.91867065429688]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 8.0, 6.0, 10.0, 13.0, 9.0, 14.0, 30.0, 29.0, 30.0, 35.0, 35.0, 47.0, 29.0, 51.0, 41.0, 41.0, 68.0, 60.0, 61.0, 43.0, 57.0, 46.0, 31.0, 37.0, 40.0, 27.0, 25.0, 18.0, 19.0, 11.0, 8.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.191534042358398, -8.938962936401367, -8.686391830444336, -8.433820724487305, -8.181249618530273, -7.928678512573242, -7.676106929779053, -7.4235358238220215, -7.17096471786499, -6.918393611907959, -6.665822505950928, -6.4132513999938965, -6.160679817199707, -5.908108711242676, -5.6555376052856445, -5.402966499328613, -5.150395393371582, -4.897824287414551, -4.6452531814575195, -4.392682075500488, -4.140110969543457, -3.8875396251678467, -3.6349682807922363, -3.382397174835205, -3.129826068878174, -2.8772549629211426, -2.6246838569641113, -2.372112512588501, -2.1195414066314697, -1.8669703006744385, -1.6143990755081177, -1.3618278503417969, -1.1092567443847656, -0.8566855788230896, -0.6041144132614136, -0.35154324769973755, -0.09897208213806152, 0.15359902381896973, 0.4061702489852905, 0.6587414741516113, 0.9113125801086426, 1.1638836860656738, 1.4164549112319946, 1.6690261363983154, 1.9215972423553467, 2.174168348312378, 2.4267396926879883, 2.6793107986450195, 2.931881904602051, 3.184453010559082, 3.4370241165161133, 3.6895954608917236, 3.942166566848755, 4.194737434387207, 4.4473090171813965, 4.699880123138428, 4.952451229095459, 5.20502233505249, 5.4575934410095215, 5.710164546966553, 5.962736129760742, 6.215307235717773, 6.467878341674805, 6.720449447631836, 6.973020553588867]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 9.0, 13.0, 14.0, 23.0, 39.0, 72.0, 115.0, 206.0, 364.0, 675.0, 1267.0, 3036.0, 7622.0, 23145.0, 79077.0, 260243.0, 405545.0, 186975.0, 53683.0, 16232.0, 5621.0, 2292.0, 1043.0, 505.0, 300.0, 154.0, 84.0, 58.0, 50.0, 27.0, 16.0, 13.0, 8.0, 7.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.796875, -14.3897705078125, -13.982666015625, -13.5755615234375, -13.16845703125, -12.7613525390625, -12.354248046875, -11.9471435546875, -11.5400390625, -11.1329345703125, -10.725830078125, -10.3187255859375, -9.91162109375, -9.5045166015625, -9.097412109375, -8.6903076171875, -8.283203125, -7.8760986328125, -7.468994140625, -7.0618896484375, -6.65478515625, -6.2476806640625, -5.840576171875, -5.4334716796875, -5.0263671875, -4.6192626953125, -4.212158203125, -3.8050537109375, -3.39794921875, -2.9908447265625, -2.583740234375, -2.1766357421875, -1.76953125, -1.3624267578125, -0.955322265625, -0.5482177734375, -0.14111328125, 0.2659912109375, 0.673095703125, 1.0802001953125, 1.4873046875, 1.8944091796875, 2.301513671875, 2.7086181640625, 3.11572265625, 3.5228271484375, 3.929931640625, 4.3370361328125, 4.744140625, 5.1512451171875, 5.558349609375, 5.9654541015625, 6.37255859375, 6.7796630859375, 7.186767578125, 7.5938720703125, 8.0009765625, 8.4080810546875, 8.815185546875, 9.2222900390625, 9.62939453125, 10.0364990234375, 10.443603515625, 10.8507080078125, 11.2578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 3.0, 2.0, 4.0, 8.0, 8.0, 13.0, 18.0, 23.0, 22.0, 28.0, 36.0, 33.0, 47.0, 64.0, 56.0, 81.0, 72.0, 75.0, 56.0, 61.0, 47.0, 44.0, 46.0, 35.0, 24.0, 15.0, 17.0, 13.0, 16.0, 13.0, 7.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-7.3359375, -7.13153076171875, -6.9271240234375, -6.72271728515625, -6.518310546875, -6.31390380859375, -6.1094970703125, -5.90509033203125, -5.70068359375, -5.49627685546875, -5.2918701171875, -5.08746337890625, -4.883056640625, -4.67864990234375, -4.4742431640625, -4.26983642578125, -4.0654296875, -3.86102294921875, -3.6566162109375, -3.45220947265625, -3.247802734375, -3.04339599609375, -2.8389892578125, -2.63458251953125, -2.43017578125, -2.22576904296875, -2.0213623046875, -1.81695556640625, -1.612548828125, -1.40814208984375, -1.2037353515625, -0.99932861328125, -0.794921875, -0.59051513671875, -0.3861083984375, -0.18170166015625, 0.022705078125, 0.22711181640625, 0.4315185546875, 0.63592529296875, 0.84033203125, 1.04473876953125, 1.2491455078125, 1.45355224609375, 1.657958984375, 1.86236572265625, 2.0667724609375, 2.27117919921875, 2.4755859375, 2.67999267578125, 2.8843994140625, 3.08880615234375, 3.293212890625, 3.49761962890625, 3.7020263671875, 3.90643310546875, 4.11083984375, 4.31524658203125, 4.5196533203125, 4.72406005859375, 4.928466796875, 5.13287353515625, 5.3372802734375, 5.54168701171875, 5.74609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 7.0, 12.0, 9.0, 14.0, 24.0, 30.0, 40.0, 65.0, 92.0, 142.0, 226.0, 354.0, 613.0, 1183.0, 2721.0, 8687.0, 48296.0, 440696.0, 477859.0, 52466.0, 9326.0, 2780.0, 1218.0, 627.0, 340.0, 232.0, 122.0, 107.0, 78.0, 56.0, 37.0, 26.0, 20.0, 9.0, 10.0, 9.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-20.921875, -20.306884765625, -19.69189453125, -19.076904296875, -18.4619140625, -17.846923828125, -17.23193359375, -16.616943359375, -16.001953125, -15.386962890625, -14.77197265625, -14.156982421875, -13.5419921875, -12.927001953125, -12.31201171875, -11.697021484375, -11.08203125, -10.467041015625, -9.85205078125, -9.237060546875, -8.6220703125, -8.007080078125, -7.39208984375, -6.777099609375, -6.162109375, -5.547119140625, -4.93212890625, -4.317138671875, -3.7021484375, -3.087158203125, -2.47216796875, -1.857177734375, -1.2421875, -0.627197265625, -0.01220703125, 0.602783203125, 1.2177734375, 1.832763671875, 2.44775390625, 3.062744140625, 3.677734375, 4.292724609375, 4.90771484375, 5.522705078125, 6.1376953125, 6.752685546875, 7.36767578125, 7.982666015625, 8.59765625, 9.212646484375, 9.82763671875, 10.442626953125, 11.0576171875, 11.672607421875, 12.28759765625, 12.902587890625, 13.517578125, 14.132568359375, 14.74755859375, 15.362548828125, 15.9775390625, 16.592529296875, 17.20751953125, 17.822509765625, 18.4375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 9.0, 4.0, 5.0, 9.0, 6.0, 11.0, 12.0, 19.0, 17.0, 25.0, 27.0, 35.0, 39.0, 36.0, 44.0, 60.0, 59.0, 52.0, 48.0, 48.0, 64.0, 46.0, 46.0, 46.0, 35.0, 32.0, 25.0, 26.0, 26.0, 21.0, 16.0, 14.0, 12.0, 4.0, 4.0, 10.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.46875, -23.71484375, -22.9609375, -22.20703125, -21.453125, -20.69921875, -19.9453125, -19.19140625, -18.4375, -17.68359375, -16.9296875, -16.17578125, -15.421875, -14.66796875, -13.9140625, -13.16015625, -12.40625, -11.65234375, -10.8984375, -10.14453125, -9.390625, -8.63671875, -7.8828125, -7.12890625, -6.375, -5.62109375, -4.8671875, -4.11328125, -3.359375, -2.60546875, -1.8515625, -1.09765625, -0.34375, 0.41015625, 1.1640625, 1.91796875, 2.671875, 3.42578125, 4.1796875, 4.93359375, 5.6875, 6.44140625, 7.1953125, 7.94921875, 8.703125, 9.45703125, 10.2109375, 10.96484375, 11.71875, 12.47265625, 13.2265625, 13.98046875, 14.734375, 15.48828125, 16.2421875, 16.99609375, 17.75, 18.50390625, 19.2578125, 20.01171875, 20.765625, 21.51953125, 22.2734375, 23.02734375, 23.78125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 1.0, 8.0, 15.0, 19.0, 56.0, 88.0, 139.0, 307.0, 756.0, 3697.0, 57756.0, 939282.0, 41995.0, 3107.0, 721.0, 282.0, 146.0, 75.0, 29.0, 26.0, 20.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.65625, -21.062255859375, -20.46826171875, -19.874267578125, -19.2802734375, -18.686279296875, -18.09228515625, -17.498291015625, -16.904296875, -16.310302734375, -15.71630859375, -15.122314453125, -14.5283203125, -13.934326171875, -13.34033203125, -12.746337890625, -12.15234375, -11.558349609375, -10.96435546875, -10.370361328125, -9.7763671875, -9.182373046875, -8.58837890625, -7.994384765625, -7.400390625, -6.806396484375, -6.21240234375, -5.618408203125, -5.0244140625, -4.430419921875, -3.83642578125, -3.242431640625, -2.6484375, -2.054443359375, -1.46044921875, -0.866455078125, -0.2724609375, 0.321533203125, 0.91552734375, 1.509521484375, 2.103515625, 2.697509765625, 3.29150390625, 3.885498046875, 4.4794921875, 5.073486328125, 5.66748046875, 6.261474609375, 6.85546875, 7.449462890625, 8.04345703125, 8.637451171875, 9.2314453125, 9.825439453125, 10.41943359375, 11.013427734375, 11.607421875, 12.201416015625, 12.79541015625, 13.389404296875, 13.9833984375, 14.577392578125, 15.17138671875, 15.765380859375, 16.359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 4.0, 9.0, 12.0, 24.0, 38.0, 40.0, 58.0, 77.0, 91.0, 105.0, 113.0, 100.0, 89.0, 58.0, 50.0, 34.0, 28.0, 16.0, 12.0, 7.0, 11.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011444091796875, -0.0011076927185058594, -0.0010709762573242188, -0.0010342597961425781, -0.0009975433349609375, -0.0009608268737792969, -0.0009241104125976562, -0.0008873939514160156, -0.000850677490234375, -0.0008139610290527344, -0.0007772445678710938, -0.0007405281066894531, -0.0007038116455078125, -0.0006670951843261719, -0.0006303787231445312, -0.0005936622619628906, -0.00055694580078125, -0.0005202293395996094, -0.00048351287841796875, -0.0004467964172363281, -0.0004100799560546875, -0.0003733634948730469, -0.00033664703369140625, -0.0002999305725097656, -0.000263214111328125, -0.00022649765014648438, -0.00018978118896484375, -0.00015306472778320312, -0.0001163482666015625, -7.963180541992188e-05, -4.291534423828125e-05, -6.198883056640625e-06, 3.0517578125e-05, 6.723403930664062e-05, 0.00010395050048828125, 0.00014066696166992188, 0.0001773834228515625, 0.00021409988403320312, 0.00025081634521484375, 0.0002875328063964844, 0.000324249267578125, 0.0003609657287597656, 0.00039768218994140625, 0.0004343986511230469, 0.0004711151123046875, 0.0005078315734863281, 0.0005445480346679688, 0.0005812644958496094, 0.00061798095703125, 0.0006546974182128906, 0.0006914138793945312, 0.0007281303405761719, 0.0007648468017578125, 0.0008015632629394531, 0.0008382797241210938, 0.0008749961853027344, 0.000911712646484375, 0.0009484291076660156, 0.0009851455688476562, 0.0010218620300292969, 0.0010585784912109375, 0.0010952949523925781, 0.0011320114135742188, 0.0011687278747558594, 0.0012054443359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 6.0, 17.0, 34.0, 46.0, 80.0, 144.0, 296.0, 672.0, 2423.0, 17216.0, 669577.0, 343899.0, 11107.0, 1931.0, 561.0, 207.0, 129.0, 83.0, 41.0, 25.0, 19.0, 14.0, 7.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.09375, -14.552978515625, -14.01220703125, -13.471435546875, -12.9306640625, -12.389892578125, -11.84912109375, -11.308349609375, -10.767578125, -10.226806640625, -9.68603515625, -9.145263671875, -8.6044921875, -8.063720703125, -7.52294921875, -6.982177734375, -6.44140625, -5.900634765625, -5.35986328125, -4.819091796875, -4.2783203125, -3.737548828125, -3.19677734375, -2.656005859375, -2.115234375, -1.574462890625, -1.03369140625, -0.492919921875, 0.0478515625, 0.588623046875, 1.12939453125, 1.670166015625, 2.2109375, 2.751708984375, 3.29248046875, 3.833251953125, 4.3740234375, 4.914794921875, 5.45556640625, 5.996337890625, 6.537109375, 7.077880859375, 7.61865234375, 8.159423828125, 8.7001953125, 9.240966796875, 9.78173828125, 10.322509765625, 10.86328125, 11.404052734375, 11.94482421875, 12.485595703125, 13.0263671875, 13.567138671875, 14.10791015625, 14.648681640625, 15.189453125, 15.730224609375, 16.27099609375, 16.811767578125, 17.3525390625, 17.893310546875, 18.43408203125, 18.974853515625, 19.515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 8.0, 12.0, 13.0, 18.0, 44.0, 68.0, 174.0, 241.0, 176.0, 100.0, 77.0, 31.0, 17.0, 8.0, 5.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -8.9814453125, -8.369140625, -7.7568359375, -7.14453125, -6.5322265625, -5.919921875, -5.3076171875, -4.6953125, -4.0830078125, -3.470703125, -2.8583984375, -2.24609375, -1.6337890625, -1.021484375, -0.4091796875, 0.203125, 0.8154296875, 1.427734375, 2.0400390625, 2.65234375, 3.2646484375, 3.876953125, 4.4892578125, 5.1015625, 5.7138671875, 6.326171875, 6.9384765625, 7.55078125, 8.1630859375, 8.775390625, 9.3876953125, 10.0, 10.6123046875, 11.224609375, 11.8369140625, 12.44921875, 13.0615234375, 13.673828125, 14.2861328125, 14.8984375, 15.5107421875, 16.123046875, 16.7353515625, 17.34765625, 17.9599609375, 18.572265625, 19.1845703125, 19.796875, 20.4091796875, 21.021484375, 21.6337890625, 22.24609375, 22.8583984375, 23.470703125, 24.0830078125, 24.6953125, 25.3076171875, 25.919921875, 26.5322265625, 27.14453125, 27.7568359375, 28.369140625, 28.9814453125, 29.59375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 16.0, 54.0, 278.0, 446.0, 158.0, 32.0, 14.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.33767700195312, -174.10704040527344, -160.87640380859375, -147.64578247070312, -134.41513061523438, -121.18450164794922, -107.95387268066406, -94.72323608398438, -81.49259948730469, -68.261962890625, -55.03133010864258, -41.800697326660156, -28.57006072998047, -15.339424133300781, -2.108795166015625, 11.121841430664062, 24.35247802734375, 37.58311462402344, 50.81374740600586, 64.04438018798828, 77.27501678466797, 90.50565338134766, 103.73628234863281, 116.9669189453125, 130.1975555419922, 143.42819213867188, 156.65882873535156, 169.88946533203125, 183.12008666992188, 196.35073852539062, 209.58135986328125, 222.81199645996094, 236.04266357421875, 249.27330017089844, 262.5039367675781, 275.73455810546875, 288.9652099609375, 302.1958312988281, 315.42645263671875, 328.6571044921875, 341.88775634765625, 355.1183776855469, 368.3490295410156, 381.57965087890625, 394.810302734375, 408.0409240722656, 421.27154541015625, 434.502197265625, 447.7328186035156, 460.96343994140625, 474.194091796875, 487.4247131347656, 500.6553649902344, 513.885986328125, 527.1166381835938, 540.3472900390625, 553.577880859375, 566.8085327148438, 580.0391235351562, 593.269775390625, 606.5004272460938, 619.7310791015625, 632.961669921875, 646.1923217773438, 659.4229736328125]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 7.0, 8.0, 3.0, 8.0, 12.0, 11.0, 15.0, 12.0, 31.0, 35.0, 20.0, 26.0, 32.0, 44.0, 22.0, 40.0, 38.0, 48.0, 53.0, 44.0, 45.0, 51.0, 57.0, 34.0, 37.0, 44.0, 35.0, 37.0, 25.0, 20.0, 16.0, 14.0, 16.0, 15.0, 8.0, 9.0, 8.0, 2.0, 3.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-96.15992736816406, -93.056884765625, -89.95384979248047, -86.8508071899414, -83.74777221679688, -80.64472961425781, -77.54169464111328, -74.43865203857422, -71.33561706542969, -68.23257446289062, -65.1295394897461, -62.0265007019043, -58.9234619140625, -55.8204231262207, -52.717384338378906, -49.614341735839844, -46.51130294799805, -43.40826416015625, -40.30522537231445, -37.202186584472656, -34.09914779663086, -30.996109008789062, -27.893068313598633, -24.790029525756836, -21.68699073791504, -18.583951950073242, -15.480913162231445, -12.377873420715332, -9.274834632873535, -6.171795845031738, -3.068756103515625, 0.034282684326171875, 3.1373214721679688, 6.240360260009766, 9.343399047851562, 12.446438789367676, 15.549477577209473, 18.652515411376953, 21.755556106567383, 24.85859489440918, 27.961633682250977, 31.064672470092773, 34.1677131652832, 37.270751953125, 40.3737907409668, 43.476829528808594, 46.57986831665039, 49.68290710449219, 52.785945892333984, 55.88898468017578, 58.99202346801758, 62.095062255859375, 65.19810485839844, 68.30113983154297, 71.40418243408203, 74.50721740722656, 77.61026000976562, 80.71330261230469, 83.81633758544922, 86.91938018798828, 90.02241516113281, 93.12545776367188, 96.2284927368164, 99.33153533935547, 102.4345703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 6.0, 11.0, 12.0, 14.0, 27.0, 37.0, 60.0, 92.0, 126.0, 260.0, 564.0, 1253.0, 3426.0, 13312.0, 302545.0, 3850104.0, 15966.0, 3792.0, 1344.0, 592.0, 288.0, 153.0, 98.0, 61.0, 41.0, 34.0, 12.0, 10.0, 9.0, 9.0, 3.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.9375, -29.083251953125, -28.22900390625, -27.374755859375, -26.5205078125, -25.666259765625, -24.81201171875, -23.957763671875, -23.103515625, -22.249267578125, -21.39501953125, -20.540771484375, -19.6865234375, -18.832275390625, -17.97802734375, -17.123779296875, -16.26953125, -15.415283203125, -14.56103515625, -13.706787109375, -12.8525390625, -11.998291015625, -11.14404296875, -10.289794921875, -9.435546875, -8.581298828125, -7.72705078125, -6.872802734375, -6.0185546875, -5.164306640625, -4.31005859375, -3.455810546875, -2.6015625, -1.747314453125, -0.89306640625, -0.038818359375, 0.8154296875, 1.669677734375, 2.52392578125, 3.378173828125, 4.232421875, 5.086669921875, 5.94091796875, 6.795166015625, 7.6494140625, 8.503662109375, 9.35791015625, 10.212158203125, 11.06640625, 11.920654296875, 12.77490234375, 13.629150390625, 14.4833984375, 15.337646484375, 16.19189453125, 17.046142578125, 17.900390625, 18.754638671875, 19.60888671875, 20.463134765625, 21.3173828125, 22.171630859375, 23.02587890625, 23.880126953125, 24.734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 11.0, 13.0, 10.0, 20.0, 20.0, 29.0, 37.0, 41.0, 57.0, 51.0, 62.0, 74.0, 76.0, 73.0, 65.0, 56.0, 56.0, 41.0, 40.0, 27.0, 32.0, 18.0, 15.0, 14.0, 12.0, 12.0, 4.0, 10.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-7.63671875, -7.42486572265625, -7.2130126953125, -7.00115966796875, -6.789306640625, -6.57745361328125, -6.3656005859375, -6.15374755859375, -5.94189453125, -5.73004150390625, -5.5181884765625, -5.30633544921875, -5.094482421875, -4.88262939453125, -4.6707763671875, -4.45892333984375, -4.2470703125, -4.03521728515625, -3.8233642578125, -3.61151123046875, -3.399658203125, -3.18780517578125, -2.9759521484375, -2.76409912109375, -2.55224609375, -2.34039306640625, -2.1285400390625, -1.91668701171875, -1.704833984375, -1.49298095703125, -1.2811279296875, -1.06927490234375, -0.857421875, -0.64556884765625, -0.4337158203125, -0.22186279296875, -0.010009765625, 0.20184326171875, 0.4136962890625, 0.62554931640625, 0.83740234375, 1.04925537109375, 1.2611083984375, 1.47296142578125, 1.684814453125, 1.89666748046875, 2.1085205078125, 2.32037353515625, 2.5322265625, 2.74407958984375, 2.9559326171875, 3.16778564453125, 3.379638671875, 3.59149169921875, 3.8033447265625, 4.01519775390625, 4.22705078125, 4.43890380859375, 4.6507568359375, 4.86260986328125, 5.074462890625, 5.28631591796875, 5.4981689453125, 5.71002197265625, 5.921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 13.0, 20.0, 17.0, 27.0, 32.0, 67.0, 77.0, 94.0, 141.0, 188.0, 268.0, 381.0, 543.0, 867.0, 1247.0, 2139.0, 3793.0, 7646.0, 18202.0, 67771.0, 3812346.0, 218890.0, 34012.0, 11965.0, 5706.0, 2910.0, 1649.0, 1026.0, 653.0, 435.0, 335.0, 208.0, 137.0, 125.0, 91.0, 58.0, 44.0, 40.0, 31.0, 21.0, 15.0, 8.0, 11.0, 6.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.984375, -8.6923828125, -8.400390625, -8.1083984375, -7.81640625, -7.5244140625, -7.232421875, -6.9404296875, -6.6484375, -6.3564453125, -6.064453125, -5.7724609375, -5.48046875, -5.1884765625, -4.896484375, -4.6044921875, -4.3125, -4.0205078125, -3.728515625, -3.4365234375, -3.14453125, -2.8525390625, -2.560546875, -2.2685546875, -1.9765625, -1.6845703125, -1.392578125, -1.1005859375, -0.80859375, -0.5166015625, -0.224609375, 0.0673828125, 0.359375, 0.6513671875, 0.943359375, 1.2353515625, 1.52734375, 1.8193359375, 2.111328125, 2.4033203125, 2.6953125, 2.9873046875, 3.279296875, 3.5712890625, 3.86328125, 4.1552734375, 4.447265625, 4.7392578125, 5.03125, 5.3232421875, 5.615234375, 5.9072265625, 6.19921875, 6.4912109375, 6.783203125, 7.0751953125, 7.3671875, 7.6591796875, 7.951171875, 8.2431640625, 8.53515625, 8.8271484375, 9.119140625, 9.4111328125, 9.703125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 17.0, 36.0, 70.0, 181.0, 3309.0, 225.0, 73.0, 50.0, 19.0, 15.0, 9.0, 8.0, 7.0, 4.0, 1.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.052734375, -2.95599365234375, -2.8592529296875, -2.76251220703125, -2.665771484375, -2.56903076171875, -2.4722900390625, -2.37554931640625, -2.27880859375, -2.18206787109375, -2.0853271484375, -1.98858642578125, -1.891845703125, -1.79510498046875, -1.6983642578125, -1.60162353515625, -1.5048828125, -1.40814208984375, -1.3114013671875, -1.21466064453125, -1.117919921875, -1.02117919921875, -0.9244384765625, -0.82769775390625, -0.73095703125, -0.63421630859375, -0.5374755859375, -0.44073486328125, -0.343994140625, -0.24725341796875, -0.1505126953125, -0.05377197265625, 0.04296875, 0.13970947265625, 0.2364501953125, 0.33319091796875, 0.429931640625, 0.52667236328125, 0.6234130859375, 0.72015380859375, 0.81689453125, 0.91363525390625, 1.0103759765625, 1.10711669921875, 1.203857421875, 1.30059814453125, 1.3973388671875, 1.49407958984375, 1.5908203125, 1.68756103515625, 1.7843017578125, 1.88104248046875, 1.977783203125, 2.07452392578125, 2.1712646484375, 2.26800537109375, 2.36474609375, 2.46148681640625, 2.5582275390625, 2.65496826171875, 2.751708984375, 2.84844970703125, 2.9451904296875, 3.04193115234375, 3.138671875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 14.0, 20.0, 47.0, 96.0, 134.0, 185.0, 164.0, 159.0, 75.0, 40.0, 31.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.966727256774902, -12.366374969482422, -11.766022682189941, -11.165670394897461, -10.565317153930664, -9.964964866638184, -9.364612579345703, -8.764259338378906, -8.163908004760742, -7.563555717468262, -6.963202953338623, -6.362850666046143, -5.762497901916504, -5.162145614624023, -4.561793327331543, -3.9614405632019043, -3.3610877990722656, -2.760735273361206, -2.1603827476501465, -1.560030460357666, -0.9596779346466064, -0.3593254089355469, 0.2410268783569336, 0.8413796424865723, 1.4417319297790527, 2.0420844554901123, 2.642436981201172, 3.2427892684936523, 3.843141794204712, 4.4434943199157715, 5.043846607208252, 5.644199371337891, 6.244550704956055, 6.844902992248535, 7.445255756378174, 8.045608520507812, 8.645960807800293, 9.246313095092773, 9.846665382385254, 10.447017669677734, 11.047370910644531, 11.647723197937012, 12.248075485229492, 12.848428726196289, 13.44878101348877, 14.04913330078125, 14.64948558807373, 15.249837875366211, 15.850190162658691, 16.450542449951172, 17.05089569091797, 17.651247024536133, 18.25160026550293, 18.851951599121094, 19.45230484008789, 20.052658081054688, 20.65300941467285, 21.25336265563965, 21.853713989257812, 22.45406723022461, 23.054418563842773, 23.65477180480957, 24.255123138427734, 24.85547637939453, 25.455829620361328]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 7.0, 9.0, 17.0, 12.0, 17.0, 21.0, 28.0, 34.0, 44.0, 35.0, 44.0, 56.0, 51.0, 56.0, 42.0, 47.0, 59.0, 60.0, 51.0, 49.0, 44.0, 36.0, 26.0, 29.0, 21.0, 22.0, 23.0, 9.0, 8.0, 9.0, 10.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.598251342773438, -9.356111526489258, -9.113971710205078, -8.871831893920898, -8.629692077636719, -8.387552261352539, -8.14541244506836, -7.90327262878418, -7.6611328125, -7.41899299621582, -7.176853179931641, -6.934713363647461, -6.692573547363281, -6.450433731079102, -6.208293914794922, -5.966154098510742, -5.724014759063721, -5.481874942779541, -5.239735126495361, -4.997595310211182, -4.755455493927002, -4.513315677642822, -4.271176338195801, -4.029036521911621, -3.7868964672088623, -3.5447566509246826, -3.302616834640503, -3.0604772567749023, -2.8183374404907227, -2.576197624206543, -2.3340578079223633, -2.0919179916381836, -1.849778652191162, -1.6076388359069824, -1.3654990196228027, -1.1233593225479126, -0.8812195062637329, -0.6390796899795532, -0.3969399929046631, -0.1548001766204834, 0.08733963966369629, 0.3294794261455536, 0.5716192126274109, 0.8137589693069458, 1.0558987855911255, 1.2980386018753052, 1.5401782989501953, 1.782318115234375, 2.0244579315185547, 2.2665977478027344, 2.508737564086914, 2.7508773803710938, 2.9930171966552734, 3.235157012939453, 3.4772965908050537, 3.7194364070892334, 3.961576223373413, 4.203715801239014, 4.445855617523193, 4.687995433807373, 4.930135250091553, 5.172275066375732, 5.414414882659912, 5.656554698944092, 5.8986945152282715]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 16.0, 14.0, 23.0, 46.0, 57.0, 114.0, 233.0, 494.0, 1052.0, 2348.0, 6414.0, 18750.0, 65476.0, 245145.0, 451552.0, 185108.0, 48795.0, 14211.0, 4972.0, 1982.0, 874.0, 431.0, 201.0, 100.0, 76.0, 24.0, 17.0, 15.0, 5.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.34375, -16.9246826171875, -16.505615234375, -16.0865478515625, -15.66748046875, -15.2484130859375, -14.829345703125, -14.4102783203125, -13.9912109375, -13.5721435546875, -13.153076171875, -12.7340087890625, -12.31494140625, -11.8958740234375, -11.476806640625, -11.0577392578125, -10.638671875, -10.2196044921875, -9.800537109375, -9.3814697265625, -8.96240234375, -8.5433349609375, -8.124267578125, -7.7052001953125, -7.2861328125, -6.8670654296875, -6.447998046875, -6.0289306640625, -5.60986328125, -5.1907958984375, -4.771728515625, -4.3526611328125, -3.93359375, -3.5145263671875, -3.095458984375, -2.6763916015625, -2.25732421875, -1.8382568359375, -1.419189453125, -1.0001220703125, -0.5810546875, -0.1619873046875, 0.257080078125, 0.6761474609375, 1.09521484375, 1.5142822265625, 1.933349609375, 2.3524169921875, 2.771484375, 3.1905517578125, 3.609619140625, 4.0286865234375, 4.44775390625, 4.8668212890625, 5.285888671875, 5.7049560546875, 6.1240234375, 6.5430908203125, 6.962158203125, 7.3812255859375, 7.80029296875, 8.2193603515625, 8.638427734375, 9.0574951171875, 9.4765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 1.0, 4.0, 11.0, 15.0, 14.0, 11.0, 24.0, 22.0, 19.0, 45.0, 40.0, 54.0, 66.0, 62.0, 66.0, 64.0, 86.0, 64.0, 45.0, 47.0, 37.0, 37.0, 34.0, 25.0, 19.0, 17.0, 10.0, 15.0, 11.0, 7.0, 10.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0], "bins": [-7.51171875, -7.30169677734375, -7.0916748046875, -6.88165283203125, -6.671630859375, -6.46160888671875, -6.2515869140625, -6.04156494140625, -5.83154296875, -5.62152099609375, -5.4114990234375, -5.20147705078125, -4.991455078125, -4.78143310546875, -4.5714111328125, -4.36138916015625, -4.1513671875, -3.94134521484375, -3.7313232421875, -3.52130126953125, -3.311279296875, -3.10125732421875, -2.8912353515625, -2.68121337890625, -2.47119140625, -2.26116943359375, -2.0511474609375, -1.84112548828125, -1.631103515625, -1.42108154296875, -1.2110595703125, -1.00103759765625, -0.791015625, -0.58099365234375, -0.3709716796875, -0.16094970703125, 0.049072265625, 0.25909423828125, 0.4691162109375, 0.67913818359375, 0.88916015625, 1.09918212890625, 1.3092041015625, 1.51922607421875, 1.729248046875, 1.93927001953125, 2.1492919921875, 2.35931396484375, 2.5693359375, 2.77935791015625, 2.9893798828125, 3.19940185546875, 3.409423828125, 3.61944580078125, 3.8294677734375, 4.03948974609375, 4.24951171875, 4.45953369140625, 4.6695556640625, 4.87957763671875, 5.089599609375, 5.29962158203125, 5.5096435546875, 5.71966552734375, 5.9296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 10.0, 13.0, 18.0, 23.0, 41.0, 76.0, 140.0, 265.0, 575.0, 1290.0, 4038.0, 25779.0, 592268.0, 398812.0, 19377.0, 3565.0, 1153.0, 531.0, 255.0, 140.0, 70.0, 39.0, 22.0, 18.0, 15.0, 4.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.125, -32.119384765625, -31.11376953125, -30.108154296875, -29.1025390625, -28.096923828125, -27.09130859375, -26.085693359375, -25.080078125, -24.074462890625, -23.06884765625, -22.063232421875, -21.0576171875, -20.052001953125, -19.04638671875, -18.040771484375, -17.03515625, -16.029541015625, -15.02392578125, -14.018310546875, -13.0126953125, -12.007080078125, -11.00146484375, -9.995849609375, -8.990234375, -7.984619140625, -6.97900390625, -5.973388671875, -4.9677734375, -3.962158203125, -2.95654296875, -1.950927734375, -0.9453125, 0.060302734375, 1.06591796875, 2.071533203125, 3.0771484375, 4.082763671875, 5.08837890625, 6.093994140625, 7.099609375, 8.105224609375, 9.11083984375, 10.116455078125, 11.1220703125, 12.127685546875, 13.13330078125, 14.138916015625, 15.14453125, 16.150146484375, 17.15576171875, 18.161376953125, 19.1669921875, 20.172607421875, 21.17822265625, 22.183837890625, 23.189453125, 24.195068359375, 25.20068359375, 26.206298828125, 27.2119140625, 28.217529296875, 29.22314453125, 30.228759765625, 31.234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 9.0, 2.0, 8.0, 10.0, 21.0, 15.0, 21.0, 33.0, 29.0, 35.0, 60.0, 52.0, 52.0, 61.0, 65.0, 63.0, 64.0, 60.0, 54.0, 44.0, 45.0, 36.0, 30.0, 22.0, 22.0, 18.0, 15.0, 8.0, 7.0, 13.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.84375, -29.74462890625, -28.6455078125, -27.54638671875, -26.447265625, -25.34814453125, -24.2490234375, -23.14990234375, -22.05078125, -20.95166015625, -19.8525390625, -18.75341796875, -17.654296875, -16.55517578125, -15.4560546875, -14.35693359375, -13.2578125, -12.15869140625, -11.0595703125, -9.96044921875, -8.861328125, -7.76220703125, -6.6630859375, -5.56396484375, -4.46484375, -3.36572265625, -2.2666015625, -1.16748046875, -0.068359375, 1.03076171875, 2.1298828125, 3.22900390625, 4.328125, 5.42724609375, 6.5263671875, 7.62548828125, 8.724609375, 9.82373046875, 10.9228515625, 12.02197265625, 13.12109375, 14.22021484375, 15.3193359375, 16.41845703125, 17.517578125, 18.61669921875, 19.7158203125, 20.81494140625, 21.9140625, 23.01318359375, 24.1123046875, 25.21142578125, 26.310546875, 27.40966796875, 28.5087890625, 29.60791015625, 30.70703125, 31.80615234375, 32.9052734375, 34.00439453125, 35.103515625, 36.20263671875, 37.3017578125, 38.40087890625, 39.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 12.0, 20.0, 22.0, 20.0, 26.0, 43.0, 47.0, 57.0, 93.0, 176.0, 287.0, 660.0, 1929.0, 15269.0, 854474.0, 167288.0, 5786.0, 1180.0, 460.0, 213.0, 143.0, 90.0, 68.0, 60.0, 35.0, 20.0, 13.0, 6.0, 10.0, 7.0, 4.0, 6.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -18.120849609375, -17.44482421875, -16.768798828125, -16.0927734375, -15.416748046875, -14.74072265625, -14.064697265625, -13.388671875, -12.712646484375, -12.03662109375, -11.360595703125, -10.6845703125, -10.008544921875, -9.33251953125, -8.656494140625, -7.98046875, -7.304443359375, -6.62841796875, -5.952392578125, -5.2763671875, -4.600341796875, -3.92431640625, -3.248291015625, -2.572265625, -1.896240234375, -1.22021484375, -0.544189453125, 0.1318359375, 0.807861328125, 1.48388671875, 2.159912109375, 2.8359375, 3.511962890625, 4.18798828125, 4.864013671875, 5.5400390625, 6.216064453125, 6.89208984375, 7.568115234375, 8.244140625, 8.920166015625, 9.59619140625, 10.272216796875, 10.9482421875, 11.624267578125, 12.30029296875, 12.976318359375, 13.65234375, 14.328369140625, 15.00439453125, 15.680419921875, 16.3564453125, 17.032470703125, 17.70849609375, 18.384521484375, 19.060546875, 19.736572265625, 20.41259765625, 21.088623046875, 21.7646484375, 22.440673828125, 23.11669921875, 23.792724609375, 24.46875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 9.0, 4.0, 11.0, 7.0, 10.0, 10.0, 16.0, 20.0, 23.0, 33.0, 26.0, 41.0, 61.0, 63.0, 77.0, 112.0, 106.0, 65.0, 60.0, 45.0, 31.0, 37.0, 35.0, 26.0, 16.0, 11.0, 14.0, 7.0, 5.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0009160041809082031, -0.0008878782391548157, -0.0008597522974014282, -0.0008316263556480408, -0.0008035004138946533, -0.0007753744721412659, -0.0007472485303878784, -0.000719122588634491, -0.0006909966468811035, -0.0006628707051277161, -0.0006347447633743286, -0.0006066188216209412, -0.0005784928798675537, -0.0005503669381141663, -0.0005222409963607788, -0.0004941150546073914, -0.0004659891128540039, -0.00043786317110061646, -0.000409737229347229, -0.00038161128759384155, -0.0003534853458404541, -0.00032535940408706665, -0.0002972334623336792, -0.00026910752058029175, -0.0002409815788269043, -0.00021285563707351685, -0.0001847296953201294, -0.00015660375356674194, -0.0001284778118133545, -0.00010035187005996704, -7.222592830657959e-05, -4.409998655319214e-05, -1.5974044799804688e-05, 1.2151896953582764e-05, 4.0277838706970215e-05, 6.840378046035767e-05, 9.652972221374512e-05, 0.00012465566396713257, 0.00015278160572052002, 0.00018090754747390747, 0.00020903348922729492, 0.00023715943098068237, 0.0002652853727340698, 0.0002934113144874573, 0.0003215372562408447, 0.0003496631979942322, 0.00037778913974761963, 0.0004059150815010071, 0.00043404102325439453, 0.000462166965007782, 0.0004902929067611694, 0.0005184188485145569, 0.0005465447902679443, 0.0005746707320213318, 0.0006027966737747192, 0.0006309226155281067, 0.0006590485572814941, 0.0006871744990348816, 0.000715300440788269, 0.0007434263825416565, 0.0007715523242950439, 0.0007996782660484314, 0.0008278042078018188, 0.0008559301495552063, 0.0008840560913085938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 5.0, 7.0, 5.0, 10.0, 14.0, 23.0, 36.0, 43.0, 92.0, 149.0, 326.0, 710.0, 2285.0, 14725.0, 747335.0, 270740.0, 9077.0, 1716.0, 591.0, 303.0, 143.0, 78.0, 45.0, 32.0, 21.0, 14.0, 11.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-27.9375, -27.2542724609375, -26.571044921875, -25.8878173828125, -25.20458984375, -24.5213623046875, -23.838134765625, -23.1549072265625, -22.4716796875, -21.7884521484375, -21.105224609375, -20.4219970703125, -19.73876953125, -19.0555419921875, -18.372314453125, -17.6890869140625, -17.005859375, -16.3226318359375, -15.639404296875, -14.9561767578125, -14.27294921875, -13.5897216796875, -12.906494140625, -12.2232666015625, -11.5400390625, -10.8568115234375, -10.173583984375, -9.4903564453125, -8.80712890625, -8.1239013671875, -7.440673828125, -6.7574462890625, -6.07421875, -5.3909912109375, -4.707763671875, -4.0245361328125, -3.34130859375, -2.6580810546875, -1.974853515625, -1.2916259765625, -0.6083984375, 0.0748291015625, 0.758056640625, 1.4412841796875, 2.12451171875, 2.8077392578125, 3.490966796875, 4.1741943359375, 4.857421875, 5.5406494140625, 6.223876953125, 6.9071044921875, 7.59033203125, 8.2735595703125, 8.956787109375, 9.6400146484375, 10.3232421875, 11.0064697265625, 11.689697265625, 12.3729248046875, 13.05615234375, 13.7393798828125, 14.422607421875, 15.1058349609375, 15.7890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 9.0, 8.0, 11.0, 11.0, 26.0, 48.0, 116.0, 216.0, 244.0, 159.0, 62.0, 32.0, 16.0, 15.0, 9.0, 5.0, 3.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.0782470703125, -11.226806640625, -10.3753662109375, -9.52392578125, -8.6724853515625, -7.821044921875, -6.9696044921875, -6.1181640625, -5.2667236328125, -4.415283203125, -3.5638427734375, -2.71240234375, -1.8609619140625, -1.009521484375, -0.1580810546875, 0.693359375, 1.5447998046875, 2.396240234375, 3.2476806640625, 4.09912109375, 4.9505615234375, 5.802001953125, 6.6534423828125, 7.5048828125, 8.3563232421875, 9.207763671875, 10.0592041015625, 10.91064453125, 11.7620849609375, 12.613525390625, 13.4649658203125, 14.31640625, 15.1678466796875, 16.019287109375, 16.8707275390625, 17.72216796875, 18.5736083984375, 19.425048828125, 20.2764892578125, 21.1279296875, 21.9793701171875, 22.830810546875, 23.6822509765625, 24.53369140625, 25.3851318359375, 26.236572265625, 27.0880126953125, 27.939453125, 28.7908935546875, 29.642333984375, 30.4937744140625, 31.34521484375, 32.1966552734375, 33.048095703125, 33.8995361328125, 34.7509765625, 35.6024169921875, 36.453857421875, 37.3052978515625, 38.15673828125, 39.0081787109375, 39.859619140625, 40.7110595703125, 41.5625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 49.0, 191.0, 407.0, 265.0, 52.0, 20.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-295.6648254394531, -283.236328125, -270.80780029296875, -258.3793029785156, -245.95079040527344, -233.52227783203125, -221.09378051757812, -208.66526794433594, -196.23675537109375, -183.80824279785156, -171.37973022460938, -158.95123291015625, -146.52272033691406, -134.09420776367188, -121.66570281982422, -109.23719787597656, -96.80868530273438, -84.38017272949219, -71.95166778564453, -59.52315902709961, -47.09465026855469, -34.666141510009766, -22.237632751464844, -9.809127807617188, 2.619384765625, 15.047893524169922, 27.476402282714844, 39.904911041259766, 52.33341979980469, 64.76193237304688, 77.19043731689453, 89.61894226074219, 102.0474853515625, 114.47599792480469, 126.90450286865234, 139.3330078125, 151.7615203857422, 164.19003295898438, 176.6185302734375, 189.0470428466797, 201.47555541992188, 213.90406799316406, 226.33258056640625, 238.76107788085938, 251.18959045410156, 263.61810302734375, 276.0466003417969, 288.47509765625, 300.90362548828125, 313.3321228027344, 325.7606506347656, 338.18914794921875, 350.61767578125, 363.0461730957031, 375.47467041015625, 387.9031982421875, 400.3316955566406, 412.76019287109375, 425.188720703125, 437.6172180175781, 450.04571533203125, 462.4742431640625, 474.9027404785156, 487.33123779296875, 499.759765625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 12.0, 13.0, 22.0, 22.0, 34.0, 30.0, 35.0, 30.0, 37.0, 48.0, 53.0, 58.0, 55.0, 60.0, 54.0, 68.0, 49.0, 41.0, 43.0, 42.0, 37.0, 39.0, 27.0, 17.0, 12.0, 10.0, 8.0, 8.0, 3.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.3040313720703, -144.83834838867188, -140.37265014648438, -135.90696716308594, -131.44126892089844, -126.9755859375, -122.50989532470703, -118.04420471191406, -113.5785140991211, -109.11282348632812, -104.64713287353516, -100.18144226074219, -95.71575927734375, -91.25006103515625, -86.78437805175781, -82.31868743896484, -77.85299682617188, -73.3873062133789, -68.92161560058594, -64.45592498779297, -59.990238189697266, -55.5245475769043, -51.058860778808594, -46.593170166015625, -42.127479553222656, -37.66178894042969, -33.19609832763672, -28.730411529541016, -24.264720916748047, -19.799030303955078, -15.333341598510742, -10.867652893066406, -6.4019622802734375, -1.9362726211547852, 2.529417037963867, 6.9951066970825195, 11.460796356201172, 15.92648696899414, 20.392175674438477, 24.857864379882812, 29.32355499267578, 33.78924560546875, 38.25493621826172, 42.72062301635742, 47.18631362915039, 51.65200424194336, 56.11769104003906, 60.58338165283203, 65.049072265625, 69.51476287841797, 73.98045349121094, 78.4461441040039, 82.91183471679688, 87.37751770019531, 91.84320831298828, 96.30889892578125, 100.77458953857422, 105.24028015136719, 109.70597076416016, 114.17166137695312, 118.63734436035156, 123.10304260253906, 127.5687255859375, 132.034423828125, 136.50010681152344]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 8.0, 12.0, 14.0, 23.0, 40.0, 64.0, 111.0, 176.0, 332.0, 608.0, 1490.0, 4219.0, 16197.0, 187254.0, 3928353.0, 43575.0, 7534.0, 2369.0, 943.0, 408.0, 226.0, 133.0, 69.0, 31.0, 30.0, 19.0, 10.0, 5.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.328125, -22.7337646484375, -22.139404296875, -21.5450439453125, -20.95068359375, -20.3563232421875, -19.761962890625, -19.1676025390625, -18.5732421875, -17.9788818359375, -17.384521484375, -16.7901611328125, -16.19580078125, -15.6014404296875, -15.007080078125, -14.4127197265625, -13.818359375, -13.2239990234375, -12.629638671875, -12.0352783203125, -11.44091796875, -10.8465576171875, -10.252197265625, -9.6578369140625, -9.0634765625, -8.4691162109375, -7.874755859375, -7.2803955078125, -6.68603515625, -6.0916748046875, -5.497314453125, -4.9029541015625, -4.30859375, -3.7142333984375, -3.119873046875, -2.5255126953125, -1.93115234375, -1.3367919921875, -0.742431640625, -0.1480712890625, 0.4462890625, 1.0406494140625, 1.635009765625, 2.2293701171875, 2.82373046875, 3.4180908203125, 4.012451171875, 4.6068115234375, 5.201171875, 5.7955322265625, 6.389892578125, 6.9842529296875, 7.57861328125, 8.1729736328125, 8.767333984375, 9.3616943359375, 9.9560546875, 10.5504150390625, 11.144775390625, 11.7391357421875, 12.33349609375, 12.9278564453125, 13.522216796875, 14.1165771484375, 14.7109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 5.0, 5.0, 15.0, 23.0, 33.0, 43.0, 67.0, 89.0, 78.0, 100.0, 107.0, 100.0, 77.0, 60.0, 44.0, 42.0, 25.0, 22.0, 20.0, 14.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9921875, -11.6614990234375, -11.330810546875, -11.0001220703125, -10.66943359375, -10.3387451171875, -10.008056640625, -9.6773681640625, -9.3466796875, -9.0159912109375, -8.685302734375, -8.3546142578125, -8.02392578125, -7.6932373046875, -7.362548828125, -7.0318603515625, -6.701171875, -6.3704833984375, -6.039794921875, -5.7091064453125, -5.37841796875, -5.0477294921875, -4.717041015625, -4.3863525390625, -4.0556640625, -3.7249755859375, -3.394287109375, -3.0635986328125, -2.73291015625, -2.4022216796875, -2.071533203125, -1.7408447265625, -1.41015625, -1.0794677734375, -0.748779296875, -0.4180908203125, -0.08740234375, 0.2432861328125, 0.573974609375, 0.9046630859375, 1.2353515625, 1.5660400390625, 1.896728515625, 2.2274169921875, 2.55810546875, 2.8887939453125, 3.219482421875, 3.5501708984375, 3.880859375, 4.2115478515625, 4.542236328125, 4.8729248046875, 5.20361328125, 5.5343017578125, 5.864990234375, 6.1956787109375, 6.5263671875, 6.8570556640625, 7.187744140625, 7.5184326171875, 7.84912109375, 8.1798095703125, 8.510498046875, 8.8411865234375, 9.171875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 8.0, 8.0, 15.0, 16.0, 18.0, 22.0, 32.0, 36.0, 28.0, 47.0, 57.0, 57.0, 76.0, 107.0, 132.0, 205.0, 431.0, 955.0, 2821.0, 11072.0, 101821.0, 4010701.0, 53555.0, 7846.0, 2219.0, 769.0, 358.0, 186.0, 148.0, 95.0, 71.0, 69.0, 51.0, 40.0, 36.0, 32.0, 24.0, 23.0, 19.0, 17.0, 13.0, 5.0, 6.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-19.65625, -19.009521484375, -18.36279296875, -17.716064453125, -17.0693359375, -16.422607421875, -15.77587890625, -15.129150390625, -14.482421875, -13.835693359375, -13.18896484375, -12.542236328125, -11.8955078125, -11.248779296875, -10.60205078125, -9.955322265625, -9.30859375, -8.661865234375, -8.01513671875, -7.368408203125, -6.7216796875, -6.074951171875, -5.42822265625, -4.781494140625, -4.134765625, -3.488037109375, -2.84130859375, -2.194580078125, -1.5478515625, -0.901123046875, -0.25439453125, 0.392333984375, 1.0390625, 1.685791015625, 2.33251953125, 2.979248046875, 3.6259765625, 4.272705078125, 4.91943359375, 5.566162109375, 6.212890625, 6.859619140625, 7.50634765625, 8.153076171875, 8.7998046875, 9.446533203125, 10.09326171875, 10.739990234375, 11.38671875, 12.033447265625, 12.68017578125, 13.326904296875, 13.9736328125, 14.620361328125, 15.26708984375, 15.913818359375, 16.560546875, 17.207275390625, 17.85400390625, 18.500732421875, 19.1474609375, 19.794189453125, 20.44091796875, 21.087646484375, 21.734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 8.0, 16.0, 20.0, 61.0, 194.0, 3236.0, 381.0, 86.0, 29.0, 20.0, 7.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.625, -5.266845703125, -4.90869140625, -4.550537109375, -4.1923828125, -3.834228515625, -3.47607421875, -3.117919921875, -2.759765625, -2.401611328125, -2.04345703125, -1.685302734375, -1.3271484375, -0.968994140625, -0.61083984375, -0.252685546875, 0.10546875, 0.463623046875, 0.82177734375, 1.179931640625, 1.5380859375, 1.896240234375, 2.25439453125, 2.612548828125, 2.970703125, 3.328857421875, 3.68701171875, 4.045166015625, 4.4033203125, 4.761474609375, 5.11962890625, 5.477783203125, 5.8359375, 6.194091796875, 6.55224609375, 6.910400390625, 7.2685546875, 7.626708984375, 7.98486328125, 8.343017578125, 8.701171875, 9.059326171875, 9.41748046875, 9.775634765625, 10.1337890625, 10.491943359375, 10.85009765625, 11.208251953125, 11.56640625, 11.924560546875, 12.28271484375, 12.640869140625, 12.9990234375, 13.357177734375, 13.71533203125, 14.073486328125, 14.431640625, 14.789794921875, 15.14794921875, 15.506103515625, 15.8642578125, 16.222412109375, 16.58056640625, 16.938720703125, 17.296875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 20.0, 49.0, 195.0, 395.0, 238.0, 78.0, 18.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.07235717773438, -117.27413940429688, -114.47592163085938, -111.6777114868164, -108.8794937133789, -106.0812759399414, -103.28306579589844, -100.48484802246094, -97.68663024902344, -94.88841247558594, -92.09019470214844, -89.29198455810547, -86.49376678466797, -83.69554901123047, -80.8973388671875, -78.09912109375, -75.3009033203125, -72.502685546875, -69.7044677734375, -66.90625762939453, -64.10803985595703, -61.30982208251953, -58.5116081237793, -55.71339416503906, -52.91517639160156, -50.11695861816406, -47.31874465942383, -44.520530700683594, -41.722312927246094, -38.924095153808594, -36.12588119506836, -33.327667236328125, -30.529441833496094, -27.731225967407227, -24.93301010131836, -22.134794235229492, -19.336578369140625, -16.538362503051758, -13.74014663696289, -10.941930770874023, -8.143714904785156, -5.345499038696289, -2.547283172607422, 0.2509326934814453, 3.0491485595703125, 5.84736442565918, 8.645580291748047, 11.443796157836914, 14.242012023925781, 17.04022789001465, 19.838443756103516, 22.636659622192383, 25.43487548828125, 28.233091354370117, 31.031307220458984, 33.82952117919922, 36.62773895263672, 39.42595672607422, 42.22417068481445, 45.02238464355469, 47.82060241699219, 50.61882019042969, 53.41703414916992, 56.215248107910156, 59.013465881347656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 14.0, 5.0, 12.0, 24.0, 27.0, 36.0, 42.0, 67.0, 61.0, 86.0, 82.0, 99.0, 80.0, 61.0, 59.0, 53.0, 45.0, 46.0, 29.0, 21.0, 13.0, 12.0, 10.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.109657287597656, -35.99424362182617, -34.87882995605469, -33.7634162902832, -32.64800262451172, -31.532588958740234, -30.41717529296875, -29.301761627197266, -28.18634796142578, -27.070934295654297, -25.955520629882812, -24.840106964111328, -23.724693298339844, -22.60927963256836, -21.493865966796875, -20.37845230102539, -19.263038635253906, -18.147624969482422, -17.032211303710938, -15.916797637939453, -14.801383972167969, -13.685970306396484, -12.570556640625, -11.455142974853516, -10.339729309082031, -9.224315643310547, -8.108901977539062, -6.993488311767578, -5.878074645996094, -4.762660980224609, -3.647247314453125, -2.5318336486816406, -1.4164199829101562, -0.3010063171386719, 0.8144073486328125, 1.9298210144042969, 3.0452346801757812, 4.160648345947266, 5.27606201171875, 6.391475677490234, 7.506889343261719, 8.622303009033203, 9.737716674804688, 10.853130340576172, 11.968544006347656, 13.08395767211914, 14.199371337890625, 15.31478500366211, 16.430198669433594, 17.545612335205078, 18.661026000976562, 19.776439666748047, 20.89185333251953, 22.007266998291016, 23.1226806640625, 24.238094329833984, 25.35350799560547, 26.468921661376953, 27.584335327148438, 28.699748992919922, 29.815162658691406, 30.93057632446289, 32.045989990234375, 33.16140365600586, 34.276817321777344]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 8.0, 9.0, 10.0, 7.0, 9.0, 20.0, 39.0, 34.0, 68.0, 113.0, 225.0, 379.0, 645.0, 1307.0, 2738.0, 6652.0, 18511.0, 66232.0, 278732.0, 467763.0, 149028.0, 36278.0, 11193.0, 4320.0, 2016.0, 943.0, 528.0, 297.0, 163.0, 99.0, 66.0, 42.0, 24.0, 18.0, 16.0, 6.0, 3.0, 6.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5234375, -12.08056640625, -11.6376953125, -11.19482421875, -10.751953125, -10.30908203125, -9.8662109375, -9.42333984375, -8.98046875, -8.53759765625, -8.0947265625, -7.65185546875, -7.208984375, -6.76611328125, -6.3232421875, -5.88037109375, -5.4375, -4.99462890625, -4.5517578125, -4.10888671875, -3.666015625, -3.22314453125, -2.7802734375, -2.33740234375, -1.89453125, -1.45166015625, -1.0087890625, -0.56591796875, -0.123046875, 0.31982421875, 0.7626953125, 1.20556640625, 1.6484375, 2.09130859375, 2.5341796875, 2.97705078125, 3.419921875, 3.86279296875, 4.3056640625, 4.74853515625, 5.19140625, 5.63427734375, 6.0771484375, 6.52001953125, 6.962890625, 7.40576171875, 7.8486328125, 8.29150390625, 8.734375, 9.17724609375, 9.6201171875, 10.06298828125, 10.505859375, 10.94873046875, 11.3916015625, 11.83447265625, 12.27734375, 12.72021484375, 13.1630859375, 13.60595703125, 14.048828125, 14.49169921875, 14.9345703125, 15.37744140625, 15.8203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 2.0, 3.0, 10.0, 9.0, 12.0, 7.0, 19.0, 20.0, 35.0, 48.0, 60.0, 67.0, 71.0, 81.0, 58.0, 87.0, 69.0, 76.0, 56.0, 33.0, 33.0, 25.0, 31.0, 22.0, 14.0, 19.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2265625, -8.96136474609375, -8.6961669921875, -8.43096923828125, -8.165771484375, -7.90057373046875, -7.6353759765625, -7.37017822265625, -7.10498046875, -6.83978271484375, -6.5745849609375, -6.30938720703125, -6.044189453125, -5.77899169921875, -5.5137939453125, -5.24859619140625, -4.9833984375, -4.71820068359375, -4.4530029296875, -4.18780517578125, -3.922607421875, -3.65740966796875, -3.3922119140625, -3.12701416015625, -2.86181640625, -2.59661865234375, -2.3314208984375, -2.06622314453125, -1.801025390625, -1.53582763671875, -1.2706298828125, -1.00543212890625, -0.740234375, -0.47503662109375, -0.2098388671875, 0.05535888671875, 0.320556640625, 0.58575439453125, 0.8509521484375, 1.11614990234375, 1.38134765625, 1.64654541015625, 1.9117431640625, 2.17694091796875, 2.442138671875, 2.70733642578125, 2.9725341796875, 3.23773193359375, 3.5029296875, 3.76812744140625, 4.0333251953125, 4.29852294921875, 4.563720703125, 4.82891845703125, 5.0941162109375, 5.35931396484375, 5.62451171875, 5.88970947265625, 6.1549072265625, 6.42010498046875, 6.685302734375, 6.95050048828125, 7.2156982421875, 7.48089599609375, 7.74609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 5.0, 7.0, 6.0, 6.0, 11.0, 16.0, 26.0, 37.0, 48.0, 69.0, 132.0, 222.0, 403.0, 815.0, 2101.0, 7068.0, 49044.0, 751724.0, 213963.0, 16524.0, 3677.0, 1327.0, 557.0, 311.0, 176.0, 88.0, 57.0, 48.0, 23.0, 14.0, 15.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.5, -35.55810546875, -34.6162109375, -33.67431640625, -32.732421875, -31.79052734375, -30.8486328125, -29.90673828125, -28.96484375, -28.02294921875, -27.0810546875, -26.13916015625, -25.197265625, -24.25537109375, -23.3134765625, -22.37158203125, -21.4296875, -20.48779296875, -19.5458984375, -18.60400390625, -17.662109375, -16.72021484375, -15.7783203125, -14.83642578125, -13.89453125, -12.95263671875, -12.0107421875, -11.06884765625, -10.126953125, -9.18505859375, -8.2431640625, -7.30126953125, -6.359375, -5.41748046875, -4.4755859375, -3.53369140625, -2.591796875, -1.64990234375, -0.7080078125, 0.23388671875, 1.17578125, 2.11767578125, 3.0595703125, 4.00146484375, 4.943359375, 5.88525390625, 6.8271484375, 7.76904296875, 8.7109375, 9.65283203125, 10.5947265625, 11.53662109375, 12.478515625, 13.42041015625, 14.3623046875, 15.30419921875, 16.24609375, 17.18798828125, 18.1298828125, 19.07177734375, 20.013671875, 20.95556640625, 21.8974609375, 22.83935546875, 23.78125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 7.0, 7.0, 8.0, 9.0, 25.0, 34.0, 34.0, 30.0, 40.0, 57.0, 90.0, 75.0, 73.0, 77.0, 63.0, 68.0, 60.0, 52.0, 50.0, 29.0, 28.0, 21.0, 12.0, 9.0, 9.0, 11.0, 6.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.56884765625, -37.3251953125, -36.08154296875, -34.837890625, -33.59423828125, -32.3505859375, -31.10693359375, -29.86328125, -28.61962890625, -27.3759765625, -26.13232421875, -24.888671875, -23.64501953125, -22.4013671875, -21.15771484375, -19.9140625, -18.67041015625, -17.4267578125, -16.18310546875, -14.939453125, -13.69580078125, -12.4521484375, -11.20849609375, -9.96484375, -8.72119140625, -7.4775390625, -6.23388671875, -4.990234375, -3.74658203125, -2.5029296875, -1.25927734375, -0.015625, 1.22802734375, 2.4716796875, 3.71533203125, 4.958984375, 6.20263671875, 7.4462890625, 8.68994140625, 9.93359375, 11.17724609375, 12.4208984375, 13.66455078125, 14.908203125, 16.15185546875, 17.3955078125, 18.63916015625, 19.8828125, 21.12646484375, 22.3701171875, 23.61376953125, 24.857421875, 26.10107421875, 27.3447265625, 28.58837890625, 29.83203125, 31.07568359375, 32.3193359375, 33.56298828125, 34.806640625, 36.05029296875, 37.2939453125, 38.53759765625, 39.78125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 3.0, 10.0, 17.0, 13.0, 27.0, 26.0, 41.0, 47.0, 78.0, 103.0, 131.0, 202.0, 355.0, 686.0, 1630.0, 5174.0, 24736.0, 206333.0, 695382.0, 93832.0, 13790.0, 3261.0, 1126.0, 594.0, 302.0, 186.0, 129.0, 94.0, 68.0, 43.0, 31.0, 30.0, 16.0, 11.0, 9.0, 8.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.58203125, -6.35760498046875, -6.1331787109375, -5.90875244140625, -5.684326171875, -5.45989990234375, -5.2354736328125, -5.01104736328125, -4.78662109375, -4.56219482421875, -4.3377685546875, -4.11334228515625, -3.888916015625, -3.66448974609375, -3.4400634765625, -3.21563720703125, -2.9912109375, -2.76678466796875, -2.5423583984375, -2.31793212890625, -2.093505859375, -1.86907958984375, -1.6446533203125, -1.42022705078125, -1.19580078125, -0.97137451171875, -0.7469482421875, -0.52252197265625, -0.298095703125, -0.07366943359375, 0.1507568359375, 0.37518310546875, 0.599609375, 0.82403564453125, 1.0484619140625, 1.27288818359375, 1.497314453125, 1.72174072265625, 1.9461669921875, 2.17059326171875, 2.39501953125, 2.61944580078125, 2.8438720703125, 3.06829833984375, 3.292724609375, 3.51715087890625, 3.7415771484375, 3.96600341796875, 4.1904296875, 4.41485595703125, 4.6392822265625, 4.86370849609375, 5.088134765625, 5.31256103515625, 5.5369873046875, 5.76141357421875, 5.98583984375, 6.21026611328125, 6.4346923828125, 6.65911865234375, 6.883544921875, 7.10797119140625, 7.3323974609375, 7.55682373046875, 7.78125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 11.0, 7.0, 9.0, 17.0, 17.0, 25.0, 41.0, 72.0, 93.0, 159.0, 176.0, 128.0, 70.0, 52.0, 38.0, 24.0, 19.0, 7.0, 13.0, 7.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0020008087158203125, -0.0019524097442626953, -0.0019040107727050781, -0.001855611801147461, -0.0018072128295898438, -0.0017588138580322266, -0.0017104148864746094, -0.0016620159149169922, -0.001613616943359375, -0.0015652179718017578, -0.0015168190002441406, -0.0014684200286865234, -0.0014200210571289062, -0.001371622085571289, -0.0013232231140136719, -0.0012748241424560547, -0.0012264251708984375, -0.0011780261993408203, -0.0011296272277832031, -0.001081228256225586, -0.0010328292846679688, -0.0009844303131103516, -0.0009360313415527344, -0.0008876323699951172, -0.0008392333984375, -0.0007908344268798828, -0.0007424354553222656, -0.0006940364837646484, -0.0006456375122070312, -0.0005972385406494141, -0.0005488395690917969, -0.0005004405975341797, -0.0004520416259765625, -0.0004036426544189453, -0.0003552436828613281, -0.00030684471130371094, -0.00025844573974609375, -0.00021004676818847656, -0.00016164779663085938, -0.00011324882507324219, -6.4849853515625e-05, -1.6450881958007812e-05, 3.1948089599609375e-05, 8.034706115722656e-05, 0.00012874603271484375, 0.00017714500427246094, 0.00022554397583007812, 0.0002739429473876953, 0.0003223419189453125, 0.0003707408905029297, 0.0004191398620605469, 0.00046753883361816406, 0.0005159378051757812, 0.0005643367767333984, 0.0006127357482910156, 0.0006611347198486328, 0.00070953369140625, 0.0007579326629638672, 0.0008063316345214844, 0.0008547306060791016, 0.0009031295776367188, 0.0009515285491943359, 0.0009999275207519531, 0.0010483264923095703, 0.0010967254638671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 14.0, 14.0, 18.0, 36.0, 52.0, 63.0, 109.0, 170.0, 281.0, 488.0, 980.0, 2374.0, 8437.0, 58397.0, 700974.0, 246503.0, 21755.0, 4534.0, 1601.0, 729.0, 385.0, 232.0, 124.0, 94.0, 51.0, 36.0, 22.0, 23.0, 13.0, 8.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.51513671875, -9.2333984375, -8.95166015625, -8.669921875, -8.38818359375, -8.1064453125, -7.82470703125, -7.54296875, -7.26123046875, -6.9794921875, -6.69775390625, -6.416015625, -6.13427734375, -5.8525390625, -5.57080078125, -5.2890625, -5.00732421875, -4.7255859375, -4.44384765625, -4.162109375, -3.88037109375, -3.5986328125, -3.31689453125, -3.03515625, -2.75341796875, -2.4716796875, -2.18994140625, -1.908203125, -1.62646484375, -1.3447265625, -1.06298828125, -0.78125, -0.49951171875, -0.2177734375, 0.06396484375, 0.345703125, 0.62744140625, 0.9091796875, 1.19091796875, 1.47265625, 1.75439453125, 2.0361328125, 2.31787109375, 2.599609375, 2.88134765625, 3.1630859375, 3.44482421875, 3.7265625, 4.00830078125, 4.2900390625, 4.57177734375, 4.853515625, 5.13525390625, 5.4169921875, 5.69873046875, 5.98046875, 6.26220703125, 6.5439453125, 6.82568359375, 7.107421875, 7.38916015625, 7.6708984375, 7.95263671875, 8.234375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 5.0, 17.0, 18.0, 28.0, 49.0, 64.0, 104.0, 150.0, 177.0, 149.0, 89.0, 62.0, 25.0, 22.0, 15.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.28076171875, -7.8271484375, -7.37353515625, -6.919921875, -6.46630859375, -6.0126953125, -5.55908203125, -5.10546875, -4.65185546875, -4.1982421875, -3.74462890625, -3.291015625, -2.83740234375, -2.3837890625, -1.93017578125, -1.4765625, -1.02294921875, -0.5693359375, -0.11572265625, 0.337890625, 0.79150390625, 1.2451171875, 1.69873046875, 2.15234375, 2.60595703125, 3.0595703125, 3.51318359375, 3.966796875, 4.42041015625, 4.8740234375, 5.32763671875, 5.78125, 6.23486328125, 6.6884765625, 7.14208984375, 7.595703125, 8.04931640625, 8.5029296875, 8.95654296875, 9.41015625, 9.86376953125, 10.3173828125, 10.77099609375, 11.224609375, 11.67822265625, 12.1318359375, 12.58544921875, 13.0390625, 13.49267578125, 13.9462890625, 14.39990234375, 14.853515625, 15.30712890625, 15.7607421875, 16.21435546875, 16.66796875, 17.12158203125, 17.5751953125, 18.02880859375, 18.482421875, 18.93603515625, 19.3896484375, 19.84326171875, 20.296875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 12.0, 23.0, 40.0, 80.0, 121.0, 167.0, 171.0, 120.0, 110.0, 58.0, 37.0, 22.0, 13.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-188.11119079589844, -183.02825927734375, -177.94532775878906, -172.8623809814453, -167.77944946289062, -162.69651794433594, -157.61358642578125, -152.53065490722656, -147.44772338867188, -142.3647918701172, -137.2818603515625, -132.19891357421875, -127.11598205566406, -122.03305053710938, -116.95011901855469, -111.8671875, -106.78424072265625, -101.70130920410156, -96.61837005615234, -91.53543853759766, -86.45249938964844, -81.36956787109375, -76.28663635253906, -71.20370483398438, -66.12076568603516, -61.0378303527832, -55.95489501953125, -50.87196350097656, -45.78902816772461, -40.706092834472656, -35.62316131591797, -30.540225982666016, -25.457275390625, -20.374340057373047, -15.291406631469727, -10.20847225189209, -5.125537872314453, -0.0426025390625, 5.04033088684082, 10.12326431274414, 15.206199645996094, 20.289134979248047, 25.372068405151367, 30.455001831054688, 35.53793716430664, 40.620872497558594, 45.70380401611328, 50.786739349365234, 55.86967468261719, 60.95261001586914, 66.0355453491211, 71.11847686767578, 76.201416015625, 81.28434753417969, 86.36727905273438, 91.45021057128906, 96.53314971923828, 101.61608123779297, 106.69902038574219, 111.78195190429688, 116.86488342285156, 121.94782257080078, 127.03075408935547, 132.1136932373047, 137.19662475585938]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 9.0, 6.0, 15.0, 13.0, 19.0, 26.0, 35.0, 32.0, 30.0, 40.0, 40.0, 45.0, 48.0, 71.0, 65.0, 64.0, 42.0, 57.0, 43.0, 44.0, 38.0, 31.0, 26.0, 28.0, 22.0, 23.0, 13.0, 12.0, 13.0, 5.0, 6.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-159.5902099609375, -155.27658081054688, -150.9629669189453, -146.6493377685547, -142.33572387695312, -138.0220947265625, -133.70848083496094, -129.3948516845703, -125.08123016357422, -120.76760864257812, -116.45398712158203, -112.14036560058594, -107.82673645019531, -103.51312255859375, -99.19949340820312, -94.88587188720703, -90.57225036621094, -86.25862884521484, -81.94500732421875, -77.63138580322266, -73.31776428222656, -69.00413513183594, -64.69051361083984, -60.37689208984375, -56.063270568847656, -51.74964904785156, -47.43602752685547, -43.12240219116211, -38.808780670166016, -34.49515914916992, -30.181535720825195, -25.86791229248047, -21.554283142089844, -17.24066162109375, -12.927038192749023, -8.613415718078613, -4.299793243408203, 0.013828277587890625, 4.327451705932617, 8.641075134277344, 12.954696655273438, 17.26831817626953, 21.581941604614258, 25.895565032958984, 30.209186553955078, 34.52280807495117, 38.83643341064453, 43.150054931640625, 47.46367645263672, 51.77729797363281, 56.090919494628906, 60.404544830322266, 64.71817016601562, 69.03178405761719, 73.34541320800781, 77.6590347290039, 81.97265625, 86.2862777709961, 90.59989929199219, 94.91352081298828, 99.22714233398438, 103.540771484375, 107.8543930053711, 112.16801452636719, 116.48163604736328]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 4.0, 8.0, 16.0, 32.0, 33.0, 56.0, 83.0, 124.0, 190.0, 277.0, 504.0, 876.0, 1550.0, 3327.0, 7808.0, 24423.0, 146508.0, 3546652.0, 403163.0, 39106.0, 10888.0, 4173.0, 2001.0, 990.0, 560.0, 315.0, 217.0, 127.0, 85.0, 60.0, 32.0, 26.0, 15.0, 9.0, 17.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.40625, -11.00830078125, -10.6103515625, -10.21240234375, -9.814453125, -9.41650390625, -9.0185546875, -8.62060546875, -8.22265625, -7.82470703125, -7.4267578125, -7.02880859375, -6.630859375, -6.23291015625, -5.8349609375, -5.43701171875, -5.0390625, -4.64111328125, -4.2431640625, -3.84521484375, -3.447265625, -3.04931640625, -2.6513671875, -2.25341796875, -1.85546875, -1.45751953125, -1.0595703125, -0.66162109375, -0.263671875, 0.13427734375, 0.5322265625, 0.93017578125, 1.328125, 1.72607421875, 2.1240234375, 2.52197265625, 2.919921875, 3.31787109375, 3.7158203125, 4.11376953125, 4.51171875, 4.90966796875, 5.3076171875, 5.70556640625, 6.103515625, 6.50146484375, 6.8994140625, 7.29736328125, 7.6953125, 8.09326171875, 8.4912109375, 8.88916015625, 9.287109375, 9.68505859375, 10.0830078125, 10.48095703125, 10.87890625, 11.27685546875, 11.6748046875, 12.07275390625, 12.470703125, 12.86865234375, 13.2666015625, 13.66455078125, 14.0625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 11.0, 9.0, 4.0, 13.0, 12.0, 14.0, 21.0, 32.0, 42.0, 43.0, 55.0, 66.0, 68.0, 69.0, 71.0, 81.0, 70.0, 61.0, 52.0, 47.0, 41.0, 24.0, 17.0, 23.0, 10.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.6270751953125, -7.390869140625, -7.1546630859375, -6.91845703125, -6.6822509765625, -6.446044921875, -6.2098388671875, -5.9736328125, -5.7374267578125, -5.501220703125, -5.2650146484375, -5.02880859375, -4.7926025390625, -4.556396484375, -4.3201904296875, -4.083984375, -3.8477783203125, -3.611572265625, -3.3753662109375, -3.13916015625, -2.9029541015625, -2.666748046875, -2.4305419921875, -2.1943359375, -1.9581298828125, -1.721923828125, -1.4857177734375, -1.24951171875, -1.0133056640625, -0.777099609375, -0.5408935546875, -0.3046875, -0.0684814453125, 0.167724609375, 0.4039306640625, 0.64013671875, 0.8763427734375, 1.112548828125, 1.3487548828125, 1.5849609375, 1.8211669921875, 2.057373046875, 2.2935791015625, 2.52978515625, 2.7659912109375, 3.002197265625, 3.2384033203125, 3.474609375, 3.7108154296875, 3.947021484375, 4.1832275390625, 4.41943359375, 4.6556396484375, 4.891845703125, 5.1280517578125, 5.3642578125, 5.6004638671875, 5.836669921875, 6.0728759765625, 6.30908203125, 6.5452880859375, 6.781494140625, 7.0177001953125, 7.25390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 2.0, 9.0, 8.0, 16.0, 22.0, 28.0, 62.0, 133.0, 335.0, 1049.0, 4067.0, 22392.0, 401675.0, 3695946.0, 57511.0, 8010.0, 1858.0, 647.0, 236.0, 103.0, 55.0, 22.0, 22.0, 14.0, 10.0, 12.0, 6.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.3115234375, -17.638671875, -16.9658203125, -16.29296875, -15.6201171875, -14.947265625, -14.2744140625, -13.6015625, -12.9287109375, -12.255859375, -11.5830078125, -10.91015625, -10.2373046875, -9.564453125, -8.8916015625, -8.21875, -7.5458984375, -6.873046875, -6.2001953125, -5.52734375, -4.8544921875, -4.181640625, -3.5087890625, -2.8359375, -2.1630859375, -1.490234375, -0.8173828125, -0.14453125, 0.5283203125, 1.201171875, 1.8740234375, 2.546875, 3.2197265625, 3.892578125, 4.5654296875, 5.23828125, 5.9111328125, 6.583984375, 7.2568359375, 7.9296875, 8.6025390625, 9.275390625, 9.9482421875, 10.62109375, 11.2939453125, 11.966796875, 12.6396484375, 13.3125, 13.9853515625, 14.658203125, 15.3310546875, 16.00390625, 16.6767578125, 17.349609375, 18.0224609375, 18.6953125, 19.3681640625, 20.041015625, 20.7138671875, 21.38671875, 22.0595703125, 22.732421875, 23.4052734375, 24.078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 3.0, 3.0, 4.0, 5.0, 13.0, 20.0, 28.0, 22.0, 43.0, 86.0, 140.0, 362.0, 965.0, 1358.0, 542.0, 198.0, 85.0, 61.0, 30.0, 24.0, 12.0, 8.0, 12.0, 11.0, 7.0, 4.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.4189453125, -10.947265625, -10.4755859375, -10.00390625, -9.5322265625, -9.060546875, -8.5888671875, -8.1171875, -7.6455078125, -7.173828125, -6.7021484375, -6.23046875, -5.7587890625, -5.287109375, -4.8154296875, -4.34375, -3.8720703125, -3.400390625, -2.9287109375, -2.45703125, -1.9853515625, -1.513671875, -1.0419921875, -0.5703125, -0.0986328125, 0.373046875, 0.8447265625, 1.31640625, 1.7880859375, 2.259765625, 2.7314453125, 3.203125, 3.6748046875, 4.146484375, 4.6181640625, 5.08984375, 5.5615234375, 6.033203125, 6.5048828125, 6.9765625, 7.4482421875, 7.919921875, 8.3916015625, 8.86328125, 9.3349609375, 9.806640625, 10.2783203125, 10.75, 11.2216796875, 11.693359375, 12.1650390625, 12.63671875, 13.1083984375, 13.580078125, 14.0517578125, 14.5234375, 14.9951171875, 15.466796875, 15.9384765625, 16.41015625, 16.8818359375, 17.353515625, 17.8251953125, 18.296875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 5.0, 18.0, 22.0, 40.0, 88.0, 165.0, 189.0, 207.0, 125.0, 63.0, 37.0, 16.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.50045776367188, -153.36856079101562, -149.23666381835938, -145.10475158691406, -140.9728546142578, -136.84095764160156, -132.7090606689453, -128.57716369628906, -124.44525909423828, -120.31336212158203, -116.18145751953125, -112.049560546875, -107.91766357421875, -103.78575897216797, -99.65386199951172, -95.52195739746094, -91.39006042480469, -87.25816345214844, -83.12625885009766, -78.9943618774414, -74.86245727539062, -70.73056030273438, -66.59866333007812, -62.46676254272461, -58.334861755371094, -54.20296096801758, -50.07106018066406, -45.93916320800781, -41.8072624206543, -37.67536163330078, -33.54346466064453, -29.411563873291016, -25.279647827148438, -21.147747039794922, -17.01584815979004, -12.88394832611084, -8.75204849243164, -4.620147705078125, -0.4882488250732422, 3.6436500549316406, 7.775550842285156, 11.907450675964355, 16.039350509643555, 20.171249389648438, 24.303150177001953, 28.43505096435547, 32.56694793701172, 36.698848724365234, 40.83074951171875, 44.962650299072266, 49.09455108642578, 53.22644805908203, 57.35834884643555, 61.49024963378906, 65.62214660644531, 69.75404357910156, 73.88594818115234, 78.0178451538086, 82.14974975585938, 86.28164672851562, 90.41354370117188, 94.54544830322266, 98.6773452758789, 102.80924987792969, 106.94114685058594]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 2.0, 10.0, 10.0, 9.0, 16.0, 11.0, 29.0, 29.0, 40.0, 36.0, 38.0, 46.0, 45.0, 50.0, 55.0, 66.0, 47.0, 62.0, 50.0, 50.0, 32.0, 39.0, 42.0, 26.0, 34.0, 24.0, 33.0, 11.0, 15.0, 13.0, 9.0, 8.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-69.17698669433594, -67.13843536376953, -65.09988403320312, -63.06132888793945, -61.02277755737305, -58.98422622680664, -56.94567108154297, -54.90711975097656, -52.868568420410156, -50.83001708984375, -48.791465759277344, -46.75291061401367, -44.714359283447266, -42.67580795288086, -40.63725280761719, -38.59870147705078, -36.560150146484375, -34.52159881591797, -32.48304748535156, -30.44449234008789, -28.405941009521484, -26.367389678955078, -24.32883644104004, -22.290283203125, -20.251731872558594, -18.213180541992188, -16.17462730407715, -14.136075019836426, -12.097522735595703, -10.05897045135498, -8.020418167114258, -5.981865882873535, -3.9433059692382812, -1.9047536849975586, 0.13379859924316406, 2.1723508834838867, 4.210903167724609, 6.249455451965332, 8.288007736206055, 10.326560020446777, 12.3651123046875, 14.403664588928223, 16.442216873168945, 18.480770111083984, 20.51932144165039, 22.557872772216797, 24.596426010131836, 26.634979248046875, 28.67353057861328, 30.712081909179688, 32.750633239746094, 34.789188385009766, 36.82773971557617, 38.86629104614258, 40.90484619140625, 42.943397521972656, 44.98194885253906, 47.02050018310547, 49.059051513671875, 51.09760665893555, 53.13615798950195, 55.17470932006836, 57.21326446533203, 59.25181579589844, 61.290367126464844]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 15.0, 24.0, 37.0, 50.0, 61.0, 104.0, 146.0, 322.0, 562.0, 1071.0, 1976.0, 4258.0, 10160.0, 26913.0, 83431.0, 285419.0, 429284.0, 136163.0, 42096.0, 14903.0, 5937.0, 2640.0, 1327.0, 664.0, 384.0, 236.0, 138.0, 84.0, 49.0, 35.0, 18.0, 11.0, 12.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9921875, -9.61083984375, -9.2294921875, -8.84814453125, -8.466796875, -8.08544921875, -7.7041015625, -7.32275390625, -6.94140625, -6.56005859375, -6.1787109375, -5.79736328125, -5.416015625, -5.03466796875, -4.6533203125, -4.27197265625, -3.890625, -3.50927734375, -3.1279296875, -2.74658203125, -2.365234375, -1.98388671875, -1.6025390625, -1.22119140625, -0.83984375, -0.45849609375, -0.0771484375, 0.30419921875, 0.685546875, 1.06689453125, 1.4482421875, 1.82958984375, 2.2109375, 2.59228515625, 2.9736328125, 3.35498046875, 3.736328125, 4.11767578125, 4.4990234375, 4.88037109375, 5.26171875, 5.64306640625, 6.0244140625, 6.40576171875, 6.787109375, 7.16845703125, 7.5498046875, 7.93115234375, 8.3125, 8.69384765625, 9.0751953125, 9.45654296875, 9.837890625, 10.21923828125, 10.6005859375, 10.98193359375, 11.36328125, 11.74462890625, 12.1259765625, 12.50732421875, 12.888671875, 13.27001953125, 13.6513671875, 14.03271484375, 14.4140625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 8.0, 2.0, 2.0, 14.0, 11.0, 16.0, 24.0, 29.0, 48.0, 42.0, 54.0, 64.0, 66.0, 69.0, 82.0, 78.0, 66.0, 56.0, 52.0, 44.0, 31.0, 34.0, 24.0, 27.0, 13.0, 10.0, 6.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.7890625, -7.55645751953125, -7.3238525390625, -7.09124755859375, -6.858642578125, -6.62603759765625, -6.3934326171875, -6.16082763671875, -5.92822265625, -5.69561767578125, -5.4630126953125, -5.23040771484375, -4.997802734375, -4.76519775390625, -4.5325927734375, -4.29998779296875, -4.0673828125, -3.83477783203125, -3.6021728515625, -3.36956787109375, -3.136962890625, -2.90435791015625, -2.6717529296875, -2.43914794921875, -2.20654296875, -1.97393798828125, -1.7413330078125, -1.50872802734375, -1.276123046875, -1.04351806640625, -0.8109130859375, -0.57830810546875, -0.345703125, -0.11309814453125, 0.1195068359375, 0.35211181640625, 0.584716796875, 0.81732177734375, 1.0499267578125, 1.28253173828125, 1.51513671875, 1.74774169921875, 1.9803466796875, 2.21295166015625, 2.445556640625, 2.67816162109375, 2.9107666015625, 3.14337158203125, 3.3759765625, 3.60858154296875, 3.8411865234375, 4.07379150390625, 4.306396484375, 4.53900146484375, 4.7716064453125, 5.00421142578125, 5.23681640625, 5.46942138671875, 5.7020263671875, 5.93463134765625, 6.167236328125, 6.39984130859375, 6.6324462890625, 6.86505126953125, 7.09765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 5.0, 6.0, 11.0, 13.0, 30.0, 26.0, 46.0, 91.0, 154.0, 331.0, 871.0, 2722.0, 17166.0, 789230.0, 226138.0, 8690.0, 1823.0, 620.0, 244.0, 136.0, 69.0, 40.0, 24.0, 17.0, 12.0, 13.0, 6.0, 9.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.71875, -44.3681640625, -43.017578125, -41.6669921875, -40.31640625, -38.9658203125, -37.615234375, -36.2646484375, -34.9140625, -33.5634765625, -32.212890625, -30.8623046875, -29.51171875, -28.1611328125, -26.810546875, -25.4599609375, -24.109375, -22.7587890625, -21.408203125, -20.0576171875, -18.70703125, -17.3564453125, -16.005859375, -14.6552734375, -13.3046875, -11.9541015625, -10.603515625, -9.2529296875, -7.90234375, -6.5517578125, -5.201171875, -3.8505859375, -2.5, -1.1494140625, 0.201171875, 1.5517578125, 2.90234375, 4.2529296875, 5.603515625, 6.9541015625, 8.3046875, 9.6552734375, 11.005859375, 12.3564453125, 13.70703125, 15.0576171875, 16.408203125, 17.7587890625, 19.109375, 20.4599609375, 21.810546875, 23.1611328125, 24.51171875, 25.8623046875, 27.212890625, 28.5634765625, 29.9140625, 31.2646484375, 32.615234375, 33.9658203125, 35.31640625, 36.6669921875, 38.017578125, 39.3681640625, 40.71875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 3.0, 7.0, 9.0, 19.0, 12.0, 14.0, 24.0, 36.0, 56.0, 43.0, 63.0, 52.0, 70.0, 66.0, 69.0, 65.0, 59.0, 51.0, 52.0, 43.0, 37.0, 32.0, 27.0, 11.0, 15.0, 10.0, 8.0, 5.0, 3.0, 6.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-37.5625, -36.565673828125, -35.56884765625, -34.572021484375, -33.5751953125, -32.578369140625, -31.58154296875, -30.584716796875, -29.587890625, -28.591064453125, -27.59423828125, -26.597412109375, -25.6005859375, -24.603759765625, -23.60693359375, -22.610107421875, -21.61328125, -20.616455078125, -19.61962890625, -18.622802734375, -17.6259765625, -16.629150390625, -15.63232421875, -14.635498046875, -13.638671875, -12.641845703125, -11.64501953125, -10.648193359375, -9.6513671875, -8.654541015625, -7.65771484375, -6.660888671875, -5.6640625, -4.667236328125, -3.67041015625, -2.673583984375, -1.6767578125, -0.679931640625, 0.31689453125, 1.313720703125, 2.310546875, 3.307373046875, 4.30419921875, 5.301025390625, 6.2978515625, 7.294677734375, 8.29150390625, 9.288330078125, 10.28515625, 11.281982421875, 12.27880859375, 13.275634765625, 14.2724609375, 15.269287109375, 16.26611328125, 17.262939453125, 18.259765625, 19.256591796875, 20.25341796875, 21.250244140625, 22.2470703125, 23.243896484375, 24.24072265625, 25.237548828125, 26.234375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 6.0, 5.0, 13.0, 9.0, 20.0, 25.0, 40.0, 62.0, 101.0, 186.0, 419.0, 1270.0, 5978.0, 94952.0, 908778.0, 31801.0, 3270.0, 841.0, 350.0, 166.0, 95.0, 49.0, 33.0, 29.0, 17.0, 5.0, 11.0, 8.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.7734375, -14.330322265625, -13.88720703125, -13.444091796875, -13.0009765625, -12.557861328125, -12.11474609375, -11.671630859375, -11.228515625, -10.785400390625, -10.34228515625, -9.899169921875, -9.4560546875, -9.012939453125, -8.56982421875, -8.126708984375, -7.68359375, -7.240478515625, -6.79736328125, -6.354248046875, -5.9111328125, -5.468017578125, -5.02490234375, -4.581787109375, -4.138671875, -3.695556640625, -3.25244140625, -2.809326171875, -2.3662109375, -1.923095703125, -1.47998046875, -1.036865234375, -0.59375, -0.150634765625, 0.29248046875, 0.735595703125, 1.1787109375, 1.621826171875, 2.06494140625, 2.508056640625, 2.951171875, 3.394287109375, 3.83740234375, 4.280517578125, 4.7236328125, 5.166748046875, 5.60986328125, 6.052978515625, 6.49609375, 6.939208984375, 7.38232421875, 7.825439453125, 8.2685546875, 8.711669921875, 9.15478515625, 9.597900390625, 10.041015625, 10.484130859375, 10.92724609375, 11.370361328125, 11.8134765625, 12.256591796875, 12.69970703125, 13.142822265625, 13.5859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 2.0, 5.0, 9.0, 7.0, 11.0, 11.0, 9.0, 17.0, 28.0, 26.0, 38.0, 47.0, 77.0, 117.0, 148.0, 137.0, 85.0, 61.0, 40.0, 20.0, 20.0, 22.0, 10.0, 15.0, 9.0, 9.0, 6.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013093948364257812, -0.0012704581022262573, -0.0012315213680267334, -0.0011925846338272095, -0.0011536478996276855, -0.0011147111654281616, -0.0010757744312286377, -0.0010368376970291138, -0.0009979009628295898, -0.0009589642286300659, -0.000920027494430542, -0.0008810907602310181, -0.0008421540260314941, -0.0008032172918319702, -0.0007642805576324463, -0.0007253438234329224, -0.0006864070892333984, -0.0006474703550338745, -0.0006085336208343506, -0.0005695968866348267, -0.0005306601524353027, -0.0004917234182357788, -0.0004527866840362549, -0.00041384994983673096, -0.00037491321563720703, -0.0003359764814376831, -0.0002970397472381592, -0.00025810301303863525, -0.00021916627883911133, -0.0001802295446395874, -0.00014129281044006348, -0.00010235607624053955, -6.341934204101562e-05, -2.44826078414917e-05, 1.4454126358032227e-05, 5.339086055755615e-05, 9.232759475708008e-05, 0.000131264328956604, 0.00017020106315612793, 0.00020913779735565186, 0.0002480745315551758, 0.0002870112657546997, 0.00032594799995422363, 0.00036488473415374756, 0.0004038214683532715, 0.0004427582025527954, 0.00048169493675231934, 0.0005206316709518433, 0.0005595684051513672, 0.0005985051393508911, 0.000637441873550415, 0.000676378607749939, 0.0007153153419494629, 0.0007542520761489868, 0.0007931888103485107, 0.0008321255445480347, 0.0008710622787475586, 0.0009099990129470825, 0.0009489357471466064, 0.0009878724813461304, 0.0010268092155456543, 0.0010657459497451782, 0.0011046826839447021, 0.001143619418144226, 0.00118255615234375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 5.0, 12.0, 20.0, 20.0, 52.0, 74.0, 104.0, 174.0, 293.0, 597.0, 1337.0, 4055.0, 20861.0, 337258.0, 645217.0, 30166.0, 5135.0, 1640.0, 704.0, 332.0, 163.0, 115.0, 65.0, 48.0, 27.0, 17.0, 11.0, 12.0, 5.0, 9.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.053955078125, -7.73291015625, -7.411865234375, -7.0908203125, -6.769775390625, -6.44873046875, -6.127685546875, -5.806640625, -5.485595703125, -5.16455078125, -4.843505859375, -4.5224609375, -4.201416015625, -3.88037109375, -3.559326171875, -3.23828125, -2.917236328125, -2.59619140625, -2.275146484375, -1.9541015625, -1.633056640625, -1.31201171875, -0.990966796875, -0.669921875, -0.348876953125, -0.02783203125, 0.293212890625, 0.6142578125, 0.935302734375, 1.25634765625, 1.577392578125, 1.8984375, 2.219482421875, 2.54052734375, 2.861572265625, 3.1826171875, 3.503662109375, 3.82470703125, 4.145751953125, 4.466796875, 4.787841796875, 5.10888671875, 5.429931640625, 5.7509765625, 6.072021484375, 6.39306640625, 6.714111328125, 7.03515625, 7.356201171875, 7.67724609375, 7.998291015625, 8.3193359375, 8.640380859375, 8.96142578125, 9.282470703125, 9.603515625, 9.924560546875, 10.24560546875, 10.566650390625, 10.8876953125, 11.208740234375, 11.52978515625, 11.850830078125, 12.171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 6.0, 2.0, 5.0, 11.0, 12.0, 16.0, 19.0, 19.0, 34.0, 45.0, 52.0, 78.0, 80.0, 100.0, 83.0, 76.0, 67.0, 63.0, 48.0, 41.0, 26.0, 15.0, 20.0, 15.0, 9.0, 5.0, 6.0, 5.0, 8.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0], "bins": [-6.83203125, -6.6192626953125, -6.406494140625, -6.1937255859375, -5.98095703125, -5.7681884765625, -5.555419921875, -5.3426513671875, -5.1298828125, -4.9171142578125, -4.704345703125, -4.4915771484375, -4.27880859375, -4.0660400390625, -3.853271484375, -3.6405029296875, -3.427734375, -3.2149658203125, -3.002197265625, -2.7894287109375, -2.57666015625, -2.3638916015625, -2.151123046875, -1.9383544921875, -1.7255859375, -1.5128173828125, -1.300048828125, -1.0872802734375, -0.87451171875, -0.6617431640625, -0.448974609375, -0.2362060546875, -0.0234375, 0.1893310546875, 0.402099609375, 0.6148681640625, 0.82763671875, 1.0404052734375, 1.253173828125, 1.4659423828125, 1.6787109375, 1.8914794921875, 2.104248046875, 2.3170166015625, 2.52978515625, 2.7425537109375, 2.955322265625, 3.1680908203125, 3.380859375, 3.5936279296875, 3.806396484375, 4.0191650390625, 4.23193359375, 4.4447021484375, 4.657470703125, 4.8702392578125, 5.0830078125, 5.2957763671875, 5.508544921875, 5.7213134765625, 5.93408203125, 6.1468505859375, 6.359619140625, 6.5723876953125, 6.78515625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 13.0, 30.0, 102.0, 297.0, 326.0, 140.0, 56.0, 20.0, 9.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-397.07867431640625, -388.6428527832031, -380.2070007324219, -371.77117919921875, -363.3353271484375, -354.8995056152344, -346.4636535644531, -338.02783203125, -329.59197998046875, -321.1561584472656, -312.7203063964844, -304.28448486328125, -295.8486328125, -287.4128112792969, -278.9769592285156, -270.5411376953125, -262.1053161621094, -253.6694793701172, -245.233642578125, -236.7978057861328, -228.36196899414062, -219.9261474609375, -211.4903106689453, -203.05447387695312, -194.61863708496094, -186.18280029296875, -177.74696350097656, -169.31112670898438, -160.87530517578125, -152.439453125, -144.00363159179688, -135.5677947998047, -127.1319580078125, -118.69612121582031, -110.26028442382812, -101.82445526123047, -93.38861846923828, -84.9527816772461, -76.51695251464844, -68.08111572265625, -59.64527893066406, -51.209442138671875, -42.77360916137695, -34.33777618408203, -25.901939392089844, -17.466102600097656, -9.030269622802734, -0.5944366455078125, 7.841400146484375, 16.27723503112793, 24.713069915771484, 33.148902893066406, 41.584739685058594, 50.02057647705078, 58.4564094543457, 66.89224243164062, 75.32807922363281, 83.763916015625, 92.19975280761719, 100.63558197021484, 109.07141876220703, 117.50725555419922, 125.94308471679688, 134.37892150878906, 142.81475830078125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 1.0, 8.0, 5.0, 6.0, 12.0, 18.0, 25.0, 21.0, 35.0, 44.0, 51.0, 45.0, 54.0, 66.0, 81.0, 88.0, 59.0, 66.0, 55.0, 51.0, 32.0, 30.0, 28.0, 28.0, 20.0, 16.0, 19.0, 7.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-163.83663940429688, -159.44334411621094, -155.05006408691406, -150.65676879882812, -146.26348876953125, -141.8701934814453, -137.47691345214844, -133.0836181640625, -128.69033813476562, -124.29705047607422, -119.90376281738281, -115.5104751586914, -111.1171875, -106.72389221191406, -102.33060455322266, -97.93731689453125, -93.54402160644531, -89.1507339477539, -84.7574462890625, -80.3641586303711, -75.97087097167969, -71.57757568359375, -67.18428802490234, -62.79100036621094, -58.39771270751953, -54.004425048828125, -49.61113739013672, -45.21784591674805, -40.82455825805664, -36.431270599365234, -32.03797912597656, -27.644691467285156, -23.251388549804688, -18.85810089111328, -14.464811325073242, -10.07152271270752, -5.678234100341797, -1.2849464416503906, 3.1083431243896484, 7.5016326904296875, 11.894920349121094, 16.2882080078125, 20.68149757385254, 25.074787139892578, 29.468074798583984, 33.86136245727539, 38.25465393066406, 42.64794158935547, 47.041229248046875, 51.43451690673828, 55.82780456542969, 60.22109603881836, 64.6143798828125, 69.00767517089844, 73.40096282958984, 77.79425048828125, 82.18753814697266, 86.58082580566406, 90.97411346435547, 95.36740112304688, 99.76069641113281, 104.15397644042969, 108.54727172851562, 112.94055938720703, 117.33384704589844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 6.0, 3.0, 3.0, 8.0, 11.0, 11.0, 19.0, 16.0, 30.0, 34.0, 38.0, 91.0, 112.0, 196.0, 301.0, 538.0, 1013.0, 2164.0, 5299.0, 15821.0, 81966.0, 1829815.0, 2141014.0, 88916.0, 16691.0, 5465.0, 2214.0, 1051.0, 593.0, 285.0, 195.0, 119.0, 83.0, 50.0, 30.0, 25.0, 15.0, 12.0, 6.0, 12.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.734375, -10.4278564453125, -10.121337890625, -9.8148193359375, -9.50830078125, -9.2017822265625, -8.895263671875, -8.5887451171875, -8.2822265625, -7.9757080078125, -7.669189453125, -7.3626708984375, -7.05615234375, -6.7496337890625, -6.443115234375, -6.1365966796875, -5.830078125, -5.5235595703125, -5.217041015625, -4.9105224609375, -4.60400390625, -4.2974853515625, -3.990966796875, -3.6844482421875, -3.3779296875, -3.0714111328125, -2.764892578125, -2.4583740234375, -2.15185546875, -1.8453369140625, -1.538818359375, -1.2322998046875, -0.92578125, -0.6192626953125, -0.312744140625, -0.0062255859375, 0.30029296875, 0.6068115234375, 0.913330078125, 1.2198486328125, 1.5263671875, 1.8328857421875, 2.139404296875, 2.4459228515625, 2.75244140625, 3.0589599609375, 3.365478515625, 3.6719970703125, 3.978515625, 4.2850341796875, 4.591552734375, 4.8980712890625, 5.20458984375, 5.5111083984375, 5.817626953125, 6.1241455078125, 6.4306640625, 6.7371826171875, 7.043701171875, 7.3502197265625, 7.65673828125, 7.9632568359375, 8.269775390625, 8.5762939453125, 8.8828125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 2.0, 7.0, 7.0, 20.0, 20.0, 17.0, 37.0, 51.0, 47.0, 80.0, 77.0, 90.0, 86.0, 90.0, 73.0, 59.0, 51.0, 42.0, 32.0, 25.0, 24.0, 15.0, 11.0, 7.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.578125, -9.30810546875, -9.0380859375, -8.76806640625, -8.498046875, -8.22802734375, -7.9580078125, -7.68798828125, -7.41796875, -7.14794921875, -6.8779296875, -6.60791015625, -6.337890625, -6.06787109375, -5.7978515625, -5.52783203125, -5.2578125, -4.98779296875, -4.7177734375, -4.44775390625, -4.177734375, -3.90771484375, -3.6376953125, -3.36767578125, -3.09765625, -2.82763671875, -2.5576171875, -2.28759765625, -2.017578125, -1.74755859375, -1.4775390625, -1.20751953125, -0.9375, -0.66748046875, -0.3974609375, -0.12744140625, 0.142578125, 0.41259765625, 0.6826171875, 0.95263671875, 1.22265625, 1.49267578125, 1.7626953125, 2.03271484375, 2.302734375, 2.57275390625, 2.8427734375, 3.11279296875, 3.3828125, 3.65283203125, 3.9228515625, 4.19287109375, 4.462890625, 4.73291015625, 5.0029296875, 5.27294921875, 5.54296875, 5.81298828125, 6.0830078125, 6.35302734375, 6.623046875, 6.89306640625, 7.1630859375, 7.43310546875, 7.703125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 18.0, 30.0, 53.0, 96.0, 236.0, 534.0, 1324.0, 3799.0, 12803.0, 66808.0, 2583469.0, 1459278.0, 50699.0, 10269.0, 3054.0, 1044.0, 415.0, 183.0, 75.0, 33.0, 27.0, 15.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.515625, -12.0831298828125, -11.650634765625, -11.2181396484375, -10.78564453125, -10.3531494140625, -9.920654296875, -9.4881591796875, -9.0556640625, -8.6231689453125, -8.190673828125, -7.7581787109375, -7.32568359375, -6.8931884765625, -6.460693359375, -6.0281982421875, -5.595703125, -5.1632080078125, -4.730712890625, -4.2982177734375, -3.86572265625, -3.4332275390625, -3.000732421875, -2.5682373046875, -2.1357421875, -1.7032470703125, -1.270751953125, -0.8382568359375, -0.40576171875, 0.0267333984375, 0.459228515625, 0.8917236328125, 1.32421875, 1.7567138671875, 2.189208984375, 2.6217041015625, 3.05419921875, 3.4866943359375, 3.919189453125, 4.3516845703125, 4.7841796875, 5.2166748046875, 5.649169921875, 6.0816650390625, 6.51416015625, 6.9466552734375, 7.379150390625, 7.8116455078125, 8.244140625, 8.6766357421875, 9.109130859375, 9.5416259765625, 9.97412109375, 10.4066162109375, 10.839111328125, 11.2716064453125, 11.7041015625, 12.1365966796875, 12.569091796875, 13.0015869140625, 13.43408203125, 13.8665771484375, 14.299072265625, 14.7315673828125, 15.1640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 8.0, 10.0, 8.0, 14.0, 23.0, 25.0, 48.0, 108.0, 211.0, 514.0, 1059.0, 1138.0, 476.0, 199.0, 81.0, 54.0, 24.0, 22.0, 12.0, 9.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.234375, -11.8260498046875, -11.417724609375, -11.0093994140625, -10.60107421875, -10.1927490234375, -9.784423828125, -9.3760986328125, -8.9677734375, -8.5594482421875, -8.151123046875, -7.7427978515625, -7.33447265625, -6.9261474609375, -6.517822265625, -6.1094970703125, -5.701171875, -5.2928466796875, -4.884521484375, -4.4761962890625, -4.06787109375, -3.6595458984375, -3.251220703125, -2.8428955078125, -2.4345703125, -2.0262451171875, -1.617919921875, -1.2095947265625, -0.80126953125, -0.3929443359375, 0.015380859375, 0.4237060546875, 0.83203125, 1.2403564453125, 1.648681640625, 2.0570068359375, 2.46533203125, 2.8736572265625, 3.281982421875, 3.6903076171875, 4.0986328125, 4.5069580078125, 4.915283203125, 5.3236083984375, 5.73193359375, 6.1402587890625, 6.548583984375, 6.9569091796875, 7.365234375, 7.7735595703125, 8.181884765625, 8.5902099609375, 8.99853515625, 9.4068603515625, 9.815185546875, 10.2235107421875, 10.6318359375, 11.0401611328125, 11.448486328125, 11.8568115234375, 12.26513671875, 12.6734619140625, 13.081787109375, 13.4901123046875, 13.8984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 7.0, 6.0, 24.0, 50.0, 100.0, 152.0, 219.0, 169.0, 119.0, 63.0, 38.0, 13.0, 15.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.99039459228516, -87.25459289550781, -84.51879119873047, -81.78298950195312, -79.04719543457031, -76.31139373779297, -73.57559204101562, -70.83979034423828, -68.10398864746094, -65.3681869506836, -62.63238525390625, -59.89658737182617, -57.16078567504883, -54.424983978271484, -51.689186096191406, -48.95338439941406, -46.21758270263672, -43.481781005859375, -40.74597930908203, -38.01018142700195, -35.27437973022461, -32.538578033447266, -29.802778244018555, -27.066978454589844, -24.3311767578125, -21.595375061035156, -18.859575271606445, -16.123775482177734, -13.38797378540039, -10.652173042297363, -7.916372299194336, -5.180572509765625, -2.4447708129882812, 0.2910299301147461, 3.0268306732177734, 5.762631416320801, 8.498432159423828, 11.234232902526855, 13.970033645629883, 16.705833435058594, 19.441635131835938, 22.17743682861328, 24.913236618041992, 27.649036407470703, 30.384838104248047, 33.12063980102539, 35.85643768310547, 38.59223937988281, 41.328041076660156, 44.0638427734375, 46.799644470214844, 49.53544235229492, 52.271244049072266, 55.00704574584961, 57.74284362792969, 60.47864532470703, 63.214447021484375, 65.95024871826172, 68.68605041503906, 71.4218521118164, 74.15765380859375, 76.89344787597656, 79.6292495727539, 82.36505126953125, 85.1008529663086]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 8.0, 13.0, 11.0, 13.0, 7.0, 12.0, 19.0, 34.0, 40.0, 46.0, 52.0, 40.0, 45.0, 52.0, 48.0, 84.0, 59.0, 47.0, 52.0, 45.0, 50.0, 39.0, 36.0, 29.0, 25.0, 19.0, 16.0, 11.0, 7.0, 11.0, 6.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.56804656982422, -38.130245208740234, -36.69244384765625, -35.254642486572266, -33.81684112548828, -32.37903594970703, -30.94123649597168, -29.503433227539062, -28.065631866455078, -26.627830505371094, -25.19002914428711, -23.752227783203125, -22.314424514770508, -20.876623153686523, -19.43882179260254, -18.001018524169922, -16.56321907043457, -15.125417709350586, -13.687615394592285, -12.2498140335083, -10.81201171875, -9.374210357666016, -7.936408996582031, -6.4986066818237305, -5.060805320739746, -3.6230034828186035, -2.18520188331604, -0.7474002838134766, 0.690401554107666, 2.1282033920288086, 3.566004753112793, 5.003807067871094, 6.441608428955078, 7.879410266876221, 9.317212104797363, 10.755013465881348, 12.192815780639648, 13.630617141723633, 15.068418502807617, 16.506221771240234, 17.94402313232422, 19.381824493408203, 20.819625854492188, 22.257427215576172, 23.69523048400879, 25.133031845092773, 26.570833206176758, 28.008636474609375, 29.446435928344727, 30.88423728942871, 32.32204055786133, 33.75984191894531, 35.1976432800293, 36.63544464111328, 38.073246002197266, 39.51104736328125, 40.948848724365234, 42.38665008544922, 43.8244514465332, 45.26225280761719, 46.70005416870117, 48.137855529785156, 49.575660705566406, 51.01346206665039, 52.451263427734375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 6.0, 7.0, 13.0, 25.0, 27.0, 31.0, 65.0, 85.0, 143.0, 231.0, 351.0, 657.0, 1128.0, 2067.0, 4332.0, 9005.0, 21266.0, 53863.0, 153487.0, 401323.0, 256598.0, 85831.0, 32205.0, 13378.0, 5930.0, 2944.0, 1525.0, 801.0, 453.0, 272.0, 166.0, 91.0, 78.0, 50.0, 35.0, 26.0, 18.0, 8.0, 8.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.59375, -8.3046875, -8.015625, -7.7265625, -7.4375, -7.1484375, -6.859375, -6.5703125, -6.28125, -5.9921875, -5.703125, -5.4140625, -5.125, -4.8359375, -4.546875, -4.2578125, -3.96875, -3.6796875, -3.390625, -3.1015625, -2.8125, -2.5234375, -2.234375, -1.9453125, -1.65625, -1.3671875, -1.078125, -0.7890625, -0.5, -0.2109375, 0.078125, 0.3671875, 0.65625, 0.9453125, 1.234375, 1.5234375, 1.8125, 2.1015625, 2.390625, 2.6796875, 2.96875, 3.2578125, 3.546875, 3.8359375, 4.125, 4.4140625, 4.703125, 4.9921875, 5.28125, 5.5703125, 5.859375, 6.1484375, 6.4375, 6.7265625, 7.015625, 7.3046875, 7.59375, 7.8828125, 8.171875, 8.4609375, 8.75, 9.0390625, 9.328125, 9.6171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 11.0, 14.0, 18.0, 25.0, 31.0, 45.0, 49.0, 63.0, 62.0, 68.0, 93.0, 70.0, 70.0, 67.0, 68.0, 50.0, 32.0, 42.0, 20.0, 20.0, 16.0, 14.0, 8.0, 9.0, 3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.359375, -8.12060546875, -7.8818359375, -7.64306640625, -7.404296875, -7.16552734375, -6.9267578125, -6.68798828125, -6.44921875, -6.21044921875, -5.9716796875, -5.73291015625, -5.494140625, -5.25537109375, -5.0166015625, -4.77783203125, -4.5390625, -4.30029296875, -4.0615234375, -3.82275390625, -3.583984375, -3.34521484375, -3.1064453125, -2.86767578125, -2.62890625, -2.39013671875, -2.1513671875, -1.91259765625, -1.673828125, -1.43505859375, -1.1962890625, -0.95751953125, -0.71875, -0.47998046875, -0.2412109375, -0.00244140625, 0.236328125, 0.47509765625, 0.7138671875, 0.95263671875, 1.19140625, 1.43017578125, 1.6689453125, 1.90771484375, 2.146484375, 2.38525390625, 2.6240234375, 2.86279296875, 3.1015625, 3.34033203125, 3.5791015625, 3.81787109375, 4.056640625, 4.29541015625, 4.5341796875, 4.77294921875, 5.01171875, 5.25048828125, 5.4892578125, 5.72802734375, 5.966796875, 6.20556640625, 6.4443359375, 6.68310546875, 6.921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 12.0, 13.0, 39.0, 40.0, 72.0, 123.0, 174.0, 394.0, 817.0, 2146.0, 8194.0, 60555.0, 702231.0, 244137.0, 22679.0, 4248.0, 1364.0, 594.0, 290.0, 163.0, 89.0, 59.0, 32.0, 28.0, 20.0, 12.0, 7.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-27.328125, -26.64111328125, -25.9541015625, -25.26708984375, -24.580078125, -23.89306640625, -23.2060546875, -22.51904296875, -21.83203125, -21.14501953125, -20.4580078125, -19.77099609375, -19.083984375, -18.39697265625, -17.7099609375, -17.02294921875, -16.3359375, -15.64892578125, -14.9619140625, -14.27490234375, -13.587890625, -12.90087890625, -12.2138671875, -11.52685546875, -10.83984375, -10.15283203125, -9.4658203125, -8.77880859375, -8.091796875, -7.40478515625, -6.7177734375, -6.03076171875, -5.34375, -4.65673828125, -3.9697265625, -3.28271484375, -2.595703125, -1.90869140625, -1.2216796875, -0.53466796875, 0.15234375, 0.83935546875, 1.5263671875, 2.21337890625, 2.900390625, 3.58740234375, 4.2744140625, 4.96142578125, 5.6484375, 6.33544921875, 7.0224609375, 7.70947265625, 8.396484375, 9.08349609375, 9.7705078125, 10.45751953125, 11.14453125, 11.83154296875, 12.5185546875, 13.20556640625, 13.892578125, 14.57958984375, 15.2666015625, 15.95361328125, 16.640625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 17.0, 12.0, 33.0, 34.0, 47.0, 50.0, 58.0, 69.0, 67.0, 101.0, 69.0, 91.0, 67.0, 63.0, 46.0, 47.0, 39.0, 35.0, 16.0, 15.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.328125, -26.276123046875, -25.22412109375, -24.172119140625, -23.1201171875, -22.068115234375, -21.01611328125, -19.964111328125, -18.912109375, -17.860107421875, -16.80810546875, -15.756103515625, -14.7041015625, -13.652099609375, -12.60009765625, -11.548095703125, -10.49609375, -9.444091796875, -8.39208984375, -7.340087890625, -6.2880859375, -5.236083984375, -4.18408203125, -3.132080078125, -2.080078125, -1.028076171875, 0.02392578125, 1.075927734375, 2.1279296875, 3.179931640625, 4.23193359375, 5.283935546875, 6.3359375, 7.387939453125, 8.43994140625, 9.491943359375, 10.5439453125, 11.595947265625, 12.64794921875, 13.699951171875, 14.751953125, 15.803955078125, 16.85595703125, 17.907958984375, 18.9599609375, 20.011962890625, 21.06396484375, 22.115966796875, 23.16796875, 24.219970703125, 25.27197265625, 26.323974609375, 27.3759765625, 28.427978515625, 29.47998046875, 30.531982421875, 31.583984375, 32.635986328125, 33.68798828125, 34.739990234375, 35.7919921875, 36.843994140625, 37.89599609375, 38.947998046875, 40.0]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 5.0, 12.0, 7.0, 10.0, 11.0, 39.0, 46.0, 116.0, 339.0, 1459.0, 15712.0, 1008025.0, 20564.0, 1544.0, 371.0, 123.0, 66.0, 29.0, 19.0, 19.0, 14.0, 5.0, 6.0, 5.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.890625, -21.23779296875, -20.5849609375, -19.93212890625, -19.279296875, -18.62646484375, -17.9736328125, -17.32080078125, -16.66796875, -16.01513671875, -15.3623046875, -14.70947265625, -14.056640625, -13.40380859375, -12.7509765625, -12.09814453125, -11.4453125, -10.79248046875, -10.1396484375, -9.48681640625, -8.833984375, -8.18115234375, -7.5283203125, -6.87548828125, -6.22265625, -5.56982421875, -4.9169921875, -4.26416015625, -3.611328125, -2.95849609375, -2.3056640625, -1.65283203125, -1.0, -0.34716796875, 0.3056640625, 0.95849609375, 1.611328125, 2.26416015625, 2.9169921875, 3.56982421875, 4.22265625, 4.87548828125, 5.5283203125, 6.18115234375, 6.833984375, 7.48681640625, 8.1396484375, 8.79248046875, 9.4453125, 10.09814453125, 10.7509765625, 11.40380859375, 12.056640625, 12.70947265625, 13.3623046875, 14.01513671875, 14.66796875, 15.32080078125, 15.9736328125, 16.62646484375, 17.279296875, 17.93212890625, 18.5849609375, 19.23779296875, 19.890625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 12.0, 4.0, 14.0, 20.0, 23.0, 53.0, 45.0, 89.0, 158.0, 195.0, 130.0, 92.0, 59.0, 39.0, 17.0, 17.0, 18.0, 6.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012941360473632812, -0.0012467950582504272, -0.0011994540691375732, -0.0011521130800247192, -0.0011047720909118652, -0.0010574311017990112, -0.0010100901126861572, -0.0009627491235733032, -0.0009154081344604492, -0.0008680671453475952, -0.0008207261562347412, -0.0007733851671218872, -0.0007260441780090332, -0.0006787031888961792, -0.0006313621997833252, -0.0005840212106704712, -0.0005366802215576172, -0.0004893392324447632, -0.0004419982433319092, -0.0003946572542190552, -0.00034731626510620117, -0.00029997527599334717, -0.00025263428688049316, -0.00020529329776763916, -0.00015795230865478516, -0.00011061131954193115, -6.327033042907715e-05, -1.5929341316223145e-05, 3.141164779663086e-05, 7.875263690948486e-05, 0.00012609362602233887, 0.00017343461513519287, 0.00022077560424804688, 0.0002681165933609009, 0.0003154575824737549, 0.0003627985715866089, 0.0004101395606994629, 0.0004574805498123169, 0.0005048215389251709, 0.0005521625280380249, 0.0005995035171508789, 0.0006468445062637329, 0.0006941854953765869, 0.0007415264844894409, 0.0007888674736022949, 0.0008362084627151489, 0.0008835494518280029, 0.0009308904409408569, 0.000978231430053711, 0.001025572419166565, 0.001072913408279419, 0.001120254397392273, 0.001167595386505127, 0.001214936375617981, 0.001262277364730835, 0.001309618353843689, 0.001356959342956543, 0.001404300332069397, 0.001451641321182251, 0.001498982310295105, 0.001546323299407959, 0.001593664288520813, 0.001641005277633667, 0.001688346266746521, 0.001735687255859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 10.0, 6.0, 16.0, 21.0, 25.0, 36.0, 59.0, 97.0, 185.0, 350.0, 823.0, 2490.0, 11586.0, 161371.0, 822129.0, 40896.0, 5665.0, 1622.0, 558.0, 258.0, 130.0, 78.0, 54.0, 30.0, 19.0, 14.0, 12.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-13.046875, -12.75225830078125, -12.4576416015625, -12.16302490234375, -11.868408203125, -11.57379150390625, -11.2791748046875, -10.98455810546875, -10.68994140625, -10.39532470703125, -10.1007080078125, -9.80609130859375, -9.511474609375, -9.21685791015625, -8.9222412109375, -8.62762451171875, -8.3330078125, -8.03839111328125, -7.7437744140625, -7.44915771484375, -7.154541015625, -6.85992431640625, -6.5653076171875, -6.27069091796875, -5.97607421875, -5.68145751953125, -5.3868408203125, -5.09222412109375, -4.797607421875, -4.50299072265625, -4.2083740234375, -3.91375732421875, -3.619140625, -3.32452392578125, -3.0299072265625, -2.73529052734375, -2.440673828125, -2.14605712890625, -1.8514404296875, -1.55682373046875, -1.26220703125, -0.96759033203125, -0.6729736328125, -0.37835693359375, -0.083740234375, 0.21087646484375, 0.5054931640625, 0.80010986328125, 1.0947265625, 1.38934326171875, 1.6839599609375, 1.97857666015625, 2.273193359375, 2.56781005859375, 2.8624267578125, 3.15704345703125, 3.45166015625, 3.74627685546875, 4.0408935546875, 4.33551025390625, 4.630126953125, 4.92474365234375, 5.2193603515625, 5.51397705078125, 5.80859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 2.0, 8.0, 6.0, 9.0, 16.0, 20.0, 35.0, 52.0, 80.0, 106.0, 148.0, 136.0, 111.0, 103.0, 68.0, 25.0, 26.0, 21.0, 9.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.146728515625, -5.87939453125, -5.612060546875, -5.3447265625, -5.077392578125, -4.81005859375, -4.542724609375, -4.275390625, -4.008056640625, -3.74072265625, -3.473388671875, -3.2060546875, -2.938720703125, -2.67138671875, -2.404052734375, -2.13671875, -1.869384765625, -1.60205078125, -1.334716796875, -1.0673828125, -0.800048828125, -0.53271484375, -0.265380859375, 0.001953125, 0.269287109375, 0.53662109375, 0.803955078125, 1.0712890625, 1.338623046875, 1.60595703125, 1.873291015625, 2.140625, 2.407958984375, 2.67529296875, 2.942626953125, 3.2099609375, 3.477294921875, 3.74462890625, 4.011962890625, 4.279296875, 4.546630859375, 4.81396484375, 5.081298828125, 5.3486328125, 5.615966796875, 5.88330078125, 6.150634765625, 6.41796875, 6.685302734375, 6.95263671875, 7.219970703125, 7.4873046875, 7.754638671875, 8.02197265625, 8.289306640625, 8.556640625, 8.823974609375, 9.09130859375, 9.358642578125, 9.6259765625, 9.893310546875, 10.16064453125, 10.427978515625, 10.6953125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 9.0, 34.0, 118.0, 343.0, 340.0, 91.0, 40.0, 8.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.81680297851562, -132.0328369140625, -124.2488784790039, -116.46491241455078, -108.68095397949219, -100.89698791503906, -93.11302185058594, -85.32906341552734, -77.54510498046875, -69.76113891601562, -61.97718048095703, -54.193214416503906, -46.40925598144531, -38.62528991699219, -30.841327667236328, -23.05736541748047, -15.273399353027344, -7.489436626434326, 0.2945261001586914, 8.078489303588867, 15.862451553344727, 23.64641571044922, 31.430377960205078, 39.21434020996094, 46.9983024597168, 54.782264709472656, 62.566226959228516, 70.35018920898438, 78.1341552734375, 85.91812133789062, 93.70207977294922, 101.48603820800781, 109.27000427246094, 117.05397033691406, 124.83792877197266, 132.62188720703125, 140.40585327148438, 148.1898193359375, 155.97378540039062, 163.75775146484375, 171.5417022705078, 179.32566833496094, 187.10963439941406, 194.89358520507812, 202.67755126953125, 210.46151733398438, 218.2454833984375, 226.02944946289062, 233.81341552734375, 241.59738159179688, 249.38134765625, 257.1653137207031, 264.94927978515625, 272.73321533203125, 280.5171813964844, 288.3011474609375, 296.0851135253906, 303.86907958984375, 311.6530456542969, 319.43701171875, 327.2209777832031, 335.00494384765625, 342.78887939453125, 350.5728454589844, 358.3568115234375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 8.0, 5.0, 13.0, 7.0, 9.0, 7.0, 17.0, 28.0, 32.0, 28.0, 26.0, 39.0, 41.0, 36.0, 51.0, 58.0, 66.0, 49.0, 57.0, 54.0, 39.0, 42.0, 31.0, 38.0, 31.0, 28.0, 26.0, 22.0, 22.0, 18.0, 10.0, 10.0, 8.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.03341674804688, -74.40672302246094, -71.780029296875, -69.15333557128906, -66.52664184570312, -63.89995193481445, -61.273258209228516, -58.646568298339844, -56.019874572753906, -53.39318084716797, -50.76648712158203, -48.139793395996094, -45.51310348510742, -42.886409759521484, -40.25971603393555, -37.633026123046875, -35.00632858276367, -32.379634857177734, -29.75294303894043, -27.126249313354492, -24.499557495117188, -21.87286376953125, -19.246170043945312, -16.619478225708008, -13.99278450012207, -11.36609172821045, -8.739398956298828, -6.112705230712891, -3.4860124588012695, -0.8593196868896484, 1.767374038696289, 4.394065856933594, 7.020759582519531, 9.647452354431152, 12.274145126342773, 14.900838851928711, 17.527530670166016, 20.154224395751953, 22.78091812133789, 25.407609939575195, 28.034303665161133, 30.66099739074707, 33.287689208984375, 35.91438293457031, 38.54107666015625, 41.16777038574219, 43.794464111328125, 46.4211540222168, 49.047847747802734, 51.67454147338867, 54.30123519897461, 56.92792510986328, 59.55461883544922, 62.181312561035156, 64.8080062866211, 67.43470001220703, 70.06139373779297, 72.6880874633789, 75.31478118896484, 77.94147491455078, 80.56816864013672, 83.19485473632812, 85.82154846191406, 88.4482421875, 91.07493591308594]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 16.0, 20.0, 29.0, 70.0, 103.0, 200.0, 516.0, 1317.0, 4621.0, 21497.0, 216439.0, 3473926.0, 435914.0, 30835.0, 5957.0, 1653.0, 602.0, 252.0, 132.0, 66.0, 37.0, 19.0, 12.0, 6.0, 10.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0390625, -11.6697998046875, -11.300537109375, -10.9312744140625, -10.56201171875, -10.1927490234375, -9.823486328125, -9.4542236328125, -9.0849609375, -8.7156982421875, -8.346435546875, -7.9771728515625, -7.60791015625, -7.2386474609375, -6.869384765625, -6.5001220703125, -6.130859375, -5.7615966796875, -5.392333984375, -5.0230712890625, -4.65380859375, -4.2845458984375, -3.915283203125, -3.5460205078125, -3.1767578125, -2.8074951171875, -2.438232421875, -2.0689697265625, -1.69970703125, -1.3304443359375, -0.961181640625, -0.5919189453125, -0.22265625, 0.1466064453125, 0.515869140625, 0.8851318359375, 1.25439453125, 1.6236572265625, 1.992919921875, 2.3621826171875, 2.7314453125, 3.1007080078125, 3.469970703125, 3.8392333984375, 4.20849609375, 4.5777587890625, 4.947021484375, 5.3162841796875, 5.685546875, 6.0548095703125, 6.424072265625, 6.7933349609375, 7.16259765625, 7.5318603515625, 7.901123046875, 8.2703857421875, 8.6396484375, 9.0089111328125, 9.378173828125, 9.7474365234375, 10.11669921875, 10.4859619140625, 10.855224609375, 11.2244873046875, 11.59375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 9.0, 9.0, 16.0, 23.0, 41.0, 43.0, 84.0, 105.0, 118.0, 140.0, 111.0, 87.0, 79.0, 51.0, 32.0, 26.0, 12.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.0452880859375, -7.715576171875, -7.3858642578125, -7.05615234375, -6.7264404296875, -6.396728515625, -6.0670166015625, -5.7373046875, -5.4075927734375, -5.077880859375, -4.7481689453125, -4.41845703125, -4.0887451171875, -3.759033203125, -3.4293212890625, -3.099609375, -2.7698974609375, -2.440185546875, -2.1104736328125, -1.78076171875, -1.4510498046875, -1.121337890625, -0.7916259765625, -0.4619140625, -0.1322021484375, 0.197509765625, 0.5272216796875, 0.85693359375, 1.1866455078125, 1.516357421875, 1.8460693359375, 2.17578125, 2.5054931640625, 2.835205078125, 3.1649169921875, 3.49462890625, 3.8243408203125, 4.154052734375, 4.4837646484375, 4.8134765625, 5.1431884765625, 5.472900390625, 5.8026123046875, 6.13232421875, 6.4620361328125, 6.791748046875, 7.1214599609375, 7.451171875, 7.7808837890625, 8.110595703125, 8.4403076171875, 8.77001953125, 9.0997314453125, 9.429443359375, 9.7591552734375, 10.0888671875, 10.4185791015625, 10.748291015625, 11.0780029296875, 11.40771484375, 11.7374267578125, 12.067138671875, 12.3968505859375, 12.7265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 6.0, 11.0, 8.0, 9.0, 8.0, 13.0, 21.0, 36.0, 58.0, 71.0, 131.0, 185.0, 335.0, 640.0, 1154.0, 2619.0, 6216.0, 18582.0, 70115.0, 467609.0, 3099414.0, 435634.0, 65681.0, 16474.0, 5323.0, 1992.0, 880.0, 416.0, 255.0, 141.0, 80.0, 76.0, 32.0, 25.0, 7.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8828125, -8.6175537109375, -8.352294921875, -8.0870361328125, -7.82177734375, -7.5565185546875, -7.291259765625, -7.0260009765625, -6.7607421875, -6.4954833984375, -6.230224609375, -5.9649658203125, -5.69970703125, -5.4344482421875, -5.169189453125, -4.9039306640625, -4.638671875, -4.3734130859375, -4.108154296875, -3.8428955078125, -3.57763671875, -3.3123779296875, -3.047119140625, -2.7818603515625, -2.5166015625, -2.2513427734375, -1.986083984375, -1.7208251953125, -1.45556640625, -1.1903076171875, -0.925048828125, -0.6597900390625, -0.39453125, -0.1292724609375, 0.135986328125, 0.4012451171875, 0.66650390625, 0.9317626953125, 1.197021484375, 1.4622802734375, 1.7275390625, 1.9927978515625, 2.258056640625, 2.5233154296875, 2.78857421875, 3.0538330078125, 3.319091796875, 3.5843505859375, 3.849609375, 4.1148681640625, 4.380126953125, 4.6453857421875, 4.91064453125, 5.1759033203125, 5.441162109375, 5.7064208984375, 5.9716796875, 6.2369384765625, 6.502197265625, 6.7674560546875, 7.03271484375, 7.2979736328125, 7.563232421875, 7.8284912109375, 8.09375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 6.0, 7.0, 6.0, 16.0, 22.0, 27.0, 23.0, 37.0, 85.0, 139.0, 251.0, 435.0, 799.0, 914.0, 570.0, 293.0, 162.0, 109.0, 54.0, 40.0, 24.0, 18.0, 13.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.813232421875, -12.41552734375, -12.017822265625, -11.6201171875, -11.222412109375, -10.82470703125, -10.427001953125, -10.029296875, -9.631591796875, -9.23388671875, -8.836181640625, -8.4384765625, -8.040771484375, -7.64306640625, -7.245361328125, -6.84765625, -6.449951171875, -6.05224609375, -5.654541015625, -5.2568359375, -4.859130859375, -4.46142578125, -4.063720703125, -3.666015625, -3.268310546875, -2.87060546875, -2.472900390625, -2.0751953125, -1.677490234375, -1.27978515625, -0.882080078125, -0.484375, -0.086669921875, 0.31103515625, 0.708740234375, 1.1064453125, 1.504150390625, 1.90185546875, 2.299560546875, 2.697265625, 3.094970703125, 3.49267578125, 3.890380859375, 4.2880859375, 4.685791015625, 5.08349609375, 5.481201171875, 5.87890625, 6.276611328125, 6.67431640625, 7.072021484375, 7.4697265625, 7.867431640625, 8.26513671875, 8.662841796875, 9.060546875, 9.458251953125, 9.85595703125, 10.253662109375, 10.6513671875, 11.049072265625, 11.44677734375, 11.844482421875, 12.2421875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 4.0, 6.0, 12.0, 15.0, 37.0, 73.0, 125.0, 185.0, 198.0, 141.0, 100.0, 55.0, 17.0, 6.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.53681182861328, -107.11796569824219, -103.69911193847656, -100.28025817871094, -96.86141204833984, -93.44256591796875, -90.02371215820312, -86.6048583984375, -83.1860122680664, -79.76716613769531, -76.34831237792969, -72.92945861816406, -69.51061248779297, -66.09176635742188, -62.67291259765625, -59.25406265258789, -55.83521270751953, -52.41636276245117, -48.99751281738281, -45.57866287231445, -42.159812927246094, -38.740962982177734, -35.322113037109375, -31.903263092041016, -28.484413146972656, -25.065563201904297, -21.646713256835938, -18.227863311767578, -14.809013366699219, -11.39016342163086, -7.9713134765625, -4.552463531494141, -1.13360595703125, 2.2852439880371094, 5.704093933105469, 9.122943878173828, 12.541793823242188, 15.960643768310547, 19.379493713378906, 22.798343658447266, 26.217193603515625, 29.636043548583984, 33.054893493652344, 36.4737434387207, 39.89259338378906, 43.31144332885742, 46.73029327392578, 50.14914321899414, 53.5679931640625, 56.98684310913086, 60.40569305419922, 63.82454299926758, 67.24339294433594, 70.66224670410156, 74.08109283447266, 77.49993896484375, 80.91879272460938, 84.337646484375, 87.7564926147461, 91.17533874511719, 94.59419250488281, 98.01304626464844, 101.43189239501953, 104.85073852539062, 108.26959228515625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 16.0, 10.0, 27.0, 27.0, 25.0, 28.0, 42.0, 64.0, 76.0, 77.0, 84.0, 71.0, 75.0, 74.0, 67.0, 50.0, 35.0, 38.0, 30.0, 29.0, 24.0, 11.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-93.062255859375, -90.72755432128906, -88.39285278320312, -86.05815124511719, -83.72344970703125, -81.38874816894531, -79.05404663085938, -76.71934509277344, -74.3846435546875, -72.04994201660156, -69.71524047851562, -67.38053894042969, -65.04583740234375, -62.71113586425781, -60.376434326171875, -58.04173278808594, -55.70703125, -53.37232971191406, -51.037628173828125, -48.70292663574219, -46.36822509765625, -44.03352355957031, -41.698822021484375, -39.36412048339844, -37.0294189453125, -34.69471740722656, -32.360015869140625, -30.025314331054688, -27.69061279296875, -25.355911254882812, -23.021209716796875, -20.686508178710938, -18.351806640625, -16.017105102539062, -13.682403564453125, -11.347702026367188, -9.01300048828125, -6.6782989501953125, -4.343597412109375, -2.0088958740234375, 0.3258056640625, 2.6605072021484375, 4.995208740234375, 7.3299102783203125, 9.66461181640625, 11.999313354492188, 14.334014892578125, 16.668716430664062, 19.00341796875, 21.338119506835938, 23.672821044921875, 26.007522583007812, 28.34222412109375, 30.676925659179688, 33.011627197265625, 35.34632873535156, 37.6810302734375, 40.01573181152344, 42.350433349609375, 44.68513488769531, 47.01983642578125, 49.35453796386719, 51.689239501953125, 54.02394104003906, 56.358642578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 8.0, 26.0, 40.0, 65.0, 135.0, 234.0, 491.0, 1157.0, 2823.0, 9153.0, 33201.0, 141238.0, 477824.0, 288216.0, 68562.0, 16992.0, 5059.0, 1850.0, 773.0, 337.0, 168.0, 91.0, 43.0, 21.0, 18.0, 11.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.765625, -14.37451171875, -13.9833984375, -13.59228515625, -13.201171875, -12.81005859375, -12.4189453125, -12.02783203125, -11.63671875, -11.24560546875, -10.8544921875, -10.46337890625, -10.072265625, -9.68115234375, -9.2900390625, -8.89892578125, -8.5078125, -8.11669921875, -7.7255859375, -7.33447265625, -6.943359375, -6.55224609375, -6.1611328125, -5.77001953125, -5.37890625, -4.98779296875, -4.5966796875, -4.20556640625, -3.814453125, -3.42333984375, -3.0322265625, -2.64111328125, -2.25, -1.85888671875, -1.4677734375, -1.07666015625, -0.685546875, -0.29443359375, 0.0966796875, 0.48779296875, 0.87890625, 1.27001953125, 1.6611328125, 2.05224609375, 2.443359375, 2.83447265625, 3.2255859375, 3.61669921875, 4.0078125, 4.39892578125, 4.7900390625, 5.18115234375, 5.572265625, 5.96337890625, 6.3544921875, 6.74560546875, 7.13671875, 7.52783203125, 7.9189453125, 8.31005859375, 8.701171875, 9.09228515625, 9.4833984375, 9.87451171875, 10.265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 3.0, 8.0, 10.0, 17.0, 14.0, 29.0, 29.0, 47.0, 48.0, 65.0, 75.0, 84.0, 85.0, 91.0, 71.0, 62.0, 60.0, 48.0, 43.0, 28.0, 24.0, 20.0, 12.0, 14.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.8828125, -8.65374755859375, -8.4246826171875, -8.19561767578125, -7.966552734375, -7.73748779296875, -7.5084228515625, -7.27935791015625, -7.05029296875, -6.82122802734375, -6.5921630859375, -6.36309814453125, -6.134033203125, -5.90496826171875, -5.6759033203125, -5.44683837890625, -5.2177734375, -4.98870849609375, -4.7596435546875, -4.53057861328125, -4.301513671875, -4.07244873046875, -3.8433837890625, -3.61431884765625, -3.38525390625, -3.15618896484375, -2.9271240234375, -2.69805908203125, -2.468994140625, -2.23992919921875, -2.0108642578125, -1.78179931640625, -1.552734375, -1.32366943359375, -1.0946044921875, -0.86553955078125, -0.636474609375, -0.40740966796875, -0.1783447265625, 0.05072021484375, 0.27978515625, 0.50885009765625, 0.7379150390625, 0.96697998046875, 1.196044921875, 1.42510986328125, 1.6541748046875, 1.88323974609375, 2.1123046875, 2.34136962890625, 2.5704345703125, 2.79949951171875, 3.028564453125, 3.25762939453125, 3.4866943359375, 3.71575927734375, 3.94482421875, 4.17388916015625, 4.4029541015625, 4.63201904296875, 4.861083984375, 5.09014892578125, 5.3192138671875, 5.54827880859375, 5.77734375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 10.0, 13.0, 23.0, 29.0, 60.0, 120.0, 205.0, 319.0, 593.0, 1181.0, 2845.0, 13326.0, 248385.0, 743429.0, 30584.0, 4262.0, 1471.0, 761.0, 393.0, 200.0, 134.0, 77.0, 49.0, 19.0, 24.0, 14.0, 10.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.3876953125, -25.541015625, -24.6943359375, -23.84765625, -23.0009765625, -22.154296875, -21.3076171875, -20.4609375, -19.6142578125, -18.767578125, -17.9208984375, -17.07421875, -16.2275390625, -15.380859375, -14.5341796875, -13.6875, -12.8408203125, -11.994140625, -11.1474609375, -10.30078125, -9.4541015625, -8.607421875, -7.7607421875, -6.9140625, -6.0673828125, -5.220703125, -4.3740234375, -3.52734375, -2.6806640625, -1.833984375, -0.9873046875, -0.140625, 0.7060546875, 1.552734375, 2.3994140625, 3.24609375, 4.0927734375, 4.939453125, 5.7861328125, 6.6328125, 7.4794921875, 8.326171875, 9.1728515625, 10.01953125, 10.8662109375, 11.712890625, 12.5595703125, 13.40625, 14.2529296875, 15.099609375, 15.9462890625, 16.79296875, 17.6396484375, 18.486328125, 19.3330078125, 20.1796875, 21.0263671875, 21.873046875, 22.7197265625, 23.56640625, 24.4130859375, 25.259765625, 26.1064453125, 26.953125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 4.0, 13.0, 16.0, 15.0, 11.0, 16.0, 29.0, 33.0, 30.0, 45.0, 44.0, 45.0, 47.0, 48.0, 48.0, 61.0, 44.0, 52.0, 49.0, 40.0, 34.0, 48.0, 40.0, 29.0, 24.0, 33.0, 12.0, 15.0, 13.0, 12.0, 12.0, 11.0, 7.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.125, -17.47998046875, -16.8349609375, -16.18994140625, -15.544921875, -14.89990234375, -14.2548828125, -13.60986328125, -12.96484375, -12.31982421875, -11.6748046875, -11.02978515625, -10.384765625, -9.73974609375, -9.0947265625, -8.44970703125, -7.8046875, -7.15966796875, -6.5146484375, -5.86962890625, -5.224609375, -4.57958984375, -3.9345703125, -3.28955078125, -2.64453125, -1.99951171875, -1.3544921875, -0.70947265625, -0.064453125, 0.58056640625, 1.2255859375, 1.87060546875, 2.515625, 3.16064453125, 3.8056640625, 4.45068359375, 5.095703125, 5.74072265625, 6.3857421875, 7.03076171875, 7.67578125, 8.32080078125, 8.9658203125, 9.61083984375, 10.255859375, 10.90087890625, 11.5458984375, 12.19091796875, 12.8359375, 13.48095703125, 14.1259765625, 14.77099609375, 15.416015625, 16.06103515625, 16.7060546875, 17.35107421875, 17.99609375, 18.64111328125, 19.2861328125, 19.93115234375, 20.576171875, 21.22119140625, 21.8662109375, 22.51123046875, 23.15625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 7.0, 8.0, 13.0, 13.0, 17.0, 25.0, 33.0, 55.0, 84.0, 113.0, 202.0, 391.0, 937.0, 2947.0, 16986.0, 232456.0, 746172.0, 40293.0, 5186.0, 1362.0, 545.0, 270.0, 135.0, 73.0, 72.0, 43.0, 28.0, 23.0, 20.0, 5.0, 4.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.71929931640625, -5.5089111328125, -5.29852294921875, -5.088134765625, -4.87774658203125, -4.6673583984375, -4.45697021484375, -4.24658203125, -4.03619384765625, -3.8258056640625, -3.61541748046875, -3.405029296875, -3.19464111328125, -2.9842529296875, -2.77386474609375, -2.5634765625, -2.35308837890625, -2.1427001953125, -1.93231201171875, -1.721923828125, -1.51153564453125, -1.3011474609375, -1.09075927734375, -0.88037109375, -0.66998291015625, -0.4595947265625, -0.24920654296875, -0.038818359375, 0.17156982421875, 0.3819580078125, 0.59234619140625, 0.802734375, 1.01312255859375, 1.2235107421875, 1.43389892578125, 1.644287109375, 1.85467529296875, 2.0650634765625, 2.27545166015625, 2.48583984375, 2.69622802734375, 2.9066162109375, 3.11700439453125, 3.327392578125, 3.53778076171875, 3.7481689453125, 3.95855712890625, 4.1689453125, 4.37933349609375, 4.5897216796875, 4.80010986328125, 5.010498046875, 5.22088623046875, 5.4312744140625, 5.64166259765625, 5.85205078125, 6.06243896484375, 6.2728271484375, 6.48321533203125, 6.693603515625, 6.90399169921875, 7.1143798828125, 7.32476806640625, 7.53515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 1.0, 7.0, 1.0, 15.0, 8.0, 9.0, 8.0, 20.0, 17.0, 20.0, 24.0, 28.0, 35.0, 40.0, 51.0, 77.0, 84.0, 125.0, 100.0, 47.0, 39.0, 30.0, 27.0, 25.0, 17.0, 17.0, 17.0, 23.0, 20.0, 12.0, 10.0, 7.0, 11.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008015632629394531, -0.0007758289575576782, -0.0007500946521759033, -0.0007243603467941284, -0.0006986260414123535, -0.0006728917360305786, -0.0006471574306488037, -0.0006214231252670288, -0.0005956888198852539, -0.000569954514503479, -0.0005442202091217041, -0.0005184859037399292, -0.0004927515983581543, -0.0004670172929763794, -0.0004412829875946045, -0.0004155486822128296, -0.0003898143768310547, -0.0003640800714492798, -0.0003383457660675049, -0.00031261146068573, -0.0002868771553039551, -0.0002611428499221802, -0.00023540854454040527, -0.00020967423915863037, -0.00018393993377685547, -0.00015820562839508057, -0.00013247132301330566, -0.00010673701763153076, -8.100271224975586e-05, -5.526840686798096e-05, -2.9534101486206055e-05, -3.7997961044311523e-06, 2.193450927734375e-05, 4.766881465911865e-05, 7.340312004089355e-05, 9.913742542266846e-05, 0.00012487173080444336, 0.00015060603618621826, 0.00017634034156799316, 0.00020207464694976807, 0.00022780895233154297, 0.00025354325771331787, 0.0002792775630950928, 0.0003050118684768677, 0.0003307461738586426, 0.0003564804792404175, 0.0003822147846221924, 0.0004079490900039673, 0.0004336833953857422, 0.0004594177007675171, 0.000485152006149292, 0.0005108863115310669, 0.0005366206169128418, 0.0005623549222946167, 0.0005880892276763916, 0.0006138235330581665, 0.0006395578384399414, 0.0006652921438217163, 0.0006910264492034912, 0.0007167607545852661, 0.000742495059967041, 0.0007682293653488159, 0.0007939636707305908, 0.0008196979761123657, 0.0008454322814941406]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 10.0, 9.0, 12.0, 9.0, 9.0, 22.0, 28.0, 36.0, 51.0, 72.0, 118.0, 175.0, 267.0, 527.0, 996.0, 2036.0, 4944.0, 16418.0, 106801.0, 776743.0, 113232.0, 16740.0, 4965.0, 2048.0, 893.0, 538.0, 289.0, 182.0, 114.0, 70.0, 67.0, 30.0, 24.0, 22.0, 15.0, 16.0, 8.0, 7.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.84765625, -4.67144775390625, -4.4952392578125, -4.31903076171875, -4.142822265625, -3.96661376953125, -3.7904052734375, -3.61419677734375, -3.43798828125, -3.26177978515625, -3.0855712890625, -2.90936279296875, -2.733154296875, -2.55694580078125, -2.3807373046875, -2.20452880859375, -2.0283203125, -1.85211181640625, -1.6759033203125, -1.49969482421875, -1.323486328125, -1.14727783203125, -0.9710693359375, -0.79486083984375, -0.61865234375, -0.44244384765625, -0.2662353515625, -0.09002685546875, 0.086181640625, 0.26239013671875, 0.4385986328125, 0.61480712890625, 0.791015625, 0.96722412109375, 1.1434326171875, 1.31964111328125, 1.495849609375, 1.67205810546875, 1.8482666015625, 2.02447509765625, 2.20068359375, 2.37689208984375, 2.5531005859375, 2.72930908203125, 2.905517578125, 3.08172607421875, 3.2579345703125, 3.43414306640625, 3.6103515625, 3.78656005859375, 3.9627685546875, 4.13897705078125, 4.315185546875, 4.49139404296875, 4.6676025390625, 4.84381103515625, 5.02001953125, 5.19622802734375, 5.3724365234375, 5.54864501953125, 5.724853515625, 5.90106201171875, 6.0772705078125, 6.25347900390625, 6.4296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 2.0, 7.0, 8.0, 10.0, 11.0, 20.0, 14.0, 28.0, 61.0, 63.0, 60.0, 81.0, 90.0, 109.0, 99.0, 66.0, 63.0, 49.0, 32.0, 31.0, 24.0, 18.0, 9.0, 11.0, 9.0, 6.0, 3.0, 7.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.04461669921875, -3.8782958984375, -3.71197509765625, -3.545654296875, -3.37933349609375, -3.2130126953125, -3.04669189453125, -2.88037109375, -2.71405029296875, -2.5477294921875, -2.38140869140625, -2.215087890625, -2.04876708984375, -1.8824462890625, -1.71612548828125, -1.5498046875, -1.38348388671875, -1.2171630859375, -1.05084228515625, -0.884521484375, -0.71820068359375, -0.5518798828125, -0.38555908203125, -0.21923828125, -0.05291748046875, 0.1134033203125, 0.27972412109375, 0.446044921875, 0.61236572265625, 0.7786865234375, 0.94500732421875, 1.111328125, 1.27764892578125, 1.4439697265625, 1.61029052734375, 1.776611328125, 1.94293212890625, 2.1092529296875, 2.27557373046875, 2.44189453125, 2.60821533203125, 2.7745361328125, 2.94085693359375, 3.107177734375, 3.27349853515625, 3.4398193359375, 3.60614013671875, 3.7724609375, 3.93878173828125, 4.1051025390625, 4.27142333984375, 4.437744140625, 4.60406494140625, 4.7703857421875, 4.93670654296875, 5.10302734375, 5.26934814453125, 5.4356689453125, 5.60198974609375, 5.768310546875, 5.93463134765625, 6.1009521484375, 6.26727294921875, 6.43359375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 4.0, 2.0, 4.0, 4.0, 7.0, 7.0, 19.0, 32.0, 55.0, 106.0, 180.0, 275.0, 152.0, 83.0, 33.0, 17.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.31533813476562, -112.49703979492188, -108.67874908447266, -104.8604507446289, -101.04216003417969, -97.22386169433594, -93.40556335449219, -89.58726501464844, -85.76897430419922, -81.95067596435547, -78.13238525390625, -74.3140869140625, -70.49578857421875, -66.67749786376953, -62.85919952392578, -59.0409049987793, -55.22261047363281, -51.40431594848633, -47.586021423339844, -43.767723083496094, -39.94942855834961, -36.131134033203125, -32.312835693359375, -28.49454116821289, -24.676246643066406, -20.857952117919922, -17.039655685424805, -13.221360206604004, -9.403064727783203, -5.584770202636719, -1.7664737701416016, 2.0518226623535156, 5.8701171875, 9.6884126663208, 13.506708145141602, 17.32500457763672, 21.143299102783203, 24.961593627929688, 28.779890060424805, 32.59818649291992, 36.416481018066406, 40.23477554321289, 44.053070068359375, 47.871368408203125, 51.68966293334961, 55.507957458496094, 59.326255798339844, 63.14455032348633, 66.96284484863281, 70.78114318847656, 74.59943389892578, 78.41773223876953, 82.23602294921875, 86.0543212890625, 89.87261962890625, 93.69091796875, 97.50920867919922, 101.32750701904297, 105.14579772949219, 108.96409606933594, 112.78239440917969, 116.6006851196289, 120.41898345947266, 124.23727416992188, 128.05557250976562]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 6.0, 9.0, 9.0, 14.0, 5.0, 7.0, 11.0, 20.0, 23.0, 20.0, 17.0, 29.0, 39.0, 33.0, 41.0, 31.0, 42.0, 58.0, 68.0, 71.0, 54.0, 42.0, 42.0, 35.0, 32.0, 32.0, 29.0, 28.0, 23.0, 18.0, 24.0, 14.0, 19.0, 9.0, 8.0, 8.0, 2.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.34864807128906, -62.28942108154297, -60.23019790649414, -58.17097473144531, -56.11174774169922, -54.052520751953125, -51.9932975769043, -49.93407440185547, -47.874847412109375, -45.81562042236328, -43.75639724731445, -41.697174072265625, -39.63794708251953, -37.57872009277344, -35.51949691772461, -33.46027374267578, -31.401046752929688, -29.341821670532227, -27.282596588134766, -25.223371505737305, -23.164146423339844, -21.104921340942383, -19.045696258544922, -16.98647117614746, -14.92724609375, -12.868021011352539, -10.808795928955078, -8.749570846557617, -6.690345764160156, -4.631120681762695, -2.5718955993652344, -0.5126705169677734, 1.5465621948242188, 3.6057872772216797, 5.665012359619141, 7.724237442016602, 9.783462524414062, 11.842687606811523, 13.901912689208984, 15.961137771606445, 18.020362854003906, 20.079587936401367, 22.138813018798828, 24.19803810119629, 26.25726318359375, 28.31648826599121, 30.375713348388672, 32.4349365234375, 34.494163513183594, 36.55339050292969, 38.612613677978516, 40.671836853027344, 42.73106384277344, 44.79029083251953, 46.84951400756836, 48.90873718261719, 50.96796417236328, 53.027191162109375, 55.0864143371582, 57.14563751220703, 59.204864501953125, 61.26409149169922, 63.32331466674805, 65.38253784179688, 67.44176483154297]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 3.0, 7.0, 9.0, 7.0, 12.0, 12.0, 31.0, 35.0, 48.0, 78.0, 148.0, 220.0, 440.0, 936.0, 2252.0, 7142.0, 29642.0, 252470.0, 3044328.0, 774888.0, 62798.0, 12590.0, 3749.0, 1277.0, 555.0, 265.0, 155.0, 75.0, 47.0, 24.0, 19.0, 12.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1328125, -6.875244140625, -6.61767578125, -6.360107421875, -6.1025390625, -5.844970703125, -5.58740234375, -5.329833984375, -5.072265625, -4.814697265625, -4.55712890625, -4.299560546875, -4.0419921875, -3.784423828125, -3.52685546875, -3.269287109375, -3.01171875, -2.754150390625, -2.49658203125, -2.239013671875, -1.9814453125, -1.723876953125, -1.46630859375, -1.208740234375, -0.951171875, -0.693603515625, -0.43603515625, -0.178466796875, 0.0791015625, 0.336669921875, 0.59423828125, 0.851806640625, 1.109375, 1.366943359375, 1.62451171875, 1.882080078125, 2.1396484375, 2.397216796875, 2.65478515625, 2.912353515625, 3.169921875, 3.427490234375, 3.68505859375, 3.942626953125, 4.2001953125, 4.457763671875, 4.71533203125, 4.972900390625, 5.23046875, 5.488037109375, 5.74560546875, 6.003173828125, 6.2607421875, 6.518310546875, 6.77587890625, 7.033447265625, 7.291015625, 7.548583984375, 7.80615234375, 8.063720703125, 8.3212890625, 8.578857421875, 8.83642578125, 9.093994140625, 9.3515625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 8.0, 7.0, 11.0, 17.0, 28.0, 31.0, 40.0, 45.0, 57.0, 70.0, 98.0, 87.0, 91.0, 58.0, 84.0, 53.0, 62.0, 35.0, 39.0, 21.0, 10.0, 22.0, 9.0, 5.0, 8.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.2890625, -9.062255859375, -8.83544921875, -8.608642578125, -8.3818359375, -8.155029296875, -7.92822265625, -7.701416015625, -7.474609375, -7.247802734375, -7.02099609375, -6.794189453125, -6.5673828125, -6.340576171875, -6.11376953125, -5.886962890625, -5.66015625, -5.433349609375, -5.20654296875, -4.979736328125, -4.7529296875, -4.526123046875, -4.29931640625, -4.072509765625, -3.845703125, -3.618896484375, -3.39208984375, -3.165283203125, -2.9384765625, -2.711669921875, -2.48486328125, -2.258056640625, -2.03125, -1.804443359375, -1.57763671875, -1.350830078125, -1.1240234375, -0.897216796875, -0.67041015625, -0.443603515625, -0.216796875, 0.010009765625, 0.23681640625, 0.463623046875, 0.6904296875, 0.917236328125, 1.14404296875, 1.370849609375, 1.59765625, 1.824462890625, 2.05126953125, 2.278076171875, 2.5048828125, 2.731689453125, 2.95849609375, 3.185302734375, 3.412109375, 3.638916015625, 3.86572265625, 4.092529296875, 4.3193359375, 4.546142578125, 4.77294921875, 4.999755859375, 5.2265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 7.0, 10.0, 11.0, 25.0, 29.0, 43.0, 56.0, 99.0, 144.0, 214.0, 408.0, 650.0, 1236.0, 2487.0, 6358.0, 21365.0, 112987.0, 1964380.0, 1933901.0, 115477.0, 22825.0, 6607.0, 2481.0, 1089.0, 587.0, 319.0, 172.0, 122.0, 62.0, 39.0, 29.0, 24.0, 11.0, 13.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.8515625, -9.570068359375, -9.28857421875, -9.007080078125, -8.7255859375, -8.444091796875, -8.16259765625, -7.881103515625, -7.599609375, -7.318115234375, -7.03662109375, -6.755126953125, -6.4736328125, -6.192138671875, -5.91064453125, -5.629150390625, -5.34765625, -5.066162109375, -4.78466796875, -4.503173828125, -4.2216796875, -3.940185546875, -3.65869140625, -3.377197265625, -3.095703125, -2.814208984375, -2.53271484375, -2.251220703125, -1.9697265625, -1.688232421875, -1.40673828125, -1.125244140625, -0.84375, -0.562255859375, -0.28076171875, 0.000732421875, 0.2822265625, 0.563720703125, 0.84521484375, 1.126708984375, 1.408203125, 1.689697265625, 1.97119140625, 2.252685546875, 2.5341796875, 2.815673828125, 3.09716796875, 3.378662109375, 3.66015625, 3.941650390625, 4.22314453125, 4.504638671875, 4.7861328125, 5.067626953125, 5.34912109375, 5.630615234375, 5.912109375, 6.193603515625, 6.47509765625, 6.756591796875, 7.0380859375, 7.319580078125, 7.60107421875, 7.882568359375, 8.1640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 16.0, 20.0, 32.0, 49.0, 99.0, 198.0, 395.0, 870.0, 1126.0, 627.0, 280.0, 139.0, 75.0, 44.0, 31.0, 10.0, 14.0, 10.0, 6.0, 5.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.328125, -14.893310546875, -14.45849609375, -14.023681640625, -13.5888671875, -13.154052734375, -12.71923828125, -12.284423828125, -11.849609375, -11.414794921875, -10.97998046875, -10.545166015625, -10.1103515625, -9.675537109375, -9.24072265625, -8.805908203125, -8.37109375, -7.936279296875, -7.50146484375, -7.066650390625, -6.6318359375, -6.197021484375, -5.76220703125, -5.327392578125, -4.892578125, -4.457763671875, -4.02294921875, -3.588134765625, -3.1533203125, -2.718505859375, -2.28369140625, -1.848876953125, -1.4140625, -0.979248046875, -0.54443359375, -0.109619140625, 0.3251953125, 0.760009765625, 1.19482421875, 1.629638671875, 2.064453125, 2.499267578125, 2.93408203125, 3.368896484375, 3.8037109375, 4.238525390625, 4.67333984375, 5.108154296875, 5.54296875, 5.977783203125, 6.41259765625, 6.847412109375, 7.2822265625, 7.717041015625, 8.15185546875, 8.586669921875, 9.021484375, 9.456298828125, 9.89111328125, 10.325927734375, 10.7607421875, 11.195556640625, 11.63037109375, 12.065185546875, 12.5]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 13.0, 31.0, 120.0, 231.0, 271.0, 204.0, 79.0, 23.0, 5.0, 6.0, 3.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.34669494628906, -136.8162841796875, -132.285888671875, -127.75547790527344, -123.2250747680664, -118.69467163085938, -114.16426086425781, -109.63385772705078, -105.10345458984375, -100.57305145263672, -96.04264831542969, -91.51223754882812, -86.9818344116211, -82.45143127441406, -77.9210205078125, -73.39061737060547, -68.86021423339844, -64.3298110961914, -59.79940414428711, -55.26899719238281, -50.73859405517578, -46.20819091796875, -41.67778396606445, -37.147377014160156, -32.616973876953125, -28.08656883239746, -23.556163787841797, -19.025758743286133, -14.495353698730469, -9.964948654174805, -5.434543609619141, -0.9041385650634766, 3.6262664794921875, 8.156671524047852, 12.687076568603516, 17.21748161315918, 21.747886657714844, 26.278291702270508, 30.808696746826172, 35.33910369873047, 39.8695068359375, 44.39990997314453, 48.93031692504883, 53.460723876953125, 57.991127014160156, 62.52153015136719, 67.05194091796875, 71.58234405517578, 76.11274719238281, 80.64315032958984, 85.17355346679688, 89.70396423339844, 94.23436737060547, 98.7647705078125, 103.29518127441406, 107.8255844116211, 112.35598754882812, 116.88639068603516, 121.41679382324219, 125.94720458984375, 130.47760009765625, 135.0080108642578, 139.53842163085938, 144.06881713867188, 148.59922790527344]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 9.0, 8.0, 7.0, 16.0, 21.0, 19.0, 36.0, 32.0, 43.0, 47.0, 47.0, 43.0, 66.0, 80.0, 64.0, 72.0, 55.0, 62.0, 48.0, 52.0, 35.0, 37.0, 34.0, 25.0, 14.0, 7.0, 9.0, 9.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.39604187011719, -45.49321746826172, -43.59039306640625, -41.68756866455078, -39.78474044799805, -37.88191604614258, -35.97909164428711, -34.07626724243164, -32.17344284057617, -30.270618438720703, -28.3677921295166, -26.464967727661133, -24.562143325805664, -22.659317016601562, -20.756492614746094, -18.853668212890625, -16.950841903686523, -15.048016548156738, -13.14519214630127, -11.242366790771484, -9.339542388916016, -7.4367170333862305, -5.533891677856445, -3.6310672760009766, -1.7282419204711914, 0.1745830774307251, 2.0774080753326416, 3.9802331924438477, 5.883058071136475, 7.785882949829102, 9.688708305358887, 11.591532707214355, 13.49435806274414, 15.397183418273926, 17.30000877380371, 19.20283317565918, 21.10565757751465, 23.00848388671875, 24.91130828857422, 26.814132690429688, 28.716957092285156, 30.619781494140625, 32.522605895996094, 34.42543029785156, 36.3282585144043, 38.231082916259766, 40.133907318115234, 42.0367317199707, 43.93955993652344, 45.842384338378906, 47.745208740234375, 49.648033142089844, 51.55086135864258, 53.45368576049805, 55.356510162353516, 57.259334564208984, 59.16215896606445, 61.06498336791992, 62.96780776977539, 64.87063598632812, 66.7734603881836, 68.67628479003906, 70.57910919189453, 72.48193359375, 74.38475799560547]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 3.0, 11.0, 10.0, 10.0, 24.0, 19.0, 35.0, 47.0, 65.0, 138.0, 190.0, 279.0, 520.0, 954.0, 1923.0, 3976.0, 9454.0, 25327.0, 75094.0, 237587.0, 424624.0, 177238.0, 56895.0, 19743.0, 7586.0, 3292.0, 1547.0, 785.0, 457.0, 234.0, 184.0, 107.0, 66.0, 30.0, 22.0, 27.0, 16.0, 8.0, 9.0, 12.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.171875, -7.8936767578125, -7.615478515625, -7.3372802734375, -7.05908203125, -6.7808837890625, -6.502685546875, -6.2244873046875, -5.9462890625, -5.6680908203125, -5.389892578125, -5.1116943359375, -4.83349609375, -4.5552978515625, -4.277099609375, -3.9989013671875, -3.720703125, -3.4425048828125, -3.164306640625, -2.8861083984375, -2.60791015625, -2.3297119140625, -2.051513671875, -1.7733154296875, -1.4951171875, -1.2169189453125, -0.938720703125, -0.6605224609375, -0.38232421875, -0.1041259765625, 0.174072265625, 0.4522705078125, 0.73046875, 1.0086669921875, 1.286865234375, 1.5650634765625, 1.84326171875, 2.1214599609375, 2.399658203125, 2.6778564453125, 2.9560546875, 3.2342529296875, 3.512451171875, 3.7906494140625, 4.06884765625, 4.3470458984375, 4.625244140625, 4.9034423828125, 5.181640625, 5.4598388671875, 5.738037109375, 6.0162353515625, 6.29443359375, 6.5726318359375, 6.850830078125, 7.1290283203125, 7.4072265625, 7.6854248046875, 7.963623046875, 8.2418212890625, 8.52001953125, 8.7982177734375, 9.076416015625, 9.3546142578125, 9.6328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 10.0, 12.0, 17.0, 31.0, 38.0, 38.0, 53.0, 59.0, 77.0, 85.0, 84.0, 87.0, 83.0, 61.0, 65.0, 53.0, 42.0, 27.0, 15.0, 20.0, 9.0, 16.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.3671875, -9.1375732421875, -8.907958984375, -8.6783447265625, -8.44873046875, -8.2191162109375, -7.989501953125, -7.7598876953125, -7.5302734375, -7.3006591796875, -7.071044921875, -6.8414306640625, -6.61181640625, -6.3822021484375, -6.152587890625, -5.9229736328125, -5.693359375, -5.4637451171875, -5.234130859375, -5.0045166015625, -4.77490234375, -4.5452880859375, -4.315673828125, -4.0860595703125, -3.8564453125, -3.6268310546875, -3.397216796875, -3.1676025390625, -2.93798828125, -2.7083740234375, -2.478759765625, -2.2491455078125, -2.01953125, -1.7899169921875, -1.560302734375, -1.3306884765625, -1.10107421875, -0.8714599609375, -0.641845703125, -0.4122314453125, -0.1826171875, 0.0469970703125, 0.276611328125, 0.5062255859375, 0.73583984375, 0.9654541015625, 1.195068359375, 1.4246826171875, 1.654296875, 1.8839111328125, 2.113525390625, 2.3431396484375, 2.57275390625, 2.8023681640625, 3.031982421875, 3.2615966796875, 3.4912109375, 3.7208251953125, 3.950439453125, 4.1800537109375, 4.40966796875, 4.6392822265625, 4.868896484375, 5.0985107421875, 5.328125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 5.0, 5.0, 13.0, 15.0, 29.0, 29.0, 40.0, 47.0, 76.0, 129.0, 161.0, 263.0, 415.0, 698.0, 1317.0, 2866.0, 9712.0, 68037.0, 735191.0, 199517.0, 21121.0, 4696.0, 1728.0, 900.0, 567.0, 339.0, 211.0, 119.0, 102.0, 51.0, 40.0, 32.0, 20.0, 16.0, 8.0, 9.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.8125, -18.237548828125, -17.66259765625, -17.087646484375, -16.5126953125, -15.937744140625, -15.36279296875, -14.787841796875, -14.212890625, -13.637939453125, -13.06298828125, -12.488037109375, -11.9130859375, -11.338134765625, -10.76318359375, -10.188232421875, -9.61328125, -9.038330078125, -8.46337890625, -7.888427734375, -7.3134765625, -6.738525390625, -6.16357421875, -5.588623046875, -5.013671875, -4.438720703125, -3.86376953125, -3.288818359375, -2.7138671875, -2.138916015625, -1.56396484375, -0.989013671875, -0.4140625, 0.160888671875, 0.73583984375, 1.310791015625, 1.8857421875, 2.460693359375, 3.03564453125, 3.610595703125, 4.185546875, 4.760498046875, 5.33544921875, 5.910400390625, 6.4853515625, 7.060302734375, 7.63525390625, 8.210205078125, 8.78515625, 9.360107421875, 9.93505859375, 10.510009765625, 11.0849609375, 11.659912109375, 12.23486328125, 12.809814453125, 13.384765625, 13.959716796875, 14.53466796875, 15.109619140625, 15.6845703125, 16.259521484375, 16.83447265625, 17.409423828125, 17.984375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 2.0, 3.0, 12.0, 4.0, 15.0, 18.0, 15.0, 17.0, 31.0, 33.0, 38.0, 37.0, 34.0, 45.0, 53.0, 39.0, 42.0, 47.0, 61.0, 52.0, 48.0, 44.0, 46.0, 36.0, 38.0, 29.0, 32.0, 23.0, 25.0, 21.0, 12.0, 14.0, 9.0, 10.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -17.195556640625, -16.65673828125, -16.117919921875, -15.5791015625, -15.040283203125, -14.50146484375, -13.962646484375, -13.423828125, -12.885009765625, -12.34619140625, -11.807373046875, -11.2685546875, -10.729736328125, -10.19091796875, -9.652099609375, -9.11328125, -8.574462890625, -8.03564453125, -7.496826171875, -6.9580078125, -6.419189453125, -5.88037109375, -5.341552734375, -4.802734375, -4.263916015625, -3.72509765625, -3.186279296875, -2.6474609375, -2.108642578125, -1.56982421875, -1.031005859375, -0.4921875, 0.046630859375, 0.58544921875, 1.124267578125, 1.6630859375, 2.201904296875, 2.74072265625, 3.279541015625, 3.818359375, 4.357177734375, 4.89599609375, 5.434814453125, 5.9736328125, 6.512451171875, 7.05126953125, 7.590087890625, 8.12890625, 8.667724609375, 9.20654296875, 9.745361328125, 10.2841796875, 10.822998046875, 11.36181640625, 11.900634765625, 12.439453125, 12.978271484375, 13.51708984375, 14.055908203125, 14.5947265625, 15.133544921875, 15.67236328125, 16.211181640625, 16.75]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 11.0, 8.0, 14.0, 16.0, 14.0, 25.0, 40.0, 68.0, 110.0, 208.0, 471.0, 1342.0, 6726.0, 77502.0, 882294.0, 71105.0, 6387.0, 1218.0, 435.0, 209.0, 104.0, 83.0, 42.0, 43.0, 25.0, 13.0, 13.0, 12.0, 12.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.25775146484375, -7.0115966796875, -6.76544189453125, -6.519287109375, -6.27313232421875, -6.0269775390625, -5.78082275390625, -5.53466796875, -5.28851318359375, -5.0423583984375, -4.79620361328125, -4.550048828125, -4.30389404296875, -4.0577392578125, -3.81158447265625, -3.5654296875, -3.31927490234375, -3.0731201171875, -2.82696533203125, -2.580810546875, -2.33465576171875, -2.0885009765625, -1.84234619140625, -1.59619140625, -1.35003662109375, -1.1038818359375, -0.85772705078125, -0.611572265625, -0.36541748046875, -0.1192626953125, 0.12689208984375, 0.373046875, 0.61920166015625, 0.8653564453125, 1.11151123046875, 1.357666015625, 1.60382080078125, 1.8499755859375, 2.09613037109375, 2.34228515625, 2.58843994140625, 2.8345947265625, 3.08074951171875, 3.326904296875, 3.57305908203125, 3.8192138671875, 4.06536865234375, 4.3115234375, 4.55767822265625, 4.8038330078125, 5.04998779296875, 5.296142578125, 5.54229736328125, 5.7884521484375, 6.03460693359375, 6.28076171875, 6.52691650390625, 6.7730712890625, 7.01922607421875, 7.265380859375, 7.51153564453125, 7.7576904296875, 8.00384521484375, 8.25]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 7.0, 9.0, 15.0, 19.0, 21.0, 22.0, 20.0, 31.0, 54.0, 77.0, 107.0, 136.0, 127.0, 100.0, 59.0, 47.0, 35.0, 27.0, 17.0, 13.0, 12.0, 7.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0010671615600585938, -0.0010344982147216797, -0.0010018348693847656, -0.0009691715240478516, -0.0009365081787109375, -0.0009038448333740234, -0.0008711814880371094, -0.0008385181427001953, -0.0008058547973632812, -0.0007731914520263672, -0.0007405281066894531, -0.0007078647613525391, -0.000675201416015625, -0.0006425380706787109, -0.0006098747253417969, -0.0005772113800048828, -0.0005445480346679688, -0.0005118846893310547, -0.0004792213439941406, -0.00044655799865722656, -0.0004138946533203125, -0.00038123130798339844, -0.0003485679626464844, -0.0003159046173095703, -0.00028324127197265625, -0.0002505779266357422, -0.00021791458129882812, -0.00018525123596191406, -0.000152587890625, -0.00011992454528808594, -8.726119995117188e-05, -5.459785461425781e-05, -2.193450927734375e-05, 1.0728836059570312e-05, 4.3392181396484375e-05, 7.605552673339844e-05, 0.0001087188720703125, 0.00014138221740722656, 0.00017404556274414062, 0.0002067089080810547, 0.00023937225341796875, 0.0002720355987548828, 0.0003046989440917969, 0.00033736228942871094, 0.000370025634765625, 0.00040268898010253906, 0.0004353523254394531, 0.0004680156707763672, 0.0005006790161132812, 0.0005333423614501953, 0.0005660057067871094, 0.0005986690521240234, 0.0006313323974609375, 0.0006639957427978516, 0.0006966590881347656, 0.0007293224334716797, 0.0007619857788085938, 0.0007946491241455078, 0.0008273124694824219, 0.0008599758148193359, 0.00089263916015625, 0.0009253025054931641, 0.0009579658508300781, 0.0009906291961669922, 0.0010232925415039062]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 12.0, 8.0, 15.0, 21.0, 29.0, 37.0, 54.0, 97.0, 109.0, 163.0, 331.0, 568.0, 1038.0, 2406.0, 6918.0, 26503.0, 189116.0, 707148.0, 89588.0, 15721.0, 4834.0, 1811.0, 823.0, 461.0, 257.0, 169.0, 91.0, 81.0, 36.0, 31.0, 22.0, 17.0, 14.0, 9.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.46875, -4.32611083984375, -4.1834716796875, -4.04083251953125, -3.898193359375, -3.75555419921875, -3.6129150390625, -3.47027587890625, -3.32763671875, -3.18499755859375, -3.0423583984375, -2.89971923828125, -2.757080078125, -2.61444091796875, -2.4718017578125, -2.32916259765625, -2.1865234375, -2.04388427734375, -1.9012451171875, -1.75860595703125, -1.615966796875, -1.47332763671875, -1.3306884765625, -1.18804931640625, -1.04541015625, -0.90277099609375, -0.7601318359375, -0.61749267578125, -0.474853515625, -0.33221435546875, -0.1895751953125, -0.04693603515625, 0.095703125, 0.23834228515625, 0.3809814453125, 0.52362060546875, 0.666259765625, 0.80889892578125, 0.9515380859375, 1.09417724609375, 1.23681640625, 1.37945556640625, 1.5220947265625, 1.66473388671875, 1.807373046875, 1.95001220703125, 2.0926513671875, 2.23529052734375, 2.3779296875, 2.52056884765625, 2.6632080078125, 2.80584716796875, 2.948486328125, 3.09112548828125, 3.2337646484375, 3.37640380859375, 3.51904296875, 3.66168212890625, 3.8043212890625, 3.94696044921875, 4.089599609375, 4.23223876953125, 4.3748779296875, 4.51751708984375, 4.66015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 7.0, 3.0, 7.0, 5.0, 11.0, 13.0, 18.0, 16.0, 29.0, 47.0, 55.0, 85.0, 80.0, 95.0, 86.0, 106.0, 78.0, 52.0, 43.0, 34.0, 28.0, 18.0, 13.0, 13.0, 12.0, 13.0, 7.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.321533203125, -4.18212890625, -4.042724609375, -3.9033203125, -3.763916015625, -3.62451171875, -3.485107421875, -3.345703125, -3.206298828125, -3.06689453125, -2.927490234375, -2.7880859375, -2.648681640625, -2.50927734375, -2.369873046875, -2.23046875, -2.091064453125, -1.95166015625, -1.812255859375, -1.6728515625, -1.533447265625, -1.39404296875, -1.254638671875, -1.115234375, -0.975830078125, -0.83642578125, -0.697021484375, -0.5576171875, -0.418212890625, -0.27880859375, -0.139404296875, 0.0, 0.139404296875, 0.27880859375, 0.418212890625, 0.5576171875, 0.697021484375, 0.83642578125, 0.975830078125, 1.115234375, 1.254638671875, 1.39404296875, 1.533447265625, 1.6728515625, 1.812255859375, 1.95166015625, 2.091064453125, 2.23046875, 2.369873046875, 2.50927734375, 2.648681640625, 2.7880859375, 2.927490234375, 3.06689453125, 3.206298828125, 3.345703125, 3.485107421875, 3.62451171875, 3.763916015625, 3.9033203125, 4.042724609375, 4.18212890625, 4.321533203125, 4.4609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 30.0, 79.0, 205.0, 338.0, 190.0, 68.0, 34.0, 14.0, 5.0, 9.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-142.3876190185547, -137.53054809570312, -132.67349243164062, -127.8164291381836, -122.95936584472656, -118.102294921875, -113.24523162841797, -108.38816833496094, -103.5311050415039, -98.67404174804688, -93.81697845458984, -88.95991516113281, -84.10284423828125, -79.24578857421875, -74.38871765136719, -69.53165435791016, -64.67459106445312, -59.817527770996094, -54.96046447753906, -50.103397369384766, -45.246334075927734, -40.3892707824707, -35.532203674316406, -30.675140380859375, -25.818077087402344, -20.961013793945312, -16.10394859313965, -11.2468843460083, -6.389820098876953, -1.5327568054199219, 3.324308395385742, 8.181373596191406, 13.038436889648438, 17.89550018310547, 22.752565383911133, 27.609630584716797, 32.46669387817383, 37.32375717163086, 42.180824279785156, 47.03788757324219, 51.89495086669922, 56.75201416015625, 61.60907745361328, 66.46614074707031, 71.32321166992188, 76.18026733398438, 81.03733825683594, 85.89440155029297, 90.75146484375, 95.60852813720703, 100.46559143066406, 105.3226547241211, 110.17971801757812, 115.03678894042969, 119.89385223388672, 124.75091552734375, 129.60797119140625, 134.4650421142578, 139.3220977783203, 144.17916870117188, 149.03622436523438, 153.89329528808594, 158.75035095214844, 163.607421875, 168.46449279785156]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 7.0, 4.0, 7.0, 6.0, 4.0, 6.0, 8.0, 10.0, 14.0, 14.0, 20.0, 12.0, 12.0, 21.0, 19.0, 33.0, 31.0, 30.0, 37.0, 41.0, 36.0, 62.0, 61.0, 60.0, 44.0, 40.0, 43.0, 31.0, 36.0, 26.0, 28.0, 21.0, 12.0, 21.0, 12.0, 12.0, 15.0, 18.0, 5.0, 7.0, 12.0, 17.0, 4.0, 4.0, 8.0, 4.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-52.010581970214844, -50.38212966918945, -48.75367736816406, -47.12522506713867, -45.49677276611328, -43.86832046508789, -42.2398681640625, -40.611419677734375, -38.98296356201172, -37.35451126098633, -35.72605895996094, -34.09760665893555, -32.469154357910156, -30.840702056884766, -29.212251663208008, -27.583799362182617, -25.95534896850586, -24.32689666748047, -22.698444366455078, -21.069992065429688, -19.441539764404297, -17.813087463378906, -16.18463706970215, -14.556184768676758, -12.927732467651367, -11.299280166625977, -9.670827865600586, -8.042376518249512, -6.413924217224121, -4.7854719161987305, -3.1570205688476562, -1.5285682678222656, 0.099884033203125, 1.7283360958099365, 3.356788158416748, 4.9852399826049805, 6.613692283630371, 8.242144584655762, 9.870595932006836, 11.499048233032227, 13.127500534057617, 14.755952835083008, 16.3844051361084, 18.012855529785156, 19.641307830810547, 21.269760131835938, 22.898212432861328, 24.52666473388672, 26.15511703491211, 27.7835693359375, 29.41202163696289, 31.04047393798828, 32.66892623901367, 34.29737854003906, 35.92582702636719, 37.554283142089844, 39.18273162841797, 40.81118392944336, 42.43963623046875, 44.06808853149414, 45.69654083251953, 47.32499313354492, 48.95344543457031, 50.58189392089844, 52.210350036621094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 16.0, 22.0, 23.0, 45.0, 64.0, 124.0, 233.0, 581.0, 1943.0, 9967.0, 203833.0, 3812477.0, 152440.0, 9701.0, 1777.0, 581.0, 183.0, 109.0, 59.0, 33.0, 25.0, 15.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-18.359375, -17.9166259765625, -17.473876953125, -17.0311279296875, -16.58837890625, -16.1456298828125, -15.702880859375, -15.2601318359375, -14.8173828125, -14.3746337890625, -13.931884765625, -13.4891357421875, -13.04638671875, -12.6036376953125, -12.160888671875, -11.7181396484375, -11.275390625, -10.8326416015625, -10.389892578125, -9.9471435546875, -9.50439453125, -9.0616455078125, -8.618896484375, -8.1761474609375, -7.7333984375, -7.2906494140625, -6.847900390625, -6.4051513671875, -5.96240234375, -5.5196533203125, -5.076904296875, -4.6341552734375, -4.19140625, -3.7486572265625, -3.305908203125, -2.8631591796875, -2.42041015625, -1.9776611328125, -1.534912109375, -1.0921630859375, -0.6494140625, -0.2066650390625, 0.236083984375, 0.6788330078125, 1.12158203125, 1.5643310546875, 2.007080078125, 2.4498291015625, 2.892578125, 3.3353271484375, 3.778076171875, 4.2208251953125, 4.66357421875, 5.1063232421875, 5.549072265625, 5.9918212890625, 6.4345703125, 6.8773193359375, 7.320068359375, 7.7628173828125, 8.20556640625, 8.6483154296875, 9.091064453125, 9.5338134765625, 9.9765625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 13.0, 27.0, 24.0, 35.0, 36.0, 66.0, 67.0, 66.0, 98.0, 99.0, 92.0, 76.0, 66.0, 39.0, 53.0, 37.0, 30.0, 22.0, 13.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.671875, -9.43902587890625, -9.2061767578125, -8.97332763671875, -8.740478515625, -8.50762939453125, -8.2747802734375, -8.04193115234375, -7.80908203125, -7.57623291015625, -7.3433837890625, -7.11053466796875, -6.877685546875, -6.64483642578125, -6.4119873046875, -6.17913818359375, -5.9462890625, -5.71343994140625, -5.4805908203125, -5.24774169921875, -5.014892578125, -4.78204345703125, -4.5491943359375, -4.31634521484375, -4.08349609375, -3.85064697265625, -3.6177978515625, -3.38494873046875, -3.152099609375, -2.91925048828125, -2.6864013671875, -2.45355224609375, -2.220703125, -1.98785400390625, -1.7550048828125, -1.52215576171875, -1.289306640625, -1.05645751953125, -0.8236083984375, -0.59075927734375, -0.35791015625, -0.12506103515625, 0.1077880859375, 0.34063720703125, 0.573486328125, 0.80633544921875, 1.0391845703125, 1.27203369140625, 1.5048828125, 1.73773193359375, 1.9705810546875, 2.20343017578125, 2.436279296875, 2.66912841796875, 2.9019775390625, 3.13482666015625, 3.36767578125, 3.60052490234375, 3.8333740234375, 4.06622314453125, 4.299072265625, 4.53192138671875, 4.7647705078125, 4.99761962890625, 5.23046875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 8.0, 4.0, 9.0, 11.0, 15.0, 24.0, 36.0, 69.0, 102.0, 201.0, 333.0, 735.0, 1902.0, 6167.0, 39679.0, 2032683.0, 2062414.0, 40179.0, 6453.0, 1878.0, 731.0, 331.0, 123.0, 75.0, 54.0, 16.0, 18.0, 7.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.1148681640625, -15.667236328125, -15.2196044921875, -14.77197265625, -14.3243408203125, -13.876708984375, -13.4290771484375, -12.9814453125, -12.5338134765625, -12.086181640625, -11.6385498046875, -11.19091796875, -10.7432861328125, -10.295654296875, -9.8480224609375, -9.400390625, -8.9527587890625, -8.505126953125, -8.0574951171875, -7.60986328125, -7.1622314453125, -6.714599609375, -6.2669677734375, -5.8193359375, -5.3717041015625, -4.924072265625, -4.4764404296875, -4.02880859375, -3.5811767578125, -3.133544921875, -2.6859130859375, -2.23828125, -1.7906494140625, -1.343017578125, -0.8953857421875, -0.44775390625, -0.0001220703125, 0.447509765625, 0.8951416015625, 1.3427734375, 1.7904052734375, 2.238037109375, 2.6856689453125, 3.13330078125, 3.5809326171875, 4.028564453125, 4.4761962890625, 4.923828125, 5.3714599609375, 5.819091796875, 6.2667236328125, 6.71435546875, 7.1619873046875, 7.609619140625, 8.0572509765625, 8.5048828125, 8.9525146484375, 9.400146484375, 9.8477783203125, 10.29541015625, 10.7430419921875, 11.190673828125, 11.6383056640625, 12.0859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 12.0, 23.0, 21.0, 45.0, 104.0, 229.0, 583.0, 1295.0, 1018.0, 416.0, 144.0, 65.0, 44.0, 19.0, 23.0, 10.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.59375, -19.088134765625, -18.58251953125, -18.076904296875, -17.5712890625, -17.065673828125, -16.56005859375, -16.054443359375, -15.548828125, -15.043212890625, -14.53759765625, -14.031982421875, -13.5263671875, -13.020751953125, -12.51513671875, -12.009521484375, -11.50390625, -10.998291015625, -10.49267578125, -9.987060546875, -9.4814453125, -8.975830078125, -8.47021484375, -7.964599609375, -7.458984375, -6.953369140625, -6.44775390625, -5.942138671875, -5.4365234375, -4.930908203125, -4.42529296875, -3.919677734375, -3.4140625, -2.908447265625, -2.40283203125, -1.897216796875, -1.3916015625, -0.885986328125, -0.38037109375, 0.125244140625, 0.630859375, 1.136474609375, 1.64208984375, 2.147705078125, 2.6533203125, 3.158935546875, 3.66455078125, 4.170166015625, 4.67578125, 5.181396484375, 5.68701171875, 6.192626953125, 6.6982421875, 7.203857421875, 7.70947265625, 8.215087890625, 8.720703125, 9.226318359375, 9.73193359375, 10.237548828125, 10.7431640625, 11.248779296875, 11.75439453125, 12.260009765625, 12.765625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 41.0, 176.0, 397.0, 260.0, 70.0, 17.0, 13.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.7108154296875, -150.80667114257812, -144.9025115966797, -138.9983673095703, -133.09420776367188, -127.1900634765625, -121.2859115600586, -115.38175964355469, -109.47761535644531, -103.5734634399414, -97.6693115234375, -91.76516723632812, -85.86101531982422, -79.95686340332031, -74.0527114868164, -68.1485595703125, -62.244407653808594, -56.34025573730469, -50.43610763549805, -44.53195571899414, -38.6278076171875, -32.723655700683594, -26.819503784179688, -20.915355682373047, -15.01120376586914, -9.107053756713867, -3.2029027938842773, 2.7012481689453125, 8.605398178100586, 14.50954818725586, 20.413700103759766, 26.317848205566406, 32.22200012207031, 38.12615203857422, 44.03030014038086, 49.934452056884766, 55.838600158691406, 61.74275207519531, 67.64690399169922, 73.55105590820312, 79.4552001953125, 85.3593521118164, 91.26350402832031, 97.16764831542969, 103.0718002319336, 108.9759521484375, 114.8801040649414, 120.78425598144531, 126.68840789794922, 132.59255981445312, 138.4967041015625, 144.40086364746094, 150.3050079345703, 156.20916748046875, 162.11331176757812, 168.0174560546875, 173.92161560058594, 179.8257598876953, 185.72991943359375, 191.63406372070312, 197.53822326660156, 203.44236755371094, 209.34652709960938, 215.25067138671875, 221.15481567382812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 13.0, 21.0, 26.0, 35.0, 42.0, 39.0, 63.0, 54.0, 68.0, 71.0, 88.0, 67.0, 74.0, 57.0, 54.0, 55.0, 55.0, 27.0, 31.0, 21.0, 13.0, 6.0, 2.0, 6.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.51918029785156, -37.604488372802734, -35.689796447753906, -33.77510452270508, -31.86041259765625, -29.945720672607422, -28.031030654907227, -26.1163387298584, -24.20164680480957, -22.286954879760742, -20.372262954711914, -18.45757293701172, -16.54288101196289, -14.628188133239746, -12.713497161865234, -10.798805236816406, -8.884113311767578, -6.96942138671875, -5.05472993850708, -3.14003849029541, -1.225346565246582, 0.6893453598022461, 2.604036331176758, 4.518728256225586, 6.433420181274414, 8.348112106323242, 10.26280403137207, 12.177495002746582, 14.09218692779541, 16.006877899169922, 17.92156982421875, 19.836261749267578, 21.750953674316406, 23.665645599365234, 25.580337524414062, 27.49502944946289, 29.40972137451172, 31.324413299560547, 33.239105224609375, 35.15379333496094, 37.06848907470703, 38.98318099975586, 40.89787292480469, 42.812564849853516, 44.727256774902344, 46.64194869995117, 48.556640625, 50.47132873535156, 52.38602066040039, 54.30071258544922, 56.21540451049805, 58.130096435546875, 60.0447883605957, 61.95948028564453, 63.874168395996094, 65.78886413574219, 67.70355224609375, 69.61824035644531, 71.5329360961914, 73.44762420654297, 75.36231994628906, 77.27700805664062, 79.19170379638672, 81.10639190673828, 83.02108764648438]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 5.0, 8.0, 9.0, 22.0, 25.0, 44.0, 68.0, 135.0, 187.0, 415.0, 841.0, 2025.0, 6231.0, 22784.0, 106622.0, 476362.0, 343382.0, 66499.0, 15233.0, 4501.0, 1631.0, 732.0, 319.0, 173.0, 98.0, 57.0, 41.0, 30.0, 21.0, 18.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.6009521484375, -10.287841796875, -9.9747314453125, -9.66162109375, -9.3485107421875, -9.035400390625, -8.7222900390625, -8.4091796875, -8.0960693359375, -7.782958984375, -7.4698486328125, -7.15673828125, -6.8436279296875, -6.530517578125, -6.2174072265625, -5.904296875, -5.5911865234375, -5.278076171875, -4.9649658203125, -4.65185546875, -4.3387451171875, -4.025634765625, -3.7125244140625, -3.3994140625, -3.0863037109375, -2.773193359375, -2.4600830078125, -2.14697265625, -1.8338623046875, -1.520751953125, -1.2076416015625, -0.89453125, -0.5814208984375, -0.268310546875, 0.0447998046875, 0.35791015625, 0.6710205078125, 0.984130859375, 1.2972412109375, 1.6103515625, 1.9234619140625, 2.236572265625, 2.5496826171875, 2.86279296875, 3.1759033203125, 3.489013671875, 3.8021240234375, 4.115234375, 4.4283447265625, 4.741455078125, 5.0545654296875, 5.36767578125, 5.6807861328125, 5.993896484375, 6.3070068359375, 6.6201171875, 6.9332275390625, 7.246337890625, 7.5594482421875, 7.87255859375, 8.1856689453125, 8.498779296875, 8.8118896484375, 9.125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 6.0, 10.0, 11.0, 17.0, 26.0, 35.0, 34.0, 45.0, 55.0, 75.0, 88.0, 55.0, 83.0, 77.0, 59.0, 66.0, 66.0, 49.0, 33.0, 33.0, 22.0, 20.0, 18.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-9.0625, -8.84423828125, -8.6259765625, -8.40771484375, -8.189453125, -7.97119140625, -7.7529296875, -7.53466796875, -7.31640625, -7.09814453125, -6.8798828125, -6.66162109375, -6.443359375, -6.22509765625, -6.0068359375, -5.78857421875, -5.5703125, -5.35205078125, -5.1337890625, -4.91552734375, -4.697265625, -4.47900390625, -4.2607421875, -4.04248046875, -3.82421875, -3.60595703125, -3.3876953125, -3.16943359375, -2.951171875, -2.73291015625, -2.5146484375, -2.29638671875, -2.078125, -1.85986328125, -1.6416015625, -1.42333984375, -1.205078125, -0.98681640625, -0.7685546875, -0.55029296875, -0.33203125, -0.11376953125, 0.1044921875, 0.32275390625, 0.541015625, 0.75927734375, 0.9775390625, 1.19580078125, 1.4140625, 1.63232421875, 1.8505859375, 2.06884765625, 2.287109375, 2.50537109375, 2.7236328125, 2.94189453125, 3.16015625, 3.37841796875, 3.5966796875, 3.81494140625, 4.033203125, 4.25146484375, 4.4697265625, 4.68798828125, 4.90625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 22.0, 19.0, 27.0, 31.0, 44.0, 77.0, 138.0, 253.0, 589.0, 1475.0, 5164.0, 25595.0, 186759.0, 697052.0, 109326.0, 16208.0, 3638.0, 1132.0, 455.0, 210.0, 120.0, 73.0, 33.0, 39.0, 20.0, 14.0, 10.0, 9.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0390625, -12.6483154296875, -12.257568359375, -11.8668212890625, -11.47607421875, -11.0853271484375, -10.694580078125, -10.3038330078125, -9.9130859375, -9.5223388671875, -9.131591796875, -8.7408447265625, -8.35009765625, -7.9593505859375, -7.568603515625, -7.1778564453125, -6.787109375, -6.3963623046875, -6.005615234375, -5.6148681640625, -5.22412109375, -4.8333740234375, -4.442626953125, -4.0518798828125, -3.6611328125, -3.2703857421875, -2.879638671875, -2.4888916015625, -2.09814453125, -1.7073974609375, -1.316650390625, -0.9259033203125, -0.53515625, -0.1444091796875, 0.246337890625, 0.6370849609375, 1.02783203125, 1.4185791015625, 1.809326171875, 2.2000732421875, 2.5908203125, 2.9815673828125, 3.372314453125, 3.7630615234375, 4.15380859375, 4.5445556640625, 4.935302734375, 5.3260498046875, 5.716796875, 6.1075439453125, 6.498291015625, 6.8890380859375, 7.27978515625, 7.6705322265625, 8.061279296875, 8.4520263671875, 8.8427734375, 9.2335205078125, 9.624267578125, 10.0150146484375, 10.40576171875, 10.7965087890625, 11.187255859375, 11.5780029296875, 11.96875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 5.0, 8.0, 9.0, 9.0, 13.0, 22.0, 20.0, 22.0, 24.0, 37.0, 35.0, 38.0, 28.0, 59.0, 48.0, 47.0, 43.0, 57.0, 57.0, 50.0, 41.0, 36.0, 43.0, 36.0, 35.0, 36.0, 24.0, 23.0, 20.0, 20.0, 13.0, 14.0, 9.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.843505859375, -15.32763671875, -14.811767578125, -14.2958984375, -13.780029296875, -13.26416015625, -12.748291015625, -12.232421875, -11.716552734375, -11.20068359375, -10.684814453125, -10.1689453125, -9.653076171875, -9.13720703125, -8.621337890625, -8.10546875, -7.589599609375, -7.07373046875, -6.557861328125, -6.0419921875, -5.526123046875, -5.01025390625, -4.494384765625, -3.978515625, -3.462646484375, -2.94677734375, -2.430908203125, -1.9150390625, -1.399169921875, -0.88330078125, -0.367431640625, 0.1484375, 0.664306640625, 1.18017578125, 1.696044921875, 2.2119140625, 2.727783203125, 3.24365234375, 3.759521484375, 4.275390625, 4.791259765625, 5.30712890625, 5.822998046875, 6.3388671875, 6.854736328125, 7.37060546875, 7.886474609375, 8.40234375, 8.918212890625, 9.43408203125, 9.949951171875, 10.4658203125, 10.981689453125, 11.49755859375, 12.013427734375, 12.529296875, 13.045166015625, 13.56103515625, 14.076904296875, 14.5927734375, 15.108642578125, 15.62451171875, 16.140380859375, 16.65625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 2.0, 7.0, 7.0, 7.0, 15.0, 15.0, 28.0, 39.0, 53.0, 103.0, 167.0, 312.0, 700.0, 1966.0, 6566.0, 27434.0, 151302.0, 677634.0, 145767.0, 26728.0, 6284.0, 1928.0, 731.0, 329.0, 158.0, 77.0, 60.0, 40.0, 21.0, 13.0, 13.0, 6.0, 9.0, 9.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.546875, -2.46051025390625, -2.3741455078125, -2.28778076171875, -2.201416015625, -2.11505126953125, -2.0286865234375, -1.94232177734375, -1.85595703125, -1.76959228515625, -1.6832275390625, -1.59686279296875, -1.510498046875, -1.42413330078125, -1.3377685546875, -1.25140380859375, -1.1650390625, -1.07867431640625, -0.9923095703125, -0.90594482421875, -0.819580078125, -0.73321533203125, -0.6468505859375, -0.56048583984375, -0.47412109375, -0.38775634765625, -0.3013916015625, -0.21502685546875, -0.128662109375, -0.04229736328125, 0.0440673828125, 0.13043212890625, 0.216796875, 0.30316162109375, 0.3895263671875, 0.47589111328125, 0.562255859375, 0.64862060546875, 0.7349853515625, 0.82135009765625, 0.90771484375, 0.99407958984375, 1.0804443359375, 1.16680908203125, 1.253173828125, 1.33953857421875, 1.4259033203125, 1.51226806640625, 1.5986328125, 1.68499755859375, 1.7713623046875, 1.85772705078125, 1.944091796875, 2.03045654296875, 2.1168212890625, 2.20318603515625, 2.28955078125, 2.37591552734375, 2.4622802734375, 2.54864501953125, 2.635009765625, 2.72137451171875, 2.8077392578125, 2.89410400390625, 2.98046875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 6.0, 12.0, 12.0, 13.0, 23.0, 27.0, 33.0, 57.0, 81.0, 116.0, 140.0, 108.0, 92.0, 89.0, 48.0, 44.0, 25.0, 16.0, 18.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006136894226074219, -0.0005915537476539612, -0.0005694180727005005, -0.0005472823977470398, -0.0005251467227935791, -0.0005030110478401184, -0.0004808753728866577, -0.000458739697933197, -0.00043660402297973633, -0.00041446834802627563, -0.00039233267307281494, -0.00037019699811935425, -0.00034806132316589355, -0.00032592564821243286, -0.00030378997325897217, -0.0002816542983055115, -0.0002595186233520508, -0.0002373829483985901, -0.0002152472734451294, -0.0001931115984916687, -0.000170975923538208, -0.00014884024858474731, -0.00012670457363128662, -0.00010456889867782593, -8.243322372436523e-05, -6.029754877090454e-05, -3.816187381744385e-05, -1.6026198863983154e-05, 6.109476089477539e-06, 2.8245151042938232e-05, 5.0380825996398926e-05, 7.251650094985962e-05, 9.465217590332031e-05, 0.000116787850856781, 0.0001389235258102417, 0.0001610592007637024, 0.00018319487571716309, 0.00020533055067062378, 0.00022746622562408447, 0.00024960190057754517, 0.00027173757553100586, 0.00029387325048446655, 0.00031600892543792725, 0.00033814460039138794, 0.00036028027534484863, 0.0003824159502983093, 0.00040455162525177, 0.0004266873002052307, 0.0004488229751586914, 0.0004709586501121521, 0.0004930943250656128, 0.0005152300000190735, 0.0005373656749725342, 0.0005595013499259949, 0.0005816370248794556, 0.0006037726998329163, 0.000625908374786377, 0.0006480440497398376, 0.0006701797246932983, 0.000692315399646759, 0.0007144510746002197, 0.0007365867495536804, 0.0007587224245071411, 0.0007808580994606018, 0.0008029937744140625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 6.0, 11.0, 13.0, 26.0, 52.0, 96.0, 161.0, 375.0, 1100.0, 3707.0, 17517.0, 155588.0, 759176.0, 94194.0, 12176.0, 2714.0, 928.0, 357.0, 163.0, 65.0, 54.0, 23.0, 20.0, 12.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7421875, -4.618682861328125, -4.49517822265625, -4.371673583984375, -4.2481689453125, -4.124664306640625, -4.00115966796875, -3.877655029296875, -3.754150390625, -3.630645751953125, -3.50714111328125, -3.383636474609375, -3.2601318359375, -3.136627197265625, -3.01312255859375, -2.889617919921875, -2.76611328125, -2.642608642578125, -2.51910400390625, -2.395599365234375, -2.2720947265625, -2.148590087890625, -2.02508544921875, -1.901580810546875, -1.778076171875, -1.654571533203125, -1.53106689453125, -1.407562255859375, -1.2840576171875, -1.160552978515625, -1.03704833984375, -0.913543701171875, -0.7900390625, -0.666534423828125, -0.54302978515625, -0.419525146484375, -0.2960205078125, -0.172515869140625, -0.04901123046875, 0.074493408203125, 0.197998046875, 0.321502685546875, 0.44500732421875, 0.568511962890625, 0.6920166015625, 0.815521240234375, 0.93902587890625, 1.062530517578125, 1.18603515625, 1.309539794921875, 1.43304443359375, 1.556549072265625, 1.6800537109375, 1.803558349609375, 1.92706298828125, 2.050567626953125, 2.174072265625, 2.297576904296875, 2.42108154296875, 2.544586181640625, 2.6680908203125, 2.791595458984375, 2.91510009765625, 3.038604736328125, 3.162109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 8.0, 11.0, 13.0, 18.0, 22.0, 23.0, 43.0, 69.0, 73.0, 96.0, 108.0, 121.0, 93.0, 76.0, 63.0, 42.0, 39.0, 17.0, 18.0, 15.0, 5.0, 12.0, 3.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17578125, -3.07379150390625, -2.9718017578125, -2.86981201171875, -2.767822265625, -2.66583251953125, -2.5638427734375, -2.46185302734375, -2.35986328125, -2.25787353515625, -2.1558837890625, -2.05389404296875, -1.951904296875, -1.84991455078125, -1.7479248046875, -1.64593505859375, -1.5439453125, -1.44195556640625, -1.3399658203125, -1.23797607421875, -1.135986328125, -1.03399658203125, -0.9320068359375, -0.83001708984375, -0.72802734375, -0.62603759765625, -0.5240478515625, -0.42205810546875, -0.320068359375, -0.21807861328125, -0.1160888671875, -0.01409912109375, 0.087890625, 0.18988037109375, 0.2918701171875, 0.39385986328125, 0.495849609375, 0.59783935546875, 0.6998291015625, 0.80181884765625, 0.90380859375, 1.00579833984375, 1.1077880859375, 1.20977783203125, 1.311767578125, 1.41375732421875, 1.5157470703125, 1.61773681640625, 1.7197265625, 1.82171630859375, 1.9237060546875, 2.02569580078125, 2.127685546875, 2.22967529296875, 2.3316650390625, 2.43365478515625, 2.53564453125, 2.63763427734375, 2.7396240234375, 2.84161376953125, 2.943603515625, 3.04559326171875, 3.1475830078125, 3.24957275390625, 3.3515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 6.0, 11.0, 15.0, 41.0, 99.0, 218.0, 333.0, 136.0, 70.0, 37.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.84374237060547, -97.51134490966797, -94.17894744873047, -90.84654998779297, -87.51415252685547, -84.18175506591797, -80.84935760498047, -77.51696014404297, -74.18456268310547, -70.85216522216797, -67.51976776123047, -64.18737030029297, -60.85497283935547, -57.52257537841797, -54.19017791748047, -50.85778045654297, -47.52538299560547, -44.19298553466797, -40.86058807373047, -37.52819061279297, -34.19579315185547, -30.86339569091797, -27.53099822998047, -24.19860076904297, -20.86620330810547, -17.53380584716797, -14.201408386230469, -10.869010925292969, -7.536613464355469, -4.204216003417969, -0.8718185424804688, 2.4605789184570312, 5.792976379394531, 9.125373840332031, 12.457771301269531, 15.790168762207031, 19.12256622314453, 22.45496368408203, 25.78736114501953, 29.11975860595703, 32.45215606689453, 35.78455352783203, 39.11695098876953, 42.44934844970703, 45.78174591064453, 49.11414337158203, 52.44654083251953, 55.77893829345703, 59.11133575439453, 62.44373321533203, 65.77613067626953, 69.10852813720703, 72.44092559814453, 75.77332305908203, 79.10572052001953, 82.43811798095703, 85.77051544189453, 89.10291290283203, 92.43531036376953, 95.76770782470703, 99.10010528564453, 102.43250274658203, 105.76490020751953, 109.09729766845703, 112.42969512939453]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 14.0, 9.0, 13.0, 11.0, 21.0, 33.0, 23.0, 36.0, 42.0, 35.0, 53.0, 47.0, 67.0, 84.0, 73.0, 70.0, 61.0, 42.0, 47.0, 34.0, 24.0, 28.0, 23.0, 20.0, 14.0, 20.0, 15.0, 7.0, 5.0, 6.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.76741027832031, -69.72059631347656, -67.67377471923828, -65.62696075439453, -63.580142974853516, -61.5333251953125, -59.48651123046875, -57.439693450927734, -55.39287567138672, -53.3460578918457, -51.29924011230469, -49.25242614746094, -47.20560836791992, -45.158790588378906, -43.111976623535156, -41.06515884399414, -39.018341064453125, -36.97152328491211, -34.924705505371094, -32.877891540527344, -30.831073760986328, -28.784255981445312, -26.73744010925293, -24.690624237060547, -22.64380645751953, -20.596988677978516, -18.550172805786133, -16.50335693359375, -14.456539154052734, -12.409722328186035, -10.362905502319336, -8.316088676452637, -6.269268035888672, -4.222451210021973, -2.1756343841552734, -0.12881755828857422, 1.917999267578125, 3.964816093444824, 6.011632919311523, 8.058449745178223, 10.105266571044922, 12.152083396911621, 14.19890022277832, 16.245716094970703, 18.29253387451172, 20.339351654052734, 22.386167526245117, 24.4329833984375, 26.479801177978516, 28.52661895751953, 30.573434829711914, 32.6202507019043, 34.66706848144531, 36.71388626098633, 38.760704040527344, 40.807518005371094, 42.85433578491211, 44.901153564453125, 46.947967529296875, 48.99478530883789, 51.041603088378906, 53.08842086791992, 55.13523864746094, 57.18205261230469, 59.2288703918457]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 11.0, 9.0, 14.0, 14.0, 21.0, 19.0, 35.0, 48.0, 108.0, 125.0, 225.0, 404.0, 887.0, 2156.0, 7093.0, 36148.0, 415995.0, 3163329.0, 511871.0, 42064.0, 8738.0, 2801.0, 1086.0, 456.0, 248.0, 141.0, 72.0, 53.0, 37.0, 25.0, 15.0, 8.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484375, -6.26483154296875, -6.0452880859375, -5.82574462890625, -5.606201171875, -5.38665771484375, -5.1671142578125, -4.94757080078125, -4.72802734375, -4.50848388671875, -4.2889404296875, -4.06939697265625, -3.849853515625, -3.63031005859375, -3.4107666015625, -3.19122314453125, -2.9716796875, -2.75213623046875, -2.5325927734375, -2.31304931640625, -2.093505859375, -1.87396240234375, -1.6544189453125, -1.43487548828125, -1.21533203125, -0.99578857421875, -0.7762451171875, -0.55670166015625, -0.337158203125, -0.11761474609375, 0.1019287109375, 0.32147216796875, 0.541015625, 0.76055908203125, 0.9801025390625, 1.19964599609375, 1.419189453125, 1.63873291015625, 1.8582763671875, 2.07781982421875, 2.29736328125, 2.51690673828125, 2.7364501953125, 2.95599365234375, 3.175537109375, 3.39508056640625, 3.6146240234375, 3.83416748046875, 4.0537109375, 4.27325439453125, 4.4927978515625, 4.71234130859375, 4.931884765625, 5.15142822265625, 5.3709716796875, 5.59051513671875, 5.81005859375, 6.02960205078125, 6.2491455078125, 6.46868896484375, 6.688232421875, 6.90777587890625, 7.1273193359375, 7.34686279296875, 7.56640625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 7.0, 13.0, 14.0, 22.0, 34.0, 40.0, 54.0, 51.0, 67.0, 78.0, 70.0, 65.0, 84.0, 80.0, 67.0, 69.0, 53.0, 32.0, 27.0, 21.0, 13.0, 10.0, 11.0, 4.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-8.84375, -8.6356201171875, -8.427490234375, -8.2193603515625, -8.01123046875, -7.8031005859375, -7.594970703125, -7.3868408203125, -7.1787109375, -6.9705810546875, -6.762451171875, -6.5543212890625, -6.34619140625, -6.1380615234375, -5.929931640625, -5.7218017578125, -5.513671875, -5.3055419921875, -5.097412109375, -4.8892822265625, -4.68115234375, -4.4730224609375, -4.264892578125, -4.0567626953125, -3.8486328125, -3.6405029296875, -3.432373046875, -3.2242431640625, -3.01611328125, -2.8079833984375, -2.599853515625, -2.3917236328125, -2.18359375, -1.9754638671875, -1.767333984375, -1.5592041015625, -1.35107421875, -1.1429443359375, -0.934814453125, -0.7266845703125, -0.5185546875, -0.3104248046875, -0.102294921875, 0.1058349609375, 0.31396484375, 0.5220947265625, 0.730224609375, 0.9383544921875, 1.146484375, 1.3546142578125, 1.562744140625, 1.7708740234375, 1.97900390625, 2.1871337890625, 2.395263671875, 2.6033935546875, 2.8115234375, 3.0196533203125, 3.227783203125, 3.4359130859375, 3.64404296875, 3.8521728515625, 4.060302734375, 4.2684326171875, 4.4765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 9.0, 6.0, 5.0, 13.0, 10.0, 9.0, 16.0, 21.0, 18.0, 35.0, 62.0, 98.0, 147.0, 318.0, 724.0, 2221.0, 7232.0, 32955.0, 333776.0, 3433204.0, 340035.0, 32839.0, 7015.0, 2054.0, 721.0, 289.0, 161.0, 83.0, 57.0, 41.0, 29.0, 22.0, 14.0, 11.0, 9.0, 9.0, 10.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.51318359375, -6.2763671875, -6.03955078125, -5.802734375, -5.56591796875, -5.3291015625, -5.09228515625, -4.85546875, -4.61865234375, -4.3818359375, -4.14501953125, -3.908203125, -3.67138671875, -3.4345703125, -3.19775390625, -2.9609375, -2.72412109375, -2.4873046875, -2.25048828125, -2.013671875, -1.77685546875, -1.5400390625, -1.30322265625, -1.06640625, -0.82958984375, -0.5927734375, -0.35595703125, -0.119140625, 0.11767578125, 0.3544921875, 0.59130859375, 0.828125, 1.06494140625, 1.3017578125, 1.53857421875, 1.775390625, 2.01220703125, 2.2490234375, 2.48583984375, 2.72265625, 2.95947265625, 3.1962890625, 3.43310546875, 3.669921875, 3.90673828125, 4.1435546875, 4.38037109375, 4.6171875, 4.85400390625, 5.0908203125, 5.32763671875, 5.564453125, 5.80126953125, 6.0380859375, 6.27490234375, 6.51171875, 6.74853515625, 6.9853515625, 7.22216796875, 7.458984375, 7.69580078125, 7.9326171875, 8.16943359375, 8.40625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 1.0, 8.0, 9.0, 2.0, 20.0, 14.0, 14.0, 30.0, 31.0, 61.0, 72.0, 89.0, 129.0, 192.0, 304.0, 432.0, 550.0, 575.0, 446.0, 346.0, 210.0, 179.0, 95.0, 73.0, 58.0, 32.0, 26.0, 14.0, 13.0, 9.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.25390625, -5.07354736328125, -4.8931884765625, -4.71282958984375, -4.532470703125, -4.35211181640625, -4.1717529296875, -3.99139404296875, -3.81103515625, -3.63067626953125, -3.4503173828125, -3.26995849609375, -3.089599609375, -2.90924072265625, -2.7288818359375, -2.54852294921875, -2.3681640625, -2.18780517578125, -2.0074462890625, -1.82708740234375, -1.646728515625, -1.46636962890625, -1.2860107421875, -1.10565185546875, -0.92529296875, -0.74493408203125, -0.5645751953125, -0.38421630859375, -0.203857421875, -0.02349853515625, 0.1568603515625, 0.33721923828125, 0.517578125, 0.69793701171875, 0.8782958984375, 1.05865478515625, 1.239013671875, 1.41937255859375, 1.5997314453125, 1.78009033203125, 1.96044921875, 2.14080810546875, 2.3211669921875, 2.50152587890625, 2.681884765625, 2.86224365234375, 3.0426025390625, 3.22296142578125, 3.4033203125, 3.58367919921875, 3.7640380859375, 3.94439697265625, 4.124755859375, 4.30511474609375, 4.4854736328125, 4.66583251953125, 4.84619140625, 5.02655029296875, 5.2069091796875, 5.38726806640625, 5.567626953125, 5.74798583984375, 5.9283447265625, 6.10870361328125, 6.2890625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 0.0, 2.0, 8.0, 14.0, 19.0, 57.0, 73.0, 125.0, 214.0, 180.0, 134.0, 67.0, 59.0, 10.0, 13.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.89309692382812, -70.10135650634766, -68.30960845947266, -66.51786804199219, -64.72612762451172, -62.934383392333984, -61.142642974853516, -59.35089874267578, -57.55915832519531, -55.76741409301758, -53.97567367553711, -52.183929443359375, -50.392189025878906, -48.60044479370117, -46.8087043762207, -45.01696014404297, -43.2252197265625, -41.433475494384766, -39.6417350769043, -37.84999084472656, -36.058250427246094, -34.26650619506836, -32.47476577758789, -30.683021545410156, -28.891277313232422, -27.09953498840332, -25.30779266357422, -23.516050338745117, -21.724308013916016, -19.93256378173828, -18.140823364257812, -16.349079132080078, -14.55733871459961, -12.765596389770508, -10.973854064941406, -9.182111740112305, -7.390368938446045, -5.598626136779785, -3.8068838119506836, -2.015141487121582, -0.22339916229248047, 1.5683432817459106, 3.3600857257843018, 5.151828289031982, 6.943570613861084, 8.735313415527344, 10.527055740356445, 12.318798065185547, 14.110540390014648, 15.90228271484375, 17.69402503967285, 19.485767364501953, 21.277509689331055, 23.069252014160156, 24.86099624633789, 26.65273666381836, 28.444480895996094, 30.236223220825195, 32.0279655456543, 33.81970977783203, 35.6114501953125, 37.403194427490234, 39.1949348449707, 40.98667907714844, 42.778419494628906]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 0.0, 1.0, 6.0, 1.0, 2.0, 12.0, 12.0, 6.0, 12.0, 29.0, 16.0, 27.0, 26.0, 22.0, 21.0, 36.0, 41.0, 43.0, 35.0, 32.0, 48.0, 43.0, 48.0, 37.0, 42.0, 47.0, 55.0, 41.0, 29.0, 39.0, 42.0, 24.0, 17.0, 21.0, 22.0, 11.0, 8.0, 13.0, 8.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.513671875, -26.714061737060547, -25.91444969177246, -25.114839553833008, -24.315229415893555, -23.51561737060547, -22.716007232666016, -21.916397094726562, -21.11678695678711, -20.317176818847656, -19.51756477355957, -18.717954635620117, -17.918344497680664, -17.118732452392578, -16.319122314453125, -15.519512176513672, -14.719900131225586, -13.920289039611816, -13.120678901672363, -12.321067810058594, -11.52145767211914, -10.721846580505371, -9.922235488891602, -9.122625350952148, -8.323014259338379, -7.523403644561768, -6.723793029785156, -5.924181938171387, -5.124571323394775, -4.324960708618164, -3.5253496170043945, -2.725739002227783, -1.9261283874511719, -1.126517653465271, -0.3269069194793701, 0.4727039337158203, 1.2723145484924316, 2.071925163269043, 2.8715362548828125, 3.671146869659424, 4.470757484436035, 5.2703680992126465, 6.069978713989258, 6.869589805603027, 7.669200420379639, 8.46881103515625, 9.26842212677002, 10.068033218383789, 10.867643356323242, 11.667254447937012, 12.466864585876465, 13.266475677490234, 14.066085815429688, 14.865696907043457, 15.665307998657227, 16.46491813659668, 17.264530181884766, 18.06414031982422, 18.863752365112305, 19.663362503051758, 20.46297264099121, 21.262584686279297, 22.06219482421875, 22.861804962158203, 23.661415100097656]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 10.0, 5.0, 8.0, 15.0, 17.0, 28.0, 29.0, 38.0, 70.0, 114.0, 158.0, 315.0, 509.0, 920.0, 1930.0, 4601.0, 12166.0, 37083.0, 128316.0, 403986.0, 321464.0, 92846.0, 27628.0, 9170.0, 3665.0, 1507.0, 770.0, 421.0, 269.0, 157.0, 97.0, 76.0, 41.0, 45.0, 22.0, 14.0, 10.0, 6.0, 12.0, 9.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.76953125, -6.55712890625, -6.3447265625, -6.13232421875, -5.919921875, -5.70751953125, -5.4951171875, -5.28271484375, -5.0703125, -4.85791015625, -4.6455078125, -4.43310546875, -4.220703125, -4.00830078125, -3.7958984375, -3.58349609375, -3.37109375, -3.15869140625, -2.9462890625, -2.73388671875, -2.521484375, -2.30908203125, -2.0966796875, -1.88427734375, -1.671875, -1.45947265625, -1.2470703125, -1.03466796875, -0.822265625, -0.60986328125, -0.3974609375, -0.18505859375, 0.02734375, 0.23974609375, 0.4521484375, 0.66455078125, 0.876953125, 1.08935546875, 1.3017578125, 1.51416015625, 1.7265625, 1.93896484375, 2.1513671875, 2.36376953125, 2.576171875, 2.78857421875, 3.0009765625, 3.21337890625, 3.42578125, 3.63818359375, 3.8505859375, 4.06298828125, 4.275390625, 4.48779296875, 4.7001953125, 4.91259765625, 5.125, 5.33740234375, 5.5498046875, 5.76220703125, 5.974609375, 6.18701171875, 6.3994140625, 6.61181640625, 6.82421875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 17.0, 13.0, 20.0, 40.0, 39.0, 45.0, 52.0, 71.0, 67.0, 78.0, 82.0, 71.0, 85.0, 73.0, 58.0, 37.0, 33.0, 37.0, 20.0, 20.0, 13.0, 8.0, 3.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-8.8359375, -8.62835693359375, -8.4207763671875, -8.21319580078125, -8.005615234375, -7.79803466796875, -7.5904541015625, -7.38287353515625, -7.17529296875, -6.96771240234375, -6.7601318359375, -6.55255126953125, -6.344970703125, -6.13739013671875, -5.9298095703125, -5.72222900390625, -5.5146484375, -5.30706787109375, -5.0994873046875, -4.89190673828125, -4.684326171875, -4.47674560546875, -4.2691650390625, -4.06158447265625, -3.85400390625, -3.64642333984375, -3.4388427734375, -3.23126220703125, -3.023681640625, -2.81610107421875, -2.6085205078125, -2.40093994140625, -2.193359375, -1.98577880859375, -1.7781982421875, -1.57061767578125, -1.363037109375, -1.15545654296875, -0.9478759765625, -0.74029541015625, -0.53271484375, -0.32513427734375, -0.1175537109375, 0.09002685546875, 0.297607421875, 0.50518798828125, 0.7127685546875, 0.92034912109375, 1.1279296875, 1.33551025390625, 1.5430908203125, 1.75067138671875, 1.958251953125, 2.16583251953125, 2.3734130859375, 2.58099365234375, 2.78857421875, 2.99615478515625, 3.2037353515625, 3.41131591796875, 3.618896484375, 3.82647705078125, 4.0340576171875, 4.24163818359375, 4.44921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 8.0, 10.0, 16.0, 30.0, 22.0, 45.0, 76.0, 95.0, 134.0, 196.0, 346.0, 518.0, 1016.0, 2275.0, 8353.0, 51497.0, 656672.0, 286333.0, 31176.0, 5762.0, 1758.0, 836.0, 482.0, 289.0, 187.0, 124.0, 80.0, 68.0, 39.0, 29.0, 24.0, 18.0, 6.0, 10.0, 3.0, 3.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7734375, -10.412841796875, -10.05224609375, -9.691650390625, -9.3310546875, -8.970458984375, -8.60986328125, -8.249267578125, -7.888671875, -7.528076171875, -7.16748046875, -6.806884765625, -6.4462890625, -6.085693359375, -5.72509765625, -5.364501953125, -5.00390625, -4.643310546875, -4.28271484375, -3.922119140625, -3.5615234375, -3.200927734375, -2.84033203125, -2.479736328125, -2.119140625, -1.758544921875, -1.39794921875, -1.037353515625, -0.6767578125, -0.316162109375, 0.04443359375, 0.405029296875, 0.765625, 1.126220703125, 1.48681640625, 1.847412109375, 2.2080078125, 2.568603515625, 2.92919921875, 3.289794921875, 3.650390625, 4.010986328125, 4.37158203125, 4.732177734375, 5.0927734375, 5.453369140625, 5.81396484375, 6.174560546875, 6.53515625, 6.895751953125, 7.25634765625, 7.616943359375, 7.9775390625, 8.338134765625, 8.69873046875, 9.059326171875, 9.419921875, 9.780517578125, 10.14111328125, 10.501708984375, 10.8623046875, 11.222900390625, 11.58349609375, 11.944091796875, 12.3046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 7.0, 11.0, 13.0, 12.0, 8.0, 15.0, 23.0, 21.0, 32.0, 30.0, 34.0, 30.0, 42.0, 39.0, 50.0, 50.0, 53.0, 48.0, 60.0, 46.0, 40.0, 42.0, 37.0, 29.0, 36.0, 19.0, 31.0, 18.0, 19.0, 14.0, 17.0, 17.0, 7.0, 11.0, 2.0, 10.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.6875, -12.2603759765625, -11.833251953125, -11.4061279296875, -10.97900390625, -10.5518798828125, -10.124755859375, -9.6976318359375, -9.2705078125, -8.8433837890625, -8.416259765625, -7.9891357421875, -7.56201171875, -7.1348876953125, -6.707763671875, -6.2806396484375, -5.853515625, -5.4263916015625, -4.999267578125, -4.5721435546875, -4.14501953125, -3.7178955078125, -3.290771484375, -2.8636474609375, -2.4365234375, -2.0093994140625, -1.582275390625, -1.1551513671875, -0.72802734375, -0.3009033203125, 0.126220703125, 0.5533447265625, 0.98046875, 1.4075927734375, 1.834716796875, 2.2618408203125, 2.68896484375, 3.1160888671875, 3.543212890625, 3.9703369140625, 4.3974609375, 4.8245849609375, 5.251708984375, 5.6788330078125, 6.10595703125, 6.5330810546875, 6.960205078125, 7.3873291015625, 7.814453125, 8.2415771484375, 8.668701171875, 9.0958251953125, 9.52294921875, 9.9500732421875, 10.377197265625, 10.8043212890625, 11.2314453125, 11.6585693359375, 12.085693359375, 12.5128173828125, 12.93994140625, 13.3670654296875, 13.794189453125, 14.2213134765625, 14.6484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 14.0, 25.0, 46.0, 82.0, 154.0, 323.0, 838.0, 2632.0, 10298.0, 62366.0, 799070.0, 147587.0, 18748.0, 4273.0, 1247.0, 415.0, 175.0, 97.0, 56.0, 30.0, 19.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.756439208984375, -3.63787841796875, -3.519317626953125, -3.4007568359375, -3.282196044921875, -3.16363525390625, -3.045074462890625, -2.926513671875, -2.807952880859375, -2.68939208984375, -2.570831298828125, -2.4522705078125, -2.333709716796875, -2.21514892578125, -2.096588134765625, -1.97802734375, -1.859466552734375, -1.74090576171875, -1.622344970703125, -1.5037841796875, -1.385223388671875, -1.26666259765625, -1.148101806640625, -1.029541015625, -0.910980224609375, -0.79241943359375, -0.673858642578125, -0.5552978515625, -0.436737060546875, -0.31817626953125, -0.199615478515625, -0.0810546875, 0.037506103515625, 0.15606689453125, 0.274627685546875, 0.3931884765625, 0.511749267578125, 0.63031005859375, 0.748870849609375, 0.867431640625, 0.985992431640625, 1.10455322265625, 1.223114013671875, 1.3416748046875, 1.460235595703125, 1.57879638671875, 1.697357177734375, 1.81591796875, 1.934478759765625, 2.05303955078125, 2.171600341796875, 2.2901611328125, 2.408721923828125, 2.52728271484375, 2.645843505859375, 2.764404296875, 2.882965087890625, 3.00152587890625, 3.120086669921875, 3.2386474609375, 3.357208251953125, 3.47576904296875, 3.594329833984375, 3.712890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 1.0, 3.0, 7.0, 5.0, 7.0, 9.0, 10.0, 9.0, 21.0, 22.0, 37.0, 44.0, 67.0, 95.0, 121.0, 129.0, 104.0, 73.0, 54.0, 39.0, 31.0, 15.0, 14.0, 17.0, 10.0, 8.0, 6.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0006160736083984375, -0.0005994811654090881, -0.0005828887224197388, -0.0005662962794303894, -0.00054970383644104, -0.0005331113934516907, -0.0005165189504623413, -0.0004999265074729919, -0.0004833340644836426, -0.0004667416214942932, -0.00045014917850494385, -0.0004335567355155945, -0.0004169642925262451, -0.00040037184953689575, -0.0003837794065475464, -0.000367186963558197, -0.00035059452056884766, -0.0003340020775794983, -0.0003174096345901489, -0.00030081719160079956, -0.0002842247486114502, -0.00026763230562210083, -0.00025103986263275146, -0.0002344474196434021, -0.00021785497665405273, -0.00020126253366470337, -0.000184670090675354, -0.00016807764768600464, -0.00015148520469665527, -0.0001348927617073059, -0.00011830031871795654, -0.00010170787572860718, -8.511543273925781e-05, -6.852298974990845e-05, -5.193054676055908e-05, -3.533810377120972e-05, -1.874566078186035e-05, -2.1532177925109863e-06, 1.4439225196838379e-05, 3.1031668186187744e-05, 4.762411117553711e-05, 6.421655416488647e-05, 8.080899715423584e-05, 9.74014401435852e-05, 0.00011399388313293457, 0.00013058632612228394, 0.0001471787691116333, 0.00016377121210098267, 0.00018036365509033203, 0.0001969560980796814, 0.00021354854106903076, 0.00023014098405838013, 0.0002467334270477295, 0.00026332587003707886, 0.0002799183130264282, 0.0002965107560157776, 0.00031310319900512695, 0.0003296956419944763, 0.0003462880849838257, 0.00036288052797317505, 0.0003794729709625244, 0.0003960654139518738, 0.00041265785694122314, 0.0004292502999305725, 0.0004458427429199219]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 7.0, 8.0, 12.0, 16.0, 26.0, 31.0, 35.0, 42.0, 81.0, 120.0, 178.0, 334.0, 519.0, 957.0, 2080.0, 4775.0, 13461.0, 45773.0, 232404.0, 634621.0, 79587.0, 20859.0, 6967.0, 2745.0, 1224.0, 673.0, 380.0, 221.0, 131.0, 101.0, 53.0, 34.0, 23.0, 24.0, 16.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.4871826171875, -2.409912109375, -2.3326416015625, -2.25537109375, -2.1781005859375, -2.100830078125, -2.0235595703125, -1.9462890625, -1.8690185546875, -1.791748046875, -1.7144775390625, -1.63720703125, -1.5599365234375, -1.482666015625, -1.4053955078125, -1.328125, -1.2508544921875, -1.173583984375, -1.0963134765625, -1.01904296875, -0.9417724609375, -0.864501953125, -0.7872314453125, -0.7099609375, -0.6326904296875, -0.555419921875, -0.4781494140625, -0.40087890625, -0.3236083984375, -0.246337890625, -0.1690673828125, -0.091796875, -0.0145263671875, 0.062744140625, 0.1400146484375, 0.21728515625, 0.2945556640625, 0.371826171875, 0.4490966796875, 0.5263671875, 0.6036376953125, 0.680908203125, 0.7581787109375, 0.83544921875, 0.9127197265625, 0.989990234375, 1.0672607421875, 1.14453125, 1.2218017578125, 1.299072265625, 1.3763427734375, 1.45361328125, 1.5308837890625, 1.608154296875, 1.6854248046875, 1.7626953125, 1.8399658203125, 1.917236328125, 1.9945068359375, 2.07177734375, 2.1490478515625, 2.226318359375, 2.3035888671875, 2.380859375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 9.0, 8.0, 2.0, 6.0, 6.0, 5.0, 10.0, 12.0, 8.0, 15.0, 21.0, 20.0, 26.0, 41.0, 37.0, 49.0, 65.0, 60.0, 72.0, 68.0, 83.0, 65.0, 53.0, 45.0, 44.0, 25.0, 26.0, 18.0, 11.0, 11.0, 17.0, 5.0, 12.0, 10.0, 6.0, 3.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.05078125, -1.987091064453125, -1.92340087890625, -1.859710693359375, -1.7960205078125, -1.732330322265625, -1.66864013671875, -1.604949951171875, -1.541259765625, -1.477569580078125, -1.41387939453125, -1.350189208984375, -1.2864990234375, -1.222808837890625, -1.15911865234375, -1.095428466796875, -1.03173828125, -0.968048095703125, -0.90435791015625, -0.840667724609375, -0.7769775390625, -0.713287353515625, -0.64959716796875, -0.585906982421875, -0.522216796875, -0.458526611328125, -0.39483642578125, -0.331146240234375, -0.2674560546875, -0.203765869140625, -0.14007568359375, -0.076385498046875, -0.0126953125, 0.050994873046875, 0.11468505859375, 0.178375244140625, 0.2420654296875, 0.305755615234375, 0.36944580078125, 0.433135986328125, 0.496826171875, 0.560516357421875, 0.62420654296875, 0.687896728515625, 0.7515869140625, 0.815277099609375, 0.87896728515625, 0.942657470703125, 1.00634765625, 1.070037841796875, 1.13372802734375, 1.197418212890625, 1.2611083984375, 1.324798583984375, 1.38848876953125, 1.452178955078125, 1.515869140625, 1.579559326171875, 1.64324951171875, 1.706939697265625, 1.7706298828125, 1.834320068359375, 1.89801025390625, 1.961700439453125, 2.025390625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 16.0, 39.0, 108.0, 336.0, 374.0, 83.0, 21.0, 8.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.59498596191406, -189.19638061523438, -184.79779052734375, -180.39918518066406, -176.00059509277344, -171.60198974609375, -167.20339965820312, -162.80479431152344, -158.40618896484375, -154.00758361816406, -149.60899353027344, -145.21038818359375, -140.81179809570312, -136.41319274902344, -132.01458740234375, -127.61599731445312, -123.21739959716797, -118.81880187988281, -114.42020416259766, -110.0216064453125, -105.62300109863281, -101.22440338134766, -96.8258056640625, -92.42720794677734, -88.02861022949219, -83.63001251220703, -79.23141479492188, -74.83280944824219, -70.43421173095703, -66.03561401367188, -61.63701629638672, -57.23841857910156, -52.839813232421875, -48.44121551513672, -44.0426139831543, -39.64401626586914, -35.24541473388672, -30.846817016601562, -26.448219299316406, -22.049619674682617, -17.651020050048828, -13.252420425415039, -8.853821754455566, -4.455223083496094, -0.05662345886230469, 4.341976165771484, 8.74057388305664, 13.13917350769043, 17.53777313232422, 21.936372756958008, 26.334972381591797, 30.733570098876953, 35.132171630859375, 39.53076934814453, 43.92936706542969, 48.327964782714844, 52.726566314697266, 57.12516403198242, 61.523765563964844, 65.92236328125, 70.32096099853516, 74.71955871582031, 79.1181640625, 83.51676177978516, 87.91535949707031]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 6.0, 5.0, 8.0, 7.0, 5.0, 11.0, 13.0, 22.0, 19.0, 14.0, 26.0, 19.0, 30.0, 24.0, 40.0, 38.0, 59.0, 70.0, 94.0, 85.0, 56.0, 51.0, 22.0, 36.0, 28.0, 29.0, 30.0, 32.0, 19.0, 21.0, 13.0, 14.0, 9.0, 13.0, 12.0, 3.0, 9.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.802303314208984, -50.22300338745117, -48.643699645996094, -47.06439971923828, -45.48509979248047, -43.90579605102539, -42.32649612426758, -40.7471923828125, -39.16789245605469, -37.588592529296875, -36.0092887878418, -34.429988861083984, -32.850685119628906, -31.271385192871094, -29.69208526611328, -28.112783432006836, -26.53348159790039, -24.954179763793945, -23.3748779296875, -21.795578002929688, -20.216276168823242, -18.636974334716797, -17.057674407958984, -15.478372573852539, -13.899070739746094, -12.319768905639648, -10.74046802520752, -9.16116714477539, -7.581865310668945, -6.002563953399658, -4.423262596130371, -2.843961715698242, -1.2646560668945312, 0.31464529037475586, 1.893946647644043, 3.47324800491333, 5.052549362182617, 6.631850719451904, 8.211152076721191, 9.79045295715332, 11.369754791259766, 12.949056625366211, 14.52835750579834, 16.10765838623047, 17.686960220336914, 19.26626205444336, 20.845561981201172, 22.424863815307617, 24.004165649414062, 25.583467483520508, 27.162769317626953, 28.742069244384766, 30.32137107849121, 31.900672912597656, 33.47997283935547, 35.05927276611328, 36.63857650756836, 38.21787643432617, 39.79718017578125, 41.37648010253906, 42.955780029296875, 44.53508377075195, 46.114383697509766, 47.693687438964844, 49.272987365722656]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 9.0, 7.0, 10.0, 12.0, 10.0, 25.0, 30.0, 44.0, 74.0, 113.0, 172.0, 286.0, 490.0, 954.0, 2095.0, 5604.0, 21438.0, 143678.0, 1500774.0, 2238133.0, 234199.0, 32318.0, 8361.0, 2934.0, 1176.0, 562.0, 322.0, 159.0, 99.0, 61.0, 42.0, 31.0, 11.0, 13.0, 12.0, 6.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.83270263671875, -6.6263427734375, -6.41998291015625, -6.213623046875, -6.00726318359375, -5.8009033203125, -5.59454345703125, -5.38818359375, -5.18182373046875, -4.9754638671875, -4.76910400390625, -4.562744140625, -4.35638427734375, -4.1500244140625, -3.94366455078125, -3.7373046875, -3.53094482421875, -3.3245849609375, -3.11822509765625, -2.911865234375, -2.70550537109375, -2.4991455078125, -2.29278564453125, -2.08642578125, -1.88006591796875, -1.6737060546875, -1.46734619140625, -1.260986328125, -1.05462646484375, -0.8482666015625, -0.64190673828125, -0.435546875, -0.22918701171875, -0.0228271484375, 0.18353271484375, 0.389892578125, 0.59625244140625, 0.8026123046875, 1.00897216796875, 1.21533203125, 1.42169189453125, 1.6280517578125, 1.83441162109375, 2.040771484375, 2.24713134765625, 2.4534912109375, 2.65985107421875, 2.8662109375, 3.07257080078125, 3.2789306640625, 3.48529052734375, 3.691650390625, 3.89801025390625, 4.1043701171875, 4.31072998046875, 4.51708984375, 4.72344970703125, 4.9298095703125, 5.13616943359375, 5.342529296875, 5.54888916015625, 5.7552490234375, 5.96160888671875, 6.16796875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 13.0, 8.0, 22.0, 23.0, 26.0, 34.0, 49.0, 42.0, 62.0, 81.0, 66.0, 78.0, 71.0, 61.0, 72.0, 50.0, 55.0, 39.0, 33.0, 31.0, 22.0, 21.0, 8.0, 6.0, 7.0, 3.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-8.453125, -8.255859375, -8.05859375, -7.861328125, -7.6640625, -7.466796875, -7.26953125, -7.072265625, -6.875, -6.677734375, -6.48046875, -6.283203125, -6.0859375, -5.888671875, -5.69140625, -5.494140625, -5.296875, -5.099609375, -4.90234375, -4.705078125, -4.5078125, -4.310546875, -4.11328125, -3.916015625, -3.71875, -3.521484375, -3.32421875, -3.126953125, -2.9296875, -2.732421875, -2.53515625, -2.337890625, -2.140625, -1.943359375, -1.74609375, -1.548828125, -1.3515625, -1.154296875, -0.95703125, -0.759765625, -0.5625, -0.365234375, -0.16796875, 0.029296875, 0.2265625, 0.423828125, 0.62109375, 0.818359375, 1.015625, 1.212890625, 1.41015625, 1.607421875, 1.8046875, 2.001953125, 2.19921875, 2.396484375, 2.59375, 2.791015625, 2.98828125, 3.185546875, 3.3828125, 3.580078125, 3.77734375, 3.974609375, 4.171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 16.0, 19.0, 25.0, 38.0, 46.0, 98.0, 130.0, 264.0, 629.0, 1792.0, 8511.0, 74198.0, 2603635.0, 1446718.0, 49013.0, 6493.0, 1476.0, 538.0, 226.0, 152.0, 79.0, 39.0, 35.0, 26.0, 16.0, 15.0, 7.0, 3.0, 6.0, 5.0, 2.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7109375, -8.4197998046875, -8.128662109375, -7.8375244140625, -7.54638671875, -7.2552490234375, -6.964111328125, -6.6729736328125, -6.3818359375, -6.0906982421875, -5.799560546875, -5.5084228515625, -5.21728515625, -4.9261474609375, -4.635009765625, -4.3438720703125, -4.052734375, -3.7615966796875, -3.470458984375, -3.1793212890625, -2.88818359375, -2.5970458984375, -2.305908203125, -2.0147705078125, -1.7236328125, -1.4324951171875, -1.141357421875, -0.8502197265625, -0.55908203125, -0.2679443359375, 0.023193359375, 0.3143310546875, 0.60546875, 0.8966064453125, 1.187744140625, 1.4788818359375, 1.77001953125, 2.0611572265625, 2.352294921875, 2.6434326171875, 2.9345703125, 3.2257080078125, 3.516845703125, 3.8079833984375, 4.09912109375, 4.3902587890625, 4.681396484375, 4.9725341796875, 5.263671875, 5.5548095703125, 5.845947265625, 6.1370849609375, 6.42822265625, 6.7193603515625, 7.010498046875, 7.3016357421875, 7.5927734375, 7.8839111328125, 8.175048828125, 8.4661865234375, 8.75732421875, 9.0484619140625, 9.339599609375, 9.6307373046875, 9.921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 7.0, 8.0, 19.0, 13.0, 15.0, 36.0, 58.0, 66.0, 95.0, 157.0, 225.0, 311.0, 481.0, 601.0, 600.0, 459.0, 291.0, 199.0, 135.0, 71.0, 71.0, 41.0, 27.0, 16.0, 22.0, 8.0, 6.0, 7.0, 7.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0859375, -6.86431884765625, -6.6427001953125, -6.42108154296875, -6.199462890625, -5.97784423828125, -5.7562255859375, -5.53460693359375, -5.31298828125, -5.09136962890625, -4.8697509765625, -4.64813232421875, -4.426513671875, -4.20489501953125, -3.9832763671875, -3.76165771484375, -3.5400390625, -3.31842041015625, -3.0968017578125, -2.87518310546875, -2.653564453125, -2.43194580078125, -2.2103271484375, -1.98870849609375, -1.76708984375, -1.54547119140625, -1.3238525390625, -1.10223388671875, -0.880615234375, -0.65899658203125, -0.4373779296875, -0.21575927734375, 0.005859375, 0.22747802734375, 0.4490966796875, 0.67071533203125, 0.892333984375, 1.11395263671875, 1.3355712890625, 1.55718994140625, 1.77880859375, 2.00042724609375, 2.2220458984375, 2.44366455078125, 2.665283203125, 2.88690185546875, 3.1085205078125, 3.33013916015625, 3.5517578125, 3.77337646484375, 3.9949951171875, 4.21661376953125, 4.438232421875, 4.65985107421875, 4.8814697265625, 5.10308837890625, 5.32470703125, 5.54632568359375, 5.7679443359375, 5.98956298828125, 6.211181640625, 6.43280029296875, 6.6544189453125, 6.87603759765625, 7.09765625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 5.0, 9.0, 24.0, 30.0, 70.0, 105.0, 158.0, 185.0, 154.0, 105.0, 66.0, 25.0, 27.0, 10.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.9650764465332, -49.999420166015625, -48.03376007080078, -46.06809997558594, -44.10244369506836, -42.13678741455078, -40.17112731933594, -38.205467224121094, -36.239810943603516, -34.27415466308594, -32.308494567871094, -30.342836380004883, -28.377178192138672, -26.41152000427246, -24.44586181640625, -22.48020362854004, -20.514545440673828, -18.548887252807617, -16.583229064941406, -14.617570877075195, -12.651912689208984, -10.686254501342773, -8.720596313476562, -6.754938125610352, -4.789279937744141, -2.8236217498779297, -0.8579635620117188, 1.1076946258544922, 3.073352813720703, 5.039011001586914, 7.004669189453125, 8.970327377319336, 10.935989379882812, 12.901647567749023, 14.867305755615234, 16.832963943481445, 18.798622131347656, 20.764280319213867, 22.729938507080078, 24.69559669494629, 26.6612548828125, 28.62691307067871, 30.592571258544922, 32.5582275390625, 34.523887634277344, 36.48954772949219, 38.455204010009766, 40.420860290527344, 42.38652038574219, 44.35218048095703, 46.31783676147461, 48.28349304199219, 50.24915313720703, 52.214813232421875, 54.18046951293945, 56.14612579345703, 58.111785888671875, 60.07744598388672, 62.0431022644043, 64.00875854492188, 65.97441864013672, 67.94007873535156, 69.90573120117188, 71.87139129638672, 73.83705139160156]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 9.0, 6.0, 12.0, 5.0, 11.0, 19.0, 15.0, 21.0, 23.0, 41.0, 40.0, 38.0, 49.0, 51.0, 57.0, 49.0, 45.0, 47.0, 43.0, 51.0, 41.0, 40.0, 46.0, 36.0, 41.0, 25.0, 25.0, 13.0, 19.0, 7.0, 11.0, 8.0, 9.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.63080406188965, -30.558277130126953, -29.48575210571289, -28.413225173950195, -27.3406982421875, -26.268171310424805, -25.19564437866211, -24.123119354248047, -23.05059242248535, -21.978065490722656, -20.905540466308594, -19.8330135345459, -18.760486602783203, -17.687959671020508, -16.615432739257812, -15.54290771484375, -14.470380783081055, -13.39785385131836, -12.32532787322998, -11.252801895141602, -10.180274963378906, -9.107748031616211, -8.035222053527832, -6.962695598602295, -5.890169143676758, -4.817642688751221, -3.7451162338256836, -2.6725897789001465, -1.6000633239746094, -0.5275368690490723, 0.5449895858764648, 1.617516040802002, 2.6900405883789062, 3.7625670433044434, 4.8350934982299805, 5.907619953155518, 6.980146408081055, 8.05267333984375, 9.125199317932129, 10.197725296020508, 11.270252227783203, 12.342779159545898, 13.415305137634277, 14.487831115722656, 15.560358047485352, 16.632884979248047, 17.70541000366211, 18.777936935424805, 19.8504638671875, 20.922990798950195, 21.99551773071289, 23.068042755126953, 24.14056968688965, 25.213096618652344, 26.285621643066406, 27.3581485748291, 28.430675506591797, 29.503202438354492, 30.575729370117188, 31.64825439453125, 32.72077941894531, 33.79330825805664, 34.8658332824707, 35.93836212158203, 37.010887145996094]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 8.0, 8.0, 3.0, 8.0, 8.0, 26.0, 26.0, 40.0, 56.0, 99.0, 179.0, 266.0, 512.0, 941.0, 1824.0, 4002.0, 9735.0, 27008.0, 87006.0, 321107.0, 416995.0, 120661.0, 35827.0, 12494.0, 5016.0, 2157.0, 1111.0, 552.0, 321.0, 185.0, 131.0, 81.0, 60.0, 32.0, 19.0, 15.0, 7.0, 12.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-6.7578125, -6.53350830078125, -6.3092041015625, -6.08489990234375, -5.860595703125, -5.63629150390625, -5.4119873046875, -5.18768310546875, -4.96337890625, -4.73907470703125, -4.5147705078125, -4.29046630859375, -4.066162109375, -3.84185791015625, -3.6175537109375, -3.39324951171875, -3.1689453125, -2.94464111328125, -2.7203369140625, -2.49603271484375, -2.271728515625, -2.04742431640625, -1.8231201171875, -1.59881591796875, -1.37451171875, -1.15020751953125, -0.9259033203125, -0.70159912109375, -0.477294921875, -0.25299072265625, -0.0286865234375, 0.19561767578125, 0.419921875, 0.64422607421875, 0.8685302734375, 1.09283447265625, 1.317138671875, 1.54144287109375, 1.7657470703125, 1.99005126953125, 2.21435546875, 2.43865966796875, 2.6629638671875, 2.88726806640625, 3.111572265625, 3.33587646484375, 3.5601806640625, 3.78448486328125, 4.0087890625, 4.23309326171875, 4.4573974609375, 4.68170166015625, 4.906005859375, 5.13031005859375, 5.3546142578125, 5.57891845703125, 5.80322265625, 6.02752685546875, 6.2518310546875, 6.47613525390625, 6.700439453125, 6.92474365234375, 7.1490478515625, 7.37335205078125, 7.59765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 11.0, 13.0, 15.0, 26.0, 15.0, 30.0, 42.0, 52.0, 65.0, 77.0, 73.0, 59.0, 67.0, 70.0, 70.0, 53.0, 42.0, 42.0, 48.0, 34.0, 27.0, 21.0, 12.0, 7.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-8.5546875, -8.3568115234375, -8.158935546875, -7.9610595703125, -7.76318359375, -7.5653076171875, -7.367431640625, -7.1695556640625, -6.9716796875, -6.7738037109375, -6.575927734375, -6.3780517578125, -6.18017578125, -5.9822998046875, -5.784423828125, -5.5865478515625, -5.388671875, -5.1907958984375, -4.992919921875, -4.7950439453125, -4.59716796875, -4.3992919921875, -4.201416015625, -4.0035400390625, -3.8056640625, -3.6077880859375, -3.409912109375, -3.2120361328125, -3.01416015625, -2.8162841796875, -2.618408203125, -2.4205322265625, -2.22265625, -2.0247802734375, -1.826904296875, -1.6290283203125, -1.43115234375, -1.2332763671875, -1.035400390625, -0.8375244140625, -0.6396484375, -0.4417724609375, -0.243896484375, -0.0460205078125, 0.15185546875, 0.3497314453125, 0.547607421875, 0.7454833984375, 0.943359375, 1.1412353515625, 1.339111328125, 1.5369873046875, 1.73486328125, 1.9327392578125, 2.130615234375, 2.3284912109375, 2.5263671875, 2.7242431640625, 2.922119140625, 3.1199951171875, 3.31787109375, 3.5157470703125, 3.713623046875, 3.9114990234375, 4.109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 3.0, 7.0, 21.0, 13.0, 13.0, 23.0, 18.0, 42.0, 68.0, 87.0, 112.0, 149.0, 230.0, 307.0, 419.0, 671.0, 1192.0, 2527.0, 8969.0, 63071.0, 826920.0, 123144.0, 13334.0, 3358.0, 1392.0, 782.0, 474.0, 324.0, 239.0, 174.0, 130.0, 96.0, 63.0, 38.0, 42.0, 25.0, 14.0, 14.0, 9.0, 4.0, 10.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.125, -11.7291259765625, -11.333251953125, -10.9373779296875, -10.54150390625, -10.1456298828125, -9.749755859375, -9.3538818359375, -8.9580078125, -8.5621337890625, -8.166259765625, -7.7703857421875, -7.37451171875, -6.9786376953125, -6.582763671875, -6.1868896484375, -5.791015625, -5.3951416015625, -4.999267578125, -4.6033935546875, -4.20751953125, -3.8116455078125, -3.415771484375, -3.0198974609375, -2.6240234375, -2.2281494140625, -1.832275390625, -1.4364013671875, -1.04052734375, -0.6446533203125, -0.248779296875, 0.1470947265625, 0.54296875, 0.9388427734375, 1.334716796875, 1.7305908203125, 2.12646484375, 2.5223388671875, 2.918212890625, 3.3140869140625, 3.7099609375, 4.1058349609375, 4.501708984375, 4.8975830078125, 5.29345703125, 5.6893310546875, 6.085205078125, 6.4810791015625, 6.876953125, 7.2728271484375, 7.668701171875, 8.0645751953125, 8.46044921875, 8.8563232421875, 9.252197265625, 9.6480712890625, 10.0439453125, 10.4398193359375, 10.835693359375, 11.2315673828125, 11.62744140625, 12.0233154296875, 12.419189453125, 12.8150634765625, 13.2109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 4.0, 6.0, 9.0, 8.0, 15.0, 17.0, 16.0, 24.0, 33.0, 19.0, 31.0, 34.0, 44.0, 46.0, 56.0, 57.0, 47.0, 52.0, 39.0, 51.0, 54.0, 49.0, 37.0, 28.0, 28.0, 36.0, 26.0, 26.0, 21.0, 13.0, 22.0, 12.0, 11.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.0234375, -14.5323486328125, -14.041259765625, -13.5501708984375, -13.05908203125, -12.5679931640625, -12.076904296875, -11.5858154296875, -11.0947265625, -10.6036376953125, -10.112548828125, -9.6214599609375, -9.13037109375, -8.6392822265625, -8.148193359375, -7.6571044921875, -7.166015625, -6.6749267578125, -6.183837890625, -5.6927490234375, -5.20166015625, -4.7105712890625, -4.219482421875, -3.7283935546875, -3.2373046875, -2.7462158203125, -2.255126953125, -1.7640380859375, -1.27294921875, -0.7818603515625, -0.290771484375, 0.2003173828125, 0.69140625, 1.1824951171875, 1.673583984375, 2.1646728515625, 2.65576171875, 3.1468505859375, 3.637939453125, 4.1290283203125, 4.6201171875, 5.1112060546875, 5.602294921875, 6.0933837890625, 6.58447265625, 7.0755615234375, 7.566650390625, 8.0577392578125, 8.548828125, 9.0399169921875, 9.531005859375, 10.0220947265625, 10.51318359375, 11.0042724609375, 11.495361328125, 11.9864501953125, 12.4775390625, 12.9686279296875, 13.459716796875, 13.9508056640625, 14.44189453125, 14.9329833984375, 15.424072265625, 15.9151611328125, 16.40625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 8.0, 9.0, 12.0, 11.0, 20.0, 20.0, 24.0, 30.0, 40.0, 49.0, 76.0, 102.0, 146.0, 315.0, 775.0, 2271.0, 9453.0, 135916.0, 868476.0, 24448.0, 4030.0, 1176.0, 469.0, 216.0, 139.0, 61.0, 58.0, 42.0, 33.0, 28.0, 15.0, 13.0, 12.0, 14.0, 6.0, 10.0, 3.0, 5.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.87890625, -4.740386962890625, -4.60186767578125, -4.463348388671875, -4.3248291015625, -4.186309814453125, -4.04779052734375, -3.909271240234375, -3.770751953125, -3.632232666015625, -3.49371337890625, -3.355194091796875, -3.2166748046875, -3.078155517578125, -2.93963623046875, -2.801116943359375, -2.66259765625, -2.524078369140625, -2.38555908203125, -2.247039794921875, -2.1085205078125, -1.970001220703125, -1.83148193359375, -1.692962646484375, -1.554443359375, -1.415924072265625, -1.27740478515625, -1.138885498046875, -1.0003662109375, -0.861846923828125, -0.72332763671875, -0.584808349609375, -0.4462890625, -0.307769775390625, -0.16925048828125, -0.030731201171875, 0.1077880859375, 0.246307373046875, 0.38482666015625, 0.523345947265625, 0.661865234375, 0.800384521484375, 0.93890380859375, 1.077423095703125, 1.2159423828125, 1.354461669921875, 1.49298095703125, 1.631500244140625, 1.77001953125, 1.908538818359375, 2.04705810546875, 2.185577392578125, 2.3240966796875, 2.462615966796875, 2.60113525390625, 2.739654541015625, 2.878173828125, 3.016693115234375, 3.15521240234375, 3.293731689453125, 3.4322509765625, 3.570770263671875, 3.70928955078125, 3.847808837890625, 3.986328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 10.0, 8.0, 15.0, 15.0, 30.0, 63.0, 100.0, 163.0, 194.0, 149.0, 92.0, 55.0, 31.0, 12.0, 10.0, 7.0, 5.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0010166168212890625, -0.0009894296526908875, -0.0009622424840927124, -0.0009350553154945374, -0.0009078681468963623, -0.0008806809782981873, -0.0008534938097000122, -0.0008263066411018372, -0.0007991194725036621, -0.0007719323039054871, -0.000744745135307312, -0.000717557966709137, -0.0006903707981109619, -0.0006631836295127869, -0.0006359964609146118, -0.0006088092923164368, -0.0005816221237182617, -0.0005544349551200867, -0.0005272477865219116, -0.0005000606179237366, -0.0004728734493255615, -0.0004456862807273865, -0.0004184991121292114, -0.0003913119435310364, -0.00036412477493286133, -0.0003369376063346863, -0.00030975043773651123, -0.0002825632691383362, -0.00025537610054016113, -0.00022818893194198608, -0.00020100176334381104, -0.00017381459474563599, -0.00014662742614746094, -0.00011944025754928589, -9.225308895111084e-05, -6.506592035293579e-05, -3.787875175476074e-05, -1.0691583156585693e-05, 1.6495585441589355e-05, 4.3682754039764404e-05, 7.086992263793945e-05, 9.80570912361145e-05, 0.00012524425983428955, 0.0001524314284324646, 0.00017961859703063965, 0.0002068057656288147, 0.00023399293422698975, 0.0002611801028251648, 0.00028836727142333984, 0.0003155544400215149, 0.00034274160861968994, 0.000369928777217865, 0.00039711594581604004, 0.0004243031144142151, 0.00045149028301239014, 0.0004786774516105652, 0.0005058646202087402, 0.0005330517888069153, 0.0005602389574050903, 0.0005874261260032654, 0.0006146132946014404, 0.0006418004631996155, 0.0006689876317977905, 0.0006961748003959656, 0.0007233619689941406]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 9.0, 11.0, 9.0, 22.0, 17.0, 33.0, 48.0, 53.0, 84.0, 129.0, 207.0, 323.0, 535.0, 964.0, 1950.0, 4249.0, 11417.0, 50936.0, 712877.0, 221821.0, 27961.0, 7901.0, 3359.0, 1595.0, 786.0, 451.0, 252.0, 168.0, 118.0, 68.0, 46.0, 39.0, 34.0, 15.0, 18.0, 16.0, 12.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.701171875, -2.623626708984375, -2.54608154296875, -2.468536376953125, -2.3909912109375, -2.313446044921875, -2.23590087890625, -2.158355712890625, -2.080810546875, -2.003265380859375, -1.92572021484375, -1.848175048828125, -1.7706298828125, -1.693084716796875, -1.61553955078125, -1.537994384765625, -1.46044921875, -1.382904052734375, -1.30535888671875, -1.227813720703125, -1.1502685546875, -1.072723388671875, -0.99517822265625, -0.917633056640625, -0.840087890625, -0.762542724609375, -0.68499755859375, -0.607452392578125, -0.5299072265625, -0.452362060546875, -0.37481689453125, -0.297271728515625, -0.2197265625, -0.142181396484375, -0.06463623046875, 0.012908935546875, 0.0904541015625, 0.167999267578125, 0.24554443359375, 0.323089599609375, 0.400634765625, 0.478179931640625, 0.55572509765625, 0.633270263671875, 0.7108154296875, 0.788360595703125, 0.86590576171875, 0.943450927734375, 1.02099609375, 1.098541259765625, 1.17608642578125, 1.253631591796875, 1.3311767578125, 1.408721923828125, 1.48626708984375, 1.563812255859375, 1.641357421875, 1.718902587890625, 1.79644775390625, 1.873992919921875, 1.9515380859375, 2.029083251953125, 2.10662841796875, 2.184173583984375, 2.26171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 10.0, 7.0, 18.0, 16.0, 22.0, 14.0, 23.0, 49.0, 40.0, 70.0, 80.0, 67.0, 92.0, 75.0, 72.0, 65.0, 54.0, 29.0, 44.0, 26.0, 21.0, 15.0, 14.0, 11.0, 8.0, 10.0, 4.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3828125, -2.3148193359375, -2.246826171875, -2.1788330078125, -2.11083984375, -2.0428466796875, -1.974853515625, -1.9068603515625, -1.8388671875, -1.7708740234375, -1.702880859375, -1.6348876953125, -1.56689453125, -1.4989013671875, -1.430908203125, -1.3629150390625, -1.294921875, -1.2269287109375, -1.158935546875, -1.0909423828125, -1.02294921875, -0.9549560546875, -0.886962890625, -0.8189697265625, -0.7509765625, -0.6829833984375, -0.614990234375, -0.5469970703125, -0.47900390625, -0.4110107421875, -0.343017578125, -0.2750244140625, -0.20703125, -0.1390380859375, -0.071044921875, -0.0030517578125, 0.06494140625, 0.1329345703125, 0.200927734375, 0.2689208984375, 0.3369140625, 0.4049072265625, 0.472900390625, 0.5408935546875, 0.60888671875, 0.6768798828125, 0.744873046875, 0.8128662109375, 0.880859375, 0.9488525390625, 1.016845703125, 1.0848388671875, 1.15283203125, 1.2208251953125, 1.288818359375, 1.3568115234375, 1.4248046875, 1.4927978515625, 1.560791015625, 1.6287841796875, 1.69677734375, 1.7647705078125, 1.832763671875, 1.9007568359375, 1.96875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 25.0, 76.0, 353.0, 440.0, 76.0, 15.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.36038208007812, -159.06854248046875, -153.7766876220703, -148.48484802246094, -143.1929931640625, -137.90115356445312, -132.60931396484375, -127.31745910644531, -122.02561950683594, -116.73377227783203, -111.44192504882812, -106.15008544921875, -100.85823822021484, -95.56639099121094, -90.27454376220703, -84.98269653320312, -79.69084930419922, -74.39900207519531, -69.1071548461914, -63.815311431884766, -58.523468017578125, -53.23162078857422, -47.93977355957031, -42.64793014526367, -37.356082916259766, -32.06423568725586, -26.77239227294922, -21.480545043945312, -16.18869972229004, -10.896854400634766, -5.605007171630859, -0.31316375732421875, 4.9786834716796875, 10.270528793334961, 15.56237506866455, 20.85422134399414, 26.146066665649414, 31.437911987304688, 36.729759216308594, 42.021602630615234, 47.31344985961914, 52.60529708862305, 57.89714050292969, 63.188987731933594, 68.4808349609375, 73.77267456054688, 79.06452941894531, 84.35636901855469, 89.6482162475586, 94.9400634765625, 100.2319107055664, 105.52375793457031, 110.81559753417969, 116.1074447631836, 121.3992919921875, 126.69113159179688, 131.9829864501953, 137.2748260498047, 142.56668090820312, 147.8585205078125, 153.15037536621094, 158.4422149658203, 163.73406982421875, 169.02590942382812, 174.3177490234375]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 8.0, 16.0, 13.0, 8.0, 12.0, 26.0, 23.0, 19.0, 26.0, 39.0, 38.0, 43.0, 67.0, 130.0, 151.0, 78.0, 61.0, 40.0, 30.0, 31.0, 19.0, 27.0, 25.0, 9.0, 17.0, 13.0, 4.0, 5.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.832786560058594, -60.748443603515625, -58.66409683227539, -56.57975387573242, -54.49540710449219, -52.41106414794922, -50.32672119140625, -48.242374420166016, -46.15802764892578, -44.07368469238281, -41.98933792114258, -39.90499496459961, -37.820648193359375, -35.736305236816406, -33.65196228027344, -31.567615509033203, -29.483272552490234, -27.398927688598633, -25.31458282470703, -23.230239868164062, -21.145893096923828, -19.06155014038086, -16.977205276489258, -14.892860412597656, -12.808515548706055, -10.724170684814453, -8.639825820922852, -6.555481910705566, -4.471137046813965, -2.3867921829223633, -0.3024482727050781, 1.7818965911865234, 3.866241455078125, 5.950586318969727, 8.034931182861328, 10.119275093078613, 12.203619956970215, 14.287964820861816, 16.3723087310791, 18.456653594970703, 20.540998458862305, 22.625343322753906, 24.709688186645508, 26.79403305053711, 28.878376007080078, 30.962722778320312, 33.04706573486328, 35.13140869140625, 37.215755462646484, 39.30009841918945, 41.38444519042969, 43.468788146972656, 45.55313491821289, 47.63747787475586, 49.721824645996094, 51.80616760253906, 53.89051055908203, 55.974853515625, 58.059200286865234, 60.1435432434082, 62.22789001464844, 64.3122329711914, 66.39657592773438, 68.48092651367188, 70.56526947021484]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 9.0, 14.0, 12.0, 26.0, 30.0, 59.0, 63.0, 142.0, 242.0, 397.0, 829.0, 1509.0, 3797.0, 11221.0, 57972.0, 502091.0, 2307601.0, 1132154.0, 141939.0, 22637.0, 6769.0, 2576.0, 1085.0, 483.0, 245.0, 137.0, 80.0, 56.0, 22.0, 23.0, 15.0, 12.0, 5.0, 12.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.316162109375, -7.08544921875, -6.854736328125, -6.6240234375, -6.393310546875, -6.16259765625, -5.931884765625, -5.701171875, -5.470458984375, -5.23974609375, -5.009033203125, -4.7783203125, -4.547607421875, -4.31689453125, -4.086181640625, -3.85546875, -3.624755859375, -3.39404296875, -3.163330078125, -2.9326171875, -2.701904296875, -2.47119140625, -2.240478515625, -2.009765625, -1.779052734375, -1.54833984375, -1.317626953125, -1.0869140625, -0.856201171875, -0.62548828125, -0.394775390625, -0.1640625, 0.066650390625, 0.29736328125, 0.528076171875, 0.7587890625, 0.989501953125, 1.22021484375, 1.450927734375, 1.681640625, 1.912353515625, 2.14306640625, 2.373779296875, 2.6044921875, 2.835205078125, 3.06591796875, 3.296630859375, 3.52734375, 3.758056640625, 3.98876953125, 4.219482421875, 4.4501953125, 4.680908203125, 4.91162109375, 5.142333984375, 5.373046875, 5.603759765625, 5.83447265625, 6.065185546875, 6.2958984375, 6.526611328125, 6.75732421875, 6.988037109375, 7.21875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 10.0, 15.0, 24.0, 31.0, 28.0, 33.0, 57.0, 60.0, 71.0, 79.0, 70.0, 62.0, 82.0, 63.0, 68.0, 57.0, 39.0, 40.0, 31.0, 30.0, 13.0, 15.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-8.5, -8.3028564453125, -8.105712890625, -7.9085693359375, -7.71142578125, -7.5142822265625, -7.317138671875, -7.1199951171875, -6.9228515625, -6.7257080078125, -6.528564453125, -6.3314208984375, -6.13427734375, -5.9371337890625, -5.739990234375, -5.5428466796875, -5.345703125, -5.1485595703125, -4.951416015625, -4.7542724609375, -4.55712890625, -4.3599853515625, -4.162841796875, -3.9656982421875, -3.7685546875, -3.5714111328125, -3.374267578125, -3.1771240234375, -2.97998046875, -2.7828369140625, -2.585693359375, -2.3885498046875, -2.19140625, -1.9942626953125, -1.797119140625, -1.5999755859375, -1.40283203125, -1.2056884765625, -1.008544921875, -0.8114013671875, -0.6142578125, -0.4171142578125, -0.219970703125, -0.0228271484375, 0.17431640625, 0.3714599609375, 0.568603515625, 0.7657470703125, 0.962890625, 1.1600341796875, 1.357177734375, 1.5543212890625, 1.75146484375, 1.9486083984375, 2.145751953125, 2.3428955078125, 2.5400390625, 2.7371826171875, 2.934326171875, 3.1314697265625, 3.32861328125, 3.5257568359375, 3.722900390625, 3.9200439453125, 4.1171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 11.0, 24.0, 21.0, 32.0, 39.0, 52.0, 77.0, 125.0, 179.0, 353.0, 600.0, 1189.0, 3061.0, 14353.0, 421605.0, 3695401.0, 47201.0, 6064.0, 1904.0, 840.0, 368.0, 268.0, 153.0, 93.0, 70.0, 44.0, 34.0, 28.0, 11.0, 16.0, 7.0, 8.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.030517578125, -16.46728515625, -15.904052734375, -15.3408203125, -14.777587890625, -14.21435546875, -13.651123046875, -13.087890625, -12.524658203125, -11.96142578125, -11.398193359375, -10.8349609375, -10.271728515625, -9.70849609375, -9.145263671875, -8.58203125, -8.018798828125, -7.45556640625, -6.892333984375, -6.3291015625, -5.765869140625, -5.20263671875, -4.639404296875, -4.076171875, -3.512939453125, -2.94970703125, -2.386474609375, -1.8232421875, -1.260009765625, -0.69677734375, -0.133544921875, 0.4296875, 0.992919921875, 1.55615234375, 2.119384765625, 2.6826171875, 3.245849609375, 3.80908203125, 4.372314453125, 4.935546875, 5.498779296875, 6.06201171875, 6.625244140625, 7.1884765625, 7.751708984375, 8.31494140625, 8.878173828125, 9.44140625, 10.004638671875, 10.56787109375, 11.131103515625, 11.6943359375, 12.257568359375, 12.82080078125, 13.384033203125, 13.947265625, 14.510498046875, 15.07373046875, 15.636962890625, 16.2001953125, 16.763427734375, 17.32666015625, 17.889892578125, 18.453125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 14.0, 3.0, 18.0, 20.0, 39.0, 59.0, 83.0, 127.0, 236.0, 384.0, 662.0, 785.0, 589.0, 406.0, 259.0, 142.0, 90.0, 50.0, 35.0, 21.0, 15.0, 10.0, 8.0, 6.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.75, -16.23486328125, -15.7197265625, -15.20458984375, -14.689453125, -14.17431640625, -13.6591796875, -13.14404296875, -12.62890625, -12.11376953125, -11.5986328125, -11.08349609375, -10.568359375, -10.05322265625, -9.5380859375, -9.02294921875, -8.5078125, -7.99267578125, -7.4775390625, -6.96240234375, -6.447265625, -5.93212890625, -5.4169921875, -4.90185546875, -4.38671875, -3.87158203125, -3.3564453125, -2.84130859375, -2.326171875, -1.81103515625, -1.2958984375, -0.78076171875, -0.265625, 0.24951171875, 0.7646484375, 1.27978515625, 1.794921875, 2.31005859375, 2.8251953125, 3.34033203125, 3.85546875, 4.37060546875, 4.8857421875, 5.40087890625, 5.916015625, 6.43115234375, 6.9462890625, 7.46142578125, 7.9765625, 8.49169921875, 9.0068359375, 9.52197265625, 10.037109375, 10.55224609375, 11.0673828125, 11.58251953125, 12.09765625, 12.61279296875, 13.1279296875, 13.64306640625, 14.158203125, 14.67333984375, 15.1884765625, 15.70361328125, 16.21875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 5.0, 12.0, 13.0, 20.0, 55.0, 110.0, 210.0, 225.0, 158.0, 93.0, 37.0, 15.0, 14.0, 9.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.91278076171875, -128.97137451171875, -124.02996063232422, -119.08854675292969, -114.14714050292969, -109.20572662353516, -104.26431274414062, -99.32290649414062, -94.38150024414062, -89.4400863647461, -84.4986801147461, -79.55726623535156, -74.61585998535156, -69.67444610595703, -64.7330322265625, -59.7916259765625, -54.85021209716797, -49.9088020324707, -44.96739196777344, -40.025978088378906, -35.084571838378906, -30.143159866333008, -25.20174789428711, -20.260337829589844, -15.318927764892578, -10.377517700195312, -5.4361066818237305, -0.49469566345214844, 4.446714401245117, 9.388124465942383, 14.329536437988281, 19.270946502685547, 24.212356567382812, 29.153766632080078, 34.095176696777344, 39.036590576171875, 43.977996826171875, 48.919410705566406, 53.86082077026367, 58.80223083496094, 63.7436408996582, 68.68505096435547, 73.62646484375, 78.56787109375, 83.50928497314453, 88.45069122314453, 93.39210510253906, 98.33351135253906, 103.2749252319336, 108.21633911132812, 113.15774536132812, 118.09915924072266, 123.04056549072266, 127.98197937011719, 132.9233856201172, 137.86480712890625, 142.80621337890625, 147.74761962890625, 152.6890411376953, 157.6304473876953, 162.5718536376953, 167.5132598876953, 172.45468139648438, 177.39608764648438, 182.33749389648438]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 8.0, 18.0, 23.0, 19.0, 24.0, 25.0, 30.0, 30.0, 30.0, 44.0, 50.0, 45.0, 61.0, 62.0, 87.0, 74.0, 62.0, 41.0, 55.0, 35.0, 28.0, 30.0, 14.0, 19.0, 20.0, 14.0, 8.0, 14.0, 5.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.3277587890625, -75.74333953857422, -73.15892791748047, -70.57450866699219, -67.99009704589844, -65.40567779541016, -62.82126235961914, -60.236846923828125, -57.65243148803711, -55.068016052246094, -52.48360061645508, -49.89918518066406, -47.31476593017578, -44.73035430908203, -42.14593505859375, -39.561519622802734, -36.97710418701172, -34.3926887512207, -31.808273315429688, -29.22385597229004, -26.639440536499023, -24.055025100708008, -21.47060775756836, -18.886192321777344, -16.301776885986328, -13.717361450195312, -11.13294506072998, -8.548528671264648, -5.964113235473633, -3.379697799682617, -0.7952814102172852, 1.7891349792480469, 4.3735504150390625, 6.957966327667236, 9.54238224029541, 12.126798629760742, 14.711214065551758, 17.295629501342773, 19.880046844482422, 22.464462280273438, 25.048877716064453, 27.63329315185547, 30.217708587646484, 32.8021240234375, 35.38654327392578, 37.97095489501953, 40.55537414550781, 43.13978958129883, 45.724205017089844, 48.30862045288086, 50.893035888671875, 53.47745132446289, 56.061866760253906, 58.64628601074219, 61.2307014465332, 63.81511688232422, 66.3995361328125, 68.98395538330078, 71.56836700439453, 74.15278625488281, 76.73719787597656, 79.32161712646484, 81.9060287475586, 84.49044799804688, 87.07485961914062]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 3.0, 15.0, 11.0, 26.0, 38.0, 51.0, 74.0, 108.0, 176.0, 270.0, 542.0, 938.0, 1775.0, 3870.0, 9273.0, 29001.0, 126458.0, 663083.0, 159325.0, 34243.0, 10654.0, 4211.0, 1989.0, 985.0, 536.0, 310.0, 201.0, 122.0, 84.0, 47.0, 29.0, 19.0, 19.0, 14.0, 11.0, 4.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7890625, -5.57904052734375, -5.3690185546875, -5.15899658203125, -4.948974609375, -4.73895263671875, -4.5289306640625, -4.31890869140625, -4.10888671875, -3.89886474609375, -3.6888427734375, -3.47882080078125, -3.268798828125, -3.05877685546875, -2.8487548828125, -2.63873291015625, -2.4287109375, -2.21868896484375, -2.0086669921875, -1.79864501953125, -1.588623046875, -1.37860107421875, -1.1685791015625, -0.95855712890625, -0.74853515625, -0.53851318359375, -0.3284912109375, -0.11846923828125, 0.091552734375, 0.30157470703125, 0.5115966796875, 0.72161865234375, 0.931640625, 1.14166259765625, 1.3516845703125, 1.56170654296875, 1.771728515625, 1.98175048828125, 2.1917724609375, 2.40179443359375, 2.61181640625, 2.82183837890625, 3.0318603515625, 3.24188232421875, 3.451904296875, 3.66192626953125, 3.8719482421875, 4.08197021484375, 4.2919921875, 4.50201416015625, 4.7120361328125, 4.92205810546875, 5.132080078125, 5.34210205078125, 5.5521240234375, 5.76214599609375, 5.97216796875, 6.18218994140625, 6.3922119140625, 6.60223388671875, 6.812255859375, 7.02227783203125, 7.2322998046875, 7.44232177734375, 7.65234375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 6.0, 17.0, 26.0, 18.0, 35.0, 43.0, 51.0, 77.0, 64.0, 85.0, 77.0, 82.0, 88.0, 70.0, 63.0, 44.0, 40.0, 23.0, 30.0, 21.0, 16.0, 13.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.98828125, -7.73785400390625, -7.4874267578125, -7.23699951171875, -6.986572265625, -6.73614501953125, -6.4857177734375, -6.23529052734375, -5.98486328125, -5.73443603515625, -5.4840087890625, -5.23358154296875, -4.983154296875, -4.73272705078125, -4.4822998046875, -4.23187255859375, -3.9814453125, -3.73101806640625, -3.4805908203125, -3.23016357421875, -2.979736328125, -2.72930908203125, -2.4788818359375, -2.22845458984375, -1.97802734375, -1.72760009765625, -1.4771728515625, -1.22674560546875, -0.976318359375, -0.72589111328125, -0.4754638671875, -0.22503662109375, 0.025390625, 0.27581787109375, 0.5262451171875, 0.77667236328125, 1.027099609375, 1.27752685546875, 1.5279541015625, 1.77838134765625, 2.02880859375, 2.27923583984375, 2.5296630859375, 2.78009033203125, 3.030517578125, 3.28094482421875, 3.5313720703125, 3.78179931640625, 4.0322265625, 4.28265380859375, 4.5330810546875, 4.78350830078125, 5.033935546875, 5.28436279296875, 5.5347900390625, 5.78521728515625, 6.03564453125, 6.28607177734375, 6.5364990234375, 6.78692626953125, 7.037353515625, 7.28778076171875, 7.5382080078125, 7.78863525390625, 8.0390625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 14.0, 21.0, 35.0, 54.0, 87.0, 134.0, 227.0, 416.0, 889.0, 2850.0, 21456.0, 926077.0, 87856.0, 5785.0, 1377.0, 535.0, 266.0, 175.0, 87.0, 78.0, 49.0, 19.0, 22.0, 20.0, 5.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.654296875, -9.29296875, -8.931640625, -8.5703125, -8.208984375, -7.84765625, -7.486328125, -7.125, -6.763671875, -6.40234375, -6.041015625, -5.6796875, -5.318359375, -4.95703125, -4.595703125, -4.234375, -3.873046875, -3.51171875, -3.150390625, -2.7890625, -2.427734375, -2.06640625, -1.705078125, -1.34375, -0.982421875, -0.62109375, -0.259765625, 0.1015625, 0.462890625, 0.82421875, 1.185546875, 1.546875, 1.908203125, 2.26953125, 2.630859375, 2.9921875, 3.353515625, 3.71484375, 4.076171875, 4.4375, 4.798828125, 5.16015625, 5.521484375, 5.8828125, 6.244140625, 6.60546875, 6.966796875, 7.328125, 7.689453125, 8.05078125, 8.412109375, 8.7734375, 9.134765625, 9.49609375, 9.857421875, 10.21875, 10.580078125, 10.94140625, 11.302734375, 11.6640625, 12.025390625, 12.38671875, 12.748046875, 13.109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 6.0, 3.0, 3.0, 10.0, 8.0, 6.0, 12.0, 11.0, 9.0, 22.0, 17.0, 14.0, 30.0, 25.0, 27.0, 36.0, 24.0, 35.0, 63.0, 48.0, 70.0, 63.0, 61.0, 66.0, 56.0, 37.0, 35.0, 38.0, 21.0, 19.0, 20.0, 8.0, 11.0, 15.0, 11.0, 9.0, 6.0, 7.0, 9.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0859375, -12.637939453125, -12.18994140625, -11.741943359375, -11.2939453125, -10.845947265625, -10.39794921875, -9.949951171875, -9.501953125, -9.053955078125, -8.60595703125, -8.157958984375, -7.7099609375, -7.261962890625, -6.81396484375, -6.365966796875, -5.91796875, -5.469970703125, -5.02197265625, -4.573974609375, -4.1259765625, -3.677978515625, -3.22998046875, -2.781982421875, -2.333984375, -1.885986328125, -1.43798828125, -0.989990234375, -0.5419921875, -0.093994140625, 0.35400390625, 0.802001953125, 1.25, 1.697998046875, 2.14599609375, 2.593994140625, 3.0419921875, 3.489990234375, 3.93798828125, 4.385986328125, 4.833984375, 5.281982421875, 5.72998046875, 6.177978515625, 6.6259765625, 7.073974609375, 7.52197265625, 7.969970703125, 8.41796875, 8.865966796875, 9.31396484375, 9.761962890625, 10.2099609375, 10.657958984375, 11.10595703125, 11.553955078125, 12.001953125, 12.449951171875, 12.89794921875, 13.345947265625, 13.7939453125, 14.241943359375, 14.68994140625, 15.137939453125, 15.5859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 5.0, 12.0, 8.0, 15.0, 22.0, 32.0, 66.0, 71.0, 145.0, 353.0, 761.0, 2441.0, 11578.0, 144567.0, 861204.0, 21568.0, 3699.0, 1050.0, 423.0, 189.0, 123.0, 79.0, 37.0, 24.0, 19.0, 11.0, 7.0, 14.0, 4.0, 2.0, 4.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6162109375, -1.565948486328125, -1.51568603515625, -1.465423583984375, -1.4151611328125, -1.364898681640625, -1.31463623046875, -1.264373779296875, -1.214111328125, -1.163848876953125, -1.11358642578125, -1.063323974609375, -1.0130615234375, -0.962799072265625, -0.91253662109375, -0.862274169921875, -0.81201171875, -0.761749267578125, -0.71148681640625, -0.661224365234375, -0.6109619140625, -0.560699462890625, -0.51043701171875, -0.460174560546875, -0.409912109375, -0.359649658203125, -0.30938720703125, -0.259124755859375, -0.2088623046875, -0.158599853515625, -0.10833740234375, -0.058074951171875, -0.0078125, 0.042449951171875, 0.09271240234375, 0.142974853515625, 0.1932373046875, 0.243499755859375, 0.29376220703125, 0.344024658203125, 0.394287109375, 0.444549560546875, 0.49481201171875, 0.545074462890625, 0.5953369140625, 0.645599365234375, 0.69586181640625, 0.746124267578125, 0.79638671875, 0.846649169921875, 0.89691162109375, 0.947174072265625, 0.9974365234375, 1.047698974609375, 1.09796142578125, 1.148223876953125, 1.198486328125, 1.248748779296875, 1.29901123046875, 1.349273681640625, 1.3995361328125, 1.449798583984375, 1.50006103515625, 1.550323486328125, 1.6005859375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 7.0, 2.0, 5.0, 8.0, 10.0, 10.0, 12.0, 13.0, 19.0, 26.0, 47.0, 63.0, 67.0, 96.0, 106.0, 117.0, 81.0, 69.0, 54.0, 30.0, 32.0, 22.0, 23.0, 15.0, 13.0, 6.0, 7.0, 9.0, 6.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00022268295288085938, -0.0002162940800189972, -0.000209905207157135, -0.00020351633429527283, -0.00019712746143341064, -0.00019073858857154846, -0.00018434971570968628, -0.0001779608428478241, -0.00017157196998596191, -0.00016518309712409973, -0.00015879422426223755, -0.00015240535140037537, -0.00014601647853851318, -0.000139627605676651, -0.00013323873281478882, -0.00012684985995292664, -0.00012046098709106445, -0.00011407211422920227, -0.00010768324136734009, -0.0001012943685054779, -9.490549564361572e-05, -8.851662278175354e-05, -8.212774991989136e-05, -7.573887705802917e-05, -6.935000419616699e-05, -6.296113133430481e-05, -5.657225847244263e-05, -5.0183385610580444e-05, -4.379451274871826e-05, -3.740563988685608e-05, -3.1016767024993896e-05, -2.4627894163131714e-05, -1.823902130126953e-05, -1.1850148439407349e-05, -5.461275577545166e-06, 9.275972843170166e-07, 7.316470146179199e-06, 1.3705343008041382e-05, 2.0094215869903564e-05, 2.6483088731765747e-05, 3.287196159362793e-05, 3.926083445549011e-05, 4.5649707317352295e-05, 5.203858017921448e-05, 5.842745304107666e-05, 6.481632590293884e-05, 7.120519876480103e-05, 7.759407162666321e-05, 8.398294448852539e-05, 9.037181735038757e-05, 9.676069021224976e-05, 0.00010314956307411194, 0.00010953843593597412, 0.0001159273087978363, 0.00012231618165969849, 0.00012870505452156067, 0.00013509392738342285, 0.00014148280024528503, 0.00014787167310714722, 0.0001542605459690094, 0.00016064941883087158, 0.00016703829169273376, 0.00017342716455459595, 0.00017981603741645813, 0.0001862049102783203]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 8.0, 9.0, 14.0, 20.0, 31.0, 50.0, 59.0, 113.0, 169.0, 322.0, 523.0, 1112.0, 2404.0, 6161.0, 19594.0, 99828.0, 829475.0, 64641.0, 14773.0, 5094.0, 2035.0, 942.0, 470.0, 255.0, 143.0, 101.0, 68.0, 43.0, 42.0, 18.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0277099609375, -0.993896484375, -0.9600830078125, -0.92626953125, -0.8924560546875, -0.858642578125, -0.8248291015625, -0.791015625, -0.7572021484375, -0.723388671875, -0.6895751953125, -0.65576171875, -0.6219482421875, -0.588134765625, -0.5543212890625, -0.5205078125, -0.4866943359375, -0.452880859375, -0.4190673828125, -0.38525390625, -0.3514404296875, -0.317626953125, -0.2838134765625, -0.25, -0.2161865234375, -0.182373046875, -0.1485595703125, -0.11474609375, -0.0809326171875, -0.047119140625, -0.0133056640625, 0.0205078125, 0.0543212890625, 0.088134765625, 0.1219482421875, 0.15576171875, 0.1895751953125, 0.223388671875, 0.2572021484375, 0.291015625, 0.3248291015625, 0.358642578125, 0.3924560546875, 0.42626953125, 0.4600830078125, 0.493896484375, 0.5277099609375, 0.5615234375, 0.5953369140625, 0.629150390625, 0.6629638671875, 0.69677734375, 0.7305908203125, 0.764404296875, 0.7982177734375, 0.83203125, 0.8658447265625, 0.899658203125, 0.9334716796875, 0.96728515625, 1.0010986328125, 1.034912109375, 1.0687255859375, 1.1025390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 8.0, 2.0, 2.0, 11.0, 11.0, 9.0, 15.0, 13.0, 19.0, 17.0, 40.0, 73.0, 58.0, 99.0, 116.0, 142.0, 89.0, 69.0, 52.0, 34.0, 25.0, 21.0, 22.0, 13.0, 14.0, 4.0, 7.0, 6.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.6455078125, -1.6022491455078125, -1.558990478515625, -1.5157318115234375, -1.47247314453125, -1.4292144775390625, -1.385955810546875, -1.3426971435546875, -1.2994384765625, -1.2561798095703125, -1.212921142578125, -1.1696624755859375, -1.12640380859375, -1.0831451416015625, -1.039886474609375, -0.9966278076171875, -0.953369140625, -0.9101104736328125, -0.866851806640625, -0.8235931396484375, -0.78033447265625, -0.7370758056640625, -0.693817138671875, -0.6505584716796875, -0.6072998046875, -0.5640411376953125, -0.520782470703125, -0.4775238037109375, -0.43426513671875, -0.3910064697265625, -0.347747802734375, -0.3044891357421875, -0.26123046875, -0.2179718017578125, -0.174713134765625, -0.1314544677734375, -0.08819580078125, -0.0449371337890625, -0.001678466796875, 0.0415802001953125, 0.0848388671875, 0.1280975341796875, 0.171356201171875, 0.2146148681640625, 0.25787353515625, 0.3011322021484375, 0.344390869140625, 0.3876495361328125, 0.430908203125, 0.4741668701171875, 0.517425537109375, 0.5606842041015625, 0.60394287109375, 0.6472015380859375, 0.690460205078125, 0.7337188720703125, 0.7769775390625, 0.8202362060546875, 0.863494873046875, 0.9067535400390625, 0.95001220703125, 0.9932708740234375, 1.036529541015625, 1.0797882080078125, 1.123046875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 8.0, 9.0, 29.0, 53.0, 170.0, 566.0, 90.0, 36.0, 27.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-128.6829376220703, -125.57109069824219, -122.45924377441406, -119.34739685058594, -116.23554992675781, -113.12370300292969, -110.01185607910156, -106.90000915527344, -103.78816223144531, -100.67631530761719, -97.56446838378906, -94.45262145996094, -91.34077453613281, -88.22892761230469, -85.11708068847656, -82.00523376464844, -78.89338684082031, -75.78153991699219, -72.66969299316406, -69.55784606933594, -66.44599914550781, -63.33415222167969, -60.22230529785156, -57.11045837402344, -53.99861145019531, -50.88676452636719, -47.77491760253906, -44.66307067871094, -41.55122375488281, -38.43937683105469, -35.32752990722656, -32.21568298339844, -29.103843688964844, -25.99199676513672, -22.880149841308594, -19.76830291748047, -16.656455993652344, -13.544609069824219, -10.432762145996094, -7.320915222167969, -4.209068298339844, -1.0972213745117188, 2.0146255493164062, 5.126472473144531, 8.238319396972656, 11.350166320800781, 14.462013244628906, 17.57386016845703, 20.685707092285156, 23.79755401611328, 26.909400939941406, 30.02124786376953, 33.133094787597656, 36.24494171142578, 39.356788635253906, 42.46863555908203, 45.580482482910156, 48.69232940673828, 51.804176330566406, 54.91602325439453, 58.027870178222656, 61.13971710205078, 64.2515640258789, 67.36341094970703, 70.47525787353516]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 1.0, 4.0, 9.0, 11.0, 10.0, 13.0, 10.0, 18.0, 27.0, 18.0, 21.0, 31.0, 30.0, 34.0, 164.0, 276.0, 93.0, 36.0, 32.0, 28.0, 24.0, 12.0, 19.0, 23.0, 14.0, 13.0, 7.0, 6.0, 7.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.11936950683594, -41.19038772583008, -39.26140594482422, -37.33242416381836, -35.4034423828125, -33.47446060180664, -31.54547691345215, -29.61649513244629, -27.68751335144043, -25.75853157043457, -23.82954978942871, -21.90056610107422, -19.97158432006836, -18.0426025390625, -16.11362075805664, -14.184638977050781, -12.255657196044922, -10.326675415039062, -8.397693634033203, -6.468710899353027, -4.539729118347168, -2.6107473373413086, -0.6817646026611328, 1.2472171783447266, 3.176198959350586, 5.105180740356445, 7.034162998199463, 8.96314525604248, 10.89212703704834, 12.8211088180542, 14.750091552734375, 16.679073333740234, 18.608055114746094, 20.537036895751953, 22.466018676757812, 24.395000457763672, 26.32398223876953, 28.25296401977539, 30.181947708129883, 32.110931396484375, 34.03990936279297, 35.96889114379883, 37.89787292480469, 39.82685470581055, 41.755836486816406, 43.684818267822266, 45.613800048828125, 47.54278564453125, 49.47176742553711, 51.40074920654297, 53.32973098754883, 55.25871276855469, 57.18769454956055, 59.116676330566406, 61.04566192626953, 62.974639892578125, 64.90362548828125, 66.83261108398438, 68.76158905029297, 70.6905746459961, 72.61955261230469, 74.54853820800781, 76.4775161743164, 78.40650177001953, 80.33547973632812]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 9.0, 7.0, 9.0, 23.0, 18.0, 15.0, 30.0, 39.0, 32.0, 37.0, 47.0, 114.0, 307.0, 81.0, 32.0, 36.0, 28.0, 27.0, 20.0, 22.0, 19.0, 11.0, 7.0, 10.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.244140625, -6.0625, -5.880859375, -5.69921875, -5.517578125, -5.3359375, -5.154296875, -4.97265625, -4.791015625, -4.609375, -4.427734375, -4.24609375, -4.064453125, -3.8828125, -3.701171875, -3.51953125, -3.337890625, -3.15625, -2.974609375, -2.79296875, -2.611328125, -2.4296875, -2.248046875, -2.06640625, -1.884765625, -1.703125, -1.521484375, -1.33984375, -1.158203125, -0.9765625, -0.794921875, -0.61328125, -0.431640625, -0.25, -0.068359375, 0.11328125, 0.294921875, 0.4765625, 0.658203125, 0.83984375, 1.021484375, 1.203125, 1.384765625, 1.56640625, 1.748046875, 1.9296875, 2.111328125, 2.29296875, 2.474609375, 2.65625, 2.837890625, 3.01953125, 3.201171875, 3.3828125, 3.564453125, 3.74609375, 3.927734375, 4.109375, 4.291015625, 4.47265625, 4.654296875, 4.8359375, 5.017578125, 5.19921875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 6.0, 3.0, 5.0, 9.0, 15.0, 25.0, 23.0, 27.0, 55.0, 82.0, 154.0, 269.0, 731.0, 3098.0, 33470.0, 8340671.0, 7631.0, 1363.0, 411.0, 189.0, 99.0, 59.0, 48.0, 35.0, 21.0, 8.0, 13.0, 10.0, 3.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.39027786254883, -49.84444808959961, -48.298614501953125, -46.752784729003906, -45.20695495605469, -43.66112518310547, -42.11529541015625, -40.569461822509766, -39.02363204956055, -37.47780227661133, -35.931968688964844, -34.386138916015625, -32.840309143066406, -31.294479370117188, -29.748647689819336, -28.202816009521484, -26.656986236572266, -25.111156463623047, -23.565324783325195, -22.019493103027344, -20.473663330078125, -18.927833557128906, -17.382001876831055, -15.83617115020752, -14.290340423583984, -12.74450969696045, -11.198678970336914, -9.652848243713379, -8.107017517089844, -6.561186790466309, -5.015356063842773, -3.4695253372192383, -1.9236984252929688, -0.3778676986694336, 1.1679630279541016, 2.7137937545776367, 4.259624481201172, 5.805455207824707, 7.351285934448242, 8.897116661071777, 10.442947387695312, 11.988778114318848, 13.534608840942383, 15.080439567565918, 16.626270294189453, 18.172100067138672, 19.717931747436523, 21.263763427734375, 22.809593200683594, 24.355422973632812, 25.901254653930664, 27.447086334228516, 28.992916107177734, 30.538745880126953, 32.08457946777344, 33.630409240722656, 35.176239013671875, 36.722068786621094, 38.26789855957031, 39.8137321472168, 41.359561920166016, 42.905391693115234, 44.45122528076172, 45.99705505371094, 47.542884826660156]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 1.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-65.31219482421875, -63.57953643798828, -61.84687805175781, -60.11422348022461, -58.38156509399414, -56.64890670776367, -54.91625213623047, -53.18359375, -51.45093536376953, -49.71827697753906, -47.985618591308594, -46.25296401977539, -44.52030563354492, -42.78764724731445, -41.05499267578125, -39.32233428955078, -37.58967590332031, -35.857017517089844, -34.124359130859375, -32.39170455932617, -30.659046173095703, -28.926387786865234, -27.1937313079834, -25.461074829101562, -23.728416442871094, -21.995758056640625, -20.26310157775879, -18.530445098876953, -16.797786712646484, -15.065129280090332, -13.33247184753418, -11.599814414978027, -9.86715316772461, -8.134495735168457, -6.401838302612305, -4.669180870056152, -2.9365234375, -1.2038660049438477, 0.5287914276123047, 2.261448860168457, 3.9941062927246094, 5.726763725280762, 7.459421157836914, 9.192078590393066, 10.924736022949219, 12.657393455505371, 14.390050888061523, 16.12270736694336, 17.855365753173828, 19.588024139404297, 21.320680618286133, 23.05333709716797, 24.785995483398438, 26.518653869628906, 28.251310348510742, 29.983966827392578, 31.716625213623047, 33.449283599853516, 35.18193817138672, 36.91459655761719, 38.647254943847656, 40.379913330078125, 42.112571716308594, 43.8452262878418, 45.577884674072266]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 10.0, 7.0, 9.0, 22.0, 20.0, 32.0, 44.0, 65.0, 80.0, 159.0, 208.0, 379.0, 699.0, 1489.0, 4326.0, 13723.0, 48398.0, 170884.0, 197910.0, 59969.0, 16794.0, 5230.0, 1850.0, 785.0, 402.0, 256.0, 156.0, 102.0, 81.0, 55.0, 25.0, 31.0, 15.0, 14.0, 6.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.65625, -31.4931640625, -30.330078125, -29.1669921875, -28.00390625, -26.8408203125, -25.677734375, -24.5146484375, -23.3515625, -22.1884765625, -21.025390625, -19.8623046875, -18.69921875, -17.5361328125, -16.373046875, -15.2099609375, -14.046875, -12.8837890625, -11.720703125, -10.5576171875, -9.39453125, -8.2314453125, -7.068359375, -5.9052734375, -4.7421875, -3.5791015625, -2.416015625, -1.2529296875, -0.08984375, 1.0732421875, 2.236328125, 3.3994140625, 4.5625, 5.7255859375, 6.888671875, 8.0517578125, 9.21484375, 10.3779296875, 11.541015625, 12.7041015625, 13.8671875, 15.0302734375, 16.193359375, 17.3564453125, 18.51953125, 19.6826171875, 20.845703125, 22.0087890625, 23.171875, 24.3349609375, 25.498046875, 26.6611328125, 27.82421875, 28.9873046875, 30.150390625, 31.3134765625, 32.4765625, 33.6396484375, 34.802734375, 35.9658203125, 37.12890625, 38.2919921875, 39.455078125, 40.6181640625, 41.78125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 9.0, 12.0, 6.0, 23.0, 36.0, 47.0, 63.0, 72.0, 84.0, 125.0, 96.0, 90.0, 64.0, 57.0, 53.0, 45.0, 29.0, 26.0, 17.0, 13.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.7354736328125, -6.478759765625, -6.2220458984375, -5.96533203125, -5.7086181640625, -5.451904296875, -5.1951904296875, -4.9384765625, -4.6817626953125, -4.425048828125, -4.1683349609375, -3.91162109375, -3.6549072265625, -3.398193359375, -3.1414794921875, -2.884765625, -2.6280517578125, -2.371337890625, -2.1146240234375, -1.85791015625, -1.6011962890625, -1.344482421875, -1.0877685546875, -0.8310546875, -0.5743408203125, -0.317626953125, -0.0609130859375, 0.19580078125, 0.4525146484375, 0.709228515625, 0.9659423828125, 1.22265625, 1.4793701171875, 1.736083984375, 1.9927978515625, 2.24951171875, 2.5062255859375, 2.762939453125, 3.0196533203125, 3.2763671875, 3.5330810546875, 3.789794921875, 4.0465087890625, 4.30322265625, 4.5599365234375, 4.816650390625, 5.0733642578125, 5.330078125, 5.5867919921875, 5.843505859375, 6.1002197265625, 6.35693359375, 6.6136474609375, 6.870361328125, 7.1270751953125, 7.3837890625, 7.6405029296875, 7.897216796875, 8.1539306640625, 8.41064453125, 8.6673583984375, 8.924072265625, 9.1807861328125, 9.4375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 17.0, 23.0, 26.0, 44.0, 72.0, 72.0, 65.0, 47.0, 26.0, 18.0, 19.0, 8.0, 6.0, 4.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.602140426635742, -22.676210403442383, -21.750282287597656, -20.824352264404297, -19.89842414855957, -18.97249412536621, -18.046566009521484, -17.120635986328125, -16.194705963134766, -15.268776893615723, -14.34284782409668, -13.41691780090332, -12.490989685058594, -11.565059661865234, -10.639130592346191, -9.713201522827148, -8.787273406982422, -7.861344337463379, -6.935415267944336, -6.009485721588135, -5.083556652069092, -4.157627582550049, -3.2316980361938477, -2.3057689666748047, -1.3798398971557617, -0.4539107084274292, 0.4720184803009033, 1.3979477882385254, 2.3238768577575684, 3.2498059272766113, 4.1757354736328125, 5.1016645431518555, 6.027591705322266, 6.953520774841309, 7.879449844360352, 8.805379867553711, 9.731307983398438, 10.657238006591797, 11.58316707611084, 12.509096145629883, 13.435025215148926, 14.360954284667969, 15.286883354187012, 16.212812423706055, 17.138742446899414, 18.06467056274414, 18.9906005859375, 19.91653060913086, 20.842458724975586, 21.768388748168945, 22.694316864013672, 23.62024688720703, 24.546175003051758, 25.472105026245117, 26.398033142089844, 27.323963165283203, 28.249893188476562, 29.175823211669922, 30.10175132751465, 31.027681350708008, 31.953609466552734, 32.879539489746094, 33.80546951293945, 34.73139953613281, 35.657325744628906]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 1.0, 1.0, 5.0, 2.0, 7.0, 11.0, 2.0, 10.0, 37.0, 93.0, 163.0, 85.0, 23.0, 9.0, 6.0, 6.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.467105865478516, -45.772544860839844, -44.077980041503906, -42.38341522216797, -40.6888542175293, -38.994293212890625, -37.29972839355469, -35.60516357421875, -33.91060256958008, -32.216041564941406, -30.52147674560547, -28.826913833618164, -27.13235092163086, -25.437788009643555, -23.74322509765625, -22.048662185668945, -20.35409927368164, -18.659536361694336, -16.96497344970703, -15.270410537719727, -13.575847625732422, -11.881284713745117, -10.186721801757812, -8.492158889770508, -6.797595977783203, -5.103033065795898, -3.4084701538085938, -1.713907241821289, -0.019344329833984375, 1.6752185821533203, 3.369781494140625, 5.06434440612793, 6.758903503417969, 8.453466415405273, 10.148029327392578, 11.842592239379883, 13.537155151367188, 15.231718063354492, 16.926280975341797, 18.6208438873291, 20.315406799316406, 22.00996971130371, 23.704532623291016, 25.39909553527832, 27.093658447265625, 28.78822135925293, 30.482784271240234, 32.177345275878906, 33.871910095214844, 35.56647491455078, 37.26103591918945, 38.955596923828125, 40.65016174316406, 42.3447265625, 44.03928756713867, 45.733848571777344, 47.42841339111328, 49.12297821044922, 50.81753921508789, 52.51210021972656, 54.2066650390625, 55.90122985839844, 57.59579086303711, 59.29035186767578, 60.98491668701172]}, "eval/loss": 5.550514221191406, "eval/wer": 1.6318431652677738, "eval/runtime": 934.4257, "eval/samples_per_second": 2.827, "eval/steps_per_second": 0.354} \ No newline at end of file +{"train/loss": 3.575, "train/learning_rate": 2.3768408551068884e-05, "train/epoch": 5.04, "train/global_step": 4500, "_runtime": 29171, "_timestamp": 1646690410, "_step": 4502, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 80.0, 17.0, 11.0, 6.0, 1.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 0.0, 29497.0, 639.0, 98.0, 53.0, 32.0, 8.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.03125, -59.52392578125, -58.0166015625, -56.50927734375, -55.001953125, -53.49462890625, -51.9873046875, -50.47998046875, -48.97265625, -47.46533203125, -45.9580078125, -44.45068359375, -42.943359375, -41.43603515625, -39.9287109375, -38.42138671875, -36.9140625, -35.40673828125, -33.8994140625, -32.39208984375, -30.884765625, -29.37744140625, -27.8701171875, -26.36279296875, -24.85546875, -23.34814453125, -21.8408203125, -20.33349609375, -18.826171875, -17.31884765625, -15.8115234375, -14.30419921875, -12.796875, -11.28955078125, -9.7822265625, -8.27490234375, -6.767578125, -5.26025390625, -3.7529296875, -2.24560546875, -0.73828125, 0.76904296875, 2.2763671875, 3.78369140625, 5.291015625, 6.79833984375, 8.3056640625, 9.81298828125, 11.3203125, 12.82763671875, 14.3349609375, 15.84228515625, 17.349609375, 18.85693359375, 20.3642578125, 21.87158203125, 23.37890625, 24.88623046875, 26.3935546875, 27.90087890625, 29.408203125, 30.91552734375, 32.4228515625, 33.93017578125, 35.4375]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 6.0, 2.0, 8.0, 14.0, 15.0, 7.0, 25.0, 15.0, 21.0, 22.0, 25.0, 34.0, 32.0, 29.0, 45.0, 37.0, 44.0, 49.0, 58.0, 50.0, 45.0, 54.0, 38.0, 47.0, 36.0, 45.0, 40.0, 28.0, 25.0, 21.0, 23.0, 17.0, 10.0, 7.0, 6.0, 10.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.9805793762207, -37.988128662109375, -36.99567794799805, -36.00322723388672, -35.010780334472656, -34.01832962036133, -33.02587890625, -32.03342819213867, -31.040977478027344, -30.048526763916016, -29.056076049804688, -28.063627243041992, -27.071176528930664, -26.078725814819336, -25.08627700805664, -24.093826293945312, -23.101375579833984, -22.108924865722656, -21.116474151611328, -20.124025344848633, -19.131574630737305, -18.139123916625977, -17.14667510986328, -16.154224395751953, -15.161773681640625, -14.169322967529297, -13.176873207092285, -12.184423446655273, -11.191972732543945, -10.199522018432617, -9.207072257995605, -8.214622497558594, -7.222169876098633, -6.229719638824463, -5.237269401550293, -4.244819164276123, -3.252368927001953, -2.259918689727783, -1.2674684524536133, -0.27501821517944336, 0.7174320220947266, 1.7098822593688965, 2.7023324966430664, 3.6947827339172363, 4.687232971191406, 5.679683208465576, 6.672133445739746, 7.664583683013916, 8.657033920288086, 9.649484634399414, 10.641934394836426, 11.634384155273438, 12.626834869384766, 13.619285583496094, 14.611735343933105, 15.604185104370117, 16.596635818481445, 17.589086532592773, 18.58153533935547, 19.573986053466797, 20.566436767578125, 21.558887481689453, 22.55133819580078, 23.543787002563477, 24.536237716674805]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 1.0, 5.0, 10.0, 11.0, 13.0, 10.0, 14.0, 15.0, 21.0, 23.0, 26.0, 26.0, 39.0, 27.0, 39.0, 32.0, 39.0, 43.0, 53.0, 47.0, 35.0, 46.0, 46.0, 36.0, 45.0, 44.0, 38.0, 33.0, 27.0, 24.0, 17.0, 22.0, 22.0, 17.0, 9.0, 11.0, 10.0, 5.0, 4.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.333877563476562, -27.439260482788086, -26.544641494750977, -25.6500244140625, -24.75540542602539, -23.860788345336914, -22.966171264648438, -22.071552276611328, -21.17693519592285, -20.282318115234375, -19.387699127197266, -18.49308204650879, -17.598464965820312, -16.703845977783203, -15.809228897094727, -14.914610862731934, -14.01999282836914, -13.125374794006348, -12.230756759643555, -11.336139678955078, -10.441521644592285, -9.546903610229492, -8.652286529541016, -7.757668495178223, -6.86305046081543, -5.968432426452637, -5.073814868927002, -4.179197311401367, -3.284579277038574, -2.3899612426757812, -1.4953436851501465, -0.6007261276245117, 0.29389381408691406, 1.188511610031128, 2.083129405975342, 2.9777472019195557, 3.8723649978637695, 4.7669830322265625, 5.661600589752197, 6.556218147277832, 7.450836181640625, 8.345454216003418, 9.240072250366211, 10.134689331054688, 11.02930736541748, 11.923925399780273, 12.81854248046875, 13.713160514831543, 14.607778549194336, 15.502396583557129, 16.397014617919922, 17.2916316986084, 18.186248779296875, 19.080867767333984, 19.97548484802246, 20.870101928710938, 21.764720916748047, 22.659337997436523, 23.553956985473633, 24.44857406616211, 25.34319305419922, 26.237810134887695, 27.132427215576172, 28.02704620361328, 28.921663284301758]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 16.0, 17.0, 33.0, 53.0, 76.0, 112.0, 165.0, 295.0, 420.0, 688.0, 1049.0, 1526.0, 2226.0, 3212.0, 4844.0, 7050.0, 9968.0, 13904.0, 19144.0, 25851.0, 34149.0, 43572.0, 54784.0, 67079.0, 79821.0, 97823.0, 120191.0, 96406.0, 78474.0, 65956.0, 54261.0, 43449.0, 33233.0, 25292.0, 18909.0, 13531.0, 9772.0, 6745.0, 4792.0, 3165.0, 2268.0, 1441.0, 1012.0, 645.0, 400.0, 267.0, 179.0, 112.0, 75.0, 42.0, 29.0, 18.0, 5.0, 9.0, 6.0, 2.0, 1.0, 2.0], "bins": [-61.9375, -60.02978515625, -58.1220703125, -56.21435546875, -54.306640625, -52.39892578125, -50.4912109375, -48.58349609375, -46.67578125, -44.76806640625, -42.8603515625, -40.95263671875, -39.044921875, -37.13720703125, -35.2294921875, -33.32177734375, -31.4140625, -29.50634765625, -27.5986328125, -25.69091796875, -23.783203125, -21.87548828125, -19.9677734375, -18.06005859375, -16.15234375, -14.24462890625, -12.3369140625, -10.42919921875, -8.521484375, -6.61376953125, -4.7060546875, -2.79833984375, -0.890625, 1.01708984375, 2.9248046875, 4.83251953125, 6.740234375, 8.64794921875, 10.5556640625, 12.46337890625, 14.37109375, 16.27880859375, 18.1865234375, 20.09423828125, 22.001953125, 23.90966796875, 25.8173828125, 27.72509765625, 29.6328125, 31.54052734375, 33.4482421875, 35.35595703125, 37.263671875, 39.17138671875, 41.0791015625, 42.98681640625, 44.89453125, 46.80224609375, 48.7099609375, 50.61767578125, 52.525390625, 54.43310546875, 56.3408203125, 58.24853515625, 60.15625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 3.0, 5.0, 7.0, 8.0, 9.0, 10.0, 13.0, 14.0, 19.0, 20.0, 15.0, 18.0, 15.0, 22.0, 25.0, 25.0, 28.0, 45.0, 51.0, 41.0, 50.0, 39.0, 56.0, 53.0, 31.0, 46.0, 28.0, 35.0, 33.0, 27.0, 31.0, 26.0, 22.0, 13.0, 8.0, 17.0, 11.0, 17.0, 9.0, 8.0, 3.0, 8.0, 5.0, 3.0, 7.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-27.046875, -26.14453125, -25.2421875, -24.33984375, -23.4375, -22.53515625, -21.6328125, -20.73046875, -19.828125, -18.92578125, -18.0234375, -17.12109375, -16.21875, -15.31640625, -14.4140625, -13.51171875, -12.609375, -11.70703125, -10.8046875, -9.90234375, -9.0, -8.09765625, -7.1953125, -6.29296875, -5.390625, -4.48828125, -3.5859375, -2.68359375, -1.78125, -0.87890625, 0.0234375, 0.92578125, 1.828125, 2.73046875, 3.6328125, 4.53515625, 5.4375, 6.33984375, 7.2421875, 8.14453125, 9.046875, 9.94921875, 10.8515625, 11.75390625, 12.65625, 13.55859375, 14.4609375, 15.36328125, 16.265625, 17.16796875, 18.0703125, 18.97265625, 19.875, 20.77734375, 21.6796875, 22.58203125, 23.484375, 24.38671875, 25.2890625, 26.19140625, 27.09375, 27.99609375, 28.8984375, 29.80078125, 30.703125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 10.0, 4.0, 10.0, 9.0, 7.0, 21.0, 22.0, 19.0, 23.0, 23.0, 33.0, 33.0, 40.0, 48.0, 28.0, 49.0, 42.0, 49.0, 57.0, 40.0, 38.0, 39.0, 62.0, 32.0, 39.0, 30.0, 39.0, 30.0, 18.0, 14.0, 21.0, 18.0, 8.0, 5.0, 4.0, 7.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.536663055419922, -19.864686965942383, -19.192712783813477, -18.520736694335938, -17.84876251220703, -17.176786422729492, -16.504812240600586, -15.832836151123047, -15.16086196899414, -14.488886833190918, -13.816911697387695, -13.144936561584473, -12.47296142578125, -11.800986289978027, -11.129011154174805, -10.457035064697266, -9.785059928894043, -9.11308479309082, -8.441109657287598, -7.769134521484375, -7.097159385681152, -6.42518424987793, -5.753208637237549, -5.081233501434326, -4.4092583656311035, -3.737283229827881, -3.065308094024658, -2.3933327198028564, -1.7213575839996338, -1.0493824481964111, -0.3774070739746094, 0.2945680618286133, 0.9665431976318359, 1.6385183334350586, 2.3104934692382812, 2.982468843460083, 3.6544439792633057, 4.326418876647949, 4.99839448928833, 5.670369625091553, 6.342344760894775, 7.014319896697998, 7.686295032501221, 8.358270645141602, 9.030245780944824, 9.702220916748047, 10.37419605255127, 11.046171188354492, 11.718146324157715, 12.390121459960938, 13.06209659576416, 13.734071731567383, 14.406046867370605, 15.078022003173828, 15.749998092651367, 16.421972274780273, 17.093948364257812, 17.76592445373535, 18.437898635864258, 19.109874725341797, 19.781848907470703, 20.453824996948242, 21.12579917907715, 21.797775268554688, 22.469749450683594]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 5.0, 6.0, 10.0, 11.0, 13.0, 18.0, 16.0, 20.0, 24.0, 28.0, 32.0, 27.0, 37.0, 36.0, 42.0, 49.0, 41.0, 53.0, 49.0, 34.0, 38.0, 48.0, 47.0, 37.0, 35.0, 38.0, 25.0, 27.0, 22.0, 16.0, 26.0, 21.0, 16.0, 13.0, 6.0, 11.0, 3.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.259138107299805, -20.608158111572266, -19.95718002319336, -19.30620002746582, -18.65522003173828, -18.004241943359375, -17.353261947631836, -16.702281951904297, -16.05130386352539, -15.400324821472168, -14.749344825744629, -14.098365783691406, -13.447385787963867, -12.796406745910645, -12.145427703857422, -11.494447708129883, -10.843467712402344, -10.192488670349121, -9.541508674621582, -8.89052963256836, -8.23954963684082, -7.588570594787598, -6.937591552734375, -6.286612033843994, -5.635632514953613, -4.984652996063232, -4.333673477172852, -3.682694435119629, -3.031714916229248, -2.380735397338867, -1.7297561168670654, -1.0787768363952637, -0.4277992248535156, 0.22318017482757568, 0.874159574508667, 1.5251389741897583, 2.1761183738708496, 2.8270978927612305, 3.4780771732330322, 4.129056453704834, 4.780035972595215, 5.431015491485596, 6.081995010375977, 6.732974052429199, 7.38395357131958, 8.034933090209961, 8.685912132263184, 9.336891174316406, 9.987871170043945, 10.638850212097168, 11.289830207824707, 11.94080924987793, 12.591789245605469, 13.242768287658691, 13.893747329711914, 14.544727325439453, 15.195706367492676, 15.846685409545898, 16.497665405273438, 17.148645401000977, 17.799623489379883, 18.450603485107422, 19.10158348083496, 19.752561569213867, 20.403541564941406]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 6.0, 20.0, 17.0, 25.0, 42.0, 50.0, 87.0, 131.0, 218.0, 294.0, 538.0, 797.0, 1389.0, 2245.0, 3887.0, 6489.0, 11267.0, 19824.0, 35066.0, 61816.0, 109436.0, 191100.0, 323787.0, 514932.0, 702790.0, 733593.0, 576174.0, 375318.0, 224305.0, 129706.0, 73403.0, 41147.0, 23169.0, 13133.0, 7461.0, 4253.0, 2507.0, 1513.0, 869.0, 537.0, 365.0, 203.0, 135.0, 101.0, 47.0, 27.0, 27.0, 10.0, 10.0, 11.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-23.09375, -22.39697265625, -21.7001953125, -21.00341796875, -20.306640625, -19.60986328125, -18.9130859375, -18.21630859375, -17.51953125, -16.82275390625, -16.1259765625, -15.42919921875, -14.732421875, -14.03564453125, -13.3388671875, -12.64208984375, -11.9453125, -11.24853515625, -10.5517578125, -9.85498046875, -9.158203125, -8.46142578125, -7.7646484375, -7.06787109375, -6.37109375, -5.67431640625, -4.9775390625, -4.28076171875, -3.583984375, -2.88720703125, -2.1904296875, -1.49365234375, -0.796875, -0.10009765625, 0.5966796875, 1.29345703125, 1.990234375, 2.68701171875, 3.3837890625, 4.08056640625, 4.77734375, 5.47412109375, 6.1708984375, 6.86767578125, 7.564453125, 8.26123046875, 8.9580078125, 9.65478515625, 10.3515625, 11.04833984375, 11.7451171875, 12.44189453125, 13.138671875, 13.83544921875, 14.5322265625, 15.22900390625, 15.92578125, 16.62255859375, 17.3193359375, 18.01611328125, 18.712890625, 19.40966796875, 20.1064453125, 20.80322265625, 21.5]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 7.0, 4.0, 7.0, 11.0, 7.0, 15.0, 12.0, 17.0, 21.0, 22.0, 25.0, 20.0, 28.0, 39.0, 31.0, 31.0, 42.0, 45.0, 41.0, 51.0, 43.0, 45.0, 48.0, 44.0, 42.0, 32.0, 38.0, 26.0, 30.0, 25.0, 20.0, 24.0, 21.0, 24.0, 16.0, 15.0, 13.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.8260498046875, -14.355224609375, -13.8843994140625, -13.41357421875, -12.9427490234375, -12.471923828125, -12.0010986328125, -11.5302734375, -11.0594482421875, -10.588623046875, -10.1177978515625, -9.64697265625, -9.1761474609375, -8.705322265625, -8.2344970703125, -7.763671875, -7.2928466796875, -6.822021484375, -6.3511962890625, -5.88037109375, -5.4095458984375, -4.938720703125, -4.4678955078125, -3.9970703125, -3.5262451171875, -3.055419921875, -2.5845947265625, -2.11376953125, -1.6429443359375, -1.172119140625, -0.7012939453125, -0.23046875, 0.2403564453125, 0.711181640625, 1.1820068359375, 1.65283203125, 2.1236572265625, 2.594482421875, 3.0653076171875, 3.5361328125, 4.0069580078125, 4.477783203125, 4.9486083984375, 5.41943359375, 5.8902587890625, 6.361083984375, 6.8319091796875, 7.302734375, 7.7735595703125, 8.244384765625, 8.7152099609375, 9.18603515625, 9.6568603515625, 10.127685546875, 10.5985107421875, 11.0693359375, 11.5401611328125, 12.010986328125, 12.4818115234375, 12.95263671875, 13.4234619140625, 13.894287109375, 14.3651123046875, 14.8359375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 22.0, 26.0, 57.0, 95.0, 165.0, 312.0, 531.0, 938.0, 1650.0, 2751.0, 4885.0, 8658.0, 14777.0, 25628.0, 43270.0, 72783.0, 119442.0, 186944.0, 280334.0, 392445.0, 501492.0, 567422.0, 545115.0, 456980.0, 341490.0, 236681.0, 153440.0, 96635.0, 58651.0, 33813.0, 19933.0, 11359.0, 6712.0, 3757.0, 2147.0, 1250.0, 711.0, 412.0, 244.0, 133.0, 74.0, 51.0, 29.0, 12.0, 9.0, 3.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.75, -16.222900390625, -15.69580078125, -15.168701171875, -14.6416015625, -14.114501953125, -13.58740234375, -13.060302734375, -12.533203125, -12.006103515625, -11.47900390625, -10.951904296875, -10.4248046875, -9.897705078125, -9.37060546875, -8.843505859375, -8.31640625, -7.789306640625, -7.26220703125, -6.735107421875, -6.2080078125, -5.680908203125, -5.15380859375, -4.626708984375, -4.099609375, -3.572509765625, -3.04541015625, -2.518310546875, -1.9912109375, -1.464111328125, -0.93701171875, -0.409912109375, 0.1171875, 0.644287109375, 1.17138671875, 1.698486328125, 2.2255859375, 2.752685546875, 3.27978515625, 3.806884765625, 4.333984375, 4.861083984375, 5.38818359375, 5.915283203125, 6.4423828125, 6.969482421875, 7.49658203125, 8.023681640625, 8.55078125, 9.077880859375, 9.60498046875, 10.132080078125, 10.6591796875, 11.186279296875, 11.71337890625, 12.240478515625, 12.767578125, 13.294677734375, 13.82177734375, 14.348876953125, 14.8759765625, 15.403076171875, 15.93017578125, 16.457275390625, 16.984375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 3.0, 8.0, 9.0, 8.0, 13.0, 12.0, 14.0, 27.0, 28.0, 30.0, 42.0, 48.0, 45.0, 70.0, 83.0, 101.0, 106.0, 152.0, 138.0, 146.0, 181.0, 193.0, 178.0, 207.0, 199.0, 189.0, 192.0, 210.0, 180.0, 171.0, 146.0, 140.0, 122.0, 114.0, 86.0, 84.0, 61.0, 54.0, 59.0, 49.0, 31.0, 27.0, 26.0, 18.0, 25.0, 16.0, 8.0, 9.0, 4.0, 3.0, 3.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.39453125, -5.197998046875, -5.00146484375, -4.804931640625, -4.6083984375, -4.411865234375, -4.21533203125, -4.018798828125, -3.822265625, -3.625732421875, -3.42919921875, -3.232666015625, -3.0361328125, -2.839599609375, -2.64306640625, -2.446533203125, -2.25, -2.053466796875, -1.85693359375, -1.660400390625, -1.4638671875, -1.267333984375, -1.07080078125, -0.874267578125, -0.677734375, -0.481201171875, -0.28466796875, -0.088134765625, 0.1083984375, 0.304931640625, 0.50146484375, 0.697998046875, 0.89453125, 1.091064453125, 1.28759765625, 1.484130859375, 1.6806640625, 1.877197265625, 2.07373046875, 2.270263671875, 2.466796875, 2.663330078125, 2.85986328125, 3.056396484375, 3.2529296875, 3.449462890625, 3.64599609375, 3.842529296875, 4.0390625, 4.235595703125, 4.43212890625, 4.628662109375, 4.8251953125, 5.021728515625, 5.21826171875, 5.414794921875, 5.611328125, 5.807861328125, 6.00439453125, 6.200927734375, 6.3974609375, 6.593994140625, 6.79052734375, 6.987060546875, 7.18359375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 7.0, 17.0, 9.0, 19.0, 32.0, 27.0, 26.0, 38.0, 41.0, 46.0, 42.0, 46.0, 63.0, 57.0, 51.0, 53.0, 49.0, 43.0, 46.0, 44.0, 29.0, 40.0, 23.0, 22.0, 22.0, 20.0, 17.0, 13.0, 14.0, 10.0, 10.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.262739181518555, -21.616479873657227, -20.9702205657959, -20.32396125793457, -19.677703857421875, -19.031444549560547, -18.38518524169922, -17.73892593383789, -17.092666625976562, -16.446407318115234, -15.800148010253906, -15.153889656066895, -14.507630348205566, -13.861371040344238, -13.215112686157227, -12.568853378295898, -11.92259407043457, -11.276334762573242, -10.630075454711914, -9.983817100524902, -9.337557792663574, -8.691298484802246, -8.045040130615234, -7.398780822753906, -6.752521514892578, -6.10626220703125, -5.46000337600708, -4.81374454498291, -4.167485237121582, -3.521226167678833, -2.874967098236084, -2.228708267211914, -1.582448959350586, -0.9361898899078369, -0.2899308204650879, 0.35632824897766113, 1.0025873184204102, 1.6488463878631592, 2.295105457305908, 2.941364288330078, 3.5876235961914062, 4.233882904052734, 4.880141735076904, 5.526400566101074, 6.172659873962402, 6.8189191818237305, 7.4651780128479, 8.11143684387207, 8.757696151733398, 9.403955459594727, 10.050214767456055, 10.696473121643066, 11.342732429504395, 11.988991737365723, 12.635250091552734, 13.281509399414062, 13.92776870727539, 14.574028015136719, 15.220287322998047, 15.866545677185059, 16.512805938720703, 17.1590633392334, 17.805322647094727, 18.451581954956055, 19.097841262817383]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 4.0, 3.0, 5.0, 2.0, 7.0, 11.0, 10.0, 13.0, 14.0, 18.0, 15.0, 24.0, 18.0, 35.0, 29.0, 38.0, 31.0, 47.0, 39.0, 38.0, 32.0, 40.0, 38.0, 44.0, 38.0, 40.0, 41.0, 40.0, 34.0, 30.0, 32.0, 32.0, 30.0, 25.0, 21.0, 16.0, 12.0, 13.0, 5.0, 13.0, 2.0, 4.0, 6.0, 4.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.441852569580078, -14.933212280273438, -14.42457103729248, -13.91593074798584, -13.407289505004883, -12.898649215698242, -12.390008926391602, -11.881368637084961, -11.372727394104004, -10.864087104797363, -10.355445861816406, -9.846805572509766, -9.338165283203125, -8.829524040222168, -8.320883750915527, -7.8122429847717285, -7.30360221862793, -6.794961452484131, -6.286320686340332, -5.777680397033691, -5.269039630889893, -4.760398864746094, -4.251758575439453, -3.7431178092956543, -3.2344770431518555, -2.7258362770080566, -2.217195749282837, -1.7085551023483276, -1.1999144554138184, -0.6912736892700195, -0.1826331615447998, 0.3260073661804199, 0.8346481323242188, 1.343288779258728, 1.8519294261932373, 2.360569953918457, 2.869210720062256, 3.3778514862060547, 3.8864920139312744, 4.395132541656494, 4.903773307800293, 5.412414073944092, 5.921054840087891, 6.429695129394531, 6.93833589553833, 7.446976661682129, 7.9556169509887695, 8.464258193969727, 8.972898483276367, 9.481538772583008, 9.990180015563965, 10.498820304870605, 11.007461547851562, 11.516101837158203, 12.024742126464844, 12.533382415771484, 13.042023658752441, 13.550663948059082, 14.059305191040039, 14.56794548034668, 15.07658576965332, 15.585227012634277, 16.093868255615234, 16.602508544921875, 17.111148834228516]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 8.0, 23.0, 26.0, 42.0, 76.0, 143.0, 194.0, 297.0, 461.0, 601.0, 1000.0, 1503.0, 2283.0, 3368.0, 5158.0, 7444.0, 11054.0, 16163.0, 23374.0, 34634.0, 51588.0, 75700.0, 107618.0, 138430.0, 148397.0, 126377.0, 93180.0, 64477.0, 43554.0, 29505.0, 20133.0, 13615.0, 9107.0, 6298.0, 4240.0, 2844.0, 1857.0, 1327.0, 845.0, 539.0, 360.0, 263.0, 173.0, 99.0, 51.0, 54.0, 33.0, 15.0, 11.0, 2.0, 4.0, 4.0, 2.0, 1.0], "bins": [-22.03125, -21.388671875, -20.74609375, -20.103515625, -19.4609375, -18.818359375, -18.17578125, -17.533203125, -16.890625, -16.248046875, -15.60546875, -14.962890625, -14.3203125, -13.677734375, -13.03515625, -12.392578125, -11.75, -11.107421875, -10.46484375, -9.822265625, -9.1796875, -8.537109375, -7.89453125, -7.251953125, -6.609375, -5.966796875, -5.32421875, -4.681640625, -4.0390625, -3.396484375, -2.75390625, -2.111328125, -1.46875, -0.826171875, -0.18359375, 0.458984375, 1.1015625, 1.744140625, 2.38671875, 3.029296875, 3.671875, 4.314453125, 4.95703125, 5.599609375, 6.2421875, 6.884765625, 7.52734375, 8.169921875, 8.8125, 9.455078125, 10.09765625, 10.740234375, 11.3828125, 12.025390625, 12.66796875, 13.310546875, 13.953125, 14.595703125, 15.23828125, 15.880859375, 16.5234375, 17.166015625, 17.80859375, 18.451171875, 19.09375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 6.0, 9.0, 5.0, 5.0, 6.0, 17.0, 13.0, 24.0, 20.0, 25.0, 24.0, 28.0, 34.0, 41.0, 28.0, 20.0, 40.0, 38.0, 40.0, 44.0, 28.0, 38.0, 41.0, 49.0, 43.0, 32.0, 29.0, 20.0, 36.0, 35.0, 21.0, 24.0, 20.0, 18.0, 16.0, 22.0, 8.0, 12.0, 7.0, 6.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.9296875, -13.47509765625, -13.0205078125, -12.56591796875, -12.111328125, -11.65673828125, -11.2021484375, -10.74755859375, -10.29296875, -9.83837890625, -9.3837890625, -8.92919921875, -8.474609375, -8.02001953125, -7.5654296875, -7.11083984375, -6.65625, -6.20166015625, -5.7470703125, -5.29248046875, -4.837890625, -4.38330078125, -3.9287109375, -3.47412109375, -3.01953125, -2.56494140625, -2.1103515625, -1.65576171875, -1.201171875, -0.74658203125, -0.2919921875, 0.16259765625, 0.6171875, 1.07177734375, 1.5263671875, 1.98095703125, 2.435546875, 2.89013671875, 3.3447265625, 3.79931640625, 4.25390625, 4.70849609375, 5.1630859375, 5.61767578125, 6.072265625, 6.52685546875, 6.9814453125, 7.43603515625, 7.890625, 8.34521484375, 8.7998046875, 9.25439453125, 9.708984375, 10.16357421875, 10.6181640625, 11.07275390625, 11.52734375, 11.98193359375, 12.4365234375, 12.89111328125, 13.345703125, 13.80029296875, 14.2548828125, 14.70947265625, 15.1640625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 4.0, 9.0, 8.0, 29.0, 28.0, 47.0, 71.0, 121.0, 149.0, 210.0, 312.0, 526.0, 783.0, 1178.0, 1876.0, 2754.0, 4275.0, 6752.0, 10788.0, 18015.0, 30425.0, 53482.0, 97465.0, 171847.0, 230015.0, 177701.0, 101910.0, 55967.0, 31724.0, 18747.0, 11487.0, 7036.0, 4507.0, 2853.0, 1888.0, 1236.0, 738.0, 516.0, 347.0, 248.0, 170.0, 98.0, 88.0, 41.0, 22.0, 24.0, 14.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-22.65625, -21.914306640625, -21.17236328125, -20.430419921875, -19.6884765625, -18.946533203125, -18.20458984375, -17.462646484375, -16.720703125, -15.978759765625, -15.23681640625, -14.494873046875, -13.7529296875, -13.010986328125, -12.26904296875, -11.527099609375, -10.78515625, -10.043212890625, -9.30126953125, -8.559326171875, -7.8173828125, -7.075439453125, -6.33349609375, -5.591552734375, -4.849609375, -4.107666015625, -3.36572265625, -2.623779296875, -1.8818359375, -1.139892578125, -0.39794921875, 0.343994140625, 1.0859375, 1.827880859375, 2.56982421875, 3.311767578125, 4.0537109375, 4.795654296875, 5.53759765625, 6.279541015625, 7.021484375, 7.763427734375, 8.50537109375, 9.247314453125, 9.9892578125, 10.731201171875, 11.47314453125, 12.215087890625, 12.95703125, 13.698974609375, 14.44091796875, 15.182861328125, 15.9248046875, 16.666748046875, 17.40869140625, 18.150634765625, 18.892578125, 19.634521484375, 20.37646484375, 21.118408203125, 21.8603515625, 22.602294921875, 23.34423828125, 24.086181640625, 24.828125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 10.0, 6.0, 4.0, 5.0, 12.0, 14.0, 10.0, 16.0, 26.0, 30.0, 30.0, 31.0, 27.0, 35.0, 39.0, 51.0, 54.0, 38.0, 50.0, 34.0, 43.0, 40.0, 45.0, 41.0, 34.0, 38.0, 37.0, 35.0, 31.0, 34.0, 21.0, 15.0, 17.0, 11.0, 7.0, 10.0, 6.0, 9.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.40625, -13.0489501953125, -12.691650390625, -12.3343505859375, -11.97705078125, -11.6197509765625, -11.262451171875, -10.9051513671875, -10.5478515625, -10.1905517578125, -9.833251953125, -9.4759521484375, -9.11865234375, -8.7613525390625, -8.404052734375, -8.0467529296875, -7.689453125, -7.3321533203125, -6.974853515625, -6.6175537109375, -6.26025390625, -5.9029541015625, -5.545654296875, -5.1883544921875, -4.8310546875, -4.4737548828125, -4.116455078125, -3.7591552734375, -3.40185546875, -3.0445556640625, -2.687255859375, -2.3299560546875, -1.97265625, -1.6153564453125, -1.258056640625, -0.9007568359375, -0.54345703125, -0.1861572265625, 0.171142578125, 0.5284423828125, 0.8857421875, 1.2430419921875, 1.600341796875, 1.9576416015625, 2.31494140625, 2.6722412109375, 3.029541015625, 3.3868408203125, 3.744140625, 4.1014404296875, 4.458740234375, 4.8160400390625, 5.17333984375, 5.5306396484375, 5.887939453125, 6.2452392578125, 6.6025390625, 6.9598388671875, 7.317138671875, 7.6744384765625, 8.03173828125, 8.3890380859375, 8.746337890625, 9.1036376953125, 9.4609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 7.0, 22.0, 20.0, 20.0, 47.0, 69.0, 104.0, 157.0, 225.0, 404.0, 650.0, 1116.0, 1883.0, 3216.0, 6064.0, 11887.0, 26365.0, 64331.0, 179406.0, 391830.0, 221115.0, 78593.0, 31136.0, 14013.0, 7071.0, 3566.0, 2059.0, 1205.0, 727.0, 441.0, 276.0, 164.0, 128.0, 67.0, 61.0, 37.0, 21.0, 9.0, 16.0, 9.0, 0.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.40625, -24.650146484375, -23.89404296875, -23.137939453125, -22.3818359375, -21.625732421875, -20.86962890625, -20.113525390625, -19.357421875, -18.601318359375, -17.84521484375, -17.089111328125, -16.3330078125, -15.576904296875, -14.82080078125, -14.064697265625, -13.30859375, -12.552490234375, -11.79638671875, -11.040283203125, -10.2841796875, -9.528076171875, -8.77197265625, -8.015869140625, -7.259765625, -6.503662109375, -5.74755859375, -4.991455078125, -4.2353515625, -3.479248046875, -2.72314453125, -1.967041015625, -1.2109375, -0.454833984375, 0.30126953125, 1.057373046875, 1.8134765625, 2.569580078125, 3.32568359375, 4.081787109375, 4.837890625, 5.593994140625, 6.35009765625, 7.106201171875, 7.8623046875, 8.618408203125, 9.37451171875, 10.130615234375, 10.88671875, 11.642822265625, 12.39892578125, 13.155029296875, 13.9111328125, 14.667236328125, 15.42333984375, 16.179443359375, 16.935546875, 17.691650390625, 18.44775390625, 19.203857421875, 19.9599609375, 20.716064453125, 21.47216796875, 22.228271484375, 22.984375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 11.0, 17.0, 24.0, 42.0, 65.0, 93.0, 154.0, 216.0, 144.0, 63.0, 46.0, 36.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003326416015625, -0.0032374560832977295, -0.003148496150970459, -0.0030595362186431885, -0.002970576286315918, -0.0028816163539886475, -0.002792656421661377, -0.0027036964893341064, -0.002614736557006836, -0.0025257766246795654, -0.002436816692352295, -0.0023478567600250244, -0.002258896827697754, -0.0021699368953704834, -0.002080976963043213, -0.0019920170307159424, -0.0019030570983886719, -0.0018140971660614014, -0.0017251372337341309, -0.0016361773014068604, -0.0015472173690795898, -0.0014582574367523193, -0.0013692975044250488, -0.0012803375720977783, -0.0011913776397705078, -0.0011024177074432373, -0.0010134577751159668, -0.0009244978427886963, -0.0008355379104614258, -0.0007465779781341553, -0.0006576180458068848, -0.0005686581134796143, -0.00047969818115234375, -0.00039073824882507324, -0.00030177831649780273, -0.00021281838417053223, -0.00012385845184326172, -3.489851951599121e-05, 5.40614128112793e-05, 0.0001430213451385498, 0.0002319812774658203, 0.0003209412097930908, 0.00040990114212036133, 0.0004988610744476318, 0.0005878210067749023, 0.0006767809391021729, 0.0007657408714294434, 0.0008547008037567139, 0.0009436607360839844, 0.0010326206684112549, 0.0011215806007385254, 0.001210540533065796, 0.0012995004653930664, 0.001388460397720337, 0.0014774203300476074, 0.001566380262374878, 0.0016553401947021484, 0.001744300127029419, 0.0018332600593566895, 0.00192221999168396, 0.0020111799240112305, 0.002100139856338501, 0.0021890997886657715, 0.002278059720993042, 0.0023670196533203125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 9.0, 17.0, 21.0, 29.0, 49.0, 70.0, 88.0, 119.0, 183.0, 229.0, 369.0, 514.0, 792.0, 1138.0, 1822.0, 2757.0, 4577.0, 8046.0, 14943.0, 27852.0, 54969.0, 108646.0, 205049.0, 262843.0, 169153.0, 87224.0, 44508.0, 22724.0, 12135.0, 6664.0, 3806.0, 2380.0, 1647.0, 977.0, 647.0, 491.0, 339.0, 211.0, 152.0, 106.0, 70.0, 71.0, 34.0, 24.0, 12.0, 18.0, 8.0, 7.0, 8.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-21.984375, -21.324951171875, -20.66552734375, -20.006103515625, -19.3466796875, -18.687255859375, -18.02783203125, -17.368408203125, -16.708984375, -16.049560546875, -15.39013671875, -14.730712890625, -14.0712890625, -13.411865234375, -12.75244140625, -12.093017578125, -11.43359375, -10.774169921875, -10.11474609375, -9.455322265625, -8.7958984375, -8.136474609375, -7.47705078125, -6.817626953125, -6.158203125, -5.498779296875, -4.83935546875, -4.179931640625, -3.5205078125, -2.861083984375, -2.20166015625, -1.542236328125, -0.8828125, -0.223388671875, 0.43603515625, 1.095458984375, 1.7548828125, 2.414306640625, 3.07373046875, 3.733154296875, 4.392578125, 5.052001953125, 5.71142578125, 6.370849609375, 7.0302734375, 7.689697265625, 8.34912109375, 9.008544921875, 9.66796875, 10.327392578125, 10.98681640625, 11.646240234375, 12.3056640625, 12.965087890625, 13.62451171875, 14.283935546875, 14.943359375, 15.602783203125, 16.26220703125, 16.921630859375, 17.5810546875, 18.240478515625, 18.89990234375, 19.559326171875, 20.21875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 7.0, 3.0, 6.0, 6.0, 12.0, 15.0, 13.0, 18.0, 29.0, 30.0, 22.0, 28.0, 36.0, 40.0, 44.0, 55.0, 55.0, 57.0, 75.0, 79.0, 65.0, 52.0, 38.0, 34.0, 44.0, 23.0, 16.0, 20.0, 22.0, 10.0, 8.0, 9.0, 10.0, 3.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.6942138671875, -4.532958984375, -4.3717041015625, -4.21044921875, -4.0491943359375, -3.887939453125, -3.7266845703125, -3.5654296875, -3.4041748046875, -3.242919921875, -3.0816650390625, -2.92041015625, -2.7591552734375, -2.597900390625, -2.4366455078125, -2.275390625, -2.1141357421875, -1.952880859375, -1.7916259765625, -1.63037109375, -1.4691162109375, -1.307861328125, -1.1466064453125, -0.9853515625, -0.8240966796875, -0.662841796875, -0.5015869140625, -0.34033203125, -0.1790771484375, -0.017822265625, 0.1434326171875, 0.3046875, 0.4659423828125, 0.627197265625, 0.7884521484375, 0.94970703125, 1.1109619140625, 1.272216796875, 1.4334716796875, 1.5947265625, 1.7559814453125, 1.917236328125, 2.0784912109375, 2.23974609375, 2.4010009765625, 2.562255859375, 2.7235107421875, 2.884765625, 3.0460205078125, 3.207275390625, 3.3685302734375, 3.52978515625, 3.6910400390625, 3.852294921875, 4.0135498046875, 4.1748046875, 4.3360595703125, 4.497314453125, 4.6585693359375, 4.81982421875, 4.9810791015625, 5.142333984375, 5.3035888671875, 5.46484375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 11.0, 9.0, 11.0, 12.0, 16.0, 14.0, 15.0, 25.0, 33.0, 27.0, 40.0, 25.0, 49.0, 42.0, 57.0, 44.0, 35.0, 51.0, 55.0, 57.0, 49.0, 40.0, 40.0, 22.0, 23.0, 32.0, 18.0, 30.0, 28.0, 16.0, 10.0, 12.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.09552001953125, -15.579512596130371, -15.063505172729492, -14.547497749328613, -14.031490325927734, -13.515483856201172, -12.999476432800293, -12.483469009399414, -11.967461585998535, -11.451454162597656, -10.935446739196777, -10.419439315795898, -9.903432846069336, -9.38742446899414, -8.871417999267578, -8.3554105758667, -7.83940315246582, -7.323395729064941, -6.8073883056640625, -6.291381359100342, -5.775373935699463, -5.259366512298584, -4.743359565734863, -4.227352142333984, -3.7113447189331055, -3.1953372955322266, -2.6793301105499268, -2.163322925567627, -1.647315502166748, -1.1313080787658691, -0.6153008937835693, -0.09929370880126953, 0.41671180725097656, 0.9327191114425659, 1.4487264156341553, 1.9647337198257446, 2.480741024017334, 2.996748447418213, 3.5127556324005127, 4.0287628173828125, 4.544770240783691, 5.06077766418457, 5.576785087585449, 6.09279203414917, 6.608799457550049, 7.124806880950928, 7.640813827514648, 8.156821250915527, 8.672828674316406, 9.188836097717285, 9.704843521118164, 10.220850944519043, 10.736858367919922, 11.252864837646484, 11.768872261047363, 12.284879684448242, 12.800887107849121, 13.31689453125, 13.832901954650879, 14.348909378051758, 14.86491584777832, 15.380924224853516, 15.896930694580078, 16.41293716430664, 16.928945541381836]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 3.0, 6.0, 6.0, 2.0, 7.0, 6.0, 10.0, 15.0, 15.0, 10.0, 19.0, 21.0, 18.0, 26.0, 33.0, 37.0, 32.0, 44.0, 34.0, 37.0, 35.0, 38.0, 42.0, 37.0, 35.0, 41.0, 40.0, 41.0, 41.0, 36.0, 37.0, 29.0, 24.0, 26.0, 26.0, 20.0, 13.0, 10.0, 13.0, 7.0, 9.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.952642440795898, -13.499324798583984, -13.046008110046387, -12.592690467834473, -12.139372825622559, -11.686056137084961, -11.232738494873047, -10.779420852661133, -10.326103210449219, -9.872785568237305, -9.419468879699707, -8.966151237487793, -8.512833595275879, -8.059516906738281, -7.606199264526367, -7.152881622314453, -6.6995649337768555, -6.2462477684021, -5.7929301261901855, -5.33961296081543, -4.886295318603516, -4.43297815322876, -3.979660987854004, -3.526343584060669, -3.073026180267334, -2.619708776473999, -2.166391372680664, -1.7130742073059082, -1.2597568035125732, -0.8064393997192383, -0.3531222343444824, 0.10019516944885254, 0.5535135269165039, 1.0068309307098389, 1.4601482152938843, 1.9134654998779297, 2.3667829036712646, 2.8201003074645996, 3.2734174728393555, 3.7267348766326904, 4.180052280426025, 4.633369445800781, 5.086687088012695, 5.540004253387451, 5.993321418762207, 6.446639060974121, 6.899956226348877, 7.353273391723633, 7.806591033935547, 8.259908676147461, 8.713225364685059, 9.166543006896973, 9.619860649108887, 10.073177337646484, 10.526494979858398, 10.979812622070312, 11.433130264282227, 11.88644790649414, 12.339764595031738, 12.793082237243652, 13.246399879455566, 13.699716567993164, 14.153034210205078, 14.606351852416992, 15.05966854095459]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 9.0, 19.0, 22.0, 39.0, 62.0, 92.0, 175.0, 256.0, 397.0, 644.0, 973.0, 1574.0, 2273.0, 3475.0, 5285.0, 7899.0, 12141.0, 17453.0, 25131.0, 35556.0, 47829.0, 62482.0, 77710.0, 90574.0, 99334.0, 101233.0, 97204.0, 86832.0, 72143.0, 57100.0, 43216.0, 31285.0, 22294.0, 15237.0, 10461.0, 6948.0, 4629.0, 2974.0, 2004.0, 1275.0, 836.0, 534.0, 354.0, 218.0, 137.0, 76.0, 66.0, 29.0, 22.0, 17.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-12.1015625, -11.7152099609375, -11.328857421875, -10.9425048828125, -10.55615234375, -10.1697998046875, -9.783447265625, -9.3970947265625, -9.0107421875, -8.6243896484375, -8.238037109375, -7.8516845703125, -7.46533203125, -7.0789794921875, -6.692626953125, -6.3062744140625, -5.919921875, -5.5335693359375, -5.147216796875, -4.7608642578125, -4.37451171875, -3.9881591796875, -3.601806640625, -3.2154541015625, -2.8291015625, -2.4427490234375, -2.056396484375, -1.6700439453125, -1.28369140625, -0.8973388671875, -0.510986328125, -0.1246337890625, 0.26171875, 0.6480712890625, 1.034423828125, 1.4207763671875, 1.80712890625, 2.1934814453125, 2.579833984375, 2.9661865234375, 3.3525390625, 3.7388916015625, 4.125244140625, 4.5115966796875, 4.89794921875, 5.2843017578125, 5.670654296875, 6.0570068359375, 6.443359375, 6.8297119140625, 7.216064453125, 7.6024169921875, 7.98876953125, 8.3751220703125, 8.761474609375, 9.1478271484375, 9.5341796875, 9.9205322265625, 10.306884765625, 10.6932373046875, 11.07958984375, 11.4659423828125, 11.852294921875, 12.2386474609375, 12.625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 5.0, 10.0, 4.0, 6.0, 5.0, 10.0, 14.0, 18.0, 16.0, 19.0, 28.0, 24.0, 24.0, 23.0, 33.0, 35.0, 27.0, 43.0, 35.0, 45.0, 42.0, 36.0, 45.0, 37.0, 38.0, 29.0, 32.0, 37.0, 37.0, 27.0, 29.0, 26.0, 24.0, 16.0, 30.0, 13.0, 12.0, 18.0, 19.0, 1.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.205322265625, -11.76220703125, -11.319091796875, -10.8759765625, -10.432861328125, -9.98974609375, -9.546630859375, -9.103515625, -8.660400390625, -8.21728515625, -7.774169921875, -7.3310546875, -6.887939453125, -6.44482421875, -6.001708984375, -5.55859375, -5.115478515625, -4.67236328125, -4.229248046875, -3.7861328125, -3.343017578125, -2.89990234375, -2.456787109375, -2.013671875, -1.570556640625, -1.12744140625, -0.684326171875, -0.2412109375, 0.201904296875, 0.64501953125, 1.088134765625, 1.53125, 1.974365234375, 2.41748046875, 2.860595703125, 3.3037109375, 3.746826171875, 4.18994140625, 4.633056640625, 5.076171875, 5.519287109375, 5.96240234375, 6.405517578125, 6.8486328125, 7.291748046875, 7.73486328125, 8.177978515625, 8.62109375, 9.064208984375, 9.50732421875, 9.950439453125, 10.3935546875, 10.836669921875, 11.27978515625, 11.722900390625, 12.166015625, 12.609130859375, 13.05224609375, 13.495361328125, 13.9384765625, 14.381591796875, 14.82470703125, 15.267822265625, 15.7109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 6.0, 21.0, 28.0, 38.0, 68.0, 111.0, 159.0, 269.0, 391.0, 607.0, 964.0, 1537.0, 2281.0, 3403.0, 5362.0, 7932.0, 11793.0, 16897.0, 24198.0, 33251.0, 45020.0, 57825.0, 71790.0, 84357.0, 93920.0, 97650.0, 95779.0, 87022.0, 75300.0, 61790.0, 48304.0, 36251.0, 26418.0, 18807.0, 13016.0, 8952.0, 5861.0, 3954.0, 2585.0, 1619.0, 1076.0, 691.0, 430.0, 285.0, 210.0, 139.0, 68.0, 37.0, 25.0, 23.0, 18.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.890625, -11.5147705078125, -11.138916015625, -10.7630615234375, -10.38720703125, -10.0113525390625, -9.635498046875, -9.2596435546875, -8.8837890625, -8.5079345703125, -8.132080078125, -7.7562255859375, -7.38037109375, -7.0045166015625, -6.628662109375, -6.2528076171875, -5.876953125, -5.5010986328125, -5.125244140625, -4.7493896484375, -4.37353515625, -3.9976806640625, -3.621826171875, -3.2459716796875, -2.8701171875, -2.4942626953125, -2.118408203125, -1.7425537109375, -1.36669921875, -0.9908447265625, -0.614990234375, -0.2391357421875, 0.13671875, 0.5125732421875, 0.888427734375, 1.2642822265625, 1.64013671875, 2.0159912109375, 2.391845703125, 2.7677001953125, 3.1435546875, 3.5194091796875, 3.895263671875, 4.2711181640625, 4.64697265625, 5.0228271484375, 5.398681640625, 5.7745361328125, 6.150390625, 6.5262451171875, 6.902099609375, 7.2779541015625, 7.65380859375, 8.0296630859375, 8.405517578125, 8.7813720703125, 9.1572265625, 9.5330810546875, 9.908935546875, 10.2847900390625, 10.66064453125, 11.0364990234375, 11.412353515625, 11.7882080078125, 12.1640625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 11.0, 12.0, 5.0, 12.0, 19.0, 13.0, 19.0, 18.0, 22.0, 32.0, 38.0, 30.0, 40.0, 30.0, 41.0, 42.0, 52.0, 52.0, 47.0, 36.0, 53.0, 45.0, 49.0, 34.0, 34.0, 29.0, 34.0, 35.0, 25.0, 20.0, 17.0, 7.0, 11.0, 16.0, 13.0, 1.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.336181640625, -9.99267578125, -9.649169921875, -9.3056640625, -8.962158203125, -8.61865234375, -8.275146484375, -7.931640625, -7.588134765625, -7.24462890625, -6.901123046875, -6.5576171875, -6.214111328125, -5.87060546875, -5.527099609375, -5.18359375, -4.840087890625, -4.49658203125, -4.153076171875, -3.8095703125, -3.466064453125, -3.12255859375, -2.779052734375, -2.435546875, -2.092041015625, -1.74853515625, -1.405029296875, -1.0615234375, -0.718017578125, -0.37451171875, -0.031005859375, 0.3125, 0.656005859375, 0.99951171875, 1.343017578125, 1.6865234375, 2.030029296875, 2.37353515625, 2.717041015625, 3.060546875, 3.404052734375, 3.74755859375, 4.091064453125, 4.4345703125, 4.778076171875, 5.12158203125, 5.465087890625, 5.80859375, 6.152099609375, 6.49560546875, 6.839111328125, 7.1826171875, 7.526123046875, 7.86962890625, 8.213134765625, 8.556640625, 8.900146484375, 9.24365234375, 9.587158203125, 9.9306640625, 10.274169921875, 10.61767578125, 10.961181640625, 11.3046875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 17.0, 24.0, 32.0, 38.0, 35.0, 63.0, 72.0, 87.0, 141.0, 164.0, 216.0, 286.0, 380.0, 543.0, 880.0, 1257.0, 2014.0, 3517.0, 6968.0, 14027.0, 29623.0, 61003.0, 116063.0, 184287.0, 218175.0, 179990.0, 112069.0, 58449.0, 28563.0, 13416.0, 6635.0, 3472.0, 1897.0, 1203.0, 821.0, 545.0, 401.0, 268.0, 217.0, 165.0, 124.0, 86.0, 75.0, 51.0, 56.0, 45.0, 23.0, 19.0, 12.0, 7.0, 6.0, 5.0, 5.0, 7.0, 3.0], "bins": [-10.9453125, -10.6182861328125, -10.291259765625, -9.9642333984375, -9.63720703125, -9.3101806640625, -8.983154296875, -8.6561279296875, -8.3291015625, -8.0020751953125, -7.675048828125, -7.3480224609375, -7.02099609375, -6.6939697265625, -6.366943359375, -6.0399169921875, -5.712890625, -5.3858642578125, -5.058837890625, -4.7318115234375, -4.40478515625, -4.0777587890625, -3.750732421875, -3.4237060546875, -3.0966796875, -2.7696533203125, -2.442626953125, -2.1156005859375, -1.78857421875, -1.4615478515625, -1.134521484375, -0.8074951171875, -0.48046875, -0.1534423828125, 0.173583984375, 0.5006103515625, 0.82763671875, 1.1546630859375, 1.481689453125, 1.8087158203125, 2.1357421875, 2.4627685546875, 2.789794921875, 3.1168212890625, 3.44384765625, 3.7708740234375, 4.097900390625, 4.4249267578125, 4.751953125, 5.0789794921875, 5.406005859375, 5.7330322265625, 6.06005859375, 6.3870849609375, 6.714111328125, 7.0411376953125, 7.3681640625, 7.6951904296875, 8.022216796875, 8.3492431640625, 8.67626953125, 9.0032958984375, 9.330322265625, 9.6573486328125, 9.984375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 13.0, 13.0, 13.0, 13.0, 18.0, 23.0, 31.0, 44.0, 38.0, 43.0, 52.0, 53.0, 62.0, 52.0, 68.0, 58.0, 54.0, 54.0, 43.0, 50.0, 40.0, 38.0, 28.0, 23.0, 12.0, 17.0, 11.0, 4.0, 9.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009183883666992188, -0.0008923634886741638, -0.0008663386106491089, -0.000840313732624054, -0.000814288854598999, -0.0007882639765739441, -0.0007622390985488892, -0.0007362142205238342, -0.0007101893424987793, -0.0006841644644737244, -0.0006581395864486694, -0.0006321147084236145, -0.0006060898303985596, -0.0005800649523735046, -0.0005540400743484497, -0.0005280151963233948, -0.0005019903182983398, -0.0004759654402732849, -0.00044994056224823, -0.00042391568422317505, -0.0003978908061981201, -0.0003718659281730652, -0.00034584105014801025, -0.0003198161721229553, -0.0002937912940979004, -0.00026776641607284546, -0.00024174153804779053, -0.0002157166600227356, -0.00018969178199768066, -0.00016366690397262573, -0.0001376420259475708, -0.00011161714792251587, -8.559226989746094e-05, -5.9567391872406006e-05, -3.3542513847351074e-05, -7.517635822296143e-06, 1.850724220275879e-05, 4.453212022781372e-05, 7.055699825286865e-05, 9.658187627792358e-05, 0.00012260675430297852, 0.00014863163232803345, 0.00017465651035308838, 0.0002006813883781433, 0.00022670626640319824, 0.0002527311444282532, 0.0002787560224533081, 0.00030478090047836304, 0.00033080577850341797, 0.0003568306565284729, 0.00038285553455352783, 0.00040888041257858276, 0.0004349052906036377, 0.0004609301686286926, 0.00048695504665374756, 0.0005129799246788025, 0.0005390048027038574, 0.0005650296807289124, 0.0005910545587539673, 0.0006170794367790222, 0.0006431043148040771, 0.0006691291928291321, 0.000695154070854187, 0.0007211789488792419, 0.0007472038269042969]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 8.0, 15.0, 13.0, 32.0, 39.0, 46.0, 77.0, 100.0, 134.0, 182.0, 258.0, 391.0, 536.0, 747.0, 1174.0, 1964.0, 3357.0, 6497.0, 13682.0, 29485.0, 61482.0, 116600.0, 184190.0, 216533.0, 180988.0, 113641.0, 59414.0, 28526.0, 13192.0, 6234.0, 3330.0, 1883.0, 1221.0, 735.0, 537.0, 397.0, 251.0, 168.0, 121.0, 109.0, 83.0, 61.0, 32.0, 27.0, 20.0, 7.0, 12.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.561279296875, -9.24755859375, -8.933837890625, -8.6201171875, -8.306396484375, -7.99267578125, -7.678955078125, -7.365234375, -7.051513671875, -6.73779296875, -6.424072265625, -6.1103515625, -5.796630859375, -5.48291015625, -5.169189453125, -4.85546875, -4.541748046875, -4.22802734375, -3.914306640625, -3.6005859375, -3.286865234375, -2.97314453125, -2.659423828125, -2.345703125, -2.031982421875, -1.71826171875, -1.404541015625, -1.0908203125, -0.777099609375, -0.46337890625, -0.149658203125, 0.1640625, 0.477783203125, 0.79150390625, 1.105224609375, 1.4189453125, 1.732666015625, 2.04638671875, 2.360107421875, 2.673828125, 2.987548828125, 3.30126953125, 3.614990234375, 3.9287109375, 4.242431640625, 4.55615234375, 4.869873046875, 5.18359375, 5.497314453125, 5.81103515625, 6.124755859375, 6.4384765625, 6.752197265625, 7.06591796875, 7.379638671875, 7.693359375, 8.007080078125, 8.32080078125, 8.634521484375, 8.9482421875, 9.261962890625, 9.57568359375, 9.889404296875, 10.203125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 9.0, 7.0, 13.0, 10.0, 10.0, 17.0, 27.0, 44.0, 40.0, 58.0, 63.0, 71.0, 57.0, 72.0, 69.0, 70.0, 67.0, 61.0, 42.0, 41.0, 36.0, 24.0, 26.0, 12.0, 10.0, 8.0, 8.0, 2.0, 8.0, 2.0, 1.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.0831298828125, -2.982666015625, -2.8822021484375, -2.78173828125, -2.6812744140625, -2.580810546875, -2.4803466796875, -2.3798828125, -2.2794189453125, -2.178955078125, -2.0784912109375, -1.97802734375, -1.8775634765625, -1.777099609375, -1.6766357421875, -1.576171875, -1.4757080078125, -1.375244140625, -1.2747802734375, -1.17431640625, -1.0738525390625, -0.973388671875, -0.8729248046875, -0.7724609375, -0.6719970703125, -0.571533203125, -0.4710693359375, -0.37060546875, -0.2701416015625, -0.169677734375, -0.0692138671875, 0.03125, 0.1317138671875, 0.232177734375, 0.3326416015625, 0.43310546875, 0.5335693359375, 0.634033203125, 0.7344970703125, 0.8349609375, 0.9354248046875, 1.035888671875, 1.1363525390625, 1.23681640625, 1.3372802734375, 1.437744140625, 1.5382080078125, 1.638671875, 1.7391357421875, 1.839599609375, 1.9400634765625, 2.04052734375, 2.1409912109375, 2.241455078125, 2.3419189453125, 2.4423828125, 2.5428466796875, 2.643310546875, 2.7437744140625, 2.84423828125, 2.9447021484375, 3.045166015625, 3.1456298828125, 3.24609375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 2.0, 8.0, 10.0, 9.0, 12.0, 16.0, 14.0, 26.0, 33.0, 21.0, 28.0, 48.0, 42.0, 58.0, 44.0, 35.0, 56.0, 64.0, 57.0, 59.0, 56.0, 40.0, 38.0, 32.0, 27.0, 38.0, 26.0, 17.0, 21.0, 10.0, 13.0, 7.0, 6.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.244752883911133, -17.66324806213379, -17.081741333007812, -16.50023651123047, -15.918730735778809, -15.337224960327148, -14.755720138549805, -14.174214363098145, -13.592708587646484, -13.011202812194824, -12.42969799041748, -11.84819221496582, -11.26668643951416, -10.6851806640625, -10.103675842285156, -9.522170066833496, -8.940665245056152, -8.359159469604492, -7.77765417098999, -7.196148872375488, -6.614643096923828, -6.033137798309326, -5.451632499694824, -4.870126724243164, -4.288621425628662, -3.707115888595581, -3.1256103515625, -2.544105052947998, -1.962599515914917, -1.381093978881836, -0.799588680267334, -0.21808290481567383, 0.3634223937988281, 0.9449278712272644, 1.5264333486557007, 2.107938766479492, 2.6894443035125732, 3.2709498405456543, 3.8524551391601562, 4.433960914611816, 5.015466213226318, 5.59697151184082, 6.1784772872924805, 6.759982585906982, 7.341487884521484, 7.9229936599731445, 8.504499435424805, 9.086004257202148, 9.667510032653809, 10.249015808105469, 10.830520629882812, 11.412026405334473, 11.993532180786133, 12.575037002563477, 13.156542778015137, 13.738048553466797, 14.31955337524414, 14.9010591506958, 15.482563972473145, 16.064069747924805, 16.64557456970215, 17.227081298828125, 17.80858612060547, 18.390090942382812, 18.97159767150879]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 3.0, 7.0, 6.0, 9.0, 9.0, 6.0, 8.0, 18.0, 14.0, 18.0, 24.0, 26.0, 31.0, 25.0, 31.0, 27.0, 45.0, 32.0, 49.0, 39.0, 29.0, 36.0, 42.0, 43.0, 30.0, 46.0, 37.0, 36.0, 42.0, 31.0, 31.0, 35.0, 17.0, 20.0, 12.0, 16.0, 16.0, 9.0, 10.0, 10.0, 7.0, 5.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.138433456420898, -12.680917739868164, -12.22340202331543, -11.765886306762695, -11.308371543884277, -10.850855827331543, -10.393340110778809, -9.935824394226074, -9.478309631347656, -9.020793914794922, -8.563278198242188, -8.105762481689453, -7.648247718811035, -7.190732002258301, -6.733216285705566, -6.275700569152832, -5.818184852600098, -5.360669136047363, -4.903153896331787, -4.445638179779053, -3.9881227016448975, -3.530607223510742, -3.073091506958008, -2.6155760288238525, -2.1580605506896973, -1.700545072555542, -1.2430294752120972, -0.7855138778686523, -0.32799839973449707, 0.1295170783996582, 0.5870327949523926, 1.0445482730865479, 1.5020637512207031, 1.9595792293548584, 2.4170947074890137, 2.874610424041748, 3.3321259021759033, 3.7896413803100586, 4.247157096862793, 4.704672813415527, 5.1621880531311035, 5.619703769683838, 6.077219009399414, 6.534734725952148, 6.992250442504883, 7.449765682220459, 7.907281398773193, 8.36479663848877, 8.822312355041504, 9.279828071594238, 9.737343788146973, 10.19485855102539, 10.652374267578125, 11.10988998413086, 11.567405700683594, 12.024921417236328, 12.482437133789062, 12.939952850341797, 13.397468566894531, 13.854984283447266, 14.312499046325684, 14.770014762878418, 15.227530479431152, 15.685046195983887, 16.142560958862305]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 7.0, 16.0, 42.0, 48.0, 65.0, 84.0, 125.0, 210.0, 357.0, 556.0, 820.0, 1328.0, 1984.0, 3214.0, 4926.0, 7815.0, 12436.0, 19354.0, 30612.0, 49219.0, 77883.0, 122332.0, 189632.0, 287167.0, 410395.0, 528018.0, 584879.0, 543116.0, 434057.0, 310689.0, 208451.0, 134616.0, 85880.0, 53642.0, 33764.0, 21111.0, 13227.0, 8231.0, 5101.0, 3298.0, 2009.0, 1301.0, 810.0, 528.0, 330.0, 228.0, 148.0, 85.0, 54.0, 24.0, 20.0, 21.0, 10.0, 9.0, 2.0, 1.0, 4.0, 3.0], "bins": [-14.2265625, -13.7900390625, -13.353515625, -12.9169921875, -12.48046875, -12.0439453125, -11.607421875, -11.1708984375, -10.734375, -10.2978515625, -9.861328125, -9.4248046875, -8.98828125, -8.5517578125, -8.115234375, -7.6787109375, -7.2421875, -6.8056640625, -6.369140625, -5.9326171875, -5.49609375, -5.0595703125, -4.623046875, -4.1865234375, -3.75, -3.3134765625, -2.876953125, -2.4404296875, -2.00390625, -1.5673828125, -1.130859375, -0.6943359375, -0.2578125, 0.1787109375, 0.615234375, 1.0517578125, 1.48828125, 1.9248046875, 2.361328125, 2.7978515625, 3.234375, 3.6708984375, 4.107421875, 4.5439453125, 4.98046875, 5.4169921875, 5.853515625, 6.2900390625, 6.7265625, 7.1630859375, 7.599609375, 8.0361328125, 8.47265625, 8.9091796875, 9.345703125, 9.7822265625, 10.21875, 10.6552734375, 11.091796875, 11.5283203125, 11.96484375, 12.4013671875, 12.837890625, 13.2744140625, 13.7109375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 5.0, 10.0, 7.0, 7.0, 8.0, 14.0, 14.0, 21.0, 22.0, 18.0, 18.0, 28.0, 26.0, 29.0, 23.0, 31.0, 56.0, 24.0, 43.0, 42.0, 38.0, 41.0, 33.0, 45.0, 38.0, 36.0, 39.0, 34.0, 24.0, 33.0, 20.0, 25.0, 18.0, 24.0, 14.0, 14.0, 16.0, 7.0, 11.0, 7.0, 10.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.0, -10.6644287109375, -10.328857421875, -9.9932861328125, -9.65771484375, -9.3221435546875, -8.986572265625, -8.6510009765625, -8.3154296875, -7.9798583984375, -7.644287109375, -7.3087158203125, -6.97314453125, -6.6375732421875, -6.302001953125, -5.9664306640625, -5.630859375, -5.2952880859375, -4.959716796875, -4.6241455078125, -4.28857421875, -3.9530029296875, -3.617431640625, -3.2818603515625, -2.9462890625, -2.6107177734375, -2.275146484375, -1.9395751953125, -1.60400390625, -1.2684326171875, -0.932861328125, -0.5972900390625, -0.26171875, 0.0738525390625, 0.409423828125, 0.7449951171875, 1.08056640625, 1.4161376953125, 1.751708984375, 2.0872802734375, 2.4228515625, 2.7584228515625, 3.093994140625, 3.4295654296875, 3.76513671875, 4.1007080078125, 4.436279296875, 4.7718505859375, 5.107421875, 5.4429931640625, 5.778564453125, 6.1141357421875, 6.44970703125, 6.7852783203125, 7.120849609375, 7.4564208984375, 7.7919921875, 8.1275634765625, 8.463134765625, 8.7987060546875, 9.13427734375, 9.4698486328125, 9.805419921875, 10.1409912109375, 10.4765625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 16.0, 25.0, 40.0, 58.0, 128.0, 189.0, 349.0, 589.0, 964.0, 1659.0, 2805.0, 4791.0, 8255.0, 14045.0, 23367.0, 38938.0, 64335.0, 103107.0, 162183.0, 242559.0, 341786.0, 445607.0, 520355.0, 536264.0, 484148.0, 389136.0, 286153.0, 194898.0, 126454.0, 80054.0, 48986.0, 29531.0, 17549.0, 10510.0, 6110.0, 3473.0, 2022.0, 1169.0, 724.0, 380.0, 241.0, 127.0, 73.0, 40.0, 31.0, 34.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.3359375, -12.9088134765625, -12.481689453125, -12.0545654296875, -11.62744140625, -11.2003173828125, -10.773193359375, -10.3460693359375, -9.9189453125, -9.4918212890625, -9.064697265625, -8.6375732421875, -8.21044921875, -7.7833251953125, -7.356201171875, -6.9290771484375, -6.501953125, -6.0748291015625, -5.647705078125, -5.2205810546875, -4.79345703125, -4.3663330078125, -3.939208984375, -3.5120849609375, -3.0849609375, -2.6578369140625, -2.230712890625, -1.8035888671875, -1.37646484375, -0.9493408203125, -0.522216796875, -0.0950927734375, 0.33203125, 0.7591552734375, 1.186279296875, 1.6134033203125, 2.04052734375, 2.4676513671875, 2.894775390625, 3.3218994140625, 3.7490234375, 4.1761474609375, 4.603271484375, 5.0303955078125, 5.45751953125, 5.8846435546875, 6.311767578125, 6.7388916015625, 7.166015625, 7.5931396484375, 8.020263671875, 8.4473876953125, 8.87451171875, 9.3016357421875, 9.728759765625, 10.1558837890625, 10.5830078125, 11.0101318359375, 11.437255859375, 11.8643798828125, 12.29150390625, 12.7186279296875, 13.145751953125, 13.5728759765625, 14.0]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 12.0, 9.0, 14.0, 19.0, 20.0, 26.0, 35.0, 35.0, 39.0, 55.0, 63.0, 73.0, 108.0, 115.0, 105.0, 126.0, 163.0, 186.0, 168.0, 207.0, 191.0, 207.0, 206.0, 198.0, 213.0, 191.0, 173.0, 172.0, 148.0, 119.0, 117.0, 89.0, 83.0, 73.0, 51.0, 66.0, 39.0, 30.0, 32.0, 12.0, 19.0, 18.0, 14.0, 11.0, 5.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0], "bins": [-6.17578125, -5.999267578125, -5.82275390625, -5.646240234375, -5.4697265625, -5.293212890625, -5.11669921875, -4.940185546875, -4.763671875, -4.587158203125, -4.41064453125, -4.234130859375, -4.0576171875, -3.881103515625, -3.70458984375, -3.528076171875, -3.3515625, -3.175048828125, -2.99853515625, -2.822021484375, -2.6455078125, -2.468994140625, -2.29248046875, -2.115966796875, -1.939453125, -1.762939453125, -1.58642578125, -1.409912109375, -1.2333984375, -1.056884765625, -0.88037109375, -0.703857421875, -0.52734375, -0.350830078125, -0.17431640625, 0.002197265625, 0.1787109375, 0.355224609375, 0.53173828125, 0.708251953125, 0.884765625, 1.061279296875, 1.23779296875, 1.414306640625, 1.5908203125, 1.767333984375, 1.94384765625, 2.120361328125, 2.296875, 2.473388671875, 2.64990234375, 2.826416015625, 3.0029296875, 3.179443359375, 3.35595703125, 3.532470703125, 3.708984375, 3.885498046875, 4.06201171875, 4.238525390625, 4.4150390625, 4.591552734375, 4.76806640625, 4.944580078125, 5.12109375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 8.0, 7.0, 5.0, 16.0, 14.0, 14.0, 22.0, 22.0, 32.0, 34.0, 41.0, 44.0, 44.0, 63.0, 56.0, 47.0, 60.0, 46.0, 43.0, 45.0, 55.0, 45.0, 37.0, 30.0, 26.0, 29.0, 26.0, 20.0, 20.0, 11.0, 8.0, 2.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0], "bins": [-20.975299835205078, -20.428804397583008, -19.882308959960938, -19.335811614990234, -18.789316177368164, -18.242820739746094, -17.69632339477539, -17.14982795715332, -16.60333251953125, -16.05683708190918, -15.510340690612793, -14.963844299316406, -14.417348861694336, -13.870853424072266, -13.324357032775879, -12.777860641479492, -12.231365203857422, -11.684869766235352, -11.138373374938965, -10.591876983642578, -10.045381546020508, -9.498886108398438, -8.95238971710205, -8.405893325805664, -7.859397888183594, -7.312901973724365, -6.766406059265137, -6.219910144805908, -5.67341423034668, -5.126918315887451, -4.580422401428223, -4.033926486968994, -3.4874324798583984, -2.94093656539917, -2.3944406509399414, -1.847944736480713, -1.3014488220214844, -0.7549529075622559, -0.20845699310302734, 0.33803892135620117, 0.8845348358154297, 1.4310307502746582, 1.9775266647338867, 2.5240225791931152, 3.0705184936523438, 3.6170144081115723, 4.163510322570801, 4.710006237030029, 5.256502151489258, 5.802998065948486, 6.349493980407715, 6.895989894866943, 7.442485809326172, 7.9889817237854, 8.535477638244629, 9.081974029541016, 9.628469467163086, 10.174964904785156, 10.721461296081543, 11.26795768737793, 11.814453125, 12.36094856262207, 12.907444953918457, 13.453941345214844, 14.000436782836914]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 5.0, 8.0, 2.0, 2.0, 8.0, 10.0, 9.0, 8.0, 19.0, 15.0, 14.0, 23.0, 21.0, 28.0, 27.0, 35.0, 36.0, 25.0, 37.0, 38.0, 35.0, 46.0, 33.0, 47.0, 40.0, 34.0, 31.0, 45.0, 39.0, 35.0, 29.0, 27.0, 25.0, 25.0, 22.0, 20.0, 20.0, 17.0, 12.0, 14.0, 14.0, 5.0, 7.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.884172439575195, -13.466789245605469, -13.049405097961426, -12.6320219039917, -12.214637756347656, -11.79725456237793, -11.379871368408203, -10.96248722076416, -10.545103073120117, -10.12771987915039, -9.710335731506348, -9.292952537536621, -8.875568389892578, -8.458185195922852, -8.040802001953125, -7.623417854309082, -7.2060346603393555, -6.788650989532471, -6.371267318725586, -5.953884124755859, -5.536499977111816, -5.11911678314209, -4.701733112335205, -4.28434944152832, -3.8669657707214355, -3.449582099914551, -3.032198429107666, -2.6148149967193604, -2.1974313259124756, -1.7800476551055908, -1.3626642227172852, -0.9452805519104004, -0.5278959274291992, -0.11051231622695923, 0.30687129497528076, 0.724254846572876, 1.1416385173797607, 1.5590221881866455, 1.9764056205749512, 2.393789291381836, 2.8111729621887207, 3.2285566329956055, 3.6459403038024902, 4.063323974609375, 4.480707168579102, 4.8980913162231445, 5.315474510192871, 5.732858180999756, 6.150241851806641, 6.567625522613525, 6.98500919342041, 7.402392387390137, 7.81977653503418, 8.237159729003906, 8.654542922973633, 9.071927070617676, 9.489311218261719, 9.906694412231445, 10.324078559875488, 10.741461753845215, 11.158845901489258, 11.576229095458984, 11.993612289428711, 12.410996437072754, 12.82837963104248]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 16.0, 16.0, 21.0, 43.0, 47.0, 105.0, 169.0, 215.0, 315.0, 530.0, 788.0, 1181.0, 1954.0, 2954.0, 4736.0, 7380.0, 11715.0, 18508.0, 28700.0, 43320.0, 63115.0, 88371.0, 113595.0, 132281.0, 133636.0, 114799.0, 90018.0, 64541.0, 44099.0, 29312.0, 18745.0, 12268.0, 7590.0, 4853.0, 3040.0, 2007.0, 1246.0, 812.0, 516.0, 327.0, 244.0, 142.0, 84.0, 76.0, 45.0, 22.0, 20.0, 15.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-25.90625, -25.097412109375, -24.28857421875, -23.479736328125, -22.6708984375, -21.862060546875, -21.05322265625, -20.244384765625, -19.435546875, -18.626708984375, -17.81787109375, -17.009033203125, -16.2001953125, -15.391357421875, -14.58251953125, -13.773681640625, -12.96484375, -12.156005859375, -11.34716796875, -10.538330078125, -9.7294921875, -8.920654296875, -8.11181640625, -7.302978515625, -6.494140625, -5.685302734375, -4.87646484375, -4.067626953125, -3.2587890625, -2.449951171875, -1.64111328125, -0.832275390625, -0.0234375, 0.785400390625, 1.59423828125, 2.403076171875, 3.2119140625, 4.020751953125, 4.82958984375, 5.638427734375, 6.447265625, 7.256103515625, 8.06494140625, 8.873779296875, 9.6826171875, 10.491455078125, 11.30029296875, 12.109130859375, 12.91796875, 13.726806640625, 14.53564453125, 15.344482421875, 16.1533203125, 16.962158203125, 17.77099609375, 18.579833984375, 19.388671875, 20.197509765625, 21.00634765625, 21.815185546875, 22.6240234375, 23.432861328125, 24.24169921875, 25.050537109375, 25.859375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 10.0, 6.0, 7.0, 9.0, 12.0, 10.0, 14.0, 21.0, 21.0, 26.0, 30.0, 32.0, 33.0, 34.0, 29.0, 46.0, 42.0, 39.0, 42.0, 41.0, 39.0, 34.0, 43.0, 41.0, 46.0, 43.0, 33.0, 26.0, 34.0, 26.0, 22.0, 20.0, 13.0, 14.0, 15.0, 15.0, 8.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.765625, -13.3812255859375, -12.996826171875, -12.6124267578125, -12.22802734375, -11.8436279296875, -11.459228515625, -11.0748291015625, -10.6904296875, -10.3060302734375, -9.921630859375, -9.5372314453125, -9.15283203125, -8.7684326171875, -8.384033203125, -7.9996337890625, -7.615234375, -7.2308349609375, -6.846435546875, -6.4620361328125, -6.07763671875, -5.6932373046875, -5.308837890625, -4.9244384765625, -4.5400390625, -4.1556396484375, -3.771240234375, -3.3868408203125, -3.00244140625, -2.6180419921875, -2.233642578125, -1.8492431640625, -1.46484375, -1.0804443359375, -0.696044921875, -0.3116455078125, 0.07275390625, 0.4571533203125, 0.841552734375, 1.2259521484375, 1.6103515625, 1.9947509765625, 2.379150390625, 2.7635498046875, 3.14794921875, 3.5323486328125, 3.916748046875, 4.3011474609375, 4.685546875, 5.0699462890625, 5.454345703125, 5.8387451171875, 6.22314453125, 6.6075439453125, 6.991943359375, 7.3763427734375, 7.7607421875, 8.1451416015625, 8.529541015625, 8.9139404296875, 9.29833984375, 9.6827392578125, 10.067138671875, 10.4515380859375, 10.8359375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 19.0, 17.0, 21.0, 40.0, 41.0, 78.0, 107.0, 163.0, 236.0, 368.0, 594.0, 793.0, 1343.0, 1988.0, 3042.0, 4708.0, 7688.0, 12111.0, 19245.0, 31756.0, 53017.0, 88258.0, 141540.0, 190333.0, 177708.0, 121777.0, 74616.0, 44897.0, 27058.0, 16522.0, 10287.0, 6493.0, 4011.0, 2566.0, 1764.0, 1110.0, 722.0, 486.0, 329.0, 227.0, 165.0, 113.0, 68.0, 37.0, 29.0, 21.0, 9.0, 10.0, 6.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0], "bins": [-27.796875, -26.9501953125, -26.103515625, -25.2568359375, -24.41015625, -23.5634765625, -22.716796875, -21.8701171875, -21.0234375, -20.1767578125, -19.330078125, -18.4833984375, -17.63671875, -16.7900390625, -15.943359375, -15.0966796875, -14.25, -13.4033203125, -12.556640625, -11.7099609375, -10.86328125, -10.0166015625, -9.169921875, -8.3232421875, -7.4765625, -6.6298828125, -5.783203125, -4.9365234375, -4.08984375, -3.2431640625, -2.396484375, -1.5498046875, -0.703125, 0.1435546875, 0.990234375, 1.8369140625, 2.68359375, 3.5302734375, 4.376953125, 5.2236328125, 6.0703125, 6.9169921875, 7.763671875, 8.6103515625, 9.45703125, 10.3037109375, 11.150390625, 11.9970703125, 12.84375, 13.6904296875, 14.537109375, 15.3837890625, 16.23046875, 17.0771484375, 17.923828125, 18.7705078125, 19.6171875, 20.4638671875, 21.310546875, 22.1572265625, 23.00390625, 23.8505859375, 24.697265625, 25.5439453125, 26.390625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 5.0, 15.0, 16.0, 16.0, 17.0, 27.0, 27.0, 27.0, 26.0, 27.0, 36.0, 38.0, 46.0, 31.0, 41.0, 42.0, 41.0, 37.0, 40.0, 38.0, 53.0, 34.0, 38.0, 38.0, 30.0, 25.0, 28.0, 17.0, 16.0, 16.0, 20.0, 14.0, 11.0, 8.0, 5.0, 5.0, 7.0, 0.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.6953125, -8.4195556640625, -8.143798828125, -7.8680419921875, -7.59228515625, -7.3165283203125, -7.040771484375, -6.7650146484375, -6.4892578125, -6.2135009765625, -5.937744140625, -5.6619873046875, -5.38623046875, -5.1104736328125, -4.834716796875, -4.5589599609375, -4.283203125, -4.0074462890625, -3.731689453125, -3.4559326171875, -3.18017578125, -2.9044189453125, -2.628662109375, -2.3529052734375, -2.0771484375, -1.8013916015625, -1.525634765625, -1.2498779296875, -0.97412109375, -0.6983642578125, -0.422607421875, -0.1468505859375, 0.12890625, 0.4046630859375, 0.680419921875, 0.9561767578125, 1.23193359375, 1.5076904296875, 1.783447265625, 2.0592041015625, 2.3349609375, 2.6107177734375, 2.886474609375, 3.1622314453125, 3.43798828125, 3.7137451171875, 3.989501953125, 4.2652587890625, 4.541015625, 4.8167724609375, 5.092529296875, 5.3682861328125, 5.64404296875, 5.9197998046875, 6.195556640625, 6.4713134765625, 6.7470703125, 7.0228271484375, 7.298583984375, 7.5743408203125, 7.85009765625, 8.1258544921875, 8.401611328125, 8.6773681640625, 8.953125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 1.0, 4.0, 8.0, 10.0, 14.0, 14.0, 23.0, 38.0, 78.0, 87.0, 171.0, 227.0, 348.0, 527.0, 857.0, 1293.0, 2060.0, 3468.0, 5846.0, 10794.0, 21462.0, 52023.0, 198685.0, 550550.0, 122181.0, 38349.0, 17388.0, 9040.0, 5067.0, 2978.0, 1786.0, 1116.0, 721.0, 467.0, 269.0, 205.0, 120.0, 90.0, 59.0, 40.0, 30.0, 22.0, 9.0, 12.0, 6.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-84.875, -82.330078125, -79.78515625, -77.240234375, -74.6953125, -72.150390625, -69.60546875, -67.060546875, -64.515625, -61.970703125, -59.42578125, -56.880859375, -54.3359375, -51.791015625, -49.24609375, -46.701171875, -44.15625, -41.611328125, -39.06640625, -36.521484375, -33.9765625, -31.431640625, -28.88671875, -26.341796875, -23.796875, -21.251953125, -18.70703125, -16.162109375, -13.6171875, -11.072265625, -8.52734375, -5.982421875, -3.4375, -0.892578125, 1.65234375, 4.197265625, 6.7421875, 9.287109375, 11.83203125, 14.376953125, 16.921875, 19.466796875, 22.01171875, 24.556640625, 27.1015625, 29.646484375, 32.19140625, 34.736328125, 37.28125, 39.826171875, 42.37109375, 44.916015625, 47.4609375, 50.005859375, 52.55078125, 55.095703125, 57.640625, 60.185546875, 62.73046875, 65.275390625, 67.8203125, 70.365234375, 72.91015625, 75.455078125, 78.0]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 11.0, 11.0, 22.0, 19.0, 22.0, 51.0, 99.0, 190.0, 223.0, 119.0, 59.0, 43.0, 25.0, 17.0, 15.0, 13.0, 15.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00933837890625, -0.009047269821166992, -0.008756160736083984, -0.008465051651000977, -0.008173942565917969, -0.007882833480834961, -0.007591724395751953, -0.007300615310668945, -0.0070095062255859375, -0.00671839714050293, -0.006427288055419922, -0.006136178970336914, -0.005845069885253906, -0.0055539608001708984, -0.005262851715087891, -0.004971742630004883, -0.004680633544921875, -0.004389524459838867, -0.004098415374755859, -0.0038073062896728516, -0.0035161972045898438, -0.003225088119506836, -0.002933979034423828, -0.0026428699493408203, -0.0023517608642578125, -0.0020606517791748047, -0.0017695426940917969, -0.001478433609008789, -0.0011873245239257812, -0.0008962154388427734, -0.0006051063537597656, -0.0003139972686767578, -2.288818359375e-05, 0.0002682209014892578, 0.0005593299865722656, 0.0008504390716552734, 0.0011415481567382812, 0.001432657241821289, 0.0017237663269042969, 0.0020148754119873047, 0.0023059844970703125, 0.0025970935821533203, 0.002888202667236328, 0.003179311752319336, 0.0034704208374023438, 0.0037615299224853516, 0.004052639007568359, 0.004343748092651367, 0.004634857177734375, 0.004925966262817383, 0.005217075347900391, 0.0055081844329833984, 0.005799293518066406, 0.006090402603149414, 0.006381511688232422, 0.00667262077331543, 0.0069637298583984375, 0.007254838943481445, 0.007545948028564453, 0.007837057113647461, 0.008128166198730469, 0.008419275283813477, 0.008710384368896484, 0.009001493453979492, 0.0092926025390625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 4.0, 14.0, 20.0, 24.0, 26.0, 49.0, 57.0, 111.0, 132.0, 259.0, 318.0, 557.0, 922.0, 1543.0, 2787.0, 5071.0, 9519.0, 20219.0, 50645.0, 195090.0, 494728.0, 178548.0, 47696.0, 19424.0, 9312.0, 4832.0, 2698.0, 1509.0, 921.0, 530.0, 337.0, 199.0, 140.0, 100.0, 65.0, 51.0, 29.0, 19.0, 14.0, 15.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0, -49.1435546875, -47.287109375, -45.4306640625, -43.57421875, -41.7177734375, -39.861328125, -38.0048828125, -36.1484375, -34.2919921875, -32.435546875, -30.5791015625, -28.72265625, -26.8662109375, -25.009765625, -23.1533203125, -21.296875, -19.4404296875, -17.583984375, -15.7275390625, -13.87109375, -12.0146484375, -10.158203125, -8.3017578125, -6.4453125, -4.5888671875, -2.732421875, -0.8759765625, 0.98046875, 2.8369140625, 4.693359375, 6.5498046875, 8.40625, 10.2626953125, 12.119140625, 13.9755859375, 15.83203125, 17.6884765625, 19.544921875, 21.4013671875, 23.2578125, 25.1142578125, 26.970703125, 28.8271484375, 30.68359375, 32.5400390625, 34.396484375, 36.2529296875, 38.109375, 39.9658203125, 41.822265625, 43.6787109375, 45.53515625, 47.3916015625, 49.248046875, 51.1044921875, 52.9609375, 54.8173828125, 56.673828125, 58.5302734375, 60.38671875, 62.2431640625, 64.099609375, 65.9560546875, 67.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 13.0, 19.0, 13.0, 17.0, 34.0, 67.0, 94.0, 142.0, 130.0, 140.0, 93.0, 52.0, 38.0, 29.0, 23.0, 14.0, 9.0, 5.0, 9.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.375, -14.88818359375, -14.4013671875, -13.91455078125, -13.427734375, -12.94091796875, -12.4541015625, -11.96728515625, -11.48046875, -10.99365234375, -10.5068359375, -10.02001953125, -9.533203125, -9.04638671875, -8.5595703125, -8.07275390625, -7.5859375, -7.09912109375, -6.6123046875, -6.12548828125, -5.638671875, -5.15185546875, -4.6650390625, -4.17822265625, -3.69140625, -3.20458984375, -2.7177734375, -2.23095703125, -1.744140625, -1.25732421875, -0.7705078125, -0.28369140625, 0.203125, 0.68994140625, 1.1767578125, 1.66357421875, 2.150390625, 2.63720703125, 3.1240234375, 3.61083984375, 4.09765625, 4.58447265625, 5.0712890625, 5.55810546875, 6.044921875, 6.53173828125, 7.0185546875, 7.50537109375, 7.9921875, 8.47900390625, 8.9658203125, 9.45263671875, 9.939453125, 10.42626953125, 10.9130859375, 11.39990234375, 11.88671875, 12.37353515625, 12.8603515625, 13.34716796875, 13.833984375, 14.32080078125, 14.8076171875, 15.29443359375, 15.78125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 5.0, 3.0, 6.0, 16.0, 21.0, 16.0, 24.0, 20.0, 28.0, 48.0, 45.0, 44.0, 51.0, 56.0, 57.0, 48.0, 50.0, 59.0, 53.0, 54.0, 40.0, 44.0, 33.0, 33.0, 25.0, 28.0, 10.0, 12.0, 5.0, 10.0, 10.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.071081161499023, -17.462955474853516, -16.85483169555664, -16.246706008911133, -15.638582229614258, -15.03045654296875, -14.422331809997559, -13.814207077026367, -13.206082344055176, -12.597957611083984, -11.989832878112793, -11.381708145141602, -10.773582458496094, -10.165458679199219, -9.557332992553711, -8.94920825958252, -8.341083526611328, -7.732958793640137, -7.124834060668945, -6.516708850860596, -5.908584117889404, -5.300459384918213, -4.692334175109863, -4.084209442138672, -3.4760847091674805, -2.867959976196289, -2.2598350048065186, -1.6517101526260376, -1.0435853004455566, -0.43546056747436523, 0.17266440391540527, 0.7807893753051758, 1.3889141082763672, 1.9970389604568481, 2.605163812637329, 3.2132887840270996, 3.821413516998291, 4.429538249969482, 5.037663459777832, 5.645788192749023, 6.253912925720215, 6.862037658691406, 7.470162391662598, 8.078287124633789, 8.686412811279297, 9.294536590576172, 9.90266227722168, 10.510787010192871, 11.118911743164062, 11.727036476135254, 12.335161209106445, 12.943285942077637, 13.551410675048828, 14.159536361694336, 14.767661094665527, 15.375785827636719, 15.98391056060791, 16.5920352935791, 17.20016098022461, 17.808284759521484, 18.416410446166992, 19.024534225463867, 19.632659912109375, 20.24078369140625, 20.848909378051758]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 7.0, 7.0, 4.0, 6.0, 12.0, 11.0, 16.0, 22.0, 22.0, 22.0, 20.0, 31.0, 22.0, 31.0, 33.0, 46.0, 41.0, 41.0, 34.0, 39.0, 28.0, 35.0, 39.0, 36.0, 35.0, 36.0, 33.0, 30.0, 29.0, 25.0, 27.0, 18.0, 24.0, 18.0, 17.0, 16.0, 13.0, 10.0, 9.0, 8.0, 12.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.740565299987793, -12.29871654510498, -11.856867790222168, -11.415019035339355, -10.97317123413086, -10.531322479248047, -10.089473724365234, -9.647624969482422, -9.20577621459961, -8.763927459716797, -8.322078704833984, -7.88023042678833, -7.438381671905518, -6.996532917022705, -6.554684638977051, -6.112835884094238, -5.670987129211426, -5.229138374328613, -4.787289619445801, -4.3454413414001465, -3.903592586517334, -3.4617438316345215, -3.019895315170288, -2.5780467987060547, -2.136198043823242, -1.6943494081497192, -1.2525007724761963, -0.8106521368026733, -0.3688035011291504, 0.07304525375366211, 0.5148937702178955, 0.9567422866821289, 1.3985919952392578, 1.8404406309127808, 2.2822892665863037, 2.724137783050537, 3.1659865379333496, 3.607835292816162, 4.049683570861816, 4.491532325744629, 4.933381080627441, 5.375229835510254, 5.817078590393066, 6.258926868438721, 6.700775623321533, 7.142624378204346, 7.58447265625, 8.026321411132812, 8.468170166015625, 8.910018920898438, 9.35186767578125, 9.793716430664062, 10.235565185546875, 10.677413940429688, 11.119261741638184, 11.561110496520996, 12.002959251403809, 12.444808006286621, 12.886656761169434, 13.328505516052246, 13.770353317260742, 14.212202072143555, 14.654050827026367, 15.09589958190918, 15.537748336791992]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 10.0, 14.0, 16.0, 28.0, 30.0, 35.0, 81.0, 98.0, 150.0, 204.0, 275.0, 469.0, 641.0, 1044.0, 1581.0, 2638.0, 3935.0, 6727.0, 10983.0, 18707.0, 32006.0, 53409.0, 85479.0, 126046.0, 158708.0, 163373.0, 135618.0, 95433.0, 60449.0, 36274.0, 21360.0, 12529.0, 7551.0, 4625.0, 2813.0, 1824.0, 1114.0, 781.0, 430.0, 323.0, 205.0, 153.0, 126.0, 86.0, 49.0, 34.0, 26.0, 30.0, 18.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-22.796875, -22.108642578125, -21.42041015625, -20.732177734375, -20.0439453125, -19.355712890625, -18.66748046875, -17.979248046875, -17.291015625, -16.602783203125, -15.91455078125, -15.226318359375, -14.5380859375, -13.849853515625, -13.16162109375, -12.473388671875, -11.78515625, -11.096923828125, -10.40869140625, -9.720458984375, -9.0322265625, -8.343994140625, -7.65576171875, -6.967529296875, -6.279296875, -5.591064453125, -4.90283203125, -4.214599609375, -3.5263671875, -2.838134765625, -2.14990234375, -1.461669921875, -0.7734375, -0.085205078125, 0.60302734375, 1.291259765625, 1.9794921875, 2.667724609375, 3.35595703125, 4.044189453125, 4.732421875, 5.420654296875, 6.10888671875, 6.797119140625, 7.4853515625, 8.173583984375, 8.86181640625, 9.550048828125, 10.23828125, 10.926513671875, 11.61474609375, 12.302978515625, 12.9912109375, 13.679443359375, 14.36767578125, 15.055908203125, 15.744140625, 16.432373046875, 17.12060546875, 17.808837890625, 18.4970703125, 19.185302734375, 19.87353515625, 20.561767578125, 21.25]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 6.0, 1.0, 5.0, 7.0, 1.0, 5.0, 9.0, 7.0, 14.0, 11.0, 8.0, 15.0, 19.0, 20.0, 15.0, 30.0, 28.0, 28.0, 44.0, 30.0, 41.0, 44.0, 36.0, 37.0, 39.0, 44.0, 34.0, 39.0, 28.0, 35.0, 39.0, 45.0, 24.0, 26.0, 21.0, 25.0, 24.0, 24.0, 21.0, 14.0, 8.0, 7.0, 11.0, 9.0, 5.0, 5.0, 10.0, 1.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.578125, -12.147216796875, -11.71630859375, -11.285400390625, -10.8544921875, -10.423583984375, -9.99267578125, -9.561767578125, -9.130859375, -8.699951171875, -8.26904296875, -7.838134765625, -7.4072265625, -6.976318359375, -6.54541015625, -6.114501953125, -5.68359375, -5.252685546875, -4.82177734375, -4.390869140625, -3.9599609375, -3.529052734375, -3.09814453125, -2.667236328125, -2.236328125, -1.805419921875, -1.37451171875, -0.943603515625, -0.5126953125, -0.081787109375, 0.34912109375, 0.780029296875, 1.2109375, 1.641845703125, 2.07275390625, 2.503662109375, 2.9345703125, 3.365478515625, 3.79638671875, 4.227294921875, 4.658203125, 5.089111328125, 5.52001953125, 5.950927734375, 6.3818359375, 6.812744140625, 7.24365234375, 7.674560546875, 8.10546875, 8.536376953125, 8.96728515625, 9.398193359375, 9.8291015625, 10.260009765625, 10.69091796875, 11.121826171875, 11.552734375, 11.983642578125, 12.41455078125, 12.845458984375, 13.2763671875, 13.707275390625, 14.13818359375, 14.569091796875, 15.0]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 24.0, 17.0, 25.0, 41.0, 84.0, 108.0, 163.0, 262.0, 373.0, 632.0, 1113.0, 1758.0, 3127.0, 5446.0, 9664.0, 17666.0, 32348.0, 58525.0, 100302.0, 153719.0, 189500.0, 175633.0, 125578.0, 76356.0, 42674.0, 23467.0, 12863.0, 7112.0, 4068.0, 2364.0, 1329.0, 830.0, 505.0, 296.0, 190.0, 111.0, 87.0, 58.0, 34.0, 17.0, 21.0, 18.0, 15.0, 7.0, 5.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-26.0625, -25.266357421875, -24.47021484375, -23.674072265625, -22.8779296875, -22.081787109375, -21.28564453125, -20.489501953125, -19.693359375, -18.897216796875, -18.10107421875, -17.304931640625, -16.5087890625, -15.712646484375, -14.91650390625, -14.120361328125, -13.32421875, -12.528076171875, -11.73193359375, -10.935791015625, -10.1396484375, -9.343505859375, -8.54736328125, -7.751220703125, -6.955078125, -6.158935546875, -5.36279296875, -4.566650390625, -3.7705078125, -2.974365234375, -2.17822265625, -1.382080078125, -0.5859375, 0.210205078125, 1.00634765625, 1.802490234375, 2.5986328125, 3.394775390625, 4.19091796875, 4.987060546875, 5.783203125, 6.579345703125, 7.37548828125, 8.171630859375, 8.9677734375, 9.763916015625, 10.56005859375, 11.356201171875, 12.15234375, 12.948486328125, 13.74462890625, 14.540771484375, 15.3369140625, 16.133056640625, 16.92919921875, 17.725341796875, 18.521484375, 19.317626953125, 20.11376953125, 20.909912109375, 21.7060546875, 22.502197265625, 23.29833984375, 24.094482421875, 24.890625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 4.0, 12.0, 17.0, 19.0, 21.0, 25.0, 31.0, 27.0, 20.0, 47.0, 46.0, 47.0, 45.0, 42.0, 38.0, 51.0, 58.0, 46.0, 46.0, 52.0, 44.0, 44.0, 39.0, 35.0, 33.0, 20.0, 21.0, 15.0, 11.0, 7.0, 9.0, 4.0, 2.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.7734375, -14.3316650390625, -13.889892578125, -13.4481201171875, -13.00634765625, -12.5645751953125, -12.122802734375, -11.6810302734375, -11.2392578125, -10.7974853515625, -10.355712890625, -9.9139404296875, -9.47216796875, -9.0303955078125, -8.588623046875, -8.1468505859375, -7.705078125, -7.2633056640625, -6.821533203125, -6.3797607421875, -5.93798828125, -5.4962158203125, -5.054443359375, -4.6126708984375, -4.1708984375, -3.7291259765625, -3.287353515625, -2.8455810546875, -2.40380859375, -1.9620361328125, -1.520263671875, -1.0784912109375, -0.63671875, -0.1949462890625, 0.246826171875, 0.6885986328125, 1.13037109375, 1.5721435546875, 2.013916015625, 2.4556884765625, 2.8974609375, 3.3392333984375, 3.781005859375, 4.2227783203125, 4.66455078125, 5.1063232421875, 5.548095703125, 5.9898681640625, 6.431640625, 6.8734130859375, 7.315185546875, 7.7569580078125, 8.19873046875, 8.6405029296875, 9.082275390625, 9.5240478515625, 9.9658203125, 10.4075927734375, 10.849365234375, 11.2911376953125, 11.73291015625, 12.1746826171875, 12.616455078125, 13.0582275390625, 13.5]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 10.0, 7.0, 6.0, 16.0, 15.0, 27.0, 36.0, 42.0, 49.0, 62.0, 125.0, 141.0, 223.0, 323.0, 438.0, 690.0, 1002.0, 1482.0, 2179.0, 3523.0, 5494.0, 9122.0, 15720.0, 28199.0, 55333.0, 118164.0, 245989.0, 273412.0, 142247.0, 65800.0, 33005.0, 17816.0, 10309.0, 6176.0, 3909.0, 2408.0, 1596.0, 1061.0, 718.0, 508.0, 349.0, 229.0, 166.0, 126.0, 94.0, 48.0, 42.0, 29.0, 24.0, 27.0, 19.0, 3.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0], "bins": [-31.109375, -30.109619140625, -29.10986328125, -28.110107421875, -27.1103515625, -26.110595703125, -25.11083984375, -24.111083984375, -23.111328125, -22.111572265625, -21.11181640625, -20.112060546875, -19.1123046875, -18.112548828125, -17.11279296875, -16.113037109375, -15.11328125, -14.113525390625, -13.11376953125, -12.114013671875, -11.1142578125, -10.114501953125, -9.11474609375, -8.114990234375, -7.115234375, -6.115478515625, -5.11572265625, -4.115966796875, -3.1162109375, -2.116455078125, -1.11669921875, -0.116943359375, 0.8828125, 1.882568359375, 2.88232421875, 3.882080078125, 4.8818359375, 5.881591796875, 6.88134765625, 7.881103515625, 8.880859375, 9.880615234375, 10.88037109375, 11.880126953125, 12.8798828125, 13.879638671875, 14.87939453125, 15.879150390625, 16.87890625, 17.878662109375, 18.87841796875, 19.878173828125, 20.8779296875, 21.877685546875, 22.87744140625, 23.877197265625, 24.876953125, 25.876708984375, 26.87646484375, 27.876220703125, 28.8759765625, 29.875732421875, 30.87548828125, 31.875244140625, 32.875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 4.0, 1.0, 1.0, 6.0, 14.0, 5.0, 9.0, 10.0, 20.0, 19.0, 18.0, 27.0, 40.0, 45.0, 41.0, 50.0, 85.0, 82.0, 97.0, 74.0, 78.0, 53.0, 43.0, 35.0, 27.0, 24.0, 23.0, 14.0, 14.0, 6.0, 12.0, 4.0, 6.0, 9.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002758026123046875, -0.0026730895042419434, -0.0025881528854370117, -0.00250321626663208, -0.0024182796478271484, -0.002333343029022217, -0.002248406410217285, -0.0021634697914123535, -0.002078533172607422, -0.0019935965538024902, -0.0019086599349975586, -0.001823723316192627, -0.0017387866973876953, -0.0016538500785827637, -0.001568913459777832, -0.0014839768409729004, -0.0013990402221679688, -0.0013141036033630371, -0.0012291669845581055, -0.0011442303657531738, -0.0010592937469482422, -0.0009743571281433105, -0.0008894205093383789, -0.0008044838905334473, -0.0007195472717285156, -0.000634610652923584, -0.0005496740341186523, -0.0004647374153137207, -0.00037980079650878906, -0.0002948641777038574, -0.00020992755889892578, -0.00012499094009399414, -4.00543212890625e-05, 4.488229751586914e-05, 0.00012981891632080078, 0.00021475553512573242, 0.00029969215393066406, 0.0003846287727355957, 0.00046956539154052734, 0.000554502010345459, 0.0006394386291503906, 0.0007243752479553223, 0.0008093118667602539, 0.0008942484855651855, 0.0009791851043701172, 0.0010641217231750488, 0.0011490583419799805, 0.0012339949607849121, 0.0013189315795898438, 0.0014038681983947754, 0.001488804817199707, 0.0015737414360046387, 0.0016586780548095703, 0.001743614673614502, 0.0018285512924194336, 0.0019134879112243652, 0.001998424530029297, 0.0020833611488342285, 0.00216829776763916, 0.002253234386444092, 0.0023381710052490234, 0.002423107624053955, 0.0025080442428588867, 0.0025929808616638184, 0.00267791748046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 10.0, 15.0, 27.0, 50.0, 61.0, 109.0, 158.0, 246.0, 397.0, 626.0, 1042.0, 1751.0, 2882.0, 4967.0, 8946.0, 17014.0, 35991.0, 87977.0, 231949.0, 343645.0, 181064.0, 68045.0, 29476.0, 13996.0, 7467.0, 4194.0, 2505.0, 1473.0, 956.0, 549.0, 341.0, 217.0, 134.0, 99.0, 59.0, 39.0, 23.0, 16.0, 11.0, 8.0, 5.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.09375, -30.9208984375, -29.748046875, -28.5751953125, -27.40234375, -26.2294921875, -25.056640625, -23.8837890625, -22.7109375, -21.5380859375, -20.365234375, -19.1923828125, -18.01953125, -16.8466796875, -15.673828125, -14.5009765625, -13.328125, -12.1552734375, -10.982421875, -9.8095703125, -8.63671875, -7.4638671875, -6.291015625, -5.1181640625, -3.9453125, -2.7724609375, -1.599609375, -0.4267578125, 0.74609375, 1.9189453125, 3.091796875, 4.2646484375, 5.4375, 6.6103515625, 7.783203125, 8.9560546875, 10.12890625, 11.3017578125, 12.474609375, 13.6474609375, 14.8203125, 15.9931640625, 17.166015625, 18.3388671875, 19.51171875, 20.6845703125, 21.857421875, 23.0302734375, 24.203125, 25.3759765625, 26.548828125, 27.7216796875, 28.89453125, 30.0673828125, 31.240234375, 32.4130859375, 33.5859375, 34.7587890625, 35.931640625, 37.1044921875, 38.27734375, 39.4501953125, 40.623046875, 41.7958984375, 42.96875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 10.0, 9.0, 6.0, 10.0, 6.0, 13.0, 23.0, 22.0, 15.0, 31.0, 40.0, 40.0, 48.0, 52.0, 69.0, 71.0, 76.0, 73.0, 65.0, 46.0, 45.0, 36.0, 28.0, 25.0, 20.0, 23.0, 15.0, 14.0, 10.0, 9.0, 5.0, 5.0, 10.0, 8.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.53125, -8.2652587890625, -7.999267578125, -7.7332763671875, -7.46728515625, -7.2012939453125, -6.935302734375, -6.6693115234375, -6.4033203125, -6.1373291015625, -5.871337890625, -5.6053466796875, -5.33935546875, -5.0733642578125, -4.807373046875, -4.5413818359375, -4.275390625, -4.0093994140625, -3.743408203125, -3.4774169921875, -3.21142578125, -2.9454345703125, -2.679443359375, -2.4134521484375, -2.1474609375, -1.8814697265625, -1.615478515625, -1.3494873046875, -1.08349609375, -0.8175048828125, -0.551513671875, -0.2855224609375, -0.01953125, 0.2464599609375, 0.512451171875, 0.7784423828125, 1.04443359375, 1.3104248046875, 1.576416015625, 1.8424072265625, 2.1083984375, 2.3743896484375, 2.640380859375, 2.9063720703125, 3.17236328125, 3.4383544921875, 3.704345703125, 3.9703369140625, 4.236328125, 4.5023193359375, 4.768310546875, 5.0343017578125, 5.30029296875, 5.5662841796875, 5.832275390625, 6.0982666015625, 6.3642578125, 6.6302490234375, 6.896240234375, 7.1622314453125, 7.42822265625, 7.6942138671875, 7.960205078125, 8.2261962890625, 8.4921875]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 4.0, 10.0, 13.0, 18.0, 20.0, 16.0, 23.0, 19.0, 28.0, 33.0, 32.0, 42.0, 55.0, 62.0, 57.0, 55.0, 45.0, 51.0, 47.0, 46.0, 39.0, 38.0, 36.0, 31.0, 19.0, 25.0, 19.0, 17.0, 19.0, 18.0, 11.0, 5.0, 13.0, 6.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.966279983520508, -17.36782455444336, -16.769371032714844, -16.170915603637695, -15.57246208190918, -14.974006652832031, -14.3755521774292, -13.777097702026367, -13.178643226623535, -12.580188751220703, -11.981734275817871, -11.383279800415039, -10.78482437133789, -10.186370849609375, -9.587915420532227, -8.989460945129395, -8.391006469726562, -7.7925519943237305, -7.194097518920898, -6.595642566680908, -5.997188091278076, -5.398733615875244, -4.800278663635254, -4.201824188232422, -3.60336971282959, -3.004915237426758, -2.4064605236053467, -1.808005928993225, -1.2095513343811035, -0.6110968589782715, -0.012642145156860352, 0.5858125686645508, 1.1842689514160156, 1.7827235460281372, 2.381178140640259, 2.97963285446167, 3.578087329864502, 4.176541805267334, 4.774996757507324, 5.373451232910156, 5.971905708312988, 6.57036018371582, 7.168814659118652, 7.767269611358643, 8.365724563598633, 8.964178085327148, 9.562633514404297, 10.161087989807129, 10.759542465209961, 11.357996940612793, 11.956451416015625, 12.554905891418457, 13.153360366821289, 13.751815795898438, 14.35027027130127, 14.948724746704102, 15.547179222106934, 16.145633697509766, 16.744089126586914, 17.34254264831543, 17.940998077392578, 18.539451599121094, 19.137907028198242, 19.73636245727539, 20.334815979003906]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 4.0, 6.0, 6.0, 7.0, 8.0, 13.0, 17.0, 14.0, 15.0, 17.0, 23.0, 24.0, 28.0, 33.0, 34.0, 28.0, 34.0, 31.0, 37.0, 49.0, 45.0, 35.0, 37.0, 30.0, 42.0, 40.0, 33.0, 30.0, 31.0, 34.0, 28.0, 27.0, 15.0, 11.0, 26.0, 18.0, 13.0, 17.0, 14.0, 11.0, 7.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.088459014892578, -14.612427711486816, -14.136395454406738, -13.660364151000977, -13.184332847595215, -12.708300590515137, -12.232269287109375, -11.756237030029297, -11.280205726623535, -10.804174423217773, -10.328142166137695, -9.852110862731934, -9.376079559326172, -8.900047302246094, -8.424015998840332, -7.947984218597412, -7.47195291519165, -6.9959211349487305, -6.519889831542969, -6.043858051300049, -5.567826271057129, -5.091794967651367, -4.615763187408447, -4.139731407165527, -3.6636998653411865, -3.1876683235168457, -2.711636543273926, -2.235605001449585, -1.7595733404159546, -1.2835416793823242, -0.8075101375579834, -0.3314783573150635, 0.14455318450927734, 0.6205848455429077, 1.096616506576538, 1.572648048400879, 2.048679828643799, 2.5247113704681396, 3.0007429122924805, 3.4767746925354004, 3.952806234359741, 4.428837776184082, 4.904869556427002, 5.380901336669922, 5.856932640075684, 6.3329644203186035, 6.808996200561523, 7.285027503967285, 7.761059284210205, 8.237091064453125, 8.713122367858887, 9.189153671264648, 9.665185928344727, 10.141217231750488, 10.61724853515625, 11.093280792236328, 11.56931209564209, 12.045343399047852, 12.52137565612793, 12.997406959533691, 13.473438262939453, 13.949470520019531, 14.425501823425293, 14.901533126831055, 15.377565383911133]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 6.0, 6.0, 9.0, 8.0, 18.0, 20.0, 26.0, 46.0, 80.0, 104.0, 124.0, 214.0, 264.0, 509.0, 713.0, 1090.0, 1672.0, 2571.0, 4288.0, 6871.0, 11464.0, 19817.0, 34503.0, 61147.0, 110427.0, 196683.0, 338291.0, 527357.0, 688560.0, 709050.0, 571691.0, 380666.0, 227079.0, 128356.0, 72225.0, 40411.0, 23101.0, 13807.0, 8040.0, 4773.0, 2969.0, 1856.0, 1196.0, 763.0, 459.0, 330.0, 208.0, 132.0, 86.0, 61.0, 43.0, 41.0, 20.0, 14.0, 7.0, 7.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0], "bins": [-14.6328125, -14.1627197265625, -13.692626953125, -13.2225341796875, -12.75244140625, -12.2823486328125, -11.812255859375, -11.3421630859375, -10.8720703125, -10.4019775390625, -9.931884765625, -9.4617919921875, -8.99169921875, -8.5216064453125, -8.051513671875, -7.5814208984375, -7.111328125, -6.6412353515625, -6.171142578125, -5.7010498046875, -5.23095703125, -4.7608642578125, -4.290771484375, -3.8206787109375, -3.3505859375, -2.8804931640625, -2.410400390625, -1.9403076171875, -1.47021484375, -1.0001220703125, -0.530029296875, -0.0599365234375, 0.41015625, 0.8802490234375, 1.350341796875, 1.8204345703125, 2.29052734375, 2.7606201171875, 3.230712890625, 3.7008056640625, 4.1708984375, 4.6409912109375, 5.111083984375, 5.5811767578125, 6.05126953125, 6.5213623046875, 6.991455078125, 7.4615478515625, 7.931640625, 8.4017333984375, 8.871826171875, 9.3419189453125, 9.81201171875, 10.2821044921875, 10.752197265625, 11.2222900390625, 11.6923828125, 12.1624755859375, 12.632568359375, 13.1026611328125, 13.57275390625, 14.0428466796875, 14.512939453125, 14.9830322265625, 15.453125]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 7.0, 13.0, 14.0, 22.0, 18.0, 19.0, 29.0, 20.0, 28.0, 30.0, 33.0, 30.0, 28.0, 40.0, 36.0, 39.0, 41.0, 36.0, 34.0, 38.0, 42.0, 35.0, 36.0, 36.0, 24.0, 27.0, 17.0, 22.0, 26.0, 21.0, 17.0, 22.0, 17.0, 13.0, 13.0, 8.0, 8.0, 9.0, 4.0, 2.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1015625, -9.759033203125, -9.41650390625, -9.073974609375, -8.7314453125, -8.388916015625, -8.04638671875, -7.703857421875, -7.361328125, -7.018798828125, -6.67626953125, -6.333740234375, -5.9912109375, -5.648681640625, -5.30615234375, -4.963623046875, -4.62109375, -4.278564453125, -3.93603515625, -3.593505859375, -3.2509765625, -2.908447265625, -2.56591796875, -2.223388671875, -1.880859375, -1.538330078125, -1.19580078125, -0.853271484375, -0.5107421875, -0.168212890625, 0.17431640625, 0.516845703125, 0.859375, 1.201904296875, 1.54443359375, 1.886962890625, 2.2294921875, 2.572021484375, 2.91455078125, 3.257080078125, 3.599609375, 3.942138671875, 4.28466796875, 4.627197265625, 4.9697265625, 5.312255859375, 5.65478515625, 5.997314453125, 6.33984375, 6.682373046875, 7.02490234375, 7.367431640625, 7.7099609375, 8.052490234375, 8.39501953125, 8.737548828125, 9.080078125, 9.422607421875, 9.76513671875, 10.107666015625, 10.4501953125, 10.792724609375, 11.13525390625, 11.477783203125, 11.8203125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 13.0, 5.0, 20.0, 39.0, 46.0, 66.0, 127.0, 211.0, 314.0, 528.0, 825.0, 1355.0, 2288.0, 3861.0, 6880.0, 12535.0, 23707.0, 46777.0, 95898.0, 194476.0, 377247.0, 641719.0, 850800.0, 796578.0, 540581.0, 296890.0, 149245.0, 72529.0, 36493.0, 18363.0, 10132.0, 5520.0, 3293.0, 1879.0, 1134.0, 680.0, 454.0, 279.0, 166.0, 129.0, 72.0, 40.0, 29.0, 27.0, 12.0, 7.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.484375, -19.860107421875, -19.23583984375, -18.611572265625, -17.9873046875, -17.363037109375, -16.73876953125, -16.114501953125, -15.490234375, -14.865966796875, -14.24169921875, -13.617431640625, -12.9931640625, -12.368896484375, -11.74462890625, -11.120361328125, -10.49609375, -9.871826171875, -9.24755859375, -8.623291015625, -7.9990234375, -7.374755859375, -6.75048828125, -6.126220703125, -5.501953125, -4.877685546875, -4.25341796875, -3.629150390625, -3.0048828125, -2.380615234375, -1.75634765625, -1.132080078125, -0.5078125, 0.116455078125, 0.74072265625, 1.364990234375, 1.9892578125, 2.613525390625, 3.23779296875, 3.862060546875, 4.486328125, 5.110595703125, 5.73486328125, 6.359130859375, 6.9833984375, 7.607666015625, 8.23193359375, 8.856201171875, 9.48046875, 10.104736328125, 10.72900390625, 11.353271484375, 11.9775390625, 12.601806640625, 13.22607421875, 13.850341796875, 14.474609375, 15.098876953125, 15.72314453125, 16.347412109375, 16.9716796875, 17.595947265625, 18.22021484375, 18.844482421875, 19.46875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 2.0, 11.0, 17.0, 12.0, 19.0, 19.0, 32.0, 39.0, 48.0, 51.0, 60.0, 85.0, 111.0, 124.0, 129.0, 178.0, 199.0, 203.0, 224.0, 268.0, 246.0, 267.0, 224.0, 225.0, 206.0, 199.0, 192.0, 153.0, 116.0, 90.0, 75.0, 68.0, 40.0, 33.0, 25.0, 24.0, 15.0, 13.0, 6.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-7.12109375, -6.922119140625, -6.72314453125, -6.524169921875, -6.3251953125, -6.126220703125, -5.92724609375, -5.728271484375, -5.529296875, -5.330322265625, -5.13134765625, -4.932373046875, -4.7333984375, -4.534423828125, -4.33544921875, -4.136474609375, -3.9375, -3.738525390625, -3.53955078125, -3.340576171875, -3.1416015625, -2.942626953125, -2.74365234375, -2.544677734375, -2.345703125, -2.146728515625, -1.94775390625, -1.748779296875, -1.5498046875, -1.350830078125, -1.15185546875, -0.952880859375, -0.75390625, -0.554931640625, -0.35595703125, -0.156982421875, 0.0419921875, 0.240966796875, 0.43994140625, 0.638916015625, 0.837890625, 1.036865234375, 1.23583984375, 1.434814453125, 1.6337890625, 1.832763671875, 2.03173828125, 2.230712890625, 2.4296875, 2.628662109375, 2.82763671875, 3.026611328125, 3.2255859375, 3.424560546875, 3.62353515625, 3.822509765625, 4.021484375, 4.220458984375, 4.41943359375, 4.618408203125, 4.8173828125, 5.016357421875, 5.21533203125, 5.414306640625, 5.61328125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 6.0, 16.0, 18.0, 16.0, 25.0, 32.0, 29.0, 41.0, 61.0, 56.0, 64.0, 60.0, 70.0, 68.0, 66.0, 59.0, 45.0, 49.0, 38.0, 29.0, 32.0, 27.0, 25.0, 15.0, 14.0, 9.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.96455192565918, -24.27136993408203, -23.578187942504883, -22.885005950927734, -22.191823959350586, -21.498641967773438, -20.80545997619629, -20.11227798461914, -19.419095993041992, -18.725914001464844, -18.032732009887695, -17.339550018310547, -16.6463680267334, -15.95318603515625, -15.260004043579102, -14.566822052001953, -13.873640060424805, -13.180458068847656, -12.487276077270508, -11.79409408569336, -11.100912094116211, -10.407730102539062, -9.714548110961914, -9.021366119384766, -8.328184127807617, -7.635002136230469, -6.94182014465332, -6.248638153076172, -5.555456161499023, -4.862274169921875, -4.169092178344727, -3.475910186767578, -2.782726287841797, -2.0895442962646484, -1.3963623046875, -0.7031803131103516, -0.009998321533203125, 0.6831836700439453, 1.3763656616210938, 2.069547653198242, 2.7627296447753906, 3.455911636352539, 4.1490936279296875, 4.842275619506836, 5.535457611083984, 6.228639602661133, 6.921821594238281, 7.61500358581543, 8.308185577392578, 9.001367568969727, 9.694549560546875, 10.387731552124023, 11.080913543701172, 11.77409553527832, 12.467277526855469, 13.160459518432617, 13.853641510009766, 14.546823501586914, 15.240005493164062, 15.933187484741211, 16.62636947631836, 17.319551467895508, 18.012733459472656, 18.705915451049805, 19.399097442626953]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 5.0, 8.0, 8.0, 8.0, 14.0, 19.0, 5.0, 28.0, 29.0, 33.0, 39.0, 35.0, 41.0, 24.0, 47.0, 39.0, 41.0, 47.0, 43.0, 60.0, 40.0, 56.0, 44.0, 32.0, 32.0, 39.0, 41.0, 25.0, 22.0, 14.0, 17.0, 12.0, 9.0, 14.0, 6.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.160979270935059, -13.660107612609863, -13.159235000610352, -12.658363342285156, -12.157491683959961, -11.656620025634766, -11.155747413635254, -10.654875755310059, -10.154003143310547, -9.653131484985352, -9.15225887298584, -8.651387214660645, -8.15051555633545, -7.649643421173096, -7.148771286010742, -6.647899627685547, -6.147027969360352, -5.646155834197998, -5.145284175872803, -4.644412040710449, -4.143540382385254, -3.6426682472229004, -3.141796112060547, -2.6409242153167725, -2.140052318572998, -1.6391804218292236, -1.1383084058761597, -0.6374363899230957, -0.1365644931793213, 0.3643074035644531, 0.8651795387268066, 1.366051435470581, 1.8669242858886719, 2.3677961826324463, 2.8686680793762207, 3.369540214538574, 3.8704121112823486, 4.371284008026123, 4.872156143188477, 5.373027801513672, 5.873899936676025, 6.374772071838379, 6.875643730163574, 7.376515865325928, 7.877388000488281, 8.378259658813477, 8.879131317138672, 9.380003929138184, 9.880875587463379, 10.381747245788574, 10.882619857788086, 11.383491516113281, 11.884363174438477, 12.385234832763672, 12.886107444763184, 13.386979103088379, 13.88785171508789, 14.388723373413086, 14.889595985412598, 15.390467643737793, 15.891339302062988, 16.3922119140625, 16.893083572387695, 17.39395523071289, 17.894826889038086]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 14.0, 19.0, 27.0, 42.0, 72.0, 90.0, 166.0, 243.0, 402.0, 601.0, 900.0, 1527.0, 2328.0, 3871.0, 6139.0, 9870.0, 15886.0, 25953.0, 41002.0, 66054.0, 102504.0, 148632.0, 175002.0, 153601.0, 108552.0, 69451.0, 43465.0, 27397.0, 16807.0, 10461.0, 6536.0, 4056.0, 2515.0, 1570.0, 1026.0, 631.0, 435.0, 262.0, 146.0, 106.0, 72.0, 40.0, 23.0, 21.0, 13.0, 8.0, 6.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.765625, -30.819091796875, -29.87255859375, -28.926025390625, -27.9794921875, -27.032958984375, -26.08642578125, -25.139892578125, -24.193359375, -23.246826171875, -22.30029296875, -21.353759765625, -20.4072265625, -19.460693359375, -18.51416015625, -17.567626953125, -16.62109375, -15.674560546875, -14.72802734375, -13.781494140625, -12.8349609375, -11.888427734375, -10.94189453125, -9.995361328125, -9.048828125, -8.102294921875, -7.15576171875, -6.209228515625, -5.2626953125, -4.316162109375, -3.36962890625, -2.423095703125, -1.4765625, -0.530029296875, 0.41650390625, 1.363037109375, 2.3095703125, 3.256103515625, 4.20263671875, 5.149169921875, 6.095703125, 7.042236328125, 7.98876953125, 8.935302734375, 9.8818359375, 10.828369140625, 11.77490234375, 12.721435546875, 13.66796875, 14.614501953125, 15.56103515625, 16.507568359375, 17.4541015625, 18.400634765625, 19.34716796875, 20.293701171875, 21.240234375, 22.186767578125, 23.13330078125, 24.079833984375, 25.0263671875, 25.972900390625, 26.91943359375, 27.865966796875, 28.8125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 10.0, 13.0, 10.0, 10.0, 20.0, 22.0, 27.0, 40.0, 32.0, 40.0, 27.0, 48.0, 39.0, 33.0, 42.0, 43.0, 56.0, 54.0, 48.0, 40.0, 37.0, 41.0, 27.0, 38.0, 43.0, 12.0, 35.0, 23.0, 15.0, 14.0, 15.0, 11.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.671875, -13.187255859375, -12.70263671875, -12.218017578125, -11.7333984375, -11.248779296875, -10.76416015625, -10.279541015625, -9.794921875, -9.310302734375, -8.82568359375, -8.341064453125, -7.8564453125, -7.371826171875, -6.88720703125, -6.402587890625, -5.91796875, -5.433349609375, -4.94873046875, -4.464111328125, -3.9794921875, -3.494873046875, -3.01025390625, -2.525634765625, -2.041015625, -1.556396484375, -1.07177734375, -0.587158203125, -0.1025390625, 0.382080078125, 0.86669921875, 1.351318359375, 1.8359375, 2.320556640625, 2.80517578125, 3.289794921875, 3.7744140625, 4.259033203125, 4.74365234375, 5.228271484375, 5.712890625, 6.197509765625, 6.68212890625, 7.166748046875, 7.6513671875, 8.135986328125, 8.62060546875, 9.105224609375, 9.58984375, 10.074462890625, 10.55908203125, 11.043701171875, 11.5283203125, 12.012939453125, 12.49755859375, 12.982177734375, 13.466796875, 13.951416015625, 14.43603515625, 14.920654296875, 15.4052734375, 15.889892578125, 16.37451171875, 16.859130859375, 17.34375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 11.0, 24.0, 24.0, 31.0, 47.0, 74.0, 108.0, 138.0, 198.0, 350.0, 533.0, 868.0, 1379.0, 2280.0, 3713.0, 6196.0, 10932.0, 19717.0, 36710.0, 69588.0, 134712.0, 228754.0, 233764.0, 139593.0, 72929.0, 37902.0, 20398.0, 11222.0, 6295.0, 3860.0, 2275.0, 1419.0, 838.0, 566.0, 379.0, 220.0, 166.0, 97.0, 65.0, 59.0, 37.0, 26.0, 18.0, 15.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.5, -34.3916015625, -33.283203125, -32.1748046875, -31.06640625, -29.9580078125, -28.849609375, -27.7412109375, -26.6328125, -25.5244140625, -24.416015625, -23.3076171875, -22.19921875, -21.0908203125, -19.982421875, -18.8740234375, -17.765625, -16.6572265625, -15.548828125, -14.4404296875, -13.33203125, -12.2236328125, -11.115234375, -10.0068359375, -8.8984375, -7.7900390625, -6.681640625, -5.5732421875, -4.46484375, -3.3564453125, -2.248046875, -1.1396484375, -0.03125, 1.0771484375, 2.185546875, 3.2939453125, 4.40234375, 5.5107421875, 6.619140625, 7.7275390625, 8.8359375, 9.9443359375, 11.052734375, 12.1611328125, 13.26953125, 14.3779296875, 15.486328125, 16.5947265625, 17.703125, 18.8115234375, 19.919921875, 21.0283203125, 22.13671875, 23.2451171875, 24.353515625, 25.4619140625, 26.5703125, 27.6787109375, 28.787109375, 29.8955078125, 31.00390625, 32.1123046875, 33.220703125, 34.3291015625, 35.4375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 2.0, 17.0, 14.0, 21.0, 22.0, 19.0, 23.0, 36.0, 44.0, 42.0, 58.0, 50.0, 58.0, 48.0, 65.0, 56.0, 55.0, 40.0, 55.0, 54.0, 33.0, 35.0, 22.0, 25.0, 23.0, 17.0, 18.0, 10.0, 12.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.125, -14.7047119140625, -14.284423828125, -13.8641357421875, -13.44384765625, -13.0235595703125, -12.603271484375, -12.1829833984375, -11.7626953125, -11.3424072265625, -10.922119140625, -10.5018310546875, -10.08154296875, -9.6612548828125, -9.240966796875, -8.8206787109375, -8.400390625, -7.9801025390625, -7.559814453125, -7.1395263671875, -6.71923828125, -6.2989501953125, -5.878662109375, -5.4583740234375, -5.0380859375, -4.6177978515625, -4.197509765625, -3.7772216796875, -3.35693359375, -2.9366455078125, -2.516357421875, -2.0960693359375, -1.67578125, -1.2554931640625, -0.835205078125, -0.4149169921875, 0.00537109375, 0.4256591796875, 0.845947265625, 1.2662353515625, 1.6865234375, 2.1068115234375, 2.527099609375, 2.9473876953125, 3.36767578125, 3.7879638671875, 4.208251953125, 4.6285400390625, 5.048828125, 5.4691162109375, 5.889404296875, 6.3096923828125, 6.72998046875, 7.1502685546875, 7.570556640625, 7.9908447265625, 8.4111328125, 8.8314208984375, 9.251708984375, 9.6719970703125, 10.09228515625, 10.5125732421875, 10.932861328125, 11.3531494140625, 11.7734375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 8.0, 6.0, 12.0, 5.0, 10.0, 19.0, 21.0, 24.0, 50.0, 59.0, 102.0, 101.0, 134.0, 204.0, 311.0, 405.0, 598.0, 1012.0, 1524.0, 2591.0, 4483.0, 8421.0, 18173.0, 47025.0, 241386.0, 593509.0, 77280.0, 25807.0, 11050.0, 5598.0, 3159.0, 1875.0, 1139.0, 790.0, 515.0, 323.0, 231.0, 183.0, 119.0, 86.0, 69.0, 42.0, 33.0, 25.0, 15.0, 7.0, 7.0, 11.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.0625, -87.17578125, -84.2890625, -81.40234375, -78.515625, -75.62890625, -72.7421875, -69.85546875, -66.96875, -64.08203125, -61.1953125, -58.30859375, -55.421875, -52.53515625, -49.6484375, -46.76171875, -43.875, -40.98828125, -38.1015625, -35.21484375, -32.328125, -29.44140625, -26.5546875, -23.66796875, -20.78125, -17.89453125, -15.0078125, -12.12109375, -9.234375, -6.34765625, -3.4609375, -0.57421875, 2.3125, 5.19921875, 8.0859375, 10.97265625, 13.859375, 16.74609375, 19.6328125, 22.51953125, 25.40625, 28.29296875, 31.1796875, 34.06640625, 36.953125, 39.83984375, 42.7265625, 45.61328125, 48.5, 51.38671875, 54.2734375, 57.16015625, 60.046875, 62.93359375, 65.8203125, 68.70703125, 71.59375, 74.48046875, 77.3671875, 80.25390625, 83.140625, 86.02734375, 88.9140625, 91.80078125, 94.6875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 2.0, 3.0, 10.0, 7.0, 10.0, 12.0, 14.0, 27.0, 35.0, 90.0, 223.0, 258.0, 110.0, 56.0, 21.0, 18.0, 16.0, 13.0, 12.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0094451904296875, -0.009151577949523926, -0.008857965469360352, -0.008564352989196777, -0.008270740509033203, -0.007977128028869629, -0.007683515548706055, -0.0073899030685424805, -0.007096290588378906, -0.006802678108215332, -0.006509065628051758, -0.006215453147888184, -0.005921840667724609, -0.005628228187561035, -0.005334615707397461, -0.005041003227233887, -0.0047473907470703125, -0.004453778266906738, -0.004160165786743164, -0.00386655330657959, -0.0035729408264160156, -0.0032793283462524414, -0.002985715866088867, -0.002692103385925293, -0.0023984909057617188, -0.0021048784255981445, -0.0018112659454345703, -0.001517653465270996, -0.0012240409851074219, -0.0009304285049438477, -0.0006368160247802734, -0.0003432035446166992, -4.9591064453125e-05, 0.00024402141571044922, 0.0005376338958740234, 0.0008312463760375977, 0.0011248588562011719, 0.001418471336364746, 0.0017120838165283203, 0.0020056962966918945, 0.0022993087768554688, 0.002592921257019043, 0.002886533737182617, 0.0031801462173461914, 0.0034737586975097656, 0.00376737117767334, 0.004060983657836914, 0.004354596138000488, 0.0046482086181640625, 0.004941821098327637, 0.005235433578491211, 0.005529046058654785, 0.005822658538818359, 0.006116271018981934, 0.006409883499145508, 0.006703495979309082, 0.006997108459472656, 0.0072907209396362305, 0.007584333419799805, 0.007877945899963379, 0.008171558380126953, 0.008465170860290527, 0.008758783340454102, 0.009052395820617676, 0.00934600830078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 14.0, 18.0, 20.0, 22.0, 33.0, 49.0, 77.0, 92.0, 165.0, 237.0, 317.0, 437.0, 599.0, 752.0, 1124.0, 1621.0, 2490.0, 4091.0, 7233.0, 13885.0, 32709.0, 100487.0, 420494.0, 326591.0, 78063.0, 27377.0, 12063.0, 6297.0, 3716.0, 2297.0, 1508.0, 1072.0, 730.0, 537.0, 364.0, 248.0, 200.0, 156.0, 94.0, 83.0, 60.0, 43.0, 26.0, 18.0, 14.0, 10.0, 8.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-60.75, -59.00927734375, -57.2685546875, -55.52783203125, -53.787109375, -52.04638671875, -50.3056640625, -48.56494140625, -46.82421875, -45.08349609375, -43.3427734375, -41.60205078125, -39.861328125, -38.12060546875, -36.3798828125, -34.63916015625, -32.8984375, -31.15771484375, -29.4169921875, -27.67626953125, -25.935546875, -24.19482421875, -22.4541015625, -20.71337890625, -18.97265625, -17.23193359375, -15.4912109375, -13.75048828125, -12.009765625, -10.26904296875, -8.5283203125, -6.78759765625, -5.046875, -3.30615234375, -1.5654296875, 0.17529296875, 1.916015625, 3.65673828125, 5.3974609375, 7.13818359375, 8.87890625, 10.61962890625, 12.3603515625, 14.10107421875, 15.841796875, 17.58251953125, 19.3232421875, 21.06396484375, 22.8046875, 24.54541015625, 26.2861328125, 28.02685546875, 29.767578125, 31.50830078125, 33.2490234375, 34.98974609375, 36.73046875, 38.47119140625, 40.2119140625, 41.95263671875, 43.693359375, 45.43408203125, 47.1748046875, 48.91552734375, 50.65625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 9.0, 6.0, 17.0, 18.0, 19.0, 32.0, 53.0, 57.0, 94.0, 144.0, 146.0, 117.0, 75.0, 51.0, 38.0, 19.0, 18.0, 14.0, 15.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.203125, -19.660400390625, -19.11767578125, -18.574951171875, -18.0322265625, -17.489501953125, -16.94677734375, -16.404052734375, -15.861328125, -15.318603515625, -14.77587890625, -14.233154296875, -13.6904296875, -13.147705078125, -12.60498046875, -12.062255859375, -11.51953125, -10.976806640625, -10.43408203125, -9.891357421875, -9.3486328125, -8.805908203125, -8.26318359375, -7.720458984375, -7.177734375, -6.635009765625, -6.09228515625, -5.549560546875, -5.0068359375, -4.464111328125, -3.92138671875, -3.378662109375, -2.8359375, -2.293212890625, -1.75048828125, -1.207763671875, -0.6650390625, -0.122314453125, 0.42041015625, 0.963134765625, 1.505859375, 2.048583984375, 2.59130859375, 3.134033203125, 3.6767578125, 4.219482421875, 4.76220703125, 5.304931640625, 5.84765625, 6.390380859375, 6.93310546875, 7.475830078125, 8.0185546875, 8.561279296875, 9.10400390625, 9.646728515625, 10.189453125, 10.732177734375, 11.27490234375, 11.817626953125, 12.3603515625, 12.903076171875, 13.44580078125, 13.988525390625, 14.53125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 8.0, 9.0, 5.0, 12.0, 26.0, 16.0, 28.0, 39.0, 37.0, 39.0, 50.0, 47.0, 53.0, 71.0, 78.0, 70.0, 69.0, 66.0, 54.0, 35.0, 40.0, 35.0, 23.0, 23.0, 12.0, 15.0, 7.0, 8.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.788639068603516, -30.958770751953125, -30.128902435302734, -29.299034118652344, -28.46916389465332, -27.63929557800293, -26.80942726135254, -25.97955894470215, -25.149688720703125, -24.319820404052734, -23.489952087402344, -22.660083770751953, -21.83021354675293, -21.00034523010254, -20.17047691345215, -19.340608596801758, -18.510740280151367, -17.680871963500977, -16.851003646850586, -16.021133422851562, -15.191265106201172, -14.361396789550781, -13.53152847290039, -12.70166015625, -11.871790885925293, -11.041922569274902, -10.212053298950195, -9.382184982299805, -8.552316665649414, -7.722447395324707, -6.892579078674316, -6.062710285186768, -5.232839584350586, -4.402970790863037, -3.5731022357940674, -2.7432336807250977, -1.9133648872375488, -1.08349609375, -0.2536277770996094, 0.5762410163879395, 1.4061098098754883, 2.235978603363037, 3.065847158432007, 3.8957157135009766, 4.725584506988525, 5.555453300476074, 6.385321617126465, 7.215190410614014, 8.045059204101562, 8.874927520751953, 9.70479679107666, 10.53466510772705, 11.364534378051758, 12.194402694702148, 13.024271011352539, 13.85413932800293, 14.684008598327637, 15.513876914978027, 16.343746185302734, 17.173614501953125, 18.003482818603516, 18.833351135253906, 19.663219451904297, 20.49308967590332, 21.32295799255371]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 8.0, 10.0, 8.0, 13.0, 14.0, 16.0, 19.0, 27.0, 24.0, 22.0, 26.0, 23.0, 27.0, 29.0, 31.0, 48.0, 25.0, 44.0, 44.0, 38.0, 49.0, 36.0, 34.0, 27.0, 40.0, 30.0, 36.0, 29.0, 28.0, 30.0, 23.0, 18.0, 14.0, 18.0, 10.0, 13.0, 10.0, 11.0, 9.0, 11.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0], "bins": [-18.461637496948242, -17.9154052734375, -17.369173049926758, -16.82294273376465, -16.276710510253906, -15.730478286743164, -15.184246063232422, -14.63801383972168, -14.091782569885254, -13.545550346374512, -12.999319076538086, -12.453086853027344, -11.906854629516602, -11.360623359680176, -10.814391136169434, -10.268159866333008, -9.721927642822266, -9.175695419311523, -8.629464149475098, -8.083231925964355, -7.5370001792907715, -6.9907684326171875, -6.444536209106445, -5.898304462432861, -5.352072715759277, -4.805840969085693, -4.259609222412109, -3.713376998901367, -3.167145252227783, -2.620913505554199, -2.074681520462036, -1.528449535369873, -0.9822158813476562, -0.4359840154647827, 0.11024785041809082, 0.6564797163009644, 1.202711582183838, 1.7489433288574219, 2.295175313949585, 2.841407299041748, 3.387639045715332, 3.933870792388916, 4.4801025390625, 5.026334762573242, 5.572566509246826, 6.11879825592041, 6.665030479431152, 7.211262226104736, 7.75749397277832, 8.303726196289062, 8.849957466125488, 9.39618968963623, 9.942420959472656, 10.488653182983398, 11.03488540649414, 11.581117630004883, 12.127348899841309, 12.67358112335205, 13.219812393188477, 13.766044616699219, 14.312276840209961, 14.858508110046387, 15.404740333557129, 15.950971603393555, 16.497203826904297]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 8.0, 15.0, 12.0, 22.0, 28.0, 40.0, 69.0, 106.0, 108.0, 178.0, 281.0, 372.0, 556.0, 880.0, 1399.0, 2443.0, 4198.0, 7764.0, 15473.0, 33477.0, 79629.0, 186128.0, 302131.0, 227552.0, 102128.0, 42517.0, 19198.0, 9323.0, 4968.0, 2741.0, 1749.0, 1034.0, 639.0, 425.0, 291.0, 213.0, 127.0, 89.0, 61.0, 60.0, 28.0, 22.0, 22.0, 10.0, 13.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-44.46875, -43.1064453125, -41.744140625, -40.3818359375, -39.01953125, -37.6572265625, -36.294921875, -34.9326171875, -33.5703125, -32.2080078125, -30.845703125, -29.4833984375, -28.12109375, -26.7587890625, -25.396484375, -24.0341796875, -22.671875, -21.3095703125, -19.947265625, -18.5849609375, -17.22265625, -15.8603515625, -14.498046875, -13.1357421875, -11.7734375, -10.4111328125, -9.048828125, -7.6865234375, -6.32421875, -4.9619140625, -3.599609375, -2.2373046875, -0.875, 0.4873046875, 1.849609375, 3.2119140625, 4.57421875, 5.9365234375, 7.298828125, 8.6611328125, 10.0234375, 11.3857421875, 12.748046875, 14.1103515625, 15.47265625, 16.8349609375, 18.197265625, 19.5595703125, 20.921875, 22.2841796875, 23.646484375, 25.0087890625, 26.37109375, 27.7333984375, 29.095703125, 30.4580078125, 31.8203125, 33.1826171875, 34.544921875, 35.9072265625, 37.26953125, 38.6318359375, 39.994140625, 41.3564453125, 42.71875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 7.0, 5.0, 15.0, 9.0, 13.0, 19.0, 15.0, 22.0, 22.0, 30.0, 23.0, 28.0, 34.0, 44.0, 28.0, 38.0, 46.0, 41.0, 46.0, 40.0, 35.0, 47.0, 34.0, 41.0, 40.0, 34.0, 41.0, 30.0, 22.0, 21.0, 26.0, 19.0, 14.0, 11.0, 11.0, 8.0, 10.0, 6.0, 1.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.0, -18.427734375, -17.85546875, -17.283203125, -16.7109375, -16.138671875, -15.56640625, -14.994140625, -14.421875, -13.849609375, -13.27734375, -12.705078125, -12.1328125, -11.560546875, -10.98828125, -10.416015625, -9.84375, -9.271484375, -8.69921875, -8.126953125, -7.5546875, -6.982421875, -6.41015625, -5.837890625, -5.265625, -4.693359375, -4.12109375, -3.548828125, -2.9765625, -2.404296875, -1.83203125, -1.259765625, -0.6875, -0.115234375, 0.45703125, 1.029296875, 1.6015625, 2.173828125, 2.74609375, 3.318359375, 3.890625, 4.462890625, 5.03515625, 5.607421875, 6.1796875, 6.751953125, 7.32421875, 7.896484375, 8.46875, 9.041015625, 9.61328125, 10.185546875, 10.7578125, 11.330078125, 11.90234375, 12.474609375, 13.046875, 13.619140625, 14.19140625, 14.763671875, 15.3359375, 15.908203125, 16.48046875, 17.052734375, 17.625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 3.0, 10.0, 7.0, 11.0, 24.0, 29.0, 50.0, 54.0, 84.0, 150.0, 194.0, 265.0, 435.0, 597.0, 935.0, 1351.0, 2063.0, 3224.0, 5145.0, 8020.0, 13416.0, 22655.0, 40656.0, 75546.0, 141471.0, 220604.0, 214317.0, 133096.0, 70405.0, 37837.0, 21515.0, 12681.0, 7770.0, 4908.0, 3092.0, 1954.0, 1318.0, 864.0, 584.0, 389.0, 254.0, 184.0, 120.0, 76.0, 70.0, 33.0, 31.0, 23.0, 8.0, 9.0, 10.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-30.984375, -29.983154296875, -28.98193359375, -27.980712890625, -26.9794921875, -25.978271484375, -24.97705078125, -23.975830078125, -22.974609375, -21.973388671875, -20.97216796875, -19.970947265625, -18.9697265625, -17.968505859375, -16.96728515625, -15.966064453125, -14.96484375, -13.963623046875, -12.96240234375, -11.961181640625, -10.9599609375, -9.958740234375, -8.95751953125, -7.956298828125, -6.955078125, -5.953857421875, -4.95263671875, -3.951416015625, -2.9501953125, -1.948974609375, -0.94775390625, 0.053466796875, 1.0546875, 2.055908203125, 3.05712890625, 4.058349609375, 5.0595703125, 6.060791015625, 7.06201171875, 8.063232421875, 9.064453125, 10.065673828125, 11.06689453125, 12.068115234375, 13.0693359375, 14.070556640625, 15.07177734375, 16.072998046875, 17.07421875, 18.075439453125, 19.07666015625, 20.077880859375, 21.0791015625, 22.080322265625, 23.08154296875, 24.082763671875, 25.083984375, 26.085205078125, 27.08642578125, 28.087646484375, 29.0888671875, 30.090087890625, 31.09130859375, 32.092529296875, 33.09375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 0.0, 8.0, 1.0, 2.0, 6.0, 6.0, 9.0, 7.0, 10.0, 15.0, 19.0, 16.0, 13.0, 17.0, 19.0, 22.0, 16.0, 27.0, 27.0, 39.0, 27.0, 29.0, 32.0, 46.0, 33.0, 44.0, 32.0, 40.0, 33.0, 24.0, 29.0, 32.0, 37.0, 32.0, 37.0, 26.0, 34.0, 23.0, 17.0, 19.0, 9.0, 7.0, 15.0, 10.0, 13.0, 12.0, 8.0, 7.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.6640625, -12.2310791015625, -11.798095703125, -11.3651123046875, -10.93212890625, -10.4991455078125, -10.066162109375, -9.6331787109375, -9.2001953125, -8.7672119140625, -8.334228515625, -7.9012451171875, -7.46826171875, -7.0352783203125, -6.602294921875, -6.1693115234375, -5.736328125, -5.3033447265625, -4.870361328125, -4.4373779296875, -4.00439453125, -3.5714111328125, -3.138427734375, -2.7054443359375, -2.2724609375, -1.8394775390625, -1.406494140625, -0.9735107421875, -0.54052734375, -0.1075439453125, 0.325439453125, 0.7584228515625, 1.19140625, 1.6243896484375, 2.057373046875, 2.4903564453125, 2.92333984375, 3.3563232421875, 3.789306640625, 4.2222900390625, 4.6552734375, 5.0882568359375, 5.521240234375, 5.9542236328125, 6.38720703125, 6.8201904296875, 7.253173828125, 7.6861572265625, 8.119140625, 8.5521240234375, 8.985107421875, 9.4180908203125, 9.85107421875, 10.2840576171875, 10.717041015625, 11.1500244140625, 11.5830078125, 12.0159912109375, 12.448974609375, 12.8819580078125, 13.31494140625, 13.7479248046875, 14.180908203125, 14.6138916015625, 15.046875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 9.0, 12.0, 13.0, 11.0, 13.0, 22.0, 36.0, 45.0, 62.0, 74.0, 116.0, 148.0, 203.0, 275.0, 377.0, 482.0, 708.0, 1099.0, 1625.0, 2371.0, 3703.0, 6067.0, 10351.0, 18977.0, 37951.0, 91102.0, 262486.0, 359521.0, 138654.0, 53168.0, 24857.0, 12990.0, 7454.0, 4477.0, 2866.0, 1939.0, 1262.0, 850.0, 566.0, 473.0, 308.0, 198.0, 186.0, 115.0, 90.0, 79.0, 43.0, 30.0, 25.0, 25.0, 6.0, 15.0, 12.0, 6.0, 4.0, 0.0, 3.0, 3.0], "bins": [-61.21875, -59.375, -57.53125, -55.6875, -53.84375, -52.0, -50.15625, -48.3125, -46.46875, -44.625, -42.78125, -40.9375, -39.09375, -37.25, -35.40625, -33.5625, -31.71875, -29.875, -28.03125, -26.1875, -24.34375, -22.5, -20.65625, -18.8125, -16.96875, -15.125, -13.28125, -11.4375, -9.59375, -7.75, -5.90625, -4.0625, -2.21875, -0.375, 1.46875, 3.3125, 5.15625, 7.0, 8.84375, 10.6875, 12.53125, 14.375, 16.21875, 18.0625, 19.90625, 21.75, 23.59375, 25.4375, 27.28125, 29.125, 30.96875, 32.8125, 34.65625, 36.5, 38.34375, 40.1875, 42.03125, 43.875, 45.71875, 47.5625, 49.40625, 51.25, 53.09375, 54.9375, 56.78125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 5.0, 7.0, 6.0, 14.0, 12.0, 25.0, 44.0, 57.0, 67.0, 107.0, 145.0, 128.0, 104.0, 81.0, 59.0, 36.0, 23.0, 14.0, 17.0, 11.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005161285400390625, -0.004983842372894287, -0.004806399345397949, -0.004628956317901611, -0.0044515132904052734, -0.0042740702629089355, -0.004096627235412598, -0.00391918420791626, -0.003741741180419922, -0.003564298152923584, -0.003386855125427246, -0.003209412097930908, -0.0030319690704345703, -0.0028545260429382324, -0.0026770830154418945, -0.0024996399879455566, -0.0023221969604492188, -0.002144753932952881, -0.001967310905456543, -0.001789867877960205, -0.0016124248504638672, -0.0014349818229675293, -0.0012575387954711914, -0.0010800957679748535, -0.0009026527404785156, -0.0007252097129821777, -0.0005477666854858398, -0.00037032365798950195, -0.00019288063049316406, -1.5437602996826172e-05, 0.00016200542449951172, 0.0003394484519958496, 0.0005168914794921875, 0.0006943345069885254, 0.0008717775344848633, 0.0010492205619812012, 0.001226663589477539, 0.001404106616973877, 0.0015815496444702148, 0.0017589926719665527, 0.0019364356994628906, 0.0021138787269592285, 0.0022913217544555664, 0.0024687647819519043, 0.002646207809448242, 0.00282365083694458, 0.003001093864440918, 0.003178536891937256, 0.0033559799194335938, 0.0035334229469299316, 0.0037108659744262695, 0.0038883090019226074, 0.004065752029418945, 0.004243195056915283, 0.004420638084411621, 0.004598081111907959, 0.004775524139404297, 0.004952967166900635, 0.005130410194396973, 0.0053078532218933105, 0.0054852962493896484, 0.005662739276885986, 0.005840182304382324, 0.006017625331878662, 0.006195068359375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 10.0, 4.0, 8.0, 9.0, 10.0, 20.0, 28.0, 25.0, 33.0, 60.0, 50.0, 88.0, 104.0, 143.0, 174.0, 249.0, 346.0, 497.0, 732.0, 1058.0, 1680.0, 2881.0, 5376.0, 10425.0, 24858.0, 71642.0, 255669.0, 434636.0, 155413.0, 45859.0, 17354.0, 7980.0, 4253.0, 2340.0, 1325.0, 946.0, 664.0, 415.0, 302.0, 219.0, 162.0, 128.0, 76.0, 85.0, 58.0, 39.0, 35.0, 22.0, 15.0, 18.0, 10.0, 9.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0], "bins": [-59.90625, -57.99267578125, -56.0791015625, -54.16552734375, -52.251953125, -50.33837890625, -48.4248046875, -46.51123046875, -44.59765625, -42.68408203125, -40.7705078125, -38.85693359375, -36.943359375, -35.02978515625, -33.1162109375, -31.20263671875, -29.2890625, -27.37548828125, -25.4619140625, -23.54833984375, -21.634765625, -19.72119140625, -17.8076171875, -15.89404296875, -13.98046875, -12.06689453125, -10.1533203125, -8.23974609375, -6.326171875, -4.41259765625, -2.4990234375, -0.58544921875, 1.328125, 3.24169921875, 5.1552734375, 7.06884765625, 8.982421875, 10.89599609375, 12.8095703125, 14.72314453125, 16.63671875, 18.55029296875, 20.4638671875, 22.37744140625, 24.291015625, 26.20458984375, 28.1181640625, 30.03173828125, 31.9453125, 33.85888671875, 35.7724609375, 37.68603515625, 39.599609375, 41.51318359375, 43.4267578125, 45.34033203125, 47.25390625, 49.16748046875, 51.0810546875, 52.99462890625, 54.908203125, 56.82177734375, 58.7353515625, 60.64892578125, 62.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 9.0, 7.0, 9.0, 7.0, 9.0, 14.0, 16.0, 21.0, 37.0, 40.0, 48.0, 68.0, 80.0, 91.0, 91.0, 75.0, 84.0, 64.0, 42.0, 34.0, 40.0, 29.0, 20.0, 20.0, 6.0, 7.0, 3.0, 6.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.015625, -17.5037841796875, -16.991943359375, -16.4801025390625, -15.96826171875, -15.4564208984375, -14.944580078125, -14.4327392578125, -13.9208984375, -13.4090576171875, -12.897216796875, -12.3853759765625, -11.87353515625, -11.3616943359375, -10.849853515625, -10.3380126953125, -9.826171875, -9.3143310546875, -8.802490234375, -8.2906494140625, -7.77880859375, -7.2669677734375, -6.755126953125, -6.2432861328125, -5.7314453125, -5.2196044921875, -4.707763671875, -4.1959228515625, -3.68408203125, -3.1722412109375, -2.660400390625, -2.1485595703125, -1.63671875, -1.1248779296875, -0.613037109375, -0.1011962890625, 0.41064453125, 0.9224853515625, 1.434326171875, 1.9461669921875, 2.4580078125, 2.9698486328125, 3.481689453125, 3.9935302734375, 4.50537109375, 5.0172119140625, 5.529052734375, 6.0408935546875, 6.552734375, 7.0645751953125, 7.576416015625, 8.0882568359375, 8.60009765625, 9.1119384765625, 9.623779296875, 10.1356201171875, 10.6474609375, 11.1593017578125, 11.671142578125, 12.1829833984375, 12.69482421875, 13.2066650390625, 13.718505859375, 14.2303466796875, 14.7421875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 10.0, 13.0, 17.0, 25.0, 33.0, 40.0, 41.0, 68.0, 62.0, 71.0, 79.0, 80.0, 74.0, 82.0, 49.0, 52.0, 46.0, 38.0, 23.0, 17.0, 23.0, 10.0, 18.0, 4.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.158958435058594, -34.048431396484375, -32.937904357910156, -31.827377319335938, -30.71685028076172, -29.6063232421875, -28.49579620361328, -27.385269165039062, -26.274742126464844, -25.164215087890625, -24.053688049316406, -22.943161010742188, -21.83263397216797, -20.72210693359375, -19.61157989501953, -18.501052856445312, -17.39052391052246, -16.279996871948242, -15.169469833374023, -14.058942794799805, -12.948415756225586, -11.837888717651367, -10.727360725402832, -9.616833686828613, -8.506306648254395, -7.395779609680176, -6.285252571105957, -5.17472505569458, -4.064198017120361, -2.9536709785461426, -1.8431434631347656, -0.7326164245605469, 0.3779106140136719, 1.4884377717971802, 2.5989649295806885, 3.7094922065734863, 4.820019245147705, 5.930546283721924, 7.041073799133301, 8.15160083770752, 9.262127876281738, 10.372654914855957, 11.483181953430176, 12.593709945678711, 13.70423698425293, 14.814764022827148, 15.925291061401367, 17.035818099975586, 18.146345138549805, 19.256872177124023, 20.367399215698242, 21.47792625427246, 22.58845329284668, 23.6989803314209, 24.80950927734375, 25.92003631591797, 27.030563354492188, 28.141090393066406, 29.251617431640625, 30.362144470214844, 31.472671508789062, 32.58319854736328, 33.6937255859375, 34.80425262451172, 35.91477966308594]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 6.0, 9.0, 11.0, 10.0, 13.0, 14.0, 24.0, 19.0, 23.0, 23.0, 27.0, 34.0, 42.0, 41.0, 30.0, 44.0, 44.0, 43.0, 56.0, 64.0, 31.0, 46.0, 40.0, 35.0, 34.0, 36.0, 25.0, 21.0, 26.0, 12.0, 18.0, 22.0, 20.0, 8.0, 11.0, 10.0, 6.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0], "bins": [-25.682144165039062, -25.01441764831543, -24.34669303894043, -23.678966522216797, -23.011241912841797, -22.343515396118164, -21.675790786743164, -21.00806427001953, -20.34033966064453, -19.6726131439209, -19.0048885345459, -18.337162017822266, -17.669437408447266, -17.001710891723633, -16.333986282348633, -15.666259765625, -14.998534202575684, -14.330808639526367, -13.66308307647705, -12.995357513427734, -12.327631950378418, -11.659906387329102, -10.992179870605469, -10.324455261230469, -9.656728744506836, -8.98900318145752, -8.321277618408203, -7.653552055358887, -6.98582649230957, -6.318100929260254, -5.650374889373779, -4.982649326324463, -4.314924240112305, -3.6471986770629883, -2.979473114013672, -2.3117473125457764, -1.64402174949646, -0.9762961864471436, -0.30857038497924805, 0.35915517807006836, 1.0268807411193848, 1.6946063041687012, 2.3623318672180176, 3.030057668685913, 3.6977832317352295, 4.365509033203125, 5.033234596252441, 5.700960159301758, 6.368685722351074, 7.036411285400391, 7.704136848449707, 8.371862411499023, 9.03958797454834, 9.707313537597656, 10.375040054321289, 11.042764663696289, 11.710491180419922, 12.378216743469238, 13.045942306518555, 13.713667869567871, 14.381393432617188, 15.049118995666504, 15.71684455871582, 16.384571075439453, 17.052295684814453]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 0.0, 1.0, 10.0, 3.0, 8.0, 15.0, 19.0, 26.0, 29.0, 53.0, 59.0, 107.0, 130.0, 208.0, 274.0, 400.0, 563.0, 849.0, 1321.0, 1987.0, 3256.0, 5486.0, 9728.0, 18277.0, 36465.0, 78318.0, 189110.0, 481992.0, 1012605.0, 1180428.0, 680732.0, 276891.0, 111198.0, 49675.0, 23701.0, 12540.0, 6947.0, 3995.0, 2328.0, 1504.0, 954.0, 635.0, 448.0, 272.0, 217.0, 169.0, 111.0, 78.0, 44.0, 43.0, 29.0, 15.0, 15.0, 4.0, 7.0, 11.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-26.171875, -25.359130859375, -24.54638671875, -23.733642578125, -22.9208984375, -22.108154296875, -21.29541015625, -20.482666015625, -19.669921875, -18.857177734375, -18.04443359375, -17.231689453125, -16.4189453125, -15.606201171875, -14.79345703125, -13.980712890625, -13.16796875, -12.355224609375, -11.54248046875, -10.729736328125, -9.9169921875, -9.104248046875, -8.29150390625, -7.478759765625, -6.666015625, -5.853271484375, -5.04052734375, -4.227783203125, -3.4150390625, -2.602294921875, -1.78955078125, -0.976806640625, -0.1640625, 0.648681640625, 1.46142578125, 2.274169921875, 3.0869140625, 3.899658203125, 4.71240234375, 5.525146484375, 6.337890625, 7.150634765625, 7.96337890625, 8.776123046875, 9.5888671875, 10.401611328125, 11.21435546875, 12.027099609375, 12.83984375, 13.652587890625, 14.46533203125, 15.278076171875, 16.0908203125, 16.903564453125, 17.71630859375, 18.529052734375, 19.341796875, 20.154541015625, 20.96728515625, 21.780029296875, 22.5927734375, 23.405517578125, 24.21826171875, 25.031005859375, 25.84375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 6.0, 5.0, 11.0, 9.0, 9.0, 20.0, 17.0, 19.0, 28.0, 33.0, 38.0, 38.0, 42.0, 49.0, 36.0, 35.0, 53.0, 47.0, 52.0, 53.0, 33.0, 39.0, 36.0, 42.0, 36.0, 35.0, 24.0, 27.0, 21.0, 18.0, 14.0, 13.0, 11.0, 4.0, 13.0, 7.0, 10.0, 9.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.203125, -16.73779296875, -16.2724609375, -15.80712890625, -15.341796875, -14.87646484375, -14.4111328125, -13.94580078125, -13.48046875, -13.01513671875, -12.5498046875, -12.08447265625, -11.619140625, -11.15380859375, -10.6884765625, -10.22314453125, -9.7578125, -9.29248046875, -8.8271484375, -8.36181640625, -7.896484375, -7.43115234375, -6.9658203125, -6.50048828125, -6.03515625, -5.56982421875, -5.1044921875, -4.63916015625, -4.173828125, -3.70849609375, -3.2431640625, -2.77783203125, -2.3125, -1.84716796875, -1.3818359375, -0.91650390625, -0.451171875, 0.01416015625, 0.4794921875, 0.94482421875, 1.41015625, 1.87548828125, 2.3408203125, 2.80615234375, 3.271484375, 3.73681640625, 4.2021484375, 4.66748046875, 5.1328125, 5.59814453125, 6.0634765625, 6.52880859375, 6.994140625, 7.45947265625, 7.9248046875, 8.39013671875, 8.85546875, 9.32080078125, 9.7861328125, 10.25146484375, 10.716796875, 11.18212890625, 11.6474609375, 12.11279296875, 12.578125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 10.0, 2.0, 7.0, 18.0, 22.0, 30.0, 59.0, 91.0, 138.0, 225.0, 387.0, 639.0, 1103.0, 1928.0, 3652.0, 7004.0, 14974.0, 34399.0, 92583.0, 283054.0, 863133.0, 1504970.0, 915640.0, 304507.0, 98059.0, 36396.0, 15498.0, 7339.0, 3711.0, 1985.0, 1061.0, 603.0, 395.0, 238.0, 157.0, 95.0, 58.0, 45.0, 24.0, 10.0, 10.0, 11.0, 7.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.125, -31.037109375, -29.94921875, -28.861328125, -27.7734375, -26.685546875, -25.59765625, -24.509765625, -23.421875, -22.333984375, -21.24609375, -20.158203125, -19.0703125, -17.982421875, -16.89453125, -15.806640625, -14.71875, -13.630859375, -12.54296875, -11.455078125, -10.3671875, -9.279296875, -8.19140625, -7.103515625, -6.015625, -4.927734375, -3.83984375, -2.751953125, -1.6640625, -0.576171875, 0.51171875, 1.599609375, 2.6875, 3.775390625, 4.86328125, 5.951171875, 7.0390625, 8.126953125, 9.21484375, 10.302734375, 11.390625, 12.478515625, 13.56640625, 14.654296875, 15.7421875, 16.830078125, 17.91796875, 19.005859375, 20.09375, 21.181640625, 22.26953125, 23.357421875, 24.4453125, 25.533203125, 26.62109375, 27.708984375, 28.796875, 29.884765625, 30.97265625, 32.060546875, 33.1484375, 34.236328125, 35.32421875, 36.412109375, 37.5]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 3.0, 7.0, 10.0, 12.0, 19.0, 12.0, 24.0, 36.0, 50.0, 74.0, 66.0, 85.0, 113.0, 141.0, 176.0, 236.0, 237.0, 264.0, 289.0, 290.0, 269.0, 290.0, 264.0, 216.0, 168.0, 149.0, 118.0, 98.0, 79.0, 59.0, 45.0, 39.0, 31.0, 30.0, 9.0, 13.0, 18.0, 11.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.18359375, -6.93829345703125, -6.6929931640625, -6.44769287109375, -6.202392578125, -5.95709228515625, -5.7117919921875, -5.46649169921875, -5.22119140625, -4.97589111328125, -4.7305908203125, -4.48529052734375, -4.239990234375, -3.99468994140625, -3.7493896484375, -3.50408935546875, -3.2587890625, -3.01348876953125, -2.7681884765625, -2.52288818359375, -2.277587890625, -2.03228759765625, -1.7869873046875, -1.54168701171875, -1.29638671875, -1.05108642578125, -0.8057861328125, -0.56048583984375, -0.315185546875, -0.06988525390625, 0.1754150390625, 0.42071533203125, 0.666015625, 0.91131591796875, 1.1566162109375, 1.40191650390625, 1.647216796875, 1.89251708984375, 2.1378173828125, 2.38311767578125, 2.62841796875, 2.87371826171875, 3.1190185546875, 3.36431884765625, 3.609619140625, 3.85491943359375, 4.1002197265625, 4.34552001953125, 4.5908203125, 4.83612060546875, 5.0814208984375, 5.32672119140625, 5.572021484375, 5.81732177734375, 6.0626220703125, 6.30792236328125, 6.55322265625, 6.79852294921875, 7.0438232421875, 7.28912353515625, 7.534423828125, 7.77972412109375, 8.0250244140625, 8.27032470703125, 8.515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 9.0, 9.0, 15.0, 18.0, 32.0, 22.0, 55.0, 59.0, 69.0, 91.0, 100.0, 106.0, 82.0, 101.0, 62.0, 45.0, 35.0, 25.0, 16.0, 17.0, 13.0, 9.0, 7.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.2837028503418, -36.24574279785156, -35.207786560058594, -34.16982650756836, -33.131866455078125, -32.093910217285156, -31.055950164794922, -30.01799201965332, -28.98003387451172, -27.942075729370117, -26.904115676879883, -25.86615753173828, -24.82819938659668, -23.790241241455078, -22.752281188964844, -21.714323043823242, -20.676362991333008, -19.638404846191406, -18.600444793701172, -17.56248664855957, -16.52452850341797, -15.48656940460205, -14.448610305786133, -13.410652160644531, -12.372693061828613, -11.334733963012695, -10.296775817871094, -9.258816719055176, -8.220857620239258, -7.182899475097656, -6.144940376281738, -5.1069817543029785, -4.069023132324219, -3.031064510345459, -1.9931056499481201, -0.9551467895507812, 0.08281183242797852, 1.1207704544067383, 2.1587295532226562, 3.196688175201416, 4.234646797180176, 5.2726054191589355, 6.310564041137695, 7.348523139953613, 8.386482238769531, 9.424440383911133, 10.46239948272705, 11.500358581542969, 12.53831672668457, 13.576275825500488, 14.61423397064209, 15.652193069458008, 16.69015121459961, 17.728111267089844, 18.766069412231445, 19.804027557373047, 20.84198760986328, 21.879945755004883, 22.917905807495117, 23.95586395263672, 24.99382209777832, 26.031780242919922, 27.069740295410156, 28.107698440551758, 29.14565658569336]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 10.0, 6.0, 13.0, 7.0, 14.0, 18.0, 25.0, 22.0, 25.0, 22.0, 38.0, 29.0, 29.0, 38.0, 50.0, 50.0, 40.0, 43.0, 38.0, 37.0, 45.0, 48.0, 37.0, 35.0, 32.0, 31.0, 25.0, 22.0, 24.0, 25.0, 23.0, 21.0, 9.0, 17.0, 6.0, 7.0, 5.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-19.662553787231445, -19.122377395629883, -18.58220100402832, -18.042022705078125, -17.501846313476562, -16.961669921875, -16.421493530273438, -15.881317138671875, -15.341140747070312, -14.80096435546875, -14.260787010192871, -13.720610618591309, -13.180434226989746, -12.640256881713867, -12.100080490112305, -11.559904098510742, -11.019726753234863, -10.4795503616333, -9.939373016357422, -9.39919662475586, -8.859020233154297, -8.318843841552734, -7.7786664962768555, -7.238490104675293, -6.698313236236572, -6.158136367797852, -5.617959976196289, -5.077783107757568, -4.537606239318848, -3.997429847717285, -3.4572529792785645, -2.917076349258423, -2.3768997192382812, -1.8367230892181396, -1.2965463399887085, -0.7563695907592773, -0.21619296073913574, 0.32398366928100586, 0.8641605377197266, 1.4043371677398682, 1.9445137977600098, 2.4846904277801514, 3.024867057800293, 3.5650439262390137, 4.105220794677734, 4.645397186279297, 5.185574054718018, 5.725750923156738, 6.265927314758301, 6.8061041831970215, 7.346280574798584, 7.886457443237305, 8.426633834838867, 8.96681022644043, 9.506987571716309, 10.047163963317871, 10.58734130859375, 11.127517700195312, 11.667695045471191, 12.207871437072754, 12.748047828674316, 13.288225173950195, 13.828401565551758, 14.36857795715332, 14.908754348754883]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 6.0, 6.0, 5.0, 10.0, 21.0, 22.0, 27.0, 36.0, 50.0, 75.0, 100.0, 130.0, 203.0, 278.0, 396.0, 582.0, 815.0, 1219.0, 1731.0, 2697.0, 4228.0, 6765.0, 11326.0, 19186.0, 33777.0, 62785.0, 123059.0, 228251.0, 246222.0, 140449.0, 71329.0, 37613.0, 21316.0, 12522.0, 7502.0, 4717.0, 2992.0, 1912.0, 1235.0, 877.0, 607.0, 442.0, 289.0, 187.0, 176.0, 113.0, 67.0, 76.0, 48.0, 25.0, 20.0, 15.0, 11.0, 7.0, 10.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-30.859375, -29.89794921875, -28.9365234375, -27.97509765625, -27.013671875, -26.05224609375, -25.0908203125, -24.12939453125, -23.16796875, -22.20654296875, -21.2451171875, -20.28369140625, -19.322265625, -18.36083984375, -17.3994140625, -16.43798828125, -15.4765625, -14.51513671875, -13.5537109375, -12.59228515625, -11.630859375, -10.66943359375, -9.7080078125, -8.74658203125, -7.78515625, -6.82373046875, -5.8623046875, -4.90087890625, -3.939453125, -2.97802734375, -2.0166015625, -1.05517578125, -0.09375, 0.86767578125, 1.8291015625, 2.79052734375, 3.751953125, 4.71337890625, 5.6748046875, 6.63623046875, 7.59765625, 8.55908203125, 9.5205078125, 10.48193359375, 11.443359375, 12.40478515625, 13.3662109375, 14.32763671875, 15.2890625, 16.25048828125, 17.2119140625, 18.17333984375, 19.134765625, 20.09619140625, 21.0576171875, 22.01904296875, 22.98046875, 23.94189453125, 24.9033203125, 25.86474609375, 26.826171875, 27.78759765625, 28.7490234375, 29.71044921875, 30.671875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 5.0, 4.0, 10.0, 12.0, 13.0, 10.0, 16.0, 24.0, 30.0, 25.0, 24.0, 27.0, 29.0, 32.0, 46.0, 32.0, 37.0, 47.0, 49.0, 50.0, 44.0, 44.0, 34.0, 39.0, 29.0, 44.0, 23.0, 27.0, 23.0, 22.0, 17.0, 14.0, 20.0, 17.0, 16.0, 10.0, 15.0, 6.0, 7.0, 1.0, 4.0, 10.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-18.5625, -18.0382080078125, -17.513916015625, -16.9896240234375, -16.46533203125, -15.9410400390625, -15.416748046875, -14.8924560546875, -14.3681640625, -13.8438720703125, -13.319580078125, -12.7952880859375, -12.27099609375, -11.7467041015625, -11.222412109375, -10.6981201171875, -10.173828125, -9.6495361328125, -9.125244140625, -8.6009521484375, -8.07666015625, -7.5523681640625, -7.028076171875, -6.5037841796875, -5.9794921875, -5.4552001953125, -4.930908203125, -4.4066162109375, -3.88232421875, -3.3580322265625, -2.833740234375, -2.3094482421875, -1.78515625, -1.2608642578125, -0.736572265625, -0.2122802734375, 0.31201171875, 0.8363037109375, 1.360595703125, 1.8848876953125, 2.4091796875, 2.9334716796875, 3.457763671875, 3.9820556640625, 4.50634765625, 5.0306396484375, 5.554931640625, 6.0792236328125, 6.603515625, 7.1278076171875, 7.652099609375, 8.1763916015625, 8.70068359375, 9.2249755859375, 9.749267578125, 10.2735595703125, 10.7978515625, 11.3221435546875, 11.846435546875, 12.3707275390625, 12.89501953125, 13.4193115234375, 13.943603515625, 14.4678955078125, 14.9921875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 5.0, 13.0, 18.0, 23.0, 38.0, 54.0, 82.0, 97.0, 161.0, 228.0, 375.0, 596.0, 962.0, 1520.0, 2698.0, 4725.0, 8208.0, 15908.0, 32888.0, 73997.0, 199742.0, 393212.0, 180466.0, 67856.0, 30835.0, 14949.0, 7986.0, 4433.0, 2462.0, 1429.0, 923.0, 587.0, 344.0, 231.0, 161.0, 94.0, 77.0, 46.0, 36.0, 29.0, 15.0, 7.0, 9.0, 8.0, 2.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-45.25, -43.9365234375, -42.623046875, -41.3095703125, -39.99609375, -38.6826171875, -37.369140625, -36.0556640625, -34.7421875, -33.4287109375, -32.115234375, -30.8017578125, -29.48828125, -28.1748046875, -26.861328125, -25.5478515625, -24.234375, -22.9208984375, -21.607421875, -20.2939453125, -18.98046875, -17.6669921875, -16.353515625, -15.0400390625, -13.7265625, -12.4130859375, -11.099609375, -9.7861328125, -8.47265625, -7.1591796875, -5.845703125, -4.5322265625, -3.21875, -1.9052734375, -0.591796875, 0.7216796875, 2.03515625, 3.3486328125, 4.662109375, 5.9755859375, 7.2890625, 8.6025390625, 9.916015625, 11.2294921875, 12.54296875, 13.8564453125, 15.169921875, 16.4833984375, 17.796875, 19.1103515625, 20.423828125, 21.7373046875, 23.05078125, 24.3642578125, 25.677734375, 26.9912109375, 28.3046875, 29.6181640625, 30.931640625, 32.2451171875, 33.55859375, 34.8720703125, 36.185546875, 37.4990234375, 38.8125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 2.0, 11.0, 12.0, 6.0, 10.0, 10.0, 12.0, 15.0, 22.0, 27.0, 28.0, 27.0, 22.0, 27.0, 35.0, 46.0, 43.0, 46.0, 49.0, 51.0, 43.0, 42.0, 63.0, 28.0, 33.0, 30.0, 34.0, 30.0, 29.0, 25.0, 26.0, 15.0, 21.0, 18.0, 15.0, 12.0, 8.0, 5.0, 3.0, 7.0, 5.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.15625, -11.763916015625, -11.37158203125, -10.979248046875, -10.5869140625, -10.194580078125, -9.80224609375, -9.409912109375, -9.017578125, -8.625244140625, -8.23291015625, -7.840576171875, -7.4482421875, -7.055908203125, -6.66357421875, -6.271240234375, -5.87890625, -5.486572265625, -5.09423828125, -4.701904296875, -4.3095703125, -3.917236328125, -3.52490234375, -3.132568359375, -2.740234375, -2.347900390625, -1.95556640625, -1.563232421875, -1.1708984375, -0.778564453125, -0.38623046875, 0.006103515625, 0.3984375, 0.790771484375, 1.18310546875, 1.575439453125, 1.9677734375, 2.360107421875, 2.75244140625, 3.144775390625, 3.537109375, 3.929443359375, 4.32177734375, 4.714111328125, 5.1064453125, 5.498779296875, 5.89111328125, 6.283447265625, 6.67578125, 7.068115234375, 7.46044921875, 7.852783203125, 8.2451171875, 8.637451171875, 9.02978515625, 9.422119140625, 9.814453125, 10.206787109375, 10.59912109375, 10.991455078125, 11.3837890625, 11.776123046875, 12.16845703125, 12.560791015625, 12.953125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 15.0, 9.0, 21.0, 26.0, 22.0, 39.0, 36.0, 77.0, 100.0, 142.0, 193.0, 282.0, 422.0, 669.0, 970.0, 1492.0, 2399.0, 3941.0, 6787.0, 12799.0, 27673.0, 75725.0, 295074.0, 432505.0, 112975.0, 37151.0, 16169.0, 8173.0, 4600.0, 2820.0, 1807.0, 1102.0, 736.0, 504.0, 311.0, 250.0, 174.0, 97.0, 77.0, 49.0, 35.0, 31.0, 27.0, 14.0, 9.0, 7.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0], "bins": [-30.34375, -29.4287109375, -28.513671875, -27.5986328125, -26.68359375, -25.7685546875, -24.853515625, -23.9384765625, -23.0234375, -22.1083984375, -21.193359375, -20.2783203125, -19.36328125, -18.4482421875, -17.533203125, -16.6181640625, -15.703125, -14.7880859375, -13.873046875, -12.9580078125, -12.04296875, -11.1279296875, -10.212890625, -9.2978515625, -8.3828125, -7.4677734375, -6.552734375, -5.6376953125, -4.72265625, -3.8076171875, -2.892578125, -1.9775390625, -1.0625, -0.1474609375, 0.767578125, 1.6826171875, 2.59765625, 3.5126953125, 4.427734375, 5.3427734375, 6.2578125, 7.1728515625, 8.087890625, 9.0029296875, 9.91796875, 10.8330078125, 11.748046875, 12.6630859375, 13.578125, 14.4931640625, 15.408203125, 16.3232421875, 17.23828125, 18.1533203125, 19.068359375, 19.9833984375, 20.8984375, 21.8134765625, 22.728515625, 23.6435546875, 24.55859375, 25.4736328125, 26.388671875, 27.3037109375, 28.21875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 6.0, 8.0, 16.0, 6.0, 12.0, 24.0, 55.0, 74.0, 120.0, 165.0, 180.0, 96.0, 71.0, 36.0, 31.0, 13.0, 14.0, 11.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0026073455810546875, -0.0025326311588287354, -0.002457916736602783, -0.002383202314376831, -0.002308487892150879, -0.0022337734699249268, -0.0021590590476989746, -0.0020843446254730225, -0.0020096302032470703, -0.0019349157810211182, -0.001860201358795166, -0.0017854869365692139, -0.0017107725143432617, -0.0016360580921173096, -0.0015613436698913574, -0.0014866292476654053, -0.0014119148254394531, -0.001337200403213501, -0.0012624859809875488, -0.0011877715587615967, -0.0011130571365356445, -0.0010383427143096924, -0.0009636282920837402, -0.0008889138698577881, -0.0008141994476318359, -0.0007394850254058838, -0.0006647706031799316, -0.0005900561809539795, -0.0005153417587280273, -0.0004406273365020752, -0.00036591291427612305, -0.0002911984920501709, -0.00021648406982421875, -0.0001417696475982666, -6.705522537231445e-05, 7.659196853637695e-06, 8.237361907958984e-05, 0.000157088041305542, 0.00023180246353149414, 0.0003065168857574463, 0.00038123130798339844, 0.0004559457302093506, 0.0005306601524353027, 0.0006053745746612549, 0.000680088996887207, 0.0007548034191131592, 0.0008295178413391113, 0.0009042322635650635, 0.0009789466857910156, 0.0010536611080169678, 0.00112837553024292, 0.001203089952468872, 0.0012778043746948242, 0.0013525187969207764, 0.0014272332191467285, 0.0015019476413726807, 0.0015766620635986328, 0.001651376485824585, 0.0017260909080505371, 0.0018008053302764893, 0.0018755197525024414, 0.0019502341747283936, 0.0020249485969543457, 0.002099663019180298, 0.00217437744140625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 6.0, 8.0, 22.0, 18.0, 24.0, 48.0, 54.0, 62.0, 87.0, 151.0, 209.0, 312.0, 517.0, 730.0, 1097.0, 1633.0, 2732.0, 4273.0, 7241.0, 12758.0, 25490.0, 57481.0, 143500.0, 317207.0, 269719.0, 109830.0, 44866.0, 20990.0, 10791.0, 6195.0, 3798.0, 2325.0, 1454.0, 951.0, 622.0, 422.0, 304.0, 197.0, 132.0, 92.0, 68.0, 53.0, 29.0, 16.0, 16.0, 11.0, 11.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-23.4375, -22.76513671875, -22.0927734375, -21.42041015625, -20.748046875, -20.07568359375, -19.4033203125, -18.73095703125, -18.05859375, -17.38623046875, -16.7138671875, -16.04150390625, -15.369140625, -14.69677734375, -14.0244140625, -13.35205078125, -12.6796875, -12.00732421875, -11.3349609375, -10.66259765625, -9.990234375, -9.31787109375, -8.6455078125, -7.97314453125, -7.30078125, -6.62841796875, -5.9560546875, -5.28369140625, -4.611328125, -3.93896484375, -3.2666015625, -2.59423828125, -1.921875, -1.24951171875, -0.5771484375, 0.09521484375, 0.767578125, 1.43994140625, 2.1123046875, 2.78466796875, 3.45703125, 4.12939453125, 4.8017578125, 5.47412109375, 6.146484375, 6.81884765625, 7.4912109375, 8.16357421875, 8.8359375, 9.50830078125, 10.1806640625, 10.85302734375, 11.525390625, 12.19775390625, 12.8701171875, 13.54248046875, 14.21484375, 14.88720703125, 15.5595703125, 16.23193359375, 16.904296875, 17.57666015625, 18.2490234375, 18.92138671875, 19.59375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 1.0, 8.0, 4.0, 4.0, 5.0, 7.0, 9.0, 19.0, 12.0, 21.0, 23.0, 35.0, 31.0, 57.0, 65.0, 87.0, 84.0, 104.0, 79.0, 79.0, 50.0, 31.0, 37.0, 24.0, 34.0, 17.0, 15.0, 4.0, 4.0, 7.0, 5.0, 5.0, 9.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.578125, -5.380126953125, -5.18212890625, -4.984130859375, -4.7861328125, -4.588134765625, -4.39013671875, -4.192138671875, -3.994140625, -3.796142578125, -3.59814453125, -3.400146484375, -3.2021484375, -3.004150390625, -2.80615234375, -2.608154296875, -2.41015625, -2.212158203125, -2.01416015625, -1.816162109375, -1.6181640625, -1.420166015625, -1.22216796875, -1.024169921875, -0.826171875, -0.628173828125, -0.43017578125, -0.232177734375, -0.0341796875, 0.163818359375, 0.36181640625, 0.559814453125, 0.7578125, 0.955810546875, 1.15380859375, 1.351806640625, 1.5498046875, 1.747802734375, 1.94580078125, 2.143798828125, 2.341796875, 2.539794921875, 2.73779296875, 2.935791015625, 3.1337890625, 3.331787109375, 3.52978515625, 3.727783203125, 3.92578125, 4.123779296875, 4.32177734375, 4.519775390625, 4.7177734375, 4.915771484375, 5.11376953125, 5.311767578125, 5.509765625, 5.707763671875, 5.90576171875, 6.103759765625, 6.3017578125, 6.499755859375, 6.69775390625, 6.895751953125, 7.09375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 9.0, 14.0, 17.0, 26.0, 26.0, 22.0, 47.0, 67.0, 86.0, 92.0, 96.0, 110.0, 99.0, 70.0, 52.0, 49.0, 27.0, 27.0, 23.0, 15.0, 9.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.76021194458008, -33.79523468017578, -32.830257415771484, -31.865278244018555, -30.900300979614258, -29.93532371520996, -28.97034454345703, -28.005367279052734, -27.040390014648438, -26.07541275024414, -25.110435485839844, -24.145456314086914, -23.180479049682617, -22.21550178527832, -21.25052261352539, -20.285545349121094, -19.320568084716797, -18.3555908203125, -17.390613555908203, -16.425634384155273, -15.460657119750977, -14.49567985534668, -13.530701637268066, -12.565723419189453, -11.600746154785156, -10.63576889038086, -9.670790672302246, -8.705812454223633, -7.740835189819336, -6.775857448577881, -5.810879707336426, -4.845901966094971, -3.880922317504883, -2.9159445762634277, -1.9509668350219727, -0.9859890937805176, -0.0210113525390625, 0.9439663887023926, 1.9089441299438477, 2.8739218711853027, 3.838899612426758, 4.803877353668213, 5.768855094909668, 6.733832836151123, 7.698810577392578, 8.663787841796875, 9.628766059875488, 10.593744277954102, 11.558721542358398, 12.523698806762695, 13.488677024841309, 14.453655242919922, 15.418632507324219, 16.383609771728516, 17.348587036132812, 18.313566207885742, 19.27854347229004, 20.243520736694336, 21.208499908447266, 22.173477172851562, 23.13845443725586, 24.103431701660156, 25.068408966064453, 26.033388137817383, 26.99836540222168]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 3.0, 7.0, 11.0, 11.0, 11.0, 16.0, 24.0, 21.0, 20.0, 20.0, 26.0, 24.0, 32.0, 36.0, 35.0, 38.0, 42.0, 45.0, 27.0, 51.0, 45.0, 38.0, 37.0, 42.0, 36.0, 34.0, 28.0, 37.0, 22.0, 19.0, 19.0, 23.0, 21.0, 17.0, 15.0, 13.0, 14.0, 7.0, 2.0, 5.0, 4.0, 12.0, 0.0, 3.0, 4.0, 1.0, 2.0], "bins": [-18.848363876342773, -18.33615493774414, -17.823945999145508, -17.311737060546875, -16.799528121948242, -16.28731918334961, -15.775110244750977, -15.262901306152344, -14.750692367553711, -14.238483428955078, -13.726274490356445, -13.214065551757812, -12.70185661315918, -12.189647674560547, -11.677438735961914, -11.165229797363281, -10.653019905090332, -10.1408109664917, -9.628602027893066, -9.116393089294434, -8.6041841506958, -8.091975212097168, -7.579765796661377, -7.067556858062744, -6.555347919464111, -6.0431389808654785, -5.530930042266846, -5.018720626831055, -4.506511688232422, -3.994302988052368, -3.4820938110351562, -2.9698848724365234, -2.4576759338378906, -1.9454669952392578, -1.4332579374313354, -0.9210488796234131, -0.4088399410247803, 0.10336899757385254, 0.6155781745910645, 1.1277871131896973, 1.63999605178833, 2.152204990386963, 2.6644139289855957, 3.1766231060028076, 3.6888320446014404, 4.201041221618652, 4.713250160217285, 5.225459098815918, 5.737668037414551, 6.249876976013184, 6.762085914611816, 7.274294853210449, 7.786503791809082, 8.298712730407715, 8.810922622680664, 9.323131561279297, 9.83534049987793, 10.347549438476562, 10.859758377075195, 11.371967315673828, 11.884176254272461, 12.396385192871094, 12.908594131469727, 13.42080307006836, 13.933012008666992]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 12.0, 12.0, 12.0, 17.0, 30.0, 42.0, 44.0, 70.0, 98.0, 137.0, 184.0, 289.0, 443.0, 639.0, 1032.0, 1677.0, 2718.0, 4701.0, 8176.0, 14723.0, 27208.0, 50536.0, 92392.0, 155488.0, 208755.0, 192348.0, 127225.0, 71836.0, 39098.0, 20855.0, 11583.0, 6468.0, 3685.0, 2198.0, 1296.0, 821.0, 549.0, 357.0, 216.0, 164.0, 100.0, 85.0, 60.0, 58.0, 34.0, 27.0, 16.0, 16.0, 7.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 5.0, 2.0], "bins": [-24.671875, -23.895751953125, -23.11962890625, -22.343505859375, -21.5673828125, -20.791259765625, -20.01513671875, -19.239013671875, -18.462890625, -17.686767578125, -16.91064453125, -16.134521484375, -15.3583984375, -14.582275390625, -13.80615234375, -13.030029296875, -12.25390625, -11.477783203125, -10.70166015625, -9.925537109375, -9.1494140625, -8.373291015625, -7.59716796875, -6.821044921875, -6.044921875, -5.268798828125, -4.49267578125, -3.716552734375, -2.9404296875, -2.164306640625, -1.38818359375, -0.612060546875, 0.1640625, 0.940185546875, 1.71630859375, 2.492431640625, 3.2685546875, 4.044677734375, 4.82080078125, 5.596923828125, 6.373046875, 7.149169921875, 7.92529296875, 8.701416015625, 9.4775390625, 10.253662109375, 11.02978515625, 11.805908203125, 12.58203125, 13.358154296875, 14.13427734375, 14.910400390625, 15.6865234375, 16.462646484375, 17.23876953125, 18.014892578125, 18.791015625, 19.567138671875, 20.34326171875, 21.119384765625, 21.8955078125, 22.671630859375, 23.44775390625, 24.223876953125, 25.0]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 9.0, 9.0, 7.0, 12.0, 13.0, 15.0, 23.0, 27.0, 26.0, 26.0, 21.0, 29.0, 41.0, 35.0, 29.0, 48.0, 42.0, 44.0, 43.0, 56.0, 35.0, 42.0, 40.0, 31.0, 32.0, 30.0, 40.0, 26.0, 20.0, 20.0, 25.0, 17.0, 15.0, 16.0, 14.0, 7.0, 5.0, 9.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.015625, -19.498046875, -18.98046875, -18.462890625, -17.9453125, -17.427734375, -16.91015625, -16.392578125, -15.875, -15.357421875, -14.83984375, -14.322265625, -13.8046875, -13.287109375, -12.76953125, -12.251953125, -11.734375, -11.216796875, -10.69921875, -10.181640625, -9.6640625, -9.146484375, -8.62890625, -8.111328125, -7.59375, -7.076171875, -6.55859375, -6.041015625, -5.5234375, -5.005859375, -4.48828125, -3.970703125, -3.453125, -2.935546875, -2.41796875, -1.900390625, -1.3828125, -0.865234375, -0.34765625, 0.169921875, 0.6875, 1.205078125, 1.72265625, 2.240234375, 2.7578125, 3.275390625, 3.79296875, 4.310546875, 4.828125, 5.345703125, 5.86328125, 6.380859375, 6.8984375, 7.416015625, 7.93359375, 8.451171875, 8.96875, 9.486328125, 10.00390625, 10.521484375, 11.0390625, 11.556640625, 12.07421875, 12.591796875, 13.109375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 13.0, 18.0, 16.0, 29.0, 53.0, 71.0, 95.0, 157.0, 261.0, 475.0, 759.0, 1350.0, 2343.0, 4291.0, 8288.0, 15986.0, 32683.0, 68361.0, 134378.0, 217507.0, 234706.0, 160673.0, 83622.0, 40690.0, 19781.0, 9983.0, 5133.0, 2865.0, 1612.0, 924.0, 519.0, 348.0, 200.0, 131.0, 59.0, 73.0, 31.0, 23.0, 10.0, 13.0, 8.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.78125, -21.942138671875, -21.10302734375, -20.263916015625, -19.4248046875, -18.585693359375, -17.74658203125, -16.907470703125, -16.068359375, -15.229248046875, -14.39013671875, -13.551025390625, -12.7119140625, -11.872802734375, -11.03369140625, -10.194580078125, -9.35546875, -8.516357421875, -7.67724609375, -6.838134765625, -5.9990234375, -5.159912109375, -4.32080078125, -3.481689453125, -2.642578125, -1.803466796875, -0.96435546875, -0.125244140625, 0.7138671875, 1.552978515625, 2.39208984375, 3.231201171875, 4.0703125, 4.909423828125, 5.74853515625, 6.587646484375, 7.4267578125, 8.265869140625, 9.10498046875, 9.944091796875, 10.783203125, 11.622314453125, 12.46142578125, 13.300537109375, 14.1396484375, 14.978759765625, 15.81787109375, 16.656982421875, 17.49609375, 18.335205078125, 19.17431640625, 20.013427734375, 20.8525390625, 21.691650390625, 22.53076171875, 23.369873046875, 24.208984375, 25.048095703125, 25.88720703125, 26.726318359375, 27.5654296875, 28.404541015625, 29.24365234375, 30.082763671875, 30.921875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 1.0, 1.0, 6.0, 5.0, 4.0, 13.0, 7.0, 7.0, 14.0, 15.0, 36.0, 28.0, 15.0, 26.0, 22.0, 16.0, 34.0, 24.0, 24.0, 38.0, 43.0, 38.0, 34.0, 46.0, 38.0, 47.0, 49.0, 32.0, 44.0, 34.0, 27.0, 33.0, 33.0, 26.0, 17.0, 17.0, 17.0, 15.0, 11.0, 17.0, 12.0, 9.0, 4.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-11.9375, -11.574951171875, -11.21240234375, -10.849853515625, -10.4873046875, -10.124755859375, -9.76220703125, -9.399658203125, -9.037109375, -8.674560546875, -8.31201171875, -7.949462890625, -7.5869140625, -7.224365234375, -6.86181640625, -6.499267578125, -6.13671875, -5.774169921875, -5.41162109375, -5.049072265625, -4.6865234375, -4.323974609375, -3.96142578125, -3.598876953125, -3.236328125, -2.873779296875, -2.51123046875, -2.148681640625, -1.7861328125, -1.423583984375, -1.06103515625, -0.698486328125, -0.3359375, 0.026611328125, 0.38916015625, 0.751708984375, 1.1142578125, 1.476806640625, 1.83935546875, 2.201904296875, 2.564453125, 2.927001953125, 3.28955078125, 3.652099609375, 4.0146484375, 4.377197265625, 4.73974609375, 5.102294921875, 5.46484375, 5.827392578125, 6.18994140625, 6.552490234375, 6.9150390625, 7.277587890625, 7.64013671875, 8.002685546875, 8.365234375, 8.727783203125, 9.09033203125, 9.452880859375, 9.8154296875, 10.177978515625, 10.54052734375, 10.903076171875, 11.265625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 12.0, 18.0, 18.0, 40.0, 59.0, 90.0, 126.0, 191.0, 295.0, 362.0, 603.0, 1008.0, 1512.0, 2628.0, 4468.0, 7970.0, 15788.0, 33204.0, 79549.0, 217725.0, 368834.0, 184525.0, 68239.0, 29288.0, 13986.0, 7495.0, 4094.0, 2328.0, 1516.0, 904.0, 612.0, 353.0, 228.0, 166.0, 98.0, 56.0, 52.0, 39.0, 23.0, 19.0, 13.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.625, -37.46923828125, -36.3134765625, -35.15771484375, -34.001953125, -32.84619140625, -31.6904296875, -30.53466796875, -29.37890625, -28.22314453125, -27.0673828125, -25.91162109375, -24.755859375, -23.60009765625, -22.4443359375, -21.28857421875, -20.1328125, -18.97705078125, -17.8212890625, -16.66552734375, -15.509765625, -14.35400390625, -13.1982421875, -12.04248046875, -10.88671875, -9.73095703125, -8.5751953125, -7.41943359375, -6.263671875, -5.10791015625, -3.9521484375, -2.79638671875, -1.640625, -0.48486328125, 0.6708984375, 1.82666015625, 2.982421875, 4.13818359375, 5.2939453125, 6.44970703125, 7.60546875, 8.76123046875, 9.9169921875, 11.07275390625, 12.228515625, 13.38427734375, 14.5400390625, 15.69580078125, 16.8515625, 18.00732421875, 19.1630859375, 20.31884765625, 21.474609375, 22.63037109375, 23.7861328125, 24.94189453125, 26.09765625, 27.25341796875, 28.4091796875, 29.56494140625, 30.720703125, 31.87646484375, 33.0322265625, 34.18798828125, 35.34375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 8.0, 6.0, 3.0, 3.0, 6.0, 7.0, 10.0, 13.0, 24.0, 33.0, 38.0, 58.0, 52.0, 63.0, 73.0, 81.0, 78.0, 77.0, 70.0, 54.0, 49.0, 49.0, 26.0, 28.0, 16.0, 14.0, 10.0, 7.0, 11.0, 8.0, 4.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002002716064453125, -0.0019365549087524414, -0.0018703937530517578, -0.0018042325973510742, -0.0017380714416503906, -0.001671910285949707, -0.0016057491302490234, -0.0015395879745483398, -0.0014734268188476562, -0.0014072656631469727, -0.001341104507446289, -0.0012749433517456055, -0.0012087821960449219, -0.0011426210403442383, -0.0010764598846435547, -0.001010298728942871, -0.0009441375732421875, -0.0008779764175415039, -0.0008118152618408203, -0.0007456541061401367, -0.0006794929504394531, -0.0006133317947387695, -0.0005471706390380859, -0.00048100948333740234, -0.00041484832763671875, -0.00034868717193603516, -0.00028252601623535156, -0.00021636486053466797, -0.00015020370483398438, -8.404254913330078e-05, -1.7881393432617188e-05, 4.8279762268066406e-05, 0.00011444091796875, 0.0001806020736694336, 0.0002467632293701172, 0.0003129243850708008, 0.0003790855407714844, 0.00044524669647216797, 0.0005114078521728516, 0.0005775690078735352, 0.0006437301635742188, 0.0007098913192749023, 0.0007760524749755859, 0.0008422136306762695, 0.0009083747863769531, 0.0009745359420776367, 0.0010406970977783203, 0.001106858253479004, 0.0011730194091796875, 0.001239180564880371, 0.0013053417205810547, 0.0013715028762817383, 0.0014376640319824219, 0.0015038251876831055, 0.001569986343383789, 0.0016361474990844727, 0.0017023086547851562, 0.0017684698104858398, 0.0018346309661865234, 0.001900792121887207, 0.0019669532775878906, 0.0020331144332885742, 0.002099275588989258, 0.0021654367446899414, 0.002231597900390625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 0.0, 5.0, 9.0, 9.0, 5.0, 15.0, 25.0, 25.0, 36.0, 51.0, 55.0, 105.0, 116.0, 187.0, 277.0, 443.0, 645.0, 949.0, 1577.0, 2885.0, 5283.0, 10742.0, 25981.0, 73518.0, 230999.0, 401591.0, 190337.0, 59934.0, 22018.0, 9492.0, 4553.0, 2465.0, 1420.0, 898.0, 564.0, 388.0, 264.0, 187.0, 146.0, 85.0, 71.0, 55.0, 41.0, 35.0, 29.0, 19.0, 8.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.8125, -34.67236328125, -33.5322265625, -32.39208984375, -31.251953125, -30.11181640625, -28.9716796875, -27.83154296875, -26.69140625, -25.55126953125, -24.4111328125, -23.27099609375, -22.130859375, -20.99072265625, -19.8505859375, -18.71044921875, -17.5703125, -16.43017578125, -15.2900390625, -14.14990234375, -13.009765625, -11.86962890625, -10.7294921875, -9.58935546875, -8.44921875, -7.30908203125, -6.1689453125, -5.02880859375, -3.888671875, -2.74853515625, -1.6083984375, -0.46826171875, 0.671875, 1.81201171875, 2.9521484375, 4.09228515625, 5.232421875, 6.37255859375, 7.5126953125, 8.65283203125, 9.79296875, 10.93310546875, 12.0732421875, 13.21337890625, 14.353515625, 15.49365234375, 16.6337890625, 17.77392578125, 18.9140625, 20.05419921875, 21.1943359375, 22.33447265625, 23.474609375, 24.61474609375, 25.7548828125, 26.89501953125, 28.03515625, 29.17529296875, 30.3154296875, 31.45556640625, 32.595703125, 33.73583984375, 34.8759765625, 36.01611328125, 37.15625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 1.0, 1.0, 6.0, 3.0, 1.0, 5.0, 6.0, 11.0, 6.0, 12.0, 16.0, 19.0, 26.0, 35.0, 36.0, 37.0, 54.0, 78.0, 74.0, 90.0, 81.0, 72.0, 53.0, 66.0, 45.0, 38.0, 26.0, 31.0, 15.0, 10.0, 9.0, 14.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5703125, -9.2255859375, -8.880859375, -8.5361328125, -8.19140625, -7.8466796875, -7.501953125, -7.1572265625, -6.8125, -6.4677734375, -6.123046875, -5.7783203125, -5.43359375, -5.0888671875, -4.744140625, -4.3994140625, -4.0546875, -3.7099609375, -3.365234375, -3.0205078125, -2.67578125, -2.3310546875, -1.986328125, -1.6416015625, -1.296875, -0.9521484375, -0.607421875, -0.2626953125, 0.08203125, 0.4267578125, 0.771484375, 1.1162109375, 1.4609375, 1.8056640625, 2.150390625, 2.4951171875, 2.83984375, 3.1845703125, 3.529296875, 3.8740234375, 4.21875, 4.5634765625, 4.908203125, 5.2529296875, 5.59765625, 5.9423828125, 6.287109375, 6.6318359375, 6.9765625, 7.3212890625, 7.666015625, 8.0107421875, 8.35546875, 8.7001953125, 9.044921875, 9.3896484375, 9.734375, 10.0791015625, 10.423828125, 10.7685546875, 11.11328125, 11.4580078125, 11.802734375, 12.1474609375, 12.4921875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 6.0, 5.0, 16.0, 16.0, 16.0, 27.0, 36.0, 49.0, 40.0, 64.0, 79.0, 87.0, 88.0, 93.0, 77.0, 69.0, 39.0, 57.0, 31.0, 33.0, 15.0, 16.0, 11.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.420326232910156, -33.53227233886719, -32.644222259521484, -31.75617027282715, -30.868118286132812, -29.980066299438477, -29.09201431274414, -28.203962326049805, -27.31591033935547, -26.427858352661133, -25.539806365966797, -24.65175437927246, -23.763702392578125, -22.87565040588379, -21.987598419189453, -21.099546432495117, -20.21149444580078, -19.323442459106445, -18.43539047241211, -17.547338485717773, -16.659286499023438, -15.771234512329102, -14.883182525634766, -13.99513053894043, -13.107078552246094, -12.219026565551758, -11.330974578857422, -10.442922592163086, -9.55487060546875, -8.666818618774414, -7.778766632080078, -6.890714645385742, -6.002662658691406, -5.11461067199707, -4.226558685302734, -3.3385066986083984, -2.4504547119140625, -1.5624027252197266, -0.6743507385253906, 0.2137012481689453, 1.1017532348632812, 1.9898052215576172, 2.877857208251953, 3.765909194946289, 4.653961181640625, 5.542013168334961, 6.430065155029297, 7.318117141723633, 8.206169128417969, 9.094221115112305, 9.98227310180664, 10.870325088500977, 11.758377075195312, 12.646429061889648, 13.534481048583984, 14.42253303527832, 15.310585021972656, 16.198637008666992, 17.086688995361328, 17.974740982055664, 18.86279296875, 19.750844955444336, 20.638896942138672, 21.526948928833008, 22.415000915527344]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 2.0, 5.0, 6.0, 8.0, 10.0, 13.0, 11.0, 17.0, 20.0, 17.0, 23.0, 26.0, 32.0, 28.0, 42.0, 31.0, 48.0, 40.0, 39.0, 57.0, 34.0, 36.0, 47.0, 45.0, 38.0, 38.0, 34.0, 31.0, 45.0, 22.0, 22.0, 31.0, 22.0, 13.0, 21.0, 9.0, 6.0, 13.0, 6.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.10556411743164, -19.556655883789062, -19.007749557495117, -18.45884132385254, -17.909934997558594, -17.361026763916016, -16.812118530273438, -16.263212203979492, -15.714303970336914, -15.165396690368652, -14.61648941040039, -14.067581176757812, -13.51867389678955, -12.969766616821289, -12.420858383178711, -11.87195110321045, -11.323043823242188, -10.774136543273926, -10.225229263305664, -9.676321029663086, -9.127413749694824, -8.578506469726562, -8.029598236083984, -7.480690956115723, -6.931783676147461, -6.382876396179199, -5.833968639373779, -5.285060882568359, -4.736153602600098, -4.187246322631836, -3.638338565826416, -3.089431047439575, -2.540524482727051, -1.99161696434021, -1.4427094459533691, -0.8938019275665283, -0.3448944091796875, 0.20401310920715332, 0.7529206275939941, 1.301828145980835, 1.8507356643676758, 2.3996431827545166, 2.9485507011413574, 3.4974582195281982, 4.046365737915039, 4.595273017883301, 5.144180774688721, 5.693088531494141, 6.241995811462402, 6.790903091430664, 7.339810848236084, 7.888718605041504, 8.437625885009766, 8.986533164978027, 9.535440444946289, 10.084348678588867, 10.633255958557129, 11.18216323852539, 11.731071472167969, 12.27997875213623, 12.828886032104492, 13.377793312072754, 13.926700592041016, 14.475608825683594, 15.024516105651855]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 9.0, 17.0, 26.0, 17.0, 23.0, 41.0, 46.0, 84.0, 137.0, 203.0, 302.0, 408.0, 657.0, 964.0, 1524.0, 2395.0, 3938.0, 7138.0, 13333.0, 27064.0, 61491.0, 158531.0, 463907.0, 1142940.0, 1320206.0, 626961.0, 212786.0, 78153.0, 33675.0, 15998.0, 8405.0, 4866.0, 2764.0, 1701.0, 1191.0, 757.0, 514.0, 324.0, 233.0, 186.0, 118.0, 84.0, 46.0, 37.0, 28.0, 18.0, 18.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.484375, -23.72265625, -22.9609375, -22.19921875, -21.4375, -20.67578125, -19.9140625, -19.15234375, -18.390625, -17.62890625, -16.8671875, -16.10546875, -15.34375, -14.58203125, -13.8203125, -13.05859375, -12.296875, -11.53515625, -10.7734375, -10.01171875, -9.25, -8.48828125, -7.7265625, -6.96484375, -6.203125, -5.44140625, -4.6796875, -3.91796875, -3.15625, -2.39453125, -1.6328125, -0.87109375, -0.109375, 0.65234375, 1.4140625, 2.17578125, 2.9375, 3.69921875, 4.4609375, 5.22265625, 5.984375, 6.74609375, 7.5078125, 8.26953125, 9.03125, 9.79296875, 10.5546875, 11.31640625, 12.078125, 12.83984375, 13.6015625, 14.36328125, 15.125, 15.88671875, 16.6484375, 17.41015625, 18.171875, 18.93359375, 19.6953125, 20.45703125, 21.21875, 21.98046875, 22.7421875, 23.50390625, 24.265625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 13.0, 10.0, 15.0, 11.0, 20.0, 13.0, 25.0, 27.0, 25.0, 25.0, 34.0, 30.0, 52.0, 45.0, 39.0, 47.0, 45.0, 32.0, 48.0, 38.0, 39.0, 37.0, 35.0, 40.0, 32.0, 35.0, 25.0, 15.0, 31.0, 14.0, 10.0, 21.0, 15.0, 10.0, 10.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0], "bins": [-13.609375, -13.254150390625, -12.89892578125, -12.543701171875, -12.1884765625, -11.833251953125, -11.47802734375, -11.122802734375, -10.767578125, -10.412353515625, -10.05712890625, -9.701904296875, -9.3466796875, -8.991455078125, -8.63623046875, -8.281005859375, -7.92578125, -7.570556640625, -7.21533203125, -6.860107421875, -6.5048828125, -6.149658203125, -5.79443359375, -5.439208984375, -5.083984375, -4.728759765625, -4.37353515625, -4.018310546875, -3.6630859375, -3.307861328125, -2.95263671875, -2.597412109375, -2.2421875, -1.886962890625, -1.53173828125, -1.176513671875, -0.8212890625, -0.466064453125, -0.11083984375, 0.244384765625, 0.599609375, 0.954833984375, 1.31005859375, 1.665283203125, 2.0205078125, 2.375732421875, 2.73095703125, 3.086181640625, 3.44140625, 3.796630859375, 4.15185546875, 4.507080078125, 4.8623046875, 5.217529296875, 5.57275390625, 5.927978515625, 6.283203125, 6.638427734375, 6.99365234375, 7.348876953125, 7.7041015625, 8.059326171875, 8.41455078125, 8.769775390625, 9.125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 14.0, 24.0, 24.0, 48.0, 69.0, 116.0, 145.0, 250.0, 390.0, 586.0, 915.0, 1375.0, 2298.0, 3767.0, 6473.0, 11448.0, 21063.0, 42234.0, 93501.0, 232140.0, 593061.0, 1161019.0, 1108769.0, 536457.0, 208841.0, 84433.0, 38944.0, 19445.0, 10574.0, 6112.0, 3647.0, 2198.0, 1421.0, 886.0, 545.0, 374.0, 205.0, 151.0, 86.0, 67.0, 54.0, 34.0, 29.0, 12.0, 7.0, 9.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.28125, -20.593505859375, -19.90576171875, -19.218017578125, -18.5302734375, -17.842529296875, -17.15478515625, -16.467041015625, -15.779296875, -15.091552734375, -14.40380859375, -13.716064453125, -13.0283203125, -12.340576171875, -11.65283203125, -10.965087890625, -10.27734375, -9.589599609375, -8.90185546875, -8.214111328125, -7.5263671875, -6.838623046875, -6.15087890625, -5.463134765625, -4.775390625, -4.087646484375, -3.39990234375, -2.712158203125, -2.0244140625, -1.336669921875, -0.64892578125, 0.038818359375, 0.7265625, 1.414306640625, 2.10205078125, 2.789794921875, 3.4775390625, 4.165283203125, 4.85302734375, 5.540771484375, 6.228515625, 6.916259765625, 7.60400390625, 8.291748046875, 8.9794921875, 9.667236328125, 10.35498046875, 11.042724609375, 11.73046875, 12.418212890625, 13.10595703125, 13.793701171875, 14.4814453125, 15.169189453125, 15.85693359375, 16.544677734375, 17.232421875, 17.920166015625, 18.60791015625, 19.295654296875, 19.9833984375, 20.671142578125, 21.35888671875, 22.046630859375, 22.734375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 6.0, 7.0, 9.0, 10.0, 13.0, 16.0, 29.0, 25.0, 40.0, 49.0, 72.0, 89.0, 91.0, 125.0, 167.0, 229.0, 245.0, 266.0, 285.0, 343.0, 304.0, 297.0, 265.0, 244.0, 192.0, 160.0, 120.0, 87.0, 75.0, 53.0, 31.0, 44.0, 20.0, 13.0, 20.0, 7.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.05078125, -6.83477783203125, -6.6187744140625, -6.40277099609375, -6.186767578125, -5.97076416015625, -5.7547607421875, -5.53875732421875, -5.32275390625, -5.10675048828125, -4.8907470703125, -4.67474365234375, -4.458740234375, -4.24273681640625, -4.0267333984375, -3.81072998046875, -3.5947265625, -3.37872314453125, -3.1627197265625, -2.94671630859375, -2.730712890625, -2.51470947265625, -2.2987060546875, -2.08270263671875, -1.86669921875, -1.65069580078125, -1.4346923828125, -1.21868896484375, -1.002685546875, -0.78668212890625, -0.5706787109375, -0.35467529296875, -0.138671875, 0.07733154296875, 0.2933349609375, 0.50933837890625, 0.725341796875, 0.94134521484375, 1.1573486328125, 1.37335205078125, 1.58935546875, 1.80535888671875, 2.0213623046875, 2.23736572265625, 2.453369140625, 2.66937255859375, 2.8853759765625, 3.10137939453125, 3.3173828125, 3.53338623046875, 3.7493896484375, 3.96539306640625, 4.181396484375, 4.39739990234375, 4.6134033203125, 4.82940673828125, 5.04541015625, 5.26141357421875, 5.4774169921875, 5.69342041015625, 5.909423828125, 6.12542724609375, 6.3414306640625, 6.55743408203125, 6.7734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 4.0, 9.0, 16.0, 22.0, 33.0, 40.0, 34.0, 39.0, 80.0, 74.0, 108.0, 100.0, 87.0, 68.0, 58.0, 55.0, 39.0, 24.0, 24.0, 16.0, 11.0, 10.0, 5.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.15639877319336, -24.414915084838867, -23.673431396484375, -22.93194580078125, -22.190462112426758, -21.448978424072266, -20.70749282836914, -19.96600914001465, -19.224525451660156, -18.483041763305664, -17.741558074951172, -17.000072479248047, -16.258588790893555, -15.517105102539062, -14.775620460510254, -14.034135818481445, -13.292652130126953, -12.551168441772461, -11.809683799743652, -11.068199157714844, -10.326715469360352, -9.58523178100586, -8.84374713897705, -8.102262496948242, -7.36077880859375, -6.6192946434021, -5.877810478210449, -5.136326313018799, -4.394842147827148, -3.653357982635498, -2.9118738174438477, -2.1703896522521973, -1.4289073944091797, -0.6874232292175293, 0.054060935974121094, 0.7955451011657715, 1.5370292663574219, 2.2785134315490723, 3.0199975967407227, 3.761481761932373, 4.502965927124023, 5.244450092315674, 5.985934257507324, 6.727418422698975, 7.468902587890625, 8.210386276245117, 8.951870918273926, 9.693355560302734, 10.434839248657227, 11.176322937011719, 11.917807579040527, 12.659292221069336, 13.400775909423828, 14.14225959777832, 14.883744239807129, 15.625228881835938, 16.36671257019043, 17.108196258544922, 17.849681854248047, 18.59116554260254, 19.33264923095703, 20.074132919311523, 20.815616607666016, 21.55710220336914, 22.298585891723633]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 5.0, 9.0, 13.0, 19.0, 11.0, 20.0, 28.0, 26.0, 23.0, 22.0, 28.0, 27.0, 34.0, 39.0, 41.0, 31.0, 48.0, 51.0, 38.0, 38.0, 48.0, 41.0, 48.0, 28.0, 32.0, 44.0, 29.0, 25.0, 22.0, 19.0, 20.0, 14.0, 15.0, 12.0, 8.0, 5.0, 5.0, 7.0, 4.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-16.193523406982422, -15.731340408325195, -15.269157409667969, -14.806974411010742, -14.3447904586792, -13.882607460021973, -13.420424461364746, -12.95824146270752, -12.496057510375977, -12.03387451171875, -11.571691513061523, -11.109508514404297, -10.647324562072754, -10.185141563415527, -9.7229585647583, -9.260775566101074, -8.798592567443848, -8.336409568786621, -7.874226093292236, -7.41204309463501, -6.949859619140625, -6.487676620483398, -6.025493621826172, -5.563310623168945, -5.1011271476745605, -4.638944149017334, -4.176760673522949, -3.7145776748657227, -3.252394437789917, -2.7902112007141113, -2.3280282020568848, -1.865844964981079, -1.4036626815795898, -0.941479504108429, -0.47929632663726807, -0.017113208770751953, 0.4450700283050537, 0.9072532653808594, 1.369436264038086, 1.8316195011138916, 2.2938027381896973, 2.755985975265503, 3.2181692123413086, 3.680352210998535, 4.142535209655762, 4.6047186851501465, 5.066901683807373, 5.529085159301758, 5.991268157958984, 6.453451156616211, 6.915634632110596, 7.377817630767822, 7.840001106262207, 8.302184104919434, 8.76436710357666, 9.226550102233887, 9.68873405456543, 10.150917053222656, 10.613100051879883, 11.07528305053711, 11.537467002868652, 11.999650001525879, 12.461833000183105, 12.924015998840332, 13.386198997497559]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 7.0, 7.0, 13.0, 8.0, 27.0, 19.0, 45.0, 45.0, 94.0, 113.0, 171.0, 241.0, 379.0, 484.0, 740.0, 1049.0, 1469.0, 2168.0, 3337.0, 5162.0, 8477.0, 14347.0, 26150.0, 49458.0, 98889.0, 189055.0, 254284.0, 184469.0, 96183.0, 48427.0, 25462.0, 14199.0, 8366.0, 5100.0, 3251.0, 2212.0, 1419.0, 963.0, 669.0, 517.0, 311.0, 238.0, 158.0, 105.0, 83.0, 69.0, 41.0, 28.0, 17.0, 17.0, 4.0, 10.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-18.546875, -17.975830078125, -17.40478515625, -16.833740234375, -16.2626953125, -15.691650390625, -15.12060546875, -14.549560546875, -13.978515625, -13.407470703125, -12.83642578125, -12.265380859375, -11.6943359375, -11.123291015625, -10.55224609375, -9.981201171875, -9.41015625, -8.839111328125, -8.26806640625, -7.697021484375, -7.1259765625, -6.554931640625, -5.98388671875, -5.412841796875, -4.841796875, -4.270751953125, -3.69970703125, -3.128662109375, -2.5576171875, -1.986572265625, -1.41552734375, -0.844482421875, -0.2734375, 0.297607421875, 0.86865234375, 1.439697265625, 2.0107421875, 2.581787109375, 3.15283203125, 3.723876953125, 4.294921875, 4.865966796875, 5.43701171875, 6.008056640625, 6.5791015625, 7.150146484375, 7.72119140625, 8.292236328125, 8.86328125, 9.434326171875, 10.00537109375, 10.576416015625, 11.1474609375, 11.718505859375, 12.28955078125, 12.860595703125, 13.431640625, 14.002685546875, 14.57373046875, 15.144775390625, 15.7158203125, 16.286865234375, 16.85791015625, 17.428955078125, 18.0]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 6.0, 5.0, 13.0, 8.0, 14.0, 20.0, 20.0, 26.0, 21.0, 17.0, 22.0, 37.0, 37.0, 23.0, 43.0, 52.0, 46.0, 52.0, 37.0, 48.0, 49.0, 50.0, 39.0, 27.0, 38.0, 40.0, 29.0, 34.0, 20.0, 24.0, 21.0, 15.0, 18.0, 10.0, 6.0, 5.0, 6.0, 8.0, 3.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.40625, -16.90478515625, -16.4033203125, -15.90185546875, -15.400390625, -14.89892578125, -14.3974609375, -13.89599609375, -13.39453125, -12.89306640625, -12.3916015625, -11.89013671875, -11.388671875, -10.88720703125, -10.3857421875, -9.88427734375, -9.3828125, -8.88134765625, -8.3798828125, -7.87841796875, -7.376953125, -6.87548828125, -6.3740234375, -5.87255859375, -5.37109375, -4.86962890625, -4.3681640625, -3.86669921875, -3.365234375, -2.86376953125, -2.3623046875, -1.86083984375, -1.359375, -0.85791015625, -0.3564453125, 0.14501953125, 0.646484375, 1.14794921875, 1.6494140625, 2.15087890625, 2.65234375, 3.15380859375, 3.6552734375, 4.15673828125, 4.658203125, 5.15966796875, 5.6611328125, 6.16259765625, 6.6640625, 7.16552734375, 7.6669921875, 8.16845703125, 8.669921875, 9.17138671875, 9.6728515625, 10.17431640625, 10.67578125, 11.17724609375, 11.6787109375, 12.18017578125, 12.681640625, 13.18310546875, 13.6845703125, 14.18603515625, 14.6875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 8.0, 8.0, 7.0, 7.0, 20.0, 23.0, 27.0, 48.0, 56.0, 79.0, 119.0, 181.0, 255.0, 383.0, 505.0, 754.0, 1203.0, 1893.0, 3101.0, 5299.0, 9433.0, 18260.0, 39359.0, 97074.0, 264596.0, 351411.0, 146086.0, 55039.0, 24397.0, 12149.0, 6367.0, 3818.0, 2276.0, 1414.0, 962.0, 601.0, 397.0, 281.0, 192.0, 140.0, 81.0, 73.0, 51.0, 34.0, 21.0, 20.0, 14.0, 14.0, 7.0, 2.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-23.703125, -22.967041015625, -22.23095703125, -21.494873046875, -20.7587890625, -20.022705078125, -19.28662109375, -18.550537109375, -17.814453125, -17.078369140625, -16.34228515625, -15.606201171875, -14.8701171875, -14.134033203125, -13.39794921875, -12.661865234375, -11.92578125, -11.189697265625, -10.45361328125, -9.717529296875, -8.9814453125, -8.245361328125, -7.50927734375, -6.773193359375, -6.037109375, -5.301025390625, -4.56494140625, -3.828857421875, -3.0927734375, -2.356689453125, -1.62060546875, -0.884521484375, -0.1484375, 0.587646484375, 1.32373046875, 2.059814453125, 2.7958984375, 3.531982421875, 4.26806640625, 5.004150390625, 5.740234375, 6.476318359375, 7.21240234375, 7.948486328125, 8.6845703125, 9.420654296875, 10.15673828125, 10.892822265625, 11.62890625, 12.364990234375, 13.10107421875, 13.837158203125, 14.5732421875, 15.309326171875, 16.04541015625, 16.781494140625, 17.517578125, 18.253662109375, 18.98974609375, 19.725830078125, 20.4619140625, 21.197998046875, 21.93408203125, 22.670166015625, 23.40625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 12.0, 7.0, 10.0, 13.0, 7.0, 25.0, 24.0, 23.0, 27.0, 28.0, 39.0, 29.0, 29.0, 47.0, 46.0, 56.0, 45.0, 50.0, 38.0, 49.0, 47.0, 46.0, 49.0, 34.0, 36.0, 38.0, 25.0, 20.0, 24.0, 12.0, 14.0, 14.0, 6.0, 7.0, 4.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.4453125, -10.12353515625, -9.8017578125, -9.47998046875, -9.158203125, -8.83642578125, -8.5146484375, -8.19287109375, -7.87109375, -7.54931640625, -7.2275390625, -6.90576171875, -6.583984375, -6.26220703125, -5.9404296875, -5.61865234375, -5.296875, -4.97509765625, -4.6533203125, -4.33154296875, -4.009765625, -3.68798828125, -3.3662109375, -3.04443359375, -2.72265625, -2.40087890625, -2.0791015625, -1.75732421875, -1.435546875, -1.11376953125, -0.7919921875, -0.47021484375, -0.1484375, 0.17333984375, 0.4951171875, 0.81689453125, 1.138671875, 1.46044921875, 1.7822265625, 2.10400390625, 2.42578125, 2.74755859375, 3.0693359375, 3.39111328125, 3.712890625, 4.03466796875, 4.3564453125, 4.67822265625, 5.0, 5.32177734375, 5.6435546875, 5.96533203125, 6.287109375, 6.60888671875, 6.9306640625, 7.25244140625, 7.57421875, 7.89599609375, 8.2177734375, 8.53955078125, 8.861328125, 9.18310546875, 9.5048828125, 9.82666015625, 10.1484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 10.0, 17.0, 18.0, 30.0, 39.0, 37.0, 72.0, 80.0, 124.0, 166.0, 262.0, 311.0, 440.0, 668.0, 956.0, 1396.0, 2482.0, 4184.0, 7978.0, 17077.0, 41000.0, 121540.0, 397920.0, 302357.0, 87510.0, 31904.0, 13536.0, 6663.0, 3533.0, 2030.0, 1334.0, 803.0, 609.0, 395.0, 319.0, 216.0, 134.0, 111.0, 80.0, 50.0, 45.0, 33.0, 20.0, 16.0, 13.0, 7.0, 11.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-16.25, -15.7554931640625, -15.260986328125, -14.7664794921875, -14.27197265625, -13.7774658203125, -13.282958984375, -12.7884521484375, -12.2939453125, -11.7994384765625, -11.304931640625, -10.8104248046875, -10.31591796875, -9.8214111328125, -9.326904296875, -8.8323974609375, -8.337890625, -7.8433837890625, -7.348876953125, -6.8543701171875, -6.35986328125, -5.8653564453125, -5.370849609375, -4.8763427734375, -4.3818359375, -3.8873291015625, -3.392822265625, -2.8983154296875, -2.40380859375, -1.9093017578125, -1.414794921875, -0.9202880859375, -0.42578125, 0.0687255859375, 0.563232421875, 1.0577392578125, 1.55224609375, 2.0467529296875, 2.541259765625, 3.0357666015625, 3.5302734375, 4.0247802734375, 4.519287109375, 5.0137939453125, 5.50830078125, 6.0028076171875, 6.497314453125, 6.9918212890625, 7.486328125, 7.9808349609375, 8.475341796875, 8.9698486328125, 9.46435546875, 9.9588623046875, 10.453369140625, 10.9478759765625, 11.4423828125, 11.9368896484375, 12.431396484375, 12.9259033203125, 13.42041015625, 13.9149169921875, 14.409423828125, 14.9039306640625, 15.3984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 11.0, 12.0, 15.0, 21.0, 69.0, 107.0, 169.0, 241.0, 169.0, 74.0, 35.0, 20.0, 13.0, 11.0, 4.0, 5.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018768310546875, -0.0018237382173538208, -0.0017706453800201416, -0.0017175525426864624, -0.0016644597053527832, -0.001611366868019104, -0.0015582740306854248, -0.0015051811933517456, -0.0014520883560180664, -0.0013989955186843872, -0.001345902681350708, -0.0012928098440170288, -0.0012397170066833496, -0.0011866241693496704, -0.0011335313320159912, -0.001080438494682312, -0.0010273456573486328, -0.0009742528200149536, -0.0009211599826812744, -0.0008680671453475952, -0.000814974308013916, -0.0007618814706802368, -0.0007087886333465576, -0.0006556957960128784, -0.0006026029586791992, -0.00054951012134552, -0.0004964172840118408, -0.0004433244466781616, -0.0003902316093444824, -0.0003371387720108032, -0.000284045934677124, -0.00023095309734344482, -0.00017786026000976562, -0.00012476742267608643, -7.167458534240723e-05, -1.8581748008728027e-05, 3.451108932495117e-05, 8.760392665863037e-05, 0.00014069676399230957, 0.00019378960132598877, 0.00024688243865966797, 0.00029997527599334717, 0.00035306811332702637, 0.00040616095066070557, 0.00045925378799438477, 0.000512346625328064, 0.0005654394626617432, 0.0006185322999954224, 0.0006716251373291016, 0.0007247179746627808, 0.00077781081199646, 0.0008309036493301392, 0.0008839964866638184, 0.0009370893239974976, 0.0009901821613311768, 0.001043274998664856, 0.0010963678359985352, 0.0011494606733322144, 0.0012025535106658936, 0.0012556463479995728, 0.001308739185333252, 0.0013618320226669312, 0.0014149248600006104, 0.0014680176973342896, 0.0015211105346679688]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 5.0, 5.0, 8.0, 8.0, 15.0, 25.0, 30.0, 56.0, 64.0, 95.0, 186.0, 223.0, 370.0, 590.0, 1017.0, 1801.0, 3408.0, 6943.0, 16841.0, 45391.0, 141753.0, 382272.0, 295516.0, 95897.0, 31941.0, 12263.0, 5395.0, 2658.0, 1505.0, 830.0, 522.0, 311.0, 222.0, 105.0, 89.0, 55.0, 44.0, 33.0, 17.0, 14.0, 12.0, 6.0, 3.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.96875, -16.451904296875, -15.93505859375, -15.418212890625, -14.9013671875, -14.384521484375, -13.86767578125, -13.350830078125, -12.833984375, -12.317138671875, -11.80029296875, -11.283447265625, -10.7666015625, -10.249755859375, -9.73291015625, -9.216064453125, -8.69921875, -8.182373046875, -7.66552734375, -7.148681640625, -6.6318359375, -6.114990234375, -5.59814453125, -5.081298828125, -4.564453125, -4.047607421875, -3.53076171875, -3.013916015625, -2.4970703125, -1.980224609375, -1.46337890625, -0.946533203125, -0.4296875, 0.087158203125, 0.60400390625, 1.120849609375, 1.6376953125, 2.154541015625, 2.67138671875, 3.188232421875, 3.705078125, 4.221923828125, 4.73876953125, 5.255615234375, 5.7724609375, 6.289306640625, 6.80615234375, 7.322998046875, 7.83984375, 8.356689453125, 8.87353515625, 9.390380859375, 9.9072265625, 10.424072265625, 10.94091796875, 11.457763671875, 11.974609375, 12.491455078125, 13.00830078125, 13.525146484375, 14.0419921875, 14.558837890625, 15.07568359375, 15.592529296875, 16.109375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 8.0, 9.0, 16.0, 6.0, 17.0, 23.0, 28.0, 47.0, 55.0, 52.0, 61.0, 72.0, 77.0, 72.0, 77.0, 80.0, 52.0, 52.0, 45.0, 32.0, 23.0, 15.0, 11.0, 17.0, 16.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.85546875, -3.7276611328125, -3.599853515625, -3.4720458984375, -3.34423828125, -3.2164306640625, -3.088623046875, -2.9608154296875, -2.8330078125, -2.7052001953125, -2.577392578125, -2.4495849609375, -2.32177734375, -2.1939697265625, -2.066162109375, -1.9383544921875, -1.810546875, -1.6827392578125, -1.554931640625, -1.4271240234375, -1.29931640625, -1.1715087890625, -1.043701171875, -0.9158935546875, -0.7880859375, -0.6602783203125, -0.532470703125, -0.4046630859375, -0.27685546875, -0.1490478515625, -0.021240234375, 0.1065673828125, 0.234375, 0.3621826171875, 0.489990234375, 0.6177978515625, 0.74560546875, 0.8734130859375, 1.001220703125, 1.1290283203125, 1.2568359375, 1.3846435546875, 1.512451171875, 1.6402587890625, 1.76806640625, 1.8958740234375, 2.023681640625, 2.1514892578125, 2.279296875, 2.4071044921875, 2.534912109375, 2.6627197265625, 2.79052734375, 2.9183349609375, 3.046142578125, 3.1739501953125, 3.3017578125, 3.4295654296875, 3.557373046875, 3.6851806640625, 3.81298828125, 3.9407958984375, 4.068603515625, 4.1964111328125, 4.32421875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 6.0, 10.0, 5.0, 12.0, 18.0, 27.0, 20.0, 30.0, 40.0, 53.0, 69.0, 88.0, 98.0, 88.0, 79.0, 76.0, 58.0, 61.0, 32.0, 29.0, 29.0, 19.0, 15.0, 7.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.597742080688477, -22.88474464416504, -22.1717472076416, -21.458749771118164, -20.745752334594727, -20.03275489807129, -19.31975746154785, -18.606760025024414, -17.893762588500977, -17.18076515197754, -16.4677677154541, -15.754770278930664, -15.041772842407227, -14.328775405883789, -13.615777969360352, -12.902780532836914, -12.189783096313477, -11.476785659790039, -10.763788223266602, -10.050790786743164, -9.337793350219727, -8.624795913696289, -7.911798477172852, -7.198801040649414, -6.485803604125977, -5.772806167602539, -5.059808731079102, -4.346811294555664, -3.6338138580322266, -2.920816421508789, -2.2078189849853516, -1.494821548461914, -0.7818260192871094, -0.06882858276367188, 0.6441688537597656, 1.3571662902832031, 2.0701637268066406, 2.783161163330078, 3.4961585998535156, 4.209156036376953, 4.922153472900391, 5.635150909423828, 6.348148345947266, 7.061145782470703, 7.774143218994141, 8.487140655517578, 9.200138092041016, 9.913135528564453, 10.62613296508789, 11.339130401611328, 12.052127838134766, 12.765125274658203, 13.47812271118164, 14.191120147705078, 14.904117584228516, 15.617115020751953, 16.33011245727539, 17.043109893798828, 17.756107330322266, 18.469104766845703, 19.18210220336914, 19.895099639892578, 20.608097076416016, 21.321094512939453, 22.03409194946289]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 9.0, 13.0, 14.0, 21.0, 20.0, 24.0, 24.0, 35.0, 19.0, 35.0, 22.0, 42.0, 39.0, 31.0, 28.0, 56.0, 38.0, 39.0, 47.0, 45.0, 33.0, 38.0, 39.0, 40.0, 35.0, 30.0, 22.0, 21.0, 24.0, 16.0, 18.0, 15.0, 13.0, 4.0, 5.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-15.475081443786621, -15.032533645629883, -14.589986801147461, -14.147439002990723, -13.704891204833984, -13.262344360351562, -12.819796562194824, -12.377248764038086, -11.934701919555664, -11.492154121398926, -11.049607276916504, -10.607059478759766, -10.164511680603027, -9.721963882446289, -9.279417037963867, -8.836869239807129, -8.39432144165039, -7.9517741203308105, -7.509226322174072, -7.066679000854492, -6.624131202697754, -6.181583881378174, -5.739036560058594, -5.2964887619018555, -4.853941440582275, -4.411394119262695, -3.968846321105957, -3.526298999786377, -3.0837514400482178, -2.6412038803100586, -2.1986565589904785, -1.7561089992523193, -1.3135623931884766, -0.8710148930549622, -0.42846739292144775, 0.014080047607421875, 0.45662760734558105, 0.8991751670837402, 1.3417224884033203, 1.7842700481414795, 2.2268176078796387, 2.669365167617798, 3.111912727355957, 3.554460048675537, 3.9970076084136963, 4.4395551681518555, 4.8821024894714355, 5.324649810791016, 5.767197608947754, 6.209744930267334, 6.652292728424072, 7.094840049743652, 7.537387847900391, 7.979935169219971, 8.42248249053955, 8.865030288696289, 9.307577133178711, 9.75012493133545, 10.192671775817871, 10.63521957397461, 11.077767372131348, 11.520315170288086, 11.962862014770508, 12.405409812927246, 12.847957611083984]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 4.0, 4.0, 13.0, 26.0, 20.0, 45.0, 42.0, 63.0, 61.0, 99.0, 132.0, 160.0, 243.0, 315.0, 509.0, 799.0, 1184.0, 1872.0, 3061.0, 5848.0, 10557.0, 21465.0, 45771.0, 100314.0, 195725.0, 263848.0, 199100.0, 102900.0, 46640.0, 22294.0, 10779.0, 5755.0, 3275.0, 1921.0, 1152.0, 734.0, 541.0, 359.0, 224.0, 195.0, 127.0, 95.0, 71.0, 50.0, 35.0, 28.0, 29.0, 22.0, 17.0, 10.0, 10.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-27.59375, -26.7451171875, -25.896484375, -25.0478515625, -24.19921875, -23.3505859375, -22.501953125, -21.6533203125, -20.8046875, -19.9560546875, -19.107421875, -18.2587890625, -17.41015625, -16.5615234375, -15.712890625, -14.8642578125, -14.015625, -13.1669921875, -12.318359375, -11.4697265625, -10.62109375, -9.7724609375, -8.923828125, -8.0751953125, -7.2265625, -6.3779296875, -5.529296875, -4.6806640625, -3.83203125, -2.9833984375, -2.134765625, -1.2861328125, -0.4375, 0.4111328125, 1.259765625, 2.1083984375, 2.95703125, 3.8056640625, 4.654296875, 5.5029296875, 6.3515625, 7.2001953125, 8.048828125, 8.8974609375, 9.74609375, 10.5947265625, 11.443359375, 12.2919921875, 13.140625, 13.9892578125, 14.837890625, 15.6865234375, 16.53515625, 17.3837890625, 18.232421875, 19.0810546875, 19.9296875, 20.7783203125, 21.626953125, 22.4755859375, 23.32421875, 24.1728515625, 25.021484375, 25.8701171875, 26.71875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 4.0, 12.0, 12.0, 19.0, 18.0, 15.0, 24.0, 25.0, 23.0, 35.0, 40.0, 36.0, 43.0, 36.0, 40.0, 35.0, 49.0, 44.0, 45.0, 32.0, 40.0, 45.0, 37.0, 40.0, 31.0, 28.0, 37.0, 19.0, 30.0, 18.0, 12.0, 12.0, 15.0, 5.0, 6.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.5234375, -15.0849609375, -14.646484375, -14.2080078125, -13.76953125, -13.3310546875, -12.892578125, -12.4541015625, -12.015625, -11.5771484375, -11.138671875, -10.7001953125, -10.26171875, -9.8232421875, -9.384765625, -8.9462890625, -8.5078125, -8.0693359375, -7.630859375, -7.1923828125, -6.75390625, -6.3154296875, -5.876953125, -5.4384765625, -5.0, -4.5615234375, -4.123046875, -3.6845703125, -3.24609375, -2.8076171875, -2.369140625, -1.9306640625, -1.4921875, -1.0537109375, -0.615234375, -0.1767578125, 0.26171875, 0.7001953125, 1.138671875, 1.5771484375, 2.015625, 2.4541015625, 2.892578125, 3.3310546875, 3.76953125, 4.2080078125, 4.646484375, 5.0849609375, 5.5234375, 5.9619140625, 6.400390625, 6.8388671875, 7.27734375, 7.7158203125, 8.154296875, 8.5927734375, 9.03125, 9.4697265625, 9.908203125, 10.3466796875, 10.78515625, 11.2236328125, 11.662109375, 12.1005859375, 12.5390625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 6.0, 6.0, 8.0, 17.0, 29.0, 27.0, 34.0, 65.0, 84.0, 143.0, 163.0, 291.0, 405.0, 557.0, 817.0, 1287.0, 2031.0, 3062.0, 4985.0, 8115.0, 13416.0, 22602.0, 38082.0, 65311.0, 110580.0, 165327.0, 192305.0, 159744.0, 104910.0, 62341.0, 36222.0, 21373.0, 12805.0, 7800.0, 4796.0, 2975.0, 1943.0, 1321.0, 831.0, 539.0, 391.0, 232.0, 185.0, 134.0, 81.0, 51.0, 40.0, 26.0, 20.0, 15.0, 9.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0], "bins": [-17.9375, -17.384765625, -16.83203125, -16.279296875, -15.7265625, -15.173828125, -14.62109375, -14.068359375, -13.515625, -12.962890625, -12.41015625, -11.857421875, -11.3046875, -10.751953125, -10.19921875, -9.646484375, -9.09375, -8.541015625, -7.98828125, -7.435546875, -6.8828125, -6.330078125, -5.77734375, -5.224609375, -4.671875, -4.119140625, -3.56640625, -3.013671875, -2.4609375, -1.908203125, -1.35546875, -0.802734375, -0.25, 0.302734375, 0.85546875, 1.408203125, 1.9609375, 2.513671875, 3.06640625, 3.619140625, 4.171875, 4.724609375, 5.27734375, 5.830078125, 6.3828125, 6.935546875, 7.48828125, 8.041015625, 8.59375, 9.146484375, 9.69921875, 10.251953125, 10.8046875, 11.357421875, 11.91015625, 12.462890625, 13.015625, 13.568359375, 14.12109375, 14.673828125, 15.2265625, 15.779296875, 16.33203125, 16.884765625, 17.4375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 13.0, 9.0, 15.0, 15.0, 9.0, 22.0, 18.0, 21.0, 29.0, 32.0, 27.0, 30.0, 21.0, 31.0, 32.0, 37.0, 34.0, 49.0, 37.0, 47.0, 41.0, 31.0, 38.0, 37.0, 36.0, 28.0, 27.0, 31.0, 26.0, 19.0, 27.0, 25.0, 14.0, 18.0, 19.0, 10.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.015625, -8.7208251953125, -8.426025390625, -8.1312255859375, -7.83642578125, -7.5416259765625, -7.246826171875, -6.9520263671875, -6.6572265625, -6.3624267578125, -6.067626953125, -5.7728271484375, -5.47802734375, -5.1832275390625, -4.888427734375, -4.5936279296875, -4.298828125, -4.0040283203125, -3.709228515625, -3.4144287109375, -3.11962890625, -2.8248291015625, -2.530029296875, -2.2352294921875, -1.9404296875, -1.6456298828125, -1.350830078125, -1.0560302734375, -0.76123046875, -0.4664306640625, -0.171630859375, 0.1231689453125, 0.41796875, 0.7127685546875, 1.007568359375, 1.3023681640625, 1.59716796875, 1.8919677734375, 2.186767578125, 2.4815673828125, 2.7763671875, 3.0711669921875, 3.365966796875, 3.6607666015625, 3.95556640625, 4.2503662109375, 4.545166015625, 4.8399658203125, 5.134765625, 5.4295654296875, 5.724365234375, 6.0191650390625, 6.31396484375, 6.6087646484375, 6.903564453125, 7.1983642578125, 7.4931640625, 7.7879638671875, 8.082763671875, 8.3775634765625, 8.67236328125, 8.9671630859375, 9.261962890625, 9.5567626953125, 9.8515625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 5.0, 3.0, 4.0, 4.0, 9.0, 17.0, 18.0, 32.0, 44.0, 52.0, 68.0, 99.0, 143.0, 194.0, 265.0, 366.0, 519.0, 806.0, 1179.0, 1709.0, 2660.0, 4481.0, 7652.0, 14512.0, 29513.0, 66009.0, 171962.0, 355987.0, 227123.0, 85712.0, 36576.0, 17437.0, 9200.0, 5056.0, 3110.0, 1895.0, 1289.0, 802.0, 577.0, 426.0, 277.0, 212.0, 145.0, 123.0, 90.0, 58.0, 48.0, 31.0, 19.0, 14.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-23.515625, -22.694580078125, -21.87353515625, -21.052490234375, -20.2314453125, -19.410400390625, -18.58935546875, -17.768310546875, -16.947265625, -16.126220703125, -15.30517578125, -14.484130859375, -13.6630859375, -12.842041015625, -12.02099609375, -11.199951171875, -10.37890625, -9.557861328125, -8.73681640625, -7.915771484375, -7.0947265625, -6.273681640625, -5.45263671875, -4.631591796875, -3.810546875, -2.989501953125, -2.16845703125, -1.347412109375, -0.5263671875, 0.294677734375, 1.11572265625, 1.936767578125, 2.7578125, 3.578857421875, 4.39990234375, 5.220947265625, 6.0419921875, 6.863037109375, 7.68408203125, 8.505126953125, 9.326171875, 10.147216796875, 10.96826171875, 11.789306640625, 12.6103515625, 13.431396484375, 14.25244140625, 15.073486328125, 15.89453125, 16.715576171875, 17.53662109375, 18.357666015625, 19.1787109375, 19.999755859375, 20.82080078125, 21.641845703125, 22.462890625, 23.283935546875, 24.10498046875, 24.926025390625, 25.7470703125, 26.568115234375, 27.38916015625, 28.210205078125, 29.03125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 12.0, 8.0, 20.0, 22.0, 21.0, 39.0, 59.0, 67.0, 73.0, 133.0, 101.0, 100.0, 90.0, 66.0, 36.0, 29.0, 25.0, 25.0, 15.0, 13.0, 8.0, 5.0, 0.0, 5.0, 2.0, 9.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023937225341796875, -0.0023223459720611572, -0.002250969409942627, -0.0021795928478240967, -0.0021082162857055664, -0.002036839723587036, -0.001965463161468506, -0.0018940865993499756, -0.0018227100372314453, -0.001751333475112915, -0.0016799569129943848, -0.0016085803508758545, -0.0015372037887573242, -0.001465827226638794, -0.0013944506645202637, -0.0013230741024017334, -0.0012516975402832031, -0.0011803209781646729, -0.0011089444160461426, -0.0010375678539276123, -0.000966191291809082, -0.0008948147296905518, -0.0008234381675720215, -0.0007520616054534912, -0.0006806850433349609, -0.0006093084812164307, -0.0005379319190979004, -0.0004665553569793701, -0.00039517879486083984, -0.00032380223274230957, -0.0002524256706237793, -0.00018104910850524902, -0.00010967254638671875, -3.8295984268188477e-05, 3.30805778503418e-05, 0.00010445713996887207, 0.00017583370208740234, 0.0002472102642059326, 0.0003185868263244629, 0.00038996338844299316, 0.00046133995056152344, 0.0005327165126800537, 0.000604093074798584, 0.0006754696369171143, 0.0007468461990356445, 0.0008182227611541748, 0.0008895993232727051, 0.0009609758853912354, 0.0010323524475097656, 0.001103729009628296, 0.0011751055717468262, 0.0012464821338653564, 0.0013178586959838867, 0.001389235258102417, 0.0014606118202209473, 0.0015319883823394775, 0.0016033649444580078, 0.001674741506576538, 0.0017461180686950684, 0.0018174946308135986, 0.001888871192932129, 0.001960247755050659, 0.0020316243171691895, 0.0021030008792877197, 0.00217437744140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 8.0, 10.0, 19.0, 19.0, 39.0, 62.0, 105.0, 147.0, 228.0, 347.0, 492.0, 829.0, 1361.0, 2085.0, 3634.0, 6224.0, 11860.0, 23215.0, 50154.0, 123925.0, 279000.0, 295279.0, 138737.0, 56226.0, 25025.0, 12776.0, 6832.0, 3786.0, 2298.0, 1347.0, 858.0, 589.0, 346.0, 254.0, 141.0, 101.0, 62.0, 43.0, 26.0, 20.0, 23.0, 12.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.46875, -19.830322265625, -19.19189453125, -18.553466796875, -17.9150390625, -17.276611328125, -16.63818359375, -15.999755859375, -15.361328125, -14.722900390625, -14.08447265625, -13.446044921875, -12.8076171875, -12.169189453125, -11.53076171875, -10.892333984375, -10.25390625, -9.615478515625, -8.97705078125, -8.338623046875, -7.7001953125, -7.061767578125, -6.42333984375, -5.784912109375, -5.146484375, -4.508056640625, -3.86962890625, -3.231201171875, -2.5927734375, -1.954345703125, -1.31591796875, -0.677490234375, -0.0390625, 0.599365234375, 1.23779296875, 1.876220703125, 2.5146484375, 3.153076171875, 3.79150390625, 4.429931640625, 5.068359375, 5.706787109375, 6.34521484375, 6.983642578125, 7.6220703125, 8.260498046875, 8.89892578125, 9.537353515625, 10.17578125, 10.814208984375, 11.45263671875, 12.091064453125, 12.7294921875, 13.367919921875, 14.00634765625, 14.644775390625, 15.283203125, 15.921630859375, 16.56005859375, 17.198486328125, 17.8369140625, 18.475341796875, 19.11376953125, 19.752197265625, 20.390625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 10.0, 7.0, 15.0, 27.0, 19.0, 17.0, 26.0, 39.0, 43.0, 54.0, 52.0, 65.0, 82.0, 80.0, 68.0, 71.0, 55.0, 51.0, 29.0, 32.0, 25.0, 16.0, 16.0, 20.0, 18.0, 10.0, 8.0, 5.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.796875, -5.61236572265625, -5.4278564453125, -5.24334716796875, -5.058837890625, -4.87432861328125, -4.6898193359375, -4.50531005859375, -4.32080078125, -4.13629150390625, -3.9517822265625, -3.76727294921875, -3.582763671875, -3.39825439453125, -3.2137451171875, -3.02923583984375, -2.8447265625, -2.66021728515625, -2.4757080078125, -2.29119873046875, -2.106689453125, -1.92218017578125, -1.7376708984375, -1.55316162109375, -1.36865234375, -1.18414306640625, -0.9996337890625, -0.81512451171875, -0.630615234375, -0.44610595703125, -0.2615966796875, -0.07708740234375, 0.107421875, 0.29193115234375, 0.4764404296875, 0.66094970703125, 0.845458984375, 1.02996826171875, 1.2144775390625, 1.39898681640625, 1.58349609375, 1.76800537109375, 1.9525146484375, 2.13702392578125, 2.321533203125, 2.50604248046875, 2.6905517578125, 2.87506103515625, 3.0595703125, 3.24407958984375, 3.4285888671875, 3.61309814453125, 3.797607421875, 3.98211669921875, 4.1666259765625, 4.35113525390625, 4.53564453125, 4.72015380859375, 4.9046630859375, 5.08917236328125, 5.273681640625, 5.45819091796875, 5.6427001953125, 5.82720947265625, 6.01171875]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 8.0, 18.0, 20.0, 17.0, 28.0, 40.0, 39.0, 49.0, 58.0, 75.0, 70.0, 94.0, 100.0, 82.0, 55.0, 54.0, 40.0, 29.0, 27.0, 26.0, 7.0, 7.0, 12.0, 10.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.743560791015625, -27.035123825073242, -26.326688766479492, -25.61825180053711, -24.90981674194336, -24.201379776000977, -23.492942810058594, -22.784507751464844, -22.07607078552246, -21.367633819580078, -20.659198760986328, -19.950761795043945, -19.242324829101562, -18.533889770507812, -17.82545280456543, -17.117015838623047, -16.408580780029297, -15.70014476776123, -14.991708755493164, -14.283271789550781, -13.574835777282715, -12.866399765014648, -12.157962799072266, -11.4495267868042, -10.741090774536133, -10.032654762268066, -9.32421875, -8.615781784057617, -7.907345771789551, -7.198909759521484, -6.49047327041626, -5.782036781311035, -5.073600769042969, -4.365164756774902, -3.6567282676696777, -2.9482920169830322, -2.2398557662963867, -1.5314195156097412, -0.8229832649230957, -0.1145467758178711, 0.5938892364501953, 1.3023254871368408, 2.0107617378234863, 2.719197988510132, 3.4276342391967773, 4.136070251464844, 4.844506740570068, 5.552943229675293, 6.261379241943359, 6.969815254211426, 7.67825174331665, 8.386688232421875, 9.095124244689941, 9.803560256958008, 10.51199722290039, 11.220433235168457, 11.928869247436523, 12.63730525970459, 13.345741271972656, 14.054178237915039, 14.762614250183105, 15.471050262451172, 16.179487228393555, 16.887924194335938, 17.596359252929688]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 12.0, 14.0, 6.0, 10.0, 16.0, 15.0, 16.0, 18.0, 28.0, 27.0, 32.0, 28.0, 28.0, 38.0, 43.0, 41.0, 37.0, 36.0, 40.0, 44.0, 48.0, 49.0, 40.0, 41.0, 42.0, 29.0, 40.0, 23.0, 17.0, 13.0, 28.0, 24.0, 12.0, 16.0, 6.0, 9.0, 7.0, 3.0, 9.0, 6.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.803695678710938, -15.339011192321777, -14.874327659606934, -14.409643173217773, -13.94495964050293, -13.48027515411377, -13.01559066772461, -12.550907135009766, -12.086223602294922, -11.621539115905762, -11.156855583190918, -10.692171096801758, -10.227487564086914, -9.762803077697754, -9.298118591308594, -8.83343505859375, -8.36875057220459, -7.904066562652588, -7.439382553100586, -6.974698066711426, -6.510014533996582, -6.045330047607422, -5.58064603805542, -5.115962028503418, -4.651278018951416, -4.186594009399414, -3.721909999847412, -3.257225751876831, -2.792541742324829, -2.327857732772827, -1.863173484802246, -1.3984894752502441, -0.9338045120239258, -0.46912044286727905, -0.004436373710632324, 0.4602477550506592, 0.9249317646026611, 1.389615774154663, 1.8543000221252441, 2.318984031677246, 2.783668041229248, 3.24835205078125, 3.713036060333252, 4.177720069885254, 4.642404556274414, 5.107088088989258, 5.571772575378418, 6.03645658493042, 6.501140594482422, 6.965824604034424, 7.430508613586426, 7.895193099975586, 8.35987663269043, 8.82456111907959, 9.28924560546875, 9.753929138183594, 10.218612670898438, 10.683297157287598, 11.147980690002441, 11.612665176391602, 12.077348709106445, 12.542033195495605, 13.006717681884766, 13.47140121459961, 13.93608570098877]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 3.0, 12.0, 12.0, 14.0, 27.0, 28.0, 39.0, 60.0, 89.0, 153.0, 189.0, 297.0, 394.0, 694.0, 928.0, 1618.0, 2307.0, 3748.0, 6259.0, 10538.0, 19411.0, 37819.0, 82547.0, 198401.0, 499195.0, 1033980.0, 1169580.0, 650329.0, 260502.0, 105378.0, 48287.0, 24180.0, 13727.0, 8248.0, 5028.0, 3414.0, 2174.0, 1513.0, 954.0, 665.0, 475.0, 322.0, 239.0, 172.0, 79.0, 87.0, 49.0, 31.0, 19.0, 26.0, 17.0, 12.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0], "bins": [-16.359375, -15.81689453125, -15.2744140625, -14.73193359375, -14.189453125, -13.64697265625, -13.1044921875, -12.56201171875, -12.01953125, -11.47705078125, -10.9345703125, -10.39208984375, -9.849609375, -9.30712890625, -8.7646484375, -8.22216796875, -7.6796875, -7.13720703125, -6.5947265625, -6.05224609375, -5.509765625, -4.96728515625, -4.4248046875, -3.88232421875, -3.33984375, -2.79736328125, -2.2548828125, -1.71240234375, -1.169921875, -0.62744140625, -0.0849609375, 0.45751953125, 1.0, 1.54248046875, 2.0849609375, 2.62744140625, 3.169921875, 3.71240234375, 4.2548828125, 4.79736328125, 5.33984375, 5.88232421875, 6.4248046875, 6.96728515625, 7.509765625, 8.05224609375, 8.5947265625, 9.13720703125, 9.6796875, 10.22216796875, 10.7646484375, 11.30712890625, 11.849609375, 12.39208984375, 12.9345703125, 13.47705078125, 14.01953125, 14.56201171875, 15.1044921875, 15.64697265625, 16.189453125, 16.73193359375, 17.2744140625, 17.81689453125, 18.359375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 8.0, 14.0, 6.0, 12.0, 16.0, 13.0, 24.0, 26.0, 29.0, 37.0, 42.0, 25.0, 33.0, 45.0, 46.0, 44.0, 51.0, 49.0, 41.0, 49.0, 36.0, 50.0, 34.0, 50.0, 32.0, 33.0, 16.0, 18.0, 15.0, 29.0, 10.0, 13.0, 11.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.58740234375, -10.2607421875, -9.93408203125, -9.607421875, -9.28076171875, -8.9541015625, -8.62744140625, -8.30078125, -7.97412109375, -7.6474609375, -7.32080078125, -6.994140625, -6.66748046875, -6.3408203125, -6.01416015625, -5.6875, -5.36083984375, -5.0341796875, -4.70751953125, -4.380859375, -4.05419921875, -3.7275390625, -3.40087890625, -3.07421875, -2.74755859375, -2.4208984375, -2.09423828125, -1.767578125, -1.44091796875, -1.1142578125, -0.78759765625, -0.4609375, -0.13427734375, 0.1923828125, 0.51904296875, 0.845703125, 1.17236328125, 1.4990234375, 1.82568359375, 2.15234375, 2.47900390625, 2.8056640625, 3.13232421875, 3.458984375, 3.78564453125, 4.1123046875, 4.43896484375, 4.765625, 5.09228515625, 5.4189453125, 5.74560546875, 6.072265625, 6.39892578125, 6.7255859375, 7.05224609375, 7.37890625, 7.70556640625, 8.0322265625, 8.35888671875, 8.685546875, 9.01220703125, 9.3388671875, 9.66552734375, 9.9921875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 13.0, 20.0, 29.0, 38.0, 56.0, 76.0, 98.0, 151.0, 207.0, 309.0, 505.0, 823.0, 1227.0, 2008.0, 3481.0, 5679.0, 10004.0, 18349.0, 37423.0, 85794.0, 234171.0, 683432.0, 1393427.0, 1067402.0, 399270.0, 137379.0, 54919.0, 25681.0, 13169.0, 7413.0, 4373.0, 2712.0, 1614.0, 994.0, 687.0, 403.0, 269.0, 189.0, 145.0, 105.0, 72.0, 31.0, 30.0, 18.0, 23.0, 16.0, 9.0, 6.0, 6.0, 4.0, 5.0, 0.0, 0.0, 2.0], "bins": [-21.25, -20.60107421875, -19.9521484375, -19.30322265625, -18.654296875, -18.00537109375, -17.3564453125, -16.70751953125, -16.05859375, -15.40966796875, -14.7607421875, -14.11181640625, -13.462890625, -12.81396484375, -12.1650390625, -11.51611328125, -10.8671875, -10.21826171875, -9.5693359375, -8.92041015625, -8.271484375, -7.62255859375, -6.9736328125, -6.32470703125, -5.67578125, -5.02685546875, -4.3779296875, -3.72900390625, -3.080078125, -2.43115234375, -1.7822265625, -1.13330078125, -0.484375, 0.16455078125, 0.8134765625, 1.46240234375, 2.111328125, 2.76025390625, 3.4091796875, 4.05810546875, 4.70703125, 5.35595703125, 6.0048828125, 6.65380859375, 7.302734375, 7.95166015625, 8.6005859375, 9.24951171875, 9.8984375, 10.54736328125, 11.1962890625, 11.84521484375, 12.494140625, 13.14306640625, 13.7919921875, 14.44091796875, 15.08984375, 15.73876953125, 16.3876953125, 17.03662109375, 17.685546875, 18.33447265625, 18.9833984375, 19.63232421875, 20.28125]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 15.0, 9.0, 20.0, 30.0, 39.0, 53.0, 53.0, 69.0, 84.0, 100.0, 139.0, 160.0, 219.0, 285.0, 318.0, 344.0, 321.0, 347.0, 291.0, 257.0, 214.0, 164.0, 135.0, 90.0, 66.0, 62.0, 34.0, 24.0, 23.0, 25.0, 10.0, 9.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.37109375, -7.177490234375, -6.98388671875, -6.790283203125, -6.5966796875, -6.403076171875, -6.20947265625, -6.015869140625, -5.822265625, -5.628662109375, -5.43505859375, -5.241455078125, -5.0478515625, -4.854248046875, -4.66064453125, -4.467041015625, -4.2734375, -4.079833984375, -3.88623046875, -3.692626953125, -3.4990234375, -3.305419921875, -3.11181640625, -2.918212890625, -2.724609375, -2.531005859375, -2.33740234375, -2.143798828125, -1.9501953125, -1.756591796875, -1.56298828125, -1.369384765625, -1.17578125, -0.982177734375, -0.78857421875, -0.594970703125, -0.4013671875, -0.207763671875, -0.01416015625, 0.179443359375, 0.373046875, 0.566650390625, 0.76025390625, 0.953857421875, 1.1474609375, 1.341064453125, 1.53466796875, 1.728271484375, 1.921875, 2.115478515625, 2.30908203125, 2.502685546875, 2.6962890625, 2.889892578125, 3.08349609375, 3.277099609375, 3.470703125, 3.664306640625, 3.85791015625, 4.051513671875, 4.2451171875, 4.438720703125, 4.63232421875, 4.825927734375, 5.01953125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 6.0, 18.0, 7.0, 21.0, 31.0, 43.0, 56.0, 70.0, 110.0, 117.0, 114.0, 69.0, 118.0, 60.0, 39.0, 30.0, 27.0, 11.0, 14.0, 7.0, 8.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.934629440307617, -29.168359756469727, -28.40209197998047, -27.635822296142578, -26.86955451965332, -26.10328483581543, -25.337017059326172, -24.57074737548828, -23.80447769165039, -23.0382080078125, -22.271940231323242, -21.50567054748535, -20.739402770996094, -19.973133087158203, -19.206863403320312, -18.440595626831055, -17.674327850341797, -16.908058166503906, -16.14179039001465, -15.375520706176758, -14.6092529296875, -13.84298324584961, -13.076714515686035, -12.310445785522461, -11.544177055358887, -10.777908325195312, -10.011639595031738, -9.245370864868164, -8.479101181030273, -7.712832927703857, -6.946563720703125, -6.180294990539551, -5.414026260375977, -4.647757530212402, -3.881488561630249, -3.1152195930480957, -2.3489508628845215, -1.5826821327209473, -0.8164129257202148, -0.050144195556640625, 0.7161245346069336, 1.4823933839797974, 2.248662233352661, 3.0149312019348145, 3.7811999320983887, 4.547468662261963, 5.313737869262695, 6.0800065994262695, 6.846275329589844, 7.612544059753418, 8.378812789916992, 9.145082473754883, 9.91135025024414, 10.677619934082031, 11.443888664245605, 12.21015739440918, 12.976426124572754, 13.742694854736328, 14.508963584899902, 15.275232315063477, 16.041501998901367, 16.807769775390625, 17.574039459228516, 18.340309143066406, 19.106576919555664]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 9.0, 4.0, 5.0, 6.0, 17.0, 20.0, 16.0, 20.0, 30.0, 32.0, 19.0, 32.0, 34.0, 50.0, 35.0, 55.0, 33.0, 49.0, 38.0, 61.0, 48.0, 38.0, 47.0, 31.0, 46.0, 35.0, 29.0, 29.0, 22.0, 23.0, 21.0, 13.0, 12.0, 8.0, 12.0, 10.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.543462753295898, -15.096383094787598, -14.649303436279297, -14.20222282409668, -13.755143165588379, -13.308063507080078, -12.860983848571777, -12.413904190063477, -11.96682357788086, -11.519743919372559, -11.072664260864258, -10.62558364868164, -10.17850399017334, -9.731424331665039, -9.284344673156738, -8.837265014648438, -8.390185356140137, -7.943105697631836, -7.496025562286377, -7.048945903778076, -6.601865768432617, -6.154786109924316, -5.707706451416016, -5.260626792907715, -4.813546657562256, -4.366466999053955, -3.919386863708496, -3.4723072052001953, -3.0252273082733154, -2.5781474113464355, -2.1310677528381348, -1.6839878559112549, -1.2369070053100586, -0.7898271679878235, -0.3427473306655884, 0.10433244705200195, 0.5514123439788818, 0.9984922409057617, 1.4455718994140625, 1.8926517963409424, 2.3397316932678223, 2.786811590194702, 3.233891487121582, 3.680971145629883, 4.128050804138184, 4.575130939483643, 5.022210597991943, 5.469290733337402, 5.916370391845703, 6.363450050354004, 6.810530185699463, 7.257609844207764, 7.704689979553223, 8.151769638061523, 8.598849296569824, 9.045928955078125, 9.493009567260742, 9.940089225769043, 10.387168884277344, 10.834249496459961, 11.281329154968262, 11.728408813476562, 12.175488471984863, 12.622568130493164, 13.069647789001465]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 16.0, 20.0, 36.0, 39.0, 63.0, 98.0, 141.0, 202.0, 346.0, 442.0, 656.0, 1036.0, 1486.0, 2499.0, 3999.0, 6315.0, 10862.0, 18910.0, 34072.0, 62855.0, 115731.0, 188334.0, 219537.0, 165174.0, 95884.0, 51656.0, 27836.0, 15942.0, 9211.0, 5548.0, 3354.0, 2135.0, 1327.0, 945.0, 597.0, 364.0, 294.0, 190.0, 119.0, 89.0, 61.0, 50.0, 29.0, 20.0, 10.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.40625, -10.07421875, -9.7421875, -9.41015625, -9.078125, -8.74609375, -8.4140625, -8.08203125, -7.75, -7.41796875, -7.0859375, -6.75390625, -6.421875, -6.08984375, -5.7578125, -5.42578125, -5.09375, -4.76171875, -4.4296875, -4.09765625, -3.765625, -3.43359375, -3.1015625, -2.76953125, -2.4375, -2.10546875, -1.7734375, -1.44140625, -1.109375, -0.77734375, -0.4453125, -0.11328125, 0.21875, 0.55078125, 0.8828125, 1.21484375, 1.546875, 1.87890625, 2.2109375, 2.54296875, 2.875, 3.20703125, 3.5390625, 3.87109375, 4.203125, 4.53515625, 4.8671875, 5.19921875, 5.53125, 5.86328125, 6.1953125, 6.52734375, 6.859375, 7.19140625, 7.5234375, 7.85546875, 8.1875, 8.51953125, 8.8515625, 9.18359375, 9.515625, 9.84765625, 10.1796875, 10.51171875, 10.84375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 4.0, 6.0, 12.0, 11.0, 13.0, 27.0, 26.0, 21.0, 27.0, 31.0, 35.0, 34.0, 38.0, 63.0, 60.0, 41.0, 40.0, 39.0, 53.0, 39.0, 39.0, 40.0, 42.0, 29.0, 41.0, 33.0, 22.0, 19.0, 22.0, 17.0, 13.0, 13.0, 5.0, 9.0, 10.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.0546875, -14.60107421875, -14.1474609375, -13.69384765625, -13.240234375, -12.78662109375, -12.3330078125, -11.87939453125, -11.42578125, -10.97216796875, -10.5185546875, -10.06494140625, -9.611328125, -9.15771484375, -8.7041015625, -8.25048828125, -7.796875, -7.34326171875, -6.8896484375, -6.43603515625, -5.982421875, -5.52880859375, -5.0751953125, -4.62158203125, -4.16796875, -3.71435546875, -3.2607421875, -2.80712890625, -2.353515625, -1.89990234375, -1.4462890625, -0.99267578125, -0.5390625, -0.08544921875, 0.3681640625, 0.82177734375, 1.275390625, 1.72900390625, 2.1826171875, 2.63623046875, 3.08984375, 3.54345703125, 3.9970703125, 4.45068359375, 4.904296875, 5.35791015625, 5.8115234375, 6.26513671875, 6.71875, 7.17236328125, 7.6259765625, 8.07958984375, 8.533203125, 8.98681640625, 9.4404296875, 9.89404296875, 10.34765625, 10.80126953125, 11.2548828125, 11.70849609375, 12.162109375, 12.61572265625, 13.0693359375, 13.52294921875, 13.9765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 3.0, 9.0, 8.0, 10.0, 6.0, 17.0, 15.0, 17.0, 39.0, 35.0, 64.0, 71.0, 122.0, 134.0, 200.0, 281.0, 426.0, 587.0, 875.0, 1360.0, 2026.0, 3382.0, 5347.0, 9272.0, 16801.0, 31691.0, 64571.0, 135151.0, 252105.0, 251304.0, 135500.0, 64379.0, 31650.0, 16619.0, 9231.0, 5486.0, 3276.0, 2095.0, 1365.0, 872.0, 589.0, 454.0, 275.0, 238.0, 163.0, 118.0, 86.0, 52.0, 41.0, 42.0, 16.0, 23.0, 20.0, 8.0, 9.0, 7.0, 6.0, 6.0, 4.0, 4.0, 1.0], "bins": [-12.1796875, -11.799072265625, -11.41845703125, -11.037841796875, -10.6572265625, -10.276611328125, -9.89599609375, -9.515380859375, -9.134765625, -8.754150390625, -8.37353515625, -7.992919921875, -7.6123046875, -7.231689453125, -6.85107421875, -6.470458984375, -6.08984375, -5.709228515625, -5.32861328125, -4.947998046875, -4.5673828125, -4.186767578125, -3.80615234375, -3.425537109375, -3.044921875, -2.664306640625, -2.28369140625, -1.903076171875, -1.5224609375, -1.141845703125, -0.76123046875, -0.380615234375, 0.0, 0.380615234375, 0.76123046875, 1.141845703125, 1.5224609375, 1.903076171875, 2.28369140625, 2.664306640625, 3.044921875, 3.425537109375, 3.80615234375, 4.186767578125, 4.5673828125, 4.947998046875, 5.32861328125, 5.709228515625, 6.08984375, 6.470458984375, 6.85107421875, 7.231689453125, 7.6123046875, 7.992919921875, 8.37353515625, 8.754150390625, 9.134765625, 9.515380859375, 9.89599609375, 10.276611328125, 10.6572265625, 11.037841796875, 11.41845703125, 11.799072265625, 12.1796875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 6.0, 9.0, 9.0, 11.0, 11.0, 14.0, 12.0, 29.0, 19.0, 25.0, 26.0, 34.0, 27.0, 28.0, 29.0, 34.0, 48.0, 34.0, 61.0, 35.0, 51.0, 31.0, 39.0, 42.0, 36.0, 31.0, 27.0, 33.0, 35.0, 37.0, 23.0, 19.0, 11.0, 17.0, 21.0, 12.0, 4.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.2813720703125, -7.015869140625, -6.7503662109375, -6.48486328125, -6.2193603515625, -5.953857421875, -5.6883544921875, -5.4228515625, -5.1573486328125, -4.891845703125, -4.6263427734375, -4.36083984375, -4.0953369140625, -3.829833984375, -3.5643310546875, -3.298828125, -3.0333251953125, -2.767822265625, -2.5023193359375, -2.23681640625, -1.9713134765625, -1.705810546875, -1.4403076171875, -1.1748046875, -0.9093017578125, -0.643798828125, -0.3782958984375, -0.11279296875, 0.1527099609375, 0.418212890625, 0.6837158203125, 0.94921875, 1.2147216796875, 1.480224609375, 1.7457275390625, 2.01123046875, 2.2767333984375, 2.542236328125, 2.8077392578125, 3.0732421875, 3.3387451171875, 3.604248046875, 3.8697509765625, 4.13525390625, 4.4007568359375, 4.666259765625, 4.9317626953125, 5.197265625, 5.4627685546875, 5.728271484375, 5.9937744140625, 6.25927734375, 6.5247802734375, 6.790283203125, 7.0557861328125, 7.3212890625, 7.5867919921875, 7.852294921875, 8.1177978515625, 8.38330078125, 8.6488037109375, 8.914306640625, 9.1798095703125, 9.4453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 13.0, 11.0, 12.0, 17.0, 32.0, 46.0, 58.0, 92.0, 160.0, 180.0, 270.0, 491.0, 807.0, 1344.0, 2444.0, 4869.0, 10488.0, 26145.0, 76071.0, 258401.0, 431373.0, 154381.0, 47594.0, 17528.0, 7514.0, 3506.0, 1852.0, 1024.0, 610.0, 392.0, 254.0, 185.0, 114.0, 82.0, 55.0, 42.0, 27.0, 14.0, 13.0, 17.0, 5.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.46875, -11.124267578125, -10.77978515625, -10.435302734375, -10.0908203125, -9.746337890625, -9.40185546875, -9.057373046875, -8.712890625, -8.368408203125, -8.02392578125, -7.679443359375, -7.3349609375, -6.990478515625, -6.64599609375, -6.301513671875, -5.95703125, -5.612548828125, -5.26806640625, -4.923583984375, -4.5791015625, -4.234619140625, -3.89013671875, -3.545654296875, -3.201171875, -2.856689453125, -2.51220703125, -2.167724609375, -1.8232421875, -1.478759765625, -1.13427734375, -0.789794921875, -0.4453125, -0.100830078125, 0.24365234375, 0.588134765625, 0.9326171875, 1.277099609375, 1.62158203125, 1.966064453125, 2.310546875, 2.655029296875, 2.99951171875, 3.343994140625, 3.6884765625, 4.032958984375, 4.37744140625, 4.721923828125, 5.06640625, 5.410888671875, 5.75537109375, 6.099853515625, 6.4443359375, 6.788818359375, 7.13330078125, 7.477783203125, 7.822265625, 8.166748046875, 8.51123046875, 8.855712890625, 9.2001953125, 9.544677734375, 9.88916015625, 10.233642578125, 10.578125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 9.0, 9.0, 11.0, 10.0, 27.0, 24.0, 31.0, 58.0, 73.0, 88.0, 122.0, 113.0, 111.0, 82.0, 50.0, 47.0, 37.0, 19.0, 19.0, 12.0, 10.0, 4.0, 8.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005164146423339844, -0.0005009956657886505, -0.00048557668924331665, -0.0004701577126979828, -0.0004547387361526489, -0.00043931975960731506, -0.0004239007830619812, -0.00040848180651664734, -0.0003930628299713135, -0.0003776438534259796, -0.00036222487688064575, -0.0003468059003353119, -0.00033138692378997803, -0.00031596794724464417, -0.0003005489706993103, -0.00028512999415397644, -0.0002697110176086426, -0.0002542920410633087, -0.00023887306451797485, -0.000223454087972641, -0.00020803511142730713, -0.00019261613488197327, -0.0001771971583366394, -0.00016177818179130554, -0.00014635920524597168, -0.00013094022870063782, -0.00011552125215530396, -0.00010010227560997009, -8.468329906463623e-05, -6.926432251930237e-05, -5.3845345973968506e-05, -3.8426369428634644e-05, -2.300739288330078e-05, -7.588416337966919e-06, 7.830560207366943e-06, 2.3249536752700806e-05, 3.866851329803467e-05, 5.408748984336853e-05, 6.950646638870239e-05, 8.492544293403625e-05, 0.00010034441947937012, 0.00011576339602470398, 0.00013118237257003784, 0.0001466013491153717, 0.00016202032566070557, 0.00017743930220603943, 0.0001928582787513733, 0.00020827725529670715, 0.00022369623184204102, 0.00023911520838737488, 0.00025453418493270874, 0.0002699531614780426, 0.00028537213802337646, 0.00030079111456871033, 0.0003162100911140442, 0.00033162906765937805, 0.0003470480442047119, 0.0003624670207500458, 0.00037788599729537964, 0.0003933049738407135, 0.00040872395038604736, 0.0004241429269313812, 0.0004395619034767151, 0.00045498088002204895, 0.0004703998565673828]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 6.0, 10.0, 12.0, 16.0, 19.0, 32.0, 72.0, 74.0, 121.0, 178.0, 298.0, 445.0, 667.0, 1094.0, 1887.0, 3534.0, 7021.0, 15322.0, 37000.0, 101098.0, 283413.0, 357514.0, 147192.0, 51466.0, 20510.0, 9288.0, 4405.0, 2320.0, 1316.0, 783.0, 481.0, 328.0, 212.0, 137.0, 90.0, 63.0, 44.0, 15.0, 22.0, 10.0, 9.0, 4.0, 10.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.484375, -9.1700439453125, -8.855712890625, -8.5413818359375, -8.22705078125, -7.9127197265625, -7.598388671875, -7.2840576171875, -6.9697265625, -6.6553955078125, -6.341064453125, -6.0267333984375, -5.71240234375, -5.3980712890625, -5.083740234375, -4.7694091796875, -4.455078125, -4.1407470703125, -3.826416015625, -3.5120849609375, -3.19775390625, -2.8834228515625, -2.569091796875, -2.2547607421875, -1.9404296875, -1.6260986328125, -1.311767578125, -0.9974365234375, -0.68310546875, -0.3687744140625, -0.054443359375, 0.2598876953125, 0.57421875, 0.8885498046875, 1.202880859375, 1.5172119140625, 1.83154296875, 2.1458740234375, 2.460205078125, 2.7745361328125, 3.0888671875, 3.4031982421875, 3.717529296875, 4.0318603515625, 4.34619140625, 4.6605224609375, 4.974853515625, 5.2891845703125, 5.603515625, 5.9178466796875, 6.232177734375, 6.5465087890625, 6.86083984375, 7.1751708984375, 7.489501953125, 7.8038330078125, 8.1181640625, 8.4324951171875, 8.746826171875, 9.0611572265625, 9.37548828125, 9.6898193359375, 10.004150390625, 10.3184814453125, 10.6328125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 2.0, 6.0, 9.0, 8.0, 12.0, 13.0, 20.0, 32.0, 34.0, 43.0, 50.0, 55.0, 73.0, 57.0, 75.0, 83.0, 80.0, 72.0, 51.0, 50.0, 47.0, 24.0, 19.0, 23.0, 16.0, 9.0, 11.0, 3.0, 3.0, 6.0, 1.0, 4.0, 0.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.9661865234375, -2.860107421875, -2.7540283203125, -2.64794921875, -2.5418701171875, -2.435791015625, -2.3297119140625, -2.2236328125, -2.1175537109375, -2.011474609375, -1.9053955078125, -1.79931640625, -1.6932373046875, -1.587158203125, -1.4810791015625, -1.375, -1.2689208984375, -1.162841796875, -1.0567626953125, -0.95068359375, -0.8446044921875, -0.738525390625, -0.6324462890625, -0.5263671875, -0.4202880859375, -0.314208984375, -0.2081298828125, -0.10205078125, 0.0040283203125, 0.110107421875, 0.2161865234375, 0.322265625, 0.4283447265625, 0.534423828125, 0.6405029296875, 0.74658203125, 0.8526611328125, 0.958740234375, 1.0648193359375, 1.1708984375, 1.2769775390625, 1.383056640625, 1.4891357421875, 1.59521484375, 1.7012939453125, 1.807373046875, 1.9134521484375, 2.01953125, 2.1256103515625, 2.231689453125, 2.3377685546875, 2.44384765625, 2.5499267578125, 2.656005859375, 2.7620849609375, 2.8681640625, 2.9742431640625, 3.080322265625, 3.1864013671875, 3.29248046875, 3.3985595703125, 3.504638671875, 3.6107177734375, 3.716796875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 0.0, 5.0, 8.0, 15.0, 15.0, 15.0, 30.0, 46.0, 67.0, 69.0, 108.0, 114.0, 105.0, 102.0, 79.0, 61.0, 45.0, 34.0, 20.0, 13.0, 13.0, 12.0, 5.0, 1.0, 4.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.49533462524414, -27.763118743896484, -27.030900955200195, -26.29868507385254, -25.56646728515625, -24.834251403808594, -24.102035522460938, -23.36981773376465, -22.63759994506836, -21.905384063720703, -21.173166275024414, -20.440950393676758, -19.70873260498047, -18.976516723632812, -18.244300842285156, -17.512083053588867, -16.77986717224121, -16.047651290893555, -15.315433502197266, -14.58321762084961, -13.85099983215332, -13.118783950805664, -12.386567115783691, -11.654350280761719, -10.922133445739746, -10.189916610717773, -9.4576997756958, -8.725482940673828, -7.993266582489014, -7.261049747467041, -6.528833389282227, -5.796616554260254, -5.064399719238281, -4.332182884216309, -3.599966287612915, -2.8677496910095215, -2.135532855987549, -1.4033160209655762, -0.6710996627807617, 0.06111717224121094, 0.7933340072631836, 1.5255507230758667, 2.25776743888855, 2.9899840354919434, 3.722200870513916, 4.454417705535889, 5.186634063720703, 5.918850898742676, 6.651067733764648, 7.383284568786621, 8.115501403808594, 8.84771728515625, 9.579935073852539, 10.312150955200195, 11.044367790222168, 11.77658462524414, 12.508801460266113, 13.241018295288086, 13.973235130310059, 14.705451965332031, 15.437667846679688, 16.169885635375977, 16.902101516723633, 17.634319305419922, 18.366535186767578]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 3.0, 8.0, 7.0, 5.0, 12.0, 11.0, 15.0, 18.0, 19.0, 25.0, 35.0, 33.0, 27.0, 36.0, 42.0, 37.0, 49.0, 46.0, 42.0, 46.0, 44.0, 49.0, 48.0, 33.0, 33.0, 42.0, 38.0, 33.0, 23.0, 17.0, 21.0, 24.0, 15.0, 17.0, 13.0, 8.0, 9.0, 8.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-14.731971740722656, -14.319819450378418, -13.907666206359863, -13.495513916015625, -13.08336067199707, -12.671208381652832, -12.259056091308594, -11.846902847290039, -11.434749603271484, -11.022597312927246, -10.610444068908691, -10.198291778564453, -9.786138534545898, -9.37398624420166, -8.961833953857422, -8.549680709838867, -8.137528419494629, -7.725375652313232, -7.313222885131836, -6.901070594787598, -6.488917350769043, -6.076765060424805, -5.664612293243408, -5.252459526062012, -4.840306758880615, -4.428153991699219, -4.016001224517822, -3.603848695755005, -3.1916959285736084, -2.779543161392212, -2.3673906326293945, -1.955237865447998, -1.5430850982666016, -1.130932331085205, -0.7187796831130981, -0.3066270351409912, 0.10552573204040527, 0.5176784992218018, 0.9298310279846191, 1.3419837951660156, 1.754136562347412, 2.1662893295288086, 2.578442096710205, 2.9905946254730225, 3.402747392654419, 3.8149001598358154, 4.227052688598633, 4.639205455780029, 5.051358222961426, 5.463510990142822, 5.875663757324219, 6.287816047668457, 6.699969291687012, 7.11212158203125, 7.5242743492126465, 7.936427116394043, 8.348579406738281, 8.76073169708252, 9.172884941101074, 9.585037231445312, 9.997190475463867, 10.409342765808105, 10.821495056152344, 11.233648300170898, 11.645801544189453]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 5.0, 10.0, 11.0, 24.0, 25.0, 41.0, 76.0, 83.0, 107.0, 190.0, 311.0, 422.0, 703.0, 1123.0, 1771.0, 2952.0, 5180.0, 9411.0, 17785.0, 34845.0, 70830.0, 138559.0, 220921.0, 230184.0, 151416.0, 79166.0, 38708.0, 19573.0, 10309.0, 5520.0, 3146.0, 1955.0, 1137.0, 703.0, 459.0, 316.0, 178.0, 118.0, 89.0, 65.0, 40.0, 36.0, 18.0, 17.0, 5.0, 8.0, 3.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.03125, -19.443359375, -18.85546875, -18.267578125, -17.6796875, -17.091796875, -16.50390625, -15.916015625, -15.328125, -14.740234375, -14.15234375, -13.564453125, -12.9765625, -12.388671875, -11.80078125, -11.212890625, -10.625, -10.037109375, -9.44921875, -8.861328125, -8.2734375, -7.685546875, -7.09765625, -6.509765625, -5.921875, -5.333984375, -4.74609375, -4.158203125, -3.5703125, -2.982421875, -2.39453125, -1.806640625, -1.21875, -0.630859375, -0.04296875, 0.544921875, 1.1328125, 1.720703125, 2.30859375, 2.896484375, 3.484375, 4.072265625, 4.66015625, 5.248046875, 5.8359375, 6.423828125, 7.01171875, 7.599609375, 8.1875, 8.775390625, 9.36328125, 9.951171875, 10.5390625, 11.126953125, 11.71484375, 12.302734375, 12.890625, 13.478515625, 14.06640625, 14.654296875, 15.2421875, 15.830078125, 16.41796875, 17.005859375, 17.59375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 9.0, 5.0, 10.0, 14.0, 13.0, 21.0, 33.0, 29.0, 30.0, 26.0, 28.0, 40.0, 38.0, 50.0, 35.0, 48.0, 45.0, 47.0, 45.0, 39.0, 46.0, 31.0, 33.0, 45.0, 34.0, 30.0, 21.0, 19.0, 18.0, 16.0, 17.0, 17.0, 16.0, 11.0, 7.0, 5.0, 4.0, 6.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-14.1796875, -13.7786865234375, -13.377685546875, -12.9766845703125, -12.57568359375, -12.1746826171875, -11.773681640625, -11.3726806640625, -10.9716796875, -10.5706787109375, -10.169677734375, -9.7686767578125, -9.36767578125, -8.9666748046875, -8.565673828125, -8.1646728515625, -7.763671875, -7.3626708984375, -6.961669921875, -6.5606689453125, -6.15966796875, -5.7586669921875, -5.357666015625, -4.9566650390625, -4.5556640625, -4.1546630859375, -3.753662109375, -3.3526611328125, -2.95166015625, -2.5506591796875, -2.149658203125, -1.7486572265625, -1.34765625, -0.9466552734375, -0.545654296875, -0.1446533203125, 0.25634765625, 0.6573486328125, 1.058349609375, 1.4593505859375, 1.8603515625, 2.2613525390625, 2.662353515625, 3.0633544921875, 3.46435546875, 3.8653564453125, 4.266357421875, 4.6673583984375, 5.068359375, 5.4693603515625, 5.870361328125, 6.2713623046875, 6.67236328125, 7.0733642578125, 7.474365234375, 7.8753662109375, 8.2763671875, 8.6773681640625, 9.078369140625, 9.4793701171875, 9.88037109375, 10.2813720703125, 10.682373046875, 11.0833740234375, 11.484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 2.0, 8.0, 8.0, 14.0, 20.0, 22.0, 25.0, 58.0, 61.0, 105.0, 148.0, 204.0, 359.0, 549.0, 798.0, 1212.0, 1939.0, 2838.0, 4603.0, 7344.0, 12304.0, 20372.0, 34733.0, 59550.0, 100906.0, 156867.0, 193453.0, 169732.0, 113194.0, 68149.0, 38999.0, 22975.0, 14128.0, 8371.0, 5152.0, 3316.0, 2120.0, 1337.0, 839.0, 561.0, 380.0, 267.0, 171.0, 110.0, 73.0, 63.0, 34.0, 23.0, 14.0, 20.0, 19.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.046875, -13.588134765625, -13.12939453125, -12.670654296875, -12.2119140625, -11.753173828125, -11.29443359375, -10.835693359375, -10.376953125, -9.918212890625, -9.45947265625, -9.000732421875, -8.5419921875, -8.083251953125, -7.62451171875, -7.165771484375, -6.70703125, -6.248291015625, -5.78955078125, -5.330810546875, -4.8720703125, -4.413330078125, -3.95458984375, -3.495849609375, -3.037109375, -2.578369140625, -2.11962890625, -1.660888671875, -1.2021484375, -0.743408203125, -0.28466796875, 0.174072265625, 0.6328125, 1.091552734375, 1.55029296875, 2.009033203125, 2.4677734375, 2.926513671875, 3.38525390625, 3.843994140625, 4.302734375, 4.761474609375, 5.22021484375, 5.678955078125, 6.1376953125, 6.596435546875, 7.05517578125, 7.513916015625, 7.97265625, 8.431396484375, 8.89013671875, 9.348876953125, 9.8076171875, 10.266357421875, 10.72509765625, 11.183837890625, 11.642578125, 12.101318359375, 12.56005859375, 13.018798828125, 13.4775390625, 13.936279296875, 14.39501953125, 14.853759765625, 15.3125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 9.0, 11.0, 11.0, 11.0, 12.0, 9.0, 18.0, 22.0, 18.0, 18.0, 23.0, 25.0, 33.0, 32.0, 34.0, 34.0, 33.0, 35.0, 35.0, 39.0, 37.0, 32.0, 37.0, 33.0, 25.0, 35.0, 39.0, 28.0, 38.0, 38.0, 32.0, 17.0, 24.0, 15.0, 17.0, 11.0, 16.0, 12.0, 8.0, 8.0, 5.0, 2.0, 4.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.046875, -7.7847900390625, -7.522705078125, -7.2606201171875, -6.99853515625, -6.7364501953125, -6.474365234375, -6.2122802734375, -5.9501953125, -5.6881103515625, -5.426025390625, -5.1639404296875, -4.90185546875, -4.6397705078125, -4.377685546875, -4.1156005859375, -3.853515625, -3.5914306640625, -3.329345703125, -3.0672607421875, -2.80517578125, -2.5430908203125, -2.281005859375, -2.0189208984375, -1.7568359375, -1.4947509765625, -1.232666015625, -0.9705810546875, -0.70849609375, -0.4464111328125, -0.184326171875, 0.0777587890625, 0.33984375, 0.6019287109375, 0.864013671875, 1.1260986328125, 1.38818359375, 1.6502685546875, 1.912353515625, 2.1744384765625, 2.4365234375, 2.6986083984375, 2.960693359375, 3.2227783203125, 3.48486328125, 3.7469482421875, 4.009033203125, 4.2711181640625, 4.533203125, 4.7952880859375, 5.057373046875, 5.3194580078125, 5.58154296875, 5.8436279296875, 6.105712890625, 6.3677978515625, 6.6298828125, 6.8919677734375, 7.154052734375, 7.4161376953125, 7.67822265625, 7.9403076171875, 8.202392578125, 8.4644775390625, 8.7265625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 8.0, 9.0, 9.0, 14.0, 27.0, 50.0, 62.0, 97.0, 142.0, 198.0, 343.0, 597.0, 991.0, 1643.0, 2940.0, 5320.0, 10734.0, 24020.0, 64939.0, 215472.0, 439480.0, 182282.0, 55960.0, 21852.0, 9865.0, 4934.0, 2678.0, 1502.0, 913.0, 536.0, 341.0, 214.0, 146.0, 79.0, 55.0, 39.0, 23.0, 18.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.921875, -29.968505859375, -29.01513671875, -28.061767578125, -27.1083984375, -26.155029296875, -25.20166015625, -24.248291015625, -23.294921875, -22.341552734375, -21.38818359375, -20.434814453125, -19.4814453125, -18.528076171875, -17.57470703125, -16.621337890625, -15.66796875, -14.714599609375, -13.76123046875, -12.807861328125, -11.8544921875, -10.901123046875, -9.94775390625, -8.994384765625, -8.041015625, -7.087646484375, -6.13427734375, -5.180908203125, -4.2275390625, -3.274169921875, -2.32080078125, -1.367431640625, -0.4140625, 0.539306640625, 1.49267578125, 2.446044921875, 3.3994140625, 4.352783203125, 5.30615234375, 6.259521484375, 7.212890625, 8.166259765625, 9.11962890625, 10.072998046875, 11.0263671875, 11.979736328125, 12.93310546875, 13.886474609375, 14.83984375, 15.793212890625, 16.74658203125, 17.699951171875, 18.6533203125, 19.606689453125, 20.56005859375, 21.513427734375, 22.466796875, 23.420166015625, 24.37353515625, 25.326904296875, 26.2802734375, 27.233642578125, 28.18701171875, 29.140380859375, 30.09375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 6.0, 5.0, 6.0, 4.0, 7.0, 10.0, 9.0, 19.0, 8.0, 30.0, 37.0, 44.0, 65.0, 78.0, 104.0, 104.0, 96.0, 76.0, 63.0, 50.0, 40.0, 28.0, 19.0, 19.0, 9.0, 14.0, 8.0, 4.0, 8.0, 3.0, 8.0, 5.0, 2.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016937255859375, -0.001638263463973999, -0.001582801342010498, -0.001527339220046997, -0.001471877098083496, -0.0014164149761199951, -0.0013609528541564941, -0.0013054907321929932, -0.0012500286102294922, -0.0011945664882659912, -0.0011391043663024902, -0.0010836422443389893, -0.0010281801223754883, -0.0009727180004119873, -0.0009172558784484863, -0.0008617937564849854, -0.0008063316345214844, -0.0007508695125579834, -0.0006954073905944824, -0.0006399452686309814, -0.0005844831466674805, -0.0005290210247039795, -0.0004735589027404785, -0.00041809678077697754, -0.00036263465881347656, -0.0003071725368499756, -0.0002517104148864746, -0.00019624829292297363, -0.00014078617095947266, -8.532404899597168e-05, -2.9861927032470703e-05, 2.5600194931030273e-05, 8.106231689453125e-05, 0.00013652443885803223, 0.0001919865608215332, 0.0002474486827850342, 0.00030291080474853516, 0.00035837292671203613, 0.0004138350486755371, 0.0004692971706390381, 0.0005247592926025391, 0.00058022141456604, 0.000635683536529541, 0.000691145658493042, 0.000746607780456543, 0.0008020699024200439, 0.0008575320243835449, 0.0009129941463470459, 0.0009684562683105469, 0.0010239183902740479, 0.0010793805122375488, 0.0011348426342010498, 0.0011903047561645508, 0.0012457668781280518, 0.0013012290000915527, 0.0013566911220550537, 0.0014121532440185547, 0.0014676153659820557, 0.0015230774879455566, 0.0015785396099090576, 0.0016340017318725586, 0.0016894638538360596, 0.0017449259757995605, 0.0018003880977630615, 0.0018558502197265625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 27.0, 28.0, 50.0, 49.0, 71.0, 75.0, 146.0, 191.0, 262.0, 439.0, 685.0, 1038.0, 1658.0, 2756.0, 4522.0, 8054.0, 15867.0, 33336.0, 75227.0, 182761.0, 322338.0, 223451.0, 93592.0, 40106.0, 18791.0, 9537.0, 5128.0, 3060.0, 1796.0, 1176.0, 722.0, 493.0, 350.0, 231.0, 157.0, 124.0, 60.0, 55.0, 27.0, 29.0, 11.0, 11.0, 12.0, 12.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0], "bins": [-20.40625, -19.79931640625, -19.1923828125, -18.58544921875, -17.978515625, -17.37158203125, -16.7646484375, -16.15771484375, -15.55078125, -14.94384765625, -14.3369140625, -13.72998046875, -13.123046875, -12.51611328125, -11.9091796875, -11.30224609375, -10.6953125, -10.08837890625, -9.4814453125, -8.87451171875, -8.267578125, -7.66064453125, -7.0537109375, -6.44677734375, -5.83984375, -5.23291015625, -4.6259765625, -4.01904296875, -3.412109375, -2.80517578125, -2.1982421875, -1.59130859375, -0.984375, -0.37744140625, 0.2294921875, 0.83642578125, 1.443359375, 2.05029296875, 2.6572265625, 3.26416015625, 3.87109375, 4.47802734375, 5.0849609375, 5.69189453125, 6.298828125, 6.90576171875, 7.5126953125, 8.11962890625, 8.7265625, 9.33349609375, 9.9404296875, 10.54736328125, 11.154296875, 11.76123046875, 12.3681640625, 12.97509765625, 13.58203125, 14.18896484375, 14.7958984375, 15.40283203125, 16.009765625, 16.61669921875, 17.2236328125, 17.83056640625, 18.4375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 6.0, 2.0, 5.0, 11.0, 20.0, 23.0, 29.0, 37.0, 55.0, 71.0, 76.0, 77.0, 97.0, 94.0, 67.0, 73.0, 66.0, 47.0, 40.0, 23.0, 19.0, 20.0, 13.0, 8.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.625, -9.3397216796875, -9.054443359375, -8.7691650390625, -8.48388671875, -8.1986083984375, -7.913330078125, -7.6280517578125, -7.3427734375, -7.0574951171875, -6.772216796875, -6.4869384765625, -6.20166015625, -5.9163818359375, -5.631103515625, -5.3458251953125, -5.060546875, -4.7752685546875, -4.489990234375, -4.2047119140625, -3.91943359375, -3.6341552734375, -3.348876953125, -3.0635986328125, -2.7783203125, -2.4930419921875, -2.207763671875, -1.9224853515625, -1.63720703125, -1.3519287109375, -1.066650390625, -0.7813720703125, -0.49609375, -0.2108154296875, 0.074462890625, 0.3597412109375, 0.64501953125, 0.9302978515625, 1.215576171875, 1.5008544921875, 1.7861328125, 2.0714111328125, 2.356689453125, 2.6419677734375, 2.92724609375, 3.2125244140625, 3.497802734375, 3.7830810546875, 4.068359375, 4.3536376953125, 4.638916015625, 4.9241943359375, 5.20947265625, 5.4947509765625, 5.780029296875, 6.0653076171875, 6.3505859375, 6.6358642578125, 6.921142578125, 7.2064208984375, 7.49169921875, 7.7769775390625, 8.062255859375, 8.3475341796875, 8.6328125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 2.0, 7.0, 4.0, 5.0, 10.0, 19.0, 14.0, 25.0, 25.0, 29.0, 33.0, 55.0, 62.0, 75.0, 81.0, 74.0, 76.0, 70.0, 59.0, 55.0, 47.0, 33.0, 29.0, 30.0, 13.0, 12.0, 11.0, 11.0, 4.0, 8.0, 6.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.959487915039062, -18.40255355834961, -17.845619201660156, -17.28868293762207, -16.731748580932617, -16.174814224243164, -15.617879867553711, -15.060945510864258, -14.504010200500488, -13.947075843811035, -13.390140533447266, -12.833206176757812, -12.27627182006836, -11.71933650970459, -11.162402153015137, -10.605466842651367, -10.048532485961914, -9.491598129272461, -8.934662818908691, -8.377728462219238, -7.820793628692627, -7.263858795166016, -6.7069244384765625, -6.149989604949951, -5.59305477142334, -5.0361199378967285, -4.479185104370117, -3.922250747680664, -3.3653159141540527, -2.8083810806274414, -2.251446485519409, -1.694511890411377, -1.1375789642333984, -0.5806442499160767, -0.023709535598754883, 0.5332251787185669, 1.0901598930358887, 1.6470947265625, 2.2040293216705322, 2.7609639167785645, 3.317898750305176, 3.874833583831787, 4.431768417358398, 4.988702774047852, 5.545637607574463, 6.102572441101074, 6.659506797790527, 7.216441631317139, 7.77337646484375, 8.330310821533203, 8.887246131896973, 9.444180488586426, 10.001115798950195, 10.558050155639648, 11.114984512329102, 11.671918869018555, 12.228854179382324, 12.785788536071777, 13.342723846435547, 13.899658203125, 14.456592559814453, 15.013527870178223, 15.570462226867676, 16.127397537231445, 16.6843318939209]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 8.0, 3.0, 9.0, 8.0, 17.0, 12.0, 24.0, 32.0, 30.0, 42.0, 42.0, 35.0, 40.0, 44.0, 47.0, 38.0, 52.0, 42.0, 43.0, 58.0, 54.0, 35.0, 36.0, 31.0, 35.0, 36.0, 39.0, 21.0, 16.0, 15.0, 12.0, 9.0, 9.0, 5.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.434259414672852, -13.986702919006348, -13.539145469665527, -13.091588973999023, -12.644031524658203, -12.1964750289917, -11.748918533325195, -11.301361083984375, -10.853803634643555, -10.40624713897705, -9.95868968963623, -9.511133193969727, -9.063575744628906, -8.616019248962402, -8.168462753295898, -7.720905303955078, -7.273348808288574, -6.825791835784912, -6.37823486328125, -5.930678367614746, -5.483120918273926, -5.035564422607422, -4.58800745010376, -4.140450477600098, -3.6928935050964355, -3.2453365325927734, -2.7977795600891113, -2.3502228260040283, -1.9026658535003662, -1.455108880996704, -1.007552146911621, -0.559995174407959, -0.11243724822998047, 0.33511966466903687, 0.7826765775680542, 1.2302334308624268, 1.6777904033660889, 2.125347375869751, 2.572904109954834, 3.020461082458496, 3.468018054962158, 3.9155750274658203, 4.363131999969482, 4.8106889724731445, 5.258245468139648, 5.705802917480469, 6.153359413146973, 6.600916385650635, 7.048473358154297, 7.496030330657959, 7.943587303161621, 8.391143798828125, 8.838701248168945, 9.28625774383545, 9.733814239501953, 10.181371688842773, 10.628929138183594, 11.076485633850098, 11.524043083190918, 11.971599578857422, 12.419157028198242, 12.866713523864746, 13.31427001953125, 13.76182746887207, 14.209383964538574]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 11.0, 21.0, 29.0, 43.0, 85.0, 128.0, 189.0, 296.0, 523.0, 816.0, 1241.0, 2172.0, 3643.0, 6650.0, 12763.0, 26094.0, 61519.0, 170198.0, 533300.0, 1314840.0, 1287355.0, 502636.0, 157998.0, 57912.0, 25227.0, 12372.0, 6670.0, 3696.0, 2228.0, 1270.0, 790.0, 559.0, 362.0, 232.0, 134.0, 94.0, 58.0, 39.0, 19.0, 21.0, 9.0, 11.0, 5.0, 5.0, 3.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-16.34375, -15.759521484375, -15.17529296875, -14.591064453125, -14.0068359375, -13.422607421875, -12.83837890625, -12.254150390625, -11.669921875, -11.085693359375, -10.50146484375, -9.917236328125, -9.3330078125, -8.748779296875, -8.16455078125, -7.580322265625, -6.99609375, -6.411865234375, -5.82763671875, -5.243408203125, -4.6591796875, -4.074951171875, -3.49072265625, -2.906494140625, -2.322265625, -1.738037109375, -1.15380859375, -0.569580078125, 0.0146484375, 0.598876953125, 1.18310546875, 1.767333984375, 2.3515625, 2.935791015625, 3.52001953125, 4.104248046875, 4.6884765625, 5.272705078125, 5.85693359375, 6.441162109375, 7.025390625, 7.609619140625, 8.19384765625, 8.778076171875, 9.3623046875, 9.946533203125, 10.53076171875, 11.114990234375, 11.69921875, 12.283447265625, 12.86767578125, 13.451904296875, 14.0361328125, 14.620361328125, 15.20458984375, 15.788818359375, 16.373046875, 16.957275390625, 17.54150390625, 18.125732421875, 18.7099609375, 19.294189453125, 19.87841796875, 20.462646484375, 21.046875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 3.0, 5.0, 11.0, 11.0, 7.0, 19.0, 16.0, 25.0, 25.0, 26.0, 35.0, 43.0, 42.0, 32.0, 38.0, 43.0, 50.0, 41.0, 46.0, 55.0, 47.0, 45.0, 42.0, 33.0, 35.0, 31.0, 32.0, 28.0, 26.0, 22.0, 16.0, 10.0, 15.0, 11.0, 11.0, 4.0, 4.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.84375, -9.5634765625, -9.283203125, -9.0029296875, -8.72265625, -8.4423828125, -8.162109375, -7.8818359375, -7.6015625, -7.3212890625, -7.041015625, -6.7607421875, -6.48046875, -6.2001953125, -5.919921875, -5.6396484375, -5.359375, -5.0791015625, -4.798828125, -4.5185546875, -4.23828125, -3.9580078125, -3.677734375, -3.3974609375, -3.1171875, -2.8369140625, -2.556640625, -2.2763671875, -1.99609375, -1.7158203125, -1.435546875, -1.1552734375, -0.875, -0.5947265625, -0.314453125, -0.0341796875, 0.24609375, 0.5263671875, 0.806640625, 1.0869140625, 1.3671875, 1.6474609375, 1.927734375, 2.2080078125, 2.48828125, 2.7685546875, 3.048828125, 3.3291015625, 3.609375, 3.8896484375, 4.169921875, 4.4501953125, 4.73046875, 5.0107421875, 5.291015625, 5.5712890625, 5.8515625, 6.1318359375, 6.412109375, 6.6923828125, 6.97265625, 7.2529296875, 7.533203125, 7.8134765625, 8.09375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 7.0, 2.0, 6.0, 7.0, 14.0, 10.0, 20.0, 31.0, 45.0, 62.0, 70.0, 108.0, 156.0, 252.0, 393.0, 525.0, 808.0, 1109.0, 1743.0, 2594.0, 3908.0, 6407.0, 10915.0, 19682.0, 37867.0, 85687.0, 224441.0, 633143.0, 1318819.0, 1107770.0, 445303.0, 158657.0, 62905.0, 30102.0, 15698.0, 9051.0, 5550.0, 3492.0, 2249.0, 1516.0, 998.0, 667.0, 456.0, 329.0, 226.0, 159.0, 88.0, 82.0, 45.0, 31.0, 25.0, 22.0, 19.0, 10.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.448486328125, -14.91259765625, -14.376708984375, -13.8408203125, -13.304931640625, -12.76904296875, -12.233154296875, -11.697265625, -11.161376953125, -10.62548828125, -10.089599609375, -9.5537109375, -9.017822265625, -8.48193359375, -7.946044921875, -7.41015625, -6.874267578125, -6.33837890625, -5.802490234375, -5.2666015625, -4.730712890625, -4.19482421875, -3.658935546875, -3.123046875, -2.587158203125, -2.05126953125, -1.515380859375, -0.9794921875, -0.443603515625, 0.09228515625, 0.628173828125, 1.1640625, 1.699951171875, 2.23583984375, 2.771728515625, 3.3076171875, 3.843505859375, 4.37939453125, 4.915283203125, 5.451171875, 5.987060546875, 6.52294921875, 7.058837890625, 7.5947265625, 8.130615234375, 8.66650390625, 9.202392578125, 9.73828125, 10.274169921875, 10.81005859375, 11.345947265625, 11.8818359375, 12.417724609375, 12.95361328125, 13.489501953125, 14.025390625, 14.561279296875, 15.09716796875, 15.633056640625, 16.1689453125, 16.704833984375, 17.24072265625, 17.776611328125, 18.3125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 5.0, 9.0, 6.0, 15.0, 10.0, 13.0, 19.0, 21.0, 31.0, 44.0, 50.0, 69.0, 80.0, 102.0, 118.0, 181.0, 214.0, 261.0, 298.0, 299.0, 337.0, 335.0, 280.0, 278.0, 219.0, 165.0, 137.0, 123.0, 86.0, 60.0, 41.0, 42.0, 22.0, 18.0, 13.0, 13.0, 7.0, 7.0, 10.0, 9.0, 2.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-5.6015625, -5.44842529296875, -5.2952880859375, -5.14215087890625, -4.989013671875, -4.83587646484375, -4.6827392578125, -4.52960205078125, -4.37646484375, -4.22332763671875, -4.0701904296875, -3.91705322265625, -3.763916015625, -3.61077880859375, -3.4576416015625, -3.30450439453125, -3.1513671875, -2.99822998046875, -2.8450927734375, -2.69195556640625, -2.538818359375, -2.38568115234375, -2.2325439453125, -2.07940673828125, -1.92626953125, -1.77313232421875, -1.6199951171875, -1.46685791015625, -1.313720703125, -1.16058349609375, -1.0074462890625, -0.85430908203125, -0.701171875, -0.54803466796875, -0.3948974609375, -0.24176025390625, -0.088623046875, 0.06451416015625, 0.2176513671875, 0.37078857421875, 0.52392578125, 0.67706298828125, 0.8302001953125, 0.98333740234375, 1.136474609375, 1.28961181640625, 1.4427490234375, 1.59588623046875, 1.7490234375, 1.90216064453125, 2.0552978515625, 2.20843505859375, 2.361572265625, 2.51470947265625, 2.6678466796875, 2.82098388671875, 2.97412109375, 3.12725830078125, 3.2803955078125, 3.43353271484375, 3.586669921875, 3.73980712890625, 3.8929443359375, 4.04608154296875, 4.19921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 8.0, 6.0, 8.0, 14.0, 14.0, 22.0, 30.0, 30.0, 48.0, 48.0, 76.0, 82.0, 116.0, 93.0, 74.0, 69.0, 67.0, 53.0, 31.0, 23.0, 23.0, 17.0, 16.0, 3.0, 8.0, 7.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.927227020263672, -22.33791160583496, -21.74859619140625, -21.15928077697754, -20.569965362548828, -19.980649948120117, -19.391334533691406, -18.802019119262695, -18.212703704833984, -17.623388290405273, -17.034072875976562, -16.44475746154785, -15.85544204711914, -15.26612663269043, -14.676811218261719, -14.087495803833008, -13.498181343078613, -12.908865928649902, -12.319550514221191, -11.73023509979248, -11.14091968536377, -10.551604270935059, -9.962289810180664, -9.372974395751953, -8.783658981323242, -8.194343566894531, -7.60502815246582, -7.015712738037109, -6.426397323608398, -5.8370819091796875, -5.247766971588135, -4.658451557159424, -4.069136619567871, -3.47982120513916, -2.890505790710449, -2.3011906147003174, -1.7118752002716064, -1.1225597858428955, -0.5332446098327637, 0.056070804595947266, 0.6453862190246582, 1.2347016334533691, 1.8240169286727905, 2.413332223892212, 3.002647638320923, 3.591963052749634, 4.181278228759766, 4.770593643188477, 5.3599090576171875, 5.949224472045898, 6.538539886474609, 7.12785530090332, 7.717170715332031, 8.306486129760742, 8.895801544189453, 9.485116958618164, 10.074432373046875, 10.663747787475586, 11.253063201904297, 11.842378616333008, 12.431694030761719, 13.02100944519043, 13.61032485961914, 14.199640274047852, 14.788954734802246]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 9.0, 22.0, 16.0, 16.0, 26.0, 33.0, 40.0, 36.0, 31.0, 35.0, 43.0, 44.0, 63.0, 56.0, 56.0, 60.0, 47.0, 49.0, 43.0, 36.0, 34.0, 24.0, 37.0, 25.0, 27.0, 17.0, 15.0, 12.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.667814254760742, -12.26236343383789, -11.856912612915039, -11.451460838317871, -11.04601001739502, -10.640559196472168, -10.235107421875, -9.829656600952148, -9.424205780029297, -9.018754959106445, -8.613304138183594, -8.207852363586426, -7.802401542663574, -7.396950721740723, -6.991499423980713, -6.586048126220703, -6.180597305297852, -5.775146484375, -5.36969518661499, -4.9642438888549805, -4.558793067932129, -4.153342247009277, -3.7478909492492676, -3.342439889907837, -2.9369888305664062, -2.5315377712249756, -2.126086711883545, -1.7206356525421143, -1.3151845932006836, -0.9097335338592529, -0.5042824745178223, -0.0988314151763916, 0.30661964416503906, 0.7120707035064697, 1.1175217628479004, 1.522972822189331, 1.9284238815307617, 2.3338749408721924, 2.739326000213623, 3.1447770595550537, 3.5502281188964844, 3.955679178237915, 4.361130237579346, 4.7665815353393555, 5.172032356262207, 5.577483177185059, 5.982934474945068, 6.388385772705078, 6.79383659362793, 7.199287414550781, 7.604738712310791, 8.0101900100708, 8.415640830993652, 8.821091651916504, 9.226543426513672, 9.631994247436523, 10.037445068359375, 10.442895889282227, 10.848346710205078, 11.253798484802246, 11.659249305725098, 12.06470012664795, 12.470151901245117, 12.875602722167969, 13.28105354309082]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 4.0, 6.0, 8.0, 13.0, 24.0, 33.0, 55.0, 82.0, 126.0, 171.0, 311.0, 460.0, 675.0, 1192.0, 2029.0, 3677.0, 6613.0, 12106.0, 23081.0, 44470.0, 84498.0, 152076.0, 220409.0, 207518.0, 134102.0, 73130.0, 38048.0, 19674.0, 10624.0, 5657.0, 3191.0, 1794.0, 1055.0, 561.0, 383.0, 244.0, 151.0, 107.0, 65.0, 47.0, 24.0, 19.0, 18.0, 12.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-8.59375, -8.354248046875, -8.11474609375, -7.875244140625, -7.6357421875, -7.396240234375, -7.15673828125, -6.917236328125, -6.677734375, -6.438232421875, -6.19873046875, -5.959228515625, -5.7197265625, -5.480224609375, -5.24072265625, -5.001220703125, -4.76171875, -4.522216796875, -4.28271484375, -4.043212890625, -3.8037109375, -3.564208984375, -3.32470703125, -3.085205078125, -2.845703125, -2.606201171875, -2.36669921875, -2.127197265625, -1.8876953125, -1.648193359375, -1.40869140625, -1.169189453125, -0.9296875, -0.690185546875, -0.45068359375, -0.211181640625, 0.0283203125, 0.267822265625, 0.50732421875, 0.746826171875, 0.986328125, 1.225830078125, 1.46533203125, 1.704833984375, 1.9443359375, 2.183837890625, 2.42333984375, 2.662841796875, 2.90234375, 3.141845703125, 3.38134765625, 3.620849609375, 3.8603515625, 4.099853515625, 4.33935546875, 4.578857421875, 4.818359375, 5.057861328125, 5.29736328125, 5.536865234375, 5.7763671875, 6.015869140625, 6.25537109375, 6.494873046875, 6.734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 11.0, 19.0, 21.0, 11.0, 29.0, 35.0, 33.0, 28.0, 45.0, 44.0, 39.0, 59.0, 49.0, 66.0, 52.0, 58.0, 54.0, 46.0, 38.0, 39.0, 37.0, 32.0, 26.0, 30.0, 14.0, 23.0, 12.0, 5.0, 9.0, 5.0, 10.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0390625, -13.59765625, -13.15625, -12.71484375, -12.2734375, -11.83203125, -11.390625, -10.94921875, -10.5078125, -10.06640625, -9.625, -9.18359375, -8.7421875, -8.30078125, -7.859375, -7.41796875, -6.9765625, -6.53515625, -6.09375, -5.65234375, -5.2109375, -4.76953125, -4.328125, -3.88671875, -3.4453125, -3.00390625, -2.5625, -2.12109375, -1.6796875, -1.23828125, -0.796875, -0.35546875, 0.0859375, 0.52734375, 0.96875, 1.41015625, 1.8515625, 2.29296875, 2.734375, 3.17578125, 3.6171875, 4.05859375, 4.5, 4.94140625, 5.3828125, 5.82421875, 6.265625, 6.70703125, 7.1484375, 7.58984375, 8.03125, 8.47265625, 8.9140625, 9.35546875, 9.796875, 10.23828125, 10.6796875, 11.12109375, 11.5625, 12.00390625, 12.4453125, 12.88671875, 13.328125, 13.76953125, 14.2109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 18.0, 30.0, 33.0, 45.0, 67.0, 80.0, 149.0, 196.0, 262.0, 421.0, 599.0, 976.0, 1558.0, 2457.0, 3860.0, 6660.0, 11115.0, 19379.0, 36442.0, 70490.0, 139304.0, 239013.0, 233375.0, 133815.0, 66936.0, 34860.0, 19094.0, 10738.0, 6197.0, 3751.0, 2320.0, 1474.0, 948.0, 614.0, 391.0, 272.0, 175.0, 131.0, 81.0, 52.0, 40.0, 29.0, 28.0, 20.0, 10.0, 5.0, 10.0, 5.0, 2.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-8.3046875, -8.0364990234375, -7.768310546875, -7.5001220703125, -7.23193359375, -6.9637451171875, -6.695556640625, -6.4273681640625, -6.1591796875, -5.8909912109375, -5.622802734375, -5.3546142578125, -5.08642578125, -4.8182373046875, -4.550048828125, -4.2818603515625, -4.013671875, -3.7454833984375, -3.477294921875, -3.2091064453125, -2.94091796875, -2.6727294921875, -2.404541015625, -2.1363525390625, -1.8681640625, -1.5999755859375, -1.331787109375, -1.0635986328125, -0.79541015625, -0.5272216796875, -0.259033203125, 0.0091552734375, 0.27734375, 0.5455322265625, 0.813720703125, 1.0819091796875, 1.35009765625, 1.6182861328125, 1.886474609375, 2.1546630859375, 2.4228515625, 2.6910400390625, 2.959228515625, 3.2274169921875, 3.49560546875, 3.7637939453125, 4.031982421875, 4.3001708984375, 4.568359375, 4.8365478515625, 5.104736328125, 5.3729248046875, 5.64111328125, 5.9093017578125, 6.177490234375, 6.4456787109375, 6.7138671875, 6.9820556640625, 7.250244140625, 7.5184326171875, 7.78662109375, 8.0548095703125, 8.322998046875, 8.5911865234375, 8.859375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 7.0, 13.0, 14.0, 15.0, 21.0, 16.0, 21.0, 25.0, 34.0, 29.0, 34.0, 29.0, 42.0, 37.0, 35.0, 45.0, 43.0, 52.0, 51.0, 41.0, 35.0, 37.0, 54.0, 40.0, 23.0, 24.0, 28.0, 21.0, 29.0, 19.0, 11.0, 13.0, 13.0, 13.0, 7.0, 4.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.671875, -6.4432373046875, -6.214599609375, -5.9859619140625, -5.75732421875, -5.5286865234375, -5.300048828125, -5.0714111328125, -4.8427734375, -4.6141357421875, -4.385498046875, -4.1568603515625, -3.92822265625, -3.6995849609375, -3.470947265625, -3.2423095703125, -3.013671875, -2.7850341796875, -2.556396484375, -2.3277587890625, -2.09912109375, -1.8704833984375, -1.641845703125, -1.4132080078125, -1.1845703125, -0.9559326171875, -0.727294921875, -0.4986572265625, -0.27001953125, -0.0413818359375, 0.187255859375, 0.4158935546875, 0.64453125, 0.8731689453125, 1.101806640625, 1.3304443359375, 1.55908203125, 1.7877197265625, 2.016357421875, 2.2449951171875, 2.4736328125, 2.7022705078125, 2.930908203125, 3.1595458984375, 3.38818359375, 3.6168212890625, 3.845458984375, 4.0740966796875, 4.302734375, 4.5313720703125, 4.760009765625, 4.9886474609375, 5.21728515625, 5.4459228515625, 5.674560546875, 5.9031982421875, 6.1318359375, 6.3604736328125, 6.589111328125, 6.8177490234375, 7.04638671875, 7.2750244140625, 7.503662109375, 7.7322998046875, 7.9609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 8.0, 12.0, 17.0, 29.0, 33.0, 53.0, 87.0, 153.0, 248.0, 385.0, 656.0, 1041.0, 1805.0, 3301.0, 5842.0, 11276.0, 23826.0, 55707.0, 147309.0, 358266.0, 265702.0, 97185.0, 38882.0, 17256.0, 8505.0, 4506.0, 2660.0, 1442.0, 922.0, 530.0, 329.0, 213.0, 152.0, 67.0, 49.0, 35.0, 29.0, 13.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.62109375, -6.39886474609375, -6.1766357421875, -5.95440673828125, -5.732177734375, -5.50994873046875, -5.2877197265625, -5.06549072265625, -4.84326171875, -4.62103271484375, -4.3988037109375, -4.17657470703125, -3.954345703125, -3.73211669921875, -3.5098876953125, -3.28765869140625, -3.0654296875, -2.84320068359375, -2.6209716796875, -2.39874267578125, -2.176513671875, -1.95428466796875, -1.7320556640625, -1.50982666015625, -1.28759765625, -1.06536865234375, -0.8431396484375, -0.62091064453125, -0.398681640625, -0.17645263671875, 0.0457763671875, 0.26800537109375, 0.490234375, 0.71246337890625, 0.9346923828125, 1.15692138671875, 1.379150390625, 1.60137939453125, 1.8236083984375, 2.04583740234375, 2.26806640625, 2.49029541015625, 2.7125244140625, 2.93475341796875, 3.156982421875, 3.37921142578125, 3.6014404296875, 3.82366943359375, 4.0458984375, 4.26812744140625, 4.4903564453125, 4.71258544921875, 4.934814453125, 5.15704345703125, 5.3792724609375, 5.60150146484375, 5.82373046875, 6.04595947265625, 6.2681884765625, 6.49041748046875, 6.712646484375, 6.93487548828125, 7.1571044921875, 7.37933349609375, 7.6015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 15.0, 2.0, 7.0, 7.0, 9.0, 11.0, 22.0, 26.0, 26.0, 44.0, 53.0, 86.0, 101.0, 106.0, 122.0, 83.0, 93.0, 51.0, 34.0, 22.0, 20.0, 15.0, 9.0, 9.0, 8.0, 4.0, 5.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034165382385253906, -0.00033053383231163025, -0.00031941384077072144, -0.0003082938492298126, -0.0002971738576889038, -0.000286053866147995, -0.0002749338746070862, -0.00026381388306617737, -0.00025269389152526855, -0.00024157389998435974, -0.00023045390844345093, -0.00021933391690254211, -0.0002082139253616333, -0.0001970939338207245, -0.00018597394227981567, -0.00017485395073890686, -0.00016373395919799805, -0.00015261396765708923, -0.00014149397611618042, -0.0001303739845752716, -0.00011925399303436279, -0.00010813400149345398, -9.701400995254517e-05, -8.589401841163635e-05, -7.477402687072754e-05, -6.365403532981873e-05, -5.253404378890991e-05, -4.14140522480011e-05, -3.0294060707092285e-05, -1.917406916618347e-05, -8.054077625274658e-06, 3.0659139156341553e-06, 1.4185905456542969e-05, 2.5305896997451782e-05, 3.6425888538360596e-05, 4.754588007926941e-05, 5.866587162017822e-05, 6.978586316108704e-05, 8.090585470199585e-05, 9.202584624290466e-05, 0.00010314583778381348, 0.00011426582932472229, 0.0001253858208656311, 0.00013650581240653992, 0.00014762580394744873, 0.00015874579548835754, 0.00016986578702926636, 0.00018098577857017517, 0.00019210577011108398, 0.0002032257616519928, 0.0002143457531929016, 0.00022546574473381042, 0.00023658573627471924, 0.00024770572781562805, 0.00025882571935653687, 0.0002699457108974457, 0.0002810657024383545, 0.0002921856939792633, 0.0003033056855201721, 0.00031442567706108093, 0.00032554566860198975, 0.00033666566014289856, 0.0003477856516838074, 0.0003589056432247162, 0.000370025634765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 3.0, 9.0, 5.0, 11.0, 10.0, 16.0, 26.0, 23.0, 48.0, 58.0, 99.0, 124.0, 186.0, 263.0, 437.0, 629.0, 902.0, 1342.0, 2054.0, 3085.0, 4919.0, 7947.0, 12875.0, 22480.0, 39889.0, 74704.0, 138483.0, 221622.0, 216503.0, 133273.0, 71848.0, 38623.0, 21728.0, 12831.0, 7649.0, 4789.0, 3010.0, 1948.0, 1291.0, 879.0, 608.0, 393.0, 275.0, 201.0, 150.0, 99.0, 66.0, 48.0, 28.0, 26.0, 12.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.34765625, -4.207275390625, -4.06689453125, -3.926513671875, -3.7861328125, -3.645751953125, -3.50537109375, -3.364990234375, -3.224609375, -3.084228515625, -2.94384765625, -2.803466796875, -2.6630859375, -2.522705078125, -2.38232421875, -2.241943359375, -2.1015625, -1.961181640625, -1.82080078125, -1.680419921875, -1.5400390625, -1.399658203125, -1.25927734375, -1.118896484375, -0.978515625, -0.838134765625, -0.69775390625, -0.557373046875, -0.4169921875, -0.276611328125, -0.13623046875, 0.004150390625, 0.14453125, 0.284912109375, 0.42529296875, 0.565673828125, 0.7060546875, 0.846435546875, 0.98681640625, 1.127197265625, 1.267578125, 1.407958984375, 1.54833984375, 1.688720703125, 1.8291015625, 1.969482421875, 2.10986328125, 2.250244140625, 2.390625, 2.531005859375, 2.67138671875, 2.811767578125, 2.9521484375, 3.092529296875, 3.23291015625, 3.373291015625, 3.513671875, 3.654052734375, 3.79443359375, 3.934814453125, 4.0751953125, 4.215576171875, 4.35595703125, 4.496337890625, 4.63671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 7.0, 8.0, 5.0, 13.0, 12.0, 8.0, 19.0, 19.0, 20.0, 22.0, 32.0, 37.0, 39.0, 47.0, 54.0, 60.0, 67.0, 64.0, 63.0, 45.0, 56.0, 30.0, 38.0, 41.0, 28.0, 30.0, 28.0, 12.0, 18.0, 9.0, 14.0, 6.0, 5.0, 11.0, 3.0, 5.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.968231201171875, -1.90716552734375, -1.846099853515625, -1.7850341796875, -1.723968505859375, -1.66290283203125, -1.601837158203125, -1.540771484375, -1.479705810546875, -1.41864013671875, -1.357574462890625, -1.2965087890625, -1.235443115234375, -1.17437744140625, -1.113311767578125, -1.05224609375, -0.991180419921875, -0.93011474609375, -0.869049072265625, -0.8079833984375, -0.746917724609375, -0.68585205078125, -0.624786376953125, -0.563720703125, -0.502655029296875, -0.44158935546875, -0.380523681640625, -0.3194580078125, -0.258392333984375, -0.19732666015625, -0.136260986328125, -0.0751953125, -0.014129638671875, 0.04693603515625, 0.108001708984375, 0.1690673828125, 0.230133056640625, 0.29119873046875, 0.352264404296875, 0.413330078125, 0.474395751953125, 0.53546142578125, 0.596527099609375, 0.6575927734375, 0.718658447265625, 0.77972412109375, 0.840789794921875, 0.90185546875, 0.962921142578125, 1.02398681640625, 1.085052490234375, 1.1461181640625, 1.207183837890625, 1.26824951171875, 1.329315185546875, 1.390380859375, 1.451446533203125, 1.51251220703125, 1.573577880859375, 1.6346435546875, 1.695709228515625, 1.75677490234375, 1.817840576171875, 1.87890625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 5.0, 10.0, 17.0, 13.0, 18.0, 19.0, 39.0, 45.0, 68.0, 73.0, 83.0, 108.0, 96.0, 63.0, 85.0, 67.0, 42.0, 42.0, 23.0, 18.0, 15.0, 11.0, 9.0, 6.0, 6.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.896865844726562, -22.305076599121094, -21.713285446166992, -21.121496200561523, -20.529706954956055, -19.937917709350586, -19.346126556396484, -18.754337310791016, -18.162548065185547, -17.570758819580078, -16.978967666625977, -16.387178421020508, -15.795389175415039, -15.203598976135254, -14.611808776855469, -14.02001953125, -13.428229331970215, -12.83643913269043, -12.244649887084961, -11.652859687805176, -11.061070442199707, -10.469280242919922, -9.877490997314453, -9.285700798034668, -8.693910598754883, -8.102120399475098, -7.510331153869629, -6.918540954589844, -6.326751708984375, -5.73496150970459, -5.143171787261963, -4.551382064819336, -3.9595937728881836, -3.3678040504455566, -2.7760143280029297, -2.1842243671417236, -1.5924346446990967, -1.0006449222564697, -0.40885496139526367, 0.18293476104736328, 0.7747244834899902, 1.3665142059326172, 1.9583040475845337, 2.55009388923645, 3.141883611679077, 3.733673334121704, 4.32546329498291, 4.917253017425537, 5.509042739868164, 6.100832462310791, 6.692622184753418, 7.284412384033203, 7.876201629638672, 8.467991828918457, 9.059782028198242, 9.651571273803711, 10.24336051940918, 10.835150718688965, 11.426939964294434, 12.018730163574219, 12.610519409179688, 13.202309608459473, 13.794099807739258, 14.385889053344727, 14.977679252624512]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 9.0, 11.0, 6.0, 24.0, 9.0, 25.0, 32.0, 28.0, 39.0, 29.0, 38.0, 31.0, 45.0, 54.0, 48.0, 67.0, 62.0, 41.0, 56.0, 50.0, 37.0, 45.0, 28.0, 35.0, 21.0, 29.0, 21.0, 19.0, 11.0, 12.0, 11.0, 10.0, 4.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.114065170288086, -11.72291088104248, -11.331755638122559, -10.940601348876953, -10.549447059631348, -10.158292770385742, -9.76713752746582, -9.375983238220215, -8.98482894897461, -8.593674659729004, -8.202519416809082, -7.811365127563477, -7.420210838317871, -7.029056072235107, -6.637901306152344, -6.246747016906738, -5.855591773986816, -5.464437007904053, -5.073282718658447, -4.682127952575684, -4.290973663330078, -3.8998188972473145, -3.508664131164551, -3.117509603500366, -2.7263550758361816, -2.335200548171997, -1.944045901298523, -1.5528912544250488, -1.1617367267608643, -0.7705821990966797, -0.379427433013916, 0.011727094650268555, 0.4028816223144531, 0.7940362095832825, 1.1851907968521118, 1.576345443725586, 1.9674999713897705, 2.358654499053955, 2.7498092651367188, 3.1409637928009033, 3.532118320465088, 3.9232728481292725, 4.314427375793457, 4.705582141876221, 5.096736907958984, 5.48789119720459, 5.8790459632873535, 6.270200729370117, 6.661355018615723, 7.052509784698486, 7.443664073944092, 7.8348188400268555, 8.225973129272461, 8.617128372192383, 9.008282661437988, 9.399436950683594, 9.790592193603516, 10.181746482849121, 10.572901725769043, 10.964056015014648, 11.355210304260254, 11.74636459350586, 12.137519836425781, 12.528674125671387, 12.919828414916992]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 9.0, 4.0, 16.0, 16.0, 26.0, 28.0, 37.0, 55.0, 76.0, 129.0, 169.0, 238.0, 381.0, 722.0, 1201.0, 2250.0, 4220.0, 8947.0, 20436.0, 51196.0, 135708.0, 290831.0, 295448.0, 142065.0, 54191.0, 21313.0, 9190.0, 4361.0, 2169.0, 1195.0, 678.0, 408.0, 260.0, 176.0, 115.0, 81.0, 48.0, 40.0, 27.0, 36.0, 14.0, 11.0, 15.0, 9.0, 9.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-22.265625, -21.5703125, -20.875, -20.1796875, -19.484375, -18.7890625, -18.09375, -17.3984375, -16.703125, -16.0078125, -15.3125, -14.6171875, -13.921875, -13.2265625, -12.53125, -11.8359375, -11.140625, -10.4453125, -9.75, -9.0546875, -8.359375, -7.6640625, -6.96875, -6.2734375, -5.578125, -4.8828125, -4.1875, -3.4921875, -2.796875, -2.1015625, -1.40625, -0.7109375, -0.015625, 0.6796875, 1.375, 2.0703125, 2.765625, 3.4609375, 4.15625, 4.8515625, 5.546875, 6.2421875, 6.9375, 7.6328125, 8.328125, 9.0234375, 9.71875, 10.4140625, 11.109375, 11.8046875, 12.5, 13.1953125, 13.890625, 14.5859375, 15.28125, 15.9765625, 16.671875, 17.3671875, 18.0625, 18.7578125, 19.453125, 20.1484375, 20.84375, 21.5390625, 22.234375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 5.0, 10.0, 14.0, 14.0, 18.0, 18.0, 29.0, 28.0, 29.0, 42.0, 29.0, 34.0, 49.0, 48.0, 46.0, 53.0, 52.0, 59.0, 74.0, 41.0, 36.0, 35.0, 40.0, 33.0, 30.0, 24.0, 19.0, 23.0, 19.0, 14.0, 7.0, 6.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.36328125, -10.9765625, -10.58984375, -10.203125, -9.81640625, -9.4296875, -9.04296875, -8.65625, -8.26953125, -7.8828125, -7.49609375, -7.109375, -6.72265625, -6.3359375, -5.94921875, -5.5625, -5.17578125, -4.7890625, -4.40234375, -4.015625, -3.62890625, -3.2421875, -2.85546875, -2.46875, -2.08203125, -1.6953125, -1.30859375, -0.921875, -0.53515625, -0.1484375, 0.23828125, 0.625, 1.01171875, 1.3984375, 1.78515625, 2.171875, 2.55859375, 2.9453125, 3.33203125, 3.71875, 4.10546875, 4.4921875, 4.87890625, 5.265625, 5.65234375, 6.0390625, 6.42578125, 6.8125, 7.19921875, 7.5859375, 7.97265625, 8.359375, 8.74609375, 9.1328125, 9.51953125, 9.90625, 10.29296875, 10.6796875, 11.06640625, 11.453125, 11.83984375, 12.2265625, 12.61328125, 13.0]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 7.0, 8.0, 16.0, 27.0, 32.0, 33.0, 65.0, 79.0, 142.0, 197.0, 288.0, 445.0, 649.0, 948.0, 1462.0, 2354.0, 3449.0, 5337.0, 8570.0, 13948.0, 23329.0, 39533.0, 65831.0, 108448.0, 159207.0, 184174.0, 157685.0, 107068.0, 65662.0, 38547.0, 23110.0, 13981.0, 8519.0, 5284.0, 3477.0, 2254.0, 1525.0, 920.0, 610.0, 444.0, 282.0, 191.0, 141.0, 86.0, 62.0, 36.0, 30.0, 20.0, 9.0, 11.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-11.296875, -10.9381103515625, -10.579345703125, -10.2205810546875, -9.86181640625, -9.5030517578125, -9.144287109375, -8.7855224609375, -8.4267578125, -8.0679931640625, -7.709228515625, -7.3504638671875, -6.99169921875, -6.6329345703125, -6.274169921875, -5.9154052734375, -5.556640625, -5.1978759765625, -4.839111328125, -4.4803466796875, -4.12158203125, -3.7628173828125, -3.404052734375, -3.0452880859375, -2.6865234375, -2.3277587890625, -1.968994140625, -1.6102294921875, -1.25146484375, -0.8927001953125, -0.533935546875, -0.1751708984375, 0.18359375, 0.5423583984375, 0.901123046875, 1.2598876953125, 1.61865234375, 1.9774169921875, 2.336181640625, 2.6949462890625, 3.0537109375, 3.4124755859375, 3.771240234375, 4.1300048828125, 4.48876953125, 4.8475341796875, 5.206298828125, 5.5650634765625, 5.923828125, 6.2825927734375, 6.641357421875, 7.0001220703125, 7.35888671875, 7.7176513671875, 8.076416015625, 8.4351806640625, 8.7939453125, 9.1527099609375, 9.511474609375, 9.8702392578125, 10.22900390625, 10.5877685546875, 10.946533203125, 11.3052978515625, 11.6640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 6.0, 7.0, 6.0, 5.0, 11.0, 6.0, 19.0, 15.0, 29.0, 23.0, 24.0, 33.0, 36.0, 19.0, 40.0, 49.0, 39.0, 47.0, 34.0, 40.0, 50.0, 39.0, 41.0, 43.0, 36.0, 47.0, 26.0, 38.0, 34.0, 25.0, 22.0, 21.0, 12.0, 13.0, 20.0, 9.0, 5.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-8.7109375, -8.47357177734375, -8.2362060546875, -7.99884033203125, -7.761474609375, -7.52410888671875, -7.2867431640625, -7.04937744140625, -6.81201171875, -6.57464599609375, -6.3372802734375, -6.09991455078125, -5.862548828125, -5.62518310546875, -5.3878173828125, -5.15045166015625, -4.9130859375, -4.67572021484375, -4.4383544921875, -4.20098876953125, -3.963623046875, -3.72625732421875, -3.4888916015625, -3.25152587890625, -3.01416015625, -2.77679443359375, -2.5394287109375, -2.30206298828125, -2.064697265625, -1.82733154296875, -1.5899658203125, -1.35260009765625, -1.115234375, -0.87786865234375, -0.6405029296875, -0.40313720703125, -0.165771484375, 0.07159423828125, 0.3089599609375, 0.54632568359375, 0.78369140625, 1.02105712890625, 1.2584228515625, 1.49578857421875, 1.733154296875, 1.97052001953125, 2.2078857421875, 2.44525146484375, 2.6826171875, 2.91998291015625, 3.1573486328125, 3.39471435546875, 3.632080078125, 3.86944580078125, 4.1068115234375, 4.34417724609375, 4.58154296875, 4.81890869140625, 5.0562744140625, 5.29364013671875, 5.531005859375, 5.76837158203125, 6.0057373046875, 6.24310302734375, 6.48046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 1.0, 2.0, 3.0, 6.0, 12.0, 17.0, 29.0, 31.0, 53.0, 111.0, 138.0, 194.0, 302.0, 472.0, 692.0, 1020.0, 1713.0, 2819.0, 4733.0, 8347.0, 15167.0, 28809.0, 56098.0, 116518.0, 234271.0, 271465.0, 153128.0, 72193.0, 35969.0, 18949.0, 10344.0, 5850.0, 3467.0, 2055.0, 1295.0, 810.0, 476.0, 330.0, 238.0, 136.0, 92.0, 70.0, 41.0, 29.0, 29.0, 9.0, 13.0, 4.0, 2.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.2265625, -13.770263671875, -13.31396484375, -12.857666015625, -12.4013671875, -11.945068359375, -11.48876953125, -11.032470703125, -10.576171875, -10.119873046875, -9.66357421875, -9.207275390625, -8.7509765625, -8.294677734375, -7.83837890625, -7.382080078125, -6.92578125, -6.469482421875, -6.01318359375, -5.556884765625, -5.1005859375, -4.644287109375, -4.18798828125, -3.731689453125, -3.275390625, -2.819091796875, -2.36279296875, -1.906494140625, -1.4501953125, -0.993896484375, -0.53759765625, -0.081298828125, 0.375, 0.831298828125, 1.28759765625, 1.743896484375, 2.2001953125, 2.656494140625, 3.11279296875, 3.569091796875, 4.025390625, 4.481689453125, 4.93798828125, 5.394287109375, 5.8505859375, 6.306884765625, 6.76318359375, 7.219482421875, 7.67578125, 8.132080078125, 8.58837890625, 9.044677734375, 9.5009765625, 9.957275390625, 10.41357421875, 10.869873046875, 11.326171875, 11.782470703125, 12.23876953125, 12.695068359375, 13.1513671875, 13.607666015625, 14.06396484375, 14.520263671875, 14.9765625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 8.0, 9.0, 22.0, 41.0, 66.0, 119.0, 211.0, 191.0, 140.0, 75.0, 40.0, 28.0, 13.0, 12.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032520294189453125, -0.003156810998916626, -0.0030615925788879395, -0.002966374158859253, -0.0028711557388305664, -0.00277593731880188, -0.0026807188987731934, -0.002585500478744507, -0.0024902820587158203, -0.002395063638687134, -0.0022998452186584473, -0.0022046267986297607, -0.0021094083786010742, -0.0020141899585723877, -0.0019189715385437012, -0.0018237531185150146, -0.0017285346984863281, -0.0016333162784576416, -0.001538097858428955, -0.0014428794384002686, -0.001347661018371582, -0.0012524425983428955, -0.001157224178314209, -0.0010620057582855225, -0.0009667873382568359, -0.0008715689182281494, -0.0007763504981994629, -0.0006811320781707764, -0.0005859136581420898, -0.0004906952381134033, -0.0003954768180847168, -0.0003002583980560303, -0.00020503997802734375, -0.00010982155799865723, -1.4603137969970703e-05, 8.061528205871582e-05, 0.00017583370208740234, 0.00027105212211608887, 0.0003662705421447754, 0.0004614889621734619, 0.0005567073822021484, 0.000651925802230835, 0.0007471442222595215, 0.000842362642288208, 0.0009375810623168945, 0.001032799482345581, 0.0011280179023742676, 0.001223236322402954, 0.0013184547424316406, 0.0014136731624603271, 0.0015088915824890137, 0.0016041100025177002, 0.0016993284225463867, 0.0017945468425750732, 0.0018897652626037598, 0.0019849836826324463, 0.002080202102661133, 0.0021754205226898193, 0.002270638942718506, 0.0023658573627471924, 0.002461075782775879, 0.0025562942028045654, 0.002651512622833252, 0.0027467310428619385, 0.002841949462890625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [5.0, 0.0, 4.0, 2.0, 5.0, 8.0, 7.0, 16.0, 24.0, 27.0, 34.0, 47.0, 76.0, 105.0, 147.0, 208.0, 320.0, 408.0, 695.0, 1043.0, 1670.0, 2823.0, 4781.0, 8687.0, 16421.0, 31078.0, 61176.0, 120849.0, 216285.0, 248167.0, 160613.0, 82283.0, 42082.0, 21088.0, 11492.0, 6227.0, 3683.0, 2118.0, 1304.0, 801.0, 574.0, 366.0, 240.0, 157.0, 132.0, 78.0, 76.0, 44.0, 30.0, 16.0, 14.0, 14.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.4273681640625, -10.057861328125, -9.6883544921875, -9.31884765625, -8.9493408203125, -8.579833984375, -8.2103271484375, -7.8408203125, -7.4713134765625, -7.101806640625, -6.7322998046875, -6.36279296875, -5.9932861328125, -5.623779296875, -5.2542724609375, -4.884765625, -4.5152587890625, -4.145751953125, -3.7762451171875, -3.40673828125, -3.0372314453125, -2.667724609375, -2.2982177734375, -1.9287109375, -1.5592041015625, -1.189697265625, -0.8201904296875, -0.45068359375, -0.0811767578125, 0.288330078125, 0.6578369140625, 1.02734375, 1.3968505859375, 1.766357421875, 2.1358642578125, 2.50537109375, 2.8748779296875, 3.244384765625, 3.6138916015625, 3.9833984375, 4.3529052734375, 4.722412109375, 5.0919189453125, 5.46142578125, 5.8309326171875, 6.200439453125, 6.5699462890625, 6.939453125, 7.3089599609375, 7.678466796875, 8.0479736328125, 8.41748046875, 8.7869873046875, 9.156494140625, 9.5260009765625, 9.8955078125, 10.2650146484375, 10.634521484375, 11.0040283203125, 11.37353515625, 11.7430419921875, 12.112548828125, 12.4820556640625, 12.8515625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 7.0, 10.0, 14.0, 15.0, 15.0, 31.0, 26.0, 36.0, 30.0, 33.0, 59.0, 53.0, 66.0, 52.0, 65.0, 59.0, 57.0, 50.0, 50.0, 43.0, 41.0, 35.0, 28.0, 22.0, 16.0, 9.0, 12.0, 6.0, 9.0, 13.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1015625, -3.9578857421875, -3.814208984375, -3.6705322265625, -3.52685546875, -3.3831787109375, -3.239501953125, -3.0958251953125, -2.9521484375, -2.8084716796875, -2.664794921875, -2.5211181640625, -2.37744140625, -2.2337646484375, -2.090087890625, -1.9464111328125, -1.802734375, -1.6590576171875, -1.515380859375, -1.3717041015625, -1.22802734375, -1.0843505859375, -0.940673828125, -0.7969970703125, -0.6533203125, -0.5096435546875, -0.365966796875, -0.2222900390625, -0.07861328125, 0.0650634765625, 0.208740234375, 0.3524169921875, 0.49609375, 0.6397705078125, 0.783447265625, 0.9271240234375, 1.07080078125, 1.2144775390625, 1.358154296875, 1.5018310546875, 1.6455078125, 1.7891845703125, 1.932861328125, 2.0765380859375, 2.22021484375, 2.3638916015625, 2.507568359375, 2.6512451171875, 2.794921875, 2.9385986328125, 3.082275390625, 3.2259521484375, 3.36962890625, 3.5133056640625, 3.656982421875, 3.8006591796875, 3.9443359375, 4.0880126953125, 4.231689453125, 4.3753662109375, 4.51904296875, 4.6627197265625, 4.806396484375, 4.9500732421875, 5.09375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 8.0, 7.0, 13.0, 22.0, 27.0, 28.0, 39.0, 55.0, 72.0, 79.0, 81.0, 96.0, 92.0, 76.0, 73.0, 49.0, 43.0, 32.0, 29.0, 18.0, 11.0, 10.0, 7.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-25.841167449951172, -25.240509033203125, -24.639850616455078, -24.03919219970703, -23.438533782958984, -22.837873458862305, -22.237215042114258, -21.63655662536621, -21.035898208618164, -20.435239791870117, -19.83458137512207, -19.233922958374023, -18.633262634277344, -18.032604217529297, -17.43194580078125, -16.831287384033203, -16.230628967285156, -15.62997055053711, -15.029312133789062, -14.4286527633667, -13.827994346618652, -13.227335929870605, -12.626676559448242, -12.026018142700195, -11.425359725952148, -10.824701309204102, -10.224042892456055, -9.623383522033691, -9.022725105285645, -8.422066688537598, -7.821407794952393, -7.2207489013671875, -6.620092391967773, -6.019433975219727, -5.4187750816345215, -4.818116188049316, -4.2174577713012695, -3.6167991161346436, -3.0161404609680176, -2.4154815673828125, -1.8148231506347656, -1.2141644954681396, -0.6135058403015137, -0.012847185134887695, 0.5878114700317383, 1.1884701251983643, 1.7891287803649902, 2.3897876739501953, 2.990446090698242, 3.591104745864868, 4.191763401031494, 4.792422294616699, 5.393080711364746, 5.993739128112793, 6.594398021697998, 7.195056915283203, 7.79571533203125, 8.396373748779297, 8.997032165527344, 9.597691535949707, 10.198349952697754, 10.7990083694458, 11.399667739868164, 12.000326156616211, 12.600984573364258]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 12.0, 12.0, 17.0, 19.0, 25.0, 24.0, 37.0, 37.0, 36.0, 36.0, 54.0, 46.0, 52.0, 54.0, 43.0, 53.0, 47.0, 37.0, 47.0, 41.0, 35.0, 32.0, 28.0, 30.0, 28.0, 17.0, 20.0, 13.0, 7.0, 14.0, 6.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.295372009277344, -9.920835494995117, -9.546298027038574, -9.171761512756348, -8.797224044799805, -8.422687530517578, -8.048151016235352, -7.673613548278809, -7.299076557159424, -6.924539566040039, -6.550002574920654, -6.1754655838012695, -5.800929069519043, -5.4263916015625, -5.051855087280273, -4.677318096160889, -4.302781105041504, -3.928244113922119, -3.5537071228027344, -3.1791703701019287, -2.804633378982544, -2.430096387863159, -2.0555596351623535, -1.6810226440429688, -1.306485652923584, -0.931948721408844, -0.557411789894104, -0.1828749179840088, 0.19166207313537598, 0.5661990642547607, 0.9407358169555664, 1.3152728080749512, 1.6898088455200195, 2.0643458366394043, 2.438882827758789, 2.8134195804595947, 3.1879565715789795, 3.5624935626983643, 3.93703031539917, 4.311567306518555, 4.6861042976379395, 5.060641288757324, 5.435178279876709, 5.809715270996094, 6.18425178527832, 6.558789253234863, 6.93332576751709, 7.307862758636475, 7.682399749755859, 8.056936264038086, 8.431473731994629, 8.806010246276855, 9.180547714233398, 9.555084228515625, 9.929620742797852, 10.304158210754395, 10.678695678710938, 11.053232192993164, 11.427769660949707, 11.802306175231934, 12.176843643188477, 12.551380157470703, 12.92591667175293, 13.300454139709473, 13.6749906539917]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 17.0, 32.0, 42.0, 61.0, 121.0, 171.0, 281.0, 432.0, 693.0, 1089.0, 1863.0, 2904.0, 4685.0, 8345.0, 15506.0, 31468.0, 73631.0, 198259.0, 585573.0, 1322488.0, 1198663.0, 470127.0, 156635.0, 59323.0, 27081.0, 13832.0, 7924.0, 4823.0, 2886.0, 1807.0, 1243.0, 733.0, 519.0, 349.0, 203.0, 137.0, 107.0, 61.0, 37.0, 26.0, 26.0, 12.0, 24.0, 8.0, 6.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.625, -12.1376953125, -11.650390625, -11.1630859375, -10.67578125, -10.1884765625, -9.701171875, -9.2138671875, -8.7265625, -8.2392578125, -7.751953125, -7.2646484375, -6.77734375, -6.2900390625, -5.802734375, -5.3154296875, -4.828125, -4.3408203125, -3.853515625, -3.3662109375, -2.87890625, -2.3916015625, -1.904296875, -1.4169921875, -0.9296875, -0.4423828125, 0.044921875, 0.5322265625, 1.01953125, 1.5068359375, 1.994140625, 2.4814453125, 2.96875, 3.4560546875, 3.943359375, 4.4306640625, 4.91796875, 5.4052734375, 5.892578125, 6.3798828125, 6.8671875, 7.3544921875, 7.841796875, 8.3291015625, 8.81640625, 9.3037109375, 9.791015625, 10.2783203125, 10.765625, 11.2529296875, 11.740234375, 12.2275390625, 12.71484375, 13.2021484375, 13.689453125, 14.1767578125, 14.6640625, 15.1513671875, 15.638671875, 16.1259765625, 16.61328125, 17.1005859375, 17.587890625, 18.0751953125, 18.5625]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 12.0, 26.0, 9.0, 21.0, 20.0, 19.0, 20.0, 38.0, 37.0, 41.0, 44.0, 47.0, 43.0, 55.0, 46.0, 59.0, 43.0, 44.0, 46.0, 34.0, 45.0, 34.0, 43.0, 30.0, 27.0, 19.0, 18.0, 16.0, 11.0, 12.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.60546875, -6.37115478515625, -6.1368408203125, -5.90252685546875, -5.668212890625, -5.43389892578125, -5.1995849609375, -4.96527099609375, -4.73095703125, -4.49664306640625, -4.2623291015625, -4.02801513671875, -3.793701171875, -3.55938720703125, -3.3250732421875, -3.09075927734375, -2.8564453125, -2.62213134765625, -2.3878173828125, -2.15350341796875, -1.919189453125, -1.68487548828125, -1.4505615234375, -1.21624755859375, -0.98193359375, -0.74761962890625, -0.5133056640625, -0.27899169921875, -0.044677734375, 0.18963623046875, 0.4239501953125, 0.65826416015625, 0.892578125, 1.12689208984375, 1.3612060546875, 1.59552001953125, 1.829833984375, 2.06414794921875, 2.2984619140625, 2.53277587890625, 2.76708984375, 3.00140380859375, 3.2357177734375, 3.47003173828125, 3.704345703125, 3.93865966796875, 4.1729736328125, 4.40728759765625, 4.6416015625, 4.87591552734375, 5.1102294921875, 5.34454345703125, 5.578857421875, 5.81317138671875, 6.0474853515625, 6.28179931640625, 6.51611328125, 6.75042724609375, 6.9847412109375, 7.21905517578125, 7.453369140625, 7.68768310546875, 7.9219970703125, 8.15631103515625, 8.390625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 13.0, 12.0, 25.0, 28.0, 45.0, 59.0, 81.0, 121.0, 164.0, 220.0, 278.0, 436.0, 664.0, 920.0, 1384.0, 2090.0, 3160.0, 5056.0, 8349.0, 14509.0, 26638.0, 53499.0, 120344.0, 300798.0, 739296.0, 1237663.0, 949442.0, 416959.0, 163327.0, 69959.0, 33600.0, 17791.0, 10161.0, 6001.0, 3693.0, 2398.0, 1599.0, 1096.0, 696.0, 501.0, 352.0, 236.0, 157.0, 125.0, 82.0, 60.0, 51.0, 29.0, 29.0, 15.0, 13.0, 9.0, 14.0, 5.0, 2.0, 3.0, 5.0], "bins": [-13.8359375, -13.4124755859375, -12.989013671875, -12.5655517578125, -12.14208984375, -11.7186279296875, -11.295166015625, -10.8717041015625, -10.4482421875, -10.0247802734375, -9.601318359375, -9.1778564453125, -8.75439453125, -8.3309326171875, -7.907470703125, -7.4840087890625, -7.060546875, -6.6370849609375, -6.213623046875, -5.7901611328125, -5.36669921875, -4.9432373046875, -4.519775390625, -4.0963134765625, -3.6728515625, -3.2493896484375, -2.825927734375, -2.4024658203125, -1.97900390625, -1.5555419921875, -1.132080078125, -0.7086181640625, -0.28515625, 0.1383056640625, 0.561767578125, 0.9852294921875, 1.40869140625, 1.8321533203125, 2.255615234375, 2.6790771484375, 3.1025390625, 3.5260009765625, 3.949462890625, 4.3729248046875, 4.79638671875, 5.2198486328125, 5.643310546875, 6.0667724609375, 6.490234375, 6.9136962890625, 7.337158203125, 7.7606201171875, 8.18408203125, 8.6075439453125, 9.031005859375, 9.4544677734375, 9.8779296875, 10.3013916015625, 10.724853515625, 11.1483154296875, 11.57177734375, 11.9952392578125, 12.418701171875, 12.8421630859375, 13.265625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 5.0, 2.0, 1.0, 5.0, 7.0, 12.0, 9.0, 13.0, 17.0, 19.0, 39.0, 44.0, 38.0, 44.0, 63.0, 78.0, 91.0, 119.0, 164.0, 179.0, 219.0, 224.0, 292.0, 300.0, 322.0, 308.0, 284.0, 242.0, 231.0, 168.0, 123.0, 102.0, 76.0, 55.0, 43.0, 35.0, 29.0, 22.0, 13.0, 12.0, 6.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.97265625, -3.848297119140625, -3.72393798828125, -3.599578857421875, -3.4752197265625, -3.350860595703125, -3.22650146484375, -3.102142333984375, -2.977783203125, -2.853424072265625, -2.72906494140625, -2.604705810546875, -2.4803466796875, -2.355987548828125, -2.23162841796875, -2.107269287109375, -1.98291015625, -1.858551025390625, -1.73419189453125, -1.609832763671875, -1.4854736328125, -1.361114501953125, -1.23675537109375, -1.112396240234375, -0.988037109375, -0.863677978515625, -0.73931884765625, -0.614959716796875, -0.4906005859375, -0.366241455078125, -0.24188232421875, -0.117523193359375, 0.0068359375, 0.131195068359375, 0.25555419921875, 0.379913330078125, 0.5042724609375, 0.628631591796875, 0.75299072265625, 0.877349853515625, 1.001708984375, 1.126068115234375, 1.25042724609375, 1.374786376953125, 1.4991455078125, 1.623504638671875, 1.74786376953125, 1.872222900390625, 1.99658203125, 2.120941162109375, 2.24530029296875, 2.369659423828125, 2.4940185546875, 2.618377685546875, 2.74273681640625, 2.867095947265625, 2.991455078125, 3.115814208984375, 3.24017333984375, 3.364532470703125, 3.4888916015625, 3.613250732421875, 3.73760986328125, 3.861968994140625, 3.986328125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 2.0, 5.0, 4.0, 8.0, 16.0, 21.0, 28.0, 24.0, 29.0, 38.0, 60.0, 95.0, 79.0, 95.0, 94.0, 81.0, 66.0, 62.0, 50.0, 38.0, 24.0, 17.0, 15.0, 14.0, 8.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.773818969726562, -19.277854919433594, -18.781892776489258, -18.28592872619629, -17.789966583251953, -17.294002532958984, -16.798038482666016, -16.30207633972168, -15.806112289428711, -15.310149192810059, -14.814186096191406, -14.318222045898438, -13.822258949279785, -13.326295852661133, -12.830331802368164, -12.334368705749512, -11.83840560913086, -11.342442512512207, -10.846479415893555, -10.350515365600586, -9.854552268981934, -9.358589172363281, -8.862625122070312, -8.36666202545166, -7.870698928833008, -7.3747358322143555, -6.878772258758545, -6.382808685302734, -5.886845588684082, -5.39088249206543, -4.894918918609619, -4.398955345153809, -3.90299129486084, -3.4070279598236084, -2.911064624786377, -2.4151012897491455, -1.919137954711914, -1.4231746196746826, -0.9272112846374512, -0.4312479496002197, 0.06471538543701172, 0.5606787204742432, 1.0566420555114746, 1.552605390548706, 2.0485687255859375, 2.544532060623169, 3.0404953956604004, 3.536458730697632, 4.032422065734863, 4.528385162353516, 5.024348735809326, 5.520312309265137, 6.016275405883789, 6.512238502502441, 7.008202075958252, 7.5041656494140625, 8.000128746032715, 8.496091842651367, 8.992055892944336, 9.488018989562988, 9.98398208618164, 10.479945182800293, 10.975908279418945, 11.471872329711914, 11.967835426330566]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 3.0, 5.0, 11.0, 12.0, 14.0, 10.0, 28.0, 22.0, 23.0, 36.0, 32.0, 47.0, 37.0, 39.0, 59.0, 39.0, 50.0, 55.0, 35.0, 52.0, 50.0, 45.0, 43.0, 39.0, 31.0, 36.0, 26.0, 24.0, 23.0, 13.0, 15.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.06433391571045, -7.751862525939941, -7.439391136169434, -7.126920223236084, -6.814448833465576, -6.501977443695068, -6.189506530761719, -5.877035140991211, -5.564563751220703, -5.252092361450195, -4.9396209716796875, -4.627150058746338, -4.31467866897583, -4.002207279205322, -3.6897361278533936, -3.377264976501465, -3.064793586730957, -2.752322196960449, -2.4398510456085205, -2.127379894256592, -1.814908504486084, -1.5024372339248657, -1.1899659633636475, -0.8774948120117188, -0.5650234222412109, -0.2525521516799927, 0.059919118881225586, 0.37239038944244385, 0.6848616600036621, 0.9973329305648804, 1.3098042011260986, 1.6222753524780273, 1.9347476959228516, 2.2472190856933594, 2.559690237045288, 2.872161388397217, 3.1846327781677246, 3.4971041679382324, 3.809575319290161, 4.12204647064209, 4.434517860412598, 4.7469892501831055, 5.059460639953613, 5.371931552886963, 5.684402942657471, 5.9968743324279785, 6.309345245361328, 6.621816635131836, 6.934288024902344, 7.246759414672852, 7.559230804443359, 7.871701717376709, 8.184173583984375, 8.496644020080566, 8.809115409851074, 9.121586799621582, 9.43405818939209, 9.746529579162598, 10.059000968933105, 10.371472358703613, 10.683942794799805, 10.996414184570312, 11.30888557434082, 11.621356964111328, 11.933828353881836]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 6.0, 7.0, 6.0, 12.0, 22.0, 37.0, 56.0, 82.0, 165.0, 275.0, 466.0, 859.0, 1379.0, 2560.0, 4849.0, 9978.0, 20139.0, 42353.0, 89061.0, 173141.0, 250691.0, 215615.0, 121925.0, 58782.0, 27933.0, 13622.0, 6626.0, 3481.0, 1910.0, 1078.0, 579.0, 337.0, 213.0, 118.0, 63.0, 36.0, 27.0, 26.0, 14.0, 14.0, 5.0, 4.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.26171875, -6.0643310546875, -5.866943359375, -5.6695556640625, -5.47216796875, -5.2747802734375, -5.077392578125, -4.8800048828125, -4.6826171875, -4.4852294921875, -4.287841796875, -4.0904541015625, -3.89306640625, -3.6956787109375, -3.498291015625, -3.3009033203125, -3.103515625, -2.9061279296875, -2.708740234375, -2.5113525390625, -2.31396484375, -2.1165771484375, -1.919189453125, -1.7218017578125, -1.5244140625, -1.3270263671875, -1.129638671875, -0.9322509765625, -0.73486328125, -0.5374755859375, -0.340087890625, -0.1427001953125, 0.0546875, 0.2520751953125, 0.449462890625, 0.6468505859375, 0.84423828125, 1.0416259765625, 1.239013671875, 1.4364013671875, 1.6337890625, 1.8311767578125, 2.028564453125, 2.2259521484375, 2.42333984375, 2.6207275390625, 2.818115234375, 3.0155029296875, 3.212890625, 3.4102783203125, 3.607666015625, 3.8050537109375, 4.00244140625, 4.1998291015625, 4.397216796875, 4.5946044921875, 4.7919921875, 4.9893798828125, 5.186767578125, 5.3841552734375, 5.58154296875, 5.7789306640625, 5.976318359375, 6.1737060546875, 6.37109375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 6.0, 8.0, 10.0, 8.0, 13.0, 22.0, 17.0, 23.0, 21.0, 25.0, 29.0, 47.0, 44.0, 54.0, 38.0, 54.0, 54.0, 42.0, 57.0, 46.0, 60.0, 41.0, 40.0, 34.0, 38.0, 27.0, 29.0, 20.0, 21.0, 26.0, 12.0, 7.0, 5.0, 4.0, 5.0, 2.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.578125, -8.2431640625, -7.908203125, -7.5732421875, -7.23828125, -6.9033203125, -6.568359375, -6.2333984375, -5.8984375, -5.5634765625, -5.228515625, -4.8935546875, -4.55859375, -4.2236328125, -3.888671875, -3.5537109375, -3.21875, -2.8837890625, -2.548828125, -2.2138671875, -1.87890625, -1.5439453125, -1.208984375, -0.8740234375, -0.5390625, -0.2041015625, 0.130859375, 0.4658203125, 0.80078125, 1.1357421875, 1.470703125, 1.8056640625, 2.140625, 2.4755859375, 2.810546875, 3.1455078125, 3.48046875, 3.8154296875, 4.150390625, 4.4853515625, 4.8203125, 5.1552734375, 5.490234375, 5.8251953125, 6.16015625, 6.4951171875, 6.830078125, 7.1650390625, 7.5, 7.8349609375, 8.169921875, 8.5048828125, 8.83984375, 9.1748046875, 9.509765625, 9.8447265625, 10.1796875, 10.5146484375, 10.849609375, 11.1845703125, 11.51953125, 11.8544921875, 12.189453125, 12.5244140625, 12.859375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 12.0, 17.0, 25.0, 38.0, 51.0, 78.0, 129.0, 180.0, 284.0, 433.0, 710.0, 1117.0, 1830.0, 2931.0, 5138.0, 8590.0, 15624.0, 29895.0, 57690.0, 114596.0, 206387.0, 249978.0, 167959.0, 87880.0, 44559.0, 22858.0, 12448.0, 6851.0, 3930.0, 2296.0, 1487.0, 917.0, 515.0, 346.0, 258.0, 164.0, 105.0, 84.0, 54.0, 23.0, 21.0, 19.0, 11.0, 14.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.23046875, -6.04339599609375, -5.8563232421875, -5.66925048828125, -5.482177734375, -5.29510498046875, -5.1080322265625, -4.92095947265625, -4.73388671875, -4.54681396484375, -4.3597412109375, -4.17266845703125, -3.985595703125, -3.79852294921875, -3.6114501953125, -3.42437744140625, -3.2373046875, -3.05023193359375, -2.8631591796875, -2.67608642578125, -2.489013671875, -2.30194091796875, -2.1148681640625, -1.92779541015625, -1.74072265625, -1.55364990234375, -1.3665771484375, -1.17950439453125, -0.992431640625, -0.80535888671875, -0.6182861328125, -0.43121337890625, -0.244140625, -0.05706787109375, 0.1300048828125, 0.31707763671875, 0.504150390625, 0.69122314453125, 0.8782958984375, 1.06536865234375, 1.25244140625, 1.43951416015625, 1.6265869140625, 1.81365966796875, 2.000732421875, 2.18780517578125, 2.3748779296875, 2.56195068359375, 2.7490234375, 2.93609619140625, 3.1231689453125, 3.31024169921875, 3.497314453125, 3.68438720703125, 3.8714599609375, 4.05853271484375, 4.24560546875, 4.43267822265625, 4.6197509765625, 4.80682373046875, 4.993896484375, 5.18096923828125, 5.3680419921875, 5.55511474609375, 5.7421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 6.0, 7.0, 12.0, 15.0, 12.0, 17.0, 11.0, 23.0, 13.0, 19.0, 24.0, 40.0, 37.0, 37.0, 24.0, 52.0, 53.0, 41.0, 46.0, 38.0, 38.0, 50.0, 36.0, 28.0, 30.0, 35.0, 39.0, 28.0, 21.0, 31.0, 18.0, 17.0, 14.0, 12.0, 16.0, 15.0, 12.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.328125, -5.1619873046875, -4.995849609375, -4.8297119140625, -4.66357421875, -4.4974365234375, -4.331298828125, -4.1651611328125, -3.9990234375, -3.8328857421875, -3.666748046875, -3.5006103515625, -3.33447265625, -3.1683349609375, -3.002197265625, -2.8360595703125, -2.669921875, -2.5037841796875, -2.337646484375, -2.1715087890625, -2.00537109375, -1.8392333984375, -1.673095703125, -1.5069580078125, -1.3408203125, -1.1746826171875, -1.008544921875, -0.8424072265625, -0.67626953125, -0.5101318359375, -0.343994140625, -0.1778564453125, -0.01171875, 0.1544189453125, 0.320556640625, 0.4866943359375, 0.65283203125, 0.8189697265625, 0.985107421875, 1.1512451171875, 1.3173828125, 1.4835205078125, 1.649658203125, 1.8157958984375, 1.98193359375, 2.1480712890625, 2.314208984375, 2.4803466796875, 2.646484375, 2.8126220703125, 2.978759765625, 3.1448974609375, 3.31103515625, 3.4771728515625, 3.643310546875, 3.8094482421875, 3.9755859375, 4.1417236328125, 4.307861328125, 4.4739990234375, 4.64013671875, 4.8062744140625, 4.972412109375, 5.1385498046875, 5.3046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 8.0, 7.0, 12.0, 16.0, 31.0, 50.0, 72.0, 112.0, 167.0, 245.0, 394.0, 487.0, 770.0, 1156.0, 1839.0, 2797.0, 4496.0, 7144.0, 11698.0, 19852.0, 34367.0, 61421.0, 109790.0, 187446.0, 229966.0, 160415.0, 90937.0, 50373.0, 28657.0, 16728.0, 10045.0, 6201.0, 3890.0, 2357.0, 1528.0, 1042.0, 633.0, 445.0, 325.0, 191.0, 136.0, 97.0, 66.0, 50.0, 39.0, 20.0, 14.0, 11.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-2.708984375, -2.625213623046875, -2.54144287109375, -2.457672119140625, -2.3739013671875, -2.290130615234375, -2.20635986328125, -2.122589111328125, -2.038818359375, -1.955047607421875, -1.87127685546875, -1.787506103515625, -1.7037353515625, -1.619964599609375, -1.53619384765625, -1.452423095703125, -1.36865234375, -1.284881591796875, -1.20111083984375, -1.117340087890625, -1.0335693359375, -0.949798583984375, -0.86602783203125, -0.782257080078125, -0.698486328125, -0.614715576171875, -0.53094482421875, -0.447174072265625, -0.3634033203125, -0.279632568359375, -0.19586181640625, -0.112091064453125, -0.0283203125, 0.055450439453125, 0.13922119140625, 0.222991943359375, 0.3067626953125, 0.390533447265625, 0.47430419921875, 0.558074951171875, 0.641845703125, 0.725616455078125, 0.80938720703125, 0.893157958984375, 0.9769287109375, 1.060699462890625, 1.14447021484375, 1.228240966796875, 1.31201171875, 1.395782470703125, 1.47955322265625, 1.563323974609375, 1.6470947265625, 1.730865478515625, 1.81463623046875, 1.898406982421875, 1.982177734375, 2.065948486328125, 2.14971923828125, 2.233489990234375, 2.3172607421875, 2.401031494140625, 2.48480224609375, 2.568572998046875, 2.65234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 1.0, 5.0, 8.0, 17.0, 20.0, 26.0, 32.0, 26.0, 32.0, 44.0, 58.0, 52.0, 76.0, 72.0, 77.0, 73.0, 77.0, 70.0, 51.0, 47.0, 27.0, 26.0, 23.0, 13.0, 12.0, 9.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013399124145507812, -0.00012907013297080994, -0.00012414902448654175, -0.00011922791600227356, -0.00011430680751800537, -0.00010938569903373718, -0.000104464590549469, -9.95434820652008e-05, -9.462237358093262e-05, -8.970126509666443e-05, -8.478015661239624e-05, -7.985904812812805e-05, -7.493793964385986e-05, -7.001683115959167e-05, -6.509572267532349e-05, -6.01746141910553e-05, -5.525350570678711e-05, -5.033239722251892e-05, -4.541128873825073e-05, -4.0490180253982544e-05, -3.5569071769714355e-05, -3.064796328544617e-05, -2.572685480117798e-05, -2.080574631690979e-05, -1.58846378326416e-05, -1.0963529348373413e-05, -6.042420864105225e-06, -1.1213123798370361e-06, 3.7997961044311523e-06, 8.72090458869934e-06, 1.364201307296753e-05, 1.8563121557235718e-05, 2.3484230041503906e-05, 2.8405338525772095e-05, 3.332644701004028e-05, 3.824755549430847e-05, 4.316866397857666e-05, 4.808977246284485e-05, 5.301088094711304e-05, 5.7931989431381226e-05, 6.285309791564941e-05, 6.77742063999176e-05, 7.269531488418579e-05, 7.761642336845398e-05, 8.253753185272217e-05, 8.745864033699036e-05, 9.237974882125854e-05, 9.730085730552673e-05, 0.00010222196578979492, 0.00010714307427406311, 0.0001120641827583313, 0.00011698529124259949, 0.00012190639972686768, 0.00012682750821113586, 0.00013174861669540405, 0.00013666972517967224, 0.00014159083366394043, 0.00014651194214820862, 0.0001514330506324768, 0.000156354159116745, 0.00016127526760101318, 0.00016619637608528137, 0.00017111748456954956, 0.00017603859305381775, 0.00018095970153808594]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 3.0, 6.0, 6.0, 8.0, 17.0, 20.0, 22.0, 46.0, 42.0, 61.0, 89.0, 124.0, 178.0, 255.0, 346.0, 489.0, 782.0, 1096.0, 1629.0, 2572.0, 4186.0, 7087.0, 11940.0, 21176.0, 38071.0, 69708.0, 125017.0, 193593.0, 211403.0, 154513.0, 89675.0, 48628.0, 27048.0, 15170.0, 8678.0, 5340.0, 3238.0, 2067.0, 1293.0, 887.0, 603.0, 403.0, 298.0, 211.0, 142.0, 102.0, 74.0, 63.0, 39.0, 32.0, 19.0, 26.0, 11.0, 9.0, 6.0, 7.0, 6.0, 1.0, 4.0, 2.0, 2.0], "bins": [-2.58984375, -2.506866455078125, -2.42388916015625, -2.340911865234375, -2.2579345703125, -2.174957275390625, -2.09197998046875, -2.009002685546875, -1.926025390625, -1.843048095703125, -1.76007080078125, -1.677093505859375, -1.5941162109375, -1.511138916015625, -1.42816162109375, -1.345184326171875, -1.26220703125, -1.179229736328125, -1.09625244140625, -1.013275146484375, -0.9302978515625, -0.847320556640625, -0.76434326171875, -0.681365966796875, -0.598388671875, -0.515411376953125, -0.43243408203125, -0.349456787109375, -0.2664794921875, -0.183502197265625, -0.10052490234375, -0.017547607421875, 0.0654296875, 0.148406982421875, 0.23138427734375, 0.314361572265625, 0.3973388671875, 0.480316162109375, 0.56329345703125, 0.646270751953125, 0.729248046875, 0.812225341796875, 0.89520263671875, 0.978179931640625, 1.0611572265625, 1.144134521484375, 1.22711181640625, 1.310089111328125, 1.39306640625, 1.476043701171875, 1.55902099609375, 1.641998291015625, 1.7249755859375, 1.807952880859375, 1.89093017578125, 1.973907470703125, 2.056884765625, 2.139862060546875, 2.22283935546875, 2.305816650390625, 2.3887939453125, 2.471771240234375, 2.55474853515625, 2.637725830078125, 2.720703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 6.0, 7.0, 7.0, 17.0, 16.0, 18.0, 28.0, 32.0, 46.0, 43.0, 49.0, 44.0, 50.0, 59.0, 70.0, 65.0, 70.0, 63.0, 48.0, 37.0, 36.0, 34.0, 27.0, 26.0, 18.0, 14.0, 11.0, 14.0, 5.0, 3.0, 3.0, 9.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.953125, -0.920989990234375, -0.88885498046875, -0.856719970703125, -0.8245849609375, -0.792449951171875, -0.76031494140625, -0.728179931640625, -0.696044921875, -0.663909912109375, -0.63177490234375, -0.599639892578125, -0.5675048828125, -0.535369873046875, -0.50323486328125, -0.471099853515625, -0.43896484375, -0.406829833984375, -0.37469482421875, -0.342559814453125, -0.3104248046875, -0.278289794921875, -0.24615478515625, -0.214019775390625, -0.181884765625, -0.149749755859375, -0.11761474609375, -0.085479736328125, -0.0533447265625, -0.021209716796875, 0.01092529296875, 0.043060302734375, 0.0751953125, 0.107330322265625, 0.13946533203125, 0.171600341796875, 0.2037353515625, 0.235870361328125, 0.26800537109375, 0.300140380859375, 0.332275390625, 0.364410400390625, 0.39654541015625, 0.428680419921875, 0.4608154296875, 0.492950439453125, 0.52508544921875, 0.557220458984375, 0.58935546875, 0.621490478515625, 0.65362548828125, 0.685760498046875, 0.7178955078125, 0.750030517578125, 0.78216552734375, 0.814300537109375, 0.846435546875, 0.878570556640625, 0.91070556640625, 0.942840576171875, 0.9749755859375, 1.007110595703125, 1.03924560546875, 1.071380615234375, 1.103515625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 3.0, 11.0, 15.0, 15.0, 29.0, 17.0, 34.0, 39.0, 53.0, 77.0, 76.0, 89.0, 84.0, 94.0, 73.0, 56.0, 49.0, 48.0, 32.0, 19.0, 17.0, 13.0, 18.0, 9.0, 7.0, 1.0, 6.0, 3.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.91670036315918, -18.446056365966797, -17.975412368774414, -17.504770278930664, -17.03412628173828, -16.5634822845459, -16.092838287353516, -15.62219524383545, -15.151552200317383, -14.680908203125, -14.210265159606934, -13.73962116241455, -13.268978118896484, -12.798334121704102, -12.327690124511719, -11.857047080993652, -11.38640308380127, -10.915759086608887, -10.44511604309082, -9.974472045898438, -9.503829002380371, -9.033185005187988, -8.562541961669922, -8.091897964477539, -7.6212544441223145, -7.15061092376709, -6.679967403411865, -6.209323883056641, -5.738679885864258, -5.268036842346191, -4.797392845153809, -4.326749324798584, -3.856106758117676, -3.385463237762451, -2.9148197174072266, -2.444175958633423, -1.9735324382781982, -1.5028889179229736, -1.03224515914917, -0.5616016387939453, -0.0909581184387207, 0.3796854615211487, 0.8503290414810181, 1.3209726810455322, 1.7916162014007568, 2.2622597217559814, 2.732903480529785, 3.2035470008850098, 3.6741905212402344, 4.144834041595459, 4.615477561950684, 5.086121559143066, 5.556764602661133, 6.027408599853516, 6.49805212020874, 6.968695640563965, 7.4393391609191895, 7.909982681274414, 8.380626678466797, 8.851269721984863, 9.321913719177246, 9.792556762695312, 10.263200759887695, 10.733844757080078, 11.204487800598145]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 9.0, 12.0, 11.0, 26.0, 14.0, 24.0, 33.0, 30.0, 42.0, 32.0, 41.0, 52.0, 52.0, 44.0, 42.0, 44.0, 42.0, 52.0, 51.0, 42.0, 42.0, 36.0, 31.0, 36.0, 19.0, 25.0, 19.0, 22.0, 12.0, 12.0, 14.0, 4.0, 5.0, 1.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.915238380432129, -7.616649150848389, -7.31805944442749, -7.01947021484375, -6.720880508422852, -6.422291278839111, -6.123702049255371, -5.825112342834473, -5.526523113250732, -5.227933883666992, -4.929344177246094, -4.6307549476623535, -4.332165718078613, -4.033576011657715, -3.7349867820739746, -3.4363973140716553, -3.137807846069336, -2.8392183780670166, -2.5406289100646973, -2.242039680480957, -1.9434502124786377, -1.6448607444763184, -1.3462713956832886, -1.0476820468902588, -0.7490925788879395, -0.4505031704902649, -0.15191376209259033, 0.14667564630508423, 0.4452650547027588, 0.7438545227050781, 1.042443871498108, 1.3410332202911377, 1.6396217346191406, 1.93821120262146, 2.2368006706237793, 2.5353899002075195, 2.833979368209839, 3.132568836212158, 3.4311580657958984, 3.7297475337982178, 4.028337001800537, 4.326926231384277, 4.625515937805176, 4.924105167388916, 5.222694396972656, 5.521284103393555, 5.819873332977295, 6.118462562561035, 6.417052268981934, 6.715641498565674, 7.014231204986572, 7.3128204345703125, 7.611410140991211, 7.909999370574951, 8.208588600158691, 8.50717830657959, 8.805767059326172, 9.10435676574707, 9.402945518493652, 9.70153522491455, 10.00012493133545, 10.298713684082031, 10.59730339050293, 10.895893096923828, 11.194482803344727]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 16.0, 17.0, 22.0, 39.0, 61.0, 77.0, 106.0, 168.0, 212.0, 339.0, 510.0, 822.0, 1365.0, 2355.0, 4180.0, 7801.0, 15534.0, 30372.0, 63036.0, 127715.0, 222245.0, 245273.0, 161568.0, 82468.0, 40066.0, 19482.0, 9901.0, 5306.0, 2975.0, 1685.0, 977.0, 636.0, 377.0, 284.0, 172.0, 112.0, 89.0, 53.0, 46.0, 22.0, 15.0, 9.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.34375, -13.9114990234375, -13.479248046875, -13.0469970703125, -12.61474609375, -12.1824951171875, -11.750244140625, -11.3179931640625, -10.8857421875, -10.4534912109375, -10.021240234375, -9.5889892578125, -9.15673828125, -8.7244873046875, -8.292236328125, -7.8599853515625, -7.427734375, -6.9954833984375, -6.563232421875, -6.1309814453125, -5.69873046875, -5.2664794921875, -4.834228515625, -4.4019775390625, -3.9697265625, -3.5374755859375, -3.105224609375, -2.6729736328125, -2.24072265625, -1.8084716796875, -1.376220703125, -0.9439697265625, -0.51171875, -0.0794677734375, 0.352783203125, 0.7850341796875, 1.21728515625, 1.6495361328125, 2.081787109375, 2.5140380859375, 2.9462890625, 3.3785400390625, 3.810791015625, 4.2430419921875, 4.67529296875, 5.1075439453125, 5.539794921875, 5.9720458984375, 6.404296875, 6.8365478515625, 7.268798828125, 7.7010498046875, 8.13330078125, 8.5655517578125, 8.997802734375, 9.4300537109375, 9.8623046875, 10.2945556640625, 10.726806640625, 11.1590576171875, 11.59130859375, 12.0235595703125, 12.455810546875, 12.8880615234375, 13.3203125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 4.0, 9.0, 13.0, 17.0, 21.0, 20.0, 22.0, 19.0, 26.0, 31.0, 38.0, 33.0, 39.0, 51.0, 38.0, 50.0, 38.0, 54.0, 44.0, 49.0, 46.0, 33.0, 44.0, 29.0, 25.0, 31.0, 35.0, 15.0, 20.0, 17.0, 15.0, 20.0, 8.0, 6.0, 8.0, 8.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.22882080078125, -6.9537353515625, -6.67864990234375, -6.403564453125, -6.12847900390625, -5.8533935546875, -5.57830810546875, -5.30322265625, -5.02813720703125, -4.7530517578125, -4.47796630859375, -4.202880859375, -3.92779541015625, -3.6527099609375, -3.37762451171875, -3.1025390625, -2.82745361328125, -2.5523681640625, -2.27728271484375, -2.002197265625, -1.72711181640625, -1.4520263671875, -1.17694091796875, -0.90185546875, -0.62677001953125, -0.3516845703125, -0.07659912109375, 0.198486328125, 0.47357177734375, 0.7486572265625, 1.02374267578125, 1.298828125, 1.57391357421875, 1.8489990234375, 2.12408447265625, 2.399169921875, 2.67425537109375, 2.9493408203125, 3.22442626953125, 3.49951171875, 3.77459716796875, 4.0496826171875, 4.32476806640625, 4.599853515625, 4.87493896484375, 5.1500244140625, 5.42510986328125, 5.7001953125, 5.97528076171875, 6.2503662109375, 6.52545166015625, 6.800537109375, 7.07562255859375, 7.3507080078125, 7.62579345703125, 7.90087890625, 8.17596435546875, 8.4510498046875, 8.72613525390625, 9.001220703125, 9.27630615234375, 9.5513916015625, 9.82647705078125, 10.1015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 16.0, 20.0, 24.0, 29.0, 49.0, 66.0, 110.0, 121.0, 207.0, 366.0, 572.0, 834.0, 1457.0, 2435.0, 4351.0, 7806.0, 14861.0, 30503.0, 65238.0, 136089.0, 235478.0, 248071.0, 153392.0, 74359.0, 34994.0, 17006.0, 8631.0, 4684.0, 2604.0, 1607.0, 956.0, 550.0, 382.0, 231.0, 129.0, 89.0, 72.0, 41.0, 30.0, 25.0, 20.0, 14.0, 6.0, 8.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-14.1484375, -13.7208251953125, -13.293212890625, -12.8656005859375, -12.43798828125, -12.0103759765625, -11.582763671875, -11.1551513671875, -10.7275390625, -10.2999267578125, -9.872314453125, -9.4447021484375, -9.01708984375, -8.5894775390625, -8.161865234375, -7.7342529296875, -7.306640625, -6.8790283203125, -6.451416015625, -6.0238037109375, -5.59619140625, -5.1685791015625, -4.740966796875, -4.3133544921875, -3.8857421875, -3.4581298828125, -3.030517578125, -2.6029052734375, -2.17529296875, -1.7476806640625, -1.320068359375, -0.8924560546875, -0.46484375, -0.0372314453125, 0.390380859375, 0.8179931640625, 1.24560546875, 1.6732177734375, 2.100830078125, 2.5284423828125, 2.9560546875, 3.3836669921875, 3.811279296875, 4.2388916015625, 4.66650390625, 5.0941162109375, 5.521728515625, 5.9493408203125, 6.376953125, 6.8045654296875, 7.232177734375, 7.6597900390625, 8.08740234375, 8.5150146484375, 8.942626953125, 9.3702392578125, 9.7978515625, 10.2254638671875, 10.653076171875, 11.0806884765625, 11.50830078125, 11.9359130859375, 12.363525390625, 12.7911376953125, 13.21875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 7.0, 7.0, 8.0, 13.0, 21.0, 18.0, 21.0, 32.0, 22.0, 38.0, 39.0, 41.0, 47.0, 40.0, 47.0, 61.0, 58.0, 46.0, 47.0, 46.0, 46.0, 41.0, 42.0, 40.0, 40.0, 23.0, 20.0, 17.0, 16.0, 8.0, 13.0, 9.0, 4.0, 9.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.76348876953125, -5.5543212890625, -5.34515380859375, -5.135986328125, -4.92681884765625, -4.7176513671875, -4.50848388671875, -4.29931640625, -4.09014892578125, -3.8809814453125, -3.67181396484375, -3.462646484375, -3.25347900390625, -3.0443115234375, -2.83514404296875, -2.6259765625, -2.41680908203125, -2.2076416015625, -1.99847412109375, -1.789306640625, -1.58013916015625, -1.3709716796875, -1.16180419921875, -0.95263671875, -0.74346923828125, -0.5343017578125, -0.32513427734375, -0.115966796875, 0.09320068359375, 0.3023681640625, 0.51153564453125, 0.720703125, 0.92987060546875, 1.1390380859375, 1.34820556640625, 1.557373046875, 1.76654052734375, 1.9757080078125, 2.18487548828125, 2.39404296875, 2.60321044921875, 2.8123779296875, 3.02154541015625, 3.230712890625, 3.43988037109375, 3.6490478515625, 3.85821533203125, 4.0673828125, 4.27655029296875, 4.4857177734375, 4.69488525390625, 4.904052734375, 5.11322021484375, 5.3223876953125, 5.53155517578125, 5.74072265625, 5.94989013671875, 6.1590576171875, 6.36822509765625, 6.577392578125, 6.78656005859375, 6.9957275390625, 7.20489501953125, 7.4140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 9.0, 15.0, 19.0, 20.0, 29.0, 52.0, 57.0, 93.0, 125.0, 206.0, 285.0, 381.0, 587.0, 823.0, 1340.0, 1933.0, 3023.0, 4672.0, 7564.0, 12540.0, 21208.0, 37520.0, 68896.0, 126420.0, 205030.0, 219139.0, 148047.0, 81190.0, 43976.0, 24822.0, 14380.0, 8794.0, 5252.0, 3437.0, 2204.0, 1408.0, 955.0, 636.0, 422.0, 329.0, 219.0, 150.0, 115.0, 68.0, 46.0, 47.0, 29.0, 14.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-8.3046875, -8.0379638671875, -7.771240234375, -7.5045166015625, -7.23779296875, -6.9710693359375, -6.704345703125, -6.4376220703125, -6.1708984375, -5.9041748046875, -5.637451171875, -5.3707275390625, -5.10400390625, -4.8372802734375, -4.570556640625, -4.3038330078125, -4.037109375, -3.7703857421875, -3.503662109375, -3.2369384765625, -2.97021484375, -2.7034912109375, -2.436767578125, -2.1700439453125, -1.9033203125, -1.6365966796875, -1.369873046875, -1.1031494140625, -0.83642578125, -0.5697021484375, -0.302978515625, -0.0362548828125, 0.23046875, 0.4971923828125, 0.763916015625, 1.0306396484375, 1.29736328125, 1.5640869140625, 1.830810546875, 2.0975341796875, 2.3642578125, 2.6309814453125, 2.897705078125, 3.1644287109375, 3.43115234375, 3.6978759765625, 3.964599609375, 4.2313232421875, 4.498046875, 4.7647705078125, 5.031494140625, 5.2982177734375, 5.56494140625, 5.8316650390625, 6.098388671875, 6.3651123046875, 6.6318359375, 6.8985595703125, 7.165283203125, 7.4320068359375, 7.69873046875, 7.9654541015625, 8.232177734375, 8.4989013671875, 8.765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 4.0, 7.0, 11.0, 8.0, 12.0, 18.0, 10.0, 32.0, 28.0, 67.0, 74.0, 84.0, 77.0, 105.0, 97.0, 76.0, 73.0, 68.0, 47.0, 31.0, 29.0, 13.0, 3.0, 7.0, 8.0, 2.0, 2.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013284683227539062, -0.001292213797569275, -0.0012559592723846436, -0.0012197047472000122, -0.0011834502220153809, -0.0011471956968307495, -0.0011109411716461182, -0.0010746866464614868, -0.0010384321212768555, -0.0010021775960922241, -0.0009659230709075928, -0.0009296685457229614, -0.0008934140205383301, -0.0008571594953536987, -0.0008209049701690674, -0.000784650444984436, -0.0007483959197998047, -0.0007121413946151733, -0.000675886869430542, -0.0006396323442459106, -0.0006033778190612793, -0.000567123293876648, -0.0005308687686920166, -0.0004946142435073853, -0.0004583597183227539, -0.00042210519313812256, -0.0003858506679534912, -0.00034959614276885986, -0.0003133416175842285, -0.00027708709239959717, -0.00024083256721496582, -0.00020457804203033447, -0.00016832351684570312, -0.00013206899166107178, -9.581446647644043e-05, -5.955994129180908e-05, -2.3305416107177734e-05, 1.2949109077453613e-05, 4.920363426208496e-05, 8.545815944671631e-05, 0.00012171268463134766, 0.000157967209815979, 0.00019422173500061035, 0.0002304762601852417, 0.00026673078536987305, 0.0003029853105545044, 0.00033923983573913574, 0.0003754943609237671, 0.00041174888610839844, 0.0004480034112930298, 0.00048425793647766113, 0.0005205124616622925, 0.0005567669868469238, 0.0005930215120315552, 0.0006292760372161865, 0.0006655305624008179, 0.0007017850875854492, 0.0007380396127700806, 0.0007742941379547119, 0.0008105486631393433, 0.0008468031883239746, 0.000883057713508606, 0.0009193122386932373, 0.0009555667638778687, 0.0009918212890625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 7.0, 5.0, 5.0, 10.0, 10.0, 18.0, 16.0, 37.0, 49.0, 63.0, 83.0, 115.0, 150.0, 231.0, 272.0, 404.0, 595.0, 887.0, 1265.0, 1804.0, 2687.0, 4326.0, 6681.0, 10943.0, 18730.0, 33817.0, 61366.0, 111070.0, 179707.0, 214825.0, 167832.0, 100293.0, 54776.0, 30140.0, 17298.0, 9919.0, 6269.0, 3803.0, 2497.0, 1667.0, 1161.0, 761.0, 584.0, 413.0, 283.0, 207.0, 138.0, 113.0, 78.0, 47.0, 39.0, 23.0, 20.0, 11.0, 6.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-7.28515625, -7.06036376953125, -6.8355712890625, -6.61077880859375, -6.385986328125, -6.16119384765625, -5.9364013671875, -5.71160888671875, -5.48681640625, -5.26202392578125, -5.0372314453125, -4.81243896484375, -4.587646484375, -4.36285400390625, -4.1380615234375, -3.91326904296875, -3.6884765625, -3.46368408203125, -3.2388916015625, -3.01409912109375, -2.789306640625, -2.56451416015625, -2.3397216796875, -2.11492919921875, -1.89013671875, -1.66534423828125, -1.4405517578125, -1.21575927734375, -0.990966796875, -0.76617431640625, -0.5413818359375, -0.31658935546875, -0.091796875, 0.13299560546875, 0.3577880859375, 0.58258056640625, 0.807373046875, 1.03216552734375, 1.2569580078125, 1.48175048828125, 1.70654296875, 1.93133544921875, 2.1561279296875, 2.38092041015625, 2.605712890625, 2.83050537109375, 3.0552978515625, 3.28009033203125, 3.5048828125, 3.72967529296875, 3.9544677734375, 4.17926025390625, 4.404052734375, 4.62884521484375, 4.8536376953125, 5.07843017578125, 5.30322265625, 5.52801513671875, 5.7528076171875, 5.97760009765625, 6.202392578125, 6.42718505859375, 6.6519775390625, 6.87677001953125, 7.1015625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 11.0, 7.0, 11.0, 12.0, 12.0, 19.0, 25.0, 36.0, 51.0, 50.0, 63.0, 75.0, 64.0, 78.0, 95.0, 83.0, 56.0, 44.0, 39.0, 26.0, 26.0, 23.0, 12.0, 21.0, 17.0, 7.0, 6.0, 9.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.0625, -3.94134521484375, -3.8201904296875, -3.69903564453125, -3.577880859375, -3.45672607421875, -3.3355712890625, -3.21441650390625, -3.09326171875, -2.97210693359375, -2.8509521484375, -2.72979736328125, -2.608642578125, -2.48748779296875, -2.3663330078125, -2.24517822265625, -2.1240234375, -2.00286865234375, -1.8817138671875, -1.76055908203125, -1.639404296875, -1.51824951171875, -1.3970947265625, -1.27593994140625, -1.15478515625, -1.03363037109375, -0.9124755859375, -0.79132080078125, -0.670166015625, -0.54901123046875, -0.4278564453125, -0.30670166015625, -0.185546875, -0.06439208984375, 0.0567626953125, 0.17791748046875, 0.299072265625, 0.42022705078125, 0.5413818359375, 0.66253662109375, 0.78369140625, 0.90484619140625, 1.0260009765625, 1.14715576171875, 1.268310546875, 1.38946533203125, 1.5106201171875, 1.63177490234375, 1.7529296875, 1.87408447265625, 1.9952392578125, 2.11639404296875, 2.237548828125, 2.35870361328125, 2.4798583984375, 2.60101318359375, 2.72216796875, 2.84332275390625, 2.9644775390625, 3.08563232421875, 3.206787109375, 3.32794189453125, 3.4490966796875, 3.57025146484375, 3.69140625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 10.0, 11.0, 11.0, 20.0, 32.0, 33.0, 37.0, 65.0, 69.0, 90.0, 89.0, 97.0, 88.0, 69.0, 65.0, 55.0, 40.0, 26.0, 23.0, 16.0, 17.0, 6.0, 2.0, 5.0, 3.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-21.103822708129883, -20.61128044128418, -20.118736267089844, -19.62619400024414, -19.133651733398438, -18.641109466552734, -18.1485652923584, -17.656023025512695, -17.163480758666992, -16.67093849182129, -16.178394317626953, -15.68585205078125, -15.193309783935547, -14.700766563415527, -14.208223342895508, -13.715681076049805, -13.223136901855469, -12.73059368133545, -12.238051414489746, -11.745508193969727, -11.252965927124023, -10.760422706604004, -10.267879486083984, -9.775337219238281, -9.282794952392578, -8.790251731872559, -8.297709465026855, -7.805166244506836, -7.312623500823975, -6.820080757141113, -6.327538013458252, -5.834995269775391, -5.342452049255371, -4.84990930557251, -4.357366561889648, -3.864823579788208, -3.3722805976867676, -2.8797378540039062, -2.387195110321045, -1.8946521282196045, -1.4021093845367432, -0.9095665216445923, -0.4170237183570862, 0.07551908493041992, 0.5680619478225708, 1.0606048107147217, 1.553147554397583, 2.0456905364990234, 2.5382332801818848, 3.030776023864746, 3.5233190059661865, 4.015861511230469, 4.508404731750488, 5.00094747543335, 5.493490219116211, 5.9860334396362305, 6.478575706481934, 6.971118450164795, 7.463661193847656, 7.956204414367676, 8.448746681213379, 8.941289901733398, 9.433832168579102, 9.926375389099121, 10.41891860961914]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 8.0, 7.0, 9.0, 12.0, 9.0, 29.0, 17.0, 42.0, 36.0, 29.0, 50.0, 42.0, 55.0, 51.0, 43.0, 60.0, 56.0, 52.0, 54.0, 46.0, 42.0, 42.0, 33.0, 33.0, 27.0, 25.0, 25.0, 19.0, 5.0, 14.0, 2.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.959763526916504, -7.626382827758789, -7.293002605438232, -6.959622383117676, -6.626241683959961, -6.292860984802246, -5.9594807624816895, -5.626100540161133, -5.292719841003418, -4.959339141845703, -4.6259589195251465, -4.29257869720459, -3.959197998046875, -3.6258175373077393, -3.2924370765686035, -2.9590566158294678, -2.625676155090332, -2.2922956943511963, -1.9589152336120605, -1.6255347728729248, -1.292154312133789, -0.9587738513946533, -0.6253933906555176, -0.29201292991638184, 0.041367530822753906, 0.37474799156188965, 0.7081284523010254, 1.0415089130401611, 1.3748893737792969, 1.7082698345184326, 2.0416502952575684, 2.375030755996704, 2.7084102630615234, 3.041790723800659, 3.375171184539795, 3.7085516452789307, 4.041932106018066, 4.375312805175781, 4.708693027496338, 5.0420732498168945, 5.375453948974609, 5.708834648132324, 6.042214870452881, 6.3755950927734375, 6.708975791931152, 7.042356491088867, 7.375736713409424, 7.7091169357299805, 8.042497634887695, 8.37587833404541, 8.709259033203125, 9.042638778686523, 9.376019477844238, 9.709400177001953, 10.042779922485352, 10.376160621643066, 10.709541320800781, 11.042922019958496, 11.376302719116211, 11.70968246459961, 12.043063163757324, 12.376443862915039, 12.709823608398438, 13.043204307556152, 13.376585006713867]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 17.0, 17.0, 27.0, 56.0, 96.0, 138.0, 233.0, 452.0, 793.0, 1408.0, 2541.0, 4609.0, 9246.0, 20977.0, 55162.0, 184988.0, 759341.0, 1785325.0, 1004664.0, 244679.0, 68288.0, 25350.0, 11690.0, 6073.0, 3291.0, 1918.0, 1096.0, 671.0, 390.0, 238.0, 163.0, 104.0, 82.0, 42.0, 32.0, 15.0, 20.0, 11.0, 17.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4609375, -12.9139404296875, -12.366943359375, -11.8199462890625, -11.27294921875, -10.7259521484375, -10.178955078125, -9.6319580078125, -9.0849609375, -8.5379638671875, -7.990966796875, -7.4439697265625, -6.89697265625, -6.3499755859375, -5.802978515625, -5.2559814453125, -4.708984375, -4.1619873046875, -3.614990234375, -3.0679931640625, -2.52099609375, -1.9739990234375, -1.427001953125, -0.8800048828125, -0.3330078125, 0.2139892578125, 0.760986328125, 1.3079833984375, 1.85498046875, 2.4019775390625, 2.948974609375, 3.4959716796875, 4.04296875, 4.5899658203125, 5.136962890625, 5.6839599609375, 6.23095703125, 6.7779541015625, 7.324951171875, 7.8719482421875, 8.4189453125, 8.9659423828125, 9.512939453125, 10.0599365234375, 10.60693359375, 11.1539306640625, 11.700927734375, 12.2479248046875, 12.794921875, 13.3419189453125, 13.888916015625, 14.4359130859375, 14.98291015625, 15.5299072265625, 16.076904296875, 16.6239013671875, 17.1708984375, 17.7178955078125, 18.264892578125, 18.8118896484375, 19.35888671875, 19.9058837890625, 20.452880859375, 20.9998779296875, 21.546875]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 2.0, 2.0, 7.0, 9.0, 9.0, 19.0, 11.0, 13.0, 14.0, 23.0, 39.0, 37.0, 24.0, 36.0, 50.0, 35.0, 59.0, 52.0, 46.0, 51.0, 57.0, 40.0, 53.0, 47.0, 48.0, 32.0, 23.0, 24.0, 25.0, 21.0, 21.0, 15.0, 21.0, 10.0, 9.0, 6.0, 3.0, 3.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.61785888671875, -5.4036865234375, -5.18951416015625, -4.975341796875, -4.76116943359375, -4.5469970703125, -4.33282470703125, -4.11865234375, -3.90447998046875, -3.6903076171875, -3.47613525390625, -3.261962890625, -3.04779052734375, -2.8336181640625, -2.61944580078125, -2.4052734375, -2.19110107421875, -1.9769287109375, -1.76275634765625, -1.548583984375, -1.33441162109375, -1.1202392578125, -0.90606689453125, -0.69189453125, -0.47772216796875, -0.2635498046875, -0.04937744140625, 0.164794921875, 0.37896728515625, 0.5931396484375, 0.80731201171875, 1.021484375, 1.23565673828125, 1.4498291015625, 1.66400146484375, 1.878173828125, 2.09234619140625, 2.3065185546875, 2.52069091796875, 2.73486328125, 2.94903564453125, 3.1632080078125, 3.37738037109375, 3.591552734375, 3.80572509765625, 4.0198974609375, 4.23406982421875, 4.4482421875, 4.66241455078125, 4.8765869140625, 5.09075927734375, 5.304931640625, 5.51910400390625, 5.7332763671875, 5.94744873046875, 6.16162109375, 6.37579345703125, 6.5899658203125, 6.80413818359375, 7.018310546875, 7.23248291015625, 7.4466552734375, 7.66082763671875, 7.875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 9.0, 13.0, 11.0, 21.0, 24.0, 42.0, 60.0, 91.0, 126.0, 225.0, 279.0, 423.0, 707.0, 1015.0, 1593.0, 2438.0, 4033.0, 6499.0, 11341.0, 20916.0, 42291.0, 98135.0, 264602.0, 750351.0, 1408421.0, 974687.0, 361524.0, 130288.0, 54245.0, 25694.0, 13824.0, 7870.0, 4606.0, 2857.0, 1691.0, 1153.0, 723.0, 463.0, 381.0, 190.0, 138.0, 93.0, 59.0, 42.0, 22.0, 30.0, 15.0, 5.0, 10.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9296875, -12.5078125, -12.0859375, -11.6640625, -11.2421875, -10.8203125, -10.3984375, -9.9765625, -9.5546875, -9.1328125, -8.7109375, -8.2890625, -7.8671875, -7.4453125, -7.0234375, -6.6015625, -6.1796875, -5.7578125, -5.3359375, -4.9140625, -4.4921875, -4.0703125, -3.6484375, -3.2265625, -2.8046875, -2.3828125, -1.9609375, -1.5390625, -1.1171875, -0.6953125, -0.2734375, 0.1484375, 0.5703125, 0.9921875, 1.4140625, 1.8359375, 2.2578125, 2.6796875, 3.1015625, 3.5234375, 3.9453125, 4.3671875, 4.7890625, 5.2109375, 5.6328125, 6.0546875, 6.4765625, 6.8984375, 7.3203125, 7.7421875, 8.1640625, 8.5859375, 9.0078125, 9.4296875, 9.8515625, 10.2734375, 10.6953125, 11.1171875, 11.5390625, 11.9609375, 12.3828125, 12.8046875, 13.2265625, 13.6484375, 14.0703125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 8.0, 13.0, 12.0, 13.0, 23.0, 28.0, 29.0, 35.0, 31.0, 69.0, 73.0, 91.0, 135.0, 183.0, 214.0, 258.0, 281.0, 342.0, 359.0, 327.0, 281.0, 285.0, 235.0, 198.0, 135.0, 98.0, 71.0, 53.0, 47.0, 33.0, 17.0, 24.0, 13.0, 9.0, 14.0, 6.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4158935546875, -3.296630859375, -3.1773681640625, -3.05810546875, -2.9388427734375, -2.819580078125, -2.7003173828125, -2.5810546875, -2.4617919921875, -2.342529296875, -2.2232666015625, -2.10400390625, -1.9847412109375, -1.865478515625, -1.7462158203125, -1.626953125, -1.5076904296875, -1.388427734375, -1.2691650390625, -1.14990234375, -1.0306396484375, -0.911376953125, -0.7921142578125, -0.6728515625, -0.5535888671875, -0.434326171875, -0.3150634765625, -0.19580078125, -0.0765380859375, 0.042724609375, 0.1619873046875, 0.28125, 0.4005126953125, 0.519775390625, 0.6390380859375, 0.75830078125, 0.8775634765625, 0.996826171875, 1.1160888671875, 1.2353515625, 1.3546142578125, 1.473876953125, 1.5931396484375, 1.71240234375, 1.8316650390625, 1.950927734375, 2.0701904296875, 2.189453125, 2.3087158203125, 2.427978515625, 2.5472412109375, 2.66650390625, 2.7857666015625, 2.905029296875, 3.0242919921875, 3.1435546875, 3.2628173828125, 3.382080078125, 3.5013427734375, 3.62060546875, 3.7398681640625, 3.859130859375, 3.9783935546875, 4.09765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 2.0, 7.0, 8.0, 7.0, 20.0, 15.0, 34.0, 37.0, 64.0, 76.0, 92.0, 100.0, 131.0, 108.0, 87.0, 52.0, 49.0, 33.0, 36.0, 14.0, 7.0, 5.0, 10.0, 2.0, 2.0, 8.0, 1.0, 2.0], "bins": [-27.16619300842285, -26.602209091186523, -26.038225173950195, -25.4742431640625, -24.910259246826172, -24.346275329589844, -23.782291412353516, -23.218307495117188, -22.65432357788086, -22.09033966064453, -21.526355743408203, -20.962371826171875, -20.39838981628418, -19.83440589904785, -19.270421981811523, -18.706438064575195, -18.1424560546875, -17.578472137451172, -17.014488220214844, -16.450504302978516, -15.886521339416504, -15.322538375854492, -14.758554458618164, -14.194570541381836, -13.630586624145508, -13.06660270690918, -12.502619743347168, -11.93863582611084, -11.374651908874512, -10.8106689453125, -10.246685028076172, -9.682701110839844, -9.118718147277832, -8.554734230041504, -7.990750789642334, -7.426767349243164, -6.862783432006836, -6.298799991607666, -5.734816551208496, -5.170832633972168, -4.606849193572998, -4.042865753173828, -3.4788818359375, -2.91489839553833, -2.350914716720581, -1.786931037902832, -1.222947597503662, -0.6589639186859131, -0.09498023986816406, 0.4690033793449402, 1.0329869985580444, 1.596970558166504, 2.160954236984253, 2.724937915802002, 3.288921356201172, 3.852905035018921, 4.41688871383667, 4.98087215423584, 5.544856071472168, 6.108839511871338, 6.672822952270508, 7.236806869506836, 7.800790309906006, 8.364773750305176, 8.928757667541504]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 2.0, 7.0, 12.0, 9.0, 23.0, 22.0, 12.0, 40.0, 38.0, 40.0, 43.0, 36.0, 38.0, 45.0, 43.0, 43.0, 46.0, 38.0, 54.0, 43.0, 42.0, 43.0, 37.0, 35.0, 36.0, 34.0, 22.0, 22.0, 21.0, 14.0, 13.0, 6.0, 9.0, 8.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.928322792053223, -6.660472393035889, -6.3926215171813965, -6.1247711181640625, -5.8569207191467285, -5.5890703201293945, -5.321219444274902, -5.053369045257568, -4.785518646240234, -4.5176682472229, -4.249817371368408, -3.981966972351074, -3.7141165733337402, -3.446265935897827, -3.178415298461914, -2.91056489944458, -2.642714023590088, -2.374863386154175, -2.107012987136841, -1.8391623497009277, -1.5713118314743042, -1.3034613132476807, -1.0356106758117676, -0.767760157585144, -0.4999096393585205, -0.23205909132957458, 0.03579145669937134, 0.30364203453063965, 0.5714925527572632, 0.8393430709838867, 1.1071937084197998, 1.3750442266464233, 1.6428947448730469, 1.9107452630996704, 2.178595781326294, 2.446446418762207, 2.714296817779541, 2.982147455215454, 3.249998092651367, 3.517848491668701, 3.7856991291046143, 4.053549766540527, 4.321400165557861, 4.589250564575195, 4.8571014404296875, 5.1249518394470215, 5.3928022384643555, 5.660653114318848, 5.928503513336182, 6.196353912353516, 6.464204788208008, 6.732055187225342, 6.999905586242676, 7.267756462097168, 7.535606861114502, 7.803457260131836, 8.071308135986328, 8.33915901184082, 8.607008934020996, 8.874859809875488, 9.14271068572998, 9.410560607910156, 9.678411483764648, 9.94626235961914, 10.214112281799316]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 3.0, 4.0, 4.0, 11.0, 11.0, 16.0, 24.0, 43.0, 51.0, 67.0, 95.0, 128.0, 247.0, 291.0, 502.0, 683.0, 1069.0, 1573.0, 2775.0, 4581.0, 8499.0, 16815.0, 34681.0, 76604.0, 164416.0, 268300.0, 233550.0, 122469.0, 55753.0, 25693.0, 12724.0, 6691.0, 3871.0, 2252.0, 1361.0, 856.0, 569.0, 388.0, 271.0, 210.0, 130.0, 76.0, 54.0, 55.0, 29.0, 20.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.671875, -6.46844482421875, -6.2650146484375, -6.06158447265625, -5.858154296875, -5.65472412109375, -5.4512939453125, -5.24786376953125, -5.04443359375, -4.84100341796875, -4.6375732421875, -4.43414306640625, -4.230712890625, -4.02728271484375, -3.8238525390625, -3.62042236328125, -3.4169921875, -3.21356201171875, -3.0101318359375, -2.80670166015625, -2.603271484375, -2.39984130859375, -2.1964111328125, -1.99298095703125, -1.78955078125, -1.58612060546875, -1.3826904296875, -1.17926025390625, -0.975830078125, -0.77239990234375, -0.5689697265625, -0.36553955078125, -0.162109375, 0.04132080078125, 0.2447509765625, 0.44818115234375, 0.651611328125, 0.85504150390625, 1.0584716796875, 1.26190185546875, 1.46533203125, 1.66876220703125, 1.8721923828125, 2.07562255859375, 2.279052734375, 2.48248291015625, 2.6859130859375, 2.88934326171875, 3.0927734375, 3.29620361328125, 3.4996337890625, 3.70306396484375, 3.906494140625, 4.10992431640625, 4.3133544921875, 4.51678466796875, 4.72021484375, 4.92364501953125, 5.1270751953125, 5.33050537109375, 5.533935546875, 5.73736572265625, 5.9407958984375, 6.14422607421875, 6.34765625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 5.0, 3.0, 4.0, 12.0, 14.0, 16.0, 30.0, 16.0, 27.0, 28.0, 33.0, 43.0, 28.0, 29.0, 55.0, 53.0, 37.0, 44.0, 49.0, 44.0, 43.0, 45.0, 35.0, 38.0, 24.0, 34.0, 28.0, 40.0, 25.0, 23.0, 17.0, 20.0, 10.0, 6.0, 7.0, 2.0, 8.0, 1.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.296875, -7.031982421875, -6.76708984375, -6.502197265625, -6.2373046875, -5.972412109375, -5.70751953125, -5.442626953125, -5.177734375, -4.912841796875, -4.64794921875, -4.383056640625, -4.1181640625, -3.853271484375, -3.58837890625, -3.323486328125, -3.05859375, -2.793701171875, -2.52880859375, -2.263916015625, -1.9990234375, -1.734130859375, -1.46923828125, -1.204345703125, -0.939453125, -0.674560546875, -0.40966796875, -0.144775390625, 0.1201171875, 0.385009765625, 0.64990234375, 0.914794921875, 1.1796875, 1.444580078125, 1.70947265625, 1.974365234375, 2.2392578125, 2.504150390625, 2.76904296875, 3.033935546875, 3.298828125, 3.563720703125, 3.82861328125, 4.093505859375, 4.3583984375, 4.623291015625, 4.88818359375, 5.153076171875, 5.41796875, 5.682861328125, 5.94775390625, 6.212646484375, 6.4775390625, 6.742431640625, 7.00732421875, 7.272216796875, 7.537109375, 7.802001953125, 8.06689453125, 8.331787109375, 8.5966796875, 8.861572265625, 9.12646484375, 9.391357421875, 9.65625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 11.0, 11.0, 23.0, 32.0, 39.0, 48.0, 65.0, 105.0, 141.0, 211.0, 330.0, 468.0, 797.0, 1249.0, 2088.0, 3933.0, 7563.0, 16684.0, 41342.0, 117416.0, 310971.0, 331507.0, 131268.0, 45780.0, 18216.0, 8173.0, 4146.0, 2296.0, 1289.0, 784.0, 477.0, 310.0, 230.0, 157.0, 100.0, 80.0, 60.0, 36.0, 38.0, 25.0, 20.0, 10.0, 9.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.165771484375, -7.89404296875, -7.622314453125, -7.3505859375, -7.078857421875, -6.80712890625, -6.535400390625, -6.263671875, -5.991943359375, -5.72021484375, -5.448486328125, -5.1767578125, -4.905029296875, -4.63330078125, -4.361572265625, -4.08984375, -3.818115234375, -3.54638671875, -3.274658203125, -3.0029296875, -2.731201171875, -2.45947265625, -2.187744140625, -1.916015625, -1.644287109375, -1.37255859375, -1.100830078125, -0.8291015625, -0.557373046875, -0.28564453125, -0.013916015625, 0.2578125, 0.529541015625, 0.80126953125, 1.072998046875, 1.3447265625, 1.616455078125, 1.88818359375, 2.159912109375, 2.431640625, 2.703369140625, 2.97509765625, 3.246826171875, 3.5185546875, 3.790283203125, 4.06201171875, 4.333740234375, 4.60546875, 4.877197265625, 5.14892578125, 5.420654296875, 5.6923828125, 5.964111328125, 6.23583984375, 6.507568359375, 6.779296875, 7.051025390625, 7.32275390625, 7.594482421875, 7.8662109375, 8.137939453125, 8.40966796875, 8.681396484375, 8.953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 5.0, 12.0, 14.0, 12.0, 17.0, 26.0, 26.0, 26.0, 29.0, 47.0, 27.0, 36.0, 31.0, 49.0, 38.0, 44.0, 47.0, 55.0, 40.0, 43.0, 49.0, 51.0, 30.0, 27.0, 33.0, 21.0, 21.0, 24.0, 22.0, 21.0, 11.0, 5.0, 13.0, 5.0, 4.0, 8.0, 3.0, 4.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.8880615234375, -4.733154296875, -4.5782470703125, -4.42333984375, -4.2684326171875, -4.113525390625, -3.9586181640625, -3.8037109375, -3.6488037109375, -3.493896484375, -3.3389892578125, -3.18408203125, -3.0291748046875, -2.874267578125, -2.7193603515625, -2.564453125, -2.4095458984375, -2.254638671875, -2.0997314453125, -1.94482421875, -1.7899169921875, -1.635009765625, -1.4801025390625, -1.3251953125, -1.1702880859375, -1.015380859375, -0.8604736328125, -0.70556640625, -0.5506591796875, -0.395751953125, -0.2408447265625, -0.0859375, 0.0689697265625, 0.223876953125, 0.3787841796875, 0.53369140625, 0.6885986328125, 0.843505859375, 0.9984130859375, 1.1533203125, 1.3082275390625, 1.463134765625, 1.6180419921875, 1.77294921875, 1.9278564453125, 2.082763671875, 2.2376708984375, 2.392578125, 2.5474853515625, 2.702392578125, 2.8572998046875, 3.01220703125, 3.1671142578125, 3.322021484375, 3.4769287109375, 3.6318359375, 3.7867431640625, 3.941650390625, 4.0965576171875, 4.25146484375, 4.4063720703125, 4.561279296875, 4.7161865234375, 4.87109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 7.0, 4.0, 10.0, 10.0, 15.0, 31.0, 34.0, 47.0, 65.0, 102.0, 145.0, 189.0, 299.0, 419.0, 556.0, 875.0, 1296.0, 1842.0, 2930.0, 4738.0, 8068.0, 13717.0, 24765.0, 46898.0, 92712.0, 184641.0, 271072.0, 188673.0, 95111.0, 47937.0, 25217.0, 14065.0, 8047.0, 4913.0, 3034.0, 1928.0, 1295.0, 869.0, 594.0, 414.0, 278.0, 189.0, 164.0, 99.0, 85.0, 52.0, 26.0, 29.0, 19.0, 16.0, 7.0, 7.0, 8.0, 3.0, 0.0, 2.0, 2.0], "bins": [-2.888671875, -2.802490234375, -2.71630859375, -2.630126953125, -2.5439453125, -2.457763671875, -2.37158203125, -2.285400390625, -2.19921875, -2.113037109375, -2.02685546875, -1.940673828125, -1.8544921875, -1.768310546875, -1.68212890625, -1.595947265625, -1.509765625, -1.423583984375, -1.33740234375, -1.251220703125, -1.1650390625, -1.078857421875, -0.99267578125, -0.906494140625, -0.8203125, -0.734130859375, -0.64794921875, -0.561767578125, -0.4755859375, -0.389404296875, -0.30322265625, -0.217041015625, -0.130859375, -0.044677734375, 0.04150390625, 0.127685546875, 0.2138671875, 0.300048828125, 0.38623046875, 0.472412109375, 0.55859375, 0.644775390625, 0.73095703125, 0.817138671875, 0.9033203125, 0.989501953125, 1.07568359375, 1.161865234375, 1.248046875, 1.334228515625, 1.42041015625, 1.506591796875, 1.5927734375, 1.678955078125, 1.76513671875, 1.851318359375, 1.9375, 2.023681640625, 2.10986328125, 2.196044921875, 2.2822265625, 2.368408203125, 2.45458984375, 2.540771484375, 2.626953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 6.0, 3.0, 9.0, 17.0, 17.0, 35.0, 50.0, 79.0, 109.0, 147.0, 135.0, 133.0, 78.0, 45.0, 37.0, 19.0, 21.0, 13.0, 10.0, 6.0, 7.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00033473968505859375, -0.00032637640833854675, -0.00031801313161849976, -0.00030964985489845276, -0.00030128657817840576, -0.00029292330145835876, -0.00028456002473831177, -0.00027619674801826477, -0.0002678334712982178, -0.0002594701945781708, -0.0002511069178581238, -0.00024274364113807678, -0.00023438036441802979, -0.0002260170876979828, -0.0002176538109779358, -0.0002092905342578888, -0.0002009272575378418, -0.0001925639808177948, -0.0001842007040977478, -0.0001758374273777008, -0.0001674741506576538, -0.0001591108739376068, -0.00015074759721755981, -0.00014238432049751282, -0.00013402104377746582, -0.00012565776705741882, -0.00011729449033737183, -0.00010893121361732483, -0.00010056793689727783, -9.220466017723083e-05, -8.384138345718384e-05, -7.547810673713684e-05, -6.711483001708984e-05, -5.875155329704285e-05, -5.038827657699585e-05, -4.202499985694885e-05, -3.3661723136901855e-05, -2.529844641685486e-05, -1.693516969680786e-05, -8.571892976760864e-06, -2.086162567138672e-07, 8.15466046333313e-06, 1.6517937183380127e-05, 2.4881213903427124e-05, 3.324449062347412e-05, 4.160776734352112e-05, 4.9971044063568115e-05, 5.833432078361511e-05, 6.669759750366211e-05, 7.50608742237091e-05, 8.34241509437561e-05, 9.17874276638031e-05, 0.0001001507043838501, 0.0001085139811038971, 0.00011687725782394409, 0.0001252405345439911, 0.00013360381126403809, 0.00014196708798408508, 0.00015033036470413208, 0.00015869364142417908, 0.00016705691814422607, 0.00017542019486427307, 0.00018378347158432007, 0.00019214674830436707, 0.00020051002502441406]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 8.0, 13.0, 19.0, 22.0, 28.0, 37.0, 55.0, 89.0, 134.0, 190.0, 257.0, 389.0, 636.0, 1064.0, 1683.0, 2857.0, 4840.0, 8473.0, 15461.0, 29517.0, 58471.0, 116942.0, 207675.0, 245904.0, 169182.0, 89026.0, 44298.0, 22551.0, 11964.0, 6690.0, 3979.0, 2253.0, 1355.0, 858.0, 550.0, 365.0, 219.0, 138.0, 109.0, 79.0, 51.0, 35.0, 23.0, 14.0, 10.0, 12.0, 9.0, 9.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.470367431640625, -2.38604736328125, -2.301727294921875, -2.2174072265625, -2.133087158203125, -2.04876708984375, -1.964447021484375, -1.880126953125, -1.795806884765625, -1.71148681640625, -1.627166748046875, -1.5428466796875, -1.458526611328125, -1.37420654296875, -1.289886474609375, -1.20556640625, -1.121246337890625, -1.03692626953125, -0.952606201171875, -0.8682861328125, -0.783966064453125, -0.69964599609375, -0.615325927734375, -0.531005859375, -0.446685791015625, -0.36236572265625, -0.278045654296875, -0.1937255859375, -0.109405517578125, -0.02508544921875, 0.059234619140625, 0.1435546875, 0.227874755859375, 0.31219482421875, 0.396514892578125, 0.4808349609375, 0.565155029296875, 0.64947509765625, 0.733795166015625, 0.818115234375, 0.902435302734375, 0.98675537109375, 1.071075439453125, 1.1553955078125, 1.239715576171875, 1.32403564453125, 1.408355712890625, 1.49267578125, 1.576995849609375, 1.66131591796875, 1.745635986328125, 1.8299560546875, 1.914276123046875, 1.99859619140625, 2.082916259765625, 2.167236328125, 2.251556396484375, 2.33587646484375, 2.420196533203125, 2.5045166015625, 2.588836669921875, 2.67315673828125, 2.757476806640625, 2.841796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 6.0, 4.0, 8.0, 11.0, 8.0, 13.0, 14.0, 12.0, 20.0, 19.0, 47.0, 39.0, 54.0, 43.0, 56.0, 50.0, 64.0, 74.0, 71.0, 70.0, 58.0, 43.0, 42.0, 35.0, 37.0, 19.0, 18.0, 12.0, 12.0, 14.0, 7.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.984375, -0.9542999267578125, -0.924224853515625, -0.8941497802734375, -0.86407470703125, -0.8339996337890625, -0.803924560546875, -0.7738494873046875, -0.7437744140625, -0.7136993408203125, -0.683624267578125, -0.6535491943359375, -0.62347412109375, -0.5933990478515625, -0.563323974609375, -0.5332489013671875, -0.503173828125, -0.4730987548828125, -0.443023681640625, -0.4129486083984375, -0.38287353515625, -0.3527984619140625, -0.322723388671875, -0.2926483154296875, -0.2625732421875, -0.2324981689453125, -0.202423095703125, -0.1723480224609375, -0.14227294921875, -0.1121978759765625, -0.082122802734375, -0.0520477294921875, -0.02197265625, 0.0081024169921875, 0.038177490234375, 0.0682525634765625, 0.09832763671875, 0.1284027099609375, 0.158477783203125, 0.1885528564453125, 0.2186279296875, 0.2487030029296875, 0.278778076171875, 0.3088531494140625, 0.33892822265625, 0.3690032958984375, 0.399078369140625, 0.4291534423828125, 0.459228515625, 0.4893035888671875, 0.519378662109375, 0.5494537353515625, 0.57952880859375, 0.6096038818359375, 0.639678955078125, 0.6697540283203125, 0.6998291015625, 0.7299041748046875, 0.759979248046875, 0.7900543212890625, 0.82012939453125, 0.8502044677734375, 0.880279541015625, 0.9103546142578125, 0.9404296875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 8.0, 11.0, 9.0, 16.0, 37.0, 29.0, 51.0, 71.0, 87.0, 100.0, 113.0, 112.0, 93.0, 67.0, 54.0, 35.0, 37.0, 23.0, 13.0, 8.0, 7.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0], "bins": [-25.433486938476562, -24.898591995239258, -24.363698959350586, -23.82880401611328, -23.293909072875977, -22.759014129638672, -22.22412109375, -21.689226150512695, -21.15433120727539, -20.619436264038086, -20.084543228149414, -19.54964828491211, -19.014753341674805, -18.4798583984375, -17.944965362548828, -17.410070419311523, -16.87517547607422, -16.340280532836914, -15.805386543273926, -15.270492553710938, -14.735597610473633, -14.200703620910645, -13.665809631347656, -13.130914688110352, -12.59602165222168, -12.061127662658691, -11.526232719421387, -10.991338729858398, -10.456443786621094, -9.921549797058105, -9.386655807495117, -8.851760864257812, -8.316866874694824, -7.781972408294678, -7.247077941894531, -6.712183952331543, -6.177289009094238, -5.64239501953125, -5.1075005531311035, -4.572606086730957, -4.0377116203308105, -3.502817153930664, -2.9679226875305176, -2.43302845954895, -1.8981339931488037, -1.3632395267486572, -0.8283452987670898, -0.29345083236694336, 0.24144363403320312, 0.7763380408287048, 1.3112324476242065, 1.8461267948150635, 2.38102126121521, 2.9159157276153564, 3.450809955596924, 3.9857044219970703, 4.520598888397217, 5.055493354797363, 5.59038782119751, 6.125282287597656, 6.6601762771606445, 7.195071220397949, 7.7299652099609375, 8.264860153198242, 8.79975414276123]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 7.0, 6.0, 1.0, 7.0, 7.0, 14.0, 20.0, 22.0, 18.0, 24.0, 47.0, 36.0, 43.0, 34.0, 40.0, 34.0, 56.0, 47.0, 35.0, 49.0, 43.0, 44.0, 43.0, 42.0, 37.0, 46.0, 29.0, 37.0, 23.0, 26.0, 11.0, 22.0, 13.0, 7.0, 11.0, 4.0, 5.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.845996856689453, -6.58424711227417, -6.3224968910217285, -6.060747146606445, -5.798996925354004, -5.537247180938721, -5.2754974365234375, -5.013747215270996, -4.751996994018555, -4.4902472496032715, -4.22849702835083, -3.966747283935547, -3.7049970626831055, -3.4432473182678223, -3.18149733543396, -2.9197473526000977, -2.6579976081848145, -2.396247625350952, -2.13449764251709, -1.872747778892517, -1.6109977960586548, -1.3492478132247925, -1.0874979496002197, -0.8257479667663574, -0.5639979839324951, -0.3022480309009552, -0.04049807786941528, 0.22125184535980225, 0.48300182819366455, 0.7447518110275269, 1.0065016746520996, 1.268251657485962, 1.5300016403198242, 1.7917516231536865, 2.053501605987549, 2.315251350402832, 2.5770015716552734, 2.8387513160705566, 3.100501298904419, 3.3622512817382812, 3.6240012645721436, 3.885751247406006, 4.147500991821289, 4.4092512130737305, 4.671000957489014, 4.932751178741455, 5.194500923156738, 5.45625114440918, 5.718000888824463, 5.979750633239746, 6.2415008544921875, 6.503250598907471, 6.765000820159912, 7.026750564575195, 7.288500785827637, 7.55025053024292, 7.812000274658203, 8.073750495910645, 8.33549976348877, 8.597249984741211, 8.859000205993652, 9.120750427246094, 9.382499694824219, 9.64424991607666, 9.906000137329102]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 8.0, 18.0, 24.0, 25.0, 61.0, 71.0, 111.0, 181.0, 248.0, 418.0, 677.0, 1051.0, 1732.0, 3022.0, 5077.0, 9310.0, 16698.0, 30940.0, 59182.0, 108461.0, 175261.0, 213872.0, 177737.0, 111084.0, 61038.0, 32403.0, 17479.0, 9371.0, 5291.0, 2876.0, 1767.0, 1105.0, 760.0, 396.0, 271.0, 169.0, 126.0, 62.0, 44.0, 38.0, 31.0, 13.0, 7.0, 10.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.45361328125, -8.1572265625, -7.86083984375, -7.564453125, -7.26806640625, -6.9716796875, -6.67529296875, -6.37890625, -6.08251953125, -5.7861328125, -5.48974609375, -5.193359375, -4.89697265625, -4.6005859375, -4.30419921875, -4.0078125, -3.71142578125, -3.4150390625, -3.11865234375, -2.822265625, -2.52587890625, -2.2294921875, -1.93310546875, -1.63671875, -1.34033203125, -1.0439453125, -0.74755859375, -0.451171875, -0.15478515625, 0.1416015625, 0.43798828125, 0.734375, 1.03076171875, 1.3271484375, 1.62353515625, 1.919921875, 2.21630859375, 2.5126953125, 2.80908203125, 3.10546875, 3.40185546875, 3.6982421875, 3.99462890625, 4.291015625, 4.58740234375, 4.8837890625, 5.18017578125, 5.4765625, 5.77294921875, 6.0693359375, 6.36572265625, 6.662109375, 6.95849609375, 7.2548828125, 7.55126953125, 7.84765625, 8.14404296875, 8.4404296875, 8.73681640625, 9.033203125, 9.32958984375, 9.6259765625, 9.92236328125, 10.21875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 3.0, 7.0, 3.0, 12.0, 10.0, 11.0, 26.0, 22.0, 26.0, 26.0, 26.0, 52.0, 35.0, 47.0, 49.0, 42.0, 50.0, 45.0, 48.0, 45.0, 58.0, 36.0, 42.0, 30.0, 36.0, 47.0, 37.0, 20.0, 26.0, 17.0, 20.0, 11.0, 7.0, 6.0, 6.0, 11.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.46875, -7.185791015625, -6.90283203125, -6.619873046875, -6.3369140625, -6.053955078125, -5.77099609375, -5.488037109375, -5.205078125, -4.922119140625, -4.63916015625, -4.356201171875, -4.0732421875, -3.790283203125, -3.50732421875, -3.224365234375, -2.94140625, -2.658447265625, -2.37548828125, -2.092529296875, -1.8095703125, -1.526611328125, -1.24365234375, -0.960693359375, -0.677734375, -0.394775390625, -0.11181640625, 0.171142578125, 0.4541015625, 0.737060546875, 1.02001953125, 1.302978515625, 1.5859375, 1.868896484375, 2.15185546875, 2.434814453125, 2.7177734375, 3.000732421875, 3.28369140625, 3.566650390625, 3.849609375, 4.132568359375, 4.41552734375, 4.698486328125, 4.9814453125, 5.264404296875, 5.54736328125, 5.830322265625, 6.11328125, 6.396240234375, 6.67919921875, 6.962158203125, 7.2451171875, 7.528076171875, 7.81103515625, 8.093994140625, 8.376953125, 8.659912109375, 8.94287109375, 9.225830078125, 9.5087890625, 9.791748046875, 10.07470703125, 10.357666015625, 10.640625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 16.0, 19.0, 26.0, 50.0, 62.0, 107.0, 152.0, 209.0, 265.0, 468.0, 687.0, 1007.0, 1466.0, 2450.0, 3775.0, 5633.0, 9077.0, 13986.0, 22380.0, 35907.0, 55373.0, 84791.0, 119623.0, 148684.0, 151731.0, 127512.0, 92697.0, 61784.0, 39696.0, 24961.0, 15834.0, 9940.0, 6450.0, 3956.0, 2591.0, 1773.0, 1159.0, 763.0, 467.0, 339.0, 220.0, 156.0, 97.0, 71.0, 49.0, 28.0, 21.0, 15.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.265625, -6.06427001953125, -5.8629150390625, -5.66156005859375, -5.460205078125, -5.25885009765625, -5.0574951171875, -4.85614013671875, -4.65478515625, -4.45343017578125, -4.2520751953125, -4.05072021484375, -3.849365234375, -3.64801025390625, -3.4466552734375, -3.24530029296875, -3.0439453125, -2.84259033203125, -2.6412353515625, -2.43988037109375, -2.238525390625, -2.03717041015625, -1.8358154296875, -1.63446044921875, -1.43310546875, -1.23175048828125, -1.0303955078125, -0.82904052734375, -0.627685546875, -0.42633056640625, -0.2249755859375, -0.02362060546875, 0.177734375, 0.37908935546875, 0.5804443359375, 0.78179931640625, 0.983154296875, 1.18450927734375, 1.3858642578125, 1.58721923828125, 1.78857421875, 1.98992919921875, 2.1912841796875, 2.39263916015625, 2.593994140625, 2.79534912109375, 2.9967041015625, 3.19805908203125, 3.3994140625, 3.60076904296875, 3.8021240234375, 4.00347900390625, 4.204833984375, 4.40618896484375, 4.6075439453125, 4.80889892578125, 5.01025390625, 5.21160888671875, 5.4129638671875, 5.61431884765625, 5.815673828125, 6.01702880859375, 6.2183837890625, 6.41973876953125, 6.62109375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 5.0, 10.0, 4.0, 16.0, 12.0, 15.0, 18.0, 13.0, 25.0, 28.0, 36.0, 28.0, 34.0, 33.0, 42.0, 34.0, 41.0, 26.0, 45.0, 35.0, 46.0, 47.0, 44.0, 38.0, 40.0, 45.0, 28.0, 39.0, 28.0, 27.0, 23.0, 15.0, 9.0, 13.0, 5.0, 13.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-5.703125, -5.5421142578125, -5.381103515625, -5.2200927734375, -5.05908203125, -4.8980712890625, -4.737060546875, -4.5760498046875, -4.4150390625, -4.2540283203125, -4.093017578125, -3.9320068359375, -3.77099609375, -3.6099853515625, -3.448974609375, -3.2879638671875, -3.126953125, -2.9659423828125, -2.804931640625, -2.6439208984375, -2.48291015625, -2.3218994140625, -2.160888671875, -1.9998779296875, -1.8388671875, -1.6778564453125, -1.516845703125, -1.3558349609375, -1.19482421875, -1.0338134765625, -0.872802734375, -0.7117919921875, -0.55078125, -0.3897705078125, -0.228759765625, -0.0677490234375, 0.09326171875, 0.2542724609375, 0.415283203125, 0.5762939453125, 0.7373046875, 0.8983154296875, 1.059326171875, 1.2203369140625, 1.38134765625, 1.5423583984375, 1.703369140625, 1.8643798828125, 2.025390625, 2.1864013671875, 2.347412109375, 2.5084228515625, 2.66943359375, 2.8304443359375, 2.991455078125, 3.1524658203125, 3.3134765625, 3.4744873046875, 3.635498046875, 3.7965087890625, 3.95751953125, 4.1185302734375, 4.279541015625, 4.4405517578125, 4.6015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 8.0, 9.0, 12.0, 24.0, 21.0, 44.0, 32.0, 73.0, 100.0, 126.0, 209.0, 272.0, 392.0, 649.0, 989.0, 1437.0, 2313.0, 3578.0, 5931.0, 10159.0, 18480.0, 37698.0, 84099.0, 198554.0, 313097.0, 201003.0, 85660.0, 37973.0, 19083.0, 10254.0, 5927.0, 3509.0, 2315.0, 1493.0, 968.0, 640.0, 415.0, 299.0, 211.0, 156.0, 108.0, 70.0, 48.0, 28.0, 31.0, 15.0, 14.0, 6.0, 12.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.2890625, -8.9942626953125, -8.699462890625, -8.4046630859375, -8.10986328125, -7.8150634765625, -7.520263671875, -7.2254638671875, -6.9306640625, -6.6358642578125, -6.341064453125, -6.0462646484375, -5.75146484375, -5.4566650390625, -5.161865234375, -4.8670654296875, -4.572265625, -4.2774658203125, -3.982666015625, -3.6878662109375, -3.39306640625, -3.0982666015625, -2.803466796875, -2.5086669921875, -2.2138671875, -1.9190673828125, -1.624267578125, -1.3294677734375, -1.03466796875, -0.7398681640625, -0.445068359375, -0.1502685546875, 0.14453125, 0.4393310546875, 0.734130859375, 1.0289306640625, 1.32373046875, 1.6185302734375, 1.913330078125, 2.2081298828125, 2.5029296875, 2.7977294921875, 3.092529296875, 3.3873291015625, 3.68212890625, 3.9769287109375, 4.271728515625, 4.5665283203125, 4.861328125, 5.1561279296875, 5.450927734375, 5.7457275390625, 6.04052734375, 6.3353271484375, 6.630126953125, 6.9249267578125, 7.2197265625, 7.5145263671875, 7.809326171875, 8.1041259765625, 8.39892578125, 8.6937255859375, 8.988525390625, 9.2833251953125, 9.578125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 8.0, 9.0, 12.0, 20.0, 15.0, 29.0, 34.0, 52.0, 58.0, 84.0, 113.0, 97.0, 96.0, 77.0, 63.0, 54.0, 43.0, 37.0, 21.0, 20.0, 12.0, 12.0, 6.0, 8.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000797271728515625, -0.0007695257663726807, -0.0007417798042297363, -0.000714033842086792, -0.0006862878799438477, -0.0006585419178009033, -0.000630795955657959, -0.0006030499935150146, -0.0005753040313720703, -0.000547558069229126, -0.0005198121070861816, -0.0004920661449432373, -0.00046432018280029297, -0.00043657422065734863, -0.0004088282585144043, -0.00038108229637145996, -0.0003533363342285156, -0.0003255903720855713, -0.00029784440994262695, -0.0002700984477996826, -0.00024235248565673828, -0.00021460652351379395, -0.0001868605613708496, -0.00015911459922790527, -0.00013136863708496094, -0.0001036226749420166, -7.587671279907227e-05, -4.813075065612793e-05, -2.0384788513183594e-05, 7.361173629760742e-06, 3.510713577270508e-05, 6.285309791564941e-05, 9.059906005859375e-05, 0.00011834502220153809, 0.00014609098434448242, 0.00017383694648742676, 0.0002015829086303711, 0.00022932887077331543, 0.00025707483291625977, 0.0002848207950592041, 0.00031256675720214844, 0.0003403127193450928, 0.0003680586814880371, 0.00039580464363098145, 0.0004235506057739258, 0.0004512965679168701, 0.00047904253005981445, 0.0005067884922027588, 0.0005345344543457031, 0.0005622804164886475, 0.0005900263786315918, 0.0006177723407745361, 0.0006455183029174805, 0.0006732642650604248, 0.0007010102272033691, 0.0007287561893463135, 0.0007565021514892578, 0.0007842481136322021, 0.0008119940757751465, 0.0008397400379180908, 0.0008674860000610352, 0.0008952319622039795, 0.0009229779243469238, 0.0009507238864898682, 0.0009784698486328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 7.0, 14.0, 13.0, 23.0, 38.0, 50.0, 66.0, 106.0, 140.0, 252.0, 334.0, 536.0, 882.0, 1299.0, 2337.0, 3796.0, 6771.0, 12865.0, 24882.0, 52954.0, 121479.0, 251597.0, 282534.0, 153842.0, 66757.0, 30372.0, 15127.0, 8064.0, 4461.0, 2575.0, 1628.0, 947.0, 644.0, 389.0, 257.0, 179.0, 101.0, 79.0, 59.0, 34.0, 19.0, 16.0, 7.0, 6.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6015625, -7.3406982421875, -7.079833984375, -6.8189697265625, -6.55810546875, -6.2972412109375, -6.036376953125, -5.7755126953125, -5.5146484375, -5.2537841796875, -4.992919921875, -4.7320556640625, -4.47119140625, -4.2103271484375, -3.949462890625, -3.6885986328125, -3.427734375, -3.1668701171875, -2.906005859375, -2.6451416015625, -2.38427734375, -2.1234130859375, -1.862548828125, -1.6016845703125, -1.3408203125, -1.0799560546875, -0.819091796875, -0.5582275390625, -0.29736328125, -0.0364990234375, 0.224365234375, 0.4852294921875, 0.74609375, 1.0069580078125, 1.267822265625, 1.5286865234375, 1.78955078125, 2.0504150390625, 2.311279296875, 2.5721435546875, 2.8330078125, 3.0938720703125, 3.354736328125, 3.6156005859375, 3.87646484375, 4.1373291015625, 4.398193359375, 4.6590576171875, 4.919921875, 5.1807861328125, 5.441650390625, 5.7025146484375, 5.96337890625, 6.2242431640625, 6.485107421875, 6.7459716796875, 7.0068359375, 7.2677001953125, 7.528564453125, 7.7894287109375, 8.05029296875, 8.3111572265625, 8.572021484375, 8.8328857421875, 9.09375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 6.0, 4.0, 10.0, 5.0, 6.0, 14.0, 23.0, 21.0, 32.0, 34.0, 27.0, 41.0, 54.0, 72.0, 74.0, 54.0, 77.0, 78.0, 50.0, 47.0, 41.0, 51.0, 40.0, 26.0, 23.0, 22.0, 11.0, 9.0, 7.0, 5.0, 6.0, 5.0, 8.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.025390625, -2.93170166015625, -2.8380126953125, -2.74432373046875, -2.650634765625, -2.55694580078125, -2.4632568359375, -2.36956787109375, -2.27587890625, -2.18218994140625, -2.0885009765625, -1.99481201171875, -1.901123046875, -1.80743408203125, -1.7137451171875, -1.62005615234375, -1.5263671875, -1.43267822265625, -1.3389892578125, -1.24530029296875, -1.151611328125, -1.05792236328125, -0.9642333984375, -0.87054443359375, -0.77685546875, -0.68316650390625, -0.5894775390625, -0.49578857421875, -0.402099609375, -0.30841064453125, -0.2147216796875, -0.12103271484375, -0.02734375, 0.06634521484375, 0.1600341796875, 0.25372314453125, 0.347412109375, 0.44110107421875, 0.5347900390625, 0.62847900390625, 0.72216796875, 0.81585693359375, 0.9095458984375, 1.00323486328125, 1.096923828125, 1.19061279296875, 1.2843017578125, 1.37799072265625, 1.4716796875, 1.56536865234375, 1.6590576171875, 1.75274658203125, 1.846435546875, 1.94012451171875, 2.0338134765625, 2.12750244140625, 2.22119140625, 2.31488037109375, 2.4085693359375, 2.50225830078125, 2.595947265625, 2.68963623046875, 2.7833251953125, 2.87701416015625, 2.970703125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 11.0, 13.0, 28.0, 34.0, 48.0, 63.0, 97.0, 128.0, 126.0, 128.0, 83.0, 72.0, 50.0, 28.0, 39.0, 22.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.0544490814209, -27.434873580932617, -26.815296173095703, -26.195720672607422, -25.57614517211914, -24.956567764282227, -24.336992263793945, -23.71741485595703, -23.09783935546875, -22.47826385498047, -21.858686447143555, -21.239110946655273, -20.619535446166992, -19.999958038330078, -19.380382537841797, -18.760807037353516, -18.141231536865234, -17.521656036376953, -16.90207862854004, -16.282503128051758, -15.66292667388916, -15.043350219726562, -14.423774719238281, -13.804198265075684, -13.184621810913086, -12.565045356750488, -11.945469856262207, -11.32589340209961, -10.706316947937012, -10.086740493774414, -9.467164993286133, -8.847588539123535, -8.228013038635254, -7.6084370613098145, -6.988860607147217, -6.369284629821777, -5.74970817565918, -5.13013219833374, -4.510556221008301, -3.890979766845703, -3.2714037895202637, -2.651827573776245, -2.0322513580322266, -1.412675380706787, -0.7930991649627686, -0.17352294921875, 0.44605302810668945, 1.065629482269287, 1.6852054595947266, 2.304781675338745, 2.9243578910827637, 3.543933868408203, 4.163510322570801, 4.78308629989624, 5.40266227722168, 6.022238731384277, 6.641814708709717, 7.261390686035156, 7.880967140197754, 8.500543594360352, 9.120119094848633, 9.73969554901123, 10.359272003173828, 10.97884750366211, 11.598423957824707]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 2.0, 3.0, 6.0, 6.0, 14.0, 14.0, 10.0, 12.0, 25.0, 19.0, 32.0, 36.0, 40.0, 38.0, 43.0, 37.0, 53.0, 44.0, 44.0, 42.0, 54.0, 43.0, 33.0, 41.0, 41.0, 39.0, 25.0, 44.0, 33.0, 27.0, 30.0, 12.0, 10.0, 9.0, 9.0, 5.0, 5.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.750573635101318, -7.480526447296143, -7.210478782653809, -6.940431594848633, -6.670384407043457, -6.400337219238281, -6.130289554595947, -5.8602423667907715, -5.5901947021484375, -5.320147514343262, -5.050099849700928, -4.780052661895752, -4.510005474090576, -4.239957809448242, -3.9699106216430664, -3.6998634338378906, -3.429816246032715, -3.15976881980896, -2.889721632003784, -2.6196742057800293, -2.3496270179748535, -2.0795795917510986, -1.8095321655273438, -1.5394848585128784, -1.269437551498413, -0.9993902444839478, -0.7293428778648376, -0.45929551124572754, -0.1892482042312622, 0.08079910278320312, 0.350846529006958, 0.6208938360214233, 0.8909406661987305, 1.1609879732131958, 1.4310352802276611, 1.701082706451416, 1.9711300134658813, 2.2411773204803467, 2.5112247467041016, 2.7812719345092773, 3.0513193607330322, 3.321366786956787, 3.591413974761963, 3.8614614009857178, 4.131508827209473, 4.401556015014648, 4.671603202819824, 4.941650867462158, 5.211698055267334, 5.48174524307251, 5.751792907714844, 6.0218400955200195, 6.291887283325195, 6.561934471130371, 6.831982135772705, 7.102029323577881, 7.372076988220215, 7.642124176025391, 7.912171840667725, 8.182218551635742, 8.452266693115234, 8.72231388092041, 8.992361068725586, 9.262408256530762, 9.532455444335938]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 3.0, 13.0, 12.0, 26.0, 24.0, 36.0, 69.0, 117.0, 159.0, 219.0, 368.0, 542.0, 887.0, 1180.0, 1825.0, 2742.0, 4020.0, 6135.0, 9636.0, 16096.0, 28944.0, 59459.0, 138556.0, 368594.0, 929145.0, 1326848.0, 783901.0, 294085.0, 110893.0, 47914.0, 23810.0, 13381.0, 8167.0, 5259.0, 3480.0, 2252.0, 1597.0, 1033.0, 768.0, 556.0, 435.0, 296.0, 213.0, 168.0, 106.0, 86.0, 51.0, 58.0, 42.0, 36.0, 16.0, 11.0, 7.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.0625, -9.7200927734375, -9.377685546875, -9.0352783203125, -8.69287109375, -8.3504638671875, -8.008056640625, -7.6656494140625, -7.3232421875, -6.9808349609375, -6.638427734375, -6.2960205078125, -5.95361328125, -5.6112060546875, -5.268798828125, -4.9263916015625, -4.583984375, -4.2415771484375, -3.899169921875, -3.5567626953125, -3.21435546875, -2.8719482421875, -2.529541015625, -2.1871337890625, -1.8447265625, -1.5023193359375, -1.159912109375, -0.8175048828125, -0.47509765625, -0.1326904296875, 0.209716796875, 0.5521240234375, 0.89453125, 1.2369384765625, 1.579345703125, 1.9217529296875, 2.26416015625, 2.6065673828125, 2.948974609375, 3.2913818359375, 3.6337890625, 3.9761962890625, 4.318603515625, 4.6610107421875, 5.00341796875, 5.3458251953125, 5.688232421875, 6.0306396484375, 6.373046875, 6.7154541015625, 7.057861328125, 7.4002685546875, 7.74267578125, 8.0850830078125, 8.427490234375, 8.7698974609375, 9.1123046875, 9.4547119140625, 9.797119140625, 10.1395263671875, 10.48193359375, 10.8243408203125, 11.166748046875, 11.5091552734375, 11.8515625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 9.0, 20.0, 13.0, 14.0, 32.0, 21.0, 43.0, 42.0, 42.0, 42.0, 45.0, 38.0, 41.0, 44.0, 40.0, 50.0, 48.0, 48.0, 53.0, 41.0, 41.0, 38.0, 31.0, 22.0, 24.0, 22.0, 20.0, 12.0, 9.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.98046875, -4.7952880859375, -4.610107421875, -4.4249267578125, -4.23974609375, -4.0545654296875, -3.869384765625, -3.6842041015625, -3.4990234375, -3.3138427734375, -3.128662109375, -2.9434814453125, -2.75830078125, -2.5731201171875, -2.387939453125, -2.2027587890625, -2.017578125, -1.8323974609375, -1.647216796875, -1.4620361328125, -1.27685546875, -1.0916748046875, -0.906494140625, -0.7213134765625, -0.5361328125, -0.3509521484375, -0.165771484375, 0.0194091796875, 0.20458984375, 0.3897705078125, 0.574951171875, 0.7601318359375, 0.9453125, 1.1304931640625, 1.315673828125, 1.5008544921875, 1.68603515625, 1.8712158203125, 2.056396484375, 2.2415771484375, 2.4267578125, 2.6119384765625, 2.797119140625, 2.9822998046875, 3.16748046875, 3.3526611328125, 3.537841796875, 3.7230224609375, 3.908203125, 4.0933837890625, 4.278564453125, 4.4637451171875, 4.64892578125, 4.8341064453125, 5.019287109375, 5.2044677734375, 5.3896484375, 5.5748291015625, 5.760009765625, 5.9451904296875, 6.13037109375, 6.3155517578125, 6.500732421875, 6.6859130859375, 6.87109375]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 4.0, 11.0, 17.0, 31.0, 29.0, 53.0, 61.0, 104.0, 153.0, 252.0, 387.0, 546.0, 881.0, 1320.0, 2122.0, 3431.0, 5768.0, 10085.0, 18962.0, 37517.0, 83033.0, 215724.0, 614281.0, 1326252.0, 1130829.0, 451278.0, 159922.0, 64512.0, 29838.0, 15452.0, 8467.0, 4850.0, 2934.0, 1765.0, 1203.0, 751.0, 496.0, 311.0, 209.0, 142.0, 92.0, 65.0, 68.0, 23.0, 11.0, 13.0, 10.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -12.0318603515625, -11.641845703125, -11.2518310546875, -10.86181640625, -10.4718017578125, -10.081787109375, -9.6917724609375, -9.3017578125, -8.9117431640625, -8.521728515625, -8.1317138671875, -7.74169921875, -7.3516845703125, -6.961669921875, -6.5716552734375, -6.181640625, -5.7916259765625, -5.401611328125, -5.0115966796875, -4.62158203125, -4.2315673828125, -3.841552734375, -3.4515380859375, -3.0615234375, -2.6715087890625, -2.281494140625, -1.8914794921875, -1.50146484375, -1.1114501953125, -0.721435546875, -0.3314208984375, 0.05859375, 0.4486083984375, 0.838623046875, 1.2286376953125, 1.61865234375, 2.0086669921875, 2.398681640625, 2.7886962890625, 3.1787109375, 3.5687255859375, 3.958740234375, 4.3487548828125, 4.73876953125, 5.1287841796875, 5.518798828125, 5.9088134765625, 6.298828125, 6.6888427734375, 7.078857421875, 7.4688720703125, 7.85888671875, 8.2489013671875, 8.638916015625, 9.0289306640625, 9.4189453125, 9.8089599609375, 10.198974609375, 10.5889892578125, 10.97900390625, 11.3690185546875, 11.759033203125, 12.1490478515625, 12.5390625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 5.0, 4.0, 5.0, 9.0, 9.0, 8.0, 20.0, 30.0, 23.0, 38.0, 53.0, 68.0, 71.0, 88.0, 115.0, 142.0, 191.0, 238.0, 267.0, 318.0, 353.0, 340.0, 295.0, 257.0, 258.0, 200.0, 170.0, 123.0, 84.0, 83.0, 60.0, 36.0, 24.0, 20.0, 17.0, 18.0, 10.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.4964599609375, -3.387451171875, -3.2784423828125, -3.16943359375, -3.0604248046875, -2.951416015625, -2.8424072265625, -2.7333984375, -2.6243896484375, -2.515380859375, -2.4063720703125, -2.29736328125, -2.1883544921875, -2.079345703125, -1.9703369140625, -1.861328125, -1.7523193359375, -1.643310546875, -1.5343017578125, -1.42529296875, -1.3162841796875, -1.207275390625, -1.0982666015625, -0.9892578125, -0.8802490234375, -0.771240234375, -0.6622314453125, -0.55322265625, -0.4442138671875, -0.335205078125, -0.2261962890625, -0.1171875, -0.0081787109375, 0.100830078125, 0.2098388671875, 0.31884765625, 0.4278564453125, 0.536865234375, 0.6458740234375, 0.7548828125, 0.8638916015625, 0.972900390625, 1.0819091796875, 1.19091796875, 1.2999267578125, 1.408935546875, 1.5179443359375, 1.626953125, 1.7359619140625, 1.844970703125, 1.9539794921875, 2.06298828125, 2.1719970703125, 2.281005859375, 2.3900146484375, 2.4990234375, 2.6080322265625, 2.717041015625, 2.8260498046875, 2.93505859375, 3.0440673828125, 3.153076171875, 3.2620849609375, 3.37109375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 7.0, 10.0, 17.0, 19.0, 23.0, 35.0, 54.0, 65.0, 76.0, 102.0, 117.0, 124.0, 93.0, 72.0, 48.0, 41.0, 31.0, 21.0, 10.0, 12.0, 6.0, 4.0, 7.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-20.712648391723633, -20.2382755279541, -19.76390266418457, -19.28952980041504, -18.815156936645508, -18.340784072875977, -17.866411209106445, -17.39203643798828, -16.91766357421875, -16.44329071044922, -15.968917846679688, -15.494544982910156, -15.020172119140625, -14.545799255371094, -14.071425437927246, -13.597052574157715, -13.1226806640625, -12.648307800292969, -12.173934936523438, -11.699562072753906, -11.225189208984375, -10.750816345214844, -10.276442527770996, -9.802069664001465, -9.327696800231934, -8.853323936462402, -8.378951072692871, -7.904577732086182, -7.43020486831665, -6.955832004547119, -6.48145866394043, -6.007085800170898, -5.532713890075684, -5.058341026306152, -4.583968162536621, -4.109594821929932, -3.6352219581604004, -3.160849094390869, -2.686475992202759, -2.2121028900146484, -1.7377300262451172, -1.2633570432662964, -0.7889840602874756, -0.3146110773086548, 0.15976190567016602, 0.6341347694396973, 1.1085078716278076, 1.582880973815918, 2.057253837585449, 2.5316267013549805, 3.005999803543091, 3.480372905731201, 3.9547457695007324, 4.429118633270264, 4.903491973876953, 5.377864837646484, 5.852237701416016, 6.326610565185547, 6.800983428955078, 7.275356769561768, 7.749729633331299, 8.224102020263672, 8.69847583770752, 9.17284870147705, 9.647221565246582]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 11.0, 8.0, 4.0, 10.0, 17.0, 17.0, 14.0, 31.0, 29.0, 25.0, 39.0, 32.0, 37.0, 39.0, 44.0, 48.0, 37.0, 46.0, 48.0, 50.0, 46.0, 38.0, 39.0, 32.0, 43.0, 36.0, 33.0, 18.0, 20.0, 22.0, 13.0, 12.0, 16.0, 9.0, 8.0, 7.0, 4.0, 1.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.637454509735107, -6.406438827514648, -6.175422668457031, -5.944406986236572, -5.713391304016113, -5.482375144958496, -5.251359462738037, -5.020343780517578, -4.789327621459961, -4.558311939239502, -4.327295780181885, -4.096280097961426, -3.865264415740967, -3.6342484951019287, -3.4032325744628906, -3.1722168922424316, -2.9412012100219727, -2.7101852893829346, -2.4791696071624756, -2.2481536865234375, -2.0171380043029785, -1.7861220836639404, -1.5551061630249023, -1.3240903615951538, -1.0930745601654053, -0.8620587587356567, -0.6310428977012634, -0.4000270366668701, -0.16901123523712158, 0.06200456619262695, 0.29302048683166504, 0.5240362882614136, 0.7550516128540039, 0.9860674142837524, 1.217083215713501, 1.448099136352539, 1.6791149377822876, 1.9101307392120361, 2.141146659851074, 2.372162342071533, 2.6031782627105713, 2.8341941833496094, 3.0652098655700684, 3.2962257862091064, 3.5272417068481445, 3.7582573890686035, 3.9892733097076416, 4.22028923034668, 4.451304912567139, 4.682320594787598, 4.913336753845215, 5.144352436065674, 5.375368118286133, 5.60638427734375, 5.837399959564209, 6.068415641784668, 6.299431800842285, 6.530447483062744, 6.761463642120361, 6.99247932434082, 7.223495006561279, 7.454510688781738, 7.6855268478393555, 7.9165425300598145, 8.147558212280273]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 12.0, 17.0, 22.0, 31.0, 46.0, 84.0, 163.0, 233.0, 327.0, 567.0, 828.0, 1232.0, 2042.0, 3340.0, 5506.0, 9286.0, 16414.0, 29923.0, 54945.0, 100624.0, 167494.0, 216817.0, 183048.0, 113678.0, 63101.0, 33701.0, 18603.0, 10535.0, 5854.0, 3721.0, 2274.0, 1503.0, 909.0, 563.0, 397.0, 240.0, 146.0, 112.0, 61.0, 52.0, 33.0, 23.0, 20.0, 12.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.912109375, -3.799072265625, -3.68603515625, -3.572998046875, -3.4599609375, -3.346923828125, -3.23388671875, -3.120849609375, -3.0078125, -2.894775390625, -2.78173828125, -2.668701171875, -2.5556640625, -2.442626953125, -2.32958984375, -2.216552734375, -2.103515625, -1.990478515625, -1.87744140625, -1.764404296875, -1.6513671875, -1.538330078125, -1.42529296875, -1.312255859375, -1.19921875, -1.086181640625, -0.97314453125, -0.860107421875, -0.7470703125, -0.634033203125, -0.52099609375, -0.407958984375, -0.294921875, -0.181884765625, -0.06884765625, 0.044189453125, 0.1572265625, 0.270263671875, 0.38330078125, 0.496337890625, 0.609375, 0.722412109375, 0.83544921875, 0.948486328125, 1.0615234375, 1.174560546875, 1.28759765625, 1.400634765625, 1.513671875, 1.626708984375, 1.73974609375, 1.852783203125, 1.9658203125, 2.078857421875, 2.19189453125, 2.304931640625, 2.41796875, 2.531005859375, 2.64404296875, 2.757080078125, 2.8701171875, 2.983154296875, 3.09619140625, 3.209228515625, 3.322265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 9.0, 7.0, 5.0, 17.0, 23.0, 30.0, 29.0, 32.0, 33.0, 46.0, 36.0, 42.0, 41.0, 48.0, 48.0, 61.0, 45.0, 61.0, 44.0, 47.0, 41.0, 39.0, 28.0, 33.0, 33.0, 25.0, 18.0, 14.0, 12.0, 7.0, 7.0, 9.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.92578125, -7.65899658203125, -7.3922119140625, -7.12542724609375, -6.858642578125, -6.59185791015625, -6.3250732421875, -6.05828857421875, -5.79150390625, -5.52471923828125, -5.2579345703125, -4.99114990234375, -4.724365234375, -4.45758056640625, -4.1907958984375, -3.92401123046875, -3.6572265625, -3.39044189453125, -3.1236572265625, -2.85687255859375, -2.590087890625, -2.32330322265625, -2.0565185546875, -1.78973388671875, -1.52294921875, -1.25616455078125, -0.9893798828125, -0.72259521484375, -0.455810546875, -0.18902587890625, 0.0777587890625, 0.34454345703125, 0.611328125, 0.87811279296875, 1.1448974609375, 1.41168212890625, 1.678466796875, 1.94525146484375, 2.2120361328125, 2.47882080078125, 2.74560546875, 3.01239013671875, 3.2791748046875, 3.54595947265625, 3.812744140625, 4.07952880859375, 4.3463134765625, 4.61309814453125, 4.8798828125, 5.14666748046875, 5.4134521484375, 5.68023681640625, 5.947021484375, 6.21380615234375, 6.4805908203125, 6.74737548828125, 7.01416015625, 7.28094482421875, 7.5477294921875, 7.81451416015625, 8.081298828125, 8.34808349609375, 8.6148681640625, 8.88165283203125, 9.1484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 12.0, 14.0, 18.0, 24.0, 25.0, 38.0, 59.0, 83.0, 101.0, 150.0, 218.0, 306.0, 452.0, 581.0, 936.0, 1405.0, 2110.0, 3387.0, 5446.0, 9304.0, 16323.0, 29764.0, 56348.0, 104852.0, 179795.0, 228031.0, 177687.0, 103956.0, 55691.0, 29860.0, 16515.0, 9350.0, 5566.0, 3562.0, 2194.0, 1431.0, 937.0, 615.0, 391.0, 278.0, 207.0, 155.0, 98.0, 80.0, 50.0, 38.0, 32.0, 22.0, 18.0, 8.0, 4.0, 5.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0], "bins": [-3.640625, -3.5250244140625, -3.409423828125, -3.2938232421875, -3.17822265625, -3.0626220703125, -2.947021484375, -2.8314208984375, -2.7158203125, -2.6002197265625, -2.484619140625, -2.3690185546875, -2.25341796875, -2.1378173828125, -2.022216796875, -1.9066162109375, -1.791015625, -1.6754150390625, -1.559814453125, -1.4442138671875, -1.32861328125, -1.2130126953125, -1.097412109375, -0.9818115234375, -0.8662109375, -0.7506103515625, -0.635009765625, -0.5194091796875, -0.40380859375, -0.2882080078125, -0.172607421875, -0.0570068359375, 0.05859375, 0.1741943359375, 0.289794921875, 0.4053955078125, 0.52099609375, 0.6365966796875, 0.752197265625, 0.8677978515625, 0.9833984375, 1.0989990234375, 1.214599609375, 1.3302001953125, 1.44580078125, 1.5614013671875, 1.677001953125, 1.7926025390625, 1.908203125, 2.0238037109375, 2.139404296875, 2.2550048828125, 2.37060546875, 2.4862060546875, 2.601806640625, 2.7174072265625, 2.8330078125, 2.9486083984375, 3.064208984375, 3.1798095703125, 3.29541015625, 3.4110107421875, 3.526611328125, 3.6422119140625, 3.7578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 5.0, 10.0, 9.0, 15.0, 17.0, 14.0, 18.0, 30.0, 31.0, 30.0, 39.0, 40.0, 31.0, 38.0, 40.0, 44.0, 50.0, 42.0, 33.0, 37.0, 62.0, 40.0, 44.0, 34.0, 25.0, 27.0, 31.0, 30.0, 28.0, 14.0, 10.0, 17.0, 8.0, 15.0, 4.0, 6.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.240814208984375, -4.11053466796875, -3.980255126953125, -3.8499755859375, -3.719696044921875, -3.58941650390625, -3.459136962890625, -3.328857421875, -3.198577880859375, -3.06829833984375, -2.938018798828125, -2.8077392578125, -2.677459716796875, -2.54718017578125, -2.416900634765625, -2.28662109375, -2.156341552734375, -2.02606201171875, -1.895782470703125, -1.7655029296875, -1.635223388671875, -1.50494384765625, -1.374664306640625, -1.244384765625, -1.114105224609375, -0.98382568359375, -0.853546142578125, -0.7232666015625, -0.592987060546875, -0.46270751953125, -0.332427978515625, -0.2021484375, -0.071868896484375, 0.05841064453125, 0.188690185546875, 0.3189697265625, 0.449249267578125, 0.57952880859375, 0.709808349609375, 0.840087890625, 0.970367431640625, 1.10064697265625, 1.230926513671875, 1.3612060546875, 1.491485595703125, 1.62176513671875, 1.752044677734375, 1.88232421875, 2.012603759765625, 2.14288330078125, 2.273162841796875, 2.4034423828125, 2.533721923828125, 2.66400146484375, 2.794281005859375, 2.924560546875, 3.054840087890625, 3.18511962890625, 3.315399169921875, 3.4456787109375, 3.575958251953125, 3.70623779296875, 3.836517333984375, 3.966796875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 11.0, 19.0, 23.0, 29.0, 39.0, 58.0, 74.0, 106.0, 146.0, 223.0, 332.0, 536.0, 747.0, 1253.0, 1998.0, 3246.0, 5677.0, 10285.0, 17707.0, 33165.0, 63175.0, 122049.0, 215060.0, 241949.0, 154615.0, 81061.0, 42210.0, 22490.0, 12363.0, 6887.0, 4122.0, 2517.0, 1577.0, 945.0, 594.0, 420.0, 294.0, 168.0, 121.0, 96.0, 49.0, 38.0, 22.0, 20.0, 7.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5218505859375, -1.471435546875, -1.4210205078125, -1.37060546875, -1.3201904296875, -1.269775390625, -1.2193603515625, -1.1689453125, -1.1185302734375, -1.068115234375, -1.0177001953125, -0.96728515625, -0.9168701171875, -0.866455078125, -0.8160400390625, -0.765625, -0.7152099609375, -0.664794921875, -0.6143798828125, -0.56396484375, -0.5135498046875, -0.463134765625, -0.4127197265625, -0.3623046875, -0.3118896484375, -0.261474609375, -0.2110595703125, -0.16064453125, -0.1102294921875, -0.059814453125, -0.0093994140625, 0.041015625, 0.0914306640625, 0.141845703125, 0.1922607421875, 0.24267578125, 0.2930908203125, 0.343505859375, 0.3939208984375, 0.4443359375, 0.4947509765625, 0.545166015625, 0.5955810546875, 0.64599609375, 0.6964111328125, 0.746826171875, 0.7972412109375, 0.84765625, 0.8980712890625, 0.948486328125, 0.9989013671875, 1.04931640625, 1.0997314453125, 1.150146484375, 1.2005615234375, 1.2509765625, 1.3013916015625, 1.351806640625, 1.4022216796875, 1.45263671875, 1.5030517578125, 1.553466796875, 1.6038818359375, 1.654296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 17.0, 17.0, 46.0, 45.0, 61.0, 75.0, 118.0, 126.0, 105.0, 102.0, 73.0, 62.0, 50.0, 19.0, 24.0, 14.0, 11.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010824203491210938, -0.00010389834642410278, -9.955465793609619e-05, -9.52109694480896e-05, -9.086728096008301e-05, -8.652359247207642e-05, -8.217990398406982e-05, -7.783621549606323e-05, -7.349252700805664e-05, -6.914883852005005e-05, -6.480515003204346e-05, -6.0461461544036865e-05, -5.6117773056030273e-05, -5.177408456802368e-05, -4.743039608001709e-05, -4.30867075920105e-05, -3.8743019104003906e-05, -3.4399330615997314e-05, -3.0055642127990723e-05, -2.571195363998413e-05, -2.136826515197754e-05, -1.7024576663970947e-05, -1.2680888175964355e-05, -8.337199687957764e-06, -3.993511199951172e-06, 3.501772880554199e-07, 4.693865776062012e-06, 9.037554264068604e-06, 1.3381242752075195e-05, 1.7724931240081787e-05, 2.206861972808838e-05, 2.641230821609497e-05, 3.075599670410156e-05, 3.5099685192108154e-05, 3.9443373680114746e-05, 4.378706216812134e-05, 4.813075065612793e-05, 5.247443914413452e-05, 5.681812763214111e-05, 6.11618161201477e-05, 6.55055046081543e-05, 6.984919309616089e-05, 7.419288158416748e-05, 7.853657007217407e-05, 8.288025856018066e-05, 8.722394704818726e-05, 9.156763553619385e-05, 9.591132402420044e-05, 0.00010025501251220703, 0.00010459870100021362, 0.00010894238948822021, 0.0001132860779762268, 0.0001176297664642334, 0.00012197345495223999, 0.00012631714344024658, 0.00013066083192825317, 0.00013500452041625977, 0.00013934820890426636, 0.00014369189739227295, 0.00014803558588027954, 0.00015237927436828613, 0.00015672296285629272, 0.00016106665134429932, 0.0001654103398323059, 0.0001697540283203125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 15.0, 20.0, 22.0, 25.0, 44.0, 54.0, 102.0, 131.0, 211.0, 310.0, 461.0, 861.0, 1363.0, 2341.0, 4499.0, 9170.0, 20323.0, 48707.0, 118257.0, 245967.0, 294160.0, 171542.0, 72537.0, 30178.0, 13439.0, 6295.0, 3088.0, 1683.0, 1032.0, 586.0, 371.0, 249.0, 144.0, 111.0, 87.0, 50.0, 28.0, 28.0, 13.0, 16.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.37109375, -2.30181884765625, -2.2325439453125, -2.16326904296875, -2.093994140625, -2.02471923828125, -1.9554443359375, -1.88616943359375, -1.81689453125, -1.74761962890625, -1.6783447265625, -1.60906982421875, -1.539794921875, -1.47052001953125, -1.4012451171875, -1.33197021484375, -1.2626953125, -1.19342041015625, -1.1241455078125, -1.05487060546875, -0.985595703125, -0.91632080078125, -0.8470458984375, -0.77777099609375, -0.70849609375, -0.63922119140625, -0.5699462890625, -0.50067138671875, -0.431396484375, -0.36212158203125, -0.2928466796875, -0.22357177734375, -0.154296875, -0.08502197265625, -0.0157470703125, 0.05352783203125, 0.122802734375, 0.19207763671875, 0.2613525390625, 0.33062744140625, 0.39990234375, 0.46917724609375, 0.5384521484375, 0.60772705078125, 0.677001953125, 0.74627685546875, 0.8155517578125, 0.88482666015625, 0.9541015625, 1.02337646484375, 1.0926513671875, 1.16192626953125, 1.231201171875, 1.30047607421875, 1.3697509765625, 1.43902587890625, 1.50830078125, 1.57757568359375, 1.6468505859375, 1.71612548828125, 1.785400390625, 1.85467529296875, 1.9239501953125, 1.99322509765625, 2.0625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 6.0, 4.0, 11.0, 11.0, 21.0, 18.0, 31.0, 27.0, 35.0, 50.0, 63.0, 86.0, 97.0, 78.0, 100.0, 70.0, 58.0, 48.0, 35.0, 39.0, 25.0, 18.0, 22.0, 11.0, 7.0, 8.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71875, -0.6937713623046875, -0.668792724609375, -0.6438140869140625, -0.61883544921875, -0.5938568115234375, -0.568878173828125, -0.5438995361328125, -0.5189208984375, -0.4939422607421875, -0.468963623046875, -0.4439849853515625, -0.41900634765625, -0.3940277099609375, -0.369049072265625, -0.3440704345703125, -0.319091796875, -0.2941131591796875, -0.269134521484375, -0.2441558837890625, -0.21917724609375, -0.1941986083984375, -0.169219970703125, -0.1442413330078125, -0.1192626953125, -0.0942840576171875, -0.069305419921875, -0.0443267822265625, -0.01934814453125, 0.0056304931640625, 0.030609130859375, 0.0555877685546875, 0.08056640625, 0.1055450439453125, 0.130523681640625, 0.1555023193359375, 0.18048095703125, 0.2054595947265625, 0.230438232421875, 0.2554168701171875, 0.2803955078125, 0.3053741455078125, 0.330352783203125, 0.3553314208984375, 0.38031005859375, 0.4052886962890625, 0.430267333984375, 0.4552459716796875, 0.480224609375, 0.5052032470703125, 0.530181884765625, 0.5551605224609375, 0.58013916015625, 0.6051177978515625, 0.630096435546875, 0.6550750732421875, 0.6800537109375, 0.7050323486328125, 0.730010986328125, 0.7549896240234375, 0.77996826171875, 0.8049468994140625, 0.829925537109375, 0.8549041748046875, 0.8798828125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 16.0, 17.0, 27.0, 22.0, 54.0, 63.0, 66.0, 100.0, 109.0, 117.0, 95.0, 81.0, 53.0, 43.0, 39.0, 22.0, 23.0, 7.0, 9.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 3.0], "bins": [-19.901113510131836, -19.447967529296875, -18.994821548461914, -18.541675567626953, -18.088529586791992, -17.63538360595703, -17.182239532470703, -16.729093551635742, -16.27594757080078, -15.82280158996582, -15.36965560913086, -14.916509628295898, -14.463364601135254, -14.010218620300293, -13.557072639465332, -13.103926658630371, -12.65078067779541, -12.19763469696045, -11.744488716125488, -11.291343688964844, -10.838197708129883, -10.385051727294922, -9.931905746459961, -9.478759765625, -9.025613784790039, -8.572467803955078, -8.119321823120117, -7.6661763191223145, -7.213030815124512, -6.759884834289551, -6.30673885345459, -5.853592872619629, -5.400448799133301, -4.94730281829834, -4.494157314300537, -4.041011333465576, -3.5878655910491943, -3.1347198486328125, -2.6815738677978516, -2.2284281253814697, -1.775282382965088, -1.322136640548706, -0.8689907789230347, -0.4158449172973633, 0.037300825119018555, 0.4904465675354004, 0.9435925483703613, 1.3967382907867432, 1.849884033203125, 2.303029775619507, 2.7561755180358887, 3.2093214988708496, 3.6624672412872314, 4.115612983703613, 4.568758964538574, 5.021904945373535, 5.475050449371338, 5.928196430206299, 6.381341934204102, 6.8344879150390625, 7.287633895874023, 7.740779399871826, 8.193925857543945, 8.64707088470459, 9.10021686553955]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 10.0, 7.0, 6.0, 7.0, 20.0, 19.0, 9.0, 26.0, 36.0, 21.0, 29.0, 47.0, 31.0, 40.0, 36.0, 47.0, 42.0, 51.0, 48.0, 40.0, 45.0, 42.0, 36.0, 41.0, 29.0, 41.0, 32.0, 28.0, 19.0, 23.0, 14.0, 15.0, 13.0, 9.0, 11.0, 7.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.676895618438721, -6.449435710906982, -6.221975803375244, -5.994515895843506, -5.767055988311768, -5.539596080780029, -5.312136650085449, -5.084676742553711, -4.857216835021973, -4.629756927490234, -4.402297019958496, -4.174837112426758, -3.9473772048950195, -3.7199172973632812, -3.492457628250122, -3.264997720718384, -3.0375375747680664, -2.810077667236328, -2.58261775970459, -2.3551578521728516, -2.1276979446411133, -1.9002381563186646, -1.6727783679962158, -1.4453184604644775, -1.2178585529327393, -0.990398645401001, -0.7629387974739075, -0.535478949546814, -0.3080190420150757, -0.0805591344833374, 0.14690065383911133, 0.3743605613708496, 0.6018204689025879, 0.8292803764343262, 1.0567402839660645, 1.2842000722885132, 1.5116599798202515, 1.7391198873519897, 1.9665796756744385, 2.1940395832061768, 2.421499490737915, 2.6489593982696533, 2.8764193058013916, 3.103878974914551, 3.331338882446289, 3.5587987899780273, 3.7862586975097656, 4.013718605041504, 4.241178512573242, 4.4686384201049805, 4.696098327636719, 4.923558235168457, 5.151018142700195, 5.378478050231934, 5.605937957763672, 5.83339786529541, 6.060857772827148, 6.288317680358887, 6.515777587890625, 6.743237495422363, 6.970697402954102, 7.19815731048584, 7.425617218017578, 7.653077125549316, 7.8805365562438965]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 6.0, 4.0, 10.0, 13.0, 31.0, 30.0, 48.0, 92.0, 156.0, 256.0, 393.0, 672.0, 1180.0, 2182.0, 4261.0, 9014.0, 20437.0, 50131.0, 131945.0, 287788.0, 299019.0, 144304.0, 55108.0, 21834.0, 9701.0, 4594.0, 2294.0, 1295.0, 667.0, 424.0, 249.0, 148.0, 92.0, 57.0, 38.0, 25.0, 18.0, 18.0, 10.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7265625, -12.316650390625, -11.90673828125, -11.496826171875, -11.0869140625, -10.677001953125, -10.26708984375, -9.857177734375, -9.447265625, -9.037353515625, -8.62744140625, -8.217529296875, -7.8076171875, -7.397705078125, -6.98779296875, -6.577880859375, -6.16796875, -5.758056640625, -5.34814453125, -4.938232421875, -4.5283203125, -4.118408203125, -3.70849609375, -3.298583984375, -2.888671875, -2.478759765625, -2.06884765625, -1.658935546875, -1.2490234375, -0.839111328125, -0.42919921875, -0.019287109375, 0.390625, 0.800537109375, 1.21044921875, 1.620361328125, 2.0302734375, 2.440185546875, 2.85009765625, 3.260009765625, 3.669921875, 4.079833984375, 4.48974609375, 4.899658203125, 5.3095703125, 5.719482421875, 6.12939453125, 6.539306640625, 6.94921875, 7.359130859375, 7.76904296875, 8.178955078125, 8.5888671875, 8.998779296875, 9.40869140625, 9.818603515625, 10.228515625, 10.638427734375, 11.04833984375, 11.458251953125, 11.8681640625, 12.278076171875, 12.68798828125, 13.097900390625, 13.5078125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 6.0, 8.0, 9.0, 14.0, 10.0, 15.0, 13.0, 20.0, 21.0, 28.0, 48.0, 39.0, 40.0, 40.0, 39.0, 45.0, 40.0, 50.0, 50.0, 57.0, 38.0, 43.0, 41.0, 36.0, 35.0, 33.0, 24.0, 21.0, 29.0, 24.0, 16.0, 14.0, 10.0, 7.0, 7.0, 7.0, 7.0, 3.0, 2.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.35546875, -7.11383056640625, -6.8721923828125, -6.63055419921875, -6.388916015625, -6.14727783203125, -5.9056396484375, -5.66400146484375, -5.42236328125, -5.18072509765625, -4.9390869140625, -4.69744873046875, -4.455810546875, -4.21417236328125, -3.9725341796875, -3.73089599609375, -3.4892578125, -3.24761962890625, -3.0059814453125, -2.76434326171875, -2.522705078125, -2.28106689453125, -2.0394287109375, -1.79779052734375, -1.55615234375, -1.31451416015625, -1.0728759765625, -0.83123779296875, -0.589599609375, -0.34796142578125, -0.1063232421875, 0.13531494140625, 0.376953125, 0.61859130859375, 0.8602294921875, 1.10186767578125, 1.343505859375, 1.58514404296875, 1.8267822265625, 2.06842041015625, 2.31005859375, 2.55169677734375, 2.7933349609375, 3.03497314453125, 3.276611328125, 3.51824951171875, 3.7598876953125, 4.00152587890625, 4.2431640625, 4.48480224609375, 4.7264404296875, 4.96807861328125, 5.209716796875, 5.45135498046875, 5.6929931640625, 5.93463134765625, 6.17626953125, 6.41790771484375, 6.6595458984375, 6.90118408203125, 7.142822265625, 7.38446044921875, 7.6260986328125, 7.86773681640625, 8.109375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 11.0, 15.0, 14.0, 37.0, 60.0, 80.0, 108.0, 151.0, 217.0, 360.0, 512.0, 752.0, 1306.0, 1896.0, 3006.0, 4771.0, 7884.0, 13098.0, 21438.0, 36839.0, 62660.0, 104407.0, 158559.0, 189645.0, 164865.0, 111193.0, 66692.0, 38705.0, 22845.0, 13740.0, 8414.0, 5192.0, 3311.0, 2002.0, 1272.0, 837.0, 553.0, 365.0, 253.0, 151.0, 101.0, 68.0, 51.0, 32.0, 20.0, 18.0, 12.0, 8.0, 10.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.77471923828125, -6.5455322265625, -6.31634521484375, -6.087158203125, -5.85797119140625, -5.6287841796875, -5.39959716796875, -5.17041015625, -4.94122314453125, -4.7120361328125, -4.48284912109375, -4.253662109375, -4.02447509765625, -3.7952880859375, -3.56610107421875, -3.3369140625, -3.10772705078125, -2.8785400390625, -2.64935302734375, -2.420166015625, -2.19097900390625, -1.9617919921875, -1.73260498046875, -1.50341796875, -1.27423095703125, -1.0450439453125, -0.81585693359375, -0.586669921875, -0.35748291015625, -0.1282958984375, 0.10089111328125, 0.330078125, 0.55926513671875, 0.7884521484375, 1.01763916015625, 1.246826171875, 1.47601318359375, 1.7052001953125, 1.93438720703125, 2.16357421875, 2.39276123046875, 2.6219482421875, 2.85113525390625, 3.080322265625, 3.30950927734375, 3.5386962890625, 3.76788330078125, 3.9970703125, 4.22625732421875, 4.4554443359375, 4.68463134765625, 4.913818359375, 5.14300537109375, 5.3721923828125, 5.60137939453125, 5.83056640625, 6.05975341796875, 6.2889404296875, 6.51812744140625, 6.747314453125, 6.97650146484375, 7.2056884765625, 7.43487548828125, 7.6640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 12.0, 13.0, 13.0, 12.0, 14.0, 27.0, 40.0, 44.0, 41.0, 57.0, 39.0, 55.0, 52.0, 50.0, 54.0, 63.0, 48.0, 47.0, 65.0, 47.0, 38.0, 40.0, 26.0, 30.0, 13.0, 22.0, 17.0, 8.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.54296875, -6.3497314453125, -6.156494140625, -5.9632568359375, -5.77001953125, -5.5767822265625, -5.383544921875, -5.1903076171875, -4.9970703125, -4.8038330078125, -4.610595703125, -4.4173583984375, -4.22412109375, -4.0308837890625, -3.837646484375, -3.6444091796875, -3.451171875, -3.2579345703125, -3.064697265625, -2.8714599609375, -2.67822265625, -2.4849853515625, -2.291748046875, -2.0985107421875, -1.9052734375, -1.7120361328125, -1.518798828125, -1.3255615234375, -1.13232421875, -0.9390869140625, -0.745849609375, -0.5526123046875, -0.359375, -0.1661376953125, 0.027099609375, 0.2203369140625, 0.41357421875, 0.6068115234375, 0.800048828125, 0.9932861328125, 1.1865234375, 1.3797607421875, 1.572998046875, 1.7662353515625, 1.95947265625, 2.1527099609375, 2.345947265625, 2.5391845703125, 2.732421875, 2.9256591796875, 3.118896484375, 3.3121337890625, 3.50537109375, 3.6986083984375, 3.891845703125, 4.0850830078125, 4.2783203125, 4.4715576171875, 4.664794921875, 4.8580322265625, 5.05126953125, 5.2445068359375, 5.437744140625, 5.6309814453125, 5.82421875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 16.0, 17.0, 22.0, 39.0, 38.0, 82.0, 92.0, 159.0, 301.0, 447.0, 711.0, 1063.0, 1789.0, 2896.0, 4912.0, 8747.0, 15956.0, 31083.0, 63219.0, 130513.0, 236922.0, 252239.0, 148285.0, 72247.0, 35144.0, 17922.0, 9874.0, 5464.0, 3164.0, 1929.0, 1188.0, 738.0, 486.0, 306.0, 173.0, 133.0, 80.0, 60.0, 26.0, 25.0, 20.0, 9.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6796875, -5.49700927734375, -5.3143310546875, -5.13165283203125, -4.948974609375, -4.76629638671875, -4.5836181640625, -4.40093994140625, -4.21826171875, -4.03558349609375, -3.8529052734375, -3.67022705078125, -3.487548828125, -3.30487060546875, -3.1221923828125, -2.93951416015625, -2.7568359375, -2.57415771484375, -2.3914794921875, -2.20880126953125, -2.026123046875, -1.84344482421875, -1.6607666015625, -1.47808837890625, -1.29541015625, -1.11273193359375, -0.9300537109375, -0.74737548828125, -0.564697265625, -0.38201904296875, -0.1993408203125, -0.01666259765625, 0.166015625, 0.34869384765625, 0.5313720703125, 0.71405029296875, 0.896728515625, 1.07940673828125, 1.2620849609375, 1.44476318359375, 1.62744140625, 1.81011962890625, 1.9927978515625, 2.17547607421875, 2.358154296875, 2.54083251953125, 2.7235107421875, 2.90618896484375, 3.0888671875, 3.27154541015625, 3.4542236328125, 3.63690185546875, 3.819580078125, 4.00225830078125, 4.1849365234375, 4.36761474609375, 4.55029296875, 4.73297119140625, 4.9156494140625, 5.09832763671875, 5.281005859375, 5.46368408203125, 5.6463623046875, 5.82904052734375, 6.01171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 7.0, 9.0, 9.0, 28.0, 23.0, 31.0, 30.0, 41.0, 49.0, 63.0, 81.0, 85.0, 75.0, 77.0, 70.0, 54.0, 63.0, 44.0, 32.0, 20.0, 25.0, 12.0, 10.0, 10.0, 10.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003352165222167969, -0.0003203153610229492, -0.00030541419982910156, -0.0002905130386352539, -0.00027561187744140625, -0.0002607107162475586, -0.00024580955505371094, -0.00023090839385986328, -0.00021600723266601562, -0.00020110607147216797, -0.0001862049102783203, -0.00017130374908447266, -0.000156402587890625, -0.00014150142669677734, -0.0001266002655029297, -0.00011169910430908203, -9.679794311523438e-05, -8.189678192138672e-05, -6.699562072753906e-05, -5.2094459533691406e-05, -3.719329833984375e-05, -2.2292137145996094e-05, -7.3909759521484375e-06, 7.510185241699219e-06, 2.2411346435546875e-05, 3.731250762939453e-05, 5.221366882324219e-05, 6.711483001708984e-05, 8.20159912109375e-05, 9.691715240478516e-05, 0.00011181831359863281, 0.00012671947479248047, 0.00014162063598632812, 0.00015652179718017578, 0.00017142295837402344, 0.0001863241195678711, 0.00020122528076171875, 0.0002161264419555664, 0.00023102760314941406, 0.0002459287643432617, 0.0002608299255371094, 0.00027573108673095703, 0.0002906322479248047, 0.00030553340911865234, 0.0003204345703125, 0.00033533573150634766, 0.0003502368927001953, 0.00036513805389404297, 0.0003800392150878906, 0.0003949403762817383, 0.00040984153747558594, 0.0004247426986694336, 0.00043964385986328125, 0.0004545450210571289, 0.00046944618225097656, 0.0004843473434448242, 0.0004992485046386719, 0.0005141496658325195, 0.0005290508270263672, 0.0005439519882202148, 0.0005588531494140625, 0.0005737543106079102, 0.0005886554718017578, 0.0006035566329956055, 0.0006184577941894531]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 9.0, 11.0, 10.0, 15.0, 33.0, 43.0, 56.0, 79.0, 103.0, 139.0, 245.0, 379.0, 561.0, 953.0, 1560.0, 2764.0, 5090.0, 9860.0, 20535.0, 44515.0, 99783.0, 208832.0, 285699.0, 195431.0, 91809.0, 40651.0, 18820.0, 9254.0, 4703.0, 2588.0, 1521.0, 888.0, 549.0, 300.0, 233.0, 169.0, 103.0, 72.0, 49.0, 43.0, 26.0, 15.0, 13.0, 14.0, 5.0, 9.0, 2.0, 3.0, 0.0, 1.0, 4.0, 2.0, 2.0], "bins": [-6.0546875, -5.8736572265625, -5.692626953125, -5.5115966796875, -5.33056640625, -5.1495361328125, -4.968505859375, -4.7874755859375, -4.6064453125, -4.4254150390625, -4.244384765625, -4.0633544921875, -3.88232421875, -3.7012939453125, -3.520263671875, -3.3392333984375, -3.158203125, -2.9771728515625, -2.796142578125, -2.6151123046875, -2.43408203125, -2.2530517578125, -2.072021484375, -1.8909912109375, -1.7099609375, -1.5289306640625, -1.347900390625, -1.1668701171875, -0.98583984375, -0.8048095703125, -0.623779296875, -0.4427490234375, -0.26171875, -0.0806884765625, 0.100341796875, 0.2813720703125, 0.46240234375, 0.6434326171875, 0.824462890625, 1.0054931640625, 1.1865234375, 1.3675537109375, 1.548583984375, 1.7296142578125, 1.91064453125, 2.0916748046875, 2.272705078125, 2.4537353515625, 2.634765625, 2.8157958984375, 2.996826171875, 3.1778564453125, 3.35888671875, 3.5399169921875, 3.720947265625, 3.9019775390625, 4.0830078125, 4.2640380859375, 4.445068359375, 4.6260986328125, 4.80712890625, 4.9881591796875, 5.169189453125, 5.3502197265625, 5.53125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 6.0, 9.0, 12.0, 9.0, 16.0, 16.0, 35.0, 43.0, 62.0, 63.0, 88.0, 98.0, 97.0, 106.0, 71.0, 64.0, 47.0, 43.0, 24.0, 22.0, 12.0, 12.0, 15.0, 6.0, 6.0, 6.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.224609375, -2.149261474609375, -2.07391357421875, -1.998565673828125, -1.9232177734375, -1.847869873046875, -1.77252197265625, -1.697174072265625, -1.621826171875, -1.546478271484375, -1.47113037109375, -1.395782470703125, -1.3204345703125, -1.245086669921875, -1.16973876953125, -1.094390869140625, -1.01904296875, -0.943695068359375, -0.86834716796875, -0.792999267578125, -0.7176513671875, -0.642303466796875, -0.56695556640625, -0.491607666015625, -0.416259765625, -0.340911865234375, -0.26556396484375, -0.190216064453125, -0.1148681640625, -0.039520263671875, 0.03582763671875, 0.111175537109375, 0.1865234375, 0.261871337890625, 0.33721923828125, 0.412567138671875, 0.4879150390625, 0.563262939453125, 0.63861083984375, 0.713958740234375, 0.789306640625, 0.864654541015625, 0.94000244140625, 1.015350341796875, 1.0906982421875, 1.166046142578125, 1.24139404296875, 1.316741943359375, 1.39208984375, 1.467437744140625, 1.54278564453125, 1.618133544921875, 1.6934814453125, 1.768829345703125, 1.84417724609375, 1.919525146484375, 1.994873046875, 2.070220947265625, 2.14556884765625, 2.220916748046875, 2.2962646484375, 2.371612548828125, 2.44696044921875, 2.522308349609375, 2.59765625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 5.0, 10.0, 17.0, 19.0, 33.0, 66.0, 72.0, 83.0, 109.0, 126.0, 116.0, 76.0, 74.0, 55.0, 37.0, 27.0, 21.0, 18.0, 9.0, 3.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0], "bins": [-22.312911987304688, -21.832881927490234, -21.352853775024414, -20.87282371520996, -20.392793655395508, -19.912765502929688, -19.432735443115234, -18.95270538330078, -18.47267723083496, -17.992647171020508, -17.512619018554688, -17.032588958740234, -16.55255889892578, -16.07253074645996, -15.592500686645508, -15.112471580505371, -14.632441520690918, -14.152412414550781, -13.672382354736328, -13.192353248596191, -12.712324142456055, -12.232294082641602, -11.752264976501465, -11.272235870361328, -10.792205810546875, -10.312176704406738, -9.832146644592285, -9.352117538452148, -8.872088432312012, -8.392059326171875, -7.912029266357422, -7.432000160217285, -6.951970100402832, -6.471940517425537, -5.9919114112854, -5.5118818283081055, -5.031852722167969, -4.551823139190674, -4.071793556213379, -3.591764211654663, -3.1117348670959473, -2.6317055225372314, -2.1516761779785156, -1.6716465950012207, -1.1916172504425049, -0.7115879058837891, -0.23155832290649414, 0.24847102165222168, 0.7285003662109375, 1.2085297107696533, 1.6885591745376587, 2.168588638305664, 2.64861798286438, 3.1286473274230957, 3.6086769104003906, 4.088706016540527, 4.568735599517822, 5.048765182495117, 5.528794288635254, 6.008823871612549, 6.488853454589844, 6.9688825607299805, 7.448912143707275, 7.92894172668457, 8.408970832824707]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 8.0, 3.0, 6.0, 11.0, 10.0, 12.0, 11.0, 12.0, 11.0, 22.0, 19.0, 14.0, 34.0, 40.0, 34.0, 26.0, 47.0, 29.0, 29.0, 51.0, 43.0, 45.0, 42.0, 39.0, 42.0, 37.0, 41.0, 40.0, 41.0, 34.0, 21.0, 22.0, 20.0, 16.0, 20.0, 13.0, 10.0, 9.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-6.974536895751953, -6.759966850280762, -6.545396327972412, -6.3308258056640625, -6.116255760192871, -5.90168571472168, -5.68711519241333, -5.4725446701049805, -5.257974624633789, -5.043404579162598, -4.828834056854248, -4.614263534545898, -4.399693489074707, -4.185123443603516, -3.970552921295166, -3.7559826374053955, -3.541412353515625, -3.3268420696258545, -3.112271785736084, -2.8977015018463135, -2.683131217956543, -2.4685609340667725, -2.253990650177002, -2.0394203662872314, -1.824850082397461, -1.6102797985076904, -1.39570951461792, -1.1811392307281494, -0.9665689468383789, -0.7519986629486084, -0.5374283790588379, -0.3228580951690674, -0.10828733444213867, 0.10628294944763184, 0.32085323333740234, 0.5354235172271729, 0.7499938011169434, 0.9645640850067139, 1.1791343688964844, 1.3937046527862549, 1.6082749366760254, 1.822845220565796, 2.0374155044555664, 2.251985788345337, 2.4665560722351074, 2.681126356124878, 2.8956966400146484, 3.110266923904419, 3.3248372077941895, 3.53940749168396, 3.7539777755737305, 3.968548059463501, 4.1831183433532715, 4.397688865661621, 4.6122589111328125, 4.826828956604004, 5.0413994789123535, 5.255970001220703, 5.4705400466918945, 5.685110092163086, 5.8996806144714355, 6.114251136779785, 6.328821182250977, 6.543391227722168, 6.757961750030518]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 13.0, 7.0, 22.0, 30.0, 43.0, 66.0, 75.0, 128.0, 201.0, 245.0, 401.0, 553.0, 878.0, 1197.0, 1810.0, 2629.0, 4247.0, 6712.0, 11056.0, 20109.0, 40163.0, 96840.0, 280401.0, 849752.0, 1492744.0, 895756.0, 296332.0, 100727.0, 41135.0, 19846.0, 10991.0, 6558.0, 4083.0, 2785.0, 1741.0, 1220.0, 858.0, 547.0, 396.0, 301.0, 224.0, 138.0, 103.0, 76.0, 39.0, 34.0, 29.0, 12.0, 21.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0], "bins": [-11.7421875, -11.3919677734375, -11.041748046875, -10.6915283203125, -10.34130859375, -9.9910888671875, -9.640869140625, -9.2906494140625, -8.9404296875, -8.5902099609375, -8.239990234375, -7.8897705078125, -7.53955078125, -7.1893310546875, -6.839111328125, -6.4888916015625, -6.138671875, -5.7884521484375, -5.438232421875, -5.0880126953125, -4.73779296875, -4.3875732421875, -4.037353515625, -3.6871337890625, -3.3369140625, -2.9866943359375, -2.636474609375, -2.2862548828125, -1.93603515625, -1.5858154296875, -1.235595703125, -0.8853759765625, -0.53515625, -0.1849365234375, 0.165283203125, 0.5155029296875, 0.86572265625, 1.2159423828125, 1.566162109375, 1.9163818359375, 2.2666015625, 2.6168212890625, 2.967041015625, 3.3172607421875, 3.66748046875, 4.0177001953125, 4.367919921875, 4.7181396484375, 5.068359375, 5.4185791015625, 5.768798828125, 6.1190185546875, 6.46923828125, 6.8194580078125, 7.169677734375, 7.5198974609375, 7.8701171875, 8.2203369140625, 8.570556640625, 8.9207763671875, 9.27099609375, 9.6212158203125, 9.971435546875, 10.3216552734375, 10.671875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 2.0, 3.0, 6.0, 8.0, 3.0, 8.0, 10.0, 17.0, 14.0, 19.0, 22.0, 23.0, 24.0, 48.0, 31.0, 35.0, 41.0, 38.0, 47.0, 36.0, 53.0, 38.0, 43.0, 35.0, 46.0, 42.0, 42.0, 36.0, 29.0, 35.0, 29.0, 29.0, 18.0, 19.0, 14.0, 12.0, 12.0, 4.0, 6.0, 2.0, 9.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-4.78515625, -4.6336669921875, -4.482177734375, -4.3306884765625, -4.17919921875, -4.0277099609375, -3.876220703125, -3.7247314453125, -3.5732421875, -3.4217529296875, -3.270263671875, -3.1187744140625, -2.96728515625, -2.8157958984375, -2.664306640625, -2.5128173828125, -2.361328125, -2.2098388671875, -2.058349609375, -1.9068603515625, -1.75537109375, -1.6038818359375, -1.452392578125, -1.3009033203125, -1.1494140625, -0.9979248046875, -0.846435546875, -0.6949462890625, -0.54345703125, -0.3919677734375, -0.240478515625, -0.0889892578125, 0.0625, 0.2139892578125, 0.365478515625, 0.5169677734375, 0.66845703125, 0.8199462890625, 0.971435546875, 1.1229248046875, 1.2744140625, 1.4259033203125, 1.577392578125, 1.7288818359375, 1.88037109375, 2.0318603515625, 2.183349609375, 2.3348388671875, 2.486328125, 2.6378173828125, 2.789306640625, 2.9407958984375, 3.09228515625, 3.2437744140625, 3.395263671875, 3.5467529296875, 3.6982421875, 3.8497314453125, 4.001220703125, 4.1527099609375, 4.30419921875, 4.4556884765625, 4.607177734375, 4.7586669921875, 4.91015625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 6.0, 16.0, 14.0, 20.0, 27.0, 55.0, 76.0, 93.0, 148.0, 238.0, 349.0, 584.0, 875.0, 1403.0, 2361.0, 3903.0, 6657.0, 11571.0, 21220.0, 42003.0, 93784.0, 245867.0, 697837.0, 1389951.0, 1027406.0, 385821.0, 139917.0, 57928.0, 28268.0, 14889.0, 8483.0, 4723.0, 2933.0, 1814.0, 1118.0, 672.0, 435.0, 293.0, 186.0, 128.0, 73.0, 46.0, 36.0, 27.0, 14.0, 11.0, 4.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.93310546875, -10.5771484375, -10.22119140625, -9.865234375, -9.50927734375, -9.1533203125, -8.79736328125, -8.44140625, -8.08544921875, -7.7294921875, -7.37353515625, -7.017578125, -6.66162109375, -6.3056640625, -5.94970703125, -5.59375, -5.23779296875, -4.8818359375, -4.52587890625, -4.169921875, -3.81396484375, -3.4580078125, -3.10205078125, -2.74609375, -2.39013671875, -2.0341796875, -1.67822265625, -1.322265625, -0.96630859375, -0.6103515625, -0.25439453125, 0.1015625, 0.45751953125, 0.8134765625, 1.16943359375, 1.525390625, 1.88134765625, 2.2373046875, 2.59326171875, 2.94921875, 3.30517578125, 3.6611328125, 4.01708984375, 4.373046875, 4.72900390625, 5.0849609375, 5.44091796875, 5.796875, 6.15283203125, 6.5087890625, 6.86474609375, 7.220703125, 7.57666015625, 7.9326171875, 8.28857421875, 8.64453125, 9.00048828125, 9.3564453125, 9.71240234375, 10.068359375, 10.42431640625, 10.7802734375, 11.13623046875, 11.4921875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 7.0, 11.0, 17.0, 17.0, 19.0, 17.0, 26.0, 37.0, 51.0, 48.0, 73.0, 121.0, 138.0, 175.0, 218.0, 249.0, 324.0, 318.0, 351.0, 335.0, 289.0, 287.0, 215.0, 178.0, 126.0, 93.0, 87.0, 60.0, 34.0, 35.0, 22.0, 21.0, 25.0, 11.0, 12.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-3.646484375, -3.546051025390625, -3.44561767578125, -3.345184326171875, -3.2447509765625, -3.144317626953125, -3.04388427734375, -2.943450927734375, -2.843017578125, -2.742584228515625, -2.64215087890625, -2.541717529296875, -2.4412841796875, -2.340850830078125, -2.24041748046875, -2.139984130859375, -2.03955078125, -1.939117431640625, -1.83868408203125, -1.738250732421875, -1.6378173828125, -1.537384033203125, -1.43695068359375, -1.336517333984375, -1.236083984375, -1.135650634765625, -1.03521728515625, -0.934783935546875, -0.8343505859375, -0.733917236328125, -0.63348388671875, -0.533050537109375, -0.4326171875, -0.332183837890625, -0.23175048828125, -0.131317138671875, -0.0308837890625, 0.069549560546875, 0.16998291015625, 0.270416259765625, 0.370849609375, 0.471282958984375, 0.57171630859375, 0.672149658203125, 0.7725830078125, 0.873016357421875, 0.97344970703125, 1.073883056640625, 1.17431640625, 1.274749755859375, 1.37518310546875, 1.475616455078125, 1.5760498046875, 1.676483154296875, 1.77691650390625, 1.877349853515625, 1.977783203125, 2.078216552734375, 2.17864990234375, 2.279083251953125, 2.3795166015625, 2.479949951171875, 2.58038330078125, 2.680816650390625, 2.78125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 12.0, 10.0, 11.0, 8.0, 25.0, 26.0, 48.0, 62.0, 83.0, 103.0, 104.0, 107.0, 113.0, 84.0, 62.0, 41.0, 32.0, 14.0, 11.0, 9.0, 8.0, 7.0, 6.0, 3.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.898653030395508, -16.463951110839844, -16.029247283935547, -15.594545364379883, -15.159843444824219, -14.725141525268555, -14.290438652038574, -13.855735778808594, -13.42103385925293, -12.986331939697266, -12.551629066467285, -12.116926193237305, -11.68222427368164, -11.247522354125977, -10.812819480895996, -10.378116607666016, -9.943414688110352, -9.508712768554688, -9.074009895324707, -8.639307022094727, -8.204605102539062, -7.76990270614624, -7.335200309753418, -6.900497913360596, -6.465795516967773, -6.031093120574951, -5.596390724182129, -5.161688327789307, -4.726985931396484, -4.292283535003662, -3.85758113861084, -3.4228787422180176, -2.9881763458251953, -2.553473949432373, -2.118771553039551, -1.6840691566467285, -1.2493667602539062, -0.814664363861084, -0.3799619674682617, 0.05474042892456055, 0.4894428253173828, 0.9241452217102051, 1.3588476181030273, 1.7935500144958496, 2.228252410888672, 2.662954807281494, 3.0976572036743164, 3.5323596000671387, 3.967061996459961, 4.401764392852783, 4.8364667892456055, 5.271169185638428, 5.70587158203125, 6.140573978424072, 6.5752763748168945, 7.009978771209717, 7.444681167602539, 7.879383563995361, 8.314085960388184, 8.748788833618164, 9.183490753173828, 9.618192672729492, 10.052895545959473, 10.487598419189453, 10.922300338745117]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 8.0, 6.0, 10.0, 8.0, 16.0, 12.0, 12.0, 24.0, 35.0, 27.0, 25.0, 38.0, 23.0, 30.0, 39.0, 49.0, 46.0, 46.0, 42.0, 45.0, 48.0, 46.0, 35.0, 45.0, 33.0, 34.0, 30.0, 26.0, 23.0, 24.0, 20.0, 17.0, 10.0, 14.0, 13.0, 5.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.5228424072265625, -6.318317413330078, -6.113792896270752, -5.909267902374268, -5.704742908477783, -5.500218391418457, -5.295693397521973, -5.091168403625488, -4.886643409729004, -4.6821184158325195, -4.477593898773193, -4.273068904876709, -4.068543910980225, -3.8640191555023193, -3.659494400024414, -3.4549694061279297, -3.2504448890686035, -3.0459201335906982, -2.841395139694214, -2.6368703842163086, -2.432345390319824, -2.227820634841919, -2.0232958793640137, -1.8187710046768188, -1.614246129989624, -1.4097212553024292, -1.2051963806152344, -1.000671625137329, -0.7961467504501343, -0.5916218757629395, -0.3870971202850342, -0.18257224559783936, 0.02195262908935547, 0.2264774739742279, 0.43100231885910034, 0.6355271339416504, 0.8400520086288452, 1.04457688331604, 1.2491016387939453, 1.4536265134811401, 1.658151388168335, 1.8626762628555298, 2.0672011375427246, 2.27172589302063, 2.476250648498535, 2.6807756423950195, 2.885300397872925, 3.08982515335083, 3.2943501472473145, 3.4988749027252197, 3.703399896621704, 3.9079246520996094, 4.112449645996094, 4.316974639892578, 4.521499156951904, 4.726024150848389, 4.930548667907715, 5.135073661804199, 5.339598178863525, 5.54412317276001, 5.748648166656494, 5.95317268371582, 6.157697677612305, 6.362222671508789, 6.566747665405273]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 6.0, 8.0, 16.0, 6.0, 19.0, 34.0, 47.0, 66.0, 107.0, 158.0, 194.0, 319.0, 517.0, 715.0, 1138.0, 1837.0, 2895.0, 4740.0, 7895.0, 13871.0, 25092.0, 46797.0, 88202.0, 157128.0, 220225.0, 200159.0, 125540.0, 67672.0, 35798.0, 19567.0, 10995.0, 6361.0, 3771.0, 2322.0, 1498.0, 947.0, 605.0, 428.0, 275.0, 189.0, 122.0, 86.0, 82.0, 40.0, 23.0, 21.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-3.76171875, -3.653594970703125, -3.54547119140625, -3.437347412109375, -3.3292236328125, -3.221099853515625, -3.11297607421875, -3.004852294921875, -2.896728515625, -2.788604736328125, -2.68048095703125, -2.572357177734375, -2.4642333984375, -2.356109619140625, -2.24798583984375, -2.139862060546875, -2.03173828125, -1.923614501953125, -1.81549072265625, -1.707366943359375, -1.5992431640625, -1.491119384765625, -1.38299560546875, -1.274871826171875, -1.166748046875, -1.058624267578125, -0.95050048828125, -0.842376708984375, -0.7342529296875, -0.626129150390625, -0.51800537109375, -0.409881591796875, -0.3017578125, -0.193634033203125, -0.08551025390625, 0.022613525390625, 0.1307373046875, 0.238861083984375, 0.34698486328125, 0.455108642578125, 0.563232421875, 0.671356201171875, 0.77947998046875, 0.887603759765625, 0.9957275390625, 1.103851318359375, 1.21197509765625, 1.320098876953125, 1.42822265625, 1.536346435546875, 1.64447021484375, 1.752593994140625, 1.8607177734375, 1.968841552734375, 2.07696533203125, 2.185089111328125, 2.293212890625, 2.401336669921875, 2.50946044921875, 2.617584228515625, 2.7257080078125, 2.833831787109375, 2.94195556640625, 3.050079345703125, 3.158203125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 5.0, 5.0, 7.0, 9.0, 8.0, 13.0, 17.0, 32.0, 26.0, 14.0, 30.0, 28.0, 35.0, 42.0, 37.0, 33.0, 56.0, 51.0, 61.0, 43.0, 48.0, 42.0, 46.0, 35.0, 32.0, 39.0, 27.0, 29.0, 19.0, 23.0, 15.0, 21.0, 9.0, 16.0, 3.0, 8.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.0625, -6.8323974609375, -6.602294921875, -6.3721923828125, -6.14208984375, -5.9119873046875, -5.681884765625, -5.4517822265625, -5.2216796875, -4.9915771484375, -4.761474609375, -4.5313720703125, -4.30126953125, -4.0711669921875, -3.841064453125, -3.6109619140625, -3.380859375, -3.1507568359375, -2.920654296875, -2.6905517578125, -2.46044921875, -2.2303466796875, -2.000244140625, -1.7701416015625, -1.5400390625, -1.3099365234375, -1.079833984375, -0.8497314453125, -0.61962890625, -0.3895263671875, -0.159423828125, 0.0706787109375, 0.30078125, 0.5308837890625, 0.760986328125, 0.9910888671875, 1.22119140625, 1.4512939453125, 1.681396484375, 1.9114990234375, 2.1416015625, 2.3717041015625, 2.601806640625, 2.8319091796875, 3.06201171875, 3.2921142578125, 3.522216796875, 3.7523193359375, 3.982421875, 4.2125244140625, 4.442626953125, 4.6727294921875, 4.90283203125, 5.1329345703125, 5.363037109375, 5.5931396484375, 5.8232421875, 6.0533447265625, 6.283447265625, 6.5135498046875, 6.74365234375, 6.9737548828125, 7.203857421875, 7.4339599609375, 7.6640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 11.0, 14.0, 20.0, 20.0, 31.0, 45.0, 62.0, 80.0, 114.0, 157.0, 244.0, 293.0, 476.0, 717.0, 1120.0, 1643.0, 2708.0, 4233.0, 6996.0, 12577.0, 22852.0, 41910.0, 79970.0, 146193.0, 224220.0, 213420.0, 131520.0, 70487.0, 37572.0, 20098.0, 11202.0, 6510.0, 4031.0, 2336.0, 1486.0, 966.0, 675.0, 473.0, 313.0, 237.0, 152.0, 106.0, 80.0, 45.0, 44.0, 30.0, 28.0, 13.0, 9.0, 8.0, 1.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-3.451171875, -3.339508056640625, -3.22784423828125, -3.116180419921875, -3.0045166015625, -2.892852783203125, -2.78118896484375, -2.669525146484375, -2.557861328125, -2.446197509765625, -2.33453369140625, -2.222869873046875, -2.1112060546875, -1.999542236328125, -1.88787841796875, -1.776214599609375, -1.66455078125, -1.552886962890625, -1.44122314453125, -1.329559326171875, -1.2178955078125, -1.106231689453125, -0.99456787109375, -0.882904052734375, -0.771240234375, -0.659576416015625, -0.54791259765625, -0.436248779296875, -0.3245849609375, -0.212921142578125, -0.10125732421875, 0.010406494140625, 0.1220703125, 0.233734130859375, 0.34539794921875, 0.457061767578125, 0.5687255859375, 0.680389404296875, 0.79205322265625, 0.903717041015625, 1.015380859375, 1.127044677734375, 1.23870849609375, 1.350372314453125, 1.4620361328125, 1.573699951171875, 1.68536376953125, 1.797027587890625, 1.90869140625, 2.020355224609375, 2.13201904296875, 2.243682861328125, 2.3553466796875, 2.467010498046875, 2.57867431640625, 2.690338134765625, 2.802001953125, 2.913665771484375, 3.02532958984375, 3.136993408203125, 3.2486572265625, 3.360321044921875, 3.47198486328125, 3.583648681640625, 3.6953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 6.0, 11.0, 16.0, 21.0, 12.0, 13.0, 22.0, 24.0, 23.0, 27.0, 24.0, 37.0, 29.0, 44.0, 31.0, 47.0, 25.0, 45.0, 30.0, 35.0, 38.0, 29.0, 39.0, 34.0, 35.0, 33.0, 28.0, 27.0, 27.0, 26.0, 24.0, 21.0, 19.0, 16.0, 12.0, 13.0, 7.0, 11.0, 9.0, 5.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.41015625, -3.30206298828125, -3.1939697265625, -3.08587646484375, -2.977783203125, -2.86968994140625, -2.7615966796875, -2.65350341796875, -2.54541015625, -2.43731689453125, -2.3292236328125, -2.22113037109375, -2.113037109375, -2.00494384765625, -1.8968505859375, -1.78875732421875, -1.6806640625, -1.57257080078125, -1.4644775390625, -1.35638427734375, -1.248291015625, -1.14019775390625, -1.0321044921875, -0.92401123046875, -0.81591796875, -0.70782470703125, -0.5997314453125, -0.49163818359375, -0.383544921875, -0.27545166015625, -0.1673583984375, -0.05926513671875, 0.048828125, 0.15692138671875, 0.2650146484375, 0.37310791015625, 0.481201171875, 0.58929443359375, 0.6973876953125, 0.80548095703125, 0.91357421875, 1.02166748046875, 1.1297607421875, 1.23785400390625, 1.345947265625, 1.45404052734375, 1.5621337890625, 1.67022705078125, 1.7783203125, 1.88641357421875, 1.9945068359375, 2.10260009765625, 2.210693359375, 2.31878662109375, 2.4268798828125, 2.53497314453125, 2.64306640625, 2.75115966796875, 2.8592529296875, 2.96734619140625, 3.075439453125, 3.18353271484375, 3.2916259765625, 3.39971923828125, 3.5078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 5.0, 11.0, 12.0, 17.0, 22.0, 22.0, 49.0, 47.0, 80.0, 89.0, 154.0, 211.0, 362.0, 642.0, 969.0, 1709.0, 3057.0, 5482.0, 10704.0, 21590.0, 47945.0, 116188.0, 274946.0, 312961.0, 140950.0, 57719.0, 25392.0, 12483.0, 6377.0, 3356.0, 1977.0, 1110.0, 683.0, 418.0, 278.0, 160.0, 110.0, 77.0, 46.0, 48.0, 23.0, 19.0, 17.0, 8.0, 14.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-2.330078125, -2.25750732421875, -2.1849365234375, -2.11236572265625, -2.039794921875, -1.96722412109375, -1.8946533203125, -1.82208251953125, -1.74951171875, -1.67694091796875, -1.6043701171875, -1.53179931640625, -1.459228515625, -1.38665771484375, -1.3140869140625, -1.24151611328125, -1.1689453125, -1.09637451171875, -1.0238037109375, -0.95123291015625, -0.878662109375, -0.80609130859375, -0.7335205078125, -0.66094970703125, -0.58837890625, -0.51580810546875, -0.4432373046875, -0.37066650390625, -0.298095703125, -0.22552490234375, -0.1529541015625, -0.08038330078125, -0.0078125, 0.06475830078125, 0.1373291015625, 0.20989990234375, 0.282470703125, 0.35504150390625, 0.4276123046875, 0.50018310546875, 0.57275390625, 0.64532470703125, 0.7178955078125, 0.79046630859375, 0.863037109375, 0.93560791015625, 1.0081787109375, 1.08074951171875, 1.1533203125, 1.22589111328125, 1.2984619140625, 1.37103271484375, 1.443603515625, 1.51617431640625, 1.5887451171875, 1.66131591796875, 1.73388671875, 1.80645751953125, 1.8790283203125, 1.95159912109375, 2.024169921875, 2.09674072265625, 2.1693115234375, 2.24188232421875, 2.314453125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 8.0, 3.0, 12.0, 15.0, 24.0, 29.0, 45.0, 58.0, 71.0, 93.0, 97.0, 109.0, 104.0, 74.0, 70.0, 52.0, 48.0, 29.0, 25.0, 15.0, 6.0, 7.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011557340621948242, -0.00011135917156934738, -0.00010714493691921234, -0.0001029307022690773, -9.871646761894226e-05, -9.450223296880722e-05, -9.028799831867218e-05, -8.607376366853714e-05, -8.18595290184021e-05, -7.764529436826706e-05, -7.343105971813202e-05, -6.921682506799698e-05, -6.500259041786194e-05, -6.07883557677269e-05, -5.657412111759186e-05, -5.235988646745682e-05, -4.814565181732178e-05, -4.393141716718674e-05, -3.97171825170517e-05, -3.5502947866916656e-05, -3.1288713216781616e-05, -2.7074478566646576e-05, -2.2860243916511536e-05, -1.8646009266376495e-05, -1.4431774616241455e-05, -1.0217539966106415e-05, -6.0033053159713745e-06, -1.7890706658363342e-06, 2.425163984298706e-06, 6.639398634433746e-06, 1.0853633284568787e-05, 1.5067867934703827e-05, 1.9282102584838867e-05, 2.3496337234973907e-05, 2.7710571885108948e-05, 3.192480653524399e-05, 3.613904118537903e-05, 4.035327583551407e-05, 4.456751048564911e-05, 4.878174513578415e-05, 5.299597978591919e-05, 5.721021443605423e-05, 6.142444908618927e-05, 6.563868373632431e-05, 6.985291838645935e-05, 7.406715303659439e-05, 7.828138768672943e-05, 8.249562233686447e-05, 8.670985698699951e-05, 9.092409163713455e-05, 9.513832628726959e-05, 9.935256093740463e-05, 0.00010356679558753967, 0.00010778103023767471, 0.00011199526488780975, 0.0001162094995379448, 0.00012042373418807983, 0.00012463796883821487, 0.00012885220348834991, 0.00013306643813848495, 0.00013728067278862, 0.00014149490743875504, 0.00014570914208889008, 0.00014992337673902512, 0.00015413761138916016]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 8.0, 10.0, 18.0, 19.0, 25.0, 56.0, 78.0, 129.0, 191.0, 296.0, 458.0, 735.0, 1299.0, 2162.0, 3820.0, 6881.0, 13817.0, 30205.0, 71794.0, 175588.0, 314336.0, 239409.0, 104900.0, 42722.0, 18876.0, 9224.0, 4697.0, 2697.0, 1568.0, 924.0, 607.0, 354.0, 206.0, 147.0, 101.0, 66.0, 40.0, 30.0, 20.0, 15.0, 6.0, 3.0, 3.0, 6.0, 4.0, 5.0, 3.0], "bins": [-2.70703125, -2.6352386474609375, -2.563446044921875, -2.4916534423828125, -2.41986083984375, -2.3480682373046875, -2.276275634765625, -2.2044830322265625, -2.1326904296875, -2.0608978271484375, -1.989105224609375, -1.9173126220703125, -1.84552001953125, -1.7737274169921875, -1.701934814453125, -1.6301422119140625, -1.558349609375, -1.4865570068359375, -1.414764404296875, -1.3429718017578125, -1.27117919921875, -1.1993865966796875, -1.127593994140625, -1.0558013916015625, -0.9840087890625, -0.9122161865234375, -0.840423583984375, -0.7686309814453125, -0.69683837890625, -0.6250457763671875, -0.553253173828125, -0.4814605712890625, -0.40966796875, -0.3378753662109375, -0.266082763671875, -0.1942901611328125, -0.12249755859375, -0.0507049560546875, 0.021087646484375, 0.0928802490234375, 0.1646728515625, 0.2364654541015625, 0.308258056640625, 0.3800506591796875, 0.45184326171875, 0.5236358642578125, 0.595428466796875, 0.6672210693359375, 0.739013671875, 0.8108062744140625, 0.882598876953125, 0.9543914794921875, 1.02618408203125, 1.0979766845703125, 1.169769287109375, 1.2415618896484375, 1.3133544921875, 1.3851470947265625, 1.456939697265625, 1.5287322998046875, 1.60052490234375, 1.6723175048828125, 1.744110107421875, 1.8159027099609375, 1.8876953125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 8.0, 11.0, 8.0, 22.0, 19.0, 37.0, 28.0, 40.0, 49.0, 50.0, 54.0, 67.0, 58.0, 79.0, 62.0, 55.0, 63.0, 45.0, 50.0, 24.0, 36.0, 37.0, 22.0, 15.0, 14.0, 5.0, 10.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58935546875, -0.5704879760742188, -0.5516204833984375, -0.5327529907226562, -0.513885498046875, -0.49501800537109375, -0.4761505126953125, -0.45728302001953125, -0.43841552734375, -0.41954803466796875, -0.4006805419921875, -0.38181304931640625, -0.362945556640625, -0.34407806396484375, -0.3252105712890625, -0.30634307861328125, -0.2874755859375, -0.26860809326171875, -0.2497406005859375, -0.23087310791015625, -0.212005615234375, -0.19313812255859375, -0.1742706298828125, -0.15540313720703125, -0.13653564453125, -0.11766815185546875, -0.0988006591796875, -0.07993316650390625, -0.061065673828125, -0.04219818115234375, -0.0233306884765625, -0.00446319580078125, 0.014404296875, 0.03327178955078125, 0.0521392822265625, 0.07100677490234375, 0.089874267578125, 0.10874176025390625, 0.1276092529296875, 0.14647674560546875, 0.16534423828125, 0.18421173095703125, 0.2030792236328125, 0.22194671630859375, 0.240814208984375, 0.25968170166015625, 0.2785491943359375, 0.29741668701171875, 0.3162841796875, 0.33515167236328125, 0.3540191650390625, 0.37288665771484375, 0.391754150390625, 0.41062164306640625, 0.4294891357421875, 0.44835662841796875, 0.46722412109375, 0.48609161376953125, 0.5049591064453125, 0.5238265991210938, 0.542694091796875, 0.5615615844726562, 0.5804290771484375, 0.5992965698242188, 0.6181640625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 9.0, 10.0, 9.0, 15.0, 16.0, 31.0, 51.0, 65.0, 75.0, 108.0, 99.0, 125.0, 108.0, 81.0, 50.0, 49.0, 23.0, 20.0, 9.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.352155685424805, -16.916059494018555, -16.479961395263672, -16.043865203857422, -15.607767105102539, -15.171670913696289, -14.735572814941406, -14.299476623535156, -13.86337947845459, -13.427282333374023, -12.991185188293457, -12.55508804321289, -12.118990898132324, -11.682893753051758, -11.246797561645508, -10.810700416564941, -10.374603271484375, -9.938506126403809, -9.502408981323242, -9.066311836242676, -8.63021469116211, -8.19411849975586, -7.758020877838135, -7.321924209594727, -6.885826110839844, -6.449728965759277, -6.013631820678711, -5.5775346755981445, -5.141438007354736, -4.70534086227417, -4.2692437171936035, -3.833146810531616, -3.397049903869629, -2.9609527587890625, -2.524855852127075, -2.088758707046509, -1.652661681175232, -1.216564655303955, -0.7804675102233887, -0.34437060356140137, 0.09172654151916504, 0.5278235673904419, 0.9639206528663635, 1.4000177383422852, 1.836114764213562, 2.272211790084839, 2.7083089351654053, 3.1444058418273926, 3.580502986907959, 4.016600131988525, 4.452697277069092, 4.8887939453125, 5.324891090393066, 5.760988235473633, 6.197085380554199, 6.633182525634766, 7.069279670715332, 7.505376815795898, 7.941473960876465, 8.377571105957031, 8.813668251037598, 9.249765396118164, 9.685861587524414, 10.12195873260498, 10.558055877685547]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 11.0, 9.0, 7.0, 8.0, 17.0, 13.0, 17.0, 24.0, 36.0, 25.0, 30.0, 31.0, 25.0, 40.0, 44.0, 45.0, 43.0, 56.0, 41.0, 45.0, 45.0, 46.0, 34.0, 36.0, 36.0, 35.0, 35.0, 19.0, 21.0, 25.0, 17.0, 12.0, 13.0, 13.0, 9.0, 6.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-6.585238933563232, -6.3816914558410645, -6.1781439781188965, -5.9745965003967285, -5.771048545837402, -5.567501068115234, -5.363953590393066, -5.160406112670898, -4.9568586349487305, -4.7533111572265625, -4.5497636795043945, -4.346216201782227, -4.142668724060059, -3.9391210079193115, -3.7355732917785645, -3.5320258140563965, -3.3284783363342285, -3.1249308586120605, -2.9213833808898926, -2.7178356647491455, -2.5142881870269775, -2.3107407093048096, -2.1071929931640625, -1.9036455154418945, -1.7000980377197266, -1.4965505599975586, -1.293002963066101, -1.0894553661346436, -0.8859078884124756, -0.6823604106903076, -0.4788128137588501, -0.2752652168273926, -0.07171773910522461, 0.13182979822158813, 0.3353773355484009, 0.5389248728752136, 0.7424724102020264, 0.9460198879241943, 1.1495674848556519, 1.3531150817871094, 1.5566625595092773, 1.7602100372314453, 1.9637576341629028, 2.1673052310943604, 2.3708527088165283, 2.5744001865386963, 2.7779479026794434, 2.9814953804016113, 3.1850428581237793, 3.3885903358459473, 3.5921378135681152, 3.7956855297088623, 3.9992330074310303, 4.202780723571777, 4.406328201293945, 4.609875679016113, 4.813423156738281, 5.016970634460449, 5.220518112182617, 5.424065589904785, 5.627613067626953, 5.831160545349121, 6.034708499908447, 6.238255977630615, 6.441803455352783]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 12.0, 15.0, 32.0, 40.0, 61.0, 59.0, 135.0, 181.0, 251.0, 371.0, 547.0, 878.0, 1307.0, 2067.0, 3256.0, 5411.0, 9334.0, 15767.0, 28727.0, 52994.0, 95855.0, 156487.0, 200991.0, 184104.0, 125888.0, 72467.0, 38995.0, 21476.0, 11873.0, 7084.0, 4377.0, 2616.0, 1651.0, 1045.0, 691.0, 486.0, 310.0, 223.0, 154.0, 83.0, 71.0, 56.0, 35.0, 31.0, 11.0, 17.0, 8.0, 8.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.6015625, -6.4000244140625, -6.198486328125, -5.9969482421875, -5.79541015625, -5.5938720703125, -5.392333984375, -5.1907958984375, -4.9892578125, -4.7877197265625, -4.586181640625, -4.3846435546875, -4.18310546875, -3.9815673828125, -3.780029296875, -3.5784912109375, -3.376953125, -3.1754150390625, -2.973876953125, -2.7723388671875, -2.57080078125, -2.3692626953125, -2.167724609375, -1.9661865234375, -1.7646484375, -1.5631103515625, -1.361572265625, -1.1600341796875, -0.95849609375, -0.7569580078125, -0.555419921875, -0.3538818359375, -0.15234375, 0.0491943359375, 0.250732421875, 0.4522705078125, 0.65380859375, 0.8553466796875, 1.056884765625, 1.2584228515625, 1.4599609375, 1.6614990234375, 1.863037109375, 2.0645751953125, 2.26611328125, 2.4676513671875, 2.669189453125, 2.8707275390625, 3.072265625, 3.2738037109375, 3.475341796875, 3.6768798828125, 3.87841796875, 4.0799560546875, 4.281494140625, 4.4830322265625, 4.6845703125, 4.8861083984375, 5.087646484375, 5.2891845703125, 5.49072265625, 5.6922607421875, 5.893798828125, 6.0953369140625, 6.296875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 6.0, 6.0, 15.0, 17.0, 18.0, 26.0, 39.0, 23.0, 25.0, 37.0, 44.0, 38.0, 41.0, 44.0, 57.0, 57.0, 36.0, 52.0, 59.0, 46.0, 29.0, 38.0, 38.0, 36.0, 32.0, 16.0, 18.0, 15.0, 15.0, 13.0, 11.0, 8.0, 5.0, 4.0, 4.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.74609375, -6.51226806640625, -6.2784423828125, -6.04461669921875, -5.810791015625, -5.57696533203125, -5.3431396484375, -5.10931396484375, -4.87548828125, -4.64166259765625, -4.4078369140625, -4.17401123046875, -3.940185546875, -3.70635986328125, -3.4725341796875, -3.23870849609375, -3.0048828125, -2.77105712890625, -2.5372314453125, -2.30340576171875, -2.069580078125, -1.83575439453125, -1.6019287109375, -1.36810302734375, -1.13427734375, -0.90045166015625, -0.6666259765625, -0.43280029296875, -0.198974609375, 0.03485107421875, 0.2686767578125, 0.50250244140625, 0.736328125, 0.97015380859375, 1.2039794921875, 1.43780517578125, 1.671630859375, 1.90545654296875, 2.1392822265625, 2.37310791015625, 2.60693359375, 2.84075927734375, 3.0745849609375, 3.30841064453125, 3.542236328125, 3.77606201171875, 4.0098876953125, 4.24371337890625, 4.4775390625, 4.71136474609375, 4.9451904296875, 5.17901611328125, 5.412841796875, 5.64666748046875, 5.8804931640625, 6.11431884765625, 6.34814453125, 6.58197021484375, 6.8157958984375, 7.04962158203125, 7.283447265625, 7.51727294921875, 7.7510986328125, 7.98492431640625, 8.21875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 3.0, 5.0, 16.0, 10.0, 23.0, 36.0, 54.0, 63.0, 104.0, 175.0, 210.0, 357.0, 482.0, 711.0, 1123.0, 1710.0, 2720.0, 4101.0, 6663.0, 10718.0, 17180.0, 27830.0, 45874.0, 73337.0, 111592.0, 148560.0, 164165.0, 143737.0, 105837.0, 68861.0, 42825.0, 26254.0, 15879.0, 9838.0, 6241.0, 3889.0, 2557.0, 1590.0, 1060.0, 707.0, 451.0, 327.0, 229.0, 130.0, 104.0, 74.0, 39.0, 33.0, 23.0, 13.0, 12.0, 13.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-5.32421875, -5.1600341796875, -4.995849609375, -4.8316650390625, -4.66748046875, -4.5032958984375, -4.339111328125, -4.1749267578125, -4.0107421875, -3.8465576171875, -3.682373046875, -3.5181884765625, -3.35400390625, -3.1898193359375, -3.025634765625, -2.8614501953125, -2.697265625, -2.5330810546875, -2.368896484375, -2.2047119140625, -2.04052734375, -1.8763427734375, -1.712158203125, -1.5479736328125, -1.3837890625, -1.2196044921875, -1.055419921875, -0.8912353515625, -0.72705078125, -0.5628662109375, -0.398681640625, -0.2344970703125, -0.0703125, 0.0938720703125, 0.258056640625, 0.4222412109375, 0.58642578125, 0.7506103515625, 0.914794921875, 1.0789794921875, 1.2431640625, 1.4073486328125, 1.571533203125, 1.7357177734375, 1.89990234375, 2.0640869140625, 2.228271484375, 2.3924560546875, 2.556640625, 2.7208251953125, 2.885009765625, 3.0491943359375, 3.21337890625, 3.3775634765625, 3.541748046875, 3.7059326171875, 3.8701171875, 4.0343017578125, 4.198486328125, 4.3626708984375, 4.52685546875, 4.6910400390625, 4.855224609375, 5.0194091796875, 5.18359375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 1.0, 2.0, 5.0, 8.0, 9.0, 8.0, 14.0, 16.0, 21.0, 17.0, 13.0, 22.0, 20.0, 23.0, 29.0, 28.0, 33.0, 33.0, 30.0, 42.0, 50.0, 34.0, 47.0, 55.0, 36.0, 37.0, 47.0, 43.0, 23.0, 25.0, 28.0, 34.0, 19.0, 19.0, 17.0, 17.0, 16.0, 11.0, 12.0, 14.0, 8.0, 12.0, 3.0, 6.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8359375, -3.720062255859375, -3.60418701171875, -3.488311767578125, -3.3724365234375, -3.256561279296875, -3.14068603515625, -3.024810791015625, -2.908935546875, -2.793060302734375, -2.67718505859375, -2.561309814453125, -2.4454345703125, -2.329559326171875, -2.21368408203125, -2.097808837890625, -1.98193359375, -1.866058349609375, -1.75018310546875, -1.634307861328125, -1.5184326171875, -1.402557373046875, -1.28668212890625, -1.170806884765625, -1.054931640625, -0.939056396484375, -0.82318115234375, -0.707305908203125, -0.5914306640625, -0.475555419921875, -0.35968017578125, -0.243804931640625, -0.1279296875, -0.012054443359375, 0.10382080078125, 0.219696044921875, 0.3355712890625, 0.451446533203125, 0.56732177734375, 0.683197021484375, 0.799072265625, 0.914947509765625, 1.03082275390625, 1.146697998046875, 1.2625732421875, 1.378448486328125, 1.49432373046875, 1.610198974609375, 1.72607421875, 1.841949462890625, 1.95782470703125, 2.073699951171875, 2.1895751953125, 2.305450439453125, 2.42132568359375, 2.537200927734375, 2.653076171875, 2.768951416015625, 2.88482666015625, 3.000701904296875, 3.1165771484375, 3.232452392578125, 3.34832763671875, 3.464202880859375, 3.580078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 14.0, 20.0, 27.0, 42.0, 68.0, 107.0, 148.0, 243.0, 327.0, 505.0, 749.0, 1171.0, 1956.0, 3274.0, 5429.0, 9239.0, 16854.0, 30431.0, 56266.0, 101486.0, 165711.0, 209393.0, 181772.0, 115838.0, 65605.0, 35515.0, 19333.0, 11054.0, 6229.0, 3621.0, 2205.0, 1365.0, 818.0, 570.0, 381.0, 271.0, 172.0, 130.0, 67.0, 44.0, 35.0, 23.0, 17.0, 9.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0], "bins": [-3.712890625, -3.608673095703125, -3.50445556640625, -3.400238037109375, -3.2960205078125, -3.191802978515625, -3.08758544921875, -2.983367919921875, -2.879150390625, -2.774932861328125, -2.67071533203125, -2.566497802734375, -2.4622802734375, -2.358062744140625, -2.25384521484375, -2.149627685546875, -2.04541015625, -1.941192626953125, -1.83697509765625, -1.732757568359375, -1.6285400390625, -1.524322509765625, -1.42010498046875, -1.315887451171875, -1.211669921875, -1.107452392578125, -1.00323486328125, -0.899017333984375, -0.7947998046875, -0.690582275390625, -0.58636474609375, -0.482147216796875, -0.3779296875, -0.273712158203125, -0.16949462890625, -0.065277099609375, 0.0389404296875, 0.143157958984375, 0.24737548828125, 0.351593017578125, 0.455810546875, 0.560028076171875, 0.66424560546875, 0.768463134765625, 0.8726806640625, 0.976898193359375, 1.08111572265625, 1.185333251953125, 1.28955078125, 1.393768310546875, 1.49798583984375, 1.602203369140625, 1.7064208984375, 1.810638427734375, 1.91485595703125, 2.019073486328125, 2.123291015625, 2.227508544921875, 2.33172607421875, 2.435943603515625, 2.5401611328125, 2.644378662109375, 2.74859619140625, 2.852813720703125, 2.95703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 10.0, 10.0, 8.0, 13.0, 17.0, 17.0, 29.0, 46.0, 47.0, 64.0, 63.0, 64.0, 81.0, 78.0, 83.0, 69.0, 60.0, 56.0, 44.0, 26.0, 19.0, 25.0, 18.0, 10.0, 13.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002994537353515625, -0.00028853118419647217, -0.00027760863304138184, -0.0002666860818862915, -0.00025576353073120117, -0.00024484097957611084, -0.0002339184284210205, -0.00022299587726593018, -0.00021207332611083984, -0.0002011507749557495, -0.00019022822380065918, -0.00017930567264556885, -0.00016838312149047852, -0.00015746057033538818, -0.00014653801918029785, -0.00013561546802520752, -0.0001246929168701172, -0.00011377036571502686, -0.00010284781455993652, -9.192526340484619e-05, -8.100271224975586e-05, -7.008016109466553e-05, -5.9157609939575195e-05, -4.823505878448486e-05, -3.731250762939453e-05, -2.63899564743042e-05, -1.5467405319213867e-05, -4.544854164123535e-06, 6.377696990966797e-06, 1.730024814605713e-05, 2.822279930114746e-05, 3.914535045623779e-05, 5.0067901611328125e-05, 6.099045276641846e-05, 7.191300392150879e-05, 8.283555507659912e-05, 9.375810623168945e-05, 0.00010468065738677979, 0.00011560320854187012, 0.00012652575969696045, 0.00013744831085205078, 0.0001483708620071411, 0.00015929341316223145, 0.00017021596431732178, 0.0001811385154724121, 0.00019206106662750244, 0.00020298361778259277, 0.0002139061689376831, 0.00022482872009277344, 0.00023575127124786377, 0.0002466738224029541, 0.00025759637355804443, 0.00026851892471313477, 0.0002794414758682251, 0.00029036402702331543, 0.00030128657817840576, 0.0003122091293334961, 0.0003231316804885864, 0.00033405423164367676, 0.0003449767827987671, 0.0003558993339538574, 0.00036682188510894775, 0.0003777444362640381, 0.0003886669874191284, 0.00039958953857421875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 9.0, 15.0, 25.0, 17.0, 25.0, 56.0, 100.0, 130.0, 239.0, 359.0, 597.0, 978.0, 1797.0, 3267.0, 6138.0, 11531.0, 22807.0, 45645.0, 90281.0, 161897.0, 226078.0, 206504.0, 130399.0, 68414.0, 34340.0, 17136.0, 8821.0, 4689.0, 2690.0, 1429.0, 808.0, 498.0, 302.0, 209.0, 123.0, 58.0, 42.0, 36.0, 21.0, 11.0, 12.0, 6.0, 4.0, 7.0, 2.0, 2.0, 0.0, 2.0], "bins": [-4.1875, -4.073699951171875, -3.95989990234375, -3.846099853515625, -3.7322998046875, -3.618499755859375, -3.50469970703125, -3.390899658203125, -3.277099609375, -3.163299560546875, -3.04949951171875, -2.935699462890625, -2.8218994140625, -2.708099365234375, -2.59429931640625, -2.480499267578125, -2.36669921875, -2.252899169921875, -2.13909912109375, -2.025299072265625, -1.9114990234375, -1.797698974609375, -1.68389892578125, -1.570098876953125, -1.456298828125, -1.342498779296875, -1.22869873046875, -1.114898681640625, -1.0010986328125, -0.887298583984375, -0.77349853515625, -0.659698486328125, -0.5458984375, -0.432098388671875, -0.31829833984375, -0.204498291015625, -0.0906982421875, 0.023101806640625, 0.13690185546875, 0.250701904296875, 0.364501953125, 0.478302001953125, 0.59210205078125, 0.705902099609375, 0.8197021484375, 0.933502197265625, 1.04730224609375, 1.161102294921875, 1.27490234375, 1.388702392578125, 1.50250244140625, 1.616302490234375, 1.7301025390625, 1.843902587890625, 1.95770263671875, 2.071502685546875, 2.185302734375, 2.299102783203125, 2.41290283203125, 2.526702880859375, 2.6405029296875, 2.754302978515625, 2.86810302734375, 2.981903076171875, 3.095703125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 6.0, 13.0, 14.0, 16.0, 18.0, 24.0, 42.0, 40.0, 59.0, 62.0, 78.0, 80.0, 79.0, 81.0, 65.0, 73.0, 49.0, 60.0, 38.0, 13.0, 20.0, 21.0, 8.0, 5.0, 12.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.6259765625, -1.582733154296875, -1.53948974609375, -1.496246337890625, -1.4530029296875, -1.409759521484375, -1.36651611328125, -1.323272705078125, -1.280029296875, -1.236785888671875, -1.19354248046875, -1.150299072265625, -1.1070556640625, -1.063812255859375, -1.02056884765625, -0.977325439453125, -0.93408203125, -0.890838623046875, -0.84759521484375, -0.804351806640625, -0.7611083984375, -0.717864990234375, -0.67462158203125, -0.631378173828125, -0.588134765625, -0.544891357421875, -0.50164794921875, -0.458404541015625, -0.4151611328125, -0.371917724609375, -0.32867431640625, -0.285430908203125, -0.2421875, -0.198944091796875, -0.15570068359375, -0.112457275390625, -0.0692138671875, -0.025970458984375, 0.01727294921875, 0.060516357421875, 0.103759765625, 0.147003173828125, 0.19024658203125, 0.233489990234375, 0.2767333984375, 0.319976806640625, 0.36322021484375, 0.406463623046875, 0.44970703125, 0.492950439453125, 0.53619384765625, 0.579437255859375, 0.6226806640625, 0.665924072265625, 0.70916748046875, 0.752410888671875, 0.795654296875, 0.838897705078125, 0.88214111328125, 0.925384521484375, 0.9686279296875, 1.011871337890625, 1.05511474609375, 1.098358154296875, 1.1416015625]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 11.0, 6.0, 8.0, 9.0, 7.0, 16.0, 17.0, 30.0, 34.0, 62.0, 85.0, 82.0, 111.0, 102.0, 96.0, 70.0, 73.0, 54.0, 36.0, 34.0, 10.0, 12.0, 10.0, 7.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.316097259521484, -14.924983024597168, -14.533867835998535, -14.142753601074219, -13.751639366149902, -13.36052417755127, -12.969409942626953, -12.57829475402832, -12.187180519104004, -11.796066284179688, -11.404951095581055, -11.013836860656738, -10.622722625732422, -10.231607437133789, -9.840493202209473, -9.449378967285156, -9.058263778686523, -8.667149543762207, -8.276034355163574, -7.884920120239258, -7.493805408477783, -7.102690696716309, -6.711576461791992, -6.320461750030518, -5.929347991943359, -5.538233280181885, -5.147119045257568, -4.756004333496094, -4.364889621734619, -3.9737751483917236, -3.582660675048828, -3.1915459632873535, -2.800431251525879, -2.4093167781829834, -2.018202066421509, -1.6270875930786133, -1.2359730005264282, -0.8448584079742432, -0.45374393463134766, -0.06262922286987305, 0.32848525047302246, 0.7195998430252075, 1.1107144355773926, 1.501828908920288, 1.8929435014724731, 2.284058094024658, 2.6751725673675537, 3.0662872791290283, 3.457401752471924, 3.8485162258148193, 4.239630699157715, 4.6307454109191895, 5.021860122680664, 5.4129743576049805, 5.804089069366455, 6.19520378112793, 6.586318016052246, 6.977432727813721, 7.368546962738037, 7.759661674499512, 8.150775909423828, 8.541891098022461, 8.933005332946777, 9.324119567871094, 9.715234756469727]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 7.0, 5.0, 9.0, 14.0, 12.0, 19.0, 9.0, 15.0, 23.0, 25.0, 28.0, 27.0, 39.0, 44.0, 39.0, 43.0, 51.0, 49.0, 52.0, 42.0, 32.0, 52.0, 39.0, 48.0, 30.0, 32.0, 24.0, 30.0, 24.0, 22.0, 18.0, 9.0, 11.0, 14.0, 9.0, 12.0, 12.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.461526393890381, -6.257798194885254, -6.054069519042969, -5.850341320037842, -5.646613121032715, -5.442884922027588, -5.239156723022461, -5.035428047180176, -4.831699848175049, -4.627971649169922, -4.424242973327637, -4.22051477432251, -4.016786575317383, -3.813058376312256, -3.60932993888855, -3.4056015014648438, -3.201873302459717, -2.99814510345459, -2.794416666030884, -2.5906882286071777, -2.386960029602051, -2.183231830596924, -1.9795033931732178, -1.7757750749588013, -1.5720467567443848, -1.3683184385299683, -1.1645901203155518, -0.9608618021011353, -0.7571334838867188, -0.5534051656723022, -0.34967684745788574, -0.14594852924346924, 0.05777931213378906, 0.26150763034820557, 0.46523594856262207, 0.6689642667770386, 0.8726925849914551, 1.0764209032058716, 1.280149221420288, 1.4838775396347046, 1.687605857849121, 1.8913341760635376, 2.095062494277954, 2.29879093170166, 2.502519130706787, 2.706247329711914, 2.90997576713562, 3.113704204559326, 3.317432403564453, 3.52116060256958, 3.724889039993286, 3.928617477416992, 4.132345676422119, 4.336073875427246, 4.539802551269531, 4.743530750274658, 4.947258949279785, 5.150987148284912, 5.354715347290039, 5.558444023132324, 5.762172222137451, 5.965900421142578, 6.169629096984863, 6.37335729598999, 6.577085494995117]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 10.0, 16.0, 31.0, 34.0, 60.0, 87.0, 123.0, 154.0, 236.0, 295.0, 474.0, 687.0, 1037.0, 1576.0, 2345.0, 3522.0, 5888.0, 9360.0, 17051.0, 33053.0, 76030.0, 210161.0, 663047.0, 1474848.0, 1097783.0, 372793.0, 120593.0, 47379.0, 22198.0, 12034.0, 7291.0, 4536.0, 2899.0, 2006.0, 1342.0, 967.0, 653.0, 473.0, 331.0, 245.0, 174.0, 131.0, 82.0, 59.0, 60.0, 35.0, 22.0, 21.0, 18.0, 11.0, 10.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 2.0], "bins": [-9.8046875, -9.47509765625, -9.1455078125, -8.81591796875, -8.486328125, -8.15673828125, -7.8271484375, -7.49755859375, -7.16796875, -6.83837890625, -6.5087890625, -6.17919921875, -5.849609375, -5.52001953125, -5.1904296875, -4.86083984375, -4.53125, -4.20166015625, -3.8720703125, -3.54248046875, -3.212890625, -2.88330078125, -2.5537109375, -2.22412109375, -1.89453125, -1.56494140625, -1.2353515625, -0.90576171875, -0.576171875, -0.24658203125, 0.0830078125, 0.41259765625, 0.7421875, 1.07177734375, 1.4013671875, 1.73095703125, 2.060546875, 2.39013671875, 2.7197265625, 3.04931640625, 3.37890625, 3.70849609375, 4.0380859375, 4.36767578125, 4.697265625, 5.02685546875, 5.3564453125, 5.68603515625, 6.015625, 6.34521484375, 6.6748046875, 7.00439453125, 7.333984375, 7.66357421875, 7.9931640625, 8.32275390625, 8.65234375, 8.98193359375, 9.3115234375, 9.64111328125, 9.970703125, 10.30029296875, 10.6298828125, 10.95947265625, 11.2890625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 7.0, 4.0, 9.0, 9.0, 2.0, 15.0, 12.0, 15.0, 17.0, 23.0, 25.0, 29.0, 34.0, 28.0, 42.0, 49.0, 40.0, 45.0, 46.0, 51.0, 48.0, 52.0, 38.0, 56.0, 41.0, 36.0, 36.0, 33.0, 24.0, 21.0, 18.0, 13.0, 15.0, 17.0, 7.0, 13.0, 11.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.65625, -4.50616455078125, -4.3560791015625, -4.20599365234375, -4.055908203125, -3.90582275390625, -3.7557373046875, -3.60565185546875, -3.45556640625, -3.30548095703125, -3.1553955078125, -3.00531005859375, -2.855224609375, -2.70513916015625, -2.5550537109375, -2.40496826171875, -2.2548828125, -2.10479736328125, -1.9547119140625, -1.80462646484375, -1.654541015625, -1.50445556640625, -1.3543701171875, -1.20428466796875, -1.05419921875, -0.90411376953125, -0.7540283203125, -0.60394287109375, -0.453857421875, -0.30377197265625, -0.1536865234375, -0.00360107421875, 0.146484375, 0.29656982421875, 0.4466552734375, 0.59674072265625, 0.746826171875, 0.89691162109375, 1.0469970703125, 1.19708251953125, 1.34716796875, 1.49725341796875, 1.6473388671875, 1.79742431640625, 1.947509765625, 2.09759521484375, 2.2476806640625, 2.39776611328125, 2.5478515625, 2.69793701171875, 2.8480224609375, 2.99810791015625, 3.148193359375, 3.29827880859375, 3.4483642578125, 3.59844970703125, 3.74853515625, 3.89862060546875, 4.0487060546875, 4.19879150390625, 4.348876953125, 4.49896240234375, 4.6490478515625, 4.79913330078125, 4.94921875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 9.0, 14.0, 16.0, 36.0, 31.0, 57.0, 100.0, 127.0, 247.0, 388.0, 639.0, 1125.0, 2056.0, 3502.0, 6591.0, 12933.0, 26734.0, 62844.0, 178864.0, 615104.0, 1594887.0, 1152115.0, 346036.0, 108639.0, 41538.0, 18800.0, 9426.0, 4859.0, 2772.0, 1566.0, 893.0, 515.0, 320.0, 196.0, 105.0, 66.0, 51.0, 27.0, 19.0, 17.0, 10.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.6171875, -13.2139892578125, -12.810791015625, -12.4075927734375, -12.00439453125, -11.6011962890625, -11.197998046875, -10.7947998046875, -10.3916015625, -9.9884033203125, -9.585205078125, -9.1820068359375, -8.77880859375, -8.3756103515625, -7.972412109375, -7.5692138671875, -7.166015625, -6.7628173828125, -6.359619140625, -5.9564208984375, -5.55322265625, -5.1500244140625, -4.746826171875, -4.3436279296875, -3.9404296875, -3.5372314453125, -3.134033203125, -2.7308349609375, -2.32763671875, -1.9244384765625, -1.521240234375, -1.1180419921875, -0.71484375, -0.3116455078125, 0.091552734375, 0.4947509765625, 0.89794921875, 1.3011474609375, 1.704345703125, 2.1075439453125, 2.5107421875, 2.9139404296875, 3.317138671875, 3.7203369140625, 4.12353515625, 4.5267333984375, 4.929931640625, 5.3331298828125, 5.736328125, 6.1395263671875, 6.542724609375, 6.9459228515625, 7.34912109375, 7.7523193359375, 8.155517578125, 8.5587158203125, 8.9619140625, 9.3651123046875, 9.768310546875, 10.1715087890625, 10.57470703125, 10.9779052734375, 11.381103515625, 11.7843017578125, 12.1875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 8.0, 8.0, 6.0, 5.0, 12.0, 12.0, 18.0, 20.0, 21.0, 23.0, 41.0, 41.0, 60.0, 64.0, 76.0, 118.0, 143.0, 189.0, 233.0, 249.0, 309.0, 306.0, 299.0, 305.0, 293.0, 262.0, 213.0, 166.0, 113.0, 115.0, 65.0, 65.0, 48.0, 41.0, 26.0, 24.0, 21.0, 17.0, 8.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.169921875, -3.082427978515625, -2.99493408203125, -2.907440185546875, -2.8199462890625, -2.732452392578125, -2.64495849609375, -2.557464599609375, -2.469970703125, -2.382476806640625, -2.29498291015625, -2.207489013671875, -2.1199951171875, -2.032501220703125, -1.94500732421875, -1.857513427734375, -1.77001953125, -1.682525634765625, -1.59503173828125, -1.507537841796875, -1.4200439453125, -1.332550048828125, -1.24505615234375, -1.157562255859375, -1.070068359375, -0.982574462890625, -0.89508056640625, -0.807586669921875, -0.7200927734375, -0.632598876953125, -0.54510498046875, -0.457611083984375, -0.3701171875, -0.282623291015625, -0.19512939453125, -0.107635498046875, -0.0201416015625, 0.067352294921875, 0.15484619140625, 0.242340087890625, 0.329833984375, 0.417327880859375, 0.50482177734375, 0.592315673828125, 0.6798095703125, 0.767303466796875, 0.85479736328125, 0.942291259765625, 1.02978515625, 1.117279052734375, 1.20477294921875, 1.292266845703125, 1.3797607421875, 1.467254638671875, 1.55474853515625, 1.642242431640625, 1.729736328125, 1.817230224609375, 1.90472412109375, 1.992218017578125, 2.0797119140625, 2.167205810546875, 2.25469970703125, 2.342193603515625, 2.4296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 15.0, 19.0, 37.0, 65.0, 69.0, 111.0, 160.0, 166.0, 107.0, 76.0, 54.0, 34.0, 20.0, 16.0, 14.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-25.68865966796875, -25.15268898010254, -24.61672019958496, -24.08074951171875, -23.544780731201172, -23.00881004333496, -22.472841262817383, -21.936870574951172, -21.400901794433594, -20.864931106567383, -20.328962326049805, -19.792991638183594, -19.257022857666016, -18.721052169799805, -18.185083389282227, -17.649112701416016, -17.113142013549805, -16.577171325683594, -16.041202545166016, -15.505232810974121, -14.969263076782227, -14.433292388916016, -13.897322654724121, -13.361352920532227, -12.825383186340332, -12.289413452148438, -11.753443717956543, -11.217473983764648, -10.681503295898438, -10.14553451538086, -9.609563827514648, -9.073594093322754, -8.537625312805176, -8.001655578613281, -7.465685844421387, -6.929715633392334, -6.3937458992004395, -5.857776165008545, -5.321805953979492, -4.785836219787598, -4.249866485595703, -3.7138967514038086, -3.177926778793335, -2.6419568061828613, -2.105987071990967, -1.5700173377990723, -1.0340473651885986, -0.498077392578125, 0.03789234161376953, 0.5738621950149536, 1.1098320484161377, 1.6458019018173218, 2.181771755218506, 2.7177414894104004, 3.253711462020874, 3.7896814346313477, 4.325651168823242, 4.861620903015137, 5.397590637207031, 5.933560848236084, 6.4695305824279785, 7.005500316619873, 7.541470527648926, 8.07744026184082, 8.613409996032715]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 5.0, 9.0, 8.0, 5.0, 13.0, 8.0, 8.0, 20.0, 18.0, 16.0, 21.0, 33.0, 36.0, 36.0, 33.0, 32.0, 39.0, 48.0, 40.0, 51.0, 39.0, 43.0, 46.0, 31.0, 44.0, 42.0, 40.0, 41.0, 30.0, 32.0, 22.0, 15.0, 15.0, 15.0, 14.0, 15.0, 10.0, 4.0, 5.0, 7.0, 4.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.42673921585083, -5.243031978607178, -5.059325218200684, -4.875617980957031, -4.691911220550537, -4.508203983306885, -4.324497222900391, -4.140789985656738, -3.957082986831665, -3.773375988006592, -3.5896689891815186, -3.4059619903564453, -3.222254753112793, -3.038547992706299, -2.8548407554626465, -2.6711337566375732, -2.4874267578125, -2.3037197589874268, -2.1200127601623535, -1.9363056421279907, -1.7525986433029175, -1.5688916444778442, -1.3851845264434814, -1.2014775276184082, -1.017770528793335, -0.8340635299682617, -0.6503564715385437, -0.4666494131088257, -0.28294241428375244, -0.0992354154586792, 0.0844717025756836, 0.26817870140075684, 0.4518852233886719, 0.6355922222137451, 0.8192992806434631, 1.0030063390731812, 1.1867133378982544, 1.3704203367233276, 1.5541274547576904, 1.7378344535827637, 1.921541452407837, 2.10524845123291, 2.2889554500579834, 2.4726624488830566, 2.656369686126709, 2.840076446533203, 3.0237836837768555, 3.2074906826019287, 3.391197681427002, 3.574904680252075, 3.7586116790771484, 3.942318916320801, 4.126025676727295, 4.309732913970947, 4.493439674377441, 4.677146911621094, 4.860854148864746, 5.044561386108398, 5.228268146514893, 5.411975383758545, 5.595682144165039, 5.779389381408691, 5.963096618652344, 6.146803379058838, 6.330510139465332]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 4.0, 10.0, 21.0, 14.0, 22.0, 35.0, 43.0, 63.0, 116.0, 152.0, 206.0, 346.0, 506.0, 920.0, 1475.0, 2599.0, 4551.0, 8722.0, 16875.0, 34882.0, 74953.0, 155643.0, 258979.0, 237157.0, 130094.0, 60664.0, 28759.0, 14133.0, 7106.0, 3898.0, 2165.0, 1247.0, 755.0, 486.0, 333.0, 203.0, 128.0, 87.0, 59.0, 47.0, 31.0, 20.0, 18.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0], "bins": [-4.09375, -3.972869873046875, -3.85198974609375, -3.731109619140625, -3.6102294921875, -3.489349365234375, -3.36846923828125, -3.247589111328125, -3.126708984375, -3.005828857421875, -2.88494873046875, -2.764068603515625, -2.6431884765625, -2.522308349609375, -2.40142822265625, -2.280548095703125, -2.15966796875, -2.038787841796875, -1.91790771484375, -1.797027587890625, -1.6761474609375, -1.555267333984375, -1.43438720703125, -1.313507080078125, -1.192626953125, -1.071746826171875, -0.95086669921875, -0.829986572265625, -0.7091064453125, -0.588226318359375, -0.46734619140625, -0.346466064453125, -0.2255859375, -0.104705810546875, 0.01617431640625, 0.137054443359375, 0.2579345703125, 0.378814697265625, 0.49969482421875, 0.620574951171875, 0.741455078125, 0.862335205078125, 0.98321533203125, 1.104095458984375, 1.2249755859375, 1.345855712890625, 1.46673583984375, 1.587615966796875, 1.70849609375, 1.829376220703125, 1.95025634765625, 2.071136474609375, 2.1920166015625, 2.312896728515625, 2.43377685546875, 2.554656982421875, 2.675537109375, 2.796417236328125, 2.91729736328125, 3.038177490234375, 3.1590576171875, 3.279937744140625, 3.40081787109375, 3.521697998046875, 3.642578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 15.0, 17.0, 11.0, 13.0, 33.0, 17.0, 19.0, 38.0, 36.0, 25.0, 42.0, 43.0, 49.0, 53.0, 46.0, 46.0, 53.0, 47.0, 43.0, 36.0, 46.0, 31.0, 28.0, 36.0, 27.0, 16.0, 22.0, 22.0, 12.0, 17.0, 9.0, 3.0, 3.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.953125, -5.7430419921875, -5.532958984375, -5.3228759765625, -5.11279296875, -4.9027099609375, -4.692626953125, -4.4825439453125, -4.2724609375, -4.0623779296875, -3.852294921875, -3.6422119140625, -3.43212890625, -3.2220458984375, -3.011962890625, -2.8018798828125, -2.591796875, -2.3817138671875, -2.171630859375, -1.9615478515625, -1.75146484375, -1.5413818359375, -1.331298828125, -1.1212158203125, -0.9111328125, -0.7010498046875, -0.490966796875, -0.2808837890625, -0.07080078125, 0.1392822265625, 0.349365234375, 0.5594482421875, 0.76953125, 0.9796142578125, 1.189697265625, 1.3997802734375, 1.60986328125, 1.8199462890625, 2.030029296875, 2.2401123046875, 2.4501953125, 2.6602783203125, 2.870361328125, 3.0804443359375, 3.29052734375, 3.5006103515625, 3.710693359375, 3.9207763671875, 4.130859375, 4.3409423828125, 4.551025390625, 4.7611083984375, 4.97119140625, 5.1812744140625, 5.391357421875, 5.6014404296875, 5.8115234375, 6.0216064453125, 6.231689453125, 6.4417724609375, 6.65185546875, 6.8619384765625, 7.072021484375, 7.2821044921875, 7.4921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 18.0, 20.0, 28.0, 45.0, 69.0, 83.0, 141.0, 215.0, 344.0, 540.0, 992.0, 1828.0, 3648.0, 7641.0, 17346.0, 43661.0, 122207.0, 312116.0, 325180.0, 130735.0, 47263.0, 18169.0, 7933.0, 3796.0, 1949.0, 1013.0, 570.0, 327.0, 196.0, 126.0, 94.0, 66.0, 55.0, 32.0, 11.0, 18.0, 12.0, 10.0, 2.0, 7.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.88671875, -5.7137451171875, -5.540771484375, -5.3677978515625, -5.19482421875, -5.0218505859375, -4.848876953125, -4.6759033203125, -4.5029296875, -4.3299560546875, -4.156982421875, -3.9840087890625, -3.81103515625, -3.6380615234375, -3.465087890625, -3.2921142578125, -3.119140625, -2.9461669921875, -2.773193359375, -2.6002197265625, -2.42724609375, -2.2542724609375, -2.081298828125, -1.9083251953125, -1.7353515625, -1.5623779296875, -1.389404296875, -1.2164306640625, -1.04345703125, -0.8704833984375, -0.697509765625, -0.5245361328125, -0.3515625, -0.1785888671875, -0.005615234375, 0.1673583984375, 0.34033203125, 0.5133056640625, 0.686279296875, 0.8592529296875, 1.0322265625, 1.2052001953125, 1.378173828125, 1.5511474609375, 1.72412109375, 1.8970947265625, 2.070068359375, 2.2430419921875, 2.416015625, 2.5889892578125, 2.761962890625, 2.9349365234375, 3.10791015625, 3.2808837890625, 3.453857421875, 3.6268310546875, 3.7998046875, 3.9727783203125, 4.145751953125, 4.3187255859375, 4.49169921875, 4.6646728515625, 4.837646484375, 5.0106201171875, 5.18359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 5.0, 5.0, 7.0, 7.0, 5.0, 10.0, 14.0, 12.0, 10.0, 23.0, 20.0, 20.0, 14.0, 23.0, 37.0, 32.0, 38.0, 46.0, 38.0, 42.0, 33.0, 42.0, 34.0, 33.0, 34.0, 50.0, 32.0, 42.0, 29.0, 25.0, 27.0, 33.0, 24.0, 23.0, 18.0, 23.0, 16.0, 15.0, 9.0, 7.0, 7.0, 2.0, 8.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.169921875, -3.068115234375, -2.96630859375, -2.864501953125, -2.7626953125, -2.660888671875, -2.55908203125, -2.457275390625, -2.35546875, -2.253662109375, -2.15185546875, -2.050048828125, -1.9482421875, -1.846435546875, -1.74462890625, -1.642822265625, -1.541015625, -1.439208984375, -1.33740234375, -1.235595703125, -1.1337890625, -1.031982421875, -0.93017578125, -0.828369140625, -0.7265625, -0.624755859375, -0.52294921875, -0.421142578125, -0.3193359375, -0.217529296875, -0.11572265625, -0.013916015625, 0.087890625, 0.189697265625, 0.29150390625, 0.393310546875, 0.4951171875, 0.596923828125, 0.69873046875, 0.800537109375, 0.90234375, 1.004150390625, 1.10595703125, 1.207763671875, 1.3095703125, 1.411376953125, 1.51318359375, 1.614990234375, 1.716796875, 1.818603515625, 1.92041015625, 2.022216796875, 2.1240234375, 2.225830078125, 2.32763671875, 2.429443359375, 2.53125, 2.633056640625, 2.73486328125, 2.836669921875, 2.9384765625, 3.040283203125, 3.14208984375, 3.243896484375, 3.345703125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 11.0, 13.0, 7.0, 17.0, 33.0, 36.0, 69.0, 83.0, 113.0, 170.0, 305.0, 399.0, 672.0, 1079.0, 1695.0, 3049.0, 5597.0, 10990.0, 24776.0, 65665.0, 206028.0, 418578.0, 197147.0, 63849.0, 24085.0, 10809.0, 5526.0, 2997.0, 1699.0, 1008.0, 659.0, 462.0, 282.0, 212.0, 138.0, 94.0, 59.0, 49.0, 21.0, 21.0, 18.0, 12.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.494140625, -2.4173583984375, -2.340576171875, -2.2637939453125, -2.18701171875, -2.1102294921875, -2.033447265625, -1.9566650390625, -1.8798828125, -1.8031005859375, -1.726318359375, -1.6495361328125, -1.57275390625, -1.4959716796875, -1.419189453125, -1.3424072265625, -1.265625, -1.1888427734375, -1.112060546875, -1.0352783203125, -0.95849609375, -0.8817138671875, -0.804931640625, -0.7281494140625, -0.6513671875, -0.5745849609375, -0.497802734375, -0.4210205078125, -0.34423828125, -0.2674560546875, -0.190673828125, -0.1138916015625, -0.037109375, 0.0396728515625, 0.116455078125, 0.1932373046875, 0.27001953125, 0.3468017578125, 0.423583984375, 0.5003662109375, 0.5771484375, 0.6539306640625, 0.730712890625, 0.8074951171875, 0.88427734375, 0.9610595703125, 1.037841796875, 1.1146240234375, 1.19140625, 1.2681884765625, 1.344970703125, 1.4217529296875, 1.49853515625, 1.5753173828125, 1.652099609375, 1.7288818359375, 1.8056640625, 1.8824462890625, 1.959228515625, 2.0360107421875, 2.11279296875, 2.1895751953125, 2.266357421875, 2.3431396484375, 2.419921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 4.0, 8.0, 9.0, 6.0, 13.0, 25.0, 21.0, 36.0, 54.0, 63.0, 104.0, 106.0, 101.0, 103.0, 70.0, 63.0, 49.0, 42.0, 29.0, 20.0, 9.0, 6.0, 11.0, 11.0, 8.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.016824722290039e-05, -7.675494998693466e-05, -7.334165275096893e-05, -6.99283555150032e-05, -6.651505827903748e-05, -6.310176104307175e-05, -5.968846380710602e-05, -5.627516657114029e-05, -5.286186933517456e-05, -4.944857209920883e-05, -4.60352748632431e-05, -4.2621977627277374e-05, -3.9208680391311646e-05, -3.579538315534592e-05, -3.238208591938019e-05, -2.896878868341446e-05, -2.555549144744873e-05, -2.2142194211483002e-05, -1.8728896975517273e-05, -1.5315599739551544e-05, -1.1902302503585815e-05, -8.489005267620087e-06, -5.075708031654358e-06, -1.6624107956886292e-06, 1.7508864402770996e-06, 5.164183676242828e-06, 8.577480912208557e-06, 1.1990778148174286e-05, 1.5404075384140015e-05, 1.8817372620105743e-05, 2.2230669856071472e-05, 2.56439670920372e-05, 2.905726432800293e-05, 3.247056156396866e-05, 3.588385879993439e-05, 3.9297156035900116e-05, 4.2710453271865845e-05, 4.6123750507831573e-05, 4.95370477437973e-05, 5.295034497976303e-05, 5.636364221572876e-05, 5.977693945169449e-05, 6.319023668766022e-05, 6.660353392362595e-05, 7.001683115959167e-05, 7.34301283955574e-05, 7.684342563152313e-05, 8.025672286748886e-05, 8.367002010345459e-05, 8.708331733942032e-05, 9.049661457538605e-05, 9.390991181135178e-05, 9.73232090473175e-05, 0.00010073650628328323, 0.00010414980351924896, 0.00010756310075521469, 0.00011097639799118042, 0.00011438969522714615, 0.00011780299246311188, 0.0001212162896990776, 0.00012462958693504333, 0.00012804288417100906, 0.0001314561814069748, 0.00013486947864294052, 0.00013828277587890625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 7.0, 9.0, 7.0, 11.0, 23.0, 24.0, 38.0, 56.0, 66.0, 108.0, 147.0, 229.0, 355.0, 558.0, 867.0, 1292.0, 2210.0, 3837.0, 7004.0, 13744.0, 29994.0, 74610.0, 204991.0, 363198.0, 207947.0, 75783.0, 30688.0, 13810.0, 7156.0, 3758.0, 2214.0, 1311.0, 816.0, 544.0, 358.0, 261.0, 180.0, 114.0, 67.0, 56.0, 25.0, 29.0, 10.0, 12.0, 10.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.55078125, -2.47894287109375, -2.4071044921875, -2.33526611328125, -2.263427734375, -2.19158935546875, -2.1197509765625, -2.04791259765625, -1.97607421875, -1.90423583984375, -1.8323974609375, -1.76055908203125, -1.688720703125, -1.61688232421875, -1.5450439453125, -1.47320556640625, -1.4013671875, -1.32952880859375, -1.2576904296875, -1.18585205078125, -1.114013671875, -1.04217529296875, -0.9703369140625, -0.89849853515625, -0.82666015625, -0.75482177734375, -0.6829833984375, -0.61114501953125, -0.539306640625, -0.46746826171875, -0.3956298828125, -0.32379150390625, -0.251953125, -0.18011474609375, -0.1082763671875, -0.03643798828125, 0.035400390625, 0.10723876953125, 0.1790771484375, 0.25091552734375, 0.32275390625, 0.39459228515625, 0.4664306640625, 0.53826904296875, 0.610107421875, 0.68194580078125, 0.7537841796875, 0.82562255859375, 0.8974609375, 0.96929931640625, 1.0411376953125, 1.11297607421875, 1.184814453125, 1.25665283203125, 1.3284912109375, 1.40032958984375, 1.47216796875, 1.54400634765625, 1.6158447265625, 1.68768310546875, 1.759521484375, 1.83135986328125, 1.9031982421875, 1.97503662109375, 2.046875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 7.0, 6.0, 8.0, 7.0, 8.0, 15.0, 11.0, 13.0, 16.0, 28.0, 36.0, 43.0, 60.0, 68.0, 75.0, 79.0, 97.0, 80.0, 68.0, 44.0, 42.0, 41.0, 25.0, 19.0, 16.0, 9.0, 12.0, 5.0, 12.0, 6.0, 5.0, 7.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.57421875, -0.5567398071289062, -0.5392608642578125, -0.5217819213867188, -0.504302978515625, -0.48682403564453125, -0.4693450927734375, -0.45186614990234375, -0.43438720703125, -0.41690826416015625, -0.3994293212890625, -0.38195037841796875, -0.364471435546875, -0.34699249267578125, -0.3295135498046875, -0.31203460693359375, -0.2945556640625, -0.27707672119140625, -0.2595977783203125, -0.24211883544921875, -0.224639892578125, -0.20716094970703125, -0.1896820068359375, -0.17220306396484375, -0.15472412109375, -0.13724517822265625, -0.1197662353515625, -0.10228729248046875, -0.084808349609375, -0.06732940673828125, -0.0498504638671875, -0.03237152099609375, -0.014892578125, 0.00258636474609375, 0.0200653076171875, 0.03754425048828125, 0.055023193359375, 0.07250213623046875, 0.0899810791015625, 0.10746002197265625, 0.12493896484375, 0.14241790771484375, 0.1598968505859375, 0.17737579345703125, 0.194854736328125, 0.21233367919921875, 0.2298126220703125, 0.24729156494140625, 0.2647705078125, 0.28224945068359375, 0.2997283935546875, 0.31720733642578125, 0.334686279296875, 0.35216522216796875, 0.3696441650390625, 0.38712310791015625, 0.40460205078125, 0.42208099365234375, 0.4395599365234375, 0.45703887939453125, 0.474517822265625, 0.49199676513671875, 0.5094757080078125, 0.5269546508789062, 0.54443359375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 0.0, 3.0, 3.0, 7.0, 14.0, 12.0, 19.0, 40.0, 67.0, 73.0, 118.0, 156.0, 168.0, 109.0, 74.0, 44.0, 36.0, 22.0, 13.0, 14.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-26.084308624267578, -25.53853416442871, -24.992759704589844, -24.446983337402344, -23.901208877563477, -23.35543441772461, -22.809659957885742, -22.263885498046875, -21.718111038208008, -21.17233657836914, -20.626562118530273, -20.080787658691406, -19.535011291503906, -18.98923683166504, -18.443462371826172, -17.897687911987305, -17.351913452148438, -16.80613899230957, -16.260364532470703, -15.71458911895752, -15.168814659118652, -14.623039245605469, -14.077264785766602, -13.531490325927734, -12.985713958740234, -12.439939498901367, -11.894164085388184, -11.348389625549316, -10.80261516571045, -10.256839752197266, -9.711065292358398, -9.165290832519531, -8.619516372680664, -8.073741912841797, -7.5279669761657715, -6.982192039489746, -6.436417579650879, -5.8906426429748535, -5.344867706298828, -4.799093246459961, -4.2533183097839355, -3.7075436115264893, -3.161768913269043, -2.6159939765930176, -2.0702192783355713, -1.524444580078125, -0.9786696434020996, -0.4328949451446533, 0.11287975311279297, 0.658654510974884, 1.204429268836975, 1.750204086303711, 2.2959787845611572, 2.8417534828186035, 3.387528419494629, 3.933303117752075, 4.4790778160095215, 5.024852752685547, 5.570627212524414, 6.1164021492004395, 6.662177085876465, 7.207951545715332, 7.753726482391357, 8.299501419067383, 8.84527587890625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 5.0, 10.0, 9.0, 7.0, 14.0, 21.0, 16.0, 16.0, 24.0, 30.0, 36.0, 40.0, 35.0, 28.0, 43.0, 46.0, 40.0, 45.0, 49.0, 45.0, 35.0, 46.0, 41.0, 39.0, 43.0, 37.0, 29.0, 33.0, 14.0, 19.0, 14.0, 16.0, 15.0, 12.0, 8.0, 5.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.448026180267334, -5.263195514678955, -5.078364849090576, -4.893533706665039, -4.70870304107666, -4.523872375488281, -4.339041709899902, -4.154211044311523, -3.9693801403045654, -3.7845494747161865, -3.5997185707092285, -3.4148879051208496, -3.2300572395324707, -3.0452263355255127, -2.860395669937134, -2.675564765930176, -2.490734100341797, -2.305903434753418, -2.12107253074646, -1.936241865158081, -1.7514110803604126, -1.5665802955627441, -1.3817496299743652, -1.1969188451766968, -1.0120880603790283, -0.8272572755813599, -0.6424265503883362, -0.4575958251953125, -0.27276504039764404, -0.08793425559997559, 0.09689640998840332, 0.2817271947860718, 0.46655845642089844, 0.6513892412185669, 0.8362199664115906, 1.0210506916046143, 1.2058814764022827, 1.3907122611999512, 1.57554292678833, 1.7603737115859985, 1.945204496383667, 2.130035161972046, 2.314866065979004, 2.499696731567383, 2.6845273971557617, 2.8693583011627197, 3.0541889667510986, 3.2390198707580566, 3.4238505363464355, 3.6086812019348145, 3.7935121059417725, 3.9783427715301514, 4.163173675537109, 4.348004341125488, 4.532835006713867, 4.717665672302246, 4.902496337890625, 5.087327003479004, 5.272157669067383, 5.456988334655762, 5.641819477081299, 5.826650142669678, 6.011480808258057, 6.1963114738464355, 6.381142616271973]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 12.0, 11.0, 15.0, 28.0, 41.0, 35.0, 67.0, 98.0, 159.0, 249.0, 367.0, 612.0, 1066.0, 1777.0, 3430.0, 6396.0, 13542.0, 30277.0, 70867.0, 154646.0, 254420.0, 248014.0, 143420.0, 64999.0, 27962.0, 12239.0, 6061.0, 3242.0, 1745.0, 1056.0, 605.0, 376.0, 224.0, 153.0, 119.0, 77.0, 43.0, 37.0, 14.0, 18.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-8.640625, -8.3861083984375, -8.131591796875, -7.8770751953125, -7.62255859375, -7.3680419921875, -7.113525390625, -6.8590087890625, -6.6044921875, -6.3499755859375, -6.095458984375, -5.8409423828125, -5.58642578125, -5.3319091796875, -5.077392578125, -4.8228759765625, -4.568359375, -4.3138427734375, -4.059326171875, -3.8048095703125, -3.55029296875, -3.2957763671875, -3.041259765625, -2.7867431640625, -2.5322265625, -2.2777099609375, -2.023193359375, -1.7686767578125, -1.51416015625, -1.2596435546875, -1.005126953125, -0.7506103515625, -0.49609375, -0.2415771484375, 0.012939453125, 0.2674560546875, 0.52197265625, 0.7764892578125, 1.031005859375, 1.2855224609375, 1.5400390625, 1.7945556640625, 2.049072265625, 2.3035888671875, 2.55810546875, 2.8126220703125, 3.067138671875, 3.3216552734375, 3.576171875, 3.8306884765625, 4.085205078125, 4.3397216796875, 4.59423828125, 4.8487548828125, 5.103271484375, 5.3577880859375, 5.6123046875, 5.8668212890625, 6.121337890625, 6.3758544921875, 6.63037109375, 6.8848876953125, 7.139404296875, 7.3939208984375, 7.6484375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 6.0, 10.0, 8.0, 5.0, 8.0, 7.0, 16.0, 13.0, 14.0, 23.0, 22.0, 24.0, 34.0, 37.0, 35.0, 45.0, 34.0, 37.0, 34.0, 42.0, 39.0, 48.0, 43.0, 46.0, 35.0, 53.0, 40.0, 43.0, 27.0, 33.0, 19.0, 21.0, 21.0, 12.0, 15.0, 9.0, 12.0, 5.0, 3.0, 8.0, 4.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.78125, -5.58740234375, -5.3935546875, -5.19970703125, -5.005859375, -4.81201171875, -4.6181640625, -4.42431640625, -4.23046875, -4.03662109375, -3.8427734375, -3.64892578125, -3.455078125, -3.26123046875, -3.0673828125, -2.87353515625, -2.6796875, -2.48583984375, -2.2919921875, -2.09814453125, -1.904296875, -1.71044921875, -1.5166015625, -1.32275390625, -1.12890625, -0.93505859375, -0.7412109375, -0.54736328125, -0.353515625, -0.15966796875, 0.0341796875, 0.22802734375, 0.421875, 0.61572265625, 0.8095703125, 1.00341796875, 1.197265625, 1.39111328125, 1.5849609375, 1.77880859375, 1.97265625, 2.16650390625, 2.3603515625, 2.55419921875, 2.748046875, 2.94189453125, 3.1357421875, 3.32958984375, 3.5234375, 3.71728515625, 3.9111328125, 4.10498046875, 4.298828125, 4.49267578125, 4.6865234375, 4.88037109375, 5.07421875, 5.26806640625, 5.4619140625, 5.65576171875, 5.849609375, 6.04345703125, 6.2373046875, 6.43115234375, 6.625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 15.0, 14.0, 19.0, 25.0, 38.0, 48.0, 92.0, 140.0, 180.0, 267.0, 442.0, 748.0, 1207.0, 2059.0, 3652.0, 6653.0, 12578.0, 24152.0, 47157.0, 88375.0, 152226.0, 207081.0, 199171.0, 137222.0, 78292.0, 40679.0, 21114.0, 10928.0, 5982.0, 3244.0, 1867.0, 1032.0, 699.0, 377.0, 232.0, 171.0, 120.0, 76.0, 62.0, 30.0, 26.0, 16.0, 7.0, 10.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.53515625, -6.33648681640625, -6.1378173828125, -5.93914794921875, -5.740478515625, -5.54180908203125, -5.3431396484375, -5.14447021484375, -4.94580078125, -4.74713134765625, -4.5484619140625, -4.34979248046875, -4.151123046875, -3.95245361328125, -3.7537841796875, -3.55511474609375, -3.3564453125, -3.15777587890625, -2.9591064453125, -2.76043701171875, -2.561767578125, -2.36309814453125, -2.1644287109375, -1.96575927734375, -1.76708984375, -1.56842041015625, -1.3697509765625, -1.17108154296875, -0.972412109375, -0.77374267578125, -0.5750732421875, -0.37640380859375, -0.177734375, 0.02093505859375, 0.2196044921875, 0.41827392578125, 0.616943359375, 0.81561279296875, 1.0142822265625, 1.21295166015625, 1.41162109375, 1.61029052734375, 1.8089599609375, 2.00762939453125, 2.206298828125, 2.40496826171875, 2.6036376953125, 2.80230712890625, 3.0009765625, 3.19964599609375, 3.3983154296875, 3.59698486328125, 3.795654296875, 3.99432373046875, 4.1929931640625, 4.39166259765625, 4.59033203125, 4.78900146484375, 4.9876708984375, 5.18634033203125, 5.385009765625, 5.58367919921875, 5.7823486328125, 5.98101806640625, 6.1796875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 12.0, 14.0, 19.0, 22.0, 19.0, 20.0, 36.0, 27.0, 22.0, 31.0, 35.0, 35.0, 29.0, 44.0, 49.0, 44.0, 40.0, 39.0, 29.0, 40.0, 42.0, 36.0, 33.0, 27.0, 37.0, 21.0, 25.0, 29.0, 17.0, 13.0, 19.0, 14.0, 12.0, 15.0, 7.0, 7.0, 12.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.84503173828125, -2.7408447265625, -2.63665771484375, -2.532470703125, -2.42828369140625, -2.3240966796875, -2.21990966796875, -2.11572265625, -2.01153564453125, -1.9073486328125, -1.80316162109375, -1.698974609375, -1.59478759765625, -1.4906005859375, -1.38641357421875, -1.2822265625, -1.17803955078125, -1.0738525390625, -0.96966552734375, -0.865478515625, -0.76129150390625, -0.6571044921875, -0.55291748046875, -0.44873046875, -0.34454345703125, -0.2403564453125, -0.13616943359375, -0.031982421875, 0.07220458984375, 0.1763916015625, 0.28057861328125, 0.384765625, 0.48895263671875, 0.5931396484375, 0.69732666015625, 0.801513671875, 0.90570068359375, 1.0098876953125, 1.11407470703125, 1.21826171875, 1.32244873046875, 1.4266357421875, 1.53082275390625, 1.635009765625, 1.73919677734375, 1.8433837890625, 1.94757080078125, 2.0517578125, 2.15594482421875, 2.2601318359375, 2.36431884765625, 2.468505859375, 2.57269287109375, 2.6768798828125, 2.78106689453125, 2.88525390625, 2.98944091796875, 3.0936279296875, 3.19781494140625, 3.302001953125, 3.40618896484375, 3.5103759765625, 3.61456298828125, 3.71875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 18.0, 21.0, 23.0, 24.0, 45.0, 59.0, 83.0, 120.0, 167.0, 268.0, 419.0, 713.0, 1127.0, 1960.0, 3407.0, 6098.0, 11195.0, 21851.0, 44670.0, 95016.0, 185230.0, 258946.0, 203304.0, 108820.0, 51697.0, 24551.0, 12575.0, 6785.0, 3837.0, 2153.0, 1229.0, 733.0, 474.0, 322.0, 190.0, 111.0, 74.0, 57.0, 47.0, 24.0, 25.0, 17.0, 17.0, 5.0, 11.0, 2.0, 3.0, 7.0, 1.0, 5.0, 5.0, 2.0], "bins": [-4.0, -3.88092041015625, -3.7618408203125, -3.64276123046875, -3.523681640625, -3.40460205078125, -3.2855224609375, -3.16644287109375, -3.04736328125, -2.92828369140625, -2.8092041015625, -2.69012451171875, -2.571044921875, -2.45196533203125, -2.3328857421875, -2.21380615234375, -2.0947265625, -1.97564697265625, -1.8565673828125, -1.73748779296875, -1.618408203125, -1.49932861328125, -1.3802490234375, -1.26116943359375, -1.14208984375, -1.02301025390625, -0.9039306640625, -0.78485107421875, -0.665771484375, -0.54669189453125, -0.4276123046875, -0.30853271484375, -0.189453125, -0.07037353515625, 0.0487060546875, 0.16778564453125, 0.286865234375, 0.40594482421875, 0.5250244140625, 0.64410400390625, 0.76318359375, 0.88226318359375, 1.0013427734375, 1.12042236328125, 1.239501953125, 1.35858154296875, 1.4776611328125, 1.59674072265625, 1.7158203125, 1.83489990234375, 1.9539794921875, 2.07305908203125, 2.192138671875, 2.31121826171875, 2.4302978515625, 2.54937744140625, 2.66845703125, 2.78753662109375, 2.9066162109375, 3.02569580078125, 3.144775390625, 3.26385498046875, 3.3829345703125, 3.50201416015625, 3.62109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 16.0, 27.0, 31.0, 23.0, 42.0, 48.0, 52.0, 81.0, 69.0, 63.0, 74.0, 75.0, 69.0, 56.0, 63.0, 46.0, 35.0, 23.0, 19.0, 15.0, 14.0, 12.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00032806396484375, -0.00031822919845581055, -0.0003083944320678711, -0.00029855966567993164, -0.0002887248992919922, -0.00027889013290405273, -0.0002690553665161133, -0.00025922060012817383, -0.0002493858337402344, -0.00023955106735229492, -0.00022971630096435547, -0.00021988153457641602, -0.00021004676818847656, -0.0002002120018005371, -0.00019037723541259766, -0.0001805424690246582, -0.00017070770263671875, -0.0001608729362487793, -0.00015103816986083984, -0.0001412034034729004, -0.00013136863708496094, -0.00012153387069702148, -0.00011169910430908203, -0.00010186433792114258, -9.202957153320312e-05, -8.219480514526367e-05, -7.236003875732422e-05, -6.252527236938477e-05, -5.269050598144531e-05, -4.285573959350586e-05, -3.3020973205566406e-05, -2.3186206817626953e-05, -1.33514404296875e-05, -3.516674041748047e-06, 6.318092346191406e-06, 1.615285873413086e-05, 2.5987625122070312e-05, 3.5822391510009766e-05, 4.565715789794922e-05, 5.549192428588867e-05, 6.532669067382812e-05, 7.516145706176758e-05, 8.499622344970703e-05, 9.483098983764648e-05, 0.00010466575622558594, 0.00011450052261352539, 0.00012433528900146484, 0.0001341700553894043, 0.00014400482177734375, 0.0001538395881652832, 0.00016367435455322266, 0.0001735091209411621, 0.00018334388732910156, 0.00019317865371704102, 0.00020301342010498047, 0.00021284818649291992, 0.00022268295288085938, 0.00023251771926879883, 0.00024235248565673828, 0.00025218725204467773, 0.0002620220184326172, 0.00027185678482055664, 0.0002816915512084961, 0.00029152631759643555, 0.000301361083984375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 9.0, 11.0, 12.0, 27.0, 31.0, 50.0, 62.0, 94.0, 194.0, 294.0, 474.0, 796.0, 1322.0, 2304.0, 4126.0, 7518.0, 14704.0, 29987.0, 63092.0, 131120.0, 229817.0, 250037.0, 158447.0, 78204.0, 37086.0, 18101.0, 9400.0, 4727.0, 2605.0, 1534.0, 935.0, 574.0, 299.0, 205.0, 113.0, 92.0, 55.0, 34.0, 22.0, 17.0, 10.0, 8.0, 8.0, 5.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69921875, -3.584136962890625, -3.46905517578125, -3.353973388671875, -3.2388916015625, -3.123809814453125, -3.00872802734375, -2.893646240234375, -2.778564453125, -2.663482666015625, -2.54840087890625, -2.433319091796875, -2.3182373046875, -2.203155517578125, -2.08807373046875, -1.972991943359375, -1.85791015625, -1.742828369140625, -1.62774658203125, -1.512664794921875, -1.3975830078125, -1.282501220703125, -1.16741943359375, -1.052337646484375, -0.937255859375, -0.822174072265625, -0.70709228515625, -0.592010498046875, -0.4769287109375, -0.361846923828125, -0.24676513671875, -0.131683349609375, -0.0166015625, 0.098480224609375, 0.21356201171875, 0.328643798828125, 0.4437255859375, 0.558807373046875, 0.67388916015625, 0.788970947265625, 0.904052734375, 1.019134521484375, 1.13421630859375, 1.249298095703125, 1.3643798828125, 1.479461669921875, 1.59454345703125, 1.709625244140625, 1.82470703125, 1.939788818359375, 2.05487060546875, 2.169952392578125, 2.2850341796875, 2.400115966796875, 2.51519775390625, 2.630279541015625, 2.745361328125, 2.860443115234375, 2.97552490234375, 3.090606689453125, 3.2056884765625, 3.320770263671875, 3.43585205078125, 3.550933837890625, 3.666015625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 8.0, 6.0, 4.0, 8.0, 9.0, 8.0, 12.0, 13.0, 9.0, 12.0, 26.0, 25.0, 26.0, 38.0, 37.0, 42.0, 40.0, 53.0, 51.0, 56.0, 44.0, 59.0, 49.0, 49.0, 40.0, 45.0, 42.0, 36.0, 29.0, 23.0, 24.0, 15.0, 11.0, 10.0, 14.0, 9.0, 6.0, 3.0, 5.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69189453125, -0.6657943725585938, -0.6396942138671875, -0.6135940551757812, -0.587493896484375, -0.5613937377929688, -0.5352935791015625, -0.5091934204101562, -0.48309326171875, -0.45699310302734375, -0.4308929443359375, -0.40479278564453125, -0.378692626953125, -0.35259246826171875, -0.3264923095703125, -0.30039215087890625, -0.2742919921875, -0.24819183349609375, -0.2220916748046875, -0.19599151611328125, -0.169891357421875, -0.14379119873046875, -0.1176910400390625, -0.09159088134765625, -0.06549072265625, -0.03939056396484375, -0.0132904052734375, 0.01280975341796875, 0.038909912109375, 0.06501007080078125, 0.0911102294921875, 0.11721038818359375, 0.143310546875, 0.16941070556640625, 0.1955108642578125, 0.22161102294921875, 0.247711181640625, 0.27381134033203125, 0.2999114990234375, 0.32601165771484375, 0.35211181640625, 0.37821197509765625, 0.4043121337890625, 0.43041229248046875, 0.456512451171875, 0.48261260986328125, 0.5087127685546875, 0.5348129272460938, 0.5609130859375, 0.5870132446289062, 0.6131134033203125, 0.6392135620117188, 0.665313720703125, 0.6914138793945312, 0.7175140380859375, 0.7436141967773438, 0.76971435546875, 0.7958145141601562, 0.8219146728515625, 0.8480148315429688, 0.874114990234375, 0.9002151489257812, 0.9263153076171875, 0.9524154663085938, 0.978515625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 12.0, 15.0, 20.0, 48.0, 69.0, 112.0, 142.0, 165.0, 137.0, 95.0, 54.0, 53.0, 23.0, 18.0, 11.0, 11.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.881580352783203, -26.314258575439453, -25.746936798095703, -25.179616928100586, -24.612295150756836, -24.044973373413086, -23.477651596069336, -22.910329818725586, -22.34300994873047, -21.77568817138672, -21.20836639404297, -20.64104652404785, -20.0737247467041, -19.50640296936035, -18.9390811920166, -18.37175941467285, -17.8044376373291, -17.23711585998535, -16.6697940826416, -16.102474212646484, -15.535152435302734, -14.967830657958984, -14.400508880615234, -13.833187103271484, -13.26586627960205, -12.6985445022583, -12.131223678588867, -11.563901901245117, -10.996580123901367, -10.429259300231934, -9.861937522888184, -9.29461669921875, -8.727293014526367, -8.159971237182617, -7.592650413513184, -7.025328636169434, -6.458007335662842, -5.89068603515625, -5.3233642578125, -4.756042957305908, -4.188721656799316, -3.6214003562927246, -3.0540788173675537, -2.486757278442383, -1.919435977935791, -1.3521146774291992, -0.7847931385040283, -0.21747159957885742, 0.3498497009277344, 0.9171711206436157, 1.484492540359497, 2.051814079284668, 2.6191353797912598, 3.1864566802978516, 3.7537782192230225, 4.321099758148193, 4.888421058654785, 5.455742359161377, 6.023063659667969, 6.590385437011719, 7.1577067375183105, 7.725028038024902, 8.292349815368652, 8.859670639038086, 9.426992416381836]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 8.0, 11.0, 11.0, 9.0, 11.0, 13.0, 19.0, 28.0, 29.0, 33.0, 37.0, 40.0, 35.0, 42.0, 45.0, 48.0, 50.0, 45.0, 38.0, 41.0, 51.0, 36.0, 36.0, 53.0, 32.0, 26.0, 25.0, 21.0, 22.0, 18.0, 17.0, 13.0, 14.0, 9.0, 4.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.047612190246582, -5.851572513580322, -5.6555328369140625, -5.459493160247803, -5.263453483581543, -5.067413806915283, -4.871374130249023, -4.675334930419922, -4.479294776916504, -4.283255100250244, -4.087215423583984, -3.8911757469177246, -3.695136070251465, -3.499096393585205, -3.3030569553375244, -3.1070172786712646, -2.910977840423584, -2.714938163757324, -2.5188984870910645, -2.3228588104248047, -2.126819133758545, -1.9307795763015747, -1.7347400188446045, -1.5387003421783447, -1.342660665512085, -1.1466209888458252, -0.9505813717842102, -0.7545417547225952, -0.5585020780563354, -0.3624624013900757, -0.16642284393310547, 0.029616832733154297, 0.22565650939941406, 0.42169615626335144, 0.6177358031272888, 0.8137754201889038, 1.0098150968551636, 1.2058547735214233, 1.4018943309783936, 1.5979340076446533, 1.793973684310913, 1.9900133609771729, 2.1860530376434326, 2.3820924758911133, 2.578132152557373, 2.774171829223633, 2.9702115058898926, 3.1662511825561523, 3.362290859222412, 3.558330535888672, 3.7543702125549316, 3.9504098892211914, 4.146449565887451, 4.342489242553711, 4.5385284423828125, 4.7345685958862305, 4.930607795715332, 5.126647472381592, 5.322687149047852, 5.518726825714111, 5.714766502380371, 5.910806179046631, 6.106845855712891, 6.302885055541992, 6.49892520904541]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 8.0, 4.0, 9.0, 13.0, 18.0, 36.0, 42.0, 74.0, 97.0, 144.0, 227.0, 358.0, 499.0, 802.0, 1181.0, 1863.0, 3022.0, 4978.0, 8409.0, 15414.0, 30658.0, 72428.0, 208449.0, 672589.0, 1518427.0, 1098244.0, 354119.0, 110107.0, 42115.0, 20063.0, 10761.0, 6481.0, 4144.0, 2695.0, 1708.0, 1167.0, 845.0, 564.0, 412.0, 313.0, 230.0, 152.0, 108.0, 68.0, 79.0, 42.0, 29.0, 24.0, 20.0, 14.0, 10.0, 13.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.1328125, -9.7919921875, -9.451171875, -9.1103515625, -8.76953125, -8.4287109375, -8.087890625, -7.7470703125, -7.40625, -7.0654296875, -6.724609375, -6.3837890625, -6.04296875, -5.7021484375, -5.361328125, -5.0205078125, -4.6796875, -4.3388671875, -3.998046875, -3.6572265625, -3.31640625, -2.9755859375, -2.634765625, -2.2939453125, -1.953125, -1.6123046875, -1.271484375, -0.9306640625, -0.58984375, -0.2490234375, 0.091796875, 0.4326171875, 0.7734375, 1.1142578125, 1.455078125, 1.7958984375, 2.13671875, 2.4775390625, 2.818359375, 3.1591796875, 3.5, 3.8408203125, 4.181640625, 4.5224609375, 4.86328125, 5.2041015625, 5.544921875, 5.8857421875, 6.2265625, 6.5673828125, 6.908203125, 7.2490234375, 7.58984375, 7.9306640625, 8.271484375, 8.6123046875, 8.953125, 9.2939453125, 9.634765625, 9.9755859375, 10.31640625, 10.6572265625, 10.998046875, 11.3388671875, 11.6796875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 9.0, 8.0, 12.0, 18.0, 21.0, 21.0, 25.0, 32.0, 38.0, 40.0, 45.0, 36.0, 46.0, 40.0, 45.0, 50.0, 44.0, 38.0, 52.0, 47.0, 40.0, 39.0, 35.0, 29.0, 25.0, 24.0, 27.0, 15.0, 15.0, 13.0, 10.0, 13.0, 6.0, 8.0, 9.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.09765625, -3.95611572265625, -3.8145751953125, -3.67303466796875, -3.531494140625, -3.38995361328125, -3.2484130859375, -3.10687255859375, -2.96533203125, -2.82379150390625, -2.6822509765625, -2.54071044921875, -2.399169921875, -2.25762939453125, -2.1160888671875, -1.97454833984375, -1.8330078125, -1.69146728515625, -1.5499267578125, -1.40838623046875, -1.266845703125, -1.12530517578125, -0.9837646484375, -0.84222412109375, -0.70068359375, -0.55914306640625, -0.4176025390625, -0.27606201171875, -0.134521484375, 0.00701904296875, 0.1485595703125, 0.29010009765625, 0.431640625, 0.57318115234375, 0.7147216796875, 0.85626220703125, 0.997802734375, 1.13934326171875, 1.2808837890625, 1.42242431640625, 1.56396484375, 1.70550537109375, 1.8470458984375, 1.98858642578125, 2.130126953125, 2.27166748046875, 2.4132080078125, 2.55474853515625, 2.6962890625, 2.83782958984375, 2.9793701171875, 3.12091064453125, 3.262451171875, 3.40399169921875, 3.5455322265625, 3.68707275390625, 3.82861328125, 3.97015380859375, 4.1116943359375, 4.25323486328125, 4.394775390625, 4.53631591796875, 4.6778564453125, 4.81939697265625, 4.9609375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 6.0, 10.0, 15.0, 32.0, 35.0, 40.0, 76.0, 127.0, 171.0, 293.0, 462.0, 719.0, 1174.0, 1925.0, 3166.0, 5461.0, 9947.0, 18527.0, 38631.0, 92651.0, 276086.0, 906867.0, 1616696.0, 814525.0, 246723.0, 84189.0, 35899.0, 17325.0, 9430.0, 5185.0, 3104.0, 1850.0, 1086.0, 664.0, 433.0, 255.0, 161.0, 98.0, 61.0, 54.0, 41.0, 29.0, 19.0, 11.0, 7.0, 7.0, 1.0, 4.0, 1.0], "bins": [-14.25, -13.8695068359375, -13.489013671875, -13.1085205078125, -12.72802734375, -12.3475341796875, -11.967041015625, -11.5865478515625, -11.2060546875, -10.8255615234375, -10.445068359375, -10.0645751953125, -9.68408203125, -9.3035888671875, -8.923095703125, -8.5426025390625, -8.162109375, -7.7816162109375, -7.401123046875, -7.0206298828125, -6.64013671875, -6.2596435546875, -5.879150390625, -5.4986572265625, -5.1181640625, -4.7376708984375, -4.357177734375, -3.9766845703125, -3.59619140625, -3.2156982421875, -2.835205078125, -2.4547119140625, -2.07421875, -1.6937255859375, -1.313232421875, -0.9327392578125, -0.55224609375, -0.1717529296875, 0.208740234375, 0.5892333984375, 0.9697265625, 1.3502197265625, 1.730712890625, 2.1112060546875, 2.49169921875, 2.8721923828125, 3.252685546875, 3.6331787109375, 4.013671875, 4.3941650390625, 4.774658203125, 5.1551513671875, 5.53564453125, 5.9161376953125, 6.296630859375, 6.6771240234375, 7.0576171875, 7.4381103515625, 7.818603515625, 8.1990966796875, 8.57958984375, 8.9600830078125, 9.340576171875, 9.7210693359375, 10.1015625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 2.0, 4.0, 5.0, 11.0, 11.0, 13.0, 22.0, 14.0, 17.0, 21.0, 33.0, 42.0, 55.0, 67.0, 93.0, 103.0, 154.0, 196.0, 219.0, 256.0, 328.0, 305.0, 336.0, 314.0, 290.0, 236.0, 202.0, 162.0, 129.0, 93.0, 92.0, 54.0, 54.0, 27.0, 27.0, 17.0, 12.0, 15.0, 14.0, 5.0, 6.0, 4.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.109375, -3.0235595703125, -2.937744140625, -2.8519287109375, -2.76611328125, -2.6802978515625, -2.594482421875, -2.5086669921875, -2.4228515625, -2.3370361328125, -2.251220703125, -2.1654052734375, -2.07958984375, -1.9937744140625, -1.907958984375, -1.8221435546875, -1.736328125, -1.6505126953125, -1.564697265625, -1.4788818359375, -1.39306640625, -1.3072509765625, -1.221435546875, -1.1356201171875, -1.0498046875, -0.9639892578125, -0.878173828125, -0.7923583984375, -0.70654296875, -0.6207275390625, -0.534912109375, -0.4490966796875, -0.36328125, -0.2774658203125, -0.191650390625, -0.1058349609375, -0.02001953125, 0.0657958984375, 0.151611328125, 0.2374267578125, 0.3232421875, 0.4090576171875, 0.494873046875, 0.5806884765625, 0.66650390625, 0.7523193359375, 0.838134765625, 0.9239501953125, 1.009765625, 1.0955810546875, 1.181396484375, 1.2672119140625, 1.35302734375, 1.4388427734375, 1.524658203125, 1.6104736328125, 1.6962890625, 1.7821044921875, 1.867919921875, 1.9537353515625, 2.03955078125, 2.1253662109375, 2.211181640625, 2.2969970703125, 2.3828125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 13.0, 3.0, 12.0, 16.0, 39.0, 51.0, 98.0, 133.0, 150.0, 141.0, 141.0, 71.0, 45.0, 31.0, 23.0, 4.0, 8.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.53737449645996, -23.95140266418457, -23.365428924560547, -22.779457092285156, -22.193485260009766, -21.607511520385742, -21.02153968811035, -20.435565948486328, -19.849594116210938, -19.263622283935547, -18.677648544311523, -18.091676712036133, -17.50570297241211, -16.91973114013672, -16.333759307861328, -15.747786521911621, -15.161813735961914, -14.575840950012207, -13.9898681640625, -13.40389633178711, -12.817923545837402, -12.231950759887695, -11.645978927612305, -11.060006141662598, -10.47403335571289, -9.888060569763184, -9.302087783813477, -8.716115951538086, -8.130143165588379, -7.544170379638672, -6.958198070526123, -6.372225761413574, -5.786252021789551, -5.200279235839844, -4.614306926727295, -4.028334617614746, -3.442361831665039, -2.856389284133911, -2.270416736602783, -1.6844444274902344, -1.0984716415405273, -0.5124990940093994, 0.07347345352172852, 0.6594460010528564, 1.2454185485839844, 1.8313910961151123, 2.4173636436462402, 3.003335952758789, 3.589308738708496, 4.175281524658203, 4.761253833770752, 5.347226142883301, 5.933198928833008, 6.519171714782715, 7.105144023895264, 7.6911163330078125, 8.27708911895752, 8.863061904907227, 9.449033737182617, 10.035006523132324, 10.620979309082031, 11.206952095031738, 11.792924880981445, 12.378896713256836, 12.964869499206543]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 9.0, 8.0, 9.0, 5.0, 12.0, 16.0, 20.0, 29.0, 35.0, 23.0, 21.0, 39.0, 42.0, 44.0, 43.0, 48.0, 52.0, 47.0, 36.0, 51.0, 45.0, 47.0, 38.0, 31.0, 32.0, 24.0, 36.0, 25.0, 21.0, 20.0, 12.0, 19.0, 13.0, 4.0, 2.0, 10.0, 7.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.803647994995117, -5.616357803344727, -5.429068088531494, -5.2417778968811035, -5.054487705230713, -4.867197513580322, -4.67990779876709, -4.492617607116699, -4.305327415466309, -4.118037223815918, -3.9307472705841064, -3.743457317352295, -3.5561671257019043, -3.3688771724700928, -3.1815872192382812, -2.9942970275878906, -2.807007074356079, -2.6197171211242676, -2.432426929473877, -2.2451369762420654, -2.057846784591675, -1.8705568313598633, -1.6832667589187622, -1.4959766864776611, -1.30868661403656, -1.121396541595459, -0.9341064691543579, -0.7468164563179016, -0.5595263838768005, -0.37223631143569946, -0.18494629859924316, 0.00234377384185791, 0.18963384628295898, 0.37692391872406006, 0.5642139911651611, 0.7515040040016174, 0.9387940764427185, 1.1260840892791748, 1.3133741617202759, 1.500664234161377, 1.687954306602478, 1.875244379043579, 2.0625343322753906, 2.2498245239257812, 2.4371144771575928, 2.6244046688079834, 2.811694622039795, 2.9989848136901855, 3.186274766921997, 3.3735647201538086, 3.560854911804199, 3.7481448650360107, 3.9354350566864014, 4.122725009918213, 4.3100152015686035, 4.497304916381836, 4.684595108032227, 4.871885299682617, 5.05917501449585, 5.24646520614624, 5.433755397796631, 5.6210455894470215, 5.808335304260254, 5.9956254959106445, 6.182915687561035]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 11.0, 18.0, 17.0, 33.0, 59.0, 77.0, 133.0, 181.0, 242.0, 375.0, 560.0, 926.0, 1414.0, 2326.0, 3680.0, 6196.0, 10307.0, 18784.0, 34191.0, 63978.0, 118464.0, 191582.0, 220152.0, 164259.0, 95255.0, 50967.0, 27224.0, 14852.0, 8628.0, 5240.0, 3028.0, 1915.0, 1224.0, 808.0, 474.0, 320.0, 196.0, 151.0, 88.0, 66.0, 48.0, 29.0, 23.0, 16.0, 11.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.51171875, -2.428863525390625, -2.34600830078125, -2.263153076171875, -2.1802978515625, -2.097442626953125, -2.01458740234375, -1.931732177734375, -1.848876953125, -1.766021728515625, -1.68316650390625, -1.600311279296875, -1.5174560546875, -1.434600830078125, -1.35174560546875, -1.268890380859375, -1.18603515625, -1.103179931640625, -1.02032470703125, -0.937469482421875, -0.8546142578125, -0.771759033203125, -0.68890380859375, -0.606048583984375, -0.523193359375, -0.440338134765625, -0.35748291015625, -0.274627685546875, -0.1917724609375, -0.108917236328125, -0.02606201171875, 0.056793212890625, 0.1396484375, 0.222503662109375, 0.30535888671875, 0.388214111328125, 0.4710693359375, 0.553924560546875, 0.63677978515625, 0.719635009765625, 0.802490234375, 0.885345458984375, 0.96820068359375, 1.051055908203125, 1.1339111328125, 1.216766357421875, 1.29962158203125, 1.382476806640625, 1.46533203125, 1.548187255859375, 1.63104248046875, 1.713897705078125, 1.7967529296875, 1.879608154296875, 1.96246337890625, 2.045318603515625, 2.128173828125, 2.211029052734375, 2.29388427734375, 2.376739501953125, 2.4595947265625, 2.542449951171875, 2.62530517578125, 2.708160400390625, 2.791015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 7.0, 3.0, 6.0, 10.0, 13.0, 19.0, 19.0, 24.0, 22.0, 27.0, 30.0, 25.0, 42.0, 36.0, 49.0, 36.0, 53.0, 46.0, 48.0, 40.0, 55.0, 52.0, 32.0, 36.0, 39.0, 30.0, 26.0, 21.0, 19.0, 22.0, 18.0, 18.0, 14.0, 13.0, 8.0, 7.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2109375, -6.0069580078125, -5.802978515625, -5.5989990234375, -5.39501953125, -5.1910400390625, -4.987060546875, -4.7830810546875, -4.5791015625, -4.3751220703125, -4.171142578125, -3.9671630859375, -3.76318359375, -3.5592041015625, -3.355224609375, -3.1512451171875, -2.947265625, -2.7432861328125, -2.539306640625, -2.3353271484375, -2.13134765625, -1.9273681640625, -1.723388671875, -1.5194091796875, -1.3154296875, -1.1114501953125, -0.907470703125, -0.7034912109375, -0.49951171875, -0.2955322265625, -0.091552734375, 0.1124267578125, 0.31640625, 0.5203857421875, 0.724365234375, 0.9283447265625, 1.13232421875, 1.3363037109375, 1.540283203125, 1.7442626953125, 1.9482421875, 2.1522216796875, 2.356201171875, 2.5601806640625, 2.76416015625, 2.9681396484375, 3.172119140625, 3.3760986328125, 3.580078125, 3.7840576171875, 3.988037109375, 4.1920166015625, 4.39599609375, 4.5999755859375, 4.803955078125, 5.0079345703125, 5.2119140625, 5.4158935546875, 5.619873046875, 5.8238525390625, 6.02783203125, 6.2318115234375, 6.435791015625, 6.6397705078125, 6.84375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 16.0, 16.0, 21.0, 37.0, 61.0, 73.0, 122.0, 153.0, 205.0, 339.0, 546.0, 759.0, 1118.0, 1788.0, 2709.0, 4175.0, 6882.0, 11190.0, 19480.0, 34496.0, 63712.0, 115253.0, 187886.0, 220225.0, 161505.0, 94139.0, 51392.0, 28438.0, 16294.0, 9262.0, 5745.0, 3616.0, 2284.0, 1470.0, 1023.0, 683.0, 426.0, 310.0, 217.0, 171.0, 89.0, 59.0, 71.0, 42.0, 24.0, 8.0, 7.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.73046875, -2.643310546875, -2.55615234375, -2.468994140625, -2.3818359375, -2.294677734375, -2.20751953125, -2.120361328125, -2.033203125, -1.946044921875, -1.85888671875, -1.771728515625, -1.6845703125, -1.597412109375, -1.51025390625, -1.423095703125, -1.3359375, -1.248779296875, -1.16162109375, -1.074462890625, -0.9873046875, -0.900146484375, -0.81298828125, -0.725830078125, -0.638671875, -0.551513671875, -0.46435546875, -0.377197265625, -0.2900390625, -0.202880859375, -0.11572265625, -0.028564453125, 0.05859375, 0.145751953125, 0.23291015625, 0.320068359375, 0.4072265625, 0.494384765625, 0.58154296875, 0.668701171875, 0.755859375, 0.843017578125, 0.93017578125, 1.017333984375, 1.1044921875, 1.191650390625, 1.27880859375, 1.365966796875, 1.453125, 1.540283203125, 1.62744140625, 1.714599609375, 1.8017578125, 1.888916015625, 1.97607421875, 2.063232421875, 2.150390625, 2.237548828125, 2.32470703125, 2.411865234375, 2.4990234375, 2.586181640625, 2.67333984375, 2.760498046875, 2.84765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 6.0, 6.0, 3.0, 7.0, 8.0, 10.0, 16.0, 13.0, 12.0, 28.0, 21.0, 28.0, 29.0, 33.0, 41.0, 31.0, 40.0, 26.0, 37.0, 45.0, 33.0, 46.0, 34.0, 39.0, 46.0, 40.0, 30.0, 30.0, 25.0, 27.0, 31.0, 27.0, 17.0, 19.0, 16.0, 22.0, 10.0, 18.0, 10.0, 9.0, 11.0, 13.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.423828125, -3.31988525390625, -3.2159423828125, -3.11199951171875, -3.008056640625, -2.90411376953125, -2.8001708984375, -2.69622802734375, -2.59228515625, -2.48834228515625, -2.3843994140625, -2.28045654296875, -2.176513671875, -2.07257080078125, -1.9686279296875, -1.86468505859375, -1.7607421875, -1.65679931640625, -1.5528564453125, -1.44891357421875, -1.344970703125, -1.24102783203125, -1.1370849609375, -1.03314208984375, -0.92919921875, -0.82525634765625, -0.7213134765625, -0.61737060546875, -0.513427734375, -0.40948486328125, -0.3055419921875, -0.20159912109375, -0.09765625, 0.00628662109375, 0.1102294921875, 0.21417236328125, 0.318115234375, 0.42205810546875, 0.5260009765625, 0.62994384765625, 0.73388671875, 0.83782958984375, 0.9417724609375, 1.04571533203125, 1.149658203125, 1.25360107421875, 1.3575439453125, 1.46148681640625, 1.5654296875, 1.66937255859375, 1.7733154296875, 1.87725830078125, 1.981201171875, 2.08514404296875, 2.1890869140625, 2.29302978515625, 2.39697265625, 2.50091552734375, 2.6048583984375, 2.70880126953125, 2.812744140625, 2.91668701171875, 3.0206298828125, 3.12457275390625, 3.228515625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 3.0, 10.0, 10.0, 16.0, 12.0, 32.0, 41.0, 63.0, 100.0, 137.0, 214.0, 381.0, 606.0, 967.0, 1764.0, 3272.0, 6472.0, 14159.0, 32317.0, 85225.0, 241519.0, 377921.0, 174343.0, 61837.0, 24872.0, 10950.0, 5233.0, 2717.0, 1304.0, 783.0, 462.0, 298.0, 171.0, 118.0, 70.0, 47.0, 41.0, 31.0, 12.0, 10.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.060546875, -1.996826171875, -1.93310546875, -1.869384765625, -1.8056640625, -1.741943359375, -1.67822265625, -1.614501953125, -1.55078125, -1.487060546875, -1.42333984375, -1.359619140625, -1.2958984375, -1.232177734375, -1.16845703125, -1.104736328125, -1.041015625, -0.977294921875, -0.91357421875, -0.849853515625, -0.7861328125, -0.722412109375, -0.65869140625, -0.594970703125, -0.53125, -0.467529296875, -0.40380859375, -0.340087890625, -0.2763671875, -0.212646484375, -0.14892578125, -0.085205078125, -0.021484375, 0.042236328125, 0.10595703125, 0.169677734375, 0.2333984375, 0.297119140625, 0.36083984375, 0.424560546875, 0.48828125, 0.552001953125, 0.61572265625, 0.679443359375, 0.7431640625, 0.806884765625, 0.87060546875, 0.934326171875, 0.998046875, 1.061767578125, 1.12548828125, 1.189208984375, 1.2529296875, 1.316650390625, 1.38037109375, 1.444091796875, 1.5078125, 1.571533203125, 1.63525390625, 1.698974609375, 1.7626953125, 1.826416015625, 1.89013671875, 1.953857421875, 2.017578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 6.0, 9.0, 7.0, 4.0, 13.0, 9.0, 16.0, 17.0, 25.0, 44.0, 41.0, 50.0, 56.0, 68.0, 96.0, 79.0, 73.0, 78.0, 68.0, 53.0, 43.0, 37.0, 28.0, 20.0, 12.0, 11.0, 8.0, 6.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.784366607666016e-05, -7.53793865442276e-05, -7.291510701179504e-05, -7.045082747936249e-05, -6.798654794692993e-05, -6.552226841449738e-05, -6.305798888206482e-05, -6.059370934963226e-05, -5.812942981719971e-05, -5.566515028476715e-05, -5.3200870752334595e-05, -5.073659121990204e-05, -4.827231168746948e-05, -4.5808032155036926e-05, -4.334375262260437e-05, -4.0879473090171814e-05, -3.841519355773926e-05, -3.59509140253067e-05, -3.3486634492874146e-05, -3.102235496044159e-05, -2.8558075428009033e-05, -2.6093795895576477e-05, -2.362951636314392e-05, -2.1165236830711365e-05, -1.870095729827881e-05, -1.6236677765846252e-05, -1.3772398233413696e-05, -1.130811870098114e-05, -8.843839168548584e-06, -6.379559636116028e-06, -3.915280103683472e-06, -1.4510005712509155e-06, 1.0132789611816406e-06, 3.4775584936141968e-06, 5.941838026046753e-06, 8.406117558479309e-06, 1.0870397090911865e-05, 1.3334676623344421e-05, 1.5798956155776978e-05, 1.8263235688209534e-05, 2.072751522064209e-05, 2.3191794753074646e-05, 2.5656074285507202e-05, 2.8120353817939758e-05, 3.0584633350372314e-05, 3.304891288280487e-05, 3.551319241523743e-05, 3.797747194766998e-05, 4.044175148010254e-05, 4.2906031012535095e-05, 4.537031054496765e-05, 4.783459007740021e-05, 5.0298869609832764e-05, 5.276314914226532e-05, 5.5227428674697876e-05, 5.769170820713043e-05, 6.015598773956299e-05, 6.262026727199554e-05, 6.50845468044281e-05, 6.754882633686066e-05, 7.001310586929321e-05, 7.247738540172577e-05, 7.494166493415833e-05, 7.740594446659088e-05, 7.987022399902344e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 13.0, 15.0, 32.0, 50.0, 79.0, 112.0, 184.0, 255.0, 383.0, 564.0, 975.0, 1763.0, 3135.0, 5807.0, 11872.0, 25440.0, 59941.0, 146921.0, 290096.0, 272251.0, 130115.0, 52715.0, 22710.0, 10691.0, 5418.0, 2874.0, 1560.0, 898.0, 596.0, 359.0, 243.0, 155.0, 90.0, 73.0, 57.0, 34.0, 18.0, 10.0, 11.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5458984375, -1.492462158203125, -1.43902587890625, -1.385589599609375, -1.3321533203125, -1.278717041015625, -1.22528076171875, -1.171844482421875, -1.118408203125, -1.064971923828125, -1.01153564453125, -0.958099365234375, -0.9046630859375, -0.851226806640625, -0.79779052734375, -0.744354248046875, -0.69091796875, -0.637481689453125, -0.58404541015625, -0.530609130859375, -0.4771728515625, -0.423736572265625, -0.37030029296875, -0.316864013671875, -0.263427734375, -0.209991455078125, -0.15655517578125, -0.103118896484375, -0.0496826171875, 0.003753662109375, 0.05718994140625, 0.110626220703125, 0.1640625, 0.217498779296875, 0.27093505859375, 0.324371337890625, 0.3778076171875, 0.431243896484375, 0.48468017578125, 0.538116455078125, 0.591552734375, 0.644989013671875, 0.69842529296875, 0.751861572265625, 0.8052978515625, 0.858734130859375, 0.91217041015625, 0.965606689453125, 1.01904296875, 1.072479248046875, 1.12591552734375, 1.179351806640625, 1.2327880859375, 1.286224365234375, 1.33966064453125, 1.393096923828125, 1.446533203125, 1.499969482421875, 1.55340576171875, 1.606842041015625, 1.6602783203125, 1.713714599609375, 1.76715087890625, 1.820587158203125, 1.8740234375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 3.0, 7.0, 12.0, 6.0, 13.0, 8.0, 15.0, 15.0, 23.0, 21.0, 17.0, 28.0, 32.0, 31.0, 43.0, 58.0, 62.0, 60.0, 79.0, 54.0, 61.0, 51.0, 52.0, 44.0, 31.0, 24.0, 22.0, 21.0, 18.0, 13.0, 11.0, 8.0, 10.0, 5.0, 13.0, 8.0, 6.0, 5.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.377197265625, -0.36551666259765625, -0.3538360595703125, -0.34215545654296875, -0.330474853515625, -0.31879425048828125, -0.3071136474609375, -0.29543304443359375, -0.28375244140625, -0.27207183837890625, -0.2603912353515625, -0.24871063232421875, -0.237030029296875, -0.22534942626953125, -0.2136688232421875, -0.20198822021484375, -0.1903076171875, -0.17862701416015625, -0.1669464111328125, -0.15526580810546875, -0.143585205078125, -0.13190460205078125, -0.1202239990234375, -0.10854339599609375, -0.09686279296875, -0.08518218994140625, -0.0735015869140625, -0.06182098388671875, -0.050140380859375, -0.03845977783203125, -0.0267791748046875, -0.01509857177734375, -0.00341796875, 0.00826263427734375, 0.0199432373046875, 0.03162384033203125, 0.043304443359375, 0.05498504638671875, 0.0666656494140625, 0.07834625244140625, 0.09002685546875, 0.10170745849609375, 0.1133880615234375, 0.12506866455078125, 0.136749267578125, 0.14842987060546875, 0.1601104736328125, 0.17179107666015625, 0.1834716796875, 0.19515228271484375, 0.2068328857421875, 0.21851348876953125, 0.230194091796875, 0.24187469482421875, 0.2535552978515625, 0.26523590087890625, 0.27691650390625, 0.28859710693359375, 0.3002777099609375, 0.31195831298828125, 0.323638916015625, 0.33531951904296875, 0.3470001220703125, 0.35868072509765625, 0.370361328125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 8.0, 11.0, 5.0, 14.0, 18.0, 38.0, 60.0, 99.0, 136.0, 160.0, 135.0, 127.0, 67.0, 48.0, 30.0, 16.0, 8.0, 10.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.418651580810547, -23.833621978759766, -23.248592376708984, -22.66356086730957, -22.07853126525879, -21.493501663208008, -20.908470153808594, -20.323440551757812, -19.73841094970703, -19.15338134765625, -18.56835174560547, -17.983320236206055, -17.398290634155273, -16.813261032104492, -16.228229522705078, -15.643199920654297, -15.058170318603516, -14.473140716552734, -13.888110160827637, -13.303079605102539, -12.718050003051758, -12.133020401000977, -11.547989845275879, -10.962959289550781, -10.3779296875, -9.792900085449219, -9.207869529724121, -8.622838973999023, -8.037809371948242, -7.452779293060303, -6.867749214172363, -6.282719135284424, -5.697690010070801, -5.112659931182861, -4.527629852294922, -3.9425997734069824, -3.357569694519043, -2.7725396156311035, -2.187509536743164, -1.6024794578552246, -1.0174493789672852, -0.4324193000793457, 0.15261077880859375, 0.7376408576965332, 1.3226709365844727, 1.907701015472412, 2.4927310943603516, 3.077761173248291, 3.6627912521362305, 4.24782133102417, 4.832851409912109, 5.417881488800049, 6.002911567687988, 6.587941646575928, 7.172971725463867, 7.758001804351807, 8.343031883239746, 8.928062438964844, 9.513092041015625, 10.098121643066406, 10.683152198791504, 11.268182754516602, 11.853212356567383, 12.438241958618164, 13.023272514343262]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 4.0, 1.0, 10.0, 10.0, 8.0, 6.0, 14.0, 15.0, 29.0, 22.0, 29.0, 26.0, 31.0, 36.0, 42.0, 44.0, 34.0, 51.0, 53.0, 53.0, 37.0, 49.0, 45.0, 43.0, 44.0, 25.0, 29.0, 29.0, 33.0, 26.0, 17.0, 20.0, 15.0, 18.0, 11.0, 5.0, 4.0, 5.0, 10.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.686367511749268, -5.500733375549316, -5.315099239349365, -5.129465103149414, -4.943830966949463, -4.758196830749512, -4.5725626945495605, -4.386928558349609, -4.201294422149658, -4.015660285949707, -3.830026149749756, -3.6443920135498047, -3.4587578773498535, -3.2731237411499023, -3.087489604949951, -2.90185546875, -2.7162210941314697, -2.5305869579315186, -2.3449528217315674, -2.159318685531616, -1.973684549331665, -1.7880504131317139, -1.6024161577224731, -1.416782021522522, -1.2311478853225708, -1.0455137491226196, -0.8598796129226685, -0.6742454171180725, -0.48861128091812134, -0.30297714471817017, -0.11734294891357422, 0.06829118728637695, 0.2539253234863281, 0.4395594596862793, 0.6251935958862305, 0.8108277916908264, 0.9964619278907776, 1.182096004486084, 1.3677302598953247, 1.5533643960952759, 1.738998532295227, 1.9246326684951782, 2.110266923904419, 2.29590106010437, 2.4815351963043213, 2.6671693325042725, 2.8528034687042236, 3.038437604904175, 3.224071741104126, 3.409705877304077, 3.5953400135040283, 3.7809741497039795, 3.9666082859039307, 4.152242660522461, 4.337876796722412, 4.523510932922363, 4.7091450691223145, 4.894779205322266, 5.080413341522217, 5.266047477722168, 5.451681613922119, 5.63731575012207, 5.8229498863220215, 6.008584022521973, 6.194218158721924]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 11.0, 11.0, 18.0, 23.0, 51.0, 73.0, 98.0, 155.0, 197.0, 327.0, 507.0, 860.0, 1400.0, 2339.0, 3844.0, 6710.0, 11952.0, 21587.0, 41710.0, 78042.0, 136078.0, 195617.0, 204053.0, 150009.0, 88622.0, 47182.0, 25226.0, 13357.0, 7570.0, 4322.0, 2523.0, 1510.0, 975.0, 554.0, 357.0, 248.0, 146.0, 93.0, 58.0, 38.0, 34.0, 26.0, 17.0, 6.0, 6.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.61328125, -5.42681884765625, -5.2403564453125, -5.05389404296875, -4.867431640625, -4.68096923828125, -4.4945068359375, -4.30804443359375, -4.12158203125, -3.93511962890625, -3.7486572265625, -3.56219482421875, -3.375732421875, -3.18927001953125, -3.0028076171875, -2.81634521484375, -2.6298828125, -2.44342041015625, -2.2569580078125, -2.07049560546875, -1.884033203125, -1.69757080078125, -1.5111083984375, -1.32464599609375, -1.13818359375, -0.95172119140625, -0.7652587890625, -0.57879638671875, -0.392333984375, -0.20587158203125, -0.0194091796875, 0.16705322265625, 0.353515625, 0.53997802734375, 0.7264404296875, 0.91290283203125, 1.099365234375, 1.28582763671875, 1.4722900390625, 1.65875244140625, 1.84521484375, 2.03167724609375, 2.2181396484375, 2.40460205078125, 2.591064453125, 2.77752685546875, 2.9639892578125, 3.15045166015625, 3.3369140625, 3.52337646484375, 3.7098388671875, 3.89630126953125, 4.082763671875, 4.26922607421875, 4.4556884765625, 4.64215087890625, 4.82861328125, 5.01507568359375, 5.2015380859375, 5.38800048828125, 5.574462890625, 5.76092529296875, 5.9473876953125, 6.13385009765625, 6.3203125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 3.0, 2.0, 4.0, 7.0, 5.0, 15.0, 8.0, 14.0, 20.0, 23.0, 29.0, 29.0, 33.0, 33.0, 44.0, 45.0, 50.0, 49.0, 59.0, 63.0, 50.0, 46.0, 48.0, 46.0, 38.0, 37.0, 31.0, 34.0, 32.0, 17.0, 16.0, 14.0, 7.0, 16.0, 9.0, 7.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.33203125, -6.11053466796875, -5.8890380859375, -5.66754150390625, -5.446044921875, -5.22454833984375, -5.0030517578125, -4.78155517578125, -4.56005859375, -4.33856201171875, -4.1170654296875, -3.89556884765625, -3.674072265625, -3.45257568359375, -3.2310791015625, -3.00958251953125, -2.7880859375, -2.56658935546875, -2.3450927734375, -2.12359619140625, -1.902099609375, -1.68060302734375, -1.4591064453125, -1.23760986328125, -1.01611328125, -0.79461669921875, -0.5731201171875, -0.35162353515625, -0.130126953125, 0.09136962890625, 0.3128662109375, 0.53436279296875, 0.755859375, 0.97735595703125, 1.1988525390625, 1.42034912109375, 1.641845703125, 1.86334228515625, 2.0848388671875, 2.30633544921875, 2.52783203125, 2.74932861328125, 2.9708251953125, 3.19232177734375, 3.413818359375, 3.63531494140625, 3.8568115234375, 4.07830810546875, 4.2998046875, 4.52130126953125, 4.7427978515625, 4.96429443359375, 5.185791015625, 5.40728759765625, 5.6287841796875, 5.85028076171875, 6.07177734375, 6.29327392578125, 6.5147705078125, 6.73626708984375, 6.957763671875, 7.17926025390625, 7.4007568359375, 7.62225341796875, 7.84375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 9.0, 11.0, 12.0, 21.0, 22.0, 49.0, 78.0, 143.0, 190.0, 339.0, 610.0, 1103.0, 2084.0, 3696.0, 7526.0, 14794.0, 29994.0, 59645.0, 112618.0, 185530.0, 222434.0, 181205.0, 109720.0, 58138.0, 29036.0, 14226.0, 7143.0, 3789.0, 1877.0, 1102.0, 592.0, 321.0, 204.0, 105.0, 78.0, 45.0, 30.0, 16.0, 12.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.037353515625, -5.83251953125, -5.627685546875, -5.4228515625, -5.218017578125, -5.01318359375, -4.808349609375, -4.603515625, -4.398681640625, -4.19384765625, -3.989013671875, -3.7841796875, -3.579345703125, -3.37451171875, -3.169677734375, -2.96484375, -2.760009765625, -2.55517578125, -2.350341796875, -2.1455078125, -1.940673828125, -1.73583984375, -1.531005859375, -1.326171875, -1.121337890625, -0.91650390625, -0.711669921875, -0.5068359375, -0.302001953125, -0.09716796875, 0.107666015625, 0.3125, 0.517333984375, 0.72216796875, 0.927001953125, 1.1318359375, 1.336669921875, 1.54150390625, 1.746337890625, 1.951171875, 2.156005859375, 2.36083984375, 2.565673828125, 2.7705078125, 2.975341796875, 3.18017578125, 3.385009765625, 3.58984375, 3.794677734375, 3.99951171875, 4.204345703125, 4.4091796875, 4.614013671875, 4.81884765625, 5.023681640625, 5.228515625, 5.433349609375, 5.63818359375, 5.843017578125, 6.0478515625, 6.252685546875, 6.45751953125, 6.662353515625, 6.8671875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 9.0, 7.0, 10.0, 13.0, 16.0, 27.0, 21.0, 22.0, 27.0, 29.0, 29.0, 35.0, 45.0, 40.0, 52.0, 40.0, 40.0, 42.0, 53.0, 50.0, 44.0, 42.0, 29.0, 33.0, 25.0, 35.0, 27.0, 19.0, 29.0, 16.0, 12.0, 13.0, 13.0, 8.0, 14.0, 6.0, 1.0, 7.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.208984375, -3.095550537109375, -2.98211669921875, -2.868682861328125, -2.7552490234375, -2.641815185546875, -2.52838134765625, -2.414947509765625, -2.301513671875, -2.188079833984375, -2.07464599609375, -1.961212158203125, -1.8477783203125, -1.734344482421875, -1.62091064453125, -1.507476806640625, -1.39404296875, -1.280609130859375, -1.16717529296875, -1.053741455078125, -0.9403076171875, -0.826873779296875, -0.71343994140625, -0.600006103515625, -0.486572265625, -0.373138427734375, -0.25970458984375, -0.146270751953125, -0.0328369140625, 0.080596923828125, 0.19403076171875, 0.307464599609375, 0.4208984375, 0.534332275390625, 0.64776611328125, 0.761199951171875, 0.8746337890625, 0.988067626953125, 1.10150146484375, 1.214935302734375, 1.328369140625, 1.441802978515625, 1.55523681640625, 1.668670654296875, 1.7821044921875, 1.895538330078125, 2.00897216796875, 2.122406005859375, 2.23583984375, 2.349273681640625, 2.46270751953125, 2.576141357421875, 2.6895751953125, 2.803009033203125, 2.91644287109375, 3.029876708984375, 3.143310546875, 3.256744384765625, 3.37017822265625, 3.483612060546875, 3.5970458984375, 3.710479736328125, 3.82391357421875, 3.937347412109375, 4.05078125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 15.0, 16.0, 26.0, 50.0, 50.0, 74.0, 99.0, 146.0, 191.0, 325.0, 490.0, 757.0, 1191.0, 2057.0, 3662.0, 6525.0, 11963.0, 23049.0, 44396.0, 85892.0, 153464.0, 217060.0, 205989.0, 135610.0, 73421.0, 37987.0, 19700.0, 10545.0, 5716.0, 3187.0, 1854.0, 1023.0, 708.0, 418.0, 257.0, 176.0, 119.0, 99.0, 62.0, 54.0, 42.0, 30.0, 13.0, 16.0, 6.0, 4.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.60888671875, -2.5185546875, -2.42822265625, -2.337890625, -2.24755859375, -2.1572265625, -2.06689453125, -1.9765625, -1.88623046875, -1.7958984375, -1.70556640625, -1.615234375, -1.52490234375, -1.4345703125, -1.34423828125, -1.25390625, -1.16357421875, -1.0732421875, -0.98291015625, -0.892578125, -0.80224609375, -0.7119140625, -0.62158203125, -0.53125, -0.44091796875, -0.3505859375, -0.26025390625, -0.169921875, -0.07958984375, 0.0107421875, 0.10107421875, 0.19140625, 0.28173828125, 0.3720703125, 0.46240234375, 0.552734375, 0.64306640625, 0.7333984375, 0.82373046875, 0.9140625, 1.00439453125, 1.0947265625, 1.18505859375, 1.275390625, 1.36572265625, 1.4560546875, 1.54638671875, 1.63671875, 1.72705078125, 1.8173828125, 1.90771484375, 1.998046875, 2.08837890625, 2.1787109375, 2.26904296875, 2.359375, 2.44970703125, 2.5400390625, 2.63037109375, 2.720703125, 2.81103515625, 2.9013671875, 2.99169921875, 3.08203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 5.0, 12.0, 4.0, 10.0, 9.0, 11.0, 15.0, 24.0, 18.0, 33.0, 30.0, 35.0, 46.0, 38.0, 36.0, 54.0, 36.0, 55.0, 52.0, 59.0, 48.0, 47.0, 47.0, 40.0, 32.0, 28.0, 25.0, 25.0, 23.0, 15.0, 13.0, 13.0, 11.0, 4.0, 10.0, 10.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00017440319061279297, -0.00016897358000278473, -0.0001635439693927765, -0.00015811435878276825, -0.00015268474817276, -0.00014725513756275177, -0.00014182552695274353, -0.0001363959163427353, -0.00013096630573272705, -0.0001255366951227188, -0.00012010708451271057, -0.00011467747390270233, -0.00010924786329269409, -0.00010381825268268585, -9.838864207267761e-05, -9.295903146266937e-05, -8.752942085266113e-05, -8.209981024265289e-05, -7.667019963264465e-05, -7.124058902263641e-05, -6.581097841262817e-05, -6.0381367802619934e-05, -5.4951757192611694e-05, -4.9522146582603455e-05, -4.4092535972595215e-05, -3.8662925362586975e-05, -3.3233314752578735e-05, -2.7803704142570496e-05, -2.2374093532562256e-05, -1.6944482922554016e-05, -1.1514872312545776e-05, -6.085261702537537e-06, -6.556510925292969e-07, 4.773959517478943e-06, 1.0203570127487183e-05, 1.5633180737495422e-05, 2.1062791347503662e-05, 2.6492401957511902e-05, 3.192201256752014e-05, 3.735162317752838e-05, 4.278123378753662e-05, 4.821084439754486e-05, 5.36404550075531e-05, 5.907006561756134e-05, 6.449967622756958e-05, 6.992928683757782e-05, 7.535889744758606e-05, 8.07885080575943e-05, 8.621811866760254e-05, 9.164772927761078e-05, 9.707733988761902e-05, 0.00010250695049762726, 0.0001079365611076355, 0.00011336617171764374, 0.00011879578232765198, 0.00012422539293766022, 0.00012965500354766846, 0.0001350846141576767, 0.00014051422476768494, 0.00014594383537769318, 0.00015137344598770142, 0.00015680305659770966, 0.0001622326672077179, 0.00016766227781772614, 0.00017309188842773438]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 11.0, 10.0, 14.0, 20.0, 26.0, 33.0, 49.0, 54.0, 86.0, 151.0, 171.0, 265.0, 507.0, 844.0, 1609.0, 3299.0, 7060.0, 16246.0, 40014.0, 97698.0, 212139.0, 292363.0, 209654.0, 97023.0, 39170.0, 16094.0, 6972.0, 3218.0, 1619.0, 807.0, 428.0, 270.0, 169.0, 134.0, 90.0, 60.0, 59.0, 25.0, 24.0, 21.0, 14.0, 9.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1796875, -3.06402587890625, -2.9483642578125, -2.83270263671875, -2.717041015625, -2.60137939453125, -2.4857177734375, -2.37005615234375, -2.25439453125, -2.13873291015625, -2.0230712890625, -1.90740966796875, -1.791748046875, -1.67608642578125, -1.5604248046875, -1.44476318359375, -1.3291015625, -1.21343994140625, -1.0977783203125, -0.98211669921875, -0.866455078125, -0.75079345703125, -0.6351318359375, -0.51947021484375, -0.40380859375, -0.28814697265625, -0.1724853515625, -0.05682373046875, 0.058837890625, 0.17449951171875, 0.2901611328125, 0.40582275390625, 0.521484375, 0.63714599609375, 0.7528076171875, 0.86846923828125, 0.984130859375, 1.09979248046875, 1.2154541015625, 1.33111572265625, 1.44677734375, 1.56243896484375, 1.6781005859375, 1.79376220703125, 1.909423828125, 2.02508544921875, 2.1407470703125, 2.25640869140625, 2.3720703125, 2.48773193359375, 2.6033935546875, 2.71905517578125, 2.834716796875, 2.95037841796875, 3.0660400390625, 3.18170166015625, 3.29736328125, 3.41302490234375, 3.5286865234375, 3.64434814453125, 3.760009765625, 3.87567138671875, 3.9913330078125, 4.10699462890625, 4.22265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 8.0, 6.0, 7.0, 8.0, 12.0, 9.0, 11.0, 19.0, 20.0, 16.0, 25.0, 49.0, 27.0, 37.0, 44.0, 53.0, 58.0, 49.0, 63.0, 52.0, 51.0, 55.0, 48.0, 39.0, 44.0, 31.0, 34.0, 21.0, 24.0, 19.0, 12.0, 13.0, 13.0, 5.0, 8.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.658203125, -0.6347808837890625, -0.611358642578125, -0.5879364013671875, -0.56451416015625, -0.5410919189453125, -0.517669677734375, -0.4942474365234375, -0.4708251953125, -0.4474029541015625, -0.423980712890625, -0.4005584716796875, -0.37713623046875, -0.3537139892578125, -0.330291748046875, -0.3068695068359375, -0.283447265625, -0.2600250244140625, -0.236602783203125, -0.2131805419921875, -0.18975830078125, -0.1663360595703125, -0.142913818359375, -0.1194915771484375, -0.0960693359375, -0.0726470947265625, -0.049224853515625, -0.0258026123046875, -0.00238037109375, 0.0210418701171875, 0.044464111328125, 0.0678863525390625, 0.09130859375, 0.1147308349609375, 0.138153076171875, 0.1615753173828125, 0.18499755859375, 0.2084197998046875, 0.231842041015625, 0.2552642822265625, 0.2786865234375, 0.3021087646484375, 0.325531005859375, 0.3489532470703125, 0.37237548828125, 0.3957977294921875, 0.419219970703125, 0.4426422119140625, 0.466064453125, 0.4894866943359375, 0.512908935546875, 0.5363311767578125, 0.55975341796875, 0.5831756591796875, 0.606597900390625, 0.6300201416015625, 0.6534423828125, 0.6768646240234375, 0.700286865234375, 0.7237091064453125, 0.74713134765625, 0.7705535888671875, 0.793975830078125, 0.8173980712890625, 0.8408203125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 5.0, 4.0, 15.0, 15.0, 25.0, 51.0, 73.0, 116.0, 153.0, 134.0, 133.0, 103.0, 64.0, 35.0, 23.0, 15.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.390901565551758, -21.834444046020508, -21.27798843383789, -20.72153091430664, -20.16507339477539, -19.60861587524414, -19.052160263061523, -18.495702743530273, -17.939247131347656, -17.382789611816406, -16.82633399963379, -16.26987648010254, -15.713418960571289, -15.156962394714355, -14.600505828857422, -14.044048309326172, -13.487590789794922, -12.931134223937988, -12.374676704406738, -11.818220138549805, -11.261762619018555, -10.705306053161621, -10.148849487304688, -9.592391967773438, -9.035935401916504, -8.47947883605957, -7.92302131652832, -7.366564750671387, -6.810107707977295, -6.253650665283203, -5.6971940994262695, -5.140737056732178, -4.584280014038086, -4.027822971343994, -3.4713661670684814, -2.9149093627929688, -2.358452320098877, -1.8019952774047852, -1.2455384731292725, -0.6890816688537598, -0.13262462615966797, 0.4238322973251343, 0.9802892208099365, 1.5367461442947388, 2.093203067779541, 2.649660110473633, 3.2061169147491455, 3.762573719024658, 4.31903076171875, 4.875487804412842, 5.431944847106934, 5.988401412963867, 6.544858455657959, 7.101315498352051, 7.657772064208984, 8.214229583740234, 8.770686149597168, 9.327142715454102, 9.883600234985352, 10.440056800842285, 10.996513366699219, 11.552970886230469, 12.109427452087402, 12.665884017944336, 13.222341537475586]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 7.0, 10.0, 7.0, 17.0, 10.0, 15.0, 16.0, 24.0, 29.0, 26.0, 34.0, 27.0, 32.0, 45.0, 44.0, 24.0, 47.0, 43.0, 40.0, 42.0, 37.0, 48.0, 43.0, 34.0, 24.0, 26.0, 40.0, 24.0, 33.0, 21.0, 11.0, 13.0, 15.0, 14.0, 10.0, 13.0, 4.0, 5.0, 8.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.121384620666504, -4.95353364944458, -4.785682201385498, -4.617831230163574, -4.44998025894165, -4.282129287719727, -4.1142778396606445, -3.9464268684387207, -3.778575897216797, -3.610724687576294, -3.44287371635437, -3.275022506713867, -3.1071715354919434, -2.9393203258514404, -2.7714691162109375, -2.6036181449890137, -2.4357669353485107, -2.267915725708008, -2.100064754486084, -1.932213544845581, -1.7643625736236572, -1.5965113639831543, -1.428660273551941, -1.2608091831207275, -1.0929580926895142, -0.9251070022583008, -0.7572559118270874, -0.5894047617912292, -0.42155367136001587, -0.2537025809288025, -0.08585143089294434, 0.08199965953826904, 0.24985074996948242, 0.4177018404006958, 0.5855529308319092, 0.7534040808677673, 0.9212551712989807, 1.0891063213348389, 1.2569574117660522, 1.4248085021972656, 1.592659592628479, 1.7605106830596924, 1.9283617734909058, 2.096212863922119, 2.264064073562622, 2.431915044784546, 2.599766254425049, 2.7676172256469727, 2.9354684352874756, 3.1033196449279785, 3.2711706161499023, 3.4390218257904053, 3.606872797012329, 3.774724006652832, 3.942574977874756, 4.11042594909668, 4.278277397155762, 4.4461283683776855, 4.613979816436768, 4.781830787658691, 4.949681758880615, 5.117532730102539, 5.285384178161621, 5.453235149383545, 5.621086120605469]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 10.0, 12.0, 10.0, 20.0, 29.0, 41.0, 57.0, 85.0, 116.0, 177.0, 288.0, 355.0, 599.0, 879.0, 1493.0, 2363.0, 3821.0, 6575.0, 12141.0, 25232.0, 64131.0, 223690.0, 932350.0, 1871904.0, 760020.0, 179736.0, 55171.0, 23322.0, 11923.0, 6687.0, 3897.0, 2439.0, 1528.0, 1039.0, 681.0, 433.0, 290.0, 213.0, 160.0, 107.0, 75.0, 54.0, 35.0, 36.0, 16.0, 14.0, 9.0, 6.0, 8.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0], "bins": [-12.9765625, -12.576416015625, -12.17626953125, -11.776123046875, -11.3759765625, -10.975830078125, -10.57568359375, -10.175537109375, -9.775390625, -9.375244140625, -8.97509765625, -8.574951171875, -8.1748046875, -7.774658203125, -7.37451171875, -6.974365234375, -6.57421875, -6.174072265625, -5.77392578125, -5.373779296875, -4.9736328125, -4.573486328125, -4.17333984375, -3.773193359375, -3.373046875, -2.972900390625, -2.57275390625, -2.172607421875, -1.7724609375, -1.372314453125, -0.97216796875, -0.572021484375, -0.171875, 0.228271484375, 0.62841796875, 1.028564453125, 1.4287109375, 1.828857421875, 2.22900390625, 2.629150390625, 3.029296875, 3.429443359375, 3.82958984375, 4.229736328125, 4.6298828125, 5.030029296875, 5.43017578125, 5.830322265625, 6.23046875, 6.630615234375, 7.03076171875, 7.430908203125, 7.8310546875, 8.231201171875, 8.63134765625, 9.031494140625, 9.431640625, 9.831787109375, 10.23193359375, 10.632080078125, 11.0322265625, 11.432373046875, 11.83251953125, 12.232666015625, 12.6328125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 7.0, 7.0, 5.0, 17.0, 19.0, 14.0, 12.0, 10.0, 20.0, 29.0, 34.0, 37.0, 38.0, 43.0, 59.0, 40.0, 36.0, 47.0, 40.0, 54.0, 48.0, 42.0, 47.0, 32.0, 36.0, 28.0, 37.0, 20.0, 25.0, 18.0, 13.0, 11.0, 15.0, 13.0, 9.0, 6.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.34375, -4.20880126953125, -4.0738525390625, -3.93890380859375, -3.803955078125, -3.66900634765625, -3.5340576171875, -3.39910888671875, -3.26416015625, -3.12921142578125, -2.9942626953125, -2.85931396484375, -2.724365234375, -2.58941650390625, -2.4544677734375, -2.31951904296875, -2.1845703125, -2.04962158203125, -1.9146728515625, -1.77972412109375, -1.644775390625, -1.50982666015625, -1.3748779296875, -1.23992919921875, -1.10498046875, -0.97003173828125, -0.8350830078125, -0.70013427734375, -0.565185546875, -0.43023681640625, -0.2952880859375, -0.16033935546875, -0.025390625, 0.10955810546875, 0.2445068359375, 0.37945556640625, 0.514404296875, 0.64935302734375, 0.7843017578125, 0.91925048828125, 1.05419921875, 1.18914794921875, 1.3240966796875, 1.45904541015625, 1.593994140625, 1.72894287109375, 1.8638916015625, 1.99884033203125, 2.1337890625, 2.26873779296875, 2.4036865234375, 2.53863525390625, 2.673583984375, 2.80853271484375, 2.9434814453125, 3.07843017578125, 3.21337890625, 3.34832763671875, 3.4832763671875, 3.61822509765625, 3.753173828125, 3.88812255859375, 4.0230712890625, 4.15802001953125, 4.29296875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 24.0, 25.0, 35.0, 55.0, 77.0, 139.0, 229.0, 343.0, 553.0, 913.0, 1525.0, 2553.0, 4294.0, 7599.0, 13629.0, 26086.0, 56007.0, 144541.0, 472255.0, 1407689.0, 1360993.0, 445860.0, 138213.0, 54084.0, 25620.0, 13104.0, 7350.0, 4251.0, 2475.0, 1450.0, 876.0, 535.0, 343.0, 196.0, 121.0, 90.0, 46.0, 36.0, 10.0, 17.0, 7.0, 4.0, 6.0, 7.0, 6.0, 1.0, 0.0, 3.0], "bins": [-13.921875, -13.534912109375, -13.14794921875, -12.760986328125, -12.3740234375, -11.987060546875, -11.60009765625, -11.213134765625, -10.826171875, -10.439208984375, -10.05224609375, -9.665283203125, -9.2783203125, -8.891357421875, -8.50439453125, -8.117431640625, -7.73046875, -7.343505859375, -6.95654296875, -6.569580078125, -6.1826171875, -5.795654296875, -5.40869140625, -5.021728515625, -4.634765625, -4.247802734375, -3.86083984375, -3.473876953125, -3.0869140625, -2.699951171875, -2.31298828125, -1.926025390625, -1.5390625, -1.152099609375, -0.76513671875, -0.378173828125, 0.0087890625, 0.395751953125, 0.78271484375, 1.169677734375, 1.556640625, 1.943603515625, 2.33056640625, 2.717529296875, 3.1044921875, 3.491455078125, 3.87841796875, 4.265380859375, 4.65234375, 5.039306640625, 5.42626953125, 5.813232421875, 6.2001953125, 6.587158203125, 6.97412109375, 7.361083984375, 7.748046875, 8.135009765625, 8.52197265625, 8.908935546875, 9.2958984375, 9.682861328125, 10.06982421875, 10.456787109375, 10.84375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 6.0, 13.0, 13.0, 16.0, 26.0, 26.0, 35.0, 39.0, 59.0, 71.0, 96.0, 129.0, 174.0, 219.0, 264.0, 321.0, 350.0, 373.0, 333.0, 304.0, 247.0, 217.0, 154.0, 129.0, 112.0, 60.0, 65.0, 38.0, 45.0, 33.0, 18.0, 14.0, 14.0, 16.0, 9.0, 5.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.921875, -2.832122802734375, -2.74237060546875, -2.652618408203125, -2.5628662109375, -2.473114013671875, -2.38336181640625, -2.293609619140625, -2.203857421875, -2.114105224609375, -2.02435302734375, -1.934600830078125, -1.8448486328125, -1.755096435546875, -1.66534423828125, -1.575592041015625, -1.48583984375, -1.396087646484375, -1.30633544921875, -1.216583251953125, -1.1268310546875, -1.037078857421875, -0.94732666015625, -0.857574462890625, -0.767822265625, -0.678070068359375, -0.58831787109375, -0.498565673828125, -0.4088134765625, -0.319061279296875, -0.22930908203125, -0.139556884765625, -0.0498046875, 0.039947509765625, 0.12969970703125, 0.219451904296875, 0.3092041015625, 0.398956298828125, 0.48870849609375, 0.578460693359375, 0.668212890625, 0.757965087890625, 0.84771728515625, 0.937469482421875, 1.0272216796875, 1.116973876953125, 1.20672607421875, 1.296478271484375, 1.38623046875, 1.475982666015625, 1.56573486328125, 1.655487060546875, 1.7452392578125, 1.834991455078125, 1.92474365234375, 2.014495849609375, 2.104248046875, 2.194000244140625, 2.28375244140625, 2.373504638671875, 2.4632568359375, 2.553009033203125, 2.64276123046875, 2.732513427734375, 2.822265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 11.0, 8.0, 8.0, 18.0, 32.0, 33.0, 57.0, 91.0, 152.0, 145.0, 130.0, 115.0, 62.0, 51.0, 32.0, 22.0, 8.0, 12.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.550376892089844, -20.00428581237793, -19.458194732666016, -18.9121036529541, -18.366012573242188, -17.819923400878906, -17.27383041381836, -16.727741241455078, -16.181650161743164, -15.63555908203125, -15.089468002319336, -14.543376922607422, -13.997286796569824, -13.45119571685791, -12.905104637145996, -12.359013557434082, -11.812922477722168, -11.266831398010254, -10.72074031829834, -10.174650192260742, -9.628559112548828, -9.082468032836914, -8.536376953125, -7.990285873413086, -7.44419527053833, -6.898104190826416, -6.35201358795166, -5.805922508239746, -5.259831428527832, -4.713740825653076, -4.167649745941162, -3.621558904647827, -3.0754690170288086, -2.5293781757354736, -1.9832872152328491, -1.4371962547302246, -0.8911054134368896, -0.3450145721435547, 0.20107650756835938, 0.7471673488616943, 1.2932581901550293, 1.8393490314483643, 2.385439872741699, 2.9315309524536133, 3.4776217937469482, 4.023712635040283, 4.569803714752197, 5.115894317626953, 5.661985397338867, 6.208076477050781, 6.754167079925537, 7.300258159637451, 7.846348762512207, 8.392439842224121, 8.938530921936035, 9.48462200164795, 10.030712127685547, 10.576803207397461, 11.122894287109375, 11.668985366821289, 12.215075492858887, 12.7611665725708, 13.307257652282715, 13.853348731994629, 14.399439811706543]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 11.0, 5.0, 13.0, 13.0, 12.0, 18.0, 12.0, 12.0, 29.0, 29.0, 32.0, 39.0, 45.0, 52.0, 37.0, 52.0, 42.0, 46.0, 42.0, 45.0, 34.0, 50.0, 45.0, 32.0, 41.0, 28.0, 24.0, 15.0, 27.0, 16.0, 19.0, 9.0, 14.0, 9.0, 12.0, 12.0, 3.0, 1.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.3932414054870605, -5.21558141708374, -5.03792142868042, -4.8602614402771, -4.682601451873779, -4.504941463470459, -4.327281951904297, -4.149621963500977, -3.971961736679077, -3.794301748275757, -3.6166417598724365, -3.4389820098876953, -3.261322021484375, -3.0836620330810547, -2.9060020446777344, -2.728342056274414, -2.5506820678710938, -2.3730220794677734, -2.195362091064453, -2.017702102661133, -1.840042233467102, -1.6623822450637817, -1.484722375869751, -1.3070623874664307, -1.1294023990631104, -0.95174241065979, -0.7740824818611145, -0.596422553062439, -0.41876256465911865, -0.24110257625579834, -0.06344270706176758, 0.11421728134155273, 0.29187774658203125, 0.4695377051830292, 0.6471976637840271, 0.8248575925827026, 1.002517580986023, 1.1801775693893433, 1.357837438583374, 1.5354974269866943, 1.7131574153900146, 1.890817403793335, 2.0684773921966553, 2.2461371421813965, 2.423797130584717, 2.601457118988037, 2.7791171073913574, 2.9567770957946777, 3.134437084197998, 3.3120970726013184, 3.4897570610046387, 3.667417049407959, 3.8450770378112793, 4.0227370262146, 4.200396537780762, 4.378056526184082, 4.555716514587402, 4.733376502990723, 4.911036491394043, 5.088696479797363, 5.266356468200684, 5.444016456604004, 5.621676445007324, 5.7993364334106445, 5.976996421813965]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 11.0, 15.0, 21.0, 34.0, 42.0, 71.0, 113.0, 148.0, 234.0, 313.0, 522.0, 781.0, 1228.0, 1945.0, 3232.0, 5237.0, 8964.0, 15778.0, 28061.0, 51888.0, 95986.0, 167766.0, 223434.0, 189945.0, 113315.0, 60878.0, 33337.0, 18640.0, 10471.0, 6254.0, 3686.0, 2235.0, 1429.0, 903.0, 567.0, 380.0, 212.0, 150.0, 110.0, 67.0, 49.0, 26.0, 33.0, 10.0, 7.0, 11.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.548828125, -2.46563720703125, -2.3824462890625, -2.29925537109375, -2.216064453125, -2.13287353515625, -2.0496826171875, -1.96649169921875, -1.88330078125, -1.80010986328125, -1.7169189453125, -1.63372802734375, -1.550537109375, -1.46734619140625, -1.3841552734375, -1.30096435546875, -1.2177734375, -1.13458251953125, -1.0513916015625, -0.96820068359375, -0.885009765625, -0.80181884765625, -0.7186279296875, -0.63543701171875, -0.55224609375, -0.46905517578125, -0.3858642578125, -0.30267333984375, -0.219482421875, -0.13629150390625, -0.0531005859375, 0.03009033203125, 0.11328125, 0.19647216796875, 0.2796630859375, 0.36285400390625, 0.446044921875, 0.52923583984375, 0.6124267578125, 0.69561767578125, 0.77880859375, 0.86199951171875, 0.9451904296875, 1.02838134765625, 1.111572265625, 1.19476318359375, 1.2779541015625, 1.36114501953125, 1.4443359375, 1.52752685546875, 1.6107177734375, 1.69390869140625, 1.777099609375, 1.86029052734375, 1.9434814453125, 2.02667236328125, 2.10986328125, 2.19305419921875, 2.2762451171875, 2.35943603515625, 2.442626953125, 2.52581787109375, 2.6090087890625, 2.69219970703125, 2.775390625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 11.0, 3.0, 8.0, 6.0, 10.0, 12.0, 14.0, 13.0, 21.0, 21.0, 21.0, 25.0, 50.0, 35.0, 38.0, 37.0, 46.0, 43.0, 37.0, 51.0, 53.0, 47.0, 51.0, 36.0, 39.0, 35.0, 35.0, 22.0, 30.0, 17.0, 25.0, 15.0, 18.0, 14.0, 10.0, 11.0, 6.0, 8.0, 8.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.591064453125, -5.39697265625, -5.202880859375, -5.0087890625, -4.814697265625, -4.62060546875, -4.426513671875, -4.232421875, -4.038330078125, -3.84423828125, -3.650146484375, -3.4560546875, -3.261962890625, -3.06787109375, -2.873779296875, -2.6796875, -2.485595703125, -2.29150390625, -2.097412109375, -1.9033203125, -1.709228515625, -1.51513671875, -1.321044921875, -1.126953125, -0.932861328125, -0.73876953125, -0.544677734375, -0.3505859375, -0.156494140625, 0.03759765625, 0.231689453125, 0.42578125, 0.619873046875, 0.81396484375, 1.008056640625, 1.2021484375, 1.396240234375, 1.59033203125, 1.784423828125, 1.978515625, 2.172607421875, 2.36669921875, 2.560791015625, 2.7548828125, 2.948974609375, 3.14306640625, 3.337158203125, 3.53125, 3.725341796875, 3.91943359375, 4.113525390625, 4.3076171875, 4.501708984375, 4.69580078125, 4.889892578125, 5.083984375, 5.278076171875, 5.47216796875, 5.666259765625, 5.8603515625, 6.054443359375, 6.24853515625, 6.442626953125, 6.63671875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 14.0, 16.0, 16.0, 40.0, 56.0, 81.0, 137.0, 190.0, 298.0, 442.0, 708.0, 1054.0, 1731.0, 2836.0, 4658.0, 7940.0, 13910.0, 25070.0, 45288.0, 83133.0, 148019.0, 219186.0, 204188.0, 128598.0, 70903.0, 38729.0, 21234.0, 12154.0, 6958.0, 4186.0, 2493.0, 1582.0, 957.0, 584.0, 377.0, 257.0, 188.0, 124.0, 77.0, 45.0, 29.0, 31.0, 14.0, 7.0, 5.0, 3.0, 3.0, 0.0, 6.0, 3.0, 1.0], "bins": [-3.181640625, -3.09039306640625, -2.9991455078125, -2.90789794921875, -2.816650390625, -2.72540283203125, -2.6341552734375, -2.54290771484375, -2.45166015625, -2.36041259765625, -2.2691650390625, -2.17791748046875, -2.086669921875, -1.99542236328125, -1.9041748046875, -1.81292724609375, -1.7216796875, -1.63043212890625, -1.5391845703125, -1.44793701171875, -1.356689453125, -1.26544189453125, -1.1741943359375, -1.08294677734375, -0.99169921875, -0.90045166015625, -0.8092041015625, -0.71795654296875, -0.626708984375, -0.53546142578125, -0.4442138671875, -0.35296630859375, -0.26171875, -0.17047119140625, -0.0792236328125, 0.01202392578125, 0.103271484375, 0.19451904296875, 0.2857666015625, 0.37701416015625, 0.46826171875, 0.55950927734375, 0.6507568359375, 0.74200439453125, 0.833251953125, 0.92449951171875, 1.0157470703125, 1.10699462890625, 1.1982421875, 1.28948974609375, 1.3807373046875, 1.47198486328125, 1.563232421875, 1.65447998046875, 1.7457275390625, 1.83697509765625, 1.92822265625, 2.01947021484375, 2.1107177734375, 2.20196533203125, 2.293212890625, 2.38446044921875, 2.4757080078125, 2.56695556640625, 2.658203125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 8.0, 16.0, 11.0, 16.0, 19.0, 17.0, 24.0, 16.0, 35.0, 28.0, 30.0, 33.0, 42.0, 35.0, 33.0, 38.0, 47.0, 40.0, 47.0, 42.0, 47.0, 43.0, 33.0, 28.0, 35.0, 28.0, 33.0, 34.0, 23.0, 26.0, 21.0, 16.0, 12.0, 2.0, 7.0, 9.0, 7.0, 4.0, 2.0, 0.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.421875, -3.3111572265625, -3.200439453125, -3.0897216796875, -2.97900390625, -2.8682861328125, -2.757568359375, -2.6468505859375, -2.5361328125, -2.4254150390625, -2.314697265625, -2.2039794921875, -2.09326171875, -1.9825439453125, -1.871826171875, -1.7611083984375, -1.650390625, -1.5396728515625, -1.428955078125, -1.3182373046875, -1.20751953125, -1.0968017578125, -0.986083984375, -0.8753662109375, -0.7646484375, -0.6539306640625, -0.543212890625, -0.4324951171875, -0.32177734375, -0.2110595703125, -0.100341796875, 0.0103759765625, 0.12109375, 0.2318115234375, 0.342529296875, 0.4532470703125, 0.56396484375, 0.6746826171875, 0.785400390625, 0.8961181640625, 1.0068359375, 1.1175537109375, 1.228271484375, 1.3389892578125, 1.44970703125, 1.5604248046875, 1.671142578125, 1.7818603515625, 1.892578125, 2.0032958984375, 2.114013671875, 2.2247314453125, 2.33544921875, 2.4461669921875, 2.556884765625, 2.6676025390625, 2.7783203125, 2.8890380859375, 2.999755859375, 3.1104736328125, 3.22119140625, 3.3319091796875, 3.442626953125, 3.5533447265625, 3.6640625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 7.0, 12.0, 10.0, 19.0, 28.0, 40.0, 59.0, 110.0, 140.0, 212.0, 337.0, 503.0, 831.0, 1324.0, 2190.0, 3526.0, 6337.0, 11223.0, 21065.0, 41669.0, 86252.0, 183396.0, 288517.0, 203576.0, 97735.0, 46746.0, 23485.0, 12340.0, 6781.0, 3777.0, 2415.0, 1360.0, 866.0, 550.0, 369.0, 240.0, 147.0, 119.0, 70.0, 48.0, 36.0, 19.0, 29.0, 15.0, 10.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3359375, -1.290771484375, -1.24560546875, -1.200439453125, -1.1552734375, -1.110107421875, -1.06494140625, -1.019775390625, -0.974609375, -0.929443359375, -0.88427734375, -0.839111328125, -0.7939453125, -0.748779296875, -0.70361328125, -0.658447265625, -0.61328125, -0.568115234375, -0.52294921875, -0.477783203125, -0.4326171875, -0.387451171875, -0.34228515625, -0.297119140625, -0.251953125, -0.206787109375, -0.16162109375, -0.116455078125, -0.0712890625, -0.026123046875, 0.01904296875, 0.064208984375, 0.109375, 0.154541015625, 0.19970703125, 0.244873046875, 0.2900390625, 0.335205078125, 0.38037109375, 0.425537109375, 0.470703125, 0.515869140625, 0.56103515625, 0.606201171875, 0.6513671875, 0.696533203125, 0.74169921875, 0.786865234375, 0.83203125, 0.877197265625, 0.92236328125, 0.967529296875, 1.0126953125, 1.057861328125, 1.10302734375, 1.148193359375, 1.193359375, 1.238525390625, 1.28369140625, 1.328857421875, 1.3740234375, 1.419189453125, 1.46435546875, 1.509521484375, 1.5546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 4.0, 4.0, 12.0, 13.0, 16.0, 25.0, 38.0, 25.0, 46.0, 55.0, 84.0, 66.0, 71.0, 81.0, 85.0, 72.0, 70.0, 51.0, 51.0, 26.0, 24.0, 29.0, 12.0, 10.0, 8.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.115436553955078e-05, -5.862768739461899e-05, -5.6101009249687195e-05, -5.35743311047554e-05, -5.104765295982361e-05, -4.8520974814891815e-05, -4.599429666996002e-05, -4.346761852502823e-05, -4.0940940380096436e-05, -3.841426223516464e-05, -3.588758409023285e-05, -3.3360905945301056e-05, -3.083422780036926e-05, -2.830754965543747e-05, -2.5780871510505676e-05, -2.3254193365573883e-05, -2.072751522064209e-05, -1.8200837075710297e-05, -1.5674158930778503e-05, -1.314748078584671e-05, -1.0620802640914917e-05, -8.094124495983124e-06, -5.5674463510513306e-06, -3.0407682061195374e-06, -5.140900611877441e-07, 2.012588083744049e-06, 4.539266228675842e-06, 7.0659443736076355e-06, 9.592622518539429e-06, 1.2119300663471222e-05, 1.4645978808403015e-05, 1.717265695333481e-05, 1.96993350982666e-05, 2.2226013243198395e-05, 2.4752691388130188e-05, 2.727936953306198e-05, 2.9806047677993774e-05, 3.233272582292557e-05, 3.485940396785736e-05, 3.7386082112789154e-05, 3.991276025772095e-05, 4.243943840265274e-05, 4.4966116547584534e-05, 4.749279469251633e-05, 5.001947283744812e-05, 5.254615098237991e-05, 5.5072829127311707e-05, 5.75995072722435e-05, 6.012618541717529e-05, 6.265286356210709e-05, 6.517954170703888e-05, 6.770621985197067e-05, 7.023289799690247e-05, 7.275957614183426e-05, 7.528625428676605e-05, 7.781293243169785e-05, 8.033961057662964e-05, 8.286628872156143e-05, 8.539296686649323e-05, 8.791964501142502e-05, 9.044632315635681e-05, 9.29730013012886e-05, 9.54996794462204e-05, 9.802635759115219e-05, 0.00010055303573608398]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 4.0, 15.0, 20.0, 24.0, 30.0, 65.0, 104.0, 180.0, 313.0, 555.0, 880.0, 1609.0, 2770.0, 5202.0, 10626.0, 22395.0, 49745.0, 114703.0, 237027.0, 288863.0, 171968.0, 76332.0, 33402.0, 15474.0, 7509.0, 3898.0, 2003.0, 1206.0, 676.0, 365.0, 247.0, 137.0, 73.0, 45.0, 27.0, 20.0, 14.0, 11.0, 11.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6064453125, -1.556640625, -1.5068359375, -1.45703125, -1.4072265625, -1.357421875, -1.3076171875, -1.2578125, -1.2080078125, -1.158203125, -1.1083984375, -1.05859375, -1.0087890625, -0.958984375, -0.9091796875, -0.859375, -0.8095703125, -0.759765625, -0.7099609375, -0.66015625, -0.6103515625, -0.560546875, -0.5107421875, -0.4609375, -0.4111328125, -0.361328125, -0.3115234375, -0.26171875, -0.2119140625, -0.162109375, -0.1123046875, -0.0625, -0.0126953125, 0.037109375, 0.0869140625, 0.13671875, 0.1865234375, 0.236328125, 0.2861328125, 0.3359375, 0.3857421875, 0.435546875, 0.4853515625, 0.53515625, 0.5849609375, 0.634765625, 0.6845703125, 0.734375, 0.7841796875, 0.833984375, 0.8837890625, 0.93359375, 0.9833984375, 1.033203125, 1.0830078125, 1.1328125, 1.1826171875, 1.232421875, 1.2822265625, 1.33203125, 1.3818359375, 1.431640625, 1.4814453125, 1.53125, 1.5810546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 2.0, 3.0, 3.0, 10.0, 11.0, 8.0, 12.0, 10.0, 16.0, 23.0, 26.0, 31.0, 28.0, 37.0, 31.0, 48.0, 62.0, 53.0, 78.0, 60.0, 67.0, 40.0, 47.0, 49.0, 47.0, 33.0, 36.0, 17.0, 21.0, 18.0, 14.0, 8.0, 13.0, 6.0, 3.0, 5.0, 6.0, 5.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3701171875, -0.3580360412597656, -0.34595489501953125, -0.3338737487792969, -0.3217926025390625, -0.3097114562988281, -0.29763031005859375, -0.2855491638183594, -0.273468017578125, -0.2613868713378906, -0.24930572509765625, -0.23722457885742188, -0.2251434326171875, -0.21306228637695312, -0.20098114013671875, -0.18889999389648438, -0.17681884765625, -0.16473770141601562, -0.15265655517578125, -0.14057540893554688, -0.1284942626953125, -0.11641311645507812, -0.10433197021484375, -0.09225082397460938, -0.080169677734375, -0.06808853149414062, -0.05600738525390625, -0.043926239013671875, -0.0318450927734375, -0.019763946533203125, -0.00768280029296875, 0.004398345947265625, 0.0164794921875, 0.028560638427734375, 0.04064178466796875, 0.052722930908203125, 0.0648040771484375, 0.07688522338867188, 0.08896636962890625, 0.10104751586914062, 0.113128662109375, 0.12520980834960938, 0.13729095458984375, 0.14937210083007812, 0.1614532470703125, 0.17353439331054688, 0.18561553955078125, 0.19769668579101562, 0.20977783203125, 0.22185897827148438, 0.23394012451171875, 0.24602127075195312, 0.2581024169921875, 0.2701835632324219, 0.28226470947265625, 0.2943458557128906, 0.306427001953125, 0.3185081481933594, 0.33058929443359375, 0.3426704406738281, 0.3547515869140625, 0.3668327331542969, 0.37891387939453125, 0.3909950256347656, 0.403076171875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 11.0, 6.0, 8.0, 26.0, 30.0, 48.0, 63.0, 112.0, 167.0, 137.0, 129.0, 95.0, 45.0, 50.0, 29.0, 12.0, 10.0, 13.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.687089920043945, -20.13101577758789, -19.57494354248047, -19.018869400024414, -18.462797164916992, -17.906723022460938, -17.350650787353516, -16.79457664489746, -16.238502502441406, -15.682429313659668, -15.12635612487793, -14.570282936096191, -14.014209747314453, -13.458135604858398, -12.90206241607666, -12.345989227294922, -11.7899169921875, -11.233843803405762, -10.677770614624023, -10.121697425842285, -9.565624237060547, -9.009550094604492, -8.453476905822754, -7.897403717041016, -7.341330528259277, -6.785257339477539, -6.229184150695801, -5.673110485076904, -5.117037296295166, -4.560964107513428, -4.004890441894531, -3.448817253112793, -2.892742156982422, -2.3366689682006836, -1.7805955410003662, -1.2245222330093384, -0.6684489250183105, -0.11237573623657227, 0.4436976909637451, 0.9997711181640625, 1.5558443069458008, 2.111917495727539, 2.6679909229278564, 3.224064350128174, 3.780137538909912, 4.33621072769165, 4.892284393310547, 5.448357582092285, 6.004430770874023, 6.560503959655762, 7.1165771484375, 7.6726508140563965, 8.228723526000977, 8.784797668457031, 9.34087085723877, 9.896944046020508, 10.453017234802246, 11.009090423583984, 11.565163612365723, 12.121236801147461, 12.677310943603516, 13.233383178710938, 13.789457321166992, 14.34553050994873, 14.901603698730469]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 10.0, 3.0, 10.0, 17.0, 10.0, 19.0, 13.0, 11.0, 27.0, 31.0, 32.0, 38.0, 42.0, 49.0, 44.0, 50.0, 44.0, 47.0, 44.0, 42.0, 47.0, 41.0, 44.0, 39.0, 36.0, 26.0, 23.0, 18.0, 28.0, 14.0, 19.0, 12.0, 15.0, 4.0, 13.0, 12.0, 2.0, 3.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.409811973571777, -5.231508255004883, -5.053204536437988, -4.874900817871094, -4.696597099304199, -4.518293380737305, -4.33998966217041, -4.161685943603516, -3.983381986618042, -3.8050782680511475, -3.626774549484253, -3.4484705924987793, -3.2701668739318848, -3.0918631553649902, -2.9135594367980957, -2.735255718231201, -2.5569519996643066, -2.378648281097412, -2.2003445625305176, -2.022040843963623, -1.843737006187439, -1.6654332876205444, -1.4871294498443604, -1.3088257312774658, -1.1305220127105713, -0.9522182941436768, -0.7739145159721375, -0.5956107378005981, -0.4173070192337036, -0.23900330066680908, -0.060699462890625, 0.11760425567626953, 0.29590845108032227, 0.4742121994495392, 0.6525159478187561, 0.8308197259902954, 1.00912344455719, 1.1874271631240845, 1.3657310009002686, 1.544034719467163, 1.7223384380340576, 1.9006421566009521, 2.0789458751678467, 2.2572498321533203, 2.435553550720215, 2.6138572692871094, 2.792160987854004, 2.9704647064208984, 3.148768424987793, 3.3270721435546875, 3.505375862121582, 3.6836795806884766, 3.861983299255371, 4.040287017822266, 4.21859073638916, 4.396894454956055, 4.575198173522949, 4.753501892089844, 4.931805610656738, 5.110109329223633, 5.288413047790527, 5.466716766357422, 5.645020484924316, 5.823324203491211, 6.001628398895264]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 10.0, 27.0, 16.0, 37.0, 47.0, 69.0, 116.0, 149.0, 195.0, 344.0, 504.0, 826.0, 1237.0, 2005.0, 3076.0, 5054.0, 8207.0, 14395.0, 25203.0, 46073.0, 85212.0, 146706.0, 204086.0, 196716.0, 135226.0, 76079.0, 40931.0, 22587.0, 12909.0, 7688.0, 4727.0, 2882.0, 1775.0, 1192.0, 730.0, 511.0, 285.0, 227.0, 171.0, 116.0, 69.0, 31.0, 27.0, 26.0, 12.0, 14.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.73785400390625, -5.5460205078125, -5.35418701171875, -5.162353515625, -4.97052001953125, -4.7786865234375, -4.58685302734375, -4.39501953125, -4.20318603515625, -4.0113525390625, -3.81951904296875, -3.627685546875, -3.43585205078125, -3.2440185546875, -3.05218505859375, -2.8603515625, -2.66851806640625, -2.4766845703125, -2.28485107421875, -2.093017578125, -1.90118408203125, -1.7093505859375, -1.51751708984375, -1.32568359375, -1.13385009765625, -0.9420166015625, -0.75018310546875, -0.558349609375, -0.36651611328125, -0.1746826171875, 0.01715087890625, 0.208984375, 0.40081787109375, 0.5926513671875, 0.78448486328125, 0.976318359375, 1.16815185546875, 1.3599853515625, 1.55181884765625, 1.74365234375, 1.93548583984375, 2.1273193359375, 2.31915283203125, 2.510986328125, 2.70281982421875, 2.8946533203125, 3.08648681640625, 3.2783203125, 3.47015380859375, 3.6619873046875, 3.85382080078125, 4.045654296875, 4.23748779296875, 4.4293212890625, 4.62115478515625, 4.81298828125, 5.00482177734375, 5.1966552734375, 5.38848876953125, 5.580322265625, 5.77215576171875, 5.9639892578125, 6.15582275390625, 6.34765625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 7.0, 9.0, 9.0, 10.0, 5.0, 10.0, 18.0, 25.0, 30.0, 28.0, 38.0, 28.0, 43.0, 45.0, 34.0, 61.0, 52.0, 52.0, 52.0, 47.0, 43.0, 31.0, 49.0, 35.0, 36.0, 16.0, 22.0, 29.0, 17.0, 20.0, 15.0, 14.0, 6.0, 10.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.74609375, -5.54779052734375, -5.3494873046875, -5.15118408203125, -4.952880859375, -4.75457763671875, -4.5562744140625, -4.35797119140625, -4.15966796875, -3.96136474609375, -3.7630615234375, -3.56475830078125, -3.366455078125, -3.16815185546875, -2.9698486328125, -2.77154541015625, -2.5732421875, -2.37493896484375, -2.1766357421875, -1.97833251953125, -1.780029296875, -1.58172607421875, -1.3834228515625, -1.18511962890625, -0.98681640625, -0.78851318359375, -0.5902099609375, -0.39190673828125, -0.193603515625, 0.00469970703125, 0.2030029296875, 0.40130615234375, 0.599609375, 0.79791259765625, 0.9962158203125, 1.19451904296875, 1.392822265625, 1.59112548828125, 1.7894287109375, 1.98773193359375, 2.18603515625, 2.38433837890625, 2.5826416015625, 2.78094482421875, 2.979248046875, 3.17755126953125, 3.3758544921875, 3.57415771484375, 3.7724609375, 3.97076416015625, 4.1690673828125, 4.36737060546875, 4.565673828125, 4.76397705078125, 4.9622802734375, 5.16058349609375, 5.35888671875, 5.55718994140625, 5.7554931640625, 5.95379638671875, 6.152099609375, 6.35040283203125, 6.5487060546875, 6.74700927734375, 6.9453125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 9.0, 9.0, 19.0, 28.0, 33.0, 60.0, 79.0, 124.0, 224.0, 346.0, 518.0, 774.0, 1294.0, 2080.0, 3532.0, 5756.0, 9737.0, 16360.0, 27774.0, 48325.0, 81047.0, 126411.0, 171101.0, 178320.0, 142424.0, 93766.0, 56983.0, 33313.0, 19427.0, 11281.0, 6768.0, 3997.0, 2496.0, 1498.0, 967.0, 601.0, 381.0, 254.0, 139.0, 90.0, 75.0, 50.0, 31.0, 16.0, 14.0, 3.0, 11.0, 10.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.765625, -4.59637451171875, -4.4271240234375, -4.25787353515625, -4.088623046875, -3.91937255859375, -3.7501220703125, -3.58087158203125, -3.41162109375, -3.24237060546875, -3.0731201171875, -2.90386962890625, -2.734619140625, -2.56536865234375, -2.3961181640625, -2.22686767578125, -2.0576171875, -1.88836669921875, -1.7191162109375, -1.54986572265625, -1.380615234375, -1.21136474609375, -1.0421142578125, -0.87286376953125, -0.70361328125, -0.53436279296875, -0.3651123046875, -0.19586181640625, -0.026611328125, 0.14263916015625, 0.3118896484375, 0.48114013671875, 0.650390625, 0.81964111328125, 0.9888916015625, 1.15814208984375, 1.327392578125, 1.49664306640625, 1.6658935546875, 1.83514404296875, 2.00439453125, 2.17364501953125, 2.3428955078125, 2.51214599609375, 2.681396484375, 2.85064697265625, 3.0198974609375, 3.18914794921875, 3.3583984375, 3.52764892578125, 3.6968994140625, 3.86614990234375, 4.035400390625, 4.20465087890625, 4.3739013671875, 4.54315185546875, 4.71240234375, 4.88165283203125, 5.0509033203125, 5.22015380859375, 5.389404296875, 5.55865478515625, 5.7279052734375, 5.89715576171875, 6.06640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 10.0, 7.0, 14.0, 12.0, 14.0, 18.0, 8.0, 18.0, 18.0, 37.0, 34.0, 34.0, 38.0, 33.0, 42.0, 40.0, 39.0, 28.0, 39.0, 35.0, 39.0, 25.0, 41.0, 39.0, 46.0, 35.0, 24.0, 35.0, 29.0, 21.0, 13.0, 13.0, 21.0, 18.0, 16.0, 11.0, 16.0, 7.0, 3.0, 11.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.537109375, -3.431396484375, -3.32568359375, -3.219970703125, -3.1142578125, -3.008544921875, -2.90283203125, -2.797119140625, -2.69140625, -2.585693359375, -2.47998046875, -2.374267578125, -2.2685546875, -2.162841796875, -2.05712890625, -1.951416015625, -1.845703125, -1.739990234375, -1.63427734375, -1.528564453125, -1.4228515625, -1.317138671875, -1.21142578125, -1.105712890625, -1.0, -0.894287109375, -0.78857421875, -0.682861328125, -0.5771484375, -0.471435546875, -0.36572265625, -0.260009765625, -0.154296875, -0.048583984375, 0.05712890625, 0.162841796875, 0.2685546875, 0.374267578125, 0.47998046875, 0.585693359375, 0.69140625, 0.797119140625, 0.90283203125, 1.008544921875, 1.1142578125, 1.219970703125, 1.32568359375, 1.431396484375, 1.537109375, 1.642822265625, 1.74853515625, 1.854248046875, 1.9599609375, 2.065673828125, 2.17138671875, 2.277099609375, 2.3828125, 2.488525390625, 2.59423828125, 2.699951171875, 2.8056640625, 2.911376953125, 3.01708984375, 3.122802734375, 3.228515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 10.0, 12.0, 28.0, 46.0, 83.0, 128.0, 238.0, 399.0, 713.0, 1317.0, 2390.0, 4660.0, 9410.0, 19544.0, 43760.0, 100926.0, 215071.0, 292830.0, 195306.0, 88075.0, 38699.0, 17423.0, 8375.0, 4181.0, 2158.0, 1262.0, 637.0, 366.0, 203.0, 124.0, 78.0, 40.0, 15.0, 16.0, 12.0, 7.0, 4.0, 0.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.826171875, -3.70440673828125, -3.5826416015625, -3.46087646484375, -3.339111328125, -3.21734619140625, -3.0955810546875, -2.97381591796875, -2.85205078125, -2.73028564453125, -2.6085205078125, -2.48675537109375, -2.364990234375, -2.24322509765625, -2.1214599609375, -1.99969482421875, -1.8779296875, -1.75616455078125, -1.6343994140625, -1.51263427734375, -1.390869140625, -1.26910400390625, -1.1473388671875, -1.02557373046875, -0.90380859375, -0.78204345703125, -0.6602783203125, -0.53851318359375, -0.416748046875, -0.29498291015625, -0.1732177734375, -0.05145263671875, 0.0703125, 0.19207763671875, 0.3138427734375, 0.43560791015625, 0.557373046875, 0.67913818359375, 0.8009033203125, 0.92266845703125, 1.04443359375, 1.16619873046875, 1.2879638671875, 1.40972900390625, 1.531494140625, 1.65325927734375, 1.7750244140625, 1.89678955078125, 2.0185546875, 2.14031982421875, 2.2620849609375, 2.38385009765625, 2.505615234375, 2.62738037109375, 2.7491455078125, 2.87091064453125, 2.99267578125, 3.11444091796875, 3.2362060546875, 3.35797119140625, 3.479736328125, 3.60150146484375, 3.7232666015625, 3.84503173828125, 3.966796875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 7.0, 3.0, 11.0, 13.0, 17.0, 22.0, 25.0, 39.0, 55.0, 74.0, 84.0, 107.0, 93.0, 98.0, 76.0, 71.0, 58.0, 39.0, 36.0, 18.0, 13.0, 17.0, 11.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000308990478515625, -0.0002985522150993347, -0.00028811395168304443, -0.00027767568826675415, -0.00026723742485046387, -0.0002567991614341736, -0.0002463608980178833, -0.00023592263460159302, -0.00022548437118530273, -0.00021504610776901245, -0.00020460784435272217, -0.00019416958093643188, -0.0001837313175201416, -0.00017329305410385132, -0.00016285479068756104, -0.00015241652727127075, -0.00014197826385498047, -0.00013154000043869019, -0.0001211017370223999, -0.00011066347360610962, -0.00010022521018981934, -8.978694677352905e-05, -7.934868335723877e-05, -6.891041994094849e-05, -5.84721565246582e-05, -4.803389310836792e-05, -3.759562969207764e-05, -2.7157366275787354e-05, -1.671910285949707e-05, -6.280839443206787e-06, 4.157423973083496e-06, 1.459568738937378e-05, 2.5033950805664062e-05, 3.5472214221954346e-05, 4.591047763824463e-05, 5.634874105453491e-05, 6.67870044708252e-05, 7.722526788711548e-05, 8.766353130340576e-05, 9.810179471969604e-05, 0.00010854005813598633, 0.00011897832155227661, 0.0001294165849685669, 0.00013985484838485718, 0.00015029311180114746, 0.00016073137521743774, 0.00017116963863372803, 0.0001816079020500183, 0.0001920461654663086, 0.00020248442888259888, 0.00021292269229888916, 0.00022336095571517944, 0.00023379921913146973, 0.00024423748254776, 0.0002546757459640503, 0.0002651140093803406, 0.00027555227279663086, 0.00028599053621292114, 0.0002964287996292114, 0.0003068670630455017, 0.000317305326461792, 0.0003277435898780823, 0.00033818185329437256, 0.00034862011671066284, 0.0003590583801269531]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 8.0, 8.0, 11.0, 17.0, 32.0, 50.0, 59.0, 111.0, 166.0, 292.0, 458.0, 869.0, 1553.0, 2765.0, 5329.0, 10905.0, 23021.0, 51293.0, 113212.0, 220454.0, 273010.0, 182596.0, 87322.0, 39039.0, 17839.0, 8530.0, 4385.0, 2241.0, 1249.0, 670.0, 389.0, 236.0, 165.0, 86.0, 55.0, 42.0, 30.0, 27.0, 12.0, 8.0, 6.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.685546875, -3.574981689453125, -3.46441650390625, -3.353851318359375, -3.2432861328125, -3.132720947265625, -3.02215576171875, -2.911590576171875, -2.801025390625, -2.690460205078125, -2.57989501953125, -2.469329833984375, -2.3587646484375, -2.248199462890625, -2.13763427734375, -2.027069091796875, -1.91650390625, -1.805938720703125, -1.69537353515625, -1.584808349609375, -1.4742431640625, -1.363677978515625, -1.25311279296875, -1.142547607421875, -1.031982421875, -0.921417236328125, -0.81085205078125, -0.700286865234375, -0.5897216796875, -0.479156494140625, -0.36859130859375, -0.258026123046875, -0.1474609375, -0.036895751953125, 0.07366943359375, 0.184234619140625, 0.2947998046875, 0.405364990234375, 0.51593017578125, 0.626495361328125, 0.737060546875, 0.847625732421875, 0.95819091796875, 1.068756103515625, 1.1793212890625, 1.289886474609375, 1.40045166015625, 1.511016845703125, 1.62158203125, 1.732147216796875, 1.84271240234375, 1.953277587890625, 2.0638427734375, 2.174407958984375, 2.28497314453125, 2.395538330078125, 2.506103515625, 2.616668701171875, 2.72723388671875, 2.837799072265625, 2.9483642578125, 3.058929443359375, 3.16949462890625, 3.280059814453125, 3.390625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 8.0, 10.0, 11.0, 11.0, 18.0, 17.0, 29.0, 26.0, 25.0, 45.0, 42.0, 44.0, 53.0, 60.0, 68.0, 57.0, 59.0, 55.0, 55.0, 63.0, 41.0, 28.0, 30.0, 36.0, 12.0, 25.0, 16.0, 9.0, 9.0, 11.0, 8.0, 2.0, 4.0, 1.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6720123291015625, -0.646270751953125, -0.6205291748046875, -0.59478759765625, -0.5690460205078125, -0.543304443359375, -0.5175628662109375, -0.4918212890625, -0.4660797119140625, -0.440338134765625, -0.4145965576171875, -0.38885498046875, -0.3631134033203125, -0.337371826171875, -0.3116302490234375, -0.285888671875, -0.2601470947265625, -0.234405517578125, -0.2086639404296875, -0.18292236328125, -0.1571807861328125, -0.131439208984375, -0.1056976318359375, -0.0799560546875, -0.0542144775390625, -0.028472900390625, -0.0027313232421875, 0.02301025390625, 0.0487518310546875, 0.074493408203125, 0.1002349853515625, 0.1259765625, 0.1517181396484375, 0.177459716796875, 0.2032012939453125, 0.22894287109375, 0.2546844482421875, 0.280426025390625, 0.3061676025390625, 0.3319091796875, 0.3576507568359375, 0.383392333984375, 0.4091339111328125, 0.43487548828125, 0.4606170654296875, 0.486358642578125, 0.5121002197265625, 0.537841796875, 0.5635833740234375, 0.589324951171875, 0.6150665283203125, 0.64080810546875, 0.6665496826171875, 0.692291259765625, 0.7180328369140625, 0.7437744140625, 0.7695159912109375, 0.795257568359375, 0.8209991455078125, 0.84674072265625, 0.8724822998046875, 0.898223876953125, 0.9239654541015625, 0.94970703125]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 10.0, 12.0, 27.0, 35.0, 46.0, 81.0, 121.0, 160.0, 137.0, 113.0, 93.0, 53.0, 41.0, 16.0, 17.0, 16.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.06598472595215, -19.508255004882812, -18.950525283813477, -18.39279556274414, -17.835065841674805, -17.27733612060547, -16.719606399536133, -16.161876678466797, -15.604147911071777, -15.046418190002441, -14.488688468933105, -13.93095874786377, -13.37322998046875, -12.815500259399414, -12.257770538330078, -11.700040817260742, -11.142311096191406, -10.58458137512207, -10.026851654052734, -9.469121932983398, -8.911392211914062, -8.353662490844727, -7.795933723449707, -7.238204002380371, -6.680474281311035, -6.122744560241699, -5.565014839172363, -5.0072855949401855, -4.44955587387085, -3.8918261528015137, -3.334096670150757, -2.7763671875, -2.2186365127563477, -1.6609069108963013, -1.1031773090362549, -0.5454477071762085, 0.01228189468383789, 0.5700116157531738, 1.1277410984039307, 1.6854705810546875, 2.2432003021240234, 2.8009300231933594, 3.358659505844116, 3.916388988494873, 4.474118709564209, 5.031848430633545, 5.589577674865723, 6.147307395935059, 6.7050371170043945, 7.2627668380737305, 7.820496559143066, 8.378226280212402, 8.935955047607422, 9.493684768676758, 10.051414489746094, 10.60914421081543, 11.166873931884766, 11.724603652954102, 12.282333374023438, 12.840063095092773, 13.39779281616211, 13.955522537231445, 14.513251304626465, 15.0709810256958, 15.628710746765137]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 10.0, 8.0, 12.0, 18.0, 13.0, 17.0, 19.0, 25.0, 44.0, 34.0, 33.0, 35.0, 48.0, 56.0, 55.0, 44.0, 43.0, 51.0, 44.0, 55.0, 36.0, 38.0, 33.0, 35.0, 26.0, 26.0, 18.0, 17.0, 15.0, 21.0, 12.0, 14.0, 5.0, 9.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.087007522583008, -5.894461631774902, -5.701915740966797, -5.509369850158691, -5.316823959350586, -5.1242780685424805, -4.931732177734375, -4.7391862869262695, -4.546640396118164, -4.354094505310059, -4.161548614501953, -3.9690027236938477, -3.776456832885742, -3.5839109420776367, -3.3913652896881104, -3.198819398880005, -3.0062737464904785, -2.813727855682373, -2.6211819648742676, -2.428636074066162, -2.2360901832580566, -2.043544292449951, -1.8509986400604248, -1.6584527492523193, -1.4659068584442139, -1.2733609676361084, -1.080815076828003, -0.888269305229187, -0.6957234144210815, -0.5031775236129761, -0.31063175201416016, -0.11808586120605469, 0.07445955276489258, 0.26700541377067566, 0.45955127477645874, 0.6520971059799194, 0.8446429967880249, 1.0371888875961304, 1.2297346591949463, 1.4222805500030518, 1.6148264408111572, 1.8073723316192627, 1.9999182224273682, 2.1924638748168945, 2.385009765625, 2.5775556564331055, 2.770101547241211, 2.9626474380493164, 3.155193328857422, 3.3477392196655273, 3.540285110473633, 3.7328310012817383, 3.9253768920898438, 4.117922782897949, 4.310468673706055, 4.50301456451416, 4.695560455322266, 4.888106346130371, 5.080652236938477, 5.273198127746582, 5.4657440185546875, 5.658289909362793, 5.850835800170898, 6.043381690979004, 6.235927104949951]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 8.0, 19.0, 22.0, 36.0, 50.0, 65.0, 125.0, 191.0, 306.0, 487.0, 831.0, 1352.0, 2463.0, 4417.0, 8154.0, 16809.0, 40339.0, 126505.0, 552500.0, 1868822.0, 1190665.0, 255359.0, 69516.0, 26788.0, 12748.0, 6750.0, 3629.0, 2159.0, 1225.0, 767.0, 423.0, 244.0, 197.0, 111.0, 60.0, 49.0, 31.0, 28.0, 9.0, 7.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.6171875, -14.1710205078125, -13.724853515625, -13.2786865234375, -12.83251953125, -12.3863525390625, -11.940185546875, -11.4940185546875, -11.0478515625, -10.6016845703125, -10.155517578125, -9.7093505859375, -9.26318359375, -8.8170166015625, -8.370849609375, -7.9246826171875, -7.478515625, -7.0323486328125, -6.586181640625, -6.1400146484375, -5.69384765625, -5.2476806640625, -4.801513671875, -4.3553466796875, -3.9091796875, -3.4630126953125, -3.016845703125, -2.5706787109375, -2.12451171875, -1.6783447265625, -1.232177734375, -0.7860107421875, -0.33984375, 0.1063232421875, 0.552490234375, 0.9986572265625, 1.44482421875, 1.8909912109375, 2.337158203125, 2.7833251953125, 3.2294921875, 3.6756591796875, 4.121826171875, 4.5679931640625, 5.01416015625, 5.4603271484375, 5.906494140625, 6.3526611328125, 6.798828125, 7.2449951171875, 7.691162109375, 8.1373291015625, 8.58349609375, 9.0296630859375, 9.475830078125, 9.9219970703125, 10.3681640625, 10.8143310546875, 11.260498046875, 11.7066650390625, 12.15283203125, 12.5989990234375, 13.045166015625, 13.4913330078125, 13.9375]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 8.0, 0.0, 6.0, 8.0, 5.0, 17.0, 9.0, 14.0, 21.0, 18.0, 26.0, 32.0, 40.0, 37.0, 35.0, 43.0, 53.0, 41.0, 49.0, 50.0, 59.0, 46.0, 40.0, 38.0, 41.0, 41.0, 34.0, 34.0, 32.0, 20.0, 20.0, 16.0, 9.0, 14.0, 15.0, 11.0, 5.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.8828125, -4.735107421875, -4.58740234375, -4.439697265625, -4.2919921875, -4.144287109375, -3.99658203125, -3.848876953125, -3.701171875, -3.553466796875, -3.40576171875, -3.258056640625, -3.1103515625, -2.962646484375, -2.81494140625, -2.667236328125, -2.51953125, -2.371826171875, -2.22412109375, -2.076416015625, -1.9287109375, -1.781005859375, -1.63330078125, -1.485595703125, -1.337890625, -1.190185546875, -1.04248046875, -0.894775390625, -0.7470703125, -0.599365234375, -0.45166015625, -0.303955078125, -0.15625, -0.008544921875, 0.13916015625, 0.286865234375, 0.4345703125, 0.582275390625, 0.72998046875, 0.877685546875, 1.025390625, 1.173095703125, 1.32080078125, 1.468505859375, 1.6162109375, 1.763916015625, 1.91162109375, 2.059326171875, 2.20703125, 2.354736328125, 2.50244140625, 2.650146484375, 2.7978515625, 2.945556640625, 3.09326171875, 3.240966796875, 3.388671875, 3.536376953125, 3.68408203125, 3.831787109375, 3.9794921875, 4.127197265625, 4.27490234375, 4.422607421875, 4.5703125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 0.0, 5.0, 8.0, 10.0, 5.0, 19.0, 26.0, 32.0, 44.0, 77.0, 135.0, 218.0, 311.0, 474.0, 710.0, 1033.0, 1695.0, 2512.0, 3875.0, 6205.0, 9902.0, 16566.0, 29506.0, 57571.0, 127713.0, 327277.0, 862588.0, 1385073.0, 809094.0, 304184.0, 120422.0, 55681.0, 28796.0, 15986.0, 9655.0, 5914.0, 3810.0, 2508.0, 1600.0, 1109.0, 674.0, 426.0, 283.0, 184.0, 122.0, 92.0, 52.0, 33.0, 25.0, 23.0, 8.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3515625, -10.0225830078125, -9.693603515625, -9.3646240234375, -9.03564453125, -8.7066650390625, -8.377685546875, -8.0487060546875, -7.7197265625, -7.3907470703125, -7.061767578125, -6.7327880859375, -6.40380859375, -6.0748291015625, -5.745849609375, -5.4168701171875, -5.087890625, -4.7589111328125, -4.429931640625, -4.1009521484375, -3.77197265625, -3.4429931640625, -3.114013671875, -2.7850341796875, -2.4560546875, -2.1270751953125, -1.798095703125, -1.4691162109375, -1.14013671875, -0.8111572265625, -0.482177734375, -0.1531982421875, 0.17578125, 0.5047607421875, 0.833740234375, 1.1627197265625, 1.49169921875, 1.8206787109375, 2.149658203125, 2.4786376953125, 2.8076171875, 3.1365966796875, 3.465576171875, 3.7945556640625, 4.12353515625, 4.4525146484375, 4.781494140625, 5.1104736328125, 5.439453125, 5.7684326171875, 6.097412109375, 6.4263916015625, 6.75537109375, 7.0843505859375, 7.413330078125, 7.7423095703125, 8.0712890625, 8.4002685546875, 8.729248046875, 9.0582275390625, 9.38720703125, 9.7161865234375, 10.045166015625, 10.3741455078125, 10.703125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 19.0, 18.0, 20.0, 28.0, 25.0, 35.0, 65.0, 77.0, 103.0, 152.0, 203.0, 225.0, 288.0, 326.0, 363.0, 374.0, 351.0, 310.0, 232.0, 188.0, 156.0, 119.0, 83.0, 61.0, 58.0, 36.0, 31.0, 27.0, 21.0, 13.0, 12.0, 14.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.994140625, -2.89825439453125, -2.8023681640625, -2.70648193359375, -2.610595703125, -2.51470947265625, -2.4188232421875, -2.32293701171875, -2.22705078125, -2.13116455078125, -2.0352783203125, -1.93939208984375, -1.843505859375, -1.74761962890625, -1.6517333984375, -1.55584716796875, -1.4599609375, -1.36407470703125, -1.2681884765625, -1.17230224609375, -1.076416015625, -0.98052978515625, -0.8846435546875, -0.78875732421875, -0.69287109375, -0.59698486328125, -0.5010986328125, -0.40521240234375, -0.309326171875, -0.21343994140625, -0.1175537109375, -0.02166748046875, 0.07421875, 0.17010498046875, 0.2659912109375, 0.36187744140625, 0.457763671875, 0.55364990234375, 0.6495361328125, 0.74542236328125, 0.84130859375, 0.93719482421875, 1.0330810546875, 1.12896728515625, 1.224853515625, 1.32073974609375, 1.4166259765625, 1.51251220703125, 1.6083984375, 1.70428466796875, 1.8001708984375, 1.89605712890625, 1.991943359375, 2.08782958984375, 2.1837158203125, 2.27960205078125, 2.37548828125, 2.47137451171875, 2.5672607421875, 2.66314697265625, 2.759033203125, 2.85491943359375, 2.9508056640625, 3.04669189453125, 3.142578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 8.0, 11.0, 8.0, 16.0, 25.0, 18.0, 45.0, 59.0, 86.0, 102.0, 112.0, 99.0, 85.0, 87.0, 58.0, 47.0, 38.0, 24.0, 14.0, 12.0, 8.0, 10.0, 7.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.78668975830078, -16.36717987060547, -15.947669982910156, -15.528160095214844, -15.108650207519531, -14.689140319824219, -14.269630432128906, -13.850119590759277, -13.430609703063965, -13.011099815368652, -12.59158992767334, -12.172080039978027, -11.752570152282715, -11.333059310913086, -10.913549423217773, -10.494039535522461, -10.074529647827148, -9.655019760131836, -9.235509872436523, -8.815999984741211, -8.396490097045898, -7.976979732513428, -7.557469844818115, -7.1379594802856445, -6.718450546264648, -6.298940658569336, -5.879430770874023, -5.459920883178711, -5.04041051864624, -4.620900630950928, -4.201390743255615, -3.7818806171417236, -3.362370491027832, -2.9428606033325195, -2.523350477218628, -2.1038405895233154, -1.6843305826187134, -1.2648205757141113, -0.8453106880187988, -0.4258005619049072, -0.0062906742095947266, 0.41321930289268494, 0.8327292799949646, 1.2522392272949219, 1.671749234199524, 2.091259241104126, 2.5107691287994385, 2.93027925491333, 3.3497891426086426, 3.769299030303955, 4.188808917999268, 4.608319282531738, 5.027829170227051, 5.447339057922363, 5.866848945617676, 6.286358833312988, 6.705868721008301, 7.125378608703613, 7.544888496398926, 7.964398384094238, 8.38390827178955, 8.80341911315918, 9.222929000854492, 9.642438888549805, 10.061948776245117]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 5.0, 8.0, 8.0, 9.0, 10.0, 9.0, 15.0, 12.0, 13.0, 12.0, 20.0, 31.0, 29.0, 33.0, 45.0, 54.0, 48.0, 57.0, 32.0, 53.0, 43.0, 43.0, 36.0, 54.0, 36.0, 18.0, 39.0, 27.0, 19.0, 19.0, 23.0, 22.0, 24.0, 12.0, 21.0, 10.0, 8.0, 7.0, 7.0, 7.0, 8.0, 6.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-5.5707597732543945, -5.3931732177734375, -5.2155866622924805, -5.037999629974365, -4.860413074493408, -4.682826519012451, -4.505239486694336, -4.327652931213379, -4.150066375732422, -3.972479820251465, -3.7948930263519287, -3.6173062324523926, -3.4397196769714355, -3.2621331214904785, -3.0845463275909424, -2.9069595336914062, -2.729372978210449, -2.551786422729492, -2.374199628829956, -2.19661283493042, -2.019026279449463, -1.8414396047592163, -1.6638529300689697, -1.4862662553787231, -1.3086795806884766, -1.13109290599823, -0.9535062313079834, -0.7759195566177368, -0.5983328819274902, -0.42074620723724365, -0.24315953254699707, -0.06557285785675049, 0.11201333999633789, 0.2896000146865845, 0.46718668937683105, 0.6447733640670776, 0.8223600387573242, 0.9999467134475708, 1.1775333881378174, 1.355120062828064, 1.5327067375183105, 1.7102934122085571, 1.8878800868988037, 2.06546688079834, 2.243053436279297, 2.420639991760254, 2.59822678565979, 2.775813579559326, 2.953400135040283, 3.1309866905212402, 3.3085734844207764, 3.4861602783203125, 3.6637468338012695, 3.8413333892822266, 4.018919944763184, 4.196506977081299, 4.374093532562256, 4.551680088043213, 4.729267120361328, 4.906853675842285, 5.084440231323242, 5.262026786804199, 5.439613342285156, 5.6172003746032715, 5.7947869300842285]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 9.0, 11.0, 8.0, 16.0, 31.0, 33.0, 65.0, 69.0, 102.0, 168.0, 213.0, 325.0, 567.0, 886.0, 1410.0, 2279.0, 4028.0, 7049.0, 13017.0, 25841.0, 53692.0, 116743.0, 229037.0, 271589.0, 166900.0, 77805.0, 36093.0, 17767.0, 9573.0, 5218.0, 2974.0, 1912.0, 1078.0, 705.0, 439.0, 279.0, 214.0, 146.0, 59.0, 77.0, 34.0, 28.0, 20.0, 9.0, 13.0, 9.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.951171875, -3.832305908203125, -3.71343994140625, -3.594573974609375, -3.4757080078125, -3.356842041015625, -3.23797607421875, -3.119110107421875, -3.000244140625, -2.881378173828125, -2.76251220703125, -2.643646240234375, -2.5247802734375, -2.405914306640625, -2.28704833984375, -2.168182373046875, -2.04931640625, -1.930450439453125, -1.81158447265625, -1.692718505859375, -1.5738525390625, -1.454986572265625, -1.33612060546875, -1.217254638671875, -1.098388671875, -0.979522705078125, -0.86065673828125, -0.741790771484375, -0.6229248046875, -0.504058837890625, -0.38519287109375, -0.266326904296875, -0.1474609375, -0.028594970703125, 0.09027099609375, 0.209136962890625, 0.3280029296875, 0.446868896484375, 0.56573486328125, 0.684600830078125, 0.803466796875, 0.922332763671875, 1.04119873046875, 1.160064697265625, 1.2789306640625, 1.397796630859375, 1.51666259765625, 1.635528564453125, 1.75439453125, 1.873260498046875, 1.99212646484375, 2.110992431640625, 2.2298583984375, 2.348724365234375, 2.46759033203125, 2.586456298828125, 2.705322265625, 2.824188232421875, 2.94305419921875, 3.061920166015625, 3.1807861328125, 3.299652099609375, 3.41851806640625, 3.537384033203125, 3.65625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 9.0, 13.0, 17.0, 15.0, 14.0, 17.0, 21.0, 29.0, 35.0, 41.0, 40.0, 59.0, 48.0, 53.0, 69.0, 45.0, 40.0, 50.0, 36.0, 34.0, 36.0, 33.0, 29.0, 22.0, 24.0, 25.0, 21.0, 18.0, 12.0, 18.0, 9.0, 11.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-6.53125, -6.32598876953125, -6.1207275390625, -5.91546630859375, -5.710205078125, -5.50494384765625, -5.2996826171875, -5.09442138671875, -4.88916015625, -4.68389892578125, -4.4786376953125, -4.27337646484375, -4.068115234375, -3.86285400390625, -3.6575927734375, -3.45233154296875, -3.2470703125, -3.04180908203125, -2.8365478515625, -2.63128662109375, -2.426025390625, -2.22076416015625, -2.0155029296875, -1.81024169921875, -1.60498046875, -1.39971923828125, -1.1944580078125, -0.98919677734375, -0.783935546875, -0.57867431640625, -0.3734130859375, -0.16815185546875, 0.037109375, 0.24237060546875, 0.4476318359375, 0.65289306640625, 0.858154296875, 1.06341552734375, 1.2686767578125, 1.47393798828125, 1.67919921875, 1.88446044921875, 2.0897216796875, 2.29498291015625, 2.500244140625, 2.70550537109375, 2.9107666015625, 3.11602783203125, 3.3212890625, 3.52655029296875, 3.7318115234375, 3.93707275390625, 4.142333984375, 4.34759521484375, 4.5528564453125, 4.75811767578125, 4.96337890625, 5.16864013671875, 5.3739013671875, 5.57916259765625, 5.784423828125, 5.98968505859375, 6.1949462890625, 6.40020751953125, 6.60546875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 7.0, 12.0, 20.0, 28.0, 39.0, 51.0, 76.0, 87.0, 147.0, 262.0, 397.0, 633.0, 1047.0, 1807.0, 3488.0, 6705.0, 13986.0, 32610.0, 85409.0, 233418.0, 366787.0, 183807.0, 67159.0, 26309.0, 11637.0, 5665.0, 2854.0, 1623.0, 931.0, 550.0, 323.0, 216.0, 138.0, 91.0, 78.0, 51.0, 24.0, 19.0, 13.0, 14.0, 9.0, 12.0, 8.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4140625, -5.24151611328125, -5.0689697265625, -4.89642333984375, -4.723876953125, -4.55133056640625, -4.3787841796875, -4.20623779296875, -4.03369140625, -3.86114501953125, -3.6885986328125, -3.51605224609375, -3.343505859375, -3.17095947265625, -2.9984130859375, -2.82586669921875, -2.6533203125, -2.48077392578125, -2.3082275390625, -2.13568115234375, -1.963134765625, -1.79058837890625, -1.6180419921875, -1.44549560546875, -1.27294921875, -1.10040283203125, -0.9278564453125, -0.75531005859375, -0.582763671875, -0.41021728515625, -0.2376708984375, -0.06512451171875, 0.107421875, 0.27996826171875, 0.4525146484375, 0.62506103515625, 0.797607421875, 0.97015380859375, 1.1427001953125, 1.31524658203125, 1.48779296875, 1.66033935546875, 1.8328857421875, 2.00543212890625, 2.177978515625, 2.35052490234375, 2.5230712890625, 2.69561767578125, 2.8681640625, 3.04071044921875, 3.2132568359375, 3.38580322265625, 3.558349609375, 3.73089599609375, 3.9034423828125, 4.07598876953125, 4.24853515625, 4.42108154296875, 4.5936279296875, 4.76617431640625, 4.938720703125, 5.11126708984375, 5.2838134765625, 5.45635986328125, 5.62890625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 6.0, 11.0, 8.0, 17.0, 6.0, 13.0, 19.0, 18.0, 12.0, 36.0, 33.0, 37.0, 34.0, 38.0, 33.0, 29.0, 40.0, 30.0, 38.0, 38.0, 43.0, 43.0, 41.0, 40.0, 41.0, 35.0, 31.0, 30.0, 24.0, 20.0, 23.0, 22.0, 21.0, 15.0, 8.0, 12.0, 12.0, 5.0, 9.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.115234375, -3.015777587890625, -2.91632080078125, -2.816864013671875, -2.7174072265625, -2.617950439453125, -2.51849365234375, -2.419036865234375, -2.319580078125, -2.220123291015625, -2.12066650390625, -2.021209716796875, -1.9217529296875, -1.822296142578125, -1.72283935546875, -1.623382568359375, -1.52392578125, -1.424468994140625, -1.32501220703125, -1.225555419921875, -1.1260986328125, -1.026641845703125, -0.92718505859375, -0.827728271484375, -0.728271484375, -0.628814697265625, -0.52935791015625, -0.429901123046875, -0.3304443359375, -0.230987548828125, -0.13153076171875, -0.032073974609375, 0.0673828125, 0.166839599609375, 0.26629638671875, 0.365753173828125, 0.4652099609375, 0.564666748046875, 0.66412353515625, 0.763580322265625, 0.863037109375, 0.962493896484375, 1.06195068359375, 1.161407470703125, 1.2608642578125, 1.360321044921875, 1.45977783203125, 1.559234619140625, 1.65869140625, 1.758148193359375, 1.85760498046875, 1.957061767578125, 2.0565185546875, 2.155975341796875, 2.25543212890625, 2.354888916015625, 2.454345703125, 2.553802490234375, 2.65325927734375, 2.752716064453125, 2.8521728515625, 2.951629638671875, 3.05108642578125, 3.150543212890625, 3.25]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 11.0, 16.0, 23.0, 26.0, 56.0, 75.0, 100.0, 178.0, 233.0, 364.0, 631.0, 1084.0, 1948.0, 4369.0, 14569.0, 112339.0, 753259.0, 133996.0, 15873.0, 4556.0, 1952.0, 1099.0, 650.0, 350.0, 268.0, 162.0, 114.0, 78.0, 49.0, 33.0, 28.0, 23.0, 9.0, 6.0, 5.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.12890625, -4.942626953125, -4.75634765625, -4.570068359375, -4.3837890625, -4.197509765625, -4.01123046875, -3.824951171875, -3.638671875, -3.452392578125, -3.26611328125, -3.079833984375, -2.8935546875, -2.707275390625, -2.52099609375, -2.334716796875, -2.1484375, -1.962158203125, -1.77587890625, -1.589599609375, -1.4033203125, -1.217041015625, -1.03076171875, -0.844482421875, -0.658203125, -0.471923828125, -0.28564453125, -0.099365234375, 0.0869140625, 0.273193359375, 0.45947265625, 0.645751953125, 0.83203125, 1.018310546875, 1.20458984375, 1.390869140625, 1.5771484375, 1.763427734375, 1.94970703125, 2.135986328125, 2.322265625, 2.508544921875, 2.69482421875, 2.881103515625, 3.0673828125, 3.253662109375, 3.43994140625, 3.626220703125, 3.8125, 3.998779296875, 4.18505859375, 4.371337890625, 4.5576171875, 4.743896484375, 4.93017578125, 5.116455078125, 5.302734375, 5.489013671875, 5.67529296875, 5.861572265625, 6.0478515625, 6.234130859375, 6.42041015625, 6.606689453125, 6.79296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 12.0, 14.0, 33.0, 38.0, 78.0, 106.0, 111.0, 140.0, 145.0, 90.0, 68.0, 44.0, 31.0, 24.0, 6.0, 14.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00015854835510253906, -0.0001535024493932724, -0.00014845654368400574, -0.00014341063797473907, -0.0001383647322654724, -0.00013331882655620575, -0.0001282729208469391, -0.00012322701513767242, -0.00011818110942840576, -0.0001131352037191391, -0.00010808929800987244, -0.00010304339230060577, -9.799748659133911e-05, -9.295158088207245e-05, -8.790567517280579e-05, -8.285976946353912e-05, -7.781386375427246e-05, -7.27679580450058e-05, -6.772205233573914e-05, -6.267614662647247e-05, -5.763024091720581e-05, -5.258433520793915e-05, -4.7538429498672485e-05, -4.249252378940582e-05, -3.744661808013916e-05, -3.24007123708725e-05, -2.7354806661605835e-05, -2.2308900952339172e-05, -1.726299524307251e-05, -1.2217089533805847e-05, -7.1711838245391846e-06, -2.125278115272522e-06, 2.9206275939941406e-06, 7.966533303260803e-06, 1.3012439012527466e-05, 1.805834472179413e-05, 2.310425043106079e-05, 2.8150156140327454e-05, 3.3196061849594116e-05, 3.824196755886078e-05, 4.328787326812744e-05, 4.8333778977394104e-05, 5.3379684686660767e-05, 5.842559039592743e-05, 6.347149610519409e-05, 6.851740181446075e-05, 7.356330752372742e-05, 7.860921323299408e-05, 8.365511894226074e-05, 8.87010246515274e-05, 9.374693036079407e-05, 9.879283607006073e-05, 0.00010383874177932739, 0.00010888464748859406, 0.00011393055319786072, 0.00011897645890712738, 0.00012402236461639404, 0.0001290682703256607, 0.00013411417603492737, 0.00013916008174419403, 0.0001442059874534607, 0.00014925189316272736, 0.00015429779887199402, 0.00015934370458126068, 0.00016438961029052734]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 8.0, 6.0, 10.0, 19.0, 24.0, 28.0, 44.0, 69.0, 76.0, 147.0, 173.0, 257.0, 414.0, 555.0, 841.0, 1250.0, 1782.0, 2698.0, 4405.0, 7731.0, 17595.0, 50507.0, 178522.0, 419372.0, 246006.0, 69524.0, 22679.0, 9539.0, 4901.0, 3065.0, 1987.0, 1377.0, 894.0, 636.0, 401.0, 323.0, 221.0, 148.0, 97.0, 49.0, 42.0, 48.0, 22.0, 16.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 3.0], "bins": [-2.66796875, -2.586212158203125, -2.50445556640625, -2.422698974609375, -2.3409423828125, -2.259185791015625, -2.17742919921875, -2.095672607421875, -2.013916015625, -1.932159423828125, -1.85040283203125, -1.768646240234375, -1.6868896484375, -1.605133056640625, -1.52337646484375, -1.441619873046875, -1.35986328125, -1.278106689453125, -1.19635009765625, -1.114593505859375, -1.0328369140625, -0.951080322265625, -0.86932373046875, -0.787567138671875, -0.705810546875, -0.624053955078125, -0.54229736328125, -0.460540771484375, -0.3787841796875, -0.297027587890625, -0.21527099609375, -0.133514404296875, -0.0517578125, 0.029998779296875, 0.11175537109375, 0.193511962890625, 0.2752685546875, 0.357025146484375, 0.43878173828125, 0.520538330078125, 0.602294921875, 0.684051513671875, 0.76580810546875, 0.847564697265625, 0.9293212890625, 1.011077880859375, 1.09283447265625, 1.174591064453125, 1.25634765625, 1.338104248046875, 1.41986083984375, 1.501617431640625, 1.5833740234375, 1.665130615234375, 1.74688720703125, 1.828643798828125, 1.910400390625, 1.992156982421875, 2.07391357421875, 2.155670166015625, 2.2374267578125, 2.319183349609375, 2.40093994140625, 2.482696533203125, 2.564453125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 9.0, 12.0, 21.0, 28.0, 45.0, 62.0, 72.0, 91.0, 124.0, 114.0, 104.0, 84.0, 69.0, 52.0, 36.0, 21.0, 15.0, 14.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71533203125, -0.6910781860351562, -0.6668243408203125, -0.6425704956054688, -0.618316650390625, -0.5940628051757812, -0.5698089599609375, -0.5455551147460938, -0.52130126953125, -0.49704742431640625, -0.4727935791015625, -0.44853973388671875, -0.424285888671875, -0.40003204345703125, -0.3757781982421875, -0.35152435302734375, -0.3272705078125, -0.30301666259765625, -0.2787628173828125, -0.25450897216796875, -0.230255126953125, -0.20600128173828125, -0.1817474365234375, -0.15749359130859375, -0.13323974609375, -0.10898590087890625, -0.0847320556640625, -0.06047821044921875, -0.036224365234375, -0.01197052001953125, 0.0122833251953125, 0.03653717041015625, 0.060791015625, 0.08504486083984375, 0.1092987060546875, 0.13355255126953125, 0.157806396484375, 0.18206024169921875, 0.2063140869140625, 0.23056793212890625, 0.25482177734375, 0.27907562255859375, 0.3033294677734375, 0.32758331298828125, 0.351837158203125, 0.37609100341796875, 0.4003448486328125, 0.42459869384765625, 0.4488525390625, 0.47310638427734375, 0.4973602294921875, 0.5216140747070312, 0.545867919921875, 0.5701217651367188, 0.5943756103515625, 0.6186294555664062, 0.64288330078125, 0.6671371459960938, 0.6913909912109375, 0.7156448364257812, 0.739898681640625, 0.7641525268554688, 0.7884063720703125, 0.8126602172851562, 0.8369140625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 2.0, 6.0, 7.0, 5.0, 14.0, 8.0, 20.0, 21.0, 26.0, 42.0, 68.0, 89.0, 101.0, 88.0, 117.0, 78.0, 86.0, 58.0, 46.0, 36.0, 28.0, 10.0, 13.0, 7.0, 8.0, 8.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.774717330932617, -16.364784240722656, -15.954852104187012, -15.544919967651367, -15.134987831115723, -14.725055694580078, -14.315122604370117, -13.905190467834473, -13.495258331298828, -13.085326194763184, -12.675393104553223, -12.265460968017578, -11.855528831481934, -11.445596694946289, -11.035663604736328, -10.625731468200684, -10.215798377990723, -9.805866241455078, -9.395933151245117, -8.986001014709473, -8.576068878173828, -8.166135787963867, -7.756203651428223, -7.346271514892578, -6.936338901519775, -6.526406288146973, -6.116474151611328, -5.706541538238525, -5.296608924865723, -4.886676788330078, -4.476744174957275, -4.066811561584473, -3.656879425048828, -3.2469470500946045, -2.837014675140381, -2.427082061767578, -2.0171496868133545, -1.6072173118591309, -1.1972846984863281, -0.7873523235321045, -0.37741994857788086, 0.03251248598098755, 0.44244492053985596, 0.8523774147033691, 1.2623097896575928, 1.6722421646118164, 2.082174777984619, 2.4921071529388428, 2.9020395278930664, 3.31197190284729, 3.7219042778015137, 4.131836891174316, 4.541769027709961, 4.951701641082764, 5.361634254455566, 5.771566390991211, 6.181499004364014, 6.591431617736816, 7.001363754272461, 7.411296367645264, 7.821228981018066, 8.231161117553711, 8.641094207763672, 9.051026344299316, 9.460958480834961]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 4.0, 10.0, 10.0, 11.0, 9.0, 13.0, 17.0, 10.0, 13.0, 19.0, 27.0, 36.0, 32.0, 49.0, 49.0, 52.0, 51.0, 36.0, 53.0, 43.0, 43.0, 42.0, 53.0, 27.0, 34.0, 29.0, 27.0, 17.0, 25.0, 21.0, 21.0, 21.0, 18.0, 13.0, 14.0, 7.0, 3.0, 8.0, 7.0, 11.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-5.590302467346191, -5.411503791809082, -5.2327046394348145, -5.053905963897705, -4.8751068115234375, -4.696308135986328, -4.517509460449219, -4.338710308074951, -4.159911155700684, -3.981112241744995, -3.8023133277893066, -3.6235146522521973, -3.4447154998779297, -3.2659168243408203, -3.087117910385132, -2.9083189964294434, -2.729520320892334, -2.5507214069366455, -2.371922492980957, -2.1931238174438477, -2.01432466506958, -1.8355258703231812, -1.6567270755767822, -1.4779281616210938, -1.2991292476654053, -1.1203303337097168, -0.9415314793586731, -0.7627326250076294, -0.5839337110519409, -0.40513479709625244, -0.22633600234985352, -0.04753708839416504, 0.13126134872436523, 0.3100602328777313, 0.4888591170310974, 0.6676579713821411, 0.8464568853378296, 1.025255799293518, 1.204054594039917, 1.3828535079956055, 1.561652421951294, 1.7404513359069824, 1.919250249862671, 2.0980491638183594, 2.2768478393554688, 2.4556469917297363, 2.6344456672668457, 2.813244581222534, 2.9920434951782227, 3.170842409133911, 3.3496413230895996, 3.528439998626709, 3.7072391510009766, 3.886037826538086, 4.064836502075195, 4.243635654449463, 4.4224348068237305, 4.60123348236084, 4.780032634735107, 4.958831310272217, 5.137630462646484, 5.316429138183594, 5.495227813720703, 5.674026966094971, 5.85282564163208]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 15.0, 30.0, 25.0, 40.0, 57.0, 75.0, 144.0, 202.0, 302.0, 505.0, 752.0, 1211.0, 2033.0, 3406.0, 6069.0, 10282.0, 18800.0, 35587.0, 69496.0, 127710.0, 198160.0, 218023.0, 159242.0, 91630.0, 48007.0, 25108.0, 13253.0, 7380.0, 4307.0, 2554.0, 1503.0, 940.0, 567.0, 381.0, 248.0, 142.0, 124.0, 86.0, 56.0, 37.0, 18.0, 11.0, 12.0, 10.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.86328125, -6.6434326171875, -6.423583984375, -6.2037353515625, -5.98388671875, -5.7640380859375, -5.544189453125, -5.3243408203125, -5.1044921875, -4.8846435546875, -4.664794921875, -4.4449462890625, -4.22509765625, -4.0052490234375, -3.785400390625, -3.5655517578125, -3.345703125, -3.1258544921875, -2.906005859375, -2.6861572265625, -2.46630859375, -2.2464599609375, -2.026611328125, -1.8067626953125, -1.5869140625, -1.3670654296875, -1.147216796875, -0.9273681640625, -0.70751953125, -0.4876708984375, -0.267822265625, -0.0479736328125, 0.171875, 0.3917236328125, 0.611572265625, 0.8314208984375, 1.05126953125, 1.2711181640625, 1.490966796875, 1.7108154296875, 1.9306640625, 2.1505126953125, 2.370361328125, 2.5902099609375, 2.81005859375, 3.0299072265625, 3.249755859375, 3.4696044921875, 3.689453125, 3.9093017578125, 4.129150390625, 4.3489990234375, 4.56884765625, 4.7886962890625, 5.008544921875, 5.2283935546875, 5.4482421875, 5.6680908203125, 5.887939453125, 6.1077880859375, 6.32763671875, 6.5474853515625, 6.767333984375, 6.9871826171875, 7.20703125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 5.0, 11.0, 6.0, 12.0, 9.0, 16.0, 13.0, 11.0, 28.0, 19.0, 33.0, 28.0, 47.0, 49.0, 52.0, 53.0, 52.0, 39.0, 50.0, 49.0, 48.0, 54.0, 46.0, 35.0, 22.0, 26.0, 21.0, 20.0, 16.0, 18.0, 23.0, 16.0, 9.0, 12.0, 10.0, 7.0, 6.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.9453125, -5.73651123046875, -5.5277099609375, -5.31890869140625, -5.110107421875, -4.90130615234375, -4.6925048828125, -4.48370361328125, -4.27490234375, -4.06610107421875, -3.8572998046875, -3.64849853515625, -3.439697265625, -3.23089599609375, -3.0220947265625, -2.81329345703125, -2.6044921875, -2.39569091796875, -2.1868896484375, -1.97808837890625, -1.769287109375, -1.56048583984375, -1.3516845703125, -1.14288330078125, -0.93408203125, -0.72528076171875, -0.5164794921875, -0.30767822265625, -0.098876953125, 0.10992431640625, 0.3187255859375, 0.52752685546875, 0.736328125, 0.94512939453125, 1.1539306640625, 1.36273193359375, 1.571533203125, 1.78033447265625, 1.9891357421875, 2.19793701171875, 2.40673828125, 2.61553955078125, 2.8243408203125, 3.03314208984375, 3.241943359375, 3.45074462890625, 3.6595458984375, 3.86834716796875, 4.0771484375, 4.28594970703125, 4.4947509765625, 4.70355224609375, 4.912353515625, 5.12115478515625, 5.3299560546875, 5.53875732421875, 5.74755859375, 5.95635986328125, 6.1651611328125, 6.37396240234375, 6.582763671875, 6.79156494140625, 7.0003662109375, 7.20916748046875, 7.41796875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 8.0, 18.0, 19.0, 38.0, 51.0, 107.0, 141.0, 193.0, 362.0, 512.0, 802.0, 1344.0, 2128.0, 3406.0, 5405.0, 8992.0, 14603.0, 24279.0, 40624.0, 66423.0, 104780.0, 147647.0, 170023.0, 155588.0, 114215.0, 73126.0, 44696.0, 26888.0, 16261.0, 9723.0, 5948.0, 3764.0, 2373.0, 1491.0, 974.0, 606.0, 367.0, 225.0, 160.0, 92.0, 62.0, 37.0, 25.0, 12.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.94140625, -5.76458740234375, -5.5877685546875, -5.41094970703125, -5.234130859375, -5.05731201171875, -4.8804931640625, -4.70367431640625, -4.52685546875, -4.35003662109375, -4.1732177734375, -3.99639892578125, -3.819580078125, -3.64276123046875, -3.4659423828125, -3.28912353515625, -3.1123046875, -2.93548583984375, -2.7586669921875, -2.58184814453125, -2.405029296875, -2.22821044921875, -2.0513916015625, -1.87457275390625, -1.69775390625, -1.52093505859375, -1.3441162109375, -1.16729736328125, -0.990478515625, -0.81365966796875, -0.6368408203125, -0.46002197265625, -0.283203125, -0.10638427734375, 0.0704345703125, 0.24725341796875, 0.424072265625, 0.60089111328125, 0.7777099609375, 0.95452880859375, 1.13134765625, 1.30816650390625, 1.4849853515625, 1.66180419921875, 1.838623046875, 2.01544189453125, 2.1922607421875, 2.36907958984375, 2.5458984375, 2.72271728515625, 2.8995361328125, 3.07635498046875, 3.253173828125, 3.42999267578125, 3.6068115234375, 3.78363037109375, 3.96044921875, 4.13726806640625, 4.3140869140625, 4.49090576171875, 4.667724609375, 4.84454345703125, 5.0213623046875, 5.19818115234375, 5.375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 8.0, 8.0, 4.0, 6.0, 11.0, 5.0, 13.0, 14.0, 8.0, 10.0, 18.0, 20.0, 24.0, 30.0, 30.0, 28.0, 36.0, 34.0, 38.0, 48.0, 44.0, 39.0, 36.0, 36.0, 32.0, 36.0, 49.0, 33.0, 29.0, 34.0, 29.0, 26.0, 17.0, 29.0, 27.0, 20.0, 18.0, 13.0, 9.0, 10.0, 8.0, 10.0, 3.0, 11.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.607421875, -3.500885009765625, -3.39434814453125, -3.287811279296875, -3.1812744140625, -3.074737548828125, -2.96820068359375, -2.861663818359375, -2.755126953125, -2.648590087890625, -2.54205322265625, -2.435516357421875, -2.3289794921875, -2.222442626953125, -2.11590576171875, -2.009368896484375, -1.90283203125, -1.796295166015625, -1.68975830078125, -1.583221435546875, -1.4766845703125, -1.370147705078125, -1.26361083984375, -1.157073974609375, -1.050537109375, -0.944000244140625, -0.83746337890625, -0.730926513671875, -0.6243896484375, -0.517852783203125, -0.41131591796875, -0.304779052734375, -0.1982421875, -0.091705322265625, 0.01483154296875, 0.121368408203125, 0.2279052734375, 0.334442138671875, 0.44097900390625, 0.547515869140625, 0.654052734375, 0.760589599609375, 0.86712646484375, 0.973663330078125, 1.0802001953125, 1.186737060546875, 1.29327392578125, 1.399810791015625, 1.50634765625, 1.612884521484375, 1.71942138671875, 1.825958251953125, 1.9324951171875, 2.039031982421875, 2.14556884765625, 2.252105712890625, 2.358642578125, 2.465179443359375, 2.57171630859375, 2.678253173828125, 2.7847900390625, 2.891326904296875, 2.99786376953125, 3.104400634765625, 3.2109375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 11.0, 9.0, 19.0, 32.0, 38.0, 60.0, 90.0, 134.0, 253.0, 364.0, 625.0, 1016.0, 1850.0, 3329.0, 6545.0, 13539.0, 32502.0, 86202.0, 233350.0, 354851.0, 192993.0, 69633.0, 26817.0, 11591.0, 5651.0, 3002.0, 1690.0, 930.0, 516.0, 321.0, 203.0, 152.0, 72.0, 52.0, 35.0, 28.0, 16.0, 11.0, 7.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.55780029296875, -4.3851318359375, -4.21246337890625, -4.039794921875, -3.86712646484375, -3.6944580078125, -3.52178955078125, -3.34912109375, -3.17645263671875, -3.0037841796875, -2.83111572265625, -2.658447265625, -2.48577880859375, -2.3131103515625, -2.14044189453125, -1.9677734375, -1.79510498046875, -1.6224365234375, -1.44976806640625, -1.277099609375, -1.10443115234375, -0.9317626953125, -0.75909423828125, -0.58642578125, -0.41375732421875, -0.2410888671875, -0.06842041015625, 0.104248046875, 0.27691650390625, 0.4495849609375, 0.62225341796875, 0.794921875, 0.96759033203125, 1.1402587890625, 1.31292724609375, 1.485595703125, 1.65826416015625, 1.8309326171875, 2.00360107421875, 2.17626953125, 2.34893798828125, 2.5216064453125, 2.69427490234375, 2.866943359375, 3.03961181640625, 3.2122802734375, 3.38494873046875, 3.5576171875, 3.73028564453125, 3.9029541015625, 4.07562255859375, 4.248291015625, 4.42095947265625, 4.5936279296875, 4.76629638671875, 4.93896484375, 5.11163330078125, 5.2843017578125, 5.45697021484375, 5.629638671875, 5.80230712890625, 5.9749755859375, 6.14764404296875, 6.3203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 14.0, 11.0, 18.0, 22.0, 28.0, 29.0, 52.0, 66.0, 80.0, 97.0, 115.0, 93.0, 97.0, 62.0, 52.0, 37.0, 27.0, 21.0, 20.0, 12.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004901885986328125, -0.000474683940410614, -0.00045917928218841553, -0.00044367462396621704, -0.00042816996574401855, -0.00041266530752182007, -0.0003971606492996216, -0.0003816559910774231, -0.0003661513328552246, -0.0003506466746330261, -0.00033514201641082764, -0.00031963735818862915, -0.00030413269996643066, -0.0002886280417442322, -0.0002731233835220337, -0.0002576187252998352, -0.00024211406707763672, -0.00022660940885543823, -0.00021110475063323975, -0.00019560009241104126, -0.00018009543418884277, -0.0001645907759666443, -0.0001490861177444458, -0.00013358145952224731, -0.00011807680130004883, -0.00010257214307785034, -8.706748485565186e-05, -7.156282663345337e-05, -5.605816841125488e-05, -4.0553510189056396e-05, -2.504885196685791e-05, -9.544193744659424e-06, 5.9604644775390625e-06, 2.146512269973755e-05, 3.6969780921936035e-05, 5.247443914413452e-05, 6.797909736633301e-05, 8.34837555885315e-05, 9.898841381072998e-05, 0.00011449307203292847, 0.00012999773025512695, 0.00014550238847732544, 0.00016100704669952393, 0.0001765117049217224, 0.0001920163631439209, 0.00020752102136611938, 0.00022302567958831787, 0.00023853033781051636, 0.00025403499603271484, 0.00026953965425491333, 0.0002850443124771118, 0.0003005489706993103, 0.0003160536289215088, 0.0003315582871437073, 0.00034706294536590576, 0.00036256760358810425, 0.00037807226181030273, 0.0003935769200325012, 0.0004090815782546997, 0.0004245862364768982, 0.0004400908946990967, 0.00045559555292129517, 0.00047110021114349365, 0.00048660486936569214, 0.0005021095275878906]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 9.0, 11.0, 9.0, 8.0, 16.0, 24.0, 26.0, 39.0, 66.0, 82.0, 135.0, 179.0, 286.0, 406.0, 634.0, 1088.0, 1724.0, 3135.0, 5845.0, 11313.0, 23942.0, 53273.0, 119490.0, 227504.0, 270080.0, 174149.0, 82495.0, 36669.0, 16937.0, 8459.0, 4349.0, 2308.0, 1373.0, 884.0, 532.0, 342.0, 222.0, 147.0, 121.0, 76.0, 46.0, 31.0, 27.0, 19.0, 14.0, 13.0, 8.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.669921875, -3.548675537109375, -3.42742919921875, -3.306182861328125, -3.1849365234375, -3.063690185546875, -2.94244384765625, -2.821197509765625, -2.699951171875, -2.578704833984375, -2.45745849609375, -2.336212158203125, -2.2149658203125, -2.093719482421875, -1.97247314453125, -1.851226806640625, -1.72998046875, -1.608734130859375, -1.48748779296875, -1.366241455078125, -1.2449951171875, -1.123748779296875, -1.00250244140625, -0.881256103515625, -0.760009765625, -0.638763427734375, -0.51751708984375, -0.396270751953125, -0.2750244140625, -0.153778076171875, -0.03253173828125, 0.088714599609375, 0.2099609375, 0.331207275390625, 0.45245361328125, 0.573699951171875, 0.6949462890625, 0.816192626953125, 0.93743896484375, 1.058685302734375, 1.179931640625, 1.301177978515625, 1.42242431640625, 1.543670654296875, 1.6649169921875, 1.786163330078125, 1.90740966796875, 2.028656005859375, 2.14990234375, 2.271148681640625, 2.39239501953125, 2.513641357421875, 2.6348876953125, 2.756134033203125, 2.87738037109375, 2.998626708984375, 3.119873046875, 3.241119384765625, 3.36236572265625, 3.483612060546875, 3.6048583984375, 3.726104736328125, 3.84735107421875, 3.968597412109375, 4.08984375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 11.0, 16.0, 19.0, 27.0, 42.0, 46.0, 39.0, 42.0, 66.0, 77.0, 67.0, 66.0, 87.0, 73.0, 66.0, 57.0, 50.0, 33.0, 25.0, 17.0, 23.0, 19.0, 6.0, 8.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.0828857421875, -1.048583984375, -1.0142822265625, -0.97998046875, -0.9456787109375, -0.911376953125, -0.8770751953125, -0.8427734375, -0.8084716796875, -0.774169921875, -0.7398681640625, -0.70556640625, -0.6712646484375, -0.636962890625, -0.6026611328125, -0.568359375, -0.5340576171875, -0.499755859375, -0.4654541015625, -0.43115234375, -0.3968505859375, -0.362548828125, -0.3282470703125, -0.2939453125, -0.2596435546875, -0.225341796875, -0.1910400390625, -0.15673828125, -0.1224365234375, -0.088134765625, -0.0538330078125, -0.01953125, 0.0147705078125, 0.049072265625, 0.0833740234375, 0.11767578125, 0.1519775390625, 0.186279296875, 0.2205810546875, 0.2548828125, 0.2891845703125, 0.323486328125, 0.3577880859375, 0.39208984375, 0.4263916015625, 0.460693359375, 0.4949951171875, 0.529296875, 0.5635986328125, 0.597900390625, 0.6322021484375, 0.66650390625, 0.7008056640625, 0.735107421875, 0.7694091796875, 0.8037109375, 0.8380126953125, 0.872314453125, 0.9066162109375, 0.94091796875, 0.9752197265625, 1.009521484375, 1.0438232421875, 1.078125]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 6.0, 4.0, 4.0, 8.0, 6.0, 8.0, 11.0, 23.0, 21.0, 33.0, 46.0, 69.0, 94.0, 94.0, 98.0, 119.0, 76.0, 75.0, 63.0, 45.0, 27.0, 19.0, 10.0, 17.0, 6.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.112650871276855, -14.689648628234863, -14.266647338867188, -13.843645095825195, -13.420642852783203, -12.997641563415527, -12.574639320373535, -12.15163803100586, -11.728635787963867, -11.305633544921875, -10.8826322555542, -10.459630012512207, -10.036628723144531, -9.613626480102539, -9.190624237060547, -8.767621994018555, -8.344620704650879, -7.921618938446045, -7.498617172241211, -7.075614929199219, -6.652613162994385, -6.229611396789551, -5.806609153747559, -5.383607387542725, -4.960605621337891, -4.537603855133057, -4.114602088928223, -3.6915998458862305, -3.2685980796813965, -2.8455963134765625, -2.4225943088531494, -1.9995923042297363, -1.5765914916992188, -1.1535896062850952, -0.7305877208709717, -0.30758583545684814, 0.11541604995727539, 0.5384178161621094, 0.9614198207855225, 1.3844218254089355, 1.8074235916137695, 2.2304253578186035, 2.6534273624420166, 3.0764293670654297, 3.4994311332702637, 3.9224328994750977, 4.34543514251709, 4.768436908721924, 5.191438674926758, 5.614440441131592, 6.037442207336426, 6.460444450378418, 6.883446216583252, 7.306447982788086, 7.729450225830078, 8.15245246887207, 8.575453758239746, 8.998456001281738, 9.421457290649414, 9.844459533691406, 10.267461776733398, 10.690463066101074, 11.113465309143066, 11.536466598510742, 11.959468841552734]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 1.0, 6.0, 7.0, 4.0, 14.0, 10.0, 9.0, 15.0, 15.0, 25.0, 18.0, 24.0, 23.0, 39.0, 37.0, 45.0, 34.0, 39.0, 42.0, 45.0, 49.0, 50.0, 45.0, 46.0, 30.0, 36.0, 37.0, 35.0, 32.0, 19.0, 29.0, 16.0, 22.0, 21.0, 14.0, 11.0, 11.0, 11.0, 8.0, 5.0, 4.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.358779430389404, -5.175360202789307, -4.991940498352051, -4.808521270751953, -4.625101566314697, -4.4416823387146, -4.258262634277344, -4.074843406677246, -3.8914239406585693, -3.7080044746398926, -3.524585008621216, -3.341165542602539, -3.1577463150024414, -2.9743266105651855, -2.790907382965088, -2.607487916946411, -2.4240684509277344, -2.2406489849090576, -2.057229518890381, -1.8738101720809937, -1.690390706062317, -1.5069712400436401, -1.323551893234253, -1.1401324272155762, -0.9567129611968994, -0.7732934951782227, -0.5898740887641907, -0.4064546823501587, -0.22303521633148193, -0.039615750312805176, 0.14380359649658203, 0.3272230625152588, 0.5106430053710938, 0.6940624713897705, 0.8774818778038025, 1.0609012842178345, 1.2443207502365112, 1.427740216255188, 1.6111595630645752, 1.794579029083252, 1.9779984951019287, 2.1614179611206055, 2.3448374271392822, 2.528256893157959, 2.7116761207580566, 2.8950958251953125, 3.07851505279541, 3.261934518814087, 3.4453539848327637, 3.6287734508514404, 3.812192916870117, 3.995612144470215, 4.179031848907471, 4.362451076507568, 4.545870780944824, 4.729290008544922, 4.9127092361450195, 5.096128463745117, 5.279548168182373, 5.462967395782471, 5.646387100219727, 5.829806327819824, 6.013225555419922, 6.196645259857178, 6.380064964294434]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [5.0, 5.0, 10.0, 12.0, 22.0, 18.0, 39.0, 38.0, 62.0, 62.0, 106.0, 110.0, 185.0, 246.0, 315.0, 468.0, 726.0, 1081.0, 1481.0, 2164.0, 3266.0, 5118.0, 8057.0, 13691.0, 24979.0, 52693.0, 131531.0, 395882.0, 1119774.0, 1446652.0, 634057.0, 199218.0, 73613.0, 32729.0, 17169.0, 9748.0, 6123.0, 4091.0, 2698.0, 1814.0, 1218.0, 822.0, 643.0, 413.0, 324.0, 214.0, 147.0, 135.0, 96.0, 66.0, 33.0, 39.0, 22.0, 16.0, 18.0, 6.0, 4.0, 8.0, 8.0, 7.0, 2.0, 1.0, 1.0, 3.0], "bins": [-9.9375, -9.5972900390625, -9.257080078125, -8.9168701171875, -8.57666015625, -8.2364501953125, -7.896240234375, -7.5560302734375, -7.2158203125, -6.8756103515625, -6.535400390625, -6.1951904296875, -5.85498046875, -5.5147705078125, -5.174560546875, -4.8343505859375, -4.494140625, -4.1539306640625, -3.813720703125, -3.4735107421875, -3.13330078125, -2.7930908203125, -2.452880859375, -2.1126708984375, -1.7724609375, -1.4322509765625, -1.092041015625, -0.7518310546875, -0.41162109375, -0.0714111328125, 0.268798828125, 0.6090087890625, 0.94921875, 1.2894287109375, 1.629638671875, 1.9698486328125, 2.31005859375, 2.6502685546875, 2.990478515625, 3.3306884765625, 3.6708984375, 4.0111083984375, 4.351318359375, 4.6915283203125, 5.03173828125, 5.3719482421875, 5.712158203125, 6.0523681640625, 6.392578125, 6.7327880859375, 7.072998046875, 7.4132080078125, 7.75341796875, 8.0936279296875, 8.433837890625, 8.7740478515625, 9.1142578125, 9.4544677734375, 9.794677734375, 10.1348876953125, 10.47509765625, 10.8153076171875, 11.155517578125, 11.4957275390625, 11.8359375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 4.0, 8.0, 6.0, 8.0, 6.0, 14.0, 11.0, 20.0, 28.0, 19.0, 26.0, 22.0, 30.0, 30.0, 41.0, 46.0, 46.0, 42.0, 50.0, 54.0, 48.0, 45.0, 41.0, 33.0, 35.0, 36.0, 27.0, 28.0, 20.0, 26.0, 27.0, 17.0, 16.0, 12.0, 15.0, 7.0, 7.0, 12.0, 7.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2578125, -4.11669921875, -3.9755859375, -3.83447265625, -3.693359375, -3.55224609375, -3.4111328125, -3.27001953125, -3.12890625, -2.98779296875, -2.8466796875, -2.70556640625, -2.564453125, -2.42333984375, -2.2822265625, -2.14111328125, -2.0, -1.85888671875, -1.7177734375, -1.57666015625, -1.435546875, -1.29443359375, -1.1533203125, -1.01220703125, -0.87109375, -0.72998046875, -0.5888671875, -0.44775390625, -0.306640625, -0.16552734375, -0.0244140625, 0.11669921875, 0.2578125, 0.39892578125, 0.5400390625, 0.68115234375, 0.822265625, 0.96337890625, 1.1044921875, 1.24560546875, 1.38671875, 1.52783203125, 1.6689453125, 1.81005859375, 1.951171875, 2.09228515625, 2.2333984375, 2.37451171875, 2.515625, 2.65673828125, 2.7978515625, 2.93896484375, 3.080078125, 3.22119140625, 3.3623046875, 3.50341796875, 3.64453125, 3.78564453125, 3.9267578125, 4.06787109375, 4.208984375, 4.35009765625, 4.4912109375, 4.63232421875, 4.7734375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 16.0, 26.0, 37.0, 41.0, 64.0, 116.0, 169.0, 237.0, 318.0, 517.0, 756.0, 1168.0, 1838.0, 2886.0, 4624.0, 7738.0, 13341.0, 23641.0, 46836.0, 105669.0, 292107.0, 900650.0, 1574979.0, 773121.0, 251936.0, 94994.0, 42929.0, 21896.0, 12219.0, 7246.0, 4300.0, 2709.0, 1814.0, 1159.0, 718.0, 451.0, 332.0, 226.0, 138.0, 96.0, 74.0, 47.0, 31.0, 20.0, 18.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.3125, -12.914306640625, -12.51611328125, -12.117919921875, -11.7197265625, -11.321533203125, -10.92333984375, -10.525146484375, -10.126953125, -9.728759765625, -9.33056640625, -8.932373046875, -8.5341796875, -8.135986328125, -7.73779296875, -7.339599609375, -6.94140625, -6.543212890625, -6.14501953125, -5.746826171875, -5.3486328125, -4.950439453125, -4.55224609375, -4.154052734375, -3.755859375, -3.357666015625, -2.95947265625, -2.561279296875, -2.1630859375, -1.764892578125, -1.36669921875, -0.968505859375, -0.5703125, -0.172119140625, 0.22607421875, 0.624267578125, 1.0224609375, 1.420654296875, 1.81884765625, 2.217041015625, 2.615234375, 3.013427734375, 3.41162109375, 3.809814453125, 4.2080078125, 4.606201171875, 5.00439453125, 5.402587890625, 5.80078125, 6.198974609375, 6.59716796875, 6.995361328125, 7.3935546875, 7.791748046875, 8.18994140625, 8.588134765625, 8.986328125, 9.384521484375, 9.78271484375, 10.180908203125, 10.5791015625, 10.977294921875, 11.37548828125, 11.773681640625, 12.171875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 6.0, 10.0, 13.0, 17.0, 14.0, 14.0, 37.0, 43.0, 62.0, 63.0, 91.0, 136.0, 149.0, 207.0, 286.0, 308.0, 329.0, 457.0, 398.0, 307.0, 258.0, 195.0, 160.0, 101.0, 99.0, 72.0, 39.0, 41.0, 32.0, 30.0, 17.0, 18.0, 11.0, 13.0, 8.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.283203125, -3.1790771484375, -3.074951171875, -2.9708251953125, -2.86669921875, -2.7625732421875, -2.658447265625, -2.5543212890625, -2.4501953125, -2.3460693359375, -2.241943359375, -2.1378173828125, -2.03369140625, -1.9295654296875, -1.825439453125, -1.7213134765625, -1.6171875, -1.5130615234375, -1.408935546875, -1.3048095703125, -1.20068359375, -1.0965576171875, -0.992431640625, -0.8883056640625, -0.7841796875, -0.6800537109375, -0.575927734375, -0.4718017578125, -0.36767578125, -0.2635498046875, -0.159423828125, -0.0552978515625, 0.048828125, 0.1529541015625, 0.257080078125, 0.3612060546875, 0.46533203125, 0.5694580078125, 0.673583984375, 0.7777099609375, 0.8818359375, 0.9859619140625, 1.090087890625, 1.1942138671875, 1.29833984375, 1.4024658203125, 1.506591796875, 1.6107177734375, 1.71484375, 1.8189697265625, 1.923095703125, 2.0272216796875, 2.13134765625, 2.2354736328125, 2.339599609375, 2.4437255859375, 2.5478515625, 2.6519775390625, 2.756103515625, 2.8602294921875, 2.96435546875, 3.0684814453125, 3.172607421875, 3.2767333984375, 3.380859375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 6.0, 4.0, 2.0, 3.0, 10.0, 7.0, 10.0, 17.0, 28.0, 34.0, 44.0, 56.0, 74.0, 90.0, 85.0, 103.0, 99.0, 79.0, 53.0, 43.0, 32.0, 30.0, 23.0, 14.0, 8.0, 10.0, 4.0, 8.0, 4.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.243199348449707, -10.845352172851562, -10.447504997253418, -10.04965877532959, -9.651811599731445, -9.2539644241333, -8.856117248535156, -8.458271026611328, -8.060423851013184, -7.662576675415039, -7.264729976654053, -6.866882801055908, -6.469036102294922, -6.071188926696777, -5.673341751098633, -5.2754950523376465, -4.877647876739502, -4.479800701141357, -4.081954002380371, -3.6841068267822266, -3.2862601280212402, -2.8884129524230957, -2.4905660152435303, -2.092719078063965, -1.6948721408843994, -1.297025203704834, -0.8991782069206238, -0.5013312101364136, -0.10348427295684814, 0.2943626642227173, 0.6922097206115723, 1.0900566577911377, 1.4879035949707031, 1.8857505321502686, 2.283597469329834, 2.6814446449279785, 3.079291343688965, 3.4771385192871094, 3.874985456466675, 4.27283239364624, 4.670679092407227, 5.068526268005371, 5.466372966766357, 5.864220142364502, 6.262066841125488, 6.659914016723633, 7.057761192321777, 7.455607891082764, 7.853455066680908, 8.251301765441895, 8.649148941040039, 9.046996116638184, 9.444843292236328, 9.842689514160156, 10.2405366897583, 10.638383865356445, 11.03623104095459, 11.434078216552734, 11.831925392150879, 12.229771614074707, 12.627618789672852, 13.025465965270996, 13.42331314086914, 13.821159362792969, 14.219006538391113]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 12.0, 19.0, 13.0, 15.0, 27.0, 23.0, 24.0, 30.0, 25.0, 49.0, 40.0, 42.0, 35.0, 51.0, 45.0, 48.0, 40.0, 42.0, 43.0, 50.0, 46.0, 33.0, 37.0, 33.0, 18.0, 18.0, 19.0, 10.0, 17.0, 14.0, 11.0, 11.0, 11.0, 5.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.619811058044434, -6.416428565979004, -6.213045597076416, -6.009663105010986, -5.806280136108398, -5.602897644042969, -5.399515151977539, -5.196132183074951, -4.992749214172363, -4.789366722106934, -4.585983753204346, -4.382601261138916, -4.179218292236328, -3.9758358001708984, -3.7724530696868896, -3.569070339202881, -3.365687847137451, -3.1623051166534424, -2.9589223861694336, -2.755539894104004, -2.552156925201416, -2.3487744331359863, -2.1453917026519775, -1.9420089721679688, -1.73862624168396, -1.5352435111999512, -1.3318607807159424, -1.1284781694412231, -0.9250954389572144, -0.7217127084732056, -0.5183300971984863, -0.31494736671447754, -0.11156511306762695, 0.09181758761405945, 0.29520028829574585, 0.49858295917510986, 0.7019656896591187, 0.9053484201431274, 1.1087310314178467, 1.3121137619018555, 1.5154964923858643, 1.718879222869873, 1.9222619533538818, 2.1256446838378906, 2.3290271759033203, 2.532410144805908, 2.735792636871338, 2.9391753673553467, 3.1425580978393555, 3.3459408283233643, 3.549323558807373, 3.7527060508728027, 3.9560890197753906, 4.15947151184082, 4.36285400390625, 4.566236972808838, 4.769619941711426, 4.9730024337768555, 5.176385402679443, 5.379767894744873, 5.583150863647461, 5.786533355712891, 5.98991584777832, 6.193298816680908, 6.396681308746338]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 14.0, 17.0, 25.0, 37.0, 66.0, 115.0, 180.0, 287.0, 459.0, 864.0, 1664.0, 2885.0, 5339.0, 10808.0, 22532.0, 51957.0, 126479.0, 268143.0, 292636.0, 150130.0, 61948.0, 26167.0, 12326.0, 6101.0, 3229.0, 1738.0, 1019.0, 577.0, 306.0, 191.0, 122.0, 71.0, 39.0, 24.0, 15.0, 11.0, 12.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.904296875, -3.770111083984375, -3.63592529296875, -3.501739501953125, -3.3675537109375, -3.233367919921875, -3.09918212890625, -2.964996337890625, -2.830810546875, -2.696624755859375, -2.56243896484375, -2.428253173828125, -2.2940673828125, -2.159881591796875, -2.02569580078125, -1.891510009765625, -1.75732421875, -1.623138427734375, -1.48895263671875, -1.354766845703125, -1.2205810546875, -1.086395263671875, -0.95220947265625, -0.818023681640625, -0.683837890625, -0.549652099609375, -0.41546630859375, -0.281280517578125, -0.1470947265625, -0.012908935546875, 0.12127685546875, 0.255462646484375, 0.3896484375, 0.523834228515625, 0.65802001953125, 0.792205810546875, 0.9263916015625, 1.060577392578125, 1.19476318359375, 1.328948974609375, 1.463134765625, 1.597320556640625, 1.73150634765625, 1.865692138671875, 1.9998779296875, 2.134063720703125, 2.26824951171875, 2.402435302734375, 2.53662109375, 2.670806884765625, 2.80499267578125, 2.939178466796875, 3.0733642578125, 3.207550048828125, 3.34173583984375, 3.475921630859375, 3.610107421875, 3.744293212890625, 3.87847900390625, 4.012664794921875, 4.1468505859375, 4.281036376953125, 4.41522216796875, 4.549407958984375, 4.68359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 6.0, 7.0, 11.0, 10.0, 14.0, 11.0, 17.0, 16.0, 23.0, 38.0, 39.0, 35.0, 35.0, 31.0, 36.0, 38.0, 52.0, 41.0, 54.0, 35.0, 39.0, 47.0, 37.0, 35.0, 36.0, 44.0, 31.0, 27.0, 21.0, 23.0, 15.0, 10.0, 15.0, 9.0, 9.0, 14.0, 6.0, 2.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.9691162109375, -5.754638671875, -5.5401611328125, -5.32568359375, -5.1112060546875, -4.896728515625, -4.6822509765625, -4.4677734375, -4.2532958984375, -4.038818359375, -3.8243408203125, -3.60986328125, -3.3953857421875, -3.180908203125, -2.9664306640625, -2.751953125, -2.5374755859375, -2.322998046875, -2.1085205078125, -1.89404296875, -1.6795654296875, -1.465087890625, -1.2506103515625, -1.0361328125, -0.8216552734375, -0.607177734375, -0.3927001953125, -0.17822265625, 0.0362548828125, 0.250732421875, 0.4652099609375, 0.6796875, 0.8941650390625, 1.108642578125, 1.3231201171875, 1.53759765625, 1.7520751953125, 1.966552734375, 2.1810302734375, 2.3955078125, 2.6099853515625, 2.824462890625, 3.0389404296875, 3.25341796875, 3.4678955078125, 3.682373046875, 3.8968505859375, 4.111328125, 4.3258056640625, 4.540283203125, 4.7547607421875, 4.96923828125, 5.1837158203125, 5.398193359375, 5.6126708984375, 5.8271484375, 6.0416259765625, 6.256103515625, 6.4705810546875, 6.68505859375, 6.8995361328125, 7.114013671875, 7.3284912109375, 7.54296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 10.0, 11.0, 11.0, 18.0, 26.0, 37.0, 62.0, 83.0, 124.0, 199.0, 268.0, 491.0, 706.0, 1182.0, 2001.0, 3281.0, 6008.0, 11264.0, 22823.0, 48024.0, 109720.0, 239330.0, 298801.0, 164578.0, 72008.0, 32699.0, 15926.0, 8079.0, 4299.0, 2506.0, 1472.0, 915.0, 548.0, 350.0, 246.0, 127.0, 120.0, 58.0, 51.0, 33.0, 22.0, 13.0, 14.0, 4.0, 0.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.634033203125, -4.49462890625, -4.355224609375, -4.2158203125, -4.076416015625, -3.93701171875, -3.797607421875, -3.658203125, -3.518798828125, -3.37939453125, -3.239990234375, -3.1005859375, -2.961181640625, -2.82177734375, -2.682373046875, -2.54296875, -2.403564453125, -2.26416015625, -2.124755859375, -1.9853515625, -1.845947265625, -1.70654296875, -1.567138671875, -1.427734375, -1.288330078125, -1.14892578125, -1.009521484375, -0.8701171875, -0.730712890625, -0.59130859375, -0.451904296875, -0.3125, -0.173095703125, -0.03369140625, 0.105712890625, 0.2451171875, 0.384521484375, 0.52392578125, 0.663330078125, 0.802734375, 0.942138671875, 1.08154296875, 1.220947265625, 1.3603515625, 1.499755859375, 1.63916015625, 1.778564453125, 1.91796875, 2.057373046875, 2.19677734375, 2.336181640625, 2.4755859375, 2.614990234375, 2.75439453125, 2.893798828125, 3.033203125, 3.172607421875, 3.31201171875, 3.451416015625, 3.5908203125, 3.730224609375, 3.86962890625, 4.009033203125, 4.1484375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 2.0, 6.0, 5.0, 11.0, 9.0, 10.0, 8.0, 14.0, 19.0, 16.0, 18.0, 23.0, 26.0, 32.0, 36.0, 27.0, 39.0, 36.0, 39.0, 32.0, 37.0, 34.0, 55.0, 39.0, 45.0, 28.0, 41.0, 37.0, 38.0, 33.0, 27.0, 22.0, 21.0, 16.0, 20.0, 16.0, 16.0, 12.0, 11.0, 9.0, 7.0, 5.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.572265625, -3.4583740234375, -3.344482421875, -3.2305908203125, -3.11669921875, -3.0028076171875, -2.888916015625, -2.7750244140625, -2.6611328125, -2.5472412109375, -2.433349609375, -2.3194580078125, -2.20556640625, -2.0916748046875, -1.977783203125, -1.8638916015625, -1.75, -1.6361083984375, -1.522216796875, -1.4083251953125, -1.29443359375, -1.1805419921875, -1.066650390625, -0.9527587890625, -0.8388671875, -0.7249755859375, -0.611083984375, -0.4971923828125, -0.38330078125, -0.2694091796875, -0.155517578125, -0.0416259765625, 0.072265625, 0.1861572265625, 0.300048828125, 0.4139404296875, 0.52783203125, 0.6417236328125, 0.755615234375, 0.8695068359375, 0.9833984375, 1.0972900390625, 1.211181640625, 1.3250732421875, 1.43896484375, 1.5528564453125, 1.666748046875, 1.7806396484375, 1.89453125, 2.0084228515625, 2.122314453125, 2.2362060546875, 2.35009765625, 2.4639892578125, 2.577880859375, 2.6917724609375, 2.8056640625, 2.9195556640625, 3.033447265625, 3.1473388671875, 3.26123046875, 3.3751220703125, 3.489013671875, 3.6029052734375, 3.716796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 4.0, 12.0, 8.0, 18.0, 30.0, 27.0, 35.0, 44.0, 80.0, 147.0, 204.0, 331.0, 557.0, 869.0, 1612.0, 2817.0, 5302.0, 9989.0, 19836.0, 42365.0, 94755.0, 213089.0, 312344.0, 187283.0, 81982.0, 37029.0, 17904.0, 8852.0, 4717.0, 2586.0, 1521.0, 835.0, 497.0, 313.0, 180.0, 129.0, 83.0, 62.0, 39.0, 30.0, 13.0, 15.0, 4.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.537109375, -1.478912353515625, -1.42071533203125, -1.362518310546875, -1.3043212890625, -1.246124267578125, -1.18792724609375, -1.129730224609375, -1.071533203125, -1.013336181640625, -0.95513916015625, -0.896942138671875, -0.8387451171875, -0.780548095703125, -0.72235107421875, -0.664154052734375, -0.60595703125, -0.547760009765625, -0.48956298828125, -0.431365966796875, -0.3731689453125, -0.314971923828125, -0.25677490234375, -0.198577880859375, -0.140380859375, -0.082183837890625, -0.02398681640625, 0.034210205078125, 0.0924072265625, 0.150604248046875, 0.20880126953125, 0.266998291015625, 0.3251953125, 0.383392333984375, 0.44158935546875, 0.499786376953125, 0.5579833984375, 0.616180419921875, 0.67437744140625, 0.732574462890625, 0.790771484375, 0.848968505859375, 0.90716552734375, 0.965362548828125, 1.0235595703125, 1.081756591796875, 1.13995361328125, 1.198150634765625, 1.25634765625, 1.314544677734375, 1.37274169921875, 1.430938720703125, 1.4891357421875, 1.547332763671875, 1.60552978515625, 1.663726806640625, 1.721923828125, 1.780120849609375, 1.83831787109375, 1.896514892578125, 1.9547119140625, 2.012908935546875, 2.07110595703125, 2.129302978515625, 2.1875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 6.0, 9.0, 9.0, 14.0, 19.0, 12.0, 29.0, 30.0, 40.0, 34.0, 42.0, 61.0, 62.0, 78.0, 74.0, 98.0, 75.0, 50.0, 56.0, 34.0, 32.0, 15.0, 16.0, 21.0, 16.0, 11.0, 9.0, 6.0, 4.0, 8.0, 3.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.683038711547852e-05, -7.397402077913284e-05, -7.111765444278717e-05, -6.82612881064415e-05, -6.540492177009583e-05, -6.254855543375015e-05, -5.969218909740448e-05, -5.683582276105881e-05, -5.3979456424713135e-05, -5.112309008836746e-05, -4.826672375202179e-05, -4.541035741567612e-05, -4.2553991079330444e-05, -3.969762474298477e-05, -3.68412584066391e-05, -3.3984892070293427e-05, -3.1128525733947754e-05, -2.827215939760208e-05, -2.541579306125641e-05, -2.2559426724910736e-05, -1.9703060388565063e-05, -1.684669405221939e-05, -1.3990327715873718e-05, -1.1133961379528046e-05, -8.277595043182373e-06, -5.4212287068367004e-06, -2.564862370491028e-06, 2.915039658546448e-07, 3.1478703022003174e-06, 6.00423663854599e-06, 8.860602974891663e-06, 1.1716969311237335e-05, 1.4573335647583008e-05, 1.742970198392868e-05, 2.0286068320274353e-05, 2.3142434656620026e-05, 2.5998800992965698e-05, 2.885516732931137e-05, 3.1711533665657043e-05, 3.4567900002002716e-05, 3.742426633834839e-05, 4.028063267469406e-05, 4.3136999011039734e-05, 4.5993365347385406e-05, 4.884973168373108e-05, 5.170609802007675e-05, 5.4562464356422424e-05, 5.74188306927681e-05, 6.027519702911377e-05, 6.313156336545944e-05, 6.598792970180511e-05, 6.884429603815079e-05, 7.170066237449646e-05, 7.455702871084213e-05, 7.74133950471878e-05, 8.026976138353348e-05, 8.312612771987915e-05, 8.598249405622482e-05, 8.88388603925705e-05, 9.169522672891617e-05, 9.455159306526184e-05, 9.740795940160751e-05, 0.00010026432573795319, 0.00010312069207429886, 0.00010597705841064453]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 11.0, 26.0, 35.0, 48.0, 68.0, 87.0, 127.0, 182.0, 265.0, 441.0, 590.0, 892.0, 1335.0, 1957.0, 3013.0, 4679.0, 7401.0, 11880.0, 19055.0, 31177.0, 52951.0, 87158.0, 135755.0, 180966.0, 175507.0, 127328.0, 80007.0, 48168.0, 29041.0, 17773.0, 10719.0, 6951.0, 4397.0, 2864.0, 1853.0, 1185.0, 869.0, 554.0, 448.0, 251.0, 192.0, 105.0, 64.0, 55.0, 41.0, 33.0, 26.0, 14.0, 5.0, 8.0, 1.0, 3.0], "bins": [-1.2646484375, -1.2294387817382812, -1.1942291259765625, -1.1590194702148438, -1.123809814453125, -1.0886001586914062, -1.0533905029296875, -1.0181808471679688, -0.98297119140625, -0.9477615356445312, -0.9125518798828125, -0.8773422241210938, -0.842132568359375, -0.8069229125976562, -0.7717132568359375, -0.7365036010742188, -0.7012939453125, -0.6660842895507812, -0.6308746337890625, -0.5956649780273438, -0.560455322265625, -0.5252456665039062, -0.4900360107421875, -0.45482635498046875, -0.41961669921875, -0.38440704345703125, -0.3491973876953125, -0.31398773193359375, -0.278778076171875, -0.24356842041015625, -0.2083587646484375, -0.17314910888671875, -0.137939453125, -0.10272979736328125, -0.0675201416015625, -0.03231048583984375, 0.002899169921875, 0.03810882568359375, 0.0733184814453125, 0.10852813720703125, 0.14373779296875, 0.17894744873046875, 0.2141571044921875, 0.24936676025390625, 0.284576416015625, 0.31978607177734375, 0.3549957275390625, 0.39020538330078125, 0.4254150390625, 0.46062469482421875, 0.4958343505859375, 0.5310440063476562, 0.566253662109375, 0.6014633178710938, 0.6366729736328125, 0.6718826293945312, 0.70709228515625, 0.7423019409179688, 0.7775115966796875, 0.8127212524414062, 0.847930908203125, 0.8831405639648438, 0.9183502197265625, 0.9535598754882812, 0.98876953125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 7.0, 8.0, 11.0, 18.0, 24.0, 12.0, 25.0, 28.0, 47.0, 46.0, 40.0, 62.0, 57.0, 59.0, 73.0, 65.0, 50.0, 43.0, 50.0, 33.0, 47.0, 38.0, 38.0, 24.0, 23.0, 13.0, 12.0, 11.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453857421875, -0.4390678405761719, -0.42427825927734375, -0.4094886779785156, -0.3946990966796875, -0.3799095153808594, -0.36511993408203125, -0.3503303527832031, -0.335540771484375, -0.3207511901855469, -0.30596160888671875, -0.2911720275878906, -0.2763824462890625, -0.2615928649902344, -0.24680328369140625, -0.23201370239257812, -0.21722412109375, -0.20243453979492188, -0.18764495849609375, -0.17285537719726562, -0.1580657958984375, -0.14327621459960938, -0.12848663330078125, -0.11369705200195312, -0.098907470703125, -0.08411788940429688, -0.06932830810546875, -0.054538726806640625, -0.0397491455078125, -0.024959564208984375, -0.01016998291015625, 0.004619598388671875, 0.0194091796875, 0.034198760986328125, 0.04898834228515625, 0.06377792358398438, 0.0785675048828125, 0.09335708618164062, 0.10814666748046875, 0.12293624877929688, 0.137725830078125, 0.15251541137695312, 0.16730499267578125, 0.18209457397460938, 0.1968841552734375, 0.21167373657226562, 0.22646331787109375, 0.24125289916992188, 0.25604248046875, 0.2708320617675781, 0.28562164306640625, 0.3004112243652344, 0.3152008056640625, 0.3299903869628906, 0.34477996826171875, 0.3595695495605469, 0.374359130859375, 0.3891487121582031, 0.40393829345703125, 0.4187278747558594, 0.4335174560546875, 0.4483070373535156, 0.46309661865234375, 0.4778861999511719, 0.49267578125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 1.0, 4.0, 6.0, 8.0, 10.0, 15.0, 17.0, 37.0, 44.0, 46.0, 64.0, 85.0, 77.0, 100.0, 113.0, 87.0, 59.0, 51.0, 39.0, 31.0, 21.0, 14.0, 14.0, 8.0, 7.0, 5.0, 8.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.886992454528809, -11.485967636108398, -11.084942817687988, -10.683918952941895, -10.282894134521484, -9.881869316101074, -9.480844497680664, -9.07982063293457, -8.67879581451416, -8.27777099609375, -7.876746654510498, -7.475721836090088, -7.074697494506836, -6.673672676086426, -6.272647857666016, -5.871623516082764, -5.4705986976623535, -5.069573879241943, -4.668549537658691, -4.267524719238281, -3.8665003776550293, -3.465475559234619, -3.064450979232788, -2.663426399230957, -2.262401819229126, -1.861377239227295, -1.4603526592254639, -1.0593279600143433, -0.6583033800125122, -0.2572786808013916, 0.14374589920043945, 0.5447704792022705, 0.9457950592041016, 1.3468196392059326, 1.7478442192077637, 2.148869037628174, 2.549893379211426, 2.950918197631836, 3.351942777633667, 3.752967357635498, 4.15399169921875, 4.55501651763916, 4.956040859222412, 5.357065677642822, 5.758090019226074, 6.159114837646484, 6.5601396560668945, 6.9611639976501465, 7.362188816070557, 7.763213634490967, 8.164237976074219, 8.565262794494629, 8.966287612915039, 9.367311477661133, 9.768336296081543, 10.169361114501953, 10.570385932922363, 10.971410751342773, 11.372435569763184, 11.773459434509277, 12.174484252929688, 12.575509071350098, 12.976533889770508, 13.377557754516602, 13.778582572937012]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 11.0, 10.0, 14.0, 18.0, 17.0, 27.0, 19.0, 31.0, 24.0, 32.0, 43.0, 42.0, 41.0, 43.0, 43.0, 50.0, 41.0, 50.0, 38.0, 42.0, 52.0, 42.0, 34.0, 41.0, 27.0, 21.0, 19.0, 18.0, 16.0, 11.0, 12.0, 16.0, 7.0, 10.0, 8.0, 5.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.692758083343506, -6.487729072570801, -6.282700061798096, -6.077670574188232, -5.872641563415527, -5.667612552642822, -5.462583541870117, -5.257554054260254, -5.052525043487549, -4.847496032714844, -4.642467021942139, -4.437437534332275, -4.23240852355957, -4.027379512786865, -3.82235050201416, -3.617321252822876, -3.412292242050171, -3.207263231277466, -3.0022339820861816, -2.7972049713134766, -2.5921757221221924, -2.3871467113494873, -2.182117462158203, -1.977088451385498, -1.7720593214035034, -1.5670301914215088, -1.3620010614395142, -1.1569719314575195, -0.9519428610801697, -0.7469137907028198, -0.5418846607208252, -0.33685553073883057, -0.13182640075683594, 0.0732027143239975, 0.27823182940483093, 0.4832609295845032, 0.6882900595664978, 0.8933191299438477, 1.0983482599258423, 1.303377389907837, 1.5084065198898315, 1.7134356498718262, 1.9184647798538208, 2.1234939098358154, 2.3285229206085205, 2.5335521697998047, 2.7385811805725098, 2.943610191345215, 3.148639440536499, 3.353668451309204, 3.5586977005004883, 3.7637267112731934, 3.9687559604644775, 4.173785209655762, 4.378814220428467, 4.583843231201172, 4.788872241973877, 4.993901252746582, 5.198930263519287, 5.40395975112915, 5.6089887619018555, 5.8140177726745605, 6.019046783447266, 6.224076271057129, 6.429105281829834]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 3.0, 11.0, 22.0, 28.0, 45.0, 58.0, 102.0, 193.0, 276.0, 492.0, 775.0, 1511.0, 2792.0, 5228.0, 9924.0, 20563.0, 45467.0, 105193.0, 217887.0, 283480.0, 191770.0, 88065.0, 38146.0, 17687.0, 8662.0, 4503.0, 2431.0, 1317.0, 787.0, 428.0, 295.0, 133.0, 99.0, 60.0, 39.0, 28.0, 20.0, 10.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.0711669921875, -8.751708984375, -8.4322509765625, -8.11279296875, -7.7933349609375, -7.473876953125, -7.1544189453125, -6.8349609375, -6.5155029296875, -6.196044921875, -5.8765869140625, -5.55712890625, -5.2376708984375, -4.918212890625, -4.5987548828125, -4.279296875, -3.9598388671875, -3.640380859375, -3.3209228515625, -3.00146484375, -2.6820068359375, -2.362548828125, -2.0430908203125, -1.7236328125, -1.4041748046875, -1.084716796875, -0.7652587890625, -0.44580078125, -0.1263427734375, 0.193115234375, 0.5125732421875, 0.83203125, 1.1514892578125, 1.470947265625, 1.7904052734375, 2.10986328125, 2.4293212890625, 2.748779296875, 3.0682373046875, 3.3876953125, 3.7071533203125, 4.026611328125, 4.3460693359375, 4.66552734375, 4.9849853515625, 5.304443359375, 5.6239013671875, 5.943359375, 6.2628173828125, 6.582275390625, 6.9017333984375, 7.22119140625, 7.5406494140625, 7.860107421875, 8.1795654296875, 8.4990234375, 8.8184814453125, 9.137939453125, 9.4573974609375, 9.77685546875, 10.0963134765625, 10.415771484375, 10.7352294921875, 11.0546875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 5.0, 12.0, 11.0, 15.0, 14.0, 24.0, 16.0, 24.0, 29.0, 36.0, 46.0, 31.0, 41.0, 51.0, 42.0, 50.0, 51.0, 40.0, 48.0, 43.0, 39.0, 49.0, 48.0, 34.0, 37.0, 21.0, 25.0, 10.0, 19.0, 11.0, 14.0, 15.0, 14.0, 3.0, 9.0, 1.0, 2.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.390625, -7.1602783203125, -6.929931640625, -6.6995849609375, -6.46923828125, -6.2388916015625, -6.008544921875, -5.7781982421875, -5.5478515625, -5.3175048828125, -5.087158203125, -4.8568115234375, -4.62646484375, -4.3961181640625, -4.165771484375, -3.9354248046875, -3.705078125, -3.4747314453125, -3.244384765625, -3.0140380859375, -2.78369140625, -2.5533447265625, -2.322998046875, -2.0926513671875, -1.8623046875, -1.6319580078125, -1.401611328125, -1.1712646484375, -0.94091796875, -0.7105712890625, -0.480224609375, -0.2498779296875, -0.01953125, 0.2108154296875, 0.441162109375, 0.6715087890625, 0.90185546875, 1.1322021484375, 1.362548828125, 1.5928955078125, 1.8232421875, 2.0535888671875, 2.283935546875, 2.5142822265625, 2.74462890625, 2.9749755859375, 3.205322265625, 3.4356689453125, 3.666015625, 3.8963623046875, 4.126708984375, 4.3570556640625, 4.58740234375, 4.8177490234375, 5.048095703125, 5.2784423828125, 5.5087890625, 5.7391357421875, 5.969482421875, 6.1998291015625, 6.43017578125, 6.6605224609375, 6.890869140625, 7.1212158203125, 7.3515625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 8.0, 7.0, 15.0, 31.0, 38.0, 39.0, 74.0, 90.0, 118.0, 205.0, 309.0, 420.0, 628.0, 902.0, 1330.0, 1947.0, 2933.0, 4206.0, 6453.0, 9537.0, 15009.0, 23234.0, 36270.0, 56728.0, 86297.0, 120430.0, 148615.0, 149512.0, 125178.0, 89698.0, 59289.0, 38030.0, 24302.0, 15595.0, 10252.0, 6726.0, 4573.0, 3071.0, 2056.0, 1356.0, 992.0, 651.0, 457.0, 301.0, 215.0, 131.0, 82.0, 62.0, 49.0, 40.0, 23.0, 17.0, 11.0, 8.0, 3.0, 1.0, 3.0, 2.0], "bins": [-5.87109375, -5.6934814453125, -5.515869140625, -5.3382568359375, -5.16064453125, -4.9830322265625, -4.805419921875, -4.6278076171875, -4.4501953125, -4.2725830078125, -4.094970703125, -3.9173583984375, -3.73974609375, -3.5621337890625, -3.384521484375, -3.2069091796875, -3.029296875, -2.8516845703125, -2.674072265625, -2.4964599609375, -2.31884765625, -2.1412353515625, -1.963623046875, -1.7860107421875, -1.6083984375, -1.4307861328125, -1.253173828125, -1.0755615234375, -0.89794921875, -0.7203369140625, -0.542724609375, -0.3651123046875, -0.1875, -0.0098876953125, 0.167724609375, 0.3453369140625, 0.52294921875, 0.7005615234375, 0.878173828125, 1.0557861328125, 1.2333984375, 1.4110107421875, 1.588623046875, 1.7662353515625, 1.94384765625, 2.1214599609375, 2.299072265625, 2.4766845703125, 2.654296875, 2.8319091796875, 3.009521484375, 3.1871337890625, 3.36474609375, 3.5423583984375, 3.719970703125, 3.8975830078125, 4.0751953125, 4.2528076171875, 4.430419921875, 4.6080322265625, 4.78564453125, 4.9632568359375, 5.140869140625, 5.3184814453125, 5.49609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 2.0, 5.0, 1.0, 7.0, 6.0, 9.0, 15.0, 14.0, 15.0, 20.0, 14.0, 34.0, 26.0, 20.0, 36.0, 36.0, 33.0, 26.0, 32.0, 39.0, 38.0, 47.0, 33.0, 34.0, 32.0, 31.0, 43.0, 28.0, 34.0, 42.0, 39.0, 26.0, 26.0, 27.0, 15.0, 20.0, 14.0, 17.0, 8.0, 11.0, 13.0, 12.0, 3.0, 8.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.447265625, -3.33770751953125, -3.2281494140625, -3.11859130859375, -3.009033203125, -2.89947509765625, -2.7899169921875, -2.68035888671875, -2.57080078125, -2.46124267578125, -2.3516845703125, -2.24212646484375, -2.132568359375, -2.02301025390625, -1.9134521484375, -1.80389404296875, -1.6943359375, -1.58477783203125, -1.4752197265625, -1.36566162109375, -1.256103515625, -1.14654541015625, -1.0369873046875, -0.92742919921875, -0.81787109375, -0.70831298828125, -0.5987548828125, -0.48919677734375, -0.379638671875, -0.27008056640625, -0.1605224609375, -0.05096435546875, 0.05859375, 0.16815185546875, 0.2777099609375, 0.38726806640625, 0.496826171875, 0.60638427734375, 0.7159423828125, 0.82550048828125, 0.93505859375, 1.04461669921875, 1.1541748046875, 1.26373291015625, 1.373291015625, 1.48284912109375, 1.5924072265625, 1.70196533203125, 1.8115234375, 1.92108154296875, 2.0306396484375, 2.14019775390625, 2.249755859375, 2.35931396484375, 2.4688720703125, 2.57843017578125, 2.68798828125, 2.79754638671875, 2.9071044921875, 3.01666259765625, 3.126220703125, 3.23577880859375, 3.3453369140625, 3.45489501953125, 3.564453125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 4.0, 14.0, 21.0, 25.0, 32.0, 46.0, 51.0, 86.0, 135.0, 182.0, 272.0, 368.0, 561.0, 909.0, 1501.0, 2530.0, 4871.0, 9877.0, 24879.0, 74628.0, 240596.0, 402327.0, 188422.0, 57827.0, 19786.0, 8440.0, 4070.0, 2247.0, 1283.0, 821.0, 555.0, 360.0, 250.0, 164.0, 109.0, 77.0, 62.0, 38.0, 33.0, 24.0, 14.0, 10.0, 16.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0], "bins": [-8.8515625, -8.6014404296875, -8.351318359375, -8.1011962890625, -7.85107421875, -7.6009521484375, -7.350830078125, -7.1007080078125, -6.8505859375, -6.6004638671875, -6.350341796875, -6.1002197265625, -5.85009765625, -5.5999755859375, -5.349853515625, -5.0997314453125, -4.849609375, -4.5994873046875, -4.349365234375, -4.0992431640625, -3.84912109375, -3.5989990234375, -3.348876953125, -3.0987548828125, -2.8486328125, -2.5985107421875, -2.348388671875, -2.0982666015625, -1.84814453125, -1.5980224609375, -1.347900390625, -1.0977783203125, -0.84765625, -0.5975341796875, -0.347412109375, -0.0972900390625, 0.15283203125, 0.4029541015625, 0.653076171875, 0.9031982421875, 1.1533203125, 1.4034423828125, 1.653564453125, 1.9036865234375, 2.15380859375, 2.4039306640625, 2.654052734375, 2.9041748046875, 3.154296875, 3.4044189453125, 3.654541015625, 3.9046630859375, 4.15478515625, 4.4049072265625, 4.655029296875, 4.9051513671875, 5.1552734375, 5.4053955078125, 5.655517578125, 5.9056396484375, 6.15576171875, 6.4058837890625, 6.656005859375, 6.9061279296875, 7.15625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 11.0, 23.0, 33.0, 33.0, 57.0, 83.0, 113.0, 115.0, 133.0, 112.0, 75.0, 66.0, 46.0, 29.0, 16.0, 8.0, 7.0, 5.0, 8.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0008387565612792969, -0.0008166208863258362, -0.0007944852113723755, -0.0007723495364189148, -0.0007502138614654541, -0.0007280781865119934, -0.0007059425115585327, -0.000683806836605072, -0.0006616711616516113, -0.0006395354866981506, -0.0006173998117446899, -0.0005952641367912292, -0.0005731284618377686, -0.0005509927868843079, -0.0005288571119308472, -0.0005067214369773865, -0.0004845857620239258, -0.0004624500870704651, -0.0004403144121170044, -0.0004181787371635437, -0.000396043062210083, -0.0003739073872566223, -0.0003517717123031616, -0.00032963603734970093, -0.00030750036239624023, -0.00028536468744277954, -0.00026322901248931885, -0.00024109333753585815, -0.00021895766258239746, -0.00019682198762893677, -0.00017468631267547607, -0.00015255063772201538, -0.0001304149627685547, -0.000108279287815094, -8.61436128616333e-05, -6.400793790817261e-05, -4.1872262954711914e-05, -1.973658800125122e-05, 2.3990869522094727e-06, 2.4534761905670166e-05, 4.667043685913086e-05, 6.880611181259155e-05, 9.094178676605225e-05, 0.00011307746171951294, 0.00013521313667297363, 0.00015734881162643433, 0.00017948448657989502, 0.0002016201615333557, 0.0002237558364868164, 0.0002458915114402771, 0.0002680271863937378, 0.0002901628613471985, 0.0003122985363006592, 0.0003344342112541199, 0.00035656988620758057, 0.00037870556116104126, 0.00040084123611450195, 0.00042297691106796265, 0.00044511258602142334, 0.00046724826097488403, 0.0004893839359283447, 0.0005115196108818054, 0.0005336552858352661, 0.0005557909607887268, 0.0005779266357421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 3.0, 7.0, 14.0, 12.0, 17.0, 18.0, 28.0, 50.0, 51.0, 65.0, 97.0, 113.0, 159.0, 239.0, 354.0, 548.0, 868.0, 1398.0, 2335.0, 4552.0, 9224.0, 20685.0, 49610.0, 125809.0, 266374.0, 295385.0, 158301.0, 62888.0, 25484.0, 11189.0, 5344.0, 2824.0, 1587.0, 958.0, 621.0, 380.0, 272.0, 193.0, 129.0, 87.0, 70.0, 45.0, 32.0, 32.0, 20.0, 19.0, 20.0, 17.0, 8.0, 3.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.3671875, -5.19476318359375, -5.0223388671875, -4.84991455078125, -4.677490234375, -4.50506591796875, -4.3326416015625, -4.16021728515625, -3.98779296875, -3.81536865234375, -3.6429443359375, -3.47052001953125, -3.298095703125, -3.12567138671875, -2.9532470703125, -2.78082275390625, -2.6083984375, -2.43597412109375, -2.2635498046875, -2.09112548828125, -1.918701171875, -1.74627685546875, -1.5738525390625, -1.40142822265625, -1.22900390625, -1.05657958984375, -0.8841552734375, -0.71173095703125, -0.539306640625, -0.36688232421875, -0.1944580078125, -0.02203369140625, 0.150390625, 0.32281494140625, 0.4952392578125, 0.66766357421875, 0.840087890625, 1.01251220703125, 1.1849365234375, 1.35736083984375, 1.52978515625, 1.70220947265625, 1.8746337890625, 2.04705810546875, 2.219482421875, 2.39190673828125, 2.5643310546875, 2.73675537109375, 2.9091796875, 3.08160400390625, 3.2540283203125, 3.42645263671875, 3.598876953125, 3.77130126953125, 3.9437255859375, 4.11614990234375, 4.28857421875, 4.46099853515625, 4.6334228515625, 4.80584716796875, 4.978271484375, 5.15069580078125, 5.3231201171875, 5.49554443359375, 5.66796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 10.0, 9.0, 10.0, 14.0, 23.0, 27.0, 29.0, 33.0, 46.0, 49.0, 57.0, 51.0, 50.0, 60.0, 53.0, 62.0, 66.0, 47.0, 33.0, 52.0, 45.0, 23.0, 21.0, 28.0, 13.0, 19.0, 10.0, 16.0, 6.0, 7.0, 5.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0251388549804688, -0.9955902099609375, -0.9660415649414062, -0.936492919921875, -0.9069442749023438, -0.8773956298828125, -0.8478469848632812, -0.81829833984375, -0.7887496948242188, -0.7592010498046875, -0.7296524047851562, -0.700103759765625, -0.6705551147460938, -0.6410064697265625, -0.6114578247070312, -0.5819091796875, -0.5523605346679688, -0.5228118896484375, -0.49326324462890625, -0.463714599609375, -0.43416595458984375, -0.4046173095703125, -0.37506866455078125, -0.34552001953125, -0.31597137451171875, -0.2864227294921875, -0.25687408447265625, -0.227325439453125, -0.19777679443359375, -0.1682281494140625, -0.13867950439453125, -0.109130859375, -0.07958221435546875, -0.0500335693359375, -0.02048492431640625, 0.009063720703125, 0.03861236572265625, 0.0681610107421875, 0.09770965576171875, 0.12725830078125, 0.15680694580078125, 0.1863555908203125, 0.21590423583984375, 0.245452880859375, 0.27500152587890625, 0.3045501708984375, 0.33409881591796875, 0.3636474609375, 0.39319610595703125, 0.4227447509765625, 0.45229339599609375, 0.481842041015625, 0.5113906860351562, 0.5409393310546875, 0.5704879760742188, 0.60003662109375, 0.6295852661132812, 0.6591339111328125, 0.6886825561523438, 0.718231201171875, 0.7477798461914062, 0.7773284912109375, 0.8068771362304688, 0.83642578125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 7.0, 6.0, 10.0, 7.0, 15.0, 17.0, 20.0, 31.0, 34.0, 40.0, 49.0, 52.0, 67.0, 76.0, 78.0, 91.0, 83.0, 68.0, 59.0, 47.0, 29.0, 21.0, 15.0, 18.0, 7.0, 11.0, 9.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.766605377197266, -12.398869514465332, -12.031133651733398, -11.663397789001465, -11.295661926269531, -10.927926063537598, -10.560190200805664, -10.192453384399414, -9.824718475341797, -9.456982612609863, -9.08924674987793, -8.721510887145996, -8.353775024414062, -7.986039161682129, -7.618302822113037, -7.2505669593811035, -6.882830619812012, -6.515094757080078, -6.1473588943481445, -5.779623031616211, -5.411887168884277, -5.044151306152344, -4.676414966583252, -4.308679103851318, -3.9409432411193848, -3.573207378387451, -3.2054715156555176, -2.837735414505005, -2.4699995517730713, -2.1022636890411377, -1.734527587890625, -1.3667917251586914, -0.9990549087524414, -0.631318986415863, -0.26358306407928467, 0.10415291786193848, 0.47188878059387207, 0.8396246433258057, 1.2073607444763184, 1.575096607208252, 1.9428324699401855, 2.310568332672119, 2.6783041954040527, 3.0460402965545654, 3.413776159286499, 3.7815120220184326, 4.149248123168945, 4.516983985900879, 4.8847198486328125, 5.252455711364746, 5.62019157409668, 5.987927436828613, 6.355663299560547, 6.7233991622924805, 7.091135501861572, 7.458871364593506, 7.8266072273254395, 8.194343566894531, 8.562079429626465, 8.929815292358398, 9.297551155090332, 9.665287017822266, 10.0330228805542, 10.400758743286133, 10.768494606018066]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 14.0, 10.0, 18.0, 14.0, 22.0, 16.0, 19.0, 31.0, 25.0, 37.0, 38.0, 28.0, 39.0, 41.0, 41.0, 48.0, 41.0, 53.0, 40.0, 48.0, 48.0, 42.0, 37.0, 40.0, 24.0, 21.0, 25.0, 27.0, 17.0, 16.0, 16.0, 11.0, 9.0, 13.0, 5.0, 7.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.657054424285889, -6.4504265785217285, -6.24379825592041, -6.03717041015625, -5.83054256439209, -5.6239142417907715, -5.417286396026611, -5.210658073425293, -5.004030227661133, -4.797402381896973, -4.590774059295654, -4.384146213531494, -4.177517890930176, -3.9708900451660156, -3.7642621994018555, -3.557634115219116, -3.351006031036377, -3.1443779468536377, -2.9377498626708984, -2.7311220169067383, -2.524493932723999, -2.3178658485412598, -2.1112380027770996, -1.9046099185943604, -1.697981834411621, -1.4913537502288818, -1.2847257852554321, -1.0780978202819824, -0.8714697360992432, -0.6648416519165039, -0.4582136869430542, -0.2515857219696045, -0.044957637786865234, 0.16167038679122925, 0.36829841136932373, 0.5749264359474182, 0.7815544605255127, 0.988182544708252, 1.1948105096817017, 1.4014384746551514, 1.6080665588378906, 1.8146946430206299, 2.021322727203369, 2.2279505729675293, 2.4345786571502686, 2.641206741333008, 2.847834587097168, 3.0544626712799072, 3.2610907554626465, 3.4677188396453857, 3.674346923828125, 3.880974769592285, 4.087602615356445, 4.294230937957764, 4.500858783721924, 4.707487106323242, 4.914114952087402, 5.1207427978515625, 5.327371120452881, 5.533998966217041, 5.740627288818359, 5.9472551345825195, 6.15388298034668, 6.36051082611084, 6.567139148712158]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 3.0, 13.0, 17.0, 23.0, 32.0, 46.0, 64.0, 96.0, 127.0, 166.0, 297.0, 428.0, 639.0, 931.0, 1464.0, 2358.0, 3799.0, 6331.0, 11409.0, 23234.0, 56169.0, 181894.0, 755632.0, 1896832.0, 923910.0, 210503.0, 61378.0, 24878.0, 12418.0, 7052.0, 4243.0, 2607.0, 1719.0, 1182.0, 729.0, 541.0, 372.0, 238.0, 161.0, 92.0, 75.0, 47.0, 44.0, 29.0, 12.0, 13.0, 12.0, 5.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-14.140625, -13.662353515625, -13.18408203125, -12.705810546875, -12.2275390625, -11.749267578125, -11.27099609375, -10.792724609375, -10.314453125, -9.836181640625, -9.35791015625, -8.879638671875, -8.4013671875, -7.923095703125, -7.44482421875, -6.966552734375, -6.48828125, -6.010009765625, -5.53173828125, -5.053466796875, -4.5751953125, -4.096923828125, -3.61865234375, -3.140380859375, -2.662109375, -2.183837890625, -1.70556640625, -1.227294921875, -0.7490234375, -0.270751953125, 0.20751953125, 0.685791015625, 1.1640625, 1.642333984375, 2.12060546875, 2.598876953125, 3.0771484375, 3.555419921875, 4.03369140625, 4.511962890625, 4.990234375, 5.468505859375, 5.94677734375, 6.425048828125, 6.9033203125, 7.381591796875, 7.85986328125, 8.338134765625, 8.81640625, 9.294677734375, 9.77294921875, 10.251220703125, 10.7294921875, 11.207763671875, 11.68603515625, 12.164306640625, 12.642578125, 13.120849609375, 13.59912109375, 14.077392578125, 14.5556640625, 15.033935546875, 15.51220703125, 15.990478515625, 16.46875]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 5.0, 9.0, 7.0, 15.0, 18.0, 12.0, 16.0, 22.0, 30.0, 29.0, 26.0, 24.0, 34.0, 43.0, 44.0, 55.0, 51.0, 47.0, 42.0, 46.0, 47.0, 39.0, 38.0, 49.0, 34.0, 32.0, 24.0, 31.0, 25.0, 15.0, 27.0, 15.0, 13.0, 6.0, 7.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90625, -4.73455810546875, -4.5628662109375, -4.39117431640625, -4.219482421875, -4.04779052734375, -3.8760986328125, -3.70440673828125, -3.53271484375, -3.36102294921875, -3.1893310546875, -3.01763916015625, -2.845947265625, -2.67425537109375, -2.5025634765625, -2.33087158203125, -2.1591796875, -1.98748779296875, -1.8157958984375, -1.64410400390625, -1.472412109375, -1.30072021484375, -1.1290283203125, -0.95733642578125, -0.78564453125, -0.61395263671875, -0.4422607421875, -0.27056884765625, -0.098876953125, 0.07281494140625, 0.2445068359375, 0.41619873046875, 0.587890625, 0.75958251953125, 0.9312744140625, 1.10296630859375, 1.274658203125, 1.44635009765625, 1.6180419921875, 1.78973388671875, 1.96142578125, 2.13311767578125, 2.3048095703125, 2.47650146484375, 2.648193359375, 2.81988525390625, 2.9915771484375, 3.16326904296875, 3.3349609375, 3.50665283203125, 3.6783447265625, 3.85003662109375, 4.021728515625, 4.19342041015625, 4.3651123046875, 4.53680419921875, 4.70849609375, 4.88018798828125, 5.0518798828125, 5.22357177734375, 5.395263671875, 5.56695556640625, 5.7386474609375, 5.91033935546875, 6.08203125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 8.0, 14.0, 23.0, 28.0, 50.0, 56.0, 81.0, 106.0, 185.0, 235.0, 391.0, 509.0, 909.0, 1401.0, 2145.0, 3558.0, 5896.0, 10092.0, 17860.0, 35015.0, 74872.0, 188767.0, 558661.0, 1423087.0, 1185673.0, 413764.0, 144223.0, 60083.0, 29089.0, 15166.0, 8616.0, 5185.0, 3044.0, 1881.0, 1229.0, 817.0, 463.0, 344.0, 245.0, 146.0, 94.0, 82.0, 48.0, 48.0, 22.0, 18.0, 17.0, 8.0, 11.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.8509521484375, -12.420654296875, -11.9903564453125, -11.56005859375, -11.1297607421875, -10.699462890625, -10.2691650390625, -9.8388671875, -9.4085693359375, -8.978271484375, -8.5479736328125, -8.11767578125, -7.6873779296875, -7.257080078125, -6.8267822265625, -6.396484375, -5.9661865234375, -5.535888671875, -5.1055908203125, -4.67529296875, -4.2449951171875, -3.814697265625, -3.3843994140625, -2.9541015625, -2.5238037109375, -2.093505859375, -1.6632080078125, -1.23291015625, -0.8026123046875, -0.372314453125, 0.0579833984375, 0.48828125, 0.9185791015625, 1.348876953125, 1.7791748046875, 2.20947265625, 2.6397705078125, 3.070068359375, 3.5003662109375, 3.9306640625, 4.3609619140625, 4.791259765625, 5.2215576171875, 5.65185546875, 6.0821533203125, 6.512451171875, 6.9427490234375, 7.373046875, 7.8033447265625, 8.233642578125, 8.6639404296875, 9.09423828125, 9.5245361328125, 9.954833984375, 10.3851318359375, 10.8154296875, 11.2457275390625, 11.676025390625, 12.1063232421875, 12.53662109375, 12.9669189453125, 13.397216796875, 13.8275146484375, 14.2578125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 9.0, 9.0, 13.0, 12.0, 22.0, 29.0, 41.0, 54.0, 75.0, 116.0, 119.0, 142.0, 215.0, 273.0, 302.0, 398.0, 370.0, 390.0, 323.0, 264.0, 218.0, 151.0, 117.0, 104.0, 77.0, 38.0, 45.0, 28.0, 24.0, 25.0, 11.0, 8.0, 9.0, 12.0, 9.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.220703125, -3.10845947265625, -2.9962158203125, -2.88397216796875, -2.771728515625, -2.65948486328125, -2.5472412109375, -2.43499755859375, -2.32275390625, -2.21051025390625, -2.0982666015625, -1.98602294921875, -1.873779296875, -1.76153564453125, -1.6492919921875, -1.53704833984375, -1.4248046875, -1.31256103515625, -1.2003173828125, -1.08807373046875, -0.975830078125, -0.86358642578125, -0.7513427734375, -0.63909912109375, -0.52685546875, -0.41461181640625, -0.3023681640625, -0.19012451171875, -0.077880859375, 0.03436279296875, 0.1466064453125, 0.25885009765625, 0.37109375, 0.48333740234375, 0.5955810546875, 0.70782470703125, 0.820068359375, 0.93231201171875, 1.0445556640625, 1.15679931640625, 1.26904296875, 1.38128662109375, 1.4935302734375, 1.60577392578125, 1.718017578125, 1.83026123046875, 1.9425048828125, 2.05474853515625, 2.1669921875, 2.27923583984375, 2.3914794921875, 2.50372314453125, 2.615966796875, 2.72821044921875, 2.8404541015625, 2.95269775390625, 3.06494140625, 3.17718505859375, 3.2894287109375, 3.40167236328125, 3.513916015625, 3.62615966796875, 3.7384033203125, 3.85064697265625, 3.962890625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 0.0, 5.0, 3.0, 8.0, 8.0, 13.0, 13.0, 16.0, 12.0, 20.0, 25.0, 28.0, 29.0, 37.0, 71.0, 66.0, 59.0, 90.0, 79.0, 64.0, 78.0, 50.0, 43.0, 47.0, 29.0, 20.0, 20.0, 8.0, 9.0, 15.0, 6.0, 4.0, 4.0, 1.0, 0.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.491689682006836, -11.13202953338623, -10.772369384765625, -10.412710189819336, -10.05305004119873, -9.693389892578125, -9.333730697631836, -8.97407054901123, -8.614410400390625, -8.25475025177002, -7.895090579986572, -7.535430908203125, -7.1757707595825195, -6.816110610961914, -6.456450939178467, -6.0967912673950195, -5.737131118774414, -5.377470970153809, -5.017811298370361, -4.658151626586914, -4.298491477966309, -3.9388315677642822, -3.579171657562256, -3.2195117473602295, -2.859851837158203, -2.5001919269561768, -2.1405320167541504, -1.780872106552124, -1.4212121963500977, -1.0615522861480713, -0.7018923759460449, -0.34223246574401855, 0.01742839813232422, 0.3770883083343506, 0.736748218536377, 1.0964081287384033, 1.4560680389404297, 1.815727949142456, 2.1753878593444824, 2.535047769546509, 2.894707679748535, 3.2543675899505615, 3.614027500152588, 3.9736874103546143, 4.333347320556641, 4.693007469177246, 5.052667140960693, 5.412326812744141, 5.771986961364746, 6.131647109985352, 6.491306781768799, 6.850966453552246, 7.210626602172852, 7.570286750793457, 7.929946422576904, 8.289606094360352, 8.649266242980957, 9.008926391601562, 9.368585586547852, 9.728245735168457, 10.087905883789062, 10.447566032409668, 10.807226181030273, 11.166885375976562, 11.526545524597168]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 9.0, 7.0, 10.0, 13.0, 14.0, 21.0, 19.0, 23.0, 31.0, 27.0, 18.0, 34.0, 39.0, 48.0, 45.0, 36.0, 39.0, 51.0, 47.0, 49.0, 51.0, 42.0, 35.0, 40.0, 28.0, 29.0, 32.0, 16.0, 30.0, 17.0, 20.0, 18.0, 10.0, 13.0, 4.0, 9.0, 4.0, 6.0, 3.0, 1.0, 10.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.589496612548828, -6.378467559814453, -6.16743803024292, -5.956408977508545, -5.74537992477417, -5.534350395202637, -5.323321342468262, -5.112292289733887, -4.901263236999512, -4.690234184265137, -4.4792046546936035, -4.2681756019592285, -4.0571465492248535, -3.8461172580718994, -3.6350879669189453, -3.4240589141845703, -3.213029384613037, -3.002000093460083, -2.790971040725708, -2.579941749572754, -2.368912696838379, -2.157883405685425, -1.9468541145324707, -1.7358249425888062, -1.5247957706451416, -1.313766598701477, -1.1027374267578125, -0.8917081356048584, -0.6806789636611938, -0.4696497917175293, -0.2586205005645752, -0.047591328620910645, 0.1634373664855957, 0.37446656823158264, 0.5854957699775696, 0.7965250015258789, 1.0075541734695435, 1.218583345413208, 1.429612636566162, 1.6406418085098267, 1.8516709804534912, 2.0627002716064453, 2.2737293243408203, 2.4847586154937744, 2.6957879066467285, 2.9068169593811035, 3.1178462505340576, 3.3288755416870117, 3.5399045944213867, 3.750933885574341, 3.961962938308716, 4.17299222946167, 4.384021282196045, 4.595050811767578, 4.806079864501953, 5.017108917236328, 5.228137969970703, 5.439167022705078, 5.650196552276611, 5.861225605010986, 6.072254657745361, 6.2832841873168945, 6.4943132400512695, 6.7053422927856445, 6.916371822357178]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 7.0, 2.0, 10.0, 12.0, 17.0, 20.0, 30.0, 44.0, 61.0, 85.0, 126.0, 179.0, 296.0, 465.0, 792.0, 1357.0, 2295.0, 4328.0, 8437.0, 18189.0, 41483.0, 101676.0, 241635.0, 324343.0, 175003.0, 70466.0, 29286.0, 13451.0, 6469.0, 3385.0, 1862.0, 1014.0, 591.0, 381.0, 259.0, 158.0, 110.0, 63.0, 64.0, 29.0, 20.0, 20.0, 13.0, 5.0, 8.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.2783203125, -5.091796875, -4.9052734375, -4.71875, -4.5322265625, -4.345703125, -4.1591796875, -3.97265625, -3.7861328125, -3.599609375, -3.4130859375, -3.2265625, -3.0400390625, -2.853515625, -2.6669921875, -2.48046875, -2.2939453125, -2.107421875, -1.9208984375, -1.734375, -1.5478515625, -1.361328125, -1.1748046875, -0.98828125, -0.8017578125, -0.615234375, -0.4287109375, -0.2421875, -0.0556640625, 0.130859375, 0.3173828125, 0.50390625, 0.6904296875, 0.876953125, 1.0634765625, 1.25, 1.4365234375, 1.623046875, 1.8095703125, 1.99609375, 2.1826171875, 2.369140625, 2.5556640625, 2.7421875, 2.9287109375, 3.115234375, 3.3017578125, 3.48828125, 3.6748046875, 3.861328125, 4.0478515625, 4.234375, 4.4208984375, 4.607421875, 4.7939453125, 4.98046875, 5.1669921875, 5.353515625, 5.5400390625, 5.7265625, 5.9130859375, 6.099609375, 6.2861328125, 6.47265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 9.0, 9.0, 14.0, 17.0, 22.0, 27.0, 24.0, 28.0, 26.0, 32.0, 39.0, 30.0, 42.0, 41.0, 53.0, 43.0, 39.0, 64.0, 47.0, 47.0, 40.0, 38.0, 20.0, 39.0, 25.0, 25.0, 30.0, 20.0, 21.0, 19.0, 13.0, 13.0, 5.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.9296875, -7.6927490234375, -7.455810546875, -7.2188720703125, -6.98193359375, -6.7449951171875, -6.508056640625, -6.2711181640625, -6.0341796875, -5.7972412109375, -5.560302734375, -5.3233642578125, -5.08642578125, -4.8494873046875, -4.612548828125, -4.3756103515625, -4.138671875, -3.9017333984375, -3.664794921875, -3.4278564453125, -3.19091796875, -2.9539794921875, -2.717041015625, -2.4801025390625, -2.2431640625, -2.0062255859375, -1.769287109375, -1.5323486328125, -1.29541015625, -1.0584716796875, -0.821533203125, -0.5845947265625, -0.34765625, -0.1107177734375, 0.126220703125, 0.3631591796875, 0.60009765625, 0.8370361328125, 1.073974609375, 1.3109130859375, 1.5478515625, 1.7847900390625, 2.021728515625, 2.2586669921875, 2.49560546875, 2.7325439453125, 2.969482421875, 3.2064208984375, 3.443359375, 3.6802978515625, 3.917236328125, 4.1541748046875, 4.39111328125, 4.6280517578125, 4.864990234375, 5.1019287109375, 5.3388671875, 5.5758056640625, 5.812744140625, 6.0496826171875, 6.28662109375, 6.5235595703125, 6.760498046875, 6.9974365234375, 7.234375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 2.0, 8.0, 10.0, 10.0, 21.0, 31.0, 37.0, 51.0, 80.0, 88.0, 142.0, 181.0, 309.0, 461.0, 635.0, 1119.0, 1884.0, 3577.0, 7527.0, 18517.0, 53972.0, 177150.0, 411685.0, 249450.0, 76587.0, 24757.0, 9842.0, 4497.0, 2293.0, 1249.0, 778.0, 532.0, 297.0, 230.0, 152.0, 107.0, 75.0, 56.0, 34.0, 32.0, 27.0, 20.0, 9.0, 10.0, 6.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.58984375, -7.35003662109375, -7.1102294921875, -6.87042236328125, -6.630615234375, -6.39080810546875, -6.1510009765625, -5.91119384765625, -5.67138671875, -5.43157958984375, -5.1917724609375, -4.95196533203125, -4.712158203125, -4.47235107421875, -4.2325439453125, -3.99273681640625, -3.7529296875, -3.51312255859375, -3.2733154296875, -3.03350830078125, -2.793701171875, -2.55389404296875, -2.3140869140625, -2.07427978515625, -1.83447265625, -1.59466552734375, -1.3548583984375, -1.11505126953125, -0.875244140625, -0.63543701171875, -0.3956298828125, -0.15582275390625, 0.083984375, 0.32379150390625, 0.5635986328125, 0.80340576171875, 1.043212890625, 1.28302001953125, 1.5228271484375, 1.76263427734375, 2.00244140625, 2.24224853515625, 2.4820556640625, 2.72186279296875, 2.961669921875, 3.20147705078125, 3.4412841796875, 3.68109130859375, 3.9208984375, 4.16070556640625, 4.4005126953125, 4.64031982421875, 4.880126953125, 5.11993408203125, 5.3597412109375, 5.59954833984375, 5.83935546875, 6.07916259765625, 6.3189697265625, 6.55877685546875, 6.798583984375, 7.03839111328125, 7.2781982421875, 7.51800537109375, 7.7578125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 8.0, 10.0, 8.0, 20.0, 16.0, 13.0, 24.0, 21.0, 35.0, 35.0, 39.0, 44.0, 44.0, 48.0, 59.0, 62.0, 44.0, 48.0, 41.0, 40.0, 47.0, 53.0, 37.0, 37.0, 22.0, 27.0, 25.0, 16.0, 27.0, 9.0, 12.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.192138671875, -4.04443359375, -3.896728515625, -3.7490234375, -3.601318359375, -3.45361328125, -3.305908203125, -3.158203125, -3.010498046875, -2.86279296875, -2.715087890625, -2.5673828125, -2.419677734375, -2.27197265625, -2.124267578125, -1.9765625, -1.828857421875, -1.68115234375, -1.533447265625, -1.3857421875, -1.238037109375, -1.09033203125, -0.942626953125, -0.794921875, -0.647216796875, -0.49951171875, -0.351806640625, -0.2041015625, -0.056396484375, 0.09130859375, 0.239013671875, 0.38671875, 0.534423828125, 0.68212890625, 0.829833984375, 0.9775390625, 1.125244140625, 1.27294921875, 1.420654296875, 1.568359375, 1.716064453125, 1.86376953125, 2.011474609375, 2.1591796875, 2.306884765625, 2.45458984375, 2.602294921875, 2.75, 2.897705078125, 3.04541015625, 3.193115234375, 3.3408203125, 3.488525390625, 3.63623046875, 3.783935546875, 3.931640625, 4.079345703125, 4.22705078125, 4.374755859375, 4.5224609375, 4.670166015625, 4.81787109375, 4.965576171875, 5.11328125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 3.0, 11.0, 14.0, 13.0, 15.0, 21.0, 30.0, 28.0, 47.0, 67.0, 102.0, 121.0, 198.0, 259.0, 351.0, 511.0, 712.0, 979.0, 1570.0, 2345.0, 4195.0, 8351.0, 25072.0, 260932.0, 663862.0, 52918.0, 11748.0, 5229.0, 2948.0, 1837.0, 1191.0, 840.0, 564.0, 407.0, 297.0, 209.0, 133.0, 117.0, 86.0, 56.0, 47.0, 31.0, 16.0, 17.0, 10.0, 12.0, 11.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-8.625, -8.357177734375, -8.08935546875, -7.821533203125, -7.5537109375, -7.285888671875, -7.01806640625, -6.750244140625, -6.482421875, -6.214599609375, -5.94677734375, -5.678955078125, -5.4111328125, -5.143310546875, -4.87548828125, -4.607666015625, -4.33984375, -4.072021484375, -3.80419921875, -3.536376953125, -3.2685546875, -3.000732421875, -2.73291015625, -2.465087890625, -2.197265625, -1.929443359375, -1.66162109375, -1.393798828125, -1.1259765625, -0.858154296875, -0.59033203125, -0.322509765625, -0.0546875, 0.213134765625, 0.48095703125, 0.748779296875, 1.0166015625, 1.284423828125, 1.55224609375, 1.820068359375, 2.087890625, 2.355712890625, 2.62353515625, 2.891357421875, 3.1591796875, 3.427001953125, 3.69482421875, 3.962646484375, 4.23046875, 4.498291015625, 4.76611328125, 5.033935546875, 5.3017578125, 5.569580078125, 5.83740234375, 6.105224609375, 6.373046875, 6.640869140625, 6.90869140625, 7.176513671875, 7.4443359375, 7.712158203125, 7.97998046875, 8.247802734375, 8.515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 22.0, 189.0, 569.0, 151.0, 23.0, 10.0, 4.0, 0.0, 3.0, 6.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007205009460449219, -0.0006897374987602234, -0.0006589740514755249, -0.0006282106041908264, -0.0005974471569061279, -0.0005666837096214294, -0.000535920262336731, -0.0005051568150520325, -0.000474393367767334, -0.0004436299204826355, -0.000412866473197937, -0.0003821030259132385, -0.00035133957862854004, -0.00032057613134384155, -0.00028981268405914307, -0.0002590492367744446, -0.0002282857894897461, -0.0001975223422050476, -0.00016675889492034912, -0.00013599544763565063, -0.00010523200035095215, -7.446855306625366e-05, -4.3705105781555176e-05, -1.294165849685669e-05, 1.7821788787841797e-05, 4.858523607254028e-05, 7.934868335723877e-05, 0.00011011213064193726, 0.00014087557792663574, 0.00017163902521133423, 0.00020240247249603271, 0.0002331659197807312, 0.0002639293670654297, 0.0002946928143501282, 0.00032545626163482666, 0.00035621970891952515, 0.00038698315620422363, 0.0004177466034889221, 0.0004485100507736206, 0.0004792734980583191, 0.0005100369453430176, 0.0005408003926277161, 0.0005715638399124146, 0.000602327287197113, 0.0006330907344818115, 0.00066385418176651, 0.0006946176290512085, 0.000725381076335907, 0.0007561445236206055, 0.000786907970905304, 0.0008176714181900024, 0.0008484348654747009, 0.0008791983127593994, 0.0009099617600440979, 0.0009407252073287964, 0.0009714886546134949, 0.0010022521018981934, 0.0010330155491828918, 0.0010637789964675903, 0.0010945424437522888, 0.0011253058910369873, 0.0011560693383216858, 0.0011868327856063843, 0.0012175962328910828, 0.0012483596801757812]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 2.0, 9.0, 7.0, 14.0, 12.0, 40.0, 34.0, 55.0, 55.0, 112.0, 135.0, 184.0, 268.0, 408.0, 633.0, 845.0, 1339.0, 2150.0, 3346.0, 5266.0, 9995.0, 34310.0, 337643.0, 560556.0, 61174.0, 12865.0, 6181.0, 3824.0, 2372.0, 1527.0, 979.0, 676.0, 476.0, 317.0, 206.0, 156.0, 104.0, 72.0, 68.0, 43.0, 31.0, 27.0, 12.0, 13.0, 4.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0], "bins": [-8.125, -7.90020751953125, -7.6754150390625, -7.45062255859375, -7.225830078125, -7.00103759765625, -6.7762451171875, -6.55145263671875, -6.32666015625, -6.10186767578125, -5.8770751953125, -5.65228271484375, -5.427490234375, -5.20269775390625, -4.9779052734375, -4.75311279296875, -4.5283203125, -4.30352783203125, -4.0787353515625, -3.85394287109375, -3.629150390625, -3.40435791015625, -3.1795654296875, -2.95477294921875, -2.72998046875, -2.50518798828125, -2.2803955078125, -2.05560302734375, -1.830810546875, -1.60601806640625, -1.3812255859375, -1.15643310546875, -0.931640625, -0.70684814453125, -0.4820556640625, -0.25726318359375, -0.032470703125, 0.19232177734375, 0.4171142578125, 0.64190673828125, 0.86669921875, 1.09149169921875, 1.3162841796875, 1.54107666015625, 1.765869140625, 1.99066162109375, 2.2154541015625, 2.44024658203125, 2.6650390625, 2.88983154296875, 3.1146240234375, 3.33941650390625, 3.564208984375, 3.78900146484375, 4.0137939453125, 4.23858642578125, 4.46337890625, 4.68817138671875, 4.9129638671875, 5.13775634765625, 5.362548828125, 5.58734130859375, 5.8121337890625, 6.03692626953125, 6.26171875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 11.0, 11.0, 10.0, 24.0, 70.0, 103.0, 205.0, 239.0, 156.0, 84.0, 33.0, 15.0, 11.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.144195556640625, -2.07550048828125, -2.006805419921875, -1.9381103515625, -1.869415283203125, -1.80072021484375, -1.732025146484375, -1.663330078125, -1.594635009765625, -1.52593994140625, -1.457244873046875, -1.3885498046875, -1.319854736328125, -1.25115966796875, -1.182464599609375, -1.11376953125, -1.045074462890625, -0.97637939453125, -0.907684326171875, -0.8389892578125, -0.770294189453125, -0.70159912109375, -0.632904052734375, -0.564208984375, -0.495513916015625, -0.42681884765625, -0.358123779296875, -0.2894287109375, -0.220733642578125, -0.15203857421875, -0.083343505859375, -0.0146484375, 0.054046630859375, 0.12274169921875, 0.191436767578125, 0.2601318359375, 0.328826904296875, 0.39752197265625, 0.466217041015625, 0.534912109375, 0.603607177734375, 0.67230224609375, 0.740997314453125, 0.8096923828125, 0.878387451171875, 0.94708251953125, 1.015777587890625, 1.08447265625, 1.153167724609375, 1.22186279296875, 1.290557861328125, 1.3592529296875, 1.427947998046875, 1.49664306640625, 1.565338134765625, 1.634033203125, 1.702728271484375, 1.77142333984375, 1.840118408203125, 1.9088134765625, 1.977508544921875, 2.04620361328125, 2.114898681640625, 2.18359375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 5.0, 6.0, 7.0, 15.0, 15.0, 14.0, 19.0, 21.0, 27.0, 30.0, 35.0, 49.0, 59.0, 77.0, 79.0, 87.0, 83.0, 64.0, 71.0, 53.0, 32.0, 34.0, 23.0, 17.0, 15.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 5.0, 4.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.94861888885498, -11.57848072052002, -11.208342552185059, -10.838205337524414, -10.468067169189453, -10.097929000854492, -9.727790832519531, -9.35765266418457, -8.98751449584961, -8.617376327514648, -8.247238159179688, -7.877100467681885, -7.506962776184082, -7.136824607849121, -6.76668643951416, -6.396548271179199, -6.026411056518555, -5.656272888183594, -5.286135196685791, -4.91599702835083, -4.545859336853027, -4.175721168518066, -3.8055830001831055, -3.4354450702667236, -3.065307140350342, -2.69516921043396, -2.325031280517578, -1.9548931121826172, -1.5847551822662354, -1.2146172523498535, -0.8444790840148926, -0.47434115409851074, -0.1042022705078125, 0.2659357190132141, 0.6360737085342407, 1.006211757659912, 1.376349687576294, 1.7464876174926758, 2.1166257858276367, 2.4867637157440186, 2.8569016456604004, 3.2270395755767822, 3.597177505493164, 3.967315673828125, 4.337453842163086, 4.707591533660889, 5.07772970199585, 5.447867393493652, 5.818005561828613, 6.188143730163574, 6.558281421661377, 6.928419589996338, 7.298557281494141, 7.668695449829102, 8.038833618164062, 8.408971786499023, 8.779109954833984, 9.149248123168945, 9.519386291503906, 9.889524459838867, 10.259661674499512, 10.629799842834473, 10.999938011169434, 11.370076179504395, 11.740213394165039]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 7.0, 16.0, 14.0, 19.0, 13.0, 27.0, 30.0, 22.0, 32.0, 23.0, 42.0, 39.0, 37.0, 49.0, 48.0, 43.0, 41.0, 53.0, 48.0, 52.0, 39.0, 36.0, 30.0, 36.0, 24.0, 19.0, 32.0, 20.0, 18.0, 17.0, 16.0, 5.0, 8.0, 11.0, 3.0, 5.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.725652694702148, -6.512574195861816, -6.299495697021484, -6.086417198181152, -5.873338222503662, -5.66025972366333, -5.447181224822998, -5.234102725982666, -5.021024227142334, -4.807945728302002, -4.59486722946167, -4.38178825378418, -4.168709754943848, -3.9556312561035156, -3.7425527572631836, -3.5294742584228516, -3.3163955211639404, -3.1033170223236084, -2.8902382850646973, -2.6771597862243652, -2.464081287384033, -2.251002788543701, -2.03792405128479, -1.824845552444458, -1.6117669343948364, -1.3986883163452148, -1.1856098175048828, -0.9725311994552612, -0.7594526410102844, -0.5463740825653076, -0.33329546451568604, -0.120216965675354, 0.09286165237426758, 0.3059402108192444, 0.5190187692642212, 0.7320973873138428, 0.9451759457588196, 1.1582545042037964, 1.371333122253418, 1.58441162109375, 1.7974902391433716, 2.010568857192993, 2.223647356033325, 2.4367260932922363, 2.6498045921325684, 2.8628830909729004, 3.0759615898132324, 3.2890400886535645, 3.5021188259124756, 3.7151973247528076, 3.9282760620117188, 4.141354560852051, 4.354433059692383, 4.567511558532715, 4.780590057373047, 4.993668556213379, 5.206747531890869, 5.419826030731201, 5.632904529571533, 5.845983505249023, 6.0590620040893555, 6.2721405029296875, 6.4852190017700195, 6.698297500610352, 6.911375999450684]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 9.0, 5.0, 9.0, 20.0, 25.0, 47.0, 63.0, 105.0, 160.0, 259.0, 418.0, 613.0, 950.0, 1544.0, 2645.0, 4416.0, 7494.0, 13376.0, 24847.0, 48985.0, 95581.0, 175267.0, 238016.0, 196659.0, 112975.0, 57861.0, 29211.0, 15540.0, 8659.0, 4978.0, 2869.0, 1749.0, 1121.0, 713.0, 429.0, 292.0, 209.0, 144.0, 95.0, 56.0, 45.0, 28.0, 25.0, 13.0, 12.0, 4.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.359375, -9.04345703125, -8.7275390625, -8.41162109375, -8.095703125, -7.77978515625, -7.4638671875, -7.14794921875, -6.83203125, -6.51611328125, -6.2001953125, -5.88427734375, -5.568359375, -5.25244140625, -4.9365234375, -4.62060546875, -4.3046875, -3.98876953125, -3.6728515625, -3.35693359375, -3.041015625, -2.72509765625, -2.4091796875, -2.09326171875, -1.77734375, -1.46142578125, -1.1455078125, -0.82958984375, -0.513671875, -0.19775390625, 0.1181640625, 0.43408203125, 0.75, 1.06591796875, 1.3818359375, 1.69775390625, 2.013671875, 2.32958984375, 2.6455078125, 2.96142578125, 3.27734375, 3.59326171875, 3.9091796875, 4.22509765625, 4.541015625, 4.85693359375, 5.1728515625, 5.48876953125, 5.8046875, 6.12060546875, 6.4365234375, 6.75244140625, 7.068359375, 7.38427734375, 7.7001953125, 8.01611328125, 8.33203125, 8.64794921875, 8.9638671875, 9.27978515625, 9.595703125, 9.91162109375, 10.2275390625, 10.54345703125, 10.859375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 16.0, 11.0, 16.0, 17.0, 18.0, 14.0, 27.0, 34.0, 30.0, 36.0, 43.0, 45.0, 50.0, 38.0, 36.0, 56.0, 57.0, 47.0, 45.0, 41.0, 39.0, 38.0, 37.0, 31.0, 25.0, 23.0, 24.0, 16.0, 16.0, 11.0, 11.0, 6.0, 6.0, 7.0, 7.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.5845947265625, -6.348876953125, -6.1131591796875, -5.87744140625, -5.6417236328125, -5.406005859375, -5.1702880859375, -4.9345703125, -4.6988525390625, -4.463134765625, -4.2274169921875, -3.99169921875, -3.7559814453125, -3.520263671875, -3.2845458984375, -3.048828125, -2.8131103515625, -2.577392578125, -2.3416748046875, -2.10595703125, -1.8702392578125, -1.634521484375, -1.3988037109375, -1.1630859375, -0.9273681640625, -0.691650390625, -0.4559326171875, -0.22021484375, 0.0155029296875, 0.251220703125, 0.4869384765625, 0.72265625, 0.9583740234375, 1.194091796875, 1.4298095703125, 1.66552734375, 1.9012451171875, 2.136962890625, 2.3726806640625, 2.6083984375, 2.8441162109375, 3.079833984375, 3.3155517578125, 3.55126953125, 3.7869873046875, 4.022705078125, 4.2584228515625, 4.494140625, 4.7298583984375, 4.965576171875, 5.2012939453125, 5.43701171875, 5.6727294921875, 5.908447265625, 6.1441650390625, 6.3798828125, 6.6156005859375, 6.851318359375, 7.0870361328125, 7.32275390625, 7.5584716796875, 7.794189453125, 8.0299072265625, 8.265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 20.0, 22.0, 53.0, 61.0, 99.0, 154.0, 207.0, 335.0, 485.0, 749.0, 1109.0, 1661.0, 2514.0, 3804.0, 5674.0, 8725.0, 13943.0, 22326.0, 36246.0, 57952.0, 90350.0, 128863.0, 158955.0, 156415.0, 124464.0, 85814.0, 54835.0, 33727.0, 21348.0, 13269.0, 8412.0, 5307.0, 3587.0, 2340.0, 1629.0, 1005.0, 670.0, 455.0, 315.0, 218.0, 161.0, 89.0, 62.0, 37.0, 30.0, 17.0, 9.0, 12.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1171875, -6.89434814453125, -6.6715087890625, -6.44866943359375, -6.225830078125, -6.00299072265625, -5.7801513671875, -5.55731201171875, -5.33447265625, -5.11163330078125, -4.8887939453125, -4.66595458984375, -4.443115234375, -4.22027587890625, -3.9974365234375, -3.77459716796875, -3.5517578125, -3.32891845703125, -3.1060791015625, -2.88323974609375, -2.660400390625, -2.43756103515625, -2.2147216796875, -1.99188232421875, -1.76904296875, -1.54620361328125, -1.3233642578125, -1.10052490234375, -0.877685546875, -0.65484619140625, -0.4320068359375, -0.20916748046875, 0.013671875, 0.23651123046875, 0.4593505859375, 0.68218994140625, 0.905029296875, 1.12786865234375, 1.3507080078125, 1.57354736328125, 1.79638671875, 2.01922607421875, 2.2420654296875, 2.46490478515625, 2.687744140625, 2.91058349609375, 3.1334228515625, 3.35626220703125, 3.5791015625, 3.80194091796875, 4.0247802734375, 4.24761962890625, 4.470458984375, 4.69329833984375, 4.9161376953125, 5.13897705078125, 5.36181640625, 5.58465576171875, 5.8074951171875, 6.03033447265625, 6.253173828125, 6.47601318359375, 6.6988525390625, 6.92169189453125, 7.14453125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 6.0, 8.0, 8.0, 10.0, 22.0, 19.0, 30.0, 27.0, 29.0, 24.0, 35.0, 33.0, 44.0, 48.0, 49.0, 44.0, 31.0, 50.0, 42.0, 39.0, 55.0, 28.0, 36.0, 26.0, 40.0, 38.0, 31.0, 23.0, 20.0, 20.0, 8.0, 10.0, 14.0, 9.0, 6.0, 6.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.28125, -4.14935302734375, -4.0174560546875, -3.88555908203125, -3.753662109375, -3.62176513671875, -3.4898681640625, -3.35797119140625, -3.22607421875, -3.09417724609375, -2.9622802734375, -2.83038330078125, -2.698486328125, -2.56658935546875, -2.4346923828125, -2.30279541015625, -2.1708984375, -2.03900146484375, -1.9071044921875, -1.77520751953125, -1.643310546875, -1.51141357421875, -1.3795166015625, -1.24761962890625, -1.11572265625, -0.98382568359375, -0.8519287109375, -0.72003173828125, -0.588134765625, -0.45623779296875, -0.3243408203125, -0.19244384765625, -0.060546875, 0.07135009765625, 0.2032470703125, 0.33514404296875, 0.467041015625, 0.59893798828125, 0.7308349609375, 0.86273193359375, 0.99462890625, 1.12652587890625, 1.2584228515625, 1.39031982421875, 1.522216796875, 1.65411376953125, 1.7860107421875, 1.91790771484375, 2.0498046875, 2.18170166015625, 2.3135986328125, 2.44549560546875, 2.577392578125, 2.70928955078125, 2.8411865234375, 2.97308349609375, 3.10498046875, 3.23687744140625, 3.3687744140625, 3.50067138671875, 3.632568359375, 3.76446533203125, 3.8963623046875, 4.02825927734375, 4.16015625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 11.0, 19.0, 26.0, 35.0, 70.0, 84.0, 108.0, 161.0, 252.0, 323.0, 465.0, 694.0, 1039.0, 1597.0, 2485.0, 3919.0, 6602.0, 11237.0, 20564.0, 41359.0, 90431.0, 201356.0, 301644.0, 190950.0, 85704.0, 39675.0, 19750.0, 10830.0, 6173.0, 3826.0, 2397.0, 1529.0, 1003.0, 655.0, 471.0, 327.0, 263.0, 166.0, 99.0, 69.0, 58.0, 37.0, 29.0, 20.0, 12.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.2764892578125, -7.029541015625, -6.7825927734375, -6.53564453125, -6.2886962890625, -6.041748046875, -5.7947998046875, -5.5478515625, -5.3009033203125, -5.053955078125, -4.8070068359375, -4.56005859375, -4.3131103515625, -4.066162109375, -3.8192138671875, -3.572265625, -3.3253173828125, -3.078369140625, -2.8314208984375, -2.58447265625, -2.3375244140625, -2.090576171875, -1.8436279296875, -1.5966796875, -1.3497314453125, -1.102783203125, -0.8558349609375, -0.60888671875, -0.3619384765625, -0.114990234375, 0.1319580078125, 0.37890625, 0.6258544921875, 0.872802734375, 1.1197509765625, 1.36669921875, 1.6136474609375, 1.860595703125, 2.1075439453125, 2.3544921875, 2.6014404296875, 2.848388671875, 3.0953369140625, 3.34228515625, 3.5892333984375, 3.836181640625, 4.0831298828125, 4.330078125, 4.5770263671875, 4.823974609375, 5.0709228515625, 5.31787109375, 5.5648193359375, 5.811767578125, 6.0587158203125, 6.3056640625, 6.5526123046875, 6.799560546875, 7.0465087890625, 7.29345703125, 7.5404052734375, 7.787353515625, 8.0343017578125, 8.28125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 9.0, 10.0, 10.0, 12.0, 15.0, 20.0, 26.0, 54.0, 69.0, 117.0, 138.0, 137.0, 122.0, 88.0, 53.0, 32.0, 17.0, 13.0, 14.0, 8.0, 12.0, 4.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013942718505859375, -0.001353532075881958, -0.0013127923011779785, -0.001272052526473999, -0.0012313127517700195, -0.00119057297706604, -0.0011498332023620605, -0.001109093427658081, -0.0010683536529541016, -0.001027613878250122, -0.0009868741035461426, -0.0009461343288421631, -0.0009053945541381836, -0.0008646547794342041, -0.0008239150047302246, -0.0007831752300262451, -0.0007424354553222656, -0.0007016956806182861, -0.0006609559059143066, -0.0006202161312103271, -0.0005794763565063477, -0.0005387365818023682, -0.0004979968070983887, -0.0004572570323944092, -0.0004165172576904297, -0.0003757774829864502, -0.0003350377082824707, -0.0002942979335784912, -0.0002535581588745117, -0.00021281838417053223, -0.00017207860946655273, -0.00013133883476257324, -9.059906005859375e-05, -4.985928535461426e-05, -9.119510650634766e-06, 3.1620264053344727e-05, 7.236003875732422e-05, 0.00011309981346130371, 0.0001538395881652832, 0.0001945793628692627, 0.0002353191375732422, 0.0002760589122772217, 0.00031679868698120117, 0.00035753846168518066, 0.00039827823638916016, 0.00043901801109313965, 0.00047975778579711914, 0.0005204975605010986, 0.0005612373352050781, 0.0006019771099090576, 0.0006427168846130371, 0.0006834566593170166, 0.0007241964340209961, 0.0007649362087249756, 0.0008056759834289551, 0.0008464157581329346, 0.0008871555328369141, 0.0009278953075408936, 0.000968635082244873, 0.0010093748569488525, 0.001050114631652832, 0.0010908544063568115, 0.001131594181060791, 0.0011723339557647705, 0.00121307373046875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 2.0, 10.0, 17.0, 17.0, 24.0, 25.0, 37.0, 67.0, 101.0, 154.0, 227.0, 386.0, 595.0, 954.0, 1620.0, 2782.0, 5165.0, 9888.0, 21391.0, 50834.0, 128822.0, 287580.0, 299007.0, 138326.0, 54282.0, 22941.0, 10597.0, 5360.0, 2893.0, 1746.0, 1001.0, 576.0, 367.0, 259.0, 176.0, 89.0, 67.0, 50.0, 29.0, 31.0, 16.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.62890625, -7.38311767578125, -7.1373291015625, -6.89154052734375, -6.645751953125, -6.39996337890625, -6.1541748046875, -5.90838623046875, -5.66259765625, -5.41680908203125, -5.1710205078125, -4.92523193359375, -4.679443359375, -4.43365478515625, -4.1878662109375, -3.94207763671875, -3.6962890625, -3.45050048828125, -3.2047119140625, -2.95892333984375, -2.713134765625, -2.46734619140625, -2.2215576171875, -1.97576904296875, -1.72998046875, -1.48419189453125, -1.2384033203125, -0.99261474609375, -0.746826171875, -0.50103759765625, -0.2552490234375, -0.00946044921875, 0.236328125, 0.48211669921875, 0.7279052734375, 0.97369384765625, 1.219482421875, 1.46527099609375, 1.7110595703125, 1.95684814453125, 2.20263671875, 2.44842529296875, 2.6942138671875, 2.94000244140625, 3.185791015625, 3.43157958984375, 3.6773681640625, 3.92315673828125, 4.1689453125, 4.41473388671875, 4.6605224609375, 4.90631103515625, 5.152099609375, 5.39788818359375, 5.6436767578125, 5.88946533203125, 6.13525390625, 6.38104248046875, 6.6268310546875, 6.87261962890625, 7.118408203125, 7.36419677734375, 7.6099853515625, 7.85577392578125, 8.1015625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 6.0, 15.0, 21.0, 22.0, 28.0, 48.0, 56.0, 61.0, 75.0, 76.0, 105.0, 95.0, 92.0, 72.0, 44.0, 29.0, 49.0, 28.0, 16.0, 13.0, 12.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8173828125, -1.7564849853515625, -1.695587158203125, -1.6346893310546875, -1.57379150390625, -1.5128936767578125, -1.451995849609375, -1.3910980224609375, -1.3302001953125, -1.2693023681640625, -1.208404541015625, -1.1475067138671875, -1.08660888671875, -1.0257110595703125, -0.964813232421875, -0.9039154052734375, -0.843017578125, -0.7821197509765625, -0.721221923828125, -0.6603240966796875, -0.59942626953125, -0.5385284423828125, -0.477630615234375, -0.4167327880859375, -0.3558349609375, -0.2949371337890625, -0.234039306640625, -0.1731414794921875, -0.11224365234375, -0.0513458251953125, 0.009552001953125, 0.0704498291015625, 0.13134765625, 0.1922454833984375, 0.253143310546875, 0.3140411376953125, 0.37493896484375, 0.4358367919921875, 0.496734619140625, 0.5576324462890625, 0.6185302734375, 0.6794281005859375, 0.740325927734375, 0.8012237548828125, 0.86212158203125, 0.9230194091796875, 0.983917236328125, 1.0448150634765625, 1.105712890625, 1.1666107177734375, 1.227508544921875, 1.2884063720703125, 1.34930419921875, 1.4102020263671875, 1.471099853515625, 1.5319976806640625, 1.5928955078125, 1.6537933349609375, 1.714691162109375, 1.7755889892578125, 1.83648681640625, 1.8973846435546875, 1.958282470703125, 2.0191802978515625, 2.080078125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 9.0, 3.0, 6.0, 8.0, 9.0, 13.0, 20.0, 16.0, 16.0, 31.0, 34.0, 37.0, 47.0, 47.0, 64.0, 84.0, 76.0, 78.0, 71.0, 67.0, 46.0, 54.0, 23.0, 24.0, 18.0, 18.0, 14.0, 13.0, 6.0, 11.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.410075187683105, -10.060137748718262, -9.710200309753418, -9.360262870788574, -9.010326385498047, -8.660388946533203, -8.31045150756836, -7.960514068603516, -7.610576629638672, -7.260639190673828, -6.910701751708984, -6.560764789581299, -6.210827350616455, -5.860889911651611, -5.510952949523926, -5.161015510559082, -4.811078071594238, -4.4611406326293945, -4.111203193664551, -3.7612662315368652, -3.4113287925720215, -3.0613913536071777, -2.711454153060913, -2.3615169525146484, -2.0115795135498047, -1.6616421937942505, -1.3117048740386963, -0.9617675542831421, -0.6118302345275879, -0.2618929147720337, 0.08804440498352051, 0.43798160552978516, 0.7879199981689453, 1.1378573179244995, 1.4877946376800537, 1.837731957435608, 2.187669277191162, 2.537606716156006, 2.8875439167022705, 3.237481117248535, 3.587418556213379, 3.9373559951782227, 4.287293434143066, 4.637230396270752, 4.987167835235596, 5.3371052742004395, 5.687042236328125, 6.036979675292969, 6.3869171142578125, 6.736854553222656, 7.0867919921875, 7.4367289543151855, 7.786666393280029, 8.136603355407715, 8.486540794372559, 8.836478233337402, 9.186415672302246, 9.53635311126709, 9.886290550231934, 10.236227989196777, 10.586164474487305, 10.936101913452148, 11.286039352416992, 11.635976791381836, 11.98591423034668]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 12.0, 22.0, 19.0, 24.0, 29.0, 27.0, 30.0, 38.0, 54.0, 43.0, 34.0, 43.0, 41.0, 34.0, 62.0, 43.0, 40.0, 55.0, 35.0, 35.0, 44.0, 25.0, 27.0, 21.0, 21.0, 18.0, 21.0, 8.0, 10.0, 15.0, 7.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.289765357971191, -6.0647687911987305, -5.8397722244262695, -5.614776134490967, -5.389779567718506, -5.164783000946045, -4.939786434173584, -4.714790344238281, -4.48979377746582, -4.264797210693359, -4.039800643920898, -3.8148043155670166, -3.5898079872131348, -3.364811420440674, -3.139814853668213, -2.914818525314331, -2.68982195854187, -2.464825391769409, -2.2398290634155273, -2.0148324966430664, -1.7898361682891846, -1.5648396015167236, -1.3398431539535522, -1.1148467063903809, -0.8898502588272095, -0.6648538112640381, -0.4398573338985443, -0.21486085653305054, 0.01013559103012085, 0.235132098197937, 0.4601285457611084, 0.6851249933242798, 0.9101214408874512, 1.1351178884506226, 1.360114336013794, 1.5851109027862549, 1.8101072311401367, 2.0351037979125977, 2.2601003646850586, 2.4850966930389404, 2.7100930213928223, 2.935089588165283, 3.160085916519165, 3.385082483291626, 3.610078811645508, 3.8350753784179688, 4.06007194519043, 4.285068511962891, 4.510065078735352, 4.7350616455078125, 4.960058212280273, 5.185054302215576, 5.410050868988037, 5.635047435760498, 5.860044002532959, 6.085040092468262, 6.310036659240723, 6.535033226013184, 6.7600297927856445, 6.985025882720947, 7.210022449493408, 7.435019016265869, 7.66001558303833, 7.885011672973633, 8.110008239746094]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 12.0, 12.0, 16.0, 32.0, 29.0, 43.0, 62.0, 83.0, 115.0, 171.0, 243.0, 353.0, 512.0, 722.0, 1090.0, 1596.0, 2241.0, 3453.0, 5493.0, 8775.0, 15236.0, 28961.0, 66039.0, 193883.0, 691573.0, 1666464.0, 1043290.0, 287048.0, 89198.0, 36660.0, 18499.0, 10915.0, 6815.0, 4499.0, 3016.0, 2073.0, 1490.0, 994.0, 774.0, 527.0, 344.0, 293.0, 199.0, 137.0, 97.0, 57.0, 49.0, 39.0, 19.0, 11.0, 7.0, 6.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-14.2890625, -13.837890625, -13.38671875, -12.935546875, -12.484375, -12.033203125, -11.58203125, -11.130859375, -10.6796875, -10.228515625, -9.77734375, -9.326171875, -8.875, -8.423828125, -7.97265625, -7.521484375, -7.0703125, -6.619140625, -6.16796875, -5.716796875, -5.265625, -4.814453125, -4.36328125, -3.912109375, -3.4609375, -3.009765625, -2.55859375, -2.107421875, -1.65625, -1.205078125, -0.75390625, -0.302734375, 0.1484375, 0.599609375, 1.05078125, 1.501953125, 1.953125, 2.404296875, 2.85546875, 3.306640625, 3.7578125, 4.208984375, 4.66015625, 5.111328125, 5.5625, 6.013671875, 6.46484375, 6.916015625, 7.3671875, 7.818359375, 8.26953125, 8.720703125, 9.171875, 9.623046875, 10.07421875, 10.525390625, 10.9765625, 11.427734375, 11.87890625, 12.330078125, 12.78125, 13.232421875, 13.68359375, 14.134765625, 14.5859375]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 15.0, 8.0, 12.0, 13.0, 17.0, 23.0, 22.0, 26.0, 25.0, 37.0, 38.0, 39.0, 40.0, 38.0, 42.0, 49.0, 50.0, 51.0, 46.0, 46.0, 47.0, 35.0, 33.0, 48.0, 26.0, 30.0, 22.0, 24.0, 18.0, 11.0, 18.0, 10.0, 9.0, 10.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.00390625, -4.824462890625, -4.64501953125, -4.465576171875, -4.2861328125, -4.106689453125, -3.92724609375, -3.747802734375, -3.568359375, -3.388916015625, -3.20947265625, -3.030029296875, -2.8505859375, -2.671142578125, -2.49169921875, -2.312255859375, -2.1328125, -1.953369140625, -1.77392578125, -1.594482421875, -1.4150390625, -1.235595703125, -1.05615234375, -0.876708984375, -0.697265625, -0.517822265625, -0.33837890625, -0.158935546875, 0.0205078125, 0.199951171875, 0.37939453125, 0.558837890625, 0.73828125, 0.917724609375, 1.09716796875, 1.276611328125, 1.4560546875, 1.635498046875, 1.81494140625, 1.994384765625, 2.173828125, 2.353271484375, 2.53271484375, 2.712158203125, 2.8916015625, 3.071044921875, 3.25048828125, 3.429931640625, 3.609375, 3.788818359375, 3.96826171875, 4.147705078125, 4.3271484375, 4.506591796875, 4.68603515625, 4.865478515625, 5.044921875, 5.224365234375, 5.40380859375, 5.583251953125, 5.7626953125, 5.942138671875, 6.12158203125, 6.301025390625, 6.48046875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 0.0, 6.0, 9.0, 12.0, 18.0, 39.0, 59.0, 73.0, 89.0, 150.0, 266.0, 346.0, 620.0, 960.0, 1448.0, 2484.0, 4003.0, 6581.0, 11436.0, 20966.0, 41287.0, 91338.0, 243095.0, 740936.0, 1553758.0, 945064.0, 311708.0, 112577.0, 48908.0, 24153.0, 12932.0, 7424.0, 4372.0, 2682.0, 1604.0, 1039.0, 623.0, 440.0, 270.0, 170.0, 113.0, 69.0, 50.0, 29.0, 22.0, 28.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.359375, -14.888427734375, -14.41748046875, -13.946533203125, -13.4755859375, -13.004638671875, -12.53369140625, -12.062744140625, -11.591796875, -11.120849609375, -10.64990234375, -10.178955078125, -9.7080078125, -9.237060546875, -8.76611328125, -8.295166015625, -7.82421875, -7.353271484375, -6.88232421875, -6.411376953125, -5.9404296875, -5.469482421875, -4.99853515625, -4.527587890625, -4.056640625, -3.585693359375, -3.11474609375, -2.643798828125, -2.1728515625, -1.701904296875, -1.23095703125, -0.760009765625, -0.2890625, 0.181884765625, 0.65283203125, 1.123779296875, 1.5947265625, 2.065673828125, 2.53662109375, 3.007568359375, 3.478515625, 3.949462890625, 4.42041015625, 4.891357421875, 5.3623046875, 5.833251953125, 6.30419921875, 6.775146484375, 7.24609375, 7.717041015625, 8.18798828125, 8.658935546875, 9.1298828125, 9.600830078125, 10.07177734375, 10.542724609375, 11.013671875, 11.484619140625, 11.95556640625, 12.426513671875, 12.8974609375, 13.368408203125, 13.83935546875, 14.310302734375, 14.78125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 11.0, 6.0, 4.0, 11.0, 11.0, 17.0, 20.0, 22.0, 38.0, 54.0, 47.0, 62.0, 93.0, 113.0, 156.0, 204.0, 278.0, 303.0, 326.0, 380.0, 346.0, 325.0, 250.0, 213.0, 188.0, 136.0, 118.0, 77.0, 61.0, 46.0, 44.0, 30.0, 15.0, 16.0, 14.0, 10.0, 9.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.046875, -3.930755615234375, -3.81463623046875, -3.698516845703125, -3.5823974609375, -3.466278076171875, -3.35015869140625, -3.234039306640625, -3.117919921875, -3.001800537109375, -2.88568115234375, -2.769561767578125, -2.6534423828125, -2.537322998046875, -2.42120361328125, -2.305084228515625, -2.18896484375, -2.072845458984375, -1.95672607421875, -1.840606689453125, -1.7244873046875, -1.608367919921875, -1.49224853515625, -1.376129150390625, -1.260009765625, -1.143890380859375, -1.02777099609375, -0.911651611328125, -0.7955322265625, -0.679412841796875, -0.56329345703125, -0.447174072265625, -0.3310546875, -0.214935302734375, -0.09881591796875, 0.017303466796875, 0.1334228515625, 0.249542236328125, 0.36566162109375, 0.481781005859375, 0.597900390625, 0.714019775390625, 0.83013916015625, 0.946258544921875, 1.0623779296875, 1.178497314453125, 1.29461669921875, 1.410736083984375, 1.52685546875, 1.642974853515625, 1.75909423828125, 1.875213623046875, 1.9913330078125, 2.107452392578125, 2.22357177734375, 2.339691162109375, 2.455810546875, 2.571929931640625, 2.68804931640625, 2.804168701171875, 2.9202880859375, 3.036407470703125, 3.15252685546875, 3.268646240234375, 3.384765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 1.0, 8.0, 12.0, 10.0, 12.0, 23.0, 29.0, 39.0, 42.0, 64.0, 84.0, 101.0, 108.0, 100.0, 100.0, 71.0, 48.0, 43.0, 27.0, 17.0, 6.0, 17.0, 5.0, 5.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.42683982849121, -19.897809982299805, -19.368778228759766, -18.83974838256836, -18.310718536376953, -17.781688690185547, -17.252656936645508, -16.7236270904541, -16.194595336914062, -15.66556453704834, -15.136534690856934, -14.607503890991211, -14.078474044799805, -13.549443244934082, -13.02041244506836, -12.491382598876953, -11.962352752685547, -11.433321952819824, -10.904292106628418, -10.375261306762695, -9.846231460571289, -9.317200660705566, -8.788169860839844, -8.259140014648438, -7.730109214782715, -7.20107889175415, -6.672048568725586, -6.143017768859863, -5.613987445831299, -5.084957122802734, -4.555926322937012, -4.026895999908447, -3.49786376953125, -2.9688334465026855, -2.439802885055542, -1.910772442817688, -1.381742000579834, -0.8527116775512695, -0.323681116104126, 0.20534944534301758, 0.734379768371582, 1.263410210609436, 1.79244065284729, 2.3214712142944336, 2.850501537322998, 3.3795318603515625, 3.908562421798706, 4.43759298324585, 4.966623306274414, 5.4956536293029785, 6.024683952331543, 6.553714752197266, 7.08274507522583, 7.6117753982543945, 8.140806198120117, 8.669836044311523, 9.198866844177246, 9.727897644042969, 10.256927490234375, 10.785958290100098, 11.31498908996582, 11.844018936157227, 12.37304973602295, 12.902080535888672, 13.431110382080078]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 10.0, 12.0, 8.0, 20.0, 15.0, 19.0, 22.0, 37.0, 36.0, 33.0, 38.0, 45.0, 40.0, 36.0, 42.0, 54.0, 38.0, 50.0, 46.0, 39.0, 45.0, 45.0, 42.0, 27.0, 25.0, 30.0, 21.0, 26.0, 6.0, 20.0, 10.0, 8.0, 14.0, 6.0, 8.0, 7.0, 2.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.962804794311523, -5.730165481567383, -5.497525691986084, -5.264886379241943, -5.0322465896606445, -4.799607276916504, -4.566967487335205, -4.3343281745910645, -4.101688385009766, -3.869048833847046, -3.636409282684326, -3.4037697315216064, -3.1711301803588867, -2.938490867614746, -2.7058510780334473, -2.4732117652893066, -2.240572214126587, -2.007932662963867, -1.7752931118011475, -1.5426535606384277, -1.310014009475708, -1.0773745775222778, -0.8447350263595581, -0.6120954751968384, -0.37945592403411865, -0.14681638777256012, 0.08582314848899841, 0.31846266984939575, 0.5511022210121155, 0.7837417125701904, 1.0163812637329102, 1.2490208148956299, 1.4816603660583496, 1.7142999172210693, 1.946939468383789, 2.179579019546509, 2.4122185707092285, 2.644857883453369, 2.877497673034668, 3.1101369857788086, 3.3427767753601074, 3.575416326522827, 3.808055877685547, 4.0406951904296875, 4.273334980010986, 4.505974292755127, 4.738614082336426, 4.971253395080566, 5.203892707824707, 5.436532020568848, 5.6691718101501465, 5.901811122894287, 6.134450912475586, 6.367090225219727, 6.599730014801025, 6.832369327545166, 7.065009117126465, 7.2976484298706055, 7.530288219451904, 7.762927532196045, 7.995567321777344, 8.228206634521484, 8.460845947265625, 8.693486213684082, 8.926125526428223]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 11.0, 13.0, 32.0, 49.0, 60.0, 101.0, 142.0, 217.0, 333.0, 510.0, 718.0, 1127.0, 1817.0, 2907.0, 4524.0, 7105.0, 11868.0, 18701.0, 30847.0, 51283.0, 85739.0, 133781.0, 176830.0, 175829.0, 131316.0, 83177.0, 50188.0, 30137.0, 18538.0, 11145.0, 7025.0, 4472.0, 2889.0, 1760.0, 1157.0, 711.0, 501.0, 310.0, 217.0, 141.0, 101.0, 74.0, 49.0, 31.0, 25.0, 17.0, 6.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.79296875, -2.699798583984375, -2.60662841796875, -2.513458251953125, -2.4202880859375, -2.327117919921875, -2.23394775390625, -2.140777587890625, -2.047607421875, -1.954437255859375, -1.86126708984375, -1.768096923828125, -1.6749267578125, -1.581756591796875, -1.48858642578125, -1.395416259765625, -1.30224609375, -1.209075927734375, -1.11590576171875, -1.022735595703125, -0.9295654296875, -0.836395263671875, -0.74322509765625, -0.650054931640625, -0.556884765625, -0.463714599609375, -0.37054443359375, -0.277374267578125, -0.1842041015625, -0.091033935546875, 0.00213623046875, 0.095306396484375, 0.1884765625, 0.281646728515625, 0.37481689453125, 0.467987060546875, 0.5611572265625, 0.654327392578125, 0.74749755859375, 0.840667724609375, 0.933837890625, 1.027008056640625, 1.12017822265625, 1.213348388671875, 1.3065185546875, 1.399688720703125, 1.49285888671875, 1.586029052734375, 1.67919921875, 1.772369384765625, 1.86553955078125, 1.958709716796875, 2.0518798828125, 2.145050048828125, 2.23822021484375, 2.331390380859375, 2.424560546875, 2.517730712890625, 2.61090087890625, 2.704071044921875, 2.7972412109375, 2.890411376953125, 2.98358154296875, 3.076751708984375, 3.169921875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 0.0, 2.0, 8.0, 10.0, 13.0, 17.0, 12.0, 21.0, 23.0, 15.0, 26.0, 43.0, 40.0, 38.0, 64.0, 45.0, 31.0, 49.0, 43.0, 45.0, 37.0, 63.0, 53.0, 38.0, 28.0, 37.0, 38.0, 29.0, 22.0, 14.0, 26.0, 11.0, 13.0, 11.0, 10.0, 7.0, 9.0, 3.0, 4.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.640869140625, -6.37548828125, -6.110107421875, -5.8447265625, -5.579345703125, -5.31396484375, -5.048583984375, -4.783203125, -4.517822265625, -4.25244140625, -3.987060546875, -3.7216796875, -3.456298828125, -3.19091796875, -2.925537109375, -2.66015625, -2.394775390625, -2.12939453125, -1.864013671875, -1.5986328125, -1.333251953125, -1.06787109375, -0.802490234375, -0.537109375, -0.271728515625, -0.00634765625, 0.259033203125, 0.5244140625, 0.789794921875, 1.05517578125, 1.320556640625, 1.5859375, 1.851318359375, 2.11669921875, 2.382080078125, 2.6474609375, 2.912841796875, 3.17822265625, 3.443603515625, 3.708984375, 3.974365234375, 4.23974609375, 4.505126953125, 4.7705078125, 5.035888671875, 5.30126953125, 5.566650390625, 5.83203125, 6.097412109375, 6.36279296875, 6.628173828125, 6.8935546875, 7.158935546875, 7.42431640625, 7.689697265625, 7.955078125, 8.220458984375, 8.48583984375, 8.751220703125, 9.0166015625, 9.281982421875, 9.54736328125, 9.812744140625, 10.078125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 5.0, 5.0, 5.0, 5.0, 8.0, 17.0, 25.0, 31.0, 32.0, 86.0, 98.0, 181.0, 266.0, 343.0, 495.0, 769.0, 1325.0, 2093.0, 3425.0, 5755.0, 9812.0, 17097.0, 30585.0, 56433.0, 100837.0, 170518.0, 222068.0, 179706.0, 108664.0, 60297.0, 33052.0, 18355.0, 10467.0, 6004.0, 3542.0, 2223.0, 1391.0, 875.0, 575.0, 389.0, 227.0, 146.0, 119.0, 56.0, 53.0, 35.0, 22.0, 18.0, 14.0, 4.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.59375, -3.476165771484375, -3.35858154296875, -3.240997314453125, -3.1234130859375, -3.005828857421875, -2.88824462890625, -2.770660400390625, -2.653076171875, -2.535491943359375, -2.41790771484375, -2.300323486328125, -2.1827392578125, -2.065155029296875, -1.94757080078125, -1.829986572265625, -1.71240234375, -1.594818115234375, -1.47723388671875, -1.359649658203125, -1.2420654296875, -1.124481201171875, -1.00689697265625, -0.889312744140625, -0.771728515625, -0.654144287109375, -0.53656005859375, -0.418975830078125, -0.3013916015625, -0.183807373046875, -0.06622314453125, 0.051361083984375, 0.1689453125, 0.286529541015625, 0.40411376953125, 0.521697998046875, 0.6392822265625, 0.756866455078125, 0.87445068359375, 0.992034912109375, 1.109619140625, 1.227203369140625, 1.34478759765625, 1.462371826171875, 1.5799560546875, 1.697540283203125, 1.81512451171875, 1.932708740234375, 2.05029296875, 2.167877197265625, 2.28546142578125, 2.403045654296875, 2.5206298828125, 2.638214111328125, 2.75579833984375, 2.873382568359375, 2.990966796875, 3.108551025390625, 3.22613525390625, 3.343719482421875, 3.4613037109375, 3.578887939453125, 3.69647216796875, 3.814056396484375, 3.931640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 4.0, 8.0, 12.0, 11.0, 9.0, 24.0, 17.0, 21.0, 26.0, 27.0, 28.0, 34.0, 46.0, 30.0, 30.0, 40.0, 27.0, 33.0, 37.0, 40.0, 43.0, 39.0, 32.0, 40.0, 36.0, 40.0, 26.0, 26.0, 29.0, 22.0, 21.0, 22.0, 22.0, 21.0, 12.0, 12.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.125, -4.000030517578125, -3.87506103515625, -3.750091552734375, -3.6251220703125, -3.500152587890625, -3.37518310546875, -3.250213623046875, -3.125244140625, -3.000274658203125, -2.87530517578125, -2.750335693359375, -2.6253662109375, -2.500396728515625, -2.37542724609375, -2.250457763671875, -2.12548828125, -2.000518798828125, -1.87554931640625, -1.750579833984375, -1.6256103515625, -1.500640869140625, -1.37567138671875, -1.250701904296875, -1.125732421875, -1.000762939453125, -0.87579345703125, -0.750823974609375, -0.6258544921875, -0.500885009765625, -0.37591552734375, -0.250946044921875, -0.1259765625, -0.001007080078125, 0.12396240234375, 0.248931884765625, 0.3739013671875, 0.498870849609375, 0.62384033203125, 0.748809814453125, 0.873779296875, 0.998748779296875, 1.12371826171875, 1.248687744140625, 1.3736572265625, 1.498626708984375, 1.62359619140625, 1.748565673828125, 1.87353515625, 1.998504638671875, 2.12347412109375, 2.248443603515625, 2.3734130859375, 2.498382568359375, 2.62335205078125, 2.748321533203125, 2.873291015625, 2.998260498046875, 3.12322998046875, 3.248199462890625, 3.3731689453125, 3.498138427734375, 3.62310791015625, 3.748077392578125, 3.873046875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 16.0, 15.0, 21.0, 28.0, 39.0, 65.0, 106.0, 141.0, 232.0, 440.0, 677.0, 1243.0, 2459.0, 4913.0, 10542.0, 24434.0, 62917.0, 172843.0, 368186.0, 246789.0, 90876.0, 34456.0, 13956.0, 6364.0, 3054.0, 1564.0, 911.0, 448.0, 304.0, 159.0, 119.0, 71.0, 47.0, 39.0, 23.0, 16.0, 11.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.671539306640625, -2.58721923828125, -2.502899169921875, -2.4185791015625, -2.334259033203125, -2.24993896484375, -2.165618896484375, -2.081298828125, -1.996978759765625, -1.91265869140625, -1.828338623046875, -1.7440185546875, -1.659698486328125, -1.57537841796875, -1.491058349609375, -1.40673828125, -1.322418212890625, -1.23809814453125, -1.153778076171875, -1.0694580078125, -0.985137939453125, -0.90081787109375, -0.816497802734375, -0.732177734375, -0.647857666015625, -0.56353759765625, -0.479217529296875, -0.3948974609375, -0.310577392578125, -0.22625732421875, -0.141937255859375, -0.0576171875, 0.026702880859375, 0.11102294921875, 0.195343017578125, 0.2796630859375, 0.363983154296875, 0.44830322265625, 0.532623291015625, 0.616943359375, 0.701263427734375, 0.78558349609375, 0.869903564453125, 0.9542236328125, 1.038543701171875, 1.12286376953125, 1.207183837890625, 1.29150390625, 1.375823974609375, 1.46014404296875, 1.544464111328125, 1.6287841796875, 1.713104248046875, 1.79742431640625, 1.881744384765625, 1.966064453125, 2.050384521484375, 2.13470458984375, 2.219024658203125, 2.3033447265625, 2.387664794921875, 2.47198486328125, 2.556304931640625, 2.640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 6.0, 5.0, 6.0, 4.0, 13.0, 13.0, 9.0, 13.0, 25.0, 36.0, 58.0, 49.0, 72.0, 60.0, 75.0, 71.0, 79.0, 80.0, 69.0, 46.0, 48.0, 42.0, 34.0, 21.0, 13.0, 13.0, 11.0, 6.0, 10.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-0.00012099742889404297, -0.00011779461055994034, -0.00011459179222583771, -0.00011138897389173508, -0.00010818615555763245, -0.00010498333722352982, -0.00010178051888942719, -9.857770055532455e-05, -9.537488222122192e-05, -9.217206388711929e-05, -8.896924555301666e-05, -8.576642721891403e-05, -8.25636088848114e-05, -7.936079055070877e-05, -7.615797221660614e-05, -7.295515388250351e-05, -6.975233554840088e-05, -6.654951721429825e-05, -6.334669888019562e-05, -6.014388054609299e-05, -5.6941062211990356e-05, -5.3738243877887726e-05, -5.0535425543785095e-05, -4.7332607209682465e-05, -4.4129788875579834e-05, -4.09269705414772e-05, -3.772415220737457e-05, -3.452133387327194e-05, -3.131851553916931e-05, -2.811569720506668e-05, -2.491287887096405e-05, -2.171006053686142e-05, -1.850724220275879e-05, -1.530442386865616e-05, -1.2101605534553528e-05, -8.898787200450897e-06, -5.695968866348267e-06, -2.493150532245636e-06, 7.096678018569946e-07, 3.912486135959625e-06, 7.115304470062256e-06, 1.0318122804164886e-05, 1.3520941138267517e-05, 1.6723759472370148e-05, 1.992657780647278e-05, 2.312939614057541e-05, 2.633221447467804e-05, 2.953503280878067e-05, 3.27378511428833e-05, 3.594066947698593e-05, 3.914348781108856e-05, 4.234630614519119e-05, 4.554912447929382e-05, 4.8751942813396454e-05, 5.1954761147499084e-05, 5.5157579481601715e-05, 5.8360397815704346e-05, 6.156321614980698e-05, 6.476603448390961e-05, 6.796885281801224e-05, 7.117167115211487e-05, 7.43744894862175e-05, 7.757730782032013e-05, 8.078012615442276e-05, 8.398294448852539e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 15.0, 17.0, 24.0, 26.0, 38.0, 79.0, 85.0, 139.0, 241.0, 342.0, 579.0, 986.0, 1545.0, 2673.0, 4802.0, 8759.0, 17015.0, 35431.0, 79728.0, 178788.0, 290031.0, 226368.0, 107185.0, 46923.0, 21704.0, 11047.0, 5784.0, 3258.0, 1892.0, 1099.0, 684.0, 436.0, 290.0, 170.0, 108.0, 78.0, 52.0, 46.0, 19.0, 12.0, 11.0, 14.0, 8.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.29296875, -2.2205810546875, -2.148193359375, -2.0758056640625, -2.00341796875, -1.9310302734375, -1.858642578125, -1.7862548828125, -1.7138671875, -1.6414794921875, -1.569091796875, -1.4967041015625, -1.42431640625, -1.3519287109375, -1.279541015625, -1.2071533203125, -1.134765625, -1.0623779296875, -0.989990234375, -0.9176025390625, -0.84521484375, -0.7728271484375, -0.700439453125, -0.6280517578125, -0.5556640625, -0.4832763671875, -0.410888671875, -0.3385009765625, -0.26611328125, -0.1937255859375, -0.121337890625, -0.0489501953125, 0.0234375, 0.0958251953125, 0.168212890625, 0.2406005859375, 0.31298828125, 0.3853759765625, 0.457763671875, 0.5301513671875, 0.6025390625, 0.6749267578125, 0.747314453125, 0.8197021484375, 0.89208984375, 0.9644775390625, 1.036865234375, 1.1092529296875, 1.181640625, 1.2540283203125, 1.326416015625, 1.3988037109375, 1.47119140625, 1.5435791015625, 1.615966796875, 1.6883544921875, 1.7607421875, 1.8331298828125, 1.905517578125, 1.9779052734375, 2.05029296875, 2.1226806640625, 2.195068359375, 2.2674560546875, 2.33984375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 6.0, 8.0, 13.0, 17.0, 14.0, 23.0, 25.0, 37.0, 51.0, 58.0, 58.0, 65.0, 70.0, 67.0, 54.0, 58.0, 80.0, 47.0, 49.0, 43.0, 32.0, 27.0, 25.0, 12.0, 10.0, 11.0, 6.0, 8.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55908203125, -0.5410079956054688, -0.5229339599609375, -0.5048599243164062, -0.486785888671875, -0.46871185302734375, -0.4506378173828125, -0.43256378173828125, -0.41448974609375, -0.39641571044921875, -0.3783416748046875, -0.36026763916015625, -0.342193603515625, -0.32411956787109375, -0.3060455322265625, -0.28797149658203125, -0.2698974609375, -0.25182342529296875, -0.2337493896484375, -0.21567535400390625, -0.197601318359375, -0.17952728271484375, -0.1614532470703125, -0.14337921142578125, -0.12530517578125, -0.10723114013671875, -0.0891571044921875, -0.07108306884765625, -0.053009033203125, -0.03493499755859375, -0.0168609619140625, 0.00121307373046875, 0.019287109375, 0.03736114501953125, 0.0554351806640625, 0.07350921630859375, 0.091583251953125, 0.10965728759765625, 0.1277313232421875, 0.14580535888671875, 0.16387939453125, 0.18195343017578125, 0.2000274658203125, 0.21810150146484375, 0.236175537109375, 0.25424957275390625, 0.2723236083984375, 0.29039764404296875, 0.3084716796875, 0.32654571533203125, 0.3446197509765625, 0.36269378662109375, 0.380767822265625, 0.39884185791015625, 0.4169158935546875, 0.43498992919921875, 0.45306396484375, 0.47113800048828125, 0.4892120361328125, 0.5072860717773438, 0.525360107421875, 0.5434341430664062, 0.5615081787109375, 0.5795822143554688, 0.59765625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 2.0, 7.0, 13.0, 10.0, 16.0, 22.0, 33.0, 37.0, 44.0, 68.0, 104.0, 98.0, 95.0, 114.0, 81.0, 68.0, 52.0, 34.0, 30.0, 11.0, 14.0, 8.0, 6.0, 9.0, 6.0, 4.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.80108070373535, -20.27338981628418, -19.745698928833008, -19.218008041381836, -18.690317153930664, -18.162626266479492, -17.63493537902832, -17.10724449157715, -16.579553604125977, -16.051862716674805, -15.524171829223633, -14.996480941772461, -14.468790054321289, -13.941099166870117, -13.413408279418945, -12.885717391967773, -12.358026504516602, -11.83033561706543, -11.302644729614258, -10.774953842163086, -10.247262954711914, -9.719572067260742, -9.19188117980957, -8.664190292358398, -8.136499404907227, -7.608808517456055, -7.081117630004883, -6.553426742553711, -6.025735855102539, -5.498044967651367, -4.970354080200195, -4.442663192749023, -3.9149703979492188, -3.387279510498047, -2.859588623046875, -2.331897735595703, -1.8042068481445312, -1.2765159606933594, -0.7488250732421875, -0.22113418579101562, 0.30655670166015625, 0.8342475891113281, 1.3619384765625, 1.8896293640136719, 2.4173202514648438, 2.9450111389160156, 3.4727020263671875, 4.000392913818359, 4.528083801269531, 5.055774688720703, 5.583465576171875, 6.111156463623047, 6.638847351074219, 7.166538238525391, 7.6942291259765625, 8.221920013427734, 8.749610900878906, 9.277301788330078, 9.80499267578125, 10.332683563232422, 10.860374450683594, 11.388065338134766, 11.915756225585938, 12.44344711303711, 12.971138000488281]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 5.0, 9.0, 11.0, 9.0, 21.0, 17.0, 16.0, 22.0, 33.0, 39.0, 38.0, 39.0, 45.0, 35.0, 35.0, 55.0, 47.0, 40.0, 51.0, 43.0, 39.0, 45.0, 52.0, 34.0, 27.0, 27.0, 31.0, 18.0, 25.0, 7.0, 16.0, 13.0, 5.0, 16.0, 6.0, 10.0, 5.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.937016487121582, -5.702924728393555, -5.4688334465026855, -5.234741687774658, -5.000649929046631, -4.766558647155762, -4.532466888427734, -4.298375129699707, -4.06428337097168, -3.8301918506622314, -3.596100091934204, -3.362008571624756, -3.1279168128967285, -2.8938252925872803, -2.659733772277832, -2.4256420135498047, -2.1915504932403564, -1.9574588537216187, -1.7233672142028809, -1.4892756938934326, -1.2551839351654053, -1.021092414855957, -0.7870007753372192, -0.5529091358184814, -0.31881749629974365, -0.08472587168216705, 0.14936575293540955, 0.38345736265182495, 0.6175490021705627, 0.8516405820846558, 1.0857322216033936, 1.3198238611221313, 1.5539155006408691, 1.788007140159607, 2.0220987796783447, 2.256190299987793, 2.4902820587158203, 2.7243735790252686, 2.958465099334717, 3.192556858062744, 3.4266486167907715, 3.6607401371002197, 3.894831895828247, 4.128923416137695, 4.363015174865723, 4.59710693359375, 4.831198215484619, 5.0652899742126465, 5.299381256103516, 5.533473014831543, 5.767564296722412, 6.0016560554504395, 6.235747814178467, 6.469839096069336, 6.703930854797363, 6.938022613525391, 7.172114372253418, 7.406206130981445, 7.6402974128723145, 7.874389171600342, 8.108480453491211, 8.342572212219238, 8.576663970947266, 8.810755729675293, 9.04484748840332]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 11.0, 9.0, 10.0, 17.0, 27.0, 24.0, 45.0, 54.0, 87.0, 108.0, 133.0, 235.0, 357.0, 611.0, 1064.0, 1774.0, 3252.0, 6268.0, 12952.0, 28631.0, 70927.0, 179953.0, 324307.0, 242316.0, 100625.0, 39511.0, 17310.0, 8217.0, 4194.0, 2222.0, 1195.0, 704.0, 435.0, 292.0, 199.0, 130.0, 107.0, 66.0, 43.0, 37.0, 22.0, 16.0, 12.0, 11.0, 14.0, 9.0, 6.0, 2.0, 0.0, 5.0], "bins": [-17.859375, -17.37255859375, -16.8857421875, -16.39892578125, -15.912109375, -15.42529296875, -14.9384765625, -14.45166015625, -13.96484375, -13.47802734375, -12.9912109375, -12.50439453125, -12.017578125, -11.53076171875, -11.0439453125, -10.55712890625, -10.0703125, -9.58349609375, -9.0966796875, -8.60986328125, -8.123046875, -7.63623046875, -7.1494140625, -6.66259765625, -6.17578125, -5.68896484375, -5.2021484375, -4.71533203125, -4.228515625, -3.74169921875, -3.2548828125, -2.76806640625, -2.28125, -1.79443359375, -1.3076171875, -0.82080078125, -0.333984375, 0.15283203125, 0.6396484375, 1.12646484375, 1.61328125, 2.10009765625, 2.5869140625, 3.07373046875, 3.560546875, 4.04736328125, 4.5341796875, 5.02099609375, 5.5078125, 5.99462890625, 6.4814453125, 6.96826171875, 7.455078125, 7.94189453125, 8.4287109375, 8.91552734375, 9.40234375, 9.88916015625, 10.3759765625, 10.86279296875, 11.349609375, 11.83642578125, 12.3232421875, 12.81005859375, 13.296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 5.0, 14.0, 13.0, 18.0, 19.0, 20.0, 22.0, 25.0, 32.0, 30.0, 42.0, 50.0, 49.0, 48.0, 46.0, 45.0, 49.0, 43.0, 44.0, 54.0, 45.0, 38.0, 34.0, 43.0, 32.0, 14.0, 15.0, 21.0, 22.0, 6.0, 11.0, 7.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.47265625, -6.21771240234375, -5.9627685546875, -5.70782470703125, -5.452880859375, -5.19793701171875, -4.9429931640625, -4.68804931640625, -4.43310546875, -4.17816162109375, -3.9232177734375, -3.66827392578125, -3.413330078125, -3.15838623046875, -2.9034423828125, -2.64849853515625, -2.3935546875, -2.13861083984375, -1.8836669921875, -1.62872314453125, -1.373779296875, -1.11883544921875, -0.8638916015625, -0.60894775390625, -0.35400390625, -0.09906005859375, 0.1558837890625, 0.41082763671875, 0.665771484375, 0.92071533203125, 1.1756591796875, 1.43060302734375, 1.685546875, 1.94049072265625, 2.1954345703125, 2.45037841796875, 2.705322265625, 2.96026611328125, 3.2152099609375, 3.47015380859375, 3.72509765625, 3.98004150390625, 4.2349853515625, 4.48992919921875, 4.744873046875, 4.99981689453125, 5.2547607421875, 5.50970458984375, 5.7646484375, 6.01959228515625, 6.2745361328125, 6.52947998046875, 6.784423828125, 7.03936767578125, 7.2943115234375, 7.54925537109375, 7.80419921875, 8.05914306640625, 8.3140869140625, 8.56903076171875, 8.823974609375, 9.07891845703125, 9.3338623046875, 9.58880615234375, 9.84375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 13.0, 7.0, 13.0, 16.0, 38.0, 44.0, 52.0, 101.0, 145.0, 191.0, 246.0, 398.0, 534.0, 847.0, 1236.0, 1869.0, 2918.0, 4530.0, 6966.0, 11375.0, 18580.0, 31009.0, 52711.0, 87498.0, 134230.0, 176699.0, 174099.0, 130215.0, 83749.0, 50162.0, 29933.0, 17881.0, 10906.0, 6772.0, 4290.0, 2778.0, 1832.0, 1209.0, 776.0, 525.0, 350.0, 258.0, 184.0, 120.0, 65.0, 50.0, 40.0, 34.0, 21.0, 12.0, 12.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.81640625, -7.55548095703125, -7.2945556640625, -7.03363037109375, -6.772705078125, -6.51177978515625, -6.2508544921875, -5.98992919921875, -5.72900390625, -5.46807861328125, -5.2071533203125, -4.94622802734375, -4.685302734375, -4.42437744140625, -4.1634521484375, -3.90252685546875, -3.6416015625, -3.38067626953125, -3.1197509765625, -2.85882568359375, -2.597900390625, -2.33697509765625, -2.0760498046875, -1.81512451171875, -1.55419921875, -1.29327392578125, -1.0323486328125, -0.77142333984375, -0.510498046875, -0.24957275390625, 0.0113525390625, 0.27227783203125, 0.533203125, 0.79412841796875, 1.0550537109375, 1.31597900390625, 1.576904296875, 1.83782958984375, 2.0987548828125, 2.35968017578125, 2.62060546875, 2.88153076171875, 3.1424560546875, 3.40338134765625, 3.664306640625, 3.92523193359375, 4.1861572265625, 4.44708251953125, 4.7080078125, 4.96893310546875, 5.2298583984375, 5.49078369140625, 5.751708984375, 6.01263427734375, 6.2735595703125, 6.53448486328125, 6.79541015625, 7.05633544921875, 7.3172607421875, 7.57818603515625, 7.839111328125, 8.10003662109375, 8.3609619140625, 8.62188720703125, 8.8828125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 3.0, 6.0, 8.0, 13.0, 16.0, 16.0, 16.0, 22.0, 20.0, 28.0, 23.0, 31.0, 48.0, 47.0, 38.0, 43.0, 45.0, 46.0, 38.0, 51.0, 42.0, 42.0, 35.0, 37.0, 33.0, 33.0, 37.0, 24.0, 19.0, 20.0, 22.0, 16.0, 17.0, 20.0, 7.0, 10.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4765625, -4.335205078125, -4.19384765625, -4.052490234375, -3.9111328125, -3.769775390625, -3.62841796875, -3.487060546875, -3.345703125, -3.204345703125, -3.06298828125, -2.921630859375, -2.7802734375, -2.638916015625, -2.49755859375, -2.356201171875, -2.21484375, -2.073486328125, -1.93212890625, -1.790771484375, -1.6494140625, -1.508056640625, -1.36669921875, -1.225341796875, -1.083984375, -0.942626953125, -0.80126953125, -0.659912109375, -0.5185546875, -0.377197265625, -0.23583984375, -0.094482421875, 0.046875, 0.188232421875, 0.32958984375, 0.470947265625, 0.6123046875, 0.753662109375, 0.89501953125, 1.036376953125, 1.177734375, 1.319091796875, 1.46044921875, 1.601806640625, 1.7431640625, 1.884521484375, 2.02587890625, 2.167236328125, 2.30859375, 2.449951171875, 2.59130859375, 2.732666015625, 2.8740234375, 3.015380859375, 3.15673828125, 3.298095703125, 3.439453125, 3.580810546875, 3.72216796875, 3.863525390625, 4.0048828125, 4.146240234375, 4.28759765625, 4.428955078125, 4.5703125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 10.0, 9.0, 16.0, 18.0, 35.0, 44.0, 51.0, 73.0, 83.0, 114.0, 178.0, 261.0, 342.0, 515.0, 769.0, 1211.0, 1914.0, 3216.0, 5829.0, 11494.0, 24379.0, 58145.0, 153820.0, 338384.0, 265839.0, 103274.0, 40149.0, 17780.0, 8681.0, 4575.0, 2567.0, 1579.0, 985.0, 643.0, 445.0, 315.0, 234.0, 153.0, 126.0, 94.0, 51.0, 45.0, 36.0, 17.0, 16.0, 9.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-8.6015625, -8.322265625, -8.04296875, -7.763671875, -7.484375, -7.205078125, -6.92578125, -6.646484375, -6.3671875, -6.087890625, -5.80859375, -5.529296875, -5.25, -4.970703125, -4.69140625, -4.412109375, -4.1328125, -3.853515625, -3.57421875, -3.294921875, -3.015625, -2.736328125, -2.45703125, -2.177734375, -1.8984375, -1.619140625, -1.33984375, -1.060546875, -0.78125, -0.501953125, -0.22265625, 0.056640625, 0.3359375, 0.615234375, 0.89453125, 1.173828125, 1.453125, 1.732421875, 2.01171875, 2.291015625, 2.5703125, 2.849609375, 3.12890625, 3.408203125, 3.6875, 3.966796875, 4.24609375, 4.525390625, 4.8046875, 5.083984375, 5.36328125, 5.642578125, 5.921875, 6.201171875, 6.48046875, 6.759765625, 7.0390625, 7.318359375, 7.59765625, 7.876953125, 8.15625, 8.435546875, 8.71484375, 8.994140625, 9.2734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 7.0, 10.0, 27.0, 30.0, 40.0, 60.0, 80.0, 106.0, 134.0, 133.0, 126.0, 73.0, 54.0, 25.0, 27.0, 27.0, 12.0, 9.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005993843078613281, -0.0005640164017677307, -0.0005286484956741333, -0.0004932805895805359, -0.0004579126834869385, -0.00042254477739334106, -0.00038717687129974365, -0.00035180896520614624, -0.00031644105911254883, -0.0002810731530189514, -0.000245705246925354, -0.0002103373408317566, -0.00017496943473815918, -0.00013960152864456177, -0.00010423362255096436, -6.886571645736694e-05, -3.349781036376953e-05, 1.8700957298278809e-06, 3.723800182342529e-05, 7.26059079170227e-05, 0.00010797381401062012, 0.00014334172010421753, 0.00017870962619781494, 0.00021407753229141235, 0.00024944543838500977, 0.0002848133444786072, 0.0003201812505722046, 0.000355549156665802, 0.0003909170627593994, 0.0004262849688529968, 0.00046165287494659424, 0.0004970207810401917, 0.0005323886871337891, 0.0005677565932273865, 0.0006031244993209839, 0.0006384924054145813, 0.0006738603115081787, 0.0007092282176017761, 0.0007445961236953735, 0.000779964029788971, 0.0008153319358825684, 0.0008506998419761658, 0.0008860677480697632, 0.0009214356541633606, 0.000956803560256958, 0.0009921714663505554, 0.0010275393724441528, 0.0010629072785377502, 0.0010982751846313477, 0.001133643090724945, 0.0011690109968185425, 0.00120437890291214, 0.0012397468090057373, 0.0012751147150993347, 0.0013104826211929321, 0.0013458505272865295, 0.001381218433380127, 0.0014165863394737244, 0.0014519542455673218, 0.0014873221516609192, 0.0015226900577545166, 0.001558057963848114, 0.0015934258699417114, 0.0016287937760353088, 0.0016641616821289062]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 7.0, 10.0, 9.0, 12.0, 13.0, 25.0, 27.0, 58.0, 66.0, 71.0, 118.0, 132.0, 190.0, 328.0, 435.0, 548.0, 859.0, 1370.0, 2410.0, 4476.0, 9733.0, 27191.0, 96521.0, 359731.0, 385439.0, 107186.0, 29529.0, 10495.0, 4585.0, 2469.0, 1477.0, 944.0, 619.0, 398.0, 322.0, 182.0, 165.0, 136.0, 64.0, 48.0, 40.0, 29.0, 31.0, 19.0, 9.0, 8.0, 10.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.8203125, -11.4625244140625, -11.104736328125, -10.7469482421875, -10.38916015625, -10.0313720703125, -9.673583984375, -9.3157958984375, -8.9580078125, -8.6002197265625, -8.242431640625, -7.8846435546875, -7.52685546875, -7.1690673828125, -6.811279296875, -6.4534912109375, -6.095703125, -5.7379150390625, -5.380126953125, -5.0223388671875, -4.66455078125, -4.3067626953125, -3.948974609375, -3.5911865234375, -3.2333984375, -2.8756103515625, -2.517822265625, -2.1600341796875, -1.80224609375, -1.4444580078125, -1.086669921875, -0.7288818359375, -0.37109375, -0.0133056640625, 0.344482421875, 0.7022705078125, 1.06005859375, 1.4178466796875, 1.775634765625, 2.1334228515625, 2.4912109375, 2.8489990234375, 3.206787109375, 3.5645751953125, 3.92236328125, 4.2801513671875, 4.637939453125, 4.9957275390625, 5.353515625, 5.7113037109375, 6.069091796875, 6.4268798828125, 6.78466796875, 7.1424560546875, 7.500244140625, 7.8580322265625, 8.2158203125, 8.5736083984375, 8.931396484375, 9.2891845703125, 9.64697265625, 10.0047607421875, 10.362548828125, 10.7203369140625, 11.078125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 16.0, 14.0, 22.0, 40.0, 43.0, 77.0, 69.0, 88.0, 89.0, 93.0, 100.0, 65.0, 51.0, 53.0, 30.0, 31.0, 20.0, 14.0, 16.0, 7.0, 8.0, 8.0, 1.0, 0.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.109375, -2.045440673828125, -1.98150634765625, -1.917572021484375, -1.8536376953125, -1.789703369140625, -1.72576904296875, -1.661834716796875, -1.597900390625, -1.533966064453125, -1.47003173828125, -1.406097412109375, -1.3421630859375, -1.278228759765625, -1.21429443359375, -1.150360107421875, -1.08642578125, -1.022491455078125, -0.95855712890625, -0.894622802734375, -0.8306884765625, -0.766754150390625, -0.70281982421875, -0.638885498046875, -0.574951171875, -0.511016845703125, -0.44708251953125, -0.383148193359375, -0.3192138671875, -0.255279541015625, -0.19134521484375, -0.127410888671875, -0.0634765625, 0.000457763671875, 0.06439208984375, 0.128326416015625, 0.1922607421875, 0.256195068359375, 0.32012939453125, 0.384063720703125, 0.447998046875, 0.511932373046875, 0.57586669921875, 0.639801025390625, 0.7037353515625, 0.767669677734375, 0.83160400390625, 0.895538330078125, 0.95947265625, 1.023406982421875, 1.08734130859375, 1.151275634765625, 1.2152099609375, 1.279144287109375, 1.34307861328125, 1.407012939453125, 1.470947265625, 1.534881591796875, 1.59881591796875, 1.662750244140625, 1.7266845703125, 1.790618896484375, 1.85455322265625, 1.918487548828125, 1.982421875]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 6.0, 11.0, 7.0, 17.0, 22.0, 21.0, 31.0, 41.0, 61.0, 71.0, 72.0, 95.0, 100.0, 83.0, 83.0, 59.0, 59.0, 32.0, 31.0, 18.0, 14.0, 8.0, 6.0, 4.0, 3.0, 8.0, 7.0, 5.0, 2.0, 7.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.568994522094727, -17.1079158782959, -16.646839141845703, -16.185760498046875, -15.724681854248047, -15.263603210449219, -14.802525520324707, -14.341447830200195, -13.880369186401367, -13.419290542602539, -12.958212852478027, -12.497135162353516, -12.036056518554688, -11.57497787475586, -11.113900184631348, -10.652822494506836, -10.191743850708008, -9.73066520690918, -9.269587516784668, -8.808509826660156, -8.347431182861328, -7.886353015899658, -7.425274848937988, -6.964196681976318, -6.503118515014648, -6.0420403480529785, -5.580962181091309, -5.119884014129639, -4.658805847167969, -4.197727680206299, -3.736649513244629, -3.275571346282959, -2.8144941329956055, -2.3534159660339355, -1.8923377990722656, -1.4312596321105957, -0.9701814651489258, -0.5091032981872559, -0.04802513122558594, 0.413053035736084, 0.8741312026977539, 1.3352093696594238, 1.7962875366210938, 2.2573657035827637, 2.7184438705444336, 3.1795220375061035, 3.6406002044677734, 4.101678371429443, 4.562756538391113, 5.023834705352783, 5.484912872314453, 5.945991039276123, 6.407069206237793, 6.868147373199463, 7.329225540161133, 7.790303707122803, 8.251381874084473, 8.712459564208984, 9.173538208007812, 9.63461685180664, 10.095694541931152, 10.556772232055664, 11.017850875854492, 11.47892951965332, 11.940007209777832]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 4.0, 7.0, 8.0, 12.0, 14.0, 9.0, 15.0, 19.0, 13.0, 26.0, 30.0, 24.0, 22.0, 37.0, 37.0, 34.0, 34.0, 47.0, 42.0, 42.0, 51.0, 25.0, 40.0, 43.0, 38.0, 42.0, 34.0, 31.0, 25.0, 29.0, 26.0, 28.0, 14.0, 11.0, 19.0, 14.0, 13.0, 8.0, 8.0, 7.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.356032371520996, -6.140588760375977, -5.925145149230957, -5.7097015380859375, -5.494257926940918, -5.278814315795898, -5.063370227813721, -4.847926616668701, -4.632483005523682, -4.417039394378662, -4.201595783233643, -3.986151933670044, -3.7707083225250244, -3.555264711380005, -3.3398208618164062, -3.1243772506713867, -2.908933639526367, -2.6934900283813477, -2.478046417236328, -2.2626025676727295, -2.04715895652771, -1.8317153453826904, -1.6162716150283813, -1.4008278846740723, -1.1853842735290527, -0.9699406027793884, -0.7544969320297241, -0.5390532612800598, -0.3236095905303955, -0.10816597938537598, 0.1072777509689331, 0.3227214813232422, 0.5381655693054199, 0.7536092400550842, 0.9690529108047485, 1.1844966411590576, 1.3999402523040771, 1.6153838634490967, 1.8308275938034058, 2.046271324157715, 2.2617149353027344, 2.477158546447754, 2.6926021575927734, 2.908046007156372, 3.1234896183013916, 3.338933229446411, 3.5543770790100098, 3.7698206901550293, 3.985264301300049, 4.200707912445068, 4.416151523590088, 4.631595134735107, 4.847039222717285, 5.062482833862305, 5.277926445007324, 5.493370056152344, 5.708813667297363, 5.924257278442383, 6.139700889587402, 6.355144500732422, 6.570588111877441, 6.786031723022461, 7.001475811004639, 7.216919422149658, 7.432363033294678]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 7.0, 6.0, 11.0, 13.0, 28.0, 35.0, 45.0, 70.0, 95.0, 143.0, 191.0, 232.0, 366.0, 552.0, 837.0, 1153.0, 1767.0, 2827.0, 4471.0, 7926.0, 14437.0, 30283.0, 76994.0, 238904.0, 818973.0, 1646066.0, 922064.0, 267452.0, 85237.0, 33872.0, 16212.0, 8609.0, 5099.0, 3151.0, 2025.0, 1311.0, 940.0, 597.0, 357.0, 266.0, 203.0, 124.0, 104.0, 75.0, 48.0, 36.0, 31.0, 17.0, 10.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.3984375, -13.9112548828125, -13.424072265625, -12.9368896484375, -12.44970703125, -11.9625244140625, -11.475341796875, -10.9881591796875, -10.5009765625, -10.0137939453125, -9.526611328125, -9.0394287109375, -8.55224609375, -8.0650634765625, -7.577880859375, -7.0906982421875, -6.603515625, -6.1163330078125, -5.629150390625, -5.1419677734375, -4.65478515625, -4.1676025390625, -3.680419921875, -3.1932373046875, -2.7060546875, -2.2188720703125, -1.731689453125, -1.2445068359375, -0.75732421875, -0.2701416015625, 0.217041015625, 0.7042236328125, 1.19140625, 1.6785888671875, 2.165771484375, 2.6529541015625, 3.14013671875, 3.6273193359375, 4.114501953125, 4.6016845703125, 5.0888671875, 5.5760498046875, 6.063232421875, 6.5504150390625, 7.03759765625, 7.5247802734375, 8.011962890625, 8.4991455078125, 8.986328125, 9.4735107421875, 9.960693359375, 10.4478759765625, 10.93505859375, 11.4222412109375, 11.909423828125, 12.3966064453125, 12.8837890625, 13.3709716796875, 13.858154296875, 14.3453369140625, 14.83251953125, 15.3197021484375, 15.806884765625, 16.2940673828125, 16.78125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 5.0, 4.0, 3.0, 5.0, 10.0, 10.0, 12.0, 10.0, 14.0, 18.0, 24.0, 28.0, 20.0, 20.0, 21.0, 32.0, 37.0, 43.0, 37.0, 50.0, 36.0, 40.0, 51.0, 37.0, 39.0, 50.0, 32.0, 35.0, 45.0, 31.0, 20.0, 34.0, 25.0, 18.0, 17.0, 14.0, 14.0, 19.0, 11.0, 10.0, 5.0, 8.0, 4.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.33203125, -5.16217041015625, -4.9923095703125, -4.82244873046875, -4.652587890625, -4.48272705078125, -4.3128662109375, -4.14300537109375, -3.97314453125, -3.80328369140625, -3.6334228515625, -3.46356201171875, -3.293701171875, -3.12384033203125, -2.9539794921875, -2.78411865234375, -2.6142578125, -2.44439697265625, -2.2745361328125, -2.10467529296875, -1.934814453125, -1.76495361328125, -1.5950927734375, -1.42523193359375, -1.25537109375, -1.08551025390625, -0.9156494140625, -0.74578857421875, -0.575927734375, -0.40606689453125, -0.2362060546875, -0.06634521484375, 0.103515625, 0.27337646484375, 0.4432373046875, 0.61309814453125, 0.782958984375, 0.95281982421875, 1.1226806640625, 1.29254150390625, 1.46240234375, 1.63226318359375, 1.8021240234375, 1.97198486328125, 2.141845703125, 2.31170654296875, 2.4815673828125, 2.65142822265625, 2.8212890625, 2.99114990234375, 3.1610107421875, 3.33087158203125, 3.500732421875, 3.67059326171875, 3.8404541015625, 4.01031494140625, 4.18017578125, 4.35003662109375, 4.5198974609375, 4.68975830078125, 4.859619140625, 5.02947998046875, 5.1993408203125, 5.36920166015625, 5.5390625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 4.0, 6.0, 9.0, 13.0, 17.0, 26.0, 38.0, 57.0, 78.0, 117.0, 186.0, 292.0, 388.0, 537.0, 794.0, 1145.0, 1669.0, 2507.0, 3722.0, 5647.0, 8855.0, 13888.0, 23814.0, 42211.0, 80304.0, 165807.0, 368606.0, 783440.0, 1133589.0, 806814.0, 383455.0, 173822.0, 83359.0, 43570.0, 24479.0, 14548.0, 8907.0, 5788.0, 3878.0, 2553.0, 1695.0, 1147.0, 767.0, 536.0, 365.0, 261.0, 163.0, 130.0, 99.0, 57.0, 47.0, 34.0, 15.0, 13.0, 11.0, 6.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0], "bins": [-11.3203125, -10.949462890625, -10.57861328125, -10.207763671875, -9.8369140625, -9.466064453125, -9.09521484375, -8.724365234375, -8.353515625, -7.982666015625, -7.61181640625, -7.240966796875, -6.8701171875, -6.499267578125, -6.12841796875, -5.757568359375, -5.38671875, -5.015869140625, -4.64501953125, -4.274169921875, -3.9033203125, -3.532470703125, -3.16162109375, -2.790771484375, -2.419921875, -2.049072265625, -1.67822265625, -1.307373046875, -0.9365234375, -0.565673828125, -0.19482421875, 0.176025390625, 0.546875, 0.917724609375, 1.28857421875, 1.659423828125, 2.0302734375, 2.401123046875, 2.77197265625, 3.142822265625, 3.513671875, 3.884521484375, 4.25537109375, 4.626220703125, 4.9970703125, 5.367919921875, 5.73876953125, 6.109619140625, 6.48046875, 6.851318359375, 7.22216796875, 7.593017578125, 7.9638671875, 8.334716796875, 8.70556640625, 9.076416015625, 9.447265625, 9.818115234375, 10.18896484375, 10.559814453125, 10.9306640625, 11.301513671875, 11.67236328125, 12.043212890625, 12.4140625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 5.0, 7.0, 16.0, 13.0, 18.0, 26.0, 35.0, 35.0, 51.0, 60.0, 79.0, 101.0, 117.0, 175.0, 254.0, 257.0, 315.0, 337.0, 357.0, 308.0, 250.0, 268.0, 244.0, 157.0, 152.0, 100.0, 76.0, 61.0, 48.0, 30.0, 30.0, 18.0, 19.0, 17.0, 6.0, 11.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.11328125, -3.991424560546875, -3.86956787109375, -3.747711181640625, -3.6258544921875, -3.503997802734375, -3.38214111328125, -3.260284423828125, -3.138427734375, -3.016571044921875, -2.89471435546875, -2.772857666015625, -2.6510009765625, -2.529144287109375, -2.40728759765625, -2.285430908203125, -2.16357421875, -2.041717529296875, -1.91986083984375, -1.798004150390625, -1.6761474609375, -1.554290771484375, -1.43243408203125, -1.310577392578125, -1.188720703125, -1.066864013671875, -0.94500732421875, -0.823150634765625, -0.7012939453125, -0.579437255859375, -0.45758056640625, -0.335723876953125, -0.2138671875, -0.092010498046875, 0.02984619140625, 0.151702880859375, 0.2735595703125, 0.395416259765625, 0.51727294921875, 0.639129638671875, 0.760986328125, 0.882843017578125, 1.00469970703125, 1.126556396484375, 1.2484130859375, 1.370269775390625, 1.49212646484375, 1.613983154296875, 1.73583984375, 1.857696533203125, 1.97955322265625, 2.101409912109375, 2.2232666015625, 2.345123291015625, 2.46697998046875, 2.588836669921875, 2.710693359375, 2.832550048828125, 2.95440673828125, 3.076263427734375, 3.1981201171875, 3.319976806640625, 3.44183349609375, 3.563690185546875, 3.685546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 9.0, 11.0, 24.0, 29.0, 34.0, 47.0, 58.0, 69.0, 93.0, 83.0, 111.0, 75.0, 77.0, 60.0, 48.0, 33.0, 21.0, 20.0, 18.0, 7.0, 7.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.337761878967285, -11.842564582824707, -11.347367286682129, -10.85216999053955, -10.356972694396973, -9.861775398254395, -9.3665771484375, -8.871379852294922, -8.376182556152344, -7.880985260009766, -7.3857879638671875, -6.890590667724609, -6.395393371582031, -5.900196075439453, -5.404998302459717, -4.909801006317139, -4.414604187011719, -3.9194068908691406, -3.4242095947265625, -2.9290120601654053, -2.433814764022827, -1.938617467880249, -1.4434199333190918, -0.9482226371765137, -0.45302534103393555, 0.042172014713287354, 0.5373693704605103, 1.032566785812378, 1.527764081954956, 2.022961378097534, 2.5181589126586914, 3.0133562088012695, 3.5085525512695312, 4.003749847412109, 4.4989471435546875, 4.994144439697266, 5.489341735839844, 5.984539031982422, 6.479736804962158, 6.974934101104736, 7.4701313972473145, 7.965328693389893, 8.460526466369629, 8.955723762512207, 9.450921058654785, 9.946118354797363, 10.441315650939941, 10.93651294708252, 11.431710243225098, 11.926907539367676, 12.422104835510254, 12.917302131652832, 13.41249942779541, 13.907696723937988, 14.402894973754883, 14.898092269897461, 15.393289566040039, 15.888486862182617, 16.383684158325195, 16.878881454467773, 17.37407875061035, 17.86927604675293, 18.364473342895508, 18.859670639038086, 19.354867935180664]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 11.0, 8.0, 9.0, 10.0, 13.0, 13.0, 18.0, 12.0, 25.0, 20.0, 22.0, 29.0, 33.0, 31.0, 23.0, 34.0, 37.0, 40.0, 48.0, 39.0, 29.0, 39.0, 41.0, 45.0, 38.0, 31.0, 35.0, 26.0, 36.0, 31.0, 27.0, 25.0, 21.0, 21.0, 15.0, 11.0, 6.0, 11.0, 7.0, 7.0, 4.0, 3.0, 5.0, 3.0, 4.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.325138568878174, -7.107594966888428, -6.89005184173584, -6.672508239746094, -6.454965114593506, -6.23742151260376, -6.019878387451172, -5.802334785461426, -5.58479118347168, -5.367247581481934, -5.149704456329346, -4.9321608543396, -4.714617729187012, -4.497074127197266, -4.2795305252075195, -4.061987400054932, -3.8444442749023438, -3.6269009113311768, -3.4093575477600098, -3.1918139457702637, -2.974270820617676, -2.7567272186279297, -2.5391838550567627, -2.3216404914855957, -2.1040971279144287, -1.8865537643432617, -1.6690104007720947, -1.4514669179916382, -1.2339235544204712, -1.0163801908493042, -0.7988367080688477, -0.5812933444976807, -0.3637504577636719, -0.1462070643901825, 0.07133632898330688, 0.28887975215911865, 0.5064231157302856, 0.7239664793014526, 0.9415099620819092, 1.1590533256530762, 1.3765966892242432, 1.5941400527954102, 1.8116834163665771, 2.029226779937744, 2.2467703819274902, 2.464313507080078, 2.681857109069824, 2.899400472640991, 3.116943836212158, 3.334487199783325, 3.552030563354492, 3.7695741653442383, 3.987117290496826, 4.204660892486572, 4.42220401763916, 4.639747619628906, 4.857291221618652, 5.074834823608398, 5.292377948760986, 5.509921550750732, 5.72746467590332, 5.945008277893066, 6.1625518798828125, 6.3800950050354, 6.597638130187988]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 10.0, 14.0, 15.0, 21.0, 30.0, 49.0, 65.0, 89.0, 137.0, 223.0, 346.0, 476.0, 756.0, 1170.0, 1992.0, 3540.0, 6200.0, 11504.0, 23589.0, 48340.0, 102757.0, 200967.0, 269399.0, 189706.0, 95300.0, 44866.0, 21579.0, 11053.0, 5980.0, 3262.0, 1935.0, 1181.0, 700.0, 413.0, 250.0, 205.0, 111.0, 104.0, 67.0, 39.0, 34.0, 23.0, 17.0, 10.0, 10.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.59765625, -5.413818359375, -5.22998046875, -5.046142578125, -4.8623046875, -4.678466796875, -4.49462890625, -4.310791015625, -4.126953125, -3.943115234375, -3.75927734375, -3.575439453125, -3.3916015625, -3.207763671875, -3.02392578125, -2.840087890625, -2.65625, -2.472412109375, -2.28857421875, -2.104736328125, -1.9208984375, -1.737060546875, -1.55322265625, -1.369384765625, -1.185546875, -1.001708984375, -0.81787109375, -0.634033203125, -0.4501953125, -0.266357421875, -0.08251953125, 0.101318359375, 0.28515625, 0.468994140625, 0.65283203125, 0.836669921875, 1.0205078125, 1.204345703125, 1.38818359375, 1.572021484375, 1.755859375, 1.939697265625, 2.12353515625, 2.307373046875, 2.4912109375, 2.675048828125, 2.85888671875, 3.042724609375, 3.2265625, 3.410400390625, 3.59423828125, 3.778076171875, 3.9619140625, 4.145751953125, 4.32958984375, 4.513427734375, 4.697265625, 4.881103515625, 5.06494140625, 5.248779296875, 5.4326171875, 5.616455078125, 5.80029296875, 5.984130859375, 6.16796875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 7.0, 9.0, 9.0, 12.0, 13.0, 11.0, 17.0, 22.0, 22.0, 20.0, 15.0, 34.0, 24.0, 31.0, 34.0, 39.0, 34.0, 32.0, 31.0, 47.0, 29.0, 37.0, 33.0, 39.0, 40.0, 35.0, 50.0, 34.0, 25.0, 27.0, 24.0, 22.0, 25.0, 16.0, 11.0, 18.0, 11.0, 8.0, 7.0, 10.0, 4.0, 4.0, 6.0, 1.0, 6.0, 2.0, 3.0, 3.0, 3.0], "bins": [-8.046875, -7.8193359375, -7.591796875, -7.3642578125, -7.13671875, -6.9091796875, -6.681640625, -6.4541015625, -6.2265625, -5.9990234375, -5.771484375, -5.5439453125, -5.31640625, -5.0888671875, -4.861328125, -4.6337890625, -4.40625, -4.1787109375, -3.951171875, -3.7236328125, -3.49609375, -3.2685546875, -3.041015625, -2.8134765625, -2.5859375, -2.3583984375, -2.130859375, -1.9033203125, -1.67578125, -1.4482421875, -1.220703125, -0.9931640625, -0.765625, -0.5380859375, -0.310546875, -0.0830078125, 0.14453125, 0.3720703125, 0.599609375, 0.8271484375, 1.0546875, 1.2822265625, 1.509765625, 1.7373046875, 1.96484375, 2.1923828125, 2.419921875, 2.6474609375, 2.875, 3.1025390625, 3.330078125, 3.5576171875, 3.78515625, 4.0126953125, 4.240234375, 4.4677734375, 4.6953125, 4.9228515625, 5.150390625, 5.3779296875, 5.60546875, 5.8330078125, 6.060546875, 6.2880859375, 6.515625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 9.0, 4.0, 14.0, 16.0, 22.0, 23.0, 29.0, 56.0, 62.0, 94.0, 116.0, 176.0, 271.0, 437.0, 659.0, 1182.0, 2117.0, 4111.0, 8571.0, 19977.0, 53458.0, 162739.0, 391602.0, 261443.0, 86192.0, 30653.0, 12241.0, 5484.0, 2765.0, 1523.0, 905.0, 486.0, 348.0, 236.0, 146.0, 109.0, 72.0, 56.0, 41.0, 24.0, 24.0, 13.0, 12.0, 9.0, 11.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.7901611328125, -8.494384765625, -8.1986083984375, -7.90283203125, -7.6070556640625, -7.311279296875, -7.0155029296875, -6.7197265625, -6.4239501953125, -6.128173828125, -5.8323974609375, -5.53662109375, -5.2408447265625, -4.945068359375, -4.6492919921875, -4.353515625, -4.0577392578125, -3.761962890625, -3.4661865234375, -3.17041015625, -2.8746337890625, -2.578857421875, -2.2830810546875, -1.9873046875, -1.6915283203125, -1.395751953125, -1.0999755859375, -0.80419921875, -0.5084228515625, -0.212646484375, 0.0831298828125, 0.37890625, 0.6746826171875, 0.970458984375, 1.2662353515625, 1.56201171875, 1.8577880859375, 2.153564453125, 2.4493408203125, 2.7451171875, 3.0408935546875, 3.336669921875, 3.6324462890625, 3.92822265625, 4.2239990234375, 4.519775390625, 4.8155517578125, 5.111328125, 5.4071044921875, 5.702880859375, 5.9986572265625, 6.29443359375, 6.5902099609375, 6.885986328125, 7.1817626953125, 7.4775390625, 7.7733154296875, 8.069091796875, 8.3648681640625, 8.66064453125, 8.9564208984375, 9.252197265625, 9.5479736328125, 9.84375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 13.0, 13.0, 8.0, 16.0, 18.0, 15.0, 16.0, 30.0, 34.0, 31.0, 33.0, 35.0, 44.0, 46.0, 61.0, 34.0, 53.0, 38.0, 53.0, 46.0, 34.0, 36.0, 33.0, 33.0, 32.0, 27.0, 25.0, 19.0, 24.0, 22.0, 14.0, 9.0, 12.0, 8.0, 2.0, 7.0, 2.0, 4.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4765625, -4.32147216796875, -4.1663818359375, -4.01129150390625, -3.856201171875, -3.70111083984375, -3.5460205078125, -3.39093017578125, -3.23583984375, -3.08074951171875, -2.9256591796875, -2.77056884765625, -2.615478515625, -2.46038818359375, -2.3052978515625, -2.15020751953125, -1.9951171875, -1.84002685546875, -1.6849365234375, -1.52984619140625, -1.374755859375, -1.21966552734375, -1.0645751953125, -0.90948486328125, -0.75439453125, -0.59930419921875, -0.4442138671875, -0.28912353515625, -0.134033203125, 0.02105712890625, 0.1761474609375, 0.33123779296875, 0.486328125, 0.64141845703125, 0.7965087890625, 0.95159912109375, 1.106689453125, 1.26177978515625, 1.4168701171875, 1.57196044921875, 1.72705078125, 1.88214111328125, 2.0372314453125, 2.19232177734375, 2.347412109375, 2.50250244140625, 2.6575927734375, 2.81268310546875, 2.9677734375, 3.12286376953125, 3.2779541015625, 3.43304443359375, 3.588134765625, 3.74322509765625, 3.8983154296875, 4.05340576171875, 4.20849609375, 4.36358642578125, 4.5186767578125, 4.67376708984375, 4.828857421875, 4.98394775390625, 5.1390380859375, 5.29412841796875, 5.44921875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 16.0, 32.0, 39.0, 48.0, 80.0, 109.0, 210.0, 304.0, 469.0, 728.0, 1270.0, 2039.0, 3728.0, 6515.0, 12807.0, 26260.0, 58624.0, 141844.0, 299858.0, 273765.0, 121231.0, 50602.0, 22876.0, 11092.0, 5891.0, 3202.0, 1830.0, 1099.0, 721.0, 451.0, 286.0, 182.0, 124.0, 78.0, 37.0, 30.0, 22.0, 13.0, 6.0, 7.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.037384033203125, -2.94781494140625, -2.858245849609375, -2.7686767578125, -2.679107666015625, -2.58953857421875, -2.499969482421875, -2.410400390625, -2.320831298828125, -2.23126220703125, -2.141693115234375, -2.0521240234375, -1.962554931640625, -1.87298583984375, -1.783416748046875, -1.69384765625, -1.604278564453125, -1.51470947265625, -1.425140380859375, -1.3355712890625, -1.246002197265625, -1.15643310546875, -1.066864013671875, -0.977294921875, -0.887725830078125, -0.79815673828125, -0.708587646484375, -0.6190185546875, -0.529449462890625, -0.43988037109375, -0.350311279296875, -0.2607421875, -0.171173095703125, -0.08160400390625, 0.007965087890625, 0.0975341796875, 0.187103271484375, 0.27667236328125, 0.366241455078125, 0.455810546875, 0.545379638671875, 0.63494873046875, 0.724517822265625, 0.8140869140625, 0.903656005859375, 0.99322509765625, 1.082794189453125, 1.17236328125, 1.261932373046875, 1.35150146484375, 1.441070556640625, 1.5306396484375, 1.620208740234375, 1.70977783203125, 1.799346923828125, 1.888916015625, 1.978485107421875, 2.06805419921875, 2.157623291015625, 2.2471923828125, 2.336761474609375, 2.42633056640625, 2.515899658203125, 2.60546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 0.0, 6.0, 4.0, 13.0, 7.0, 25.0, 38.0, 77.0, 92.0, 139.0, 143.0, 130.0, 112.0, 68.0, 40.0, 31.0, 12.0, 14.0, 15.0, 11.0, 6.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002231597900390625, -0.0002144351601600647, -0.0002057105302810669, -0.0001969859004020691, -0.0001882612705230713, -0.00017953664064407349, -0.00017081201076507568, -0.00016208738088607788, -0.00015336275100708008, -0.00014463812112808228, -0.00013591349124908447, -0.00012718886137008667, -0.00011846423149108887, -0.00010973960161209106, -0.00010101497173309326, -9.229034185409546e-05, -8.356571197509766e-05, -7.484108209609985e-05, -6.611645221710205e-05, -5.739182233810425e-05, -4.8667192459106445e-05, -3.994256258010864e-05, -3.121793270111084e-05, -2.2493302822113037e-05, -1.3768672943115234e-05, -5.044043064117432e-06, 3.680586814880371e-06, 1.2405216693878174e-05, 2.1129846572875977e-05, 2.985447645187378e-05, 3.857910633087158e-05, 4.7303736209869385e-05, 5.602836608886719e-05, 6.475299596786499e-05, 7.347762584686279e-05, 8.22022557258606e-05, 9.09268856048584e-05, 9.96515154838562e-05, 0.000108376145362854, 0.0001171007752418518, 0.0001258254051208496, 0.0001345500349998474, 0.00014327466487884521, 0.00015199929475784302, 0.00016072392463684082, 0.00016944855451583862, 0.00017817318439483643, 0.00018689781427383423, 0.00019562244415283203, 0.00020434707403182983, 0.00021307170391082764, 0.00022179633378982544, 0.00023052096366882324, 0.00023924559354782104, 0.00024797022342681885, 0.00025669485330581665, 0.00026541948318481445, 0.00027414411306381226, 0.00028286874294281006, 0.00029159337282180786, 0.00030031800270080566, 0.00030904263257980347, 0.00031776726245880127, 0.00032649189233779907, 0.0003352165222167969]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 8.0, 8.0, 7.0, 16.0, 19.0, 21.0, 34.0, 49.0, 49.0, 93.0, 156.0, 203.0, 281.0, 405.0, 582.0, 868.0, 1271.0, 1982.0, 2995.0, 4643.0, 7778.0, 13684.0, 24056.0, 43770.0, 82959.0, 151859.0, 224579.0, 205959.0, 126473.0, 67746.0, 35906.0, 20039.0, 11276.0, 6732.0, 4094.0, 2728.0, 1700.0, 1113.0, 690.0, 513.0, 364.0, 250.0, 161.0, 142.0, 78.0, 58.0, 44.0, 41.0, 31.0, 12.0, 16.0, 5.0, 9.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.078125, -2.00848388671875, -1.9388427734375, -1.86920166015625, -1.799560546875, -1.72991943359375, -1.6602783203125, -1.59063720703125, -1.52099609375, -1.45135498046875, -1.3817138671875, -1.31207275390625, -1.242431640625, -1.17279052734375, -1.1031494140625, -1.03350830078125, -0.9638671875, -0.89422607421875, -0.8245849609375, -0.75494384765625, -0.685302734375, -0.61566162109375, -0.5460205078125, -0.47637939453125, -0.40673828125, -0.33709716796875, -0.2674560546875, -0.19781494140625, -0.128173828125, -0.05853271484375, 0.0111083984375, 0.08074951171875, 0.150390625, 0.22003173828125, 0.2896728515625, 0.35931396484375, 0.428955078125, 0.49859619140625, 0.5682373046875, 0.63787841796875, 0.70751953125, 0.77716064453125, 0.8468017578125, 0.91644287109375, 0.986083984375, 1.05572509765625, 1.1253662109375, 1.19500732421875, 1.2646484375, 1.33428955078125, 1.4039306640625, 1.47357177734375, 1.543212890625, 1.61285400390625, 1.6824951171875, 1.75213623046875, 1.82177734375, 1.89141845703125, 1.9610595703125, 2.03070068359375, 2.100341796875, 2.16998291015625, 2.2396240234375, 2.30926513671875, 2.37890625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 10.0, 10.0, 13.0, 20.0, 14.0, 22.0, 18.0, 22.0, 34.0, 44.0, 56.0, 56.0, 73.0, 78.0, 78.0, 79.0, 79.0, 65.0, 44.0, 39.0, 34.0, 26.0, 21.0, 15.0, 9.0, 9.0, 6.0, 5.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.669921875, -0.6461105346679688, -0.6222991943359375, -0.5984878540039062, -0.574676513671875, -0.5508651733398438, -0.5270538330078125, -0.5032424926757812, -0.47943115234375, -0.45561981201171875, -0.4318084716796875, -0.40799713134765625, -0.384185791015625, -0.36037445068359375, -0.3365631103515625, -0.31275177001953125, -0.2889404296875, -0.26512908935546875, -0.2413177490234375, -0.21750640869140625, -0.193695068359375, -0.16988372802734375, -0.1460723876953125, -0.12226104736328125, -0.09844970703125, -0.07463836669921875, -0.0508270263671875, -0.02701568603515625, -0.003204345703125, 0.02060699462890625, 0.0444183349609375, 0.06822967529296875, 0.092041015625, 0.11585235595703125, 0.1396636962890625, 0.16347503662109375, 0.187286376953125, 0.21109771728515625, 0.2349090576171875, 0.25872039794921875, 0.28253173828125, 0.30634307861328125, 0.3301544189453125, 0.35396575927734375, 0.377777099609375, 0.40158843994140625, 0.4253997802734375, 0.44921112060546875, 0.4730224609375, 0.49683380126953125, 0.5206451416015625, 0.5444564819335938, 0.568267822265625, 0.5920791625976562, 0.6158905029296875, 0.6397018432617188, 0.66351318359375, 0.6873245239257812, 0.7111358642578125, 0.7349472045898438, 0.758758544921875, 0.7825698852539062, 0.8063812255859375, 0.8301925659179688, 0.85400390625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 5.0, 10.0, 6.0, 11.0, 14.0, 20.0, 29.0, 33.0, 40.0, 50.0, 64.0, 87.0, 82.0, 107.0, 88.0, 67.0, 64.0, 51.0, 43.0, 22.0, 20.0, 21.0, 10.0, 8.0, 8.0, 8.0, 12.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.04301643371582, -12.565839767456055, -12.088663101196289, -11.611486434936523, -11.134309768676758, -10.657133102416992, -10.179956436157227, -9.702778816223145, -9.225602149963379, -8.748425483703613, -8.271248817443848, -7.794072151184082, -7.316895008087158, -6.839718341827393, -6.362541675567627, -5.885364532470703, -5.408188343048096, -4.93101167678833, -4.4538350105285645, -3.9766581058502197, -3.499481201171875, -3.0223045349121094, -2.5451278686523438, -2.067950963973999, -1.5907742977142334, -1.1135975122451782, -0.6364207863807678, -0.15924406051635742, 0.31793272495269775, 0.7951095104217529, 1.2722861766815186, 1.7494630813598633, 2.226639747619629, 2.7038164138793945, 3.1809933185577393, 3.658169984817505, 4.13534688949585, 4.612523555755615, 5.089700222015381, 5.566877365112305, 6.04405403137207, 6.521230697631836, 6.998407363891602, 7.475584030151367, 7.952761173248291, 8.429937362670898, 8.907114028930664, 9.384291648864746, 9.861467361450195, 10.338644027709961, 10.815820693969727, 11.292997360229492, 11.770174026489258, 12.247350692749023, 12.724527359008789, 13.201704978942871, 13.678881645202637, 14.156058311462402, 14.633234977722168, 15.110411643981934, 15.5875883102417, 16.06476593017578, 16.541942596435547, 17.019119262695312, 17.496295928955078]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 10.0, 8.0, 8.0, 7.0, 17.0, 12.0, 15.0, 17.0, 19.0, 25.0, 19.0, 29.0, 37.0, 27.0, 26.0, 29.0, 45.0, 33.0, 44.0, 46.0, 33.0, 36.0, 44.0, 43.0, 43.0, 35.0, 23.0, 35.0, 28.0, 29.0, 31.0, 31.0, 25.0, 15.0, 14.0, 11.0, 5.0, 12.0, 5.0, 7.0, 3.0, 2.0, 8.0, 2.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.166965484619141, -6.947599411010742, -6.728233337402344, -6.508867263793945, -6.289501190185547, -6.070135116577148, -5.85076904296875, -5.631402969360352, -5.412036895751953, -5.192670822143555, -4.973304748535156, -4.753938674926758, -4.534572601318359, -4.315206527709961, -4.0958404541015625, -3.876474618911743, -3.657108783721924, -3.4377427101135254, -3.218376636505127, -2.9990105628967285, -2.77964448928833, -2.5602784156799316, -2.3409125804901123, -2.121546506881714, -1.9021804332733154, -1.682814359664917, -1.4634482860565186, -1.2440823316574097, -1.0247162580490112, -0.8053501844406128, -0.5859842300415039, -0.36661815643310547, -0.14725255966186523, 0.07211348414421082, 0.29147952795028687, 0.5108455419540405, 0.730211615562439, 0.9495776891708374, 1.1689436435699463, 1.3883097171783447, 1.6076757907867432, 1.8270418643951416, 2.04640793800354, 2.2657737731933594, 2.485139846801758, 2.7045059204101562, 2.9238719940185547, 3.143238067626953, 3.3626041412353516, 3.58197021484375, 3.8013362884521484, 4.020702362060547, 4.240068435668945, 4.459434509277344, 4.678800582885742, 4.898166656494141, 5.117532730102539, 5.3368988037109375, 5.556264877319336, 5.775630950927734, 5.994997024536133, 6.214363098144531, 6.43372917175293, 6.653095245361328, 6.872460842132568]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 6.0, 13.0, 17.0, 22.0, 37.0, 52.0, 67.0, 130.0, 166.0, 302.0, 396.0, 604.0, 929.0, 1500.0, 2328.0, 3647.0, 5674.0, 9153.0, 14856.0, 24964.0, 42198.0, 70673.0, 112718.0, 158122.0, 177387.0, 152491.0, 105922.0, 65256.0, 38650.0, 22903.0, 13878.0, 8547.0, 5293.0, 3365.0, 2163.0, 1440.0, 937.0, 628.0, 399.0, 253.0, 156.0, 94.0, 70.0, 56.0, 31.0, 17.0, 16.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0], "bins": [-8.2109375, -7.972412109375, -7.73388671875, -7.495361328125, -7.2568359375, -7.018310546875, -6.77978515625, -6.541259765625, -6.302734375, -6.064208984375, -5.82568359375, -5.587158203125, -5.3486328125, -5.110107421875, -4.87158203125, -4.633056640625, -4.39453125, -4.156005859375, -3.91748046875, -3.678955078125, -3.4404296875, -3.201904296875, -2.96337890625, -2.724853515625, -2.486328125, -2.247802734375, -2.00927734375, -1.770751953125, -1.5322265625, -1.293701171875, -1.05517578125, -0.816650390625, -0.578125, -0.339599609375, -0.10107421875, 0.137451171875, 0.3759765625, 0.614501953125, 0.85302734375, 1.091552734375, 1.330078125, 1.568603515625, 1.80712890625, 2.045654296875, 2.2841796875, 2.522705078125, 2.76123046875, 2.999755859375, 3.23828125, 3.476806640625, 3.71533203125, 3.953857421875, 4.1923828125, 4.430908203125, 4.66943359375, 4.907958984375, 5.146484375, 5.385009765625, 5.62353515625, 5.862060546875, 6.1005859375, 6.339111328125, 6.57763671875, 6.816162109375, 7.0546875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 4.0, 9.0, 14.0, 10.0, 14.0, 16.0, 18.0, 19.0, 22.0, 24.0, 24.0, 31.0, 29.0, 35.0, 36.0, 36.0, 42.0, 43.0, 44.0, 43.0, 36.0, 37.0, 54.0, 38.0, 28.0, 27.0, 36.0, 35.0, 38.0, 23.0, 25.0, 21.0, 16.0, 11.0, 11.0, 7.0, 6.0, 7.0, 10.0, 2.0, 2.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.50390625, -7.26513671875, -7.0263671875, -6.78759765625, -6.548828125, -6.31005859375, -6.0712890625, -5.83251953125, -5.59375, -5.35498046875, -5.1162109375, -4.87744140625, -4.638671875, -4.39990234375, -4.1611328125, -3.92236328125, -3.68359375, -3.44482421875, -3.2060546875, -2.96728515625, -2.728515625, -2.48974609375, -2.2509765625, -2.01220703125, -1.7734375, -1.53466796875, -1.2958984375, -1.05712890625, -0.818359375, -0.57958984375, -0.3408203125, -0.10205078125, 0.13671875, 0.37548828125, 0.6142578125, 0.85302734375, 1.091796875, 1.33056640625, 1.5693359375, 1.80810546875, 2.046875, 2.28564453125, 2.5244140625, 2.76318359375, 3.001953125, 3.24072265625, 3.4794921875, 3.71826171875, 3.95703125, 4.19580078125, 4.4345703125, 4.67333984375, 4.912109375, 5.15087890625, 5.3896484375, 5.62841796875, 5.8671875, 6.10595703125, 6.3447265625, 6.58349609375, 6.822265625, 7.06103515625, 7.2998046875, 7.53857421875, 7.77734375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 10.0, 7.0, 6.0, 12.0, 14.0, 22.0, 53.0, 68.0, 86.0, 122.0, 193.0, 313.0, 436.0, 640.0, 975.0, 1481.0, 2269.0, 3398.0, 5251.0, 7976.0, 12539.0, 19412.0, 30493.0, 46615.0, 69563.0, 98329.0, 127017.0, 141299.0, 134556.0, 109491.0, 79912.0, 54763.0, 35909.0, 22964.0, 14646.0, 9716.0, 6079.0, 4021.0, 2602.0, 1790.0, 1187.0, 755.0, 516.0, 368.0, 229.0, 145.0, 101.0, 70.0, 57.0, 37.0, 21.0, 15.0, 6.0, 10.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5, -5.31475830078125, -5.1295166015625, -4.94427490234375, -4.759033203125, -4.57379150390625, -4.3885498046875, -4.20330810546875, -4.01806640625, -3.83282470703125, -3.6475830078125, -3.46234130859375, -3.277099609375, -3.09185791015625, -2.9066162109375, -2.72137451171875, -2.5361328125, -2.35089111328125, -2.1656494140625, -1.98040771484375, -1.795166015625, -1.60992431640625, -1.4246826171875, -1.23944091796875, -1.05419921875, -0.86895751953125, -0.6837158203125, -0.49847412109375, -0.313232421875, -0.12799072265625, 0.0572509765625, 0.24249267578125, 0.427734375, 0.61297607421875, 0.7982177734375, 0.98345947265625, 1.168701171875, 1.35394287109375, 1.5391845703125, 1.72442626953125, 1.90966796875, 2.09490966796875, 2.2801513671875, 2.46539306640625, 2.650634765625, 2.83587646484375, 3.0211181640625, 3.20635986328125, 3.3916015625, 3.57684326171875, 3.7620849609375, 3.94732666015625, 4.132568359375, 4.31781005859375, 4.5030517578125, 4.68829345703125, 4.87353515625, 5.05877685546875, 5.2440185546875, 5.42926025390625, 5.614501953125, 5.79974365234375, 5.9849853515625, 6.17022705078125, 6.35546875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 9.0, 4.0, 5.0, 8.0, 10.0, 10.0, 10.0, 21.0, 21.0, 13.0, 15.0, 21.0, 27.0, 26.0, 35.0, 41.0, 30.0, 28.0, 39.0, 39.0, 46.0, 33.0, 33.0, 40.0, 46.0, 39.0, 30.0, 38.0, 31.0, 35.0, 33.0, 28.0, 27.0, 23.0, 27.0, 17.0, 9.0, 6.0, 7.0, 10.0, 3.0, 4.0, 7.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.48828125, -4.3525390625, -4.216796875, -4.0810546875, -3.9453125, -3.8095703125, -3.673828125, -3.5380859375, -3.40234375, -3.2666015625, -3.130859375, -2.9951171875, -2.859375, -2.7236328125, -2.587890625, -2.4521484375, -2.31640625, -2.1806640625, -2.044921875, -1.9091796875, -1.7734375, -1.6376953125, -1.501953125, -1.3662109375, -1.23046875, -1.0947265625, -0.958984375, -0.8232421875, -0.6875, -0.5517578125, -0.416015625, -0.2802734375, -0.14453125, -0.0087890625, 0.126953125, 0.2626953125, 0.3984375, 0.5341796875, 0.669921875, 0.8056640625, 0.94140625, 1.0771484375, 1.212890625, 1.3486328125, 1.484375, 1.6201171875, 1.755859375, 1.8916015625, 2.02734375, 2.1630859375, 2.298828125, 2.4345703125, 2.5703125, 2.7060546875, 2.841796875, 2.9775390625, 3.11328125, 3.2490234375, 3.384765625, 3.5205078125, 3.65625, 3.7919921875, 3.927734375, 4.0634765625, 4.19921875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 24.0, 35.0, 50.0, 60.0, 88.0, 135.0, 192.0, 264.0, 414.0, 575.0, 921.0, 1285.0, 1954.0, 3071.0, 4746.0, 7884.0, 12971.0, 22389.0, 38754.0, 69762.0, 117746.0, 174639.0, 196186.0, 157243.0, 99712.0, 57185.0, 32347.0, 18451.0, 10903.0, 6559.0, 4105.0, 2598.0, 1710.0, 1099.0, 803.0, 534.0, 358.0, 237.0, 164.0, 114.0, 69.0, 53.0, 44.0, 36.0, 20.0, 15.0, 10.0, 2.0, 6.0, 3.0, 1.0, 3.0], "bins": [-4.74609375, -4.60784912109375, -4.4696044921875, -4.33135986328125, -4.193115234375, -4.05487060546875, -3.9166259765625, -3.77838134765625, -3.64013671875, -3.50189208984375, -3.3636474609375, -3.22540283203125, -3.087158203125, -2.94891357421875, -2.8106689453125, -2.67242431640625, -2.5341796875, -2.39593505859375, -2.2576904296875, -2.11944580078125, -1.981201171875, -1.84295654296875, -1.7047119140625, -1.56646728515625, -1.42822265625, -1.28997802734375, -1.1517333984375, -1.01348876953125, -0.875244140625, -0.73699951171875, -0.5987548828125, -0.46051025390625, -0.322265625, -0.18402099609375, -0.0457763671875, 0.09246826171875, 0.230712890625, 0.36895751953125, 0.5072021484375, 0.64544677734375, 0.78369140625, 0.92193603515625, 1.0601806640625, 1.19842529296875, 1.336669921875, 1.47491455078125, 1.6131591796875, 1.75140380859375, 1.8896484375, 2.02789306640625, 2.1661376953125, 2.30438232421875, 2.442626953125, 2.58087158203125, 2.7191162109375, 2.85736083984375, 2.99560546875, 3.13385009765625, 3.2720947265625, 3.41033935546875, 3.548583984375, 3.68682861328125, 3.8250732421875, 3.96331787109375, 4.1015625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 6.0, 9.0, 8.0, 10.0, 14.0, 23.0, 29.0, 37.0, 44.0, 54.0, 65.0, 101.0, 82.0, 93.0, 87.0, 64.0, 62.0, 36.0, 31.0, 32.0, 27.0, 23.0, 16.0, 9.0, 2.0, 4.0, 7.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.0006494522094726562, -0.0006327927112579346, -0.0006161332130432129, -0.0005994737148284912, -0.0005828142166137695, -0.0005661547183990479, -0.0005494952201843262, -0.0005328357219696045, -0.0005161762237548828, -0.0004995167255401611, -0.00048285722732543945, -0.0004661977291107178, -0.0004495382308959961, -0.0004328787326812744, -0.00041621923446655273, -0.00039955973625183105, -0.0003829002380371094, -0.0003662407398223877, -0.000349581241607666, -0.00033292174339294434, -0.00031626224517822266, -0.000299602746963501, -0.0002829432487487793, -0.0002662837505340576, -0.00024962425231933594, -0.00023296475410461426, -0.00021630525588989258, -0.0001996457576751709, -0.00018298625946044922, -0.00016632676124572754, -0.00014966726303100586, -0.00013300776481628418, -0.0001163482666015625, -9.968876838684082e-05, -8.302927017211914e-05, -6.636977195739746e-05, -4.971027374267578e-05, -3.30507755279541e-05, -1.6391277313232422e-05, 2.682209014892578e-07, 1.6927719116210938e-05, 3.358721733093262e-05, 5.02467155456543e-05, 6.690621376037598e-05, 8.356571197509766e-05, 0.00010022521018981934, 0.00011688470840454102, 0.0001335442066192627, 0.00015020370483398438, 0.00016686320304870605, 0.00018352270126342773, 0.00020018219947814941, 0.0002168416976928711, 0.00023350119590759277, 0.00025016069412231445, 0.00026682019233703613, 0.0002834796905517578, 0.0003001391887664795, 0.00031679868698120117, 0.00033345818519592285, 0.00035011768341064453, 0.0003667771816253662, 0.0003834366798400879, 0.00040009617805480957, 0.00041675567626953125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 7.0, 9.0, 17.0, 40.0, 43.0, 77.0, 101.0, 132.0, 220.0, 320.0, 465.0, 720.0, 1113.0, 1628.0, 2511.0, 3972.0, 6169.0, 10087.0, 16978.0, 28581.0, 50143.0, 85862.0, 139064.0, 187445.0, 183319.0, 132643.0, 81110.0, 46249.0, 27046.0, 16224.0, 9631.0, 5847.0, 3747.0, 2382.0, 1571.0, 1034.0, 691.0, 425.0, 295.0, 205.0, 120.0, 89.0, 66.0, 50.0, 32.0, 26.0, 17.0, 7.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.3125, -4.177490234375, -4.04248046875, -3.907470703125, -3.7724609375, -3.637451171875, -3.50244140625, -3.367431640625, -3.232421875, -3.097412109375, -2.96240234375, -2.827392578125, -2.6923828125, -2.557373046875, -2.42236328125, -2.287353515625, -2.15234375, -2.017333984375, -1.88232421875, -1.747314453125, -1.6123046875, -1.477294921875, -1.34228515625, -1.207275390625, -1.072265625, -0.937255859375, -0.80224609375, -0.667236328125, -0.5322265625, -0.397216796875, -0.26220703125, -0.127197265625, 0.0078125, 0.142822265625, 0.27783203125, 0.412841796875, 0.5478515625, 0.682861328125, 0.81787109375, 0.952880859375, 1.087890625, 1.222900390625, 1.35791015625, 1.492919921875, 1.6279296875, 1.762939453125, 1.89794921875, 2.032958984375, 2.16796875, 2.302978515625, 2.43798828125, 2.572998046875, 2.7080078125, 2.843017578125, 2.97802734375, 3.113037109375, 3.248046875, 3.383056640625, 3.51806640625, 3.653076171875, 3.7880859375, 3.923095703125, 4.05810546875, 4.193115234375, 4.328125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 1.0, 8.0, 8.0, 14.0, 11.0, 16.0, 16.0, 24.0, 23.0, 26.0, 40.0, 35.0, 36.0, 42.0, 53.0, 39.0, 45.0, 65.0, 48.0, 49.0, 62.0, 46.0, 39.0, 36.0, 29.0, 23.0, 30.0, 27.0, 19.0, 13.0, 17.0, 6.0, 12.0, 7.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.837890625, -0.8059234619140625, -0.773956298828125, -0.7419891357421875, -0.71002197265625, -0.6780548095703125, -0.646087646484375, -0.6141204833984375, -0.5821533203125, -0.5501861572265625, -0.518218994140625, -0.4862518310546875, -0.45428466796875, -0.4223175048828125, -0.390350341796875, -0.3583831787109375, -0.326416015625, -0.2944488525390625, -0.262481689453125, -0.2305145263671875, -0.19854736328125, -0.1665802001953125, -0.134613037109375, -0.1026458740234375, -0.0706787109375, -0.0387115478515625, -0.006744384765625, 0.0252227783203125, 0.05718994140625, 0.0891571044921875, 0.121124267578125, 0.1530914306640625, 0.18505859375, 0.2170257568359375, 0.248992919921875, 0.2809600830078125, 0.31292724609375, 0.3448944091796875, 0.376861572265625, 0.4088287353515625, 0.4407958984375, 0.4727630615234375, 0.504730224609375, 0.5366973876953125, 0.56866455078125, 0.6006317138671875, 0.632598876953125, 0.6645660400390625, 0.696533203125, 0.7285003662109375, 0.760467529296875, 0.7924346923828125, 0.82440185546875, 0.8563690185546875, 0.888336181640625, 0.9203033447265625, 0.9522705078125, 0.9842376708984375, 1.016204833984375, 1.0481719970703125, 1.08013916015625, 1.1121063232421875, 1.144073486328125, 1.1760406494140625, 1.2080078125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 2.0, 7.0, 5.0, 5.0, 7.0, 12.0, 8.0, 20.0, 26.0, 27.0, 30.0, 47.0, 57.0, 75.0, 90.0, 97.0, 79.0, 80.0, 65.0, 62.0, 52.0, 21.0, 30.0, 15.0, 22.0, 11.0, 12.0, 9.0, 8.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.518157958984375, -12.053613662719727, -11.589069366455078, -11.124526023864746, -10.659981727600098, -10.19543743133545, -9.730894088745117, -9.266349792480469, -8.80180549621582, -8.337261199951172, -7.872717380523682, -7.408173561096191, -6.943629264831543, -6.4790849685668945, -6.014541149139404, -5.549997329711914, -5.085453033447266, -4.620908737182617, -4.156364917755127, -3.6918208599090576, -3.2272768020629883, -2.762732744216919, -2.2981886863708496, -1.8336446285247803, -1.369100570678711, -0.9045565128326416, -0.44001245498657227, 0.02453160285949707, 0.4890756607055664, 0.9536197185516357, 1.418163776397705, 1.8827078342437744, 2.3472518920898438, 2.811795949935913, 3.2763400077819824, 3.7408840656280518, 4.205428123474121, 4.6699724197387695, 5.13451623916626, 5.59906005859375, 6.063604354858398, 6.528148651123047, 6.992692470550537, 7.457236289978027, 7.921780586242676, 8.386324882507324, 8.850868225097656, 9.315412521362305, 9.779956817626953, 10.244501113891602, 10.70904541015625, 11.173588752746582, 11.63813304901123, 12.102677345275879, 12.567220687866211, 13.03176498413086, 13.496309280395508, 13.960853576660156, 14.425397872924805, 14.889941215515137, 15.354485511779785, 15.819029808044434, 16.283573150634766, 16.748117446899414, 17.212661743164062]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 8.0, 6.0, 7.0, 13.0, 12.0, 11.0, 16.0, 12.0, 20.0, 16.0, 17.0, 14.0, 15.0, 26.0, 23.0, 34.0, 23.0, 32.0, 37.0, 31.0, 38.0, 30.0, 36.0, 28.0, 37.0, 33.0, 34.0, 41.0, 22.0, 40.0, 25.0, 18.0, 27.0, 26.0, 22.0, 20.0, 17.0, 15.0, 19.0, 14.0, 12.0, 12.0, 9.0, 11.0, 7.0, 4.0, 2.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0], "bins": [-6.223653316497803, -6.032013893127441, -5.84037446975708, -5.648735046386719, -5.457096099853516, -5.265456676483154, -5.073817253112793, -4.882177829742432, -4.69053840637207, -4.498898983001709, -4.307259559631348, -4.1156206130981445, -3.923981189727783, -3.732341766357422, -3.5407023429870605, -3.349062919616699, -3.157423973083496, -2.9657845497131348, -2.7741453647613525, -2.582505941390991, -2.390866756439209, -2.1992273330688477, -2.0075879096984863, -1.8159486055374146, -1.6243093013763428, -1.432669997215271, -1.2410306930541992, -1.049391269683838, -0.8577519655227661, -0.6661126613616943, -0.474473237991333, -0.28283393383026123, -0.09119510650634766, 0.10044422745704651, 0.2920835614204407, 0.4837229251861572, 0.675362229347229, 0.8670015335083008, 1.058640956878662, 1.2502802610397339, 1.4419195652008057, 1.6335588693618774, 1.8251981735229492, 2.0168375968933105, 2.208477020263672, 2.400116205215454, 2.5917556285858154, 2.7833948135375977, 2.975034236907959, 3.1666736602783203, 3.3583128452301025, 3.549952268600464, 3.741591453552246, 3.9332308769226074, 4.124870300292969, 4.31650972366333, 4.508149147033691, 4.699788570404053, 4.891427993774414, 5.083066940307617, 5.2747063636779785, 5.46634578704834, 5.657985210418701, 5.8496246337890625, 6.041263580322266]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 12.0, 10.0, 30.0, 38.0, 66.0, 92.0, 125.0, 176.0, 282.0, 402.0, 679.0, 1031.0, 1716.0, 2699.0, 4745.0, 8258.0, 15533.0, 32158.0, 79999.0, 249575.0, 884544.0, 1681002.0, 854376.0, 233409.0, 75306.0, 31496.0, 15335.0, 8434.0, 4926.0, 2912.0, 1834.0, 1167.0, 703.0, 453.0, 277.0, 186.0, 103.0, 66.0, 43.0, 28.0, 16.0, 6.0, 4.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.140625, -19.572998046875, -19.00537109375, -18.437744140625, -17.8701171875, -17.302490234375, -16.73486328125, -16.167236328125, -15.599609375, -15.031982421875, -14.46435546875, -13.896728515625, -13.3291015625, -12.761474609375, -12.19384765625, -11.626220703125, -11.05859375, -10.490966796875, -9.92333984375, -9.355712890625, -8.7880859375, -8.220458984375, -7.65283203125, -7.085205078125, -6.517578125, -5.949951171875, -5.38232421875, -4.814697265625, -4.2470703125, -3.679443359375, -3.11181640625, -2.544189453125, -1.9765625, -1.408935546875, -0.84130859375, -0.273681640625, 0.2939453125, 0.861572265625, 1.42919921875, 1.996826171875, 2.564453125, 3.132080078125, 3.69970703125, 4.267333984375, 4.8349609375, 5.402587890625, 5.97021484375, 6.537841796875, 7.10546875, 7.673095703125, 8.24072265625, 8.808349609375, 9.3759765625, 9.943603515625, 10.51123046875, 11.078857421875, 11.646484375, 12.214111328125, 12.78173828125, 13.349365234375, 13.9169921875, 14.484619140625, 15.05224609375, 15.619873046875, 16.1875]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 4.0, 4.0, 6.0, 5.0, 14.0, 8.0, 11.0, 11.0, 19.0, 19.0, 16.0, 20.0, 21.0, 22.0, 31.0, 30.0, 37.0, 35.0, 28.0, 42.0, 33.0, 38.0, 37.0, 44.0, 43.0, 38.0, 38.0, 38.0, 37.0, 20.0, 33.0, 25.0, 25.0, 12.0, 27.0, 20.0, 15.0, 13.0, 8.0, 11.0, 11.0, 11.0, 4.0, 11.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-5.7578125, -5.5872802734375, -5.416748046875, -5.2462158203125, -5.07568359375, -4.9051513671875, -4.734619140625, -4.5640869140625, -4.3935546875, -4.2230224609375, -4.052490234375, -3.8819580078125, -3.71142578125, -3.5408935546875, -3.370361328125, -3.1998291015625, -3.029296875, -2.8587646484375, -2.688232421875, -2.5177001953125, -2.34716796875, -2.1766357421875, -2.006103515625, -1.8355712890625, -1.6650390625, -1.4945068359375, -1.323974609375, -1.1534423828125, -0.98291015625, -0.8123779296875, -0.641845703125, -0.4713134765625, -0.30078125, -0.1302490234375, 0.040283203125, 0.2108154296875, 0.38134765625, 0.5518798828125, 0.722412109375, 0.8929443359375, 1.0634765625, 1.2340087890625, 1.404541015625, 1.5750732421875, 1.74560546875, 1.9161376953125, 2.086669921875, 2.2572021484375, 2.427734375, 2.5982666015625, 2.768798828125, 2.9393310546875, 3.10986328125, 3.2803955078125, 3.450927734375, 3.6214599609375, 3.7919921875, 3.9625244140625, 4.133056640625, 4.3035888671875, 4.47412109375, 4.6446533203125, 4.815185546875, 4.9857177734375, 5.15625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 11.0, 12.0, 16.0, 20.0, 27.0, 42.0, 54.0, 91.0, 142.0, 197.0, 296.0, 503.0, 748.0, 1164.0, 1820.0, 3046.0, 5046.0, 8678.0, 15543.0, 30315.0, 63791.0, 150907.0, 408227.0, 1041186.0, 1349849.0, 675755.0, 246873.0, 96245.0, 43402.0, 21573.0, 11624.0, 6639.0, 3960.0, 2321.0, 1535.0, 891.0, 585.0, 395.0, 250.0, 175.0, 102.0, 77.0, 59.0, 28.0, 21.0, 11.0, 11.0, 11.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.533447265625, -16.00439453125, -15.475341796875, -14.9462890625, -14.417236328125, -13.88818359375, -13.359130859375, -12.830078125, -12.301025390625, -11.77197265625, -11.242919921875, -10.7138671875, -10.184814453125, -9.65576171875, -9.126708984375, -8.59765625, -8.068603515625, -7.53955078125, -7.010498046875, -6.4814453125, -5.952392578125, -5.42333984375, -4.894287109375, -4.365234375, -3.836181640625, -3.30712890625, -2.778076171875, -2.2490234375, -1.719970703125, -1.19091796875, -0.661865234375, -0.1328125, 0.396240234375, 0.92529296875, 1.454345703125, 1.9833984375, 2.512451171875, 3.04150390625, 3.570556640625, 4.099609375, 4.628662109375, 5.15771484375, 5.686767578125, 6.2158203125, 6.744873046875, 7.27392578125, 7.802978515625, 8.33203125, 8.861083984375, 9.39013671875, 9.919189453125, 10.4482421875, 10.977294921875, 11.50634765625, 12.035400390625, 12.564453125, 13.093505859375, 13.62255859375, 14.151611328125, 14.6806640625, 15.209716796875, 15.73876953125, 16.267822265625, 16.796875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 22.0, 19.0, 25.0, 37.0, 43.0, 74.0, 94.0, 119.0, 149.0, 218.0, 241.0, 324.0, 328.0, 364.0, 386.0, 341.0, 321.0, 233.0, 186.0, 131.0, 105.0, 65.0, 64.0, 50.0, 30.0, 27.0, 16.0, 9.0, 7.0, 12.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.29400634765625, -5.1387939453125, -4.98358154296875, -4.828369140625, -4.67315673828125, -4.5179443359375, -4.36273193359375, -4.20751953125, -4.05230712890625, -3.8970947265625, -3.74188232421875, -3.586669921875, -3.43145751953125, -3.2762451171875, -3.12103271484375, -2.9658203125, -2.81060791015625, -2.6553955078125, -2.50018310546875, -2.344970703125, -2.18975830078125, -2.0345458984375, -1.87933349609375, -1.72412109375, -1.56890869140625, -1.4136962890625, -1.25848388671875, -1.103271484375, -0.94805908203125, -0.7928466796875, -0.63763427734375, -0.482421875, -0.32720947265625, -0.1719970703125, -0.01678466796875, 0.138427734375, 0.29364013671875, 0.4488525390625, 0.60406494140625, 0.75927734375, 0.91448974609375, 1.0697021484375, 1.22491455078125, 1.380126953125, 1.53533935546875, 1.6905517578125, 1.84576416015625, 2.0009765625, 2.15618896484375, 2.3114013671875, 2.46661376953125, 2.621826171875, 2.77703857421875, 2.9322509765625, 3.08746337890625, 3.24267578125, 3.39788818359375, 3.5531005859375, 3.70831298828125, 3.863525390625, 4.01873779296875, 4.1739501953125, 4.32916259765625, 4.484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 12.0, 13.0, 15.0, 18.0, 28.0, 27.0, 51.0, 56.0, 58.0, 94.0, 101.0, 100.0, 78.0, 76.0, 75.0, 41.0, 38.0, 27.0, 17.0, 17.0, 12.0, 6.0, 9.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.99970817565918, -13.444025039672852, -12.888341903686523, -12.332657814025879, -11.77697467803955, -11.221291542053223, -10.665607452392578, -10.10992431640625, -9.554241180419922, -8.998558044433594, -8.442874908447266, -7.887190818786621, -7.331507682800293, -6.775824546813965, -6.2201409339904785, -5.664457321166992, -5.108774185180664, -4.553091049194336, -3.9974074363708496, -3.4417240619659424, -2.886040687561035, -2.330357313156128, -1.7746739387512207, -1.2189905643463135, -0.6633071899414062, -0.10762381553649902, 0.4480595588684082, 1.0037429332733154, 1.5594263076782227, 2.11510968208313, 2.670793056488037, 3.2264764308929443, 3.7821617126464844, 4.3378448486328125, 4.893528461456299, 5.449212074279785, 6.004895210266113, 6.560578346252441, 7.116261959075928, 7.671945571899414, 8.227628707885742, 8.78331184387207, 9.338994979858398, 9.894679069519043, 10.450362205505371, 11.0060453414917, 11.561729431152344, 12.117412567138672, 12.673095703125, 13.228778839111328, 13.784461975097656, 14.3401460647583, 14.895829200744629, 15.451512336730957, 16.0071964263916, 16.56287956237793, 17.118562698364258, 17.674245834350586, 18.229928970336914, 18.785612106323242, 19.341297149658203, 19.89698028564453, 20.45266342163086, 21.008346557617188, 21.564029693603516]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 7.0, 8.0, 6.0, 1.0, 10.0, 10.0, 21.0, 14.0, 22.0, 26.0, 20.0, 15.0, 22.0, 18.0, 27.0, 43.0, 35.0, 35.0, 30.0, 40.0, 46.0, 39.0, 37.0, 33.0, 27.0, 28.0, 30.0, 30.0, 22.0, 37.0, 26.0, 37.0, 28.0, 26.0, 26.0, 24.0, 14.0, 17.0, 11.0, 11.0, 10.0, 10.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.00267219543457, -6.778745174407959, -6.5548176765441895, -6.330890655517578, -6.106963157653809, -5.883036136627197, -5.659109115600586, -5.435181617736816, -5.211254596710205, -4.987327575683594, -4.763400077819824, -4.539473056793213, -4.315546035766602, -4.091618537902832, -3.8676915168762207, -3.6437642574310303, -3.41983699798584, -3.1959097385406494, -2.971982479095459, -2.7480554580688477, -2.5241281986236572, -2.300200939178467, -2.0762739181518555, -1.852346658706665, -1.6284193992614746, -1.4044921398162842, -1.1805649995803833, -0.9566377997398376, -0.732710599899292, -0.5087833404541016, -0.2848562002182007, -0.060929059982299805, 0.16299772262573242, 0.3869249224662781, 0.6108521223068237, 0.8347793221473694, 1.058706521987915, 1.2826337814331055, 1.5065609216690063, 1.7304880619049072, 1.9544153213500977, 2.178342580795288, 2.4022698402404785, 2.62619686126709, 2.8501241207122803, 3.0740513801574707, 3.297978401184082, 3.5219056606292725, 3.745832920074463, 3.9697601795196533, 4.193687438964844, 4.417614459991455, 4.641541481018066, 4.865468978881836, 5.089395999908447, 5.313323020935059, 5.537250518798828, 5.7611775398254395, 5.985105037689209, 6.20903205871582, 6.43295955657959, 6.656886577606201, 6.8808135986328125, 7.104741096496582, 7.328668117523193]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 24.0, 27.0, 40.0, 50.0, 94.0, 134.0, 211.0, 304.0, 483.0, 633.0, 1085.0, 1528.0, 2461.0, 3856.0, 6266.0, 10090.0, 16443.0, 27064.0, 44481.0, 71741.0, 110563.0, 152164.0, 171005.0, 146896.0, 104760.0, 67893.0, 41705.0, 25459.0, 15387.0, 9314.0, 5934.0, 3640.0, 2379.0, 1528.0, 1002.0, 617.0, 432.0, 257.0, 196.0, 118.0, 98.0, 66.0, 36.0, 24.0, 18.0, 12.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.533203125, -3.420806884765625, -3.30841064453125, -3.196014404296875, -3.0836181640625, -2.971221923828125, -2.85882568359375, -2.746429443359375, -2.634033203125, -2.521636962890625, -2.40924072265625, -2.296844482421875, -2.1844482421875, -2.072052001953125, -1.95965576171875, -1.847259521484375, -1.73486328125, -1.622467041015625, -1.51007080078125, -1.397674560546875, -1.2852783203125, -1.172882080078125, -1.06048583984375, -0.948089599609375, -0.835693359375, -0.723297119140625, -0.61090087890625, -0.498504638671875, -0.3861083984375, -0.273712158203125, -0.16131591796875, -0.048919677734375, 0.0634765625, 0.175872802734375, 0.28826904296875, 0.400665283203125, 0.5130615234375, 0.625457763671875, 0.73785400390625, 0.850250244140625, 0.962646484375, 1.075042724609375, 1.18743896484375, 1.299835205078125, 1.4122314453125, 1.524627685546875, 1.63702392578125, 1.749420166015625, 1.86181640625, 1.974212646484375, 2.08660888671875, 2.199005126953125, 2.3114013671875, 2.423797607421875, 2.53619384765625, 2.648590087890625, 2.760986328125, 2.873382568359375, 2.98577880859375, 3.098175048828125, 3.2105712890625, 3.322967529296875, 3.43536376953125, 3.547760009765625, 3.66015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 7.0, 11.0, 10.0, 16.0, 15.0, 19.0, 16.0, 20.0, 17.0, 32.0, 24.0, 22.0, 35.0, 30.0, 48.0, 31.0, 33.0, 43.0, 39.0, 39.0, 28.0, 39.0, 34.0, 33.0, 32.0, 30.0, 29.0, 34.0, 24.0, 33.0, 28.0, 30.0, 25.0, 10.0, 14.0, 10.0, 8.0, 12.0, 6.0, 11.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.7421875, -7.4892578125, -7.236328125, -6.9833984375, -6.73046875, -6.4775390625, -6.224609375, -5.9716796875, -5.71875, -5.4658203125, -5.212890625, -4.9599609375, -4.70703125, -4.4541015625, -4.201171875, -3.9482421875, -3.6953125, -3.4423828125, -3.189453125, -2.9365234375, -2.68359375, -2.4306640625, -2.177734375, -1.9248046875, -1.671875, -1.4189453125, -1.166015625, -0.9130859375, -0.66015625, -0.4072265625, -0.154296875, 0.0986328125, 0.3515625, 0.6044921875, 0.857421875, 1.1103515625, 1.36328125, 1.6162109375, 1.869140625, 2.1220703125, 2.375, 2.6279296875, 2.880859375, 3.1337890625, 3.38671875, 3.6396484375, 3.892578125, 4.1455078125, 4.3984375, 4.6513671875, 4.904296875, 5.1572265625, 5.41015625, 5.6630859375, 5.916015625, 6.1689453125, 6.421875, 6.6748046875, 6.927734375, 7.1806640625, 7.43359375, 7.6865234375, 7.939453125, 8.1923828125, 8.4453125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 8.0, 3.0, 6.0, 15.0, 18.0, 27.0, 36.0, 37.0, 71.0, 115.0, 118.0, 205.0, 309.0, 459.0, 675.0, 1057.0, 1515.0, 2489.0, 4063.0, 6585.0, 11127.0, 19161.0, 33962.0, 60920.0, 108180.0, 176007.0, 216019.0, 168164.0, 101960.0, 57368.0, 31846.0, 18369.0, 10617.0, 6351.0, 3836.0, 2304.0, 1554.0, 1009.0, 665.0, 470.0, 248.0, 197.0, 112.0, 84.0, 63.0, 46.0, 30.0, 21.0, 27.0, 9.0, 7.0, 8.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3671875, -4.2237548828125, -4.080322265625, -3.9368896484375, -3.79345703125, -3.6500244140625, -3.506591796875, -3.3631591796875, -3.2197265625, -3.0762939453125, -2.932861328125, -2.7894287109375, -2.64599609375, -2.5025634765625, -2.359130859375, -2.2156982421875, -2.072265625, -1.9288330078125, -1.785400390625, -1.6419677734375, -1.49853515625, -1.3551025390625, -1.211669921875, -1.0682373046875, -0.9248046875, -0.7813720703125, -0.637939453125, -0.4945068359375, -0.35107421875, -0.2076416015625, -0.064208984375, 0.0792236328125, 0.22265625, 0.3660888671875, 0.509521484375, 0.6529541015625, 0.79638671875, 0.9398193359375, 1.083251953125, 1.2266845703125, 1.3701171875, 1.5135498046875, 1.656982421875, 1.8004150390625, 1.94384765625, 2.0872802734375, 2.230712890625, 2.3741455078125, 2.517578125, 2.6610107421875, 2.804443359375, 2.9478759765625, 3.09130859375, 3.2347412109375, 3.378173828125, 3.5216064453125, 3.6650390625, 3.8084716796875, 3.951904296875, 4.0953369140625, 4.23876953125, 4.3822021484375, 4.525634765625, 4.6690673828125, 4.8125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 10.0, 11.0, 14.0, 6.0, 26.0, 22.0, 22.0, 23.0, 26.0, 29.0, 41.0, 36.0, 32.0, 31.0, 39.0, 27.0, 30.0, 49.0, 39.0, 49.0, 37.0, 34.0, 31.0, 35.0, 41.0, 24.0, 41.0, 24.0, 32.0, 24.0, 25.0, 20.0, 17.0, 12.0, 8.0, 9.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.9429931640625, -4.784423828125, -4.6258544921875, -4.46728515625, -4.3087158203125, -4.150146484375, -3.9915771484375, -3.8330078125, -3.6744384765625, -3.515869140625, -3.3572998046875, -3.19873046875, -3.0401611328125, -2.881591796875, -2.7230224609375, -2.564453125, -2.4058837890625, -2.247314453125, -2.0887451171875, -1.93017578125, -1.7716064453125, -1.613037109375, -1.4544677734375, -1.2958984375, -1.1373291015625, -0.978759765625, -0.8201904296875, -0.66162109375, -0.5030517578125, -0.344482421875, -0.1859130859375, -0.02734375, 0.1312255859375, 0.289794921875, 0.4483642578125, 0.60693359375, 0.7655029296875, 0.924072265625, 1.0826416015625, 1.2412109375, 1.3997802734375, 1.558349609375, 1.7169189453125, 1.87548828125, 2.0340576171875, 2.192626953125, 2.3511962890625, 2.509765625, 2.6683349609375, 2.826904296875, 2.9854736328125, 3.14404296875, 3.3026123046875, 3.461181640625, 3.6197509765625, 3.7783203125, 3.9368896484375, 4.095458984375, 4.2540283203125, 4.41259765625, 4.5711669921875, 4.729736328125, 4.8883056640625, 5.046875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 15.0, 10.0, 16.0, 12.0, 44.0, 51.0, 97.0, 121.0, 181.0, 330.0, 490.0, 717.0, 1167.0, 1932.0, 3115.0, 5172.0, 8824.0, 15503.0, 28344.0, 53572.0, 106871.0, 204494.0, 265835.0, 168488.0, 85204.0, 42861.0, 23222.0, 12854.0, 7463.0, 4267.0, 2693.0, 1649.0, 1067.0, 687.0, 414.0, 283.0, 155.0, 115.0, 66.0, 48.0, 35.0, 18.0, 17.0, 12.0, 10.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.625, -2.548553466796875, -2.47210693359375, -2.395660400390625, -2.3192138671875, -2.242767333984375, -2.16632080078125, -2.089874267578125, -2.013427734375, -1.936981201171875, -1.86053466796875, -1.784088134765625, -1.7076416015625, -1.631195068359375, -1.55474853515625, -1.478302001953125, -1.40185546875, -1.325408935546875, -1.24896240234375, -1.172515869140625, -1.0960693359375, -1.019622802734375, -0.94317626953125, -0.866729736328125, -0.790283203125, -0.713836669921875, -0.63739013671875, -0.560943603515625, -0.4844970703125, -0.408050537109375, -0.33160400390625, -0.255157470703125, -0.1787109375, -0.102264404296875, -0.02581787109375, 0.050628662109375, 0.1270751953125, 0.203521728515625, 0.27996826171875, 0.356414794921875, 0.432861328125, 0.509307861328125, 0.58575439453125, 0.662200927734375, 0.7386474609375, 0.815093994140625, 0.89154052734375, 0.967987060546875, 1.04443359375, 1.120880126953125, 1.19732666015625, 1.273773193359375, 1.3502197265625, 1.426666259765625, 1.50311279296875, 1.579559326171875, 1.656005859375, 1.732452392578125, 1.80889892578125, 1.885345458984375, 1.9617919921875, 2.038238525390625, 2.11468505859375, 2.191131591796875, 2.267578125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 2.0, 10.0, 17.0, 24.0, 25.0, 27.0, 52.0, 69.0, 77.0, 108.0, 95.0, 89.0, 113.0, 91.0, 53.0, 39.0, 29.0, 26.0, 14.0, 8.0, 11.0, 8.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002205371856689453, -0.00021470710635185242, -0.00020887702703475952, -0.00020304694771766663, -0.00019721686840057373, -0.00019138678908348083, -0.00018555670976638794, -0.00017972663044929504, -0.00017389655113220215, -0.00016806647181510925, -0.00016223639249801636, -0.00015640631318092346, -0.00015057623386383057, -0.00014474615454673767, -0.00013891607522964478, -0.00013308599591255188, -0.00012725591659545898, -0.00012142583727836609, -0.0001155957579612732, -0.0001097656786441803, -0.0001039355993270874, -9.810552000999451e-05, -9.227544069290161e-05, -8.644536137580872e-05, -8.061528205871582e-05, -7.478520274162292e-05, -6.895512342453003e-05, -6.312504410743713e-05, -5.729496479034424e-05, -5.146488547325134e-05, -4.563480615615845e-05, -3.980472683906555e-05, -3.3974647521972656e-05, -2.814456820487976e-05, -2.2314488887786865e-05, -1.648440957069397e-05, -1.0654330253601074e-05, -4.824250936508179e-06, 1.0058283805847168e-06, 6.835907697677612e-06, 1.2665987014770508e-05, 1.8496066331863403e-05, 2.43261456489563e-05, 3.0156224966049194e-05, 3.598630428314209e-05, 4.1816383600234985e-05, 4.764646291732788e-05, 5.3476542234420776e-05, 5.930662155151367e-05, 6.513670086860657e-05, 7.096678018569946e-05, 7.679685950279236e-05, 8.262693881988525e-05, 8.845701813697815e-05, 9.428709745407104e-05, 0.00010011717677116394, 0.00010594725608825684, 0.00011177733540534973, 0.00011760741472244263, 0.00012343749403953552, 0.00012926757335662842, 0.0001350976526737213, 0.0001409277319908142, 0.0001467578113079071, 0.000152587890625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 11.0, 15.0, 17.0, 39.0, 42.0, 67.0, 96.0, 160.0, 241.0, 342.0, 526.0, 782.0, 1306.0, 2039.0, 3511.0, 6081.0, 10868.0, 20102.0, 37840.0, 72028.0, 133232.0, 209218.0, 222573.0, 149670.0, 82328.0, 43155.0, 22720.0, 12326.0, 7015.0, 3846.0, 2350.0, 1448.0, 888.0, 556.0, 373.0, 222.0, 167.0, 112.0, 80.0, 39.0, 37.0, 18.0, 12.0, 16.0, 6.0, 12.0, 9.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.51171875, -2.43096923828125, -2.3502197265625, -2.26947021484375, -2.188720703125, -2.10797119140625, -2.0272216796875, -1.94647216796875, -1.86572265625, -1.78497314453125, -1.7042236328125, -1.62347412109375, -1.542724609375, -1.46197509765625, -1.3812255859375, -1.30047607421875, -1.2197265625, -1.13897705078125, -1.0582275390625, -0.97747802734375, -0.896728515625, -0.81597900390625, -0.7352294921875, -0.65447998046875, -0.57373046875, -0.49298095703125, -0.4122314453125, -0.33148193359375, -0.250732421875, -0.16998291015625, -0.0892333984375, -0.00848388671875, 0.072265625, 0.15301513671875, 0.2337646484375, 0.31451416015625, 0.395263671875, 0.47601318359375, 0.5567626953125, 0.63751220703125, 0.71826171875, 0.79901123046875, 0.8797607421875, 0.96051025390625, 1.041259765625, 1.12200927734375, 1.2027587890625, 1.28350830078125, 1.3642578125, 1.44500732421875, 1.5257568359375, 1.60650634765625, 1.687255859375, 1.76800537109375, 1.8487548828125, 1.92950439453125, 2.01025390625, 2.09100341796875, 2.1717529296875, 2.25250244140625, 2.333251953125, 2.41400146484375, 2.4947509765625, 2.57550048828125, 2.65625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 9.0, 3.0, 5.0, 10.0, 15.0, 4.0, 13.0, 21.0, 13.0, 19.0, 17.0, 28.0, 30.0, 24.0, 38.0, 43.0, 49.0, 48.0, 47.0, 53.0, 43.0, 36.0, 44.0, 44.0, 31.0, 36.0, 30.0, 38.0, 23.0, 30.0, 13.0, 23.0, 21.0, 12.0, 16.0, 13.0, 6.0, 8.0, 11.0, 4.0, 5.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5947265625, -0.5768814086914062, -0.5590362548828125, -0.5411911010742188, -0.523345947265625, -0.5055007934570312, -0.4876556396484375, -0.46981048583984375, -0.45196533203125, -0.43412017822265625, -0.4162750244140625, -0.39842987060546875, -0.380584716796875, -0.36273956298828125, -0.3448944091796875, -0.32704925537109375, -0.3092041015625, -0.29135894775390625, -0.2735137939453125, -0.25566864013671875, -0.237823486328125, -0.21997833251953125, -0.2021331787109375, -0.18428802490234375, -0.16644287109375, -0.14859771728515625, -0.1307525634765625, -0.11290740966796875, -0.095062255859375, -0.07721710205078125, -0.0593719482421875, -0.04152679443359375, -0.023681640625, -0.00583648681640625, 0.0120086669921875, 0.02985382080078125, 0.047698974609375, 0.06554412841796875, 0.0833892822265625, 0.10123443603515625, 0.11907958984375, 0.13692474365234375, 0.1547698974609375, 0.17261505126953125, 0.190460205078125, 0.20830535888671875, 0.2261505126953125, 0.24399566650390625, 0.2618408203125, 0.27968597412109375, 0.2975311279296875, 0.31537628173828125, 0.333221435546875, 0.35106658935546875, 0.3689117431640625, 0.38675689697265625, 0.40460205078125, 0.42244720458984375, 0.4402923583984375, 0.45813751220703125, 0.475982666015625, 0.49382781982421875, 0.5116729736328125, 0.5295181274414062, 0.54736328125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 10.0, 19.0, 18.0, 20.0, 34.0, 49.0, 59.0, 56.0, 118.0, 93.0, 94.0, 80.0, 76.0, 73.0, 38.0, 37.0, 29.0, 21.0, 10.0, 10.0, 10.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.265263557434082, -13.69668197631836, -13.128101348876953, -12.55951976776123, -11.990938186645508, -11.422357559204102, -10.853775978088379, -10.285194396972656, -9.71661376953125, -9.148032188415527, -8.579451560974121, -8.010869979858398, -7.442288398742676, -6.873707294464111, -6.305126190185547, -5.736544609069824, -5.167963027954102, -4.599381923675537, -4.0308003425598145, -3.46221923828125, -2.8936378955841064, -2.325056552886963, -1.7564754486083984, -1.1878941059112549, -0.6193127632141113, -0.05073148012161255, 0.5178498029708862, 1.0864310264587402, 1.6550123691558838, 2.2235937118530273, 2.792174816131592, 3.3607561588287354, 3.9293365478515625, 4.497917652130127, 5.06649923324585, 5.635080337524414, 6.203661918640137, 6.772243022918701, 7.340824127197266, 7.909405708312988, 8.477987289428711, 9.046568870544434, 9.61514949798584, 10.183731079101562, 10.752312660217285, 11.320894241333008, 11.889474868774414, 12.458056449890137, 13.026637077331543, 13.595218658447266, 14.163799285888672, 14.732380867004395, 15.300962448120117, 15.869543075561523, 16.438125610351562, 17.00670623779297, 17.575286865234375, 18.14386749267578, 18.71245002746582, 19.281030654907227, 19.849611282348633, 20.418193817138672, 20.986774444580078, 21.555355072021484, 22.123937606811523]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 3.0, 4.0, 14.0, 10.0, 22.0, 18.0, 19.0, 24.0, 18.0, 16.0, 23.0, 23.0, 36.0, 39.0, 30.0, 29.0, 42.0, 39.0, 39.0, 43.0, 35.0, 27.0, 31.0, 31.0, 31.0, 22.0, 33.0, 31.0, 26.0, 35.0, 23.0, 31.0, 29.0, 17.0, 13.0, 15.0, 12.0, 6.0, 9.0, 14.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.914292335510254, -6.692164421081543, -6.47003698348999, -6.247909069061279, -6.025781154632568, -5.803653717041016, -5.581525802612305, -5.359397888183594, -5.137270450592041, -4.91514253616333, -4.693015098571777, -4.470887184143066, -4.2487592697143555, -4.026631832122803, -3.804503917694092, -3.58237624168396, -3.360248327255249, -3.138120651245117, -2.9159927368164062, -2.6938650608062744, -2.4717373847961426, -2.2496094703674316, -2.0274817943573, -1.805354118347168, -1.5832263231277466, -1.3610985279083252, -1.1389708518981934, -0.916843056678772, -0.6947153210639954, -0.47258758544921875, -0.25045979022979736, -0.028332114219665527, 0.19379568099975586, 0.41592341661453247, 0.6380511522293091, 0.8601789474487305, 1.0823066234588623, 1.3044344186782837, 1.526562213897705, 1.748689889907837, 1.9708176851272583, 2.1929454803466797, 2.4150731563568115, 2.6372008323669434, 2.8593287467956543, 3.081456422805786, 3.303584098815918, 3.525712013244629, 3.7478396892547607, 3.9699673652648926, 4.1920952796936035, 4.414222717285156, 4.636350631713867, 4.858478546142578, 5.080606460571289, 5.302733898162842, 5.524861812591553, 5.746989727020264, 5.969117164611816, 6.191245079040527, 6.413372993469238, 6.635500431060791, 6.857628345489502, 7.079755783081055, 7.301883697509766]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 7.0, 4.0, 11.0, 24.0, 39.0, 48.0, 83.0, 121.0, 172.0, 263.0, 397.0, 618.0, 900.0, 1406.0, 2162.0, 3369.0, 5262.0, 7985.0, 12610.0, 19956.0, 31070.0, 47728.0, 71502.0, 101396.0, 130316.0, 144954.0, 135323.0, 107886.0, 77142.0, 51766.0, 33956.0, 21673.0, 13725.0, 8723.0, 5544.0, 3664.0, 2368.0, 1492.0, 1012.0, 654.0, 453.0, 267.0, 155.0, 115.0, 68.0, 61.0, 36.0, 32.0, 12.0, 13.0, 9.0, 3.0, 2.0, 5.0, 3.0], "bins": [-7.0546875, -6.85076904296875, -6.6468505859375, -6.44293212890625, -6.239013671875, -6.03509521484375, -5.8311767578125, -5.62725830078125, -5.42333984375, -5.21942138671875, -5.0155029296875, -4.81158447265625, -4.607666015625, -4.40374755859375, -4.1998291015625, -3.99591064453125, -3.7919921875, -3.58807373046875, -3.3841552734375, -3.18023681640625, -2.976318359375, -2.77239990234375, -2.5684814453125, -2.36456298828125, -2.16064453125, -1.95672607421875, -1.7528076171875, -1.54888916015625, -1.344970703125, -1.14105224609375, -0.9371337890625, -0.73321533203125, -0.529296875, -0.32537841796875, -0.1214599609375, 0.08245849609375, 0.286376953125, 0.49029541015625, 0.6942138671875, 0.89813232421875, 1.10205078125, 1.30596923828125, 1.5098876953125, 1.71380615234375, 1.917724609375, 2.12164306640625, 2.3255615234375, 2.52947998046875, 2.7333984375, 2.93731689453125, 3.1412353515625, 3.34515380859375, 3.549072265625, 3.75299072265625, 3.9569091796875, 4.16082763671875, 4.36474609375, 4.56866455078125, 4.7725830078125, 4.97650146484375, 5.180419921875, 5.38433837890625, 5.5882568359375, 5.79217529296875, 5.99609375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 7.0, 7.0, 6.0, 5.0, 10.0, 8.0, 17.0, 19.0, 18.0, 19.0, 21.0, 22.0, 24.0, 43.0, 42.0, 25.0, 36.0, 27.0, 32.0, 37.0, 44.0, 29.0, 39.0, 27.0, 45.0, 39.0, 34.0, 38.0, 39.0, 28.0, 35.0, 27.0, 24.0, 21.0, 17.0, 19.0, 13.0, 13.0, 9.0, 10.0, 6.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.125, -7.8763427734375, -7.627685546875, -7.3790283203125, -7.13037109375, -6.8817138671875, -6.633056640625, -6.3843994140625, -6.1357421875, -5.8870849609375, -5.638427734375, -5.3897705078125, -5.14111328125, -4.8924560546875, -4.643798828125, -4.3951416015625, -4.146484375, -3.8978271484375, -3.649169921875, -3.4005126953125, -3.15185546875, -2.9031982421875, -2.654541015625, -2.4058837890625, -2.1572265625, -1.9085693359375, -1.659912109375, -1.4112548828125, -1.16259765625, -0.9139404296875, -0.665283203125, -0.4166259765625, -0.16796875, 0.0806884765625, 0.329345703125, 0.5780029296875, 0.82666015625, 1.0753173828125, 1.323974609375, 1.5726318359375, 1.8212890625, 2.0699462890625, 2.318603515625, 2.5672607421875, 2.81591796875, 3.0645751953125, 3.313232421875, 3.5618896484375, 3.810546875, 4.0592041015625, 4.307861328125, 4.5565185546875, 4.80517578125, 5.0538330078125, 5.302490234375, 5.5511474609375, 5.7998046875, 6.0484619140625, 6.297119140625, 6.5457763671875, 6.79443359375, 7.0430908203125, 7.291748046875, 7.5404052734375, 7.7890625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 6.0, 3.0, 6.0, 3.0, 5.0, 6.0, 10.0, 11.0, 20.0, 25.0, 45.0, 76.0, 100.0, 158.0, 312.0, 498.0, 850.0, 1423.0, 2376.0, 4002.0, 6592.0, 11356.0, 19442.0, 33374.0, 57303.0, 93505.0, 138567.0, 171662.0, 167150.0, 129783.0, 86150.0, 51531.0, 29797.0, 17519.0, 10075.0, 5896.0, 3551.0, 2153.0, 1291.0, 753.0, 434.0, 257.0, 171.0, 111.0, 87.0, 39.0, 28.0, 14.0, 9.0, 10.0, 5.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.31640625, -7.07171630859375, -6.8270263671875, -6.58233642578125, -6.337646484375, -6.09295654296875, -5.8482666015625, -5.60357666015625, -5.35888671875, -5.11419677734375, -4.8695068359375, -4.62481689453125, -4.380126953125, -4.13543701171875, -3.8907470703125, -3.64605712890625, -3.4013671875, -3.15667724609375, -2.9119873046875, -2.66729736328125, -2.422607421875, -2.17791748046875, -1.9332275390625, -1.68853759765625, -1.44384765625, -1.19915771484375, -0.9544677734375, -0.70977783203125, -0.465087890625, -0.22039794921875, 0.0242919921875, 0.26898193359375, 0.513671875, 0.75836181640625, 1.0030517578125, 1.24774169921875, 1.492431640625, 1.73712158203125, 1.9818115234375, 2.22650146484375, 2.47119140625, 2.71588134765625, 2.9605712890625, 3.20526123046875, 3.449951171875, 3.69464111328125, 3.9393310546875, 4.18402099609375, 4.4287109375, 4.67340087890625, 4.9180908203125, 5.16278076171875, 5.407470703125, 5.65216064453125, 5.8968505859375, 6.14154052734375, 6.38623046875, 6.63092041015625, 6.8756103515625, 7.12030029296875, 7.364990234375, 7.60968017578125, 7.8543701171875, 8.09906005859375, 8.34375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 5.0, 7.0, 9.0, 9.0, 8.0, 15.0, 19.0, 14.0, 21.0, 28.0, 32.0, 36.0, 38.0, 44.0, 34.0, 39.0, 39.0, 42.0, 45.0, 56.0, 45.0, 54.0, 46.0, 44.0, 33.0, 34.0, 32.0, 31.0, 22.0, 29.0, 18.0, 25.0, 9.0, 13.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.00390625, -6.8275146484375, -6.651123046875, -6.4747314453125, -6.29833984375, -6.1219482421875, -5.945556640625, -5.7691650390625, -5.5927734375, -5.4163818359375, -5.239990234375, -5.0635986328125, -4.88720703125, -4.7108154296875, -4.534423828125, -4.3580322265625, -4.181640625, -4.0052490234375, -3.828857421875, -3.6524658203125, -3.47607421875, -3.2996826171875, -3.123291015625, -2.9468994140625, -2.7705078125, -2.5941162109375, -2.417724609375, -2.2413330078125, -2.06494140625, -1.8885498046875, -1.712158203125, -1.5357666015625, -1.359375, -1.1829833984375, -1.006591796875, -0.8302001953125, -0.65380859375, -0.4774169921875, -0.301025390625, -0.1246337890625, 0.0517578125, 0.2281494140625, 0.404541015625, 0.5809326171875, 0.75732421875, 0.9337158203125, 1.110107421875, 1.2864990234375, 1.462890625, 1.6392822265625, 1.815673828125, 1.9920654296875, 2.16845703125, 2.3448486328125, 2.521240234375, 2.6976318359375, 2.8740234375, 3.0504150390625, 3.226806640625, 3.4031982421875, 3.57958984375, 3.7559814453125, 3.932373046875, 4.1087646484375, 4.28515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 5.0, 16.0, 17.0, 34.0, 57.0, 73.0, 109.0, 182.0, 283.0, 473.0, 707.0, 1141.0, 1825.0, 3007.0, 4851.0, 8031.0, 13734.0, 23796.0, 41459.0, 72097.0, 118588.0, 168852.0, 186131.0, 154593.0, 103138.0, 61170.0, 35004.0, 20076.0, 11374.0, 6864.0, 4154.0, 2548.0, 1558.0, 926.0, 579.0, 430.0, 233.0, 175.0, 87.0, 67.0, 36.0, 25.0, 19.0, 11.0, 9.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.1171875, -3.99371337890625, -3.8702392578125, -3.74676513671875, -3.623291015625, -3.49981689453125, -3.3763427734375, -3.25286865234375, -3.12939453125, -3.00592041015625, -2.8824462890625, -2.75897216796875, -2.635498046875, -2.51202392578125, -2.3885498046875, -2.26507568359375, -2.1416015625, -2.01812744140625, -1.8946533203125, -1.77117919921875, -1.647705078125, -1.52423095703125, -1.4007568359375, -1.27728271484375, -1.15380859375, -1.03033447265625, -0.9068603515625, -0.78338623046875, -0.659912109375, -0.53643798828125, -0.4129638671875, -0.28948974609375, -0.166015625, -0.04254150390625, 0.0809326171875, 0.20440673828125, 0.327880859375, 0.45135498046875, 0.5748291015625, 0.69830322265625, 0.82177734375, 0.94525146484375, 1.0687255859375, 1.19219970703125, 1.315673828125, 1.43914794921875, 1.5626220703125, 1.68609619140625, 1.8095703125, 1.93304443359375, 2.0565185546875, 2.17999267578125, 2.303466796875, 2.42694091796875, 2.5504150390625, 2.67388916015625, 2.79736328125, 2.92083740234375, 3.0443115234375, 3.16778564453125, 3.291259765625, 3.41473388671875, 3.5382080078125, 3.66168212890625, 3.78515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 0.0, 3.0, 9.0, 6.0, 6.0, 15.0, 8.0, 11.0, 21.0, 22.0, 26.0, 32.0, 36.0, 45.0, 54.0, 68.0, 61.0, 64.0, 78.0, 72.0, 68.0, 59.0, 50.0, 31.0, 42.0, 24.0, 27.0, 13.0, 19.0, 7.0, 9.0, 3.0, 7.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002620220184326172, -0.000249471515417099, -0.0002369210124015808, -0.00022437050938606262, -0.00021182000637054443, -0.00019926950335502625, -0.00018671900033950806, -0.00017416849732398987, -0.00016161799430847168, -0.0001490674912929535, -0.0001365169882774353, -0.00012396648526191711, -0.00011141598224639893, -9.886547923088074e-05, -8.631497621536255e-05, -7.376447319984436e-05, -6.121397018432617e-05, -4.8663467168807983e-05, -3.6112964153289795e-05, -2.3562461137771606e-05, -1.1011958122253418e-05, 1.5385448932647705e-06, 1.4089047908782959e-05, 2.6639550924301147e-05, 3.9190053939819336e-05, 5.1740556955337524e-05, 6.429105997085571e-05, 7.68415629863739e-05, 8.939206600189209e-05, 0.00010194256901741028, 0.00011449307203292847, 0.00012704357504844666, 0.00013959407806396484, 0.00015214458107948303, 0.00016469508409500122, 0.0001772455871105194, 0.0001897960901260376, 0.00020234659314155579, 0.00021489709615707397, 0.00022744759917259216, 0.00023999810218811035, 0.00025254860520362854, 0.00026509910821914673, 0.0002776496112346649, 0.0002902001142501831, 0.0003027506172657013, 0.0003153011202812195, 0.00032785162329673767, 0.00034040212631225586, 0.00035295262932777405, 0.00036550313234329224, 0.0003780536353588104, 0.0003906041383743286, 0.0004031546413898468, 0.000415705144405365, 0.0004282556474208832, 0.00044080615043640137, 0.00045335665345191956, 0.00046590715646743774, 0.00047845765948295593, 0.0004910081624984741, 0.0005035586655139923, 0.0005161091685295105, 0.0005286596715450287, 0.0005412101745605469]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 9.0, 11.0, 9.0, 13.0, 32.0, 46.0, 63.0, 95.0, 156.0, 237.0, 351.0, 552.0, 801.0, 1293.0, 2100.0, 3428.0, 5694.0, 9482.0, 16445.0, 28935.0, 50792.0, 87574.0, 141971.0, 186588.0, 181975.0, 134386.0, 83063.0, 47134.0, 26816.0, 15616.0, 8993.0, 5236.0, 3146.0, 2013.0, 1234.0, 776.0, 464.0, 317.0, 236.0, 147.0, 98.0, 66.0, 54.0, 44.0, 25.0, 16.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.05078125, -3.9239501953125, -3.797119140625, -3.6702880859375, -3.54345703125, -3.4166259765625, -3.289794921875, -3.1629638671875, -3.0361328125, -2.9093017578125, -2.782470703125, -2.6556396484375, -2.52880859375, -2.4019775390625, -2.275146484375, -2.1483154296875, -2.021484375, -1.8946533203125, -1.767822265625, -1.6409912109375, -1.51416015625, -1.3873291015625, -1.260498046875, -1.1336669921875, -1.0068359375, -0.8800048828125, -0.753173828125, -0.6263427734375, -0.49951171875, -0.3726806640625, -0.245849609375, -0.1190185546875, 0.0078125, 0.1346435546875, 0.261474609375, 0.3883056640625, 0.51513671875, 0.6419677734375, 0.768798828125, 0.8956298828125, 1.0224609375, 1.1492919921875, 1.276123046875, 1.4029541015625, 1.52978515625, 1.6566162109375, 1.783447265625, 1.9102783203125, 2.037109375, 2.1639404296875, 2.290771484375, 2.4176025390625, 2.54443359375, 2.6712646484375, 2.798095703125, 2.9249267578125, 3.0517578125, 3.1785888671875, 3.305419921875, 3.4322509765625, 3.55908203125, 3.6859130859375, 3.812744140625, 3.9395751953125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 7.0, 10.0, 18.0, 15.0, 23.0, 20.0, 28.0, 34.0, 41.0, 51.0, 37.0, 51.0, 54.0, 53.0, 59.0, 48.0, 53.0, 59.0, 48.0, 43.0, 38.0, 30.0, 32.0, 29.0, 22.0, 20.0, 15.0, 7.0, 8.0, 7.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3046875, -1.2688369750976562, -1.2329864501953125, -1.1971359252929688, -1.161285400390625, -1.1254348754882812, -1.0895843505859375, -1.0537338256835938, -1.01788330078125, -0.9820327758789062, -0.9461822509765625, -0.9103317260742188, -0.874481201171875, -0.8386306762695312, -0.8027801513671875, -0.7669296264648438, -0.7310791015625, -0.6952285766601562, -0.6593780517578125, -0.6235275268554688, -0.587677001953125, -0.5518264770507812, -0.5159759521484375, -0.48012542724609375, -0.44427490234375, -0.40842437744140625, -0.3725738525390625, -0.33672332763671875, -0.300872802734375, -0.26502227783203125, -0.2291717529296875, -0.19332122802734375, -0.157470703125, -0.12162017822265625, -0.0857696533203125, -0.04991912841796875, -0.014068603515625, 0.02178192138671875, 0.0576324462890625, 0.09348297119140625, 0.12933349609375, 0.16518402099609375, 0.2010345458984375, 0.23688507080078125, 0.272735595703125, 0.30858612060546875, 0.3444366455078125, 0.38028717041015625, 0.4161376953125, 0.45198822021484375, 0.4878387451171875, 0.5236892700195312, 0.559539794921875, 0.5953903198242188, 0.6312408447265625, 0.6670913696289062, 0.70294189453125, 0.7387924194335938, 0.7746429443359375, 0.8104934692382812, 0.846343994140625, 0.8821945190429688, 0.9180450439453125, 0.9538955688476562, 0.98974609375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 9.0, 11.0, 4.0, 11.0, 16.0, 19.0, 25.0, 34.0, 53.0, 57.0, 73.0, 80.0, 88.0, 105.0, 82.0, 85.0, 55.0, 50.0, 37.0, 23.0, 24.0, 17.0, 6.0, 9.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.371761322021484, -12.816137313842773, -12.260513305664062, -11.704889297485352, -11.14926528930664, -10.59364128112793, -10.038016319274902, -9.482392311096191, -8.92676830291748, -8.37114429473877, -7.815520286560059, -7.2598958015441895, -6.7042717933654785, -6.148647785186768, -5.593023300170898, -5.0373992919921875, -4.481775283813477, -3.9261512756347656, -3.3705270290374756, -2.8149027824401855, -2.2592787742614746, -1.7036547660827637, -1.1480305194854736, -0.5924062728881836, -0.036782264709472656, 0.5188418626785278, 1.0744659900665283, 1.6300901174545288, 2.1857142448425293, 2.7413382530212402, 3.2969624996185303, 3.8525867462158203, 4.408210754394531, 4.963834762573242, 5.519458770751953, 6.075083255767822, 6.630707263946533, 7.186331272125244, 7.741955757141113, 8.297579765319824, 8.853203773498535, 9.408827781677246, 9.964451789855957, 10.520075798034668, 11.075700759887695, 11.631324768066406, 12.186948776245117, 12.742572784423828, 13.298196792602539, 13.85382080078125, 14.409444808959961, 14.965068817138672, 15.520692825317383, 16.076316833496094, 16.631940841674805, 17.187564849853516, 17.74319076538086, 18.29881477355957, 18.85443878173828, 19.410062789916992, 19.965686798095703, 20.521310806274414, 21.076934814453125, 21.63256072998047, 22.188182830810547]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 6.0, 3.0, 7.0, 7.0, 10.0, 7.0, 10.0, 13.0, 14.0, 15.0, 22.0, 15.0, 16.0, 27.0, 21.0, 26.0, 40.0, 30.0, 35.0, 32.0, 38.0, 30.0, 31.0, 43.0, 37.0, 51.0, 43.0, 38.0, 30.0, 29.0, 27.0, 24.0, 28.0, 26.0, 30.0, 23.0, 23.0, 17.0, 16.0, 10.0, 12.0, 13.0, 6.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-7.199282646179199, -6.966243743896484, -6.7332048416137695, -6.500165939331055, -6.26712703704834, -6.034088134765625, -5.801049709320068, -5.5680108070373535, -5.334971904754639, -5.101933002471924, -4.868894100189209, -4.635855197906494, -4.4028167724609375, -4.169777870178223, -3.936738967895508, -3.703700065612793, -3.470661163330078, -3.2376222610473633, -3.0045833587646484, -2.7715446949005127, -2.538505792617798, -2.305466890335083, -2.0724282264709473, -1.8393893241882324, -1.6063504219055176, -1.3733115196228027, -1.1402727365493774, -0.9072338938713074, -0.6741950511932373, -0.44115614891052246, -0.20811736583709717, 0.024921417236328125, 0.25796079635620117, 0.49099963903427124, 0.7240384817123413, 0.9570773243904114, 1.1901161670684814, 1.4231550693511963, 1.6561938524246216, 1.8892326354980469, 2.1222715377807617, 2.3553104400634766, 2.5883493423461914, 2.821388006210327, 3.054426908493042, 3.287465810775757, 3.5205044746398926, 3.7535433769226074, 3.9865822792053223, 4.219621181488037, 4.452660083770752, 4.685698986053467, 4.918737411499023, 5.151776313781738, 5.384815216064453, 5.617854118347168, 5.850893020629883, 6.083931922912598, 6.3169708251953125, 6.550009727478027, 6.783048629760742, 7.016087532043457, 7.249125957489014, 7.4821648597717285, 7.715203762054443]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 3.0, 9.0, 20.0, 19.0, 32.0, 44.0, 77.0, 109.0, 153.0, 232.0, 307.0, 482.0, 685.0, 1083.0, 1659.0, 2515.0, 3973.0, 6543.0, 11398.0, 21077.0, 44569.0, 110162.0, 323393.0, 920679.0, 1447071.0, 826367.0, 283672.0, 98966.0, 40716.0, 19850.0, 11023.0, 6452.0, 3907.0, 2473.0, 1566.0, 1013.0, 679.0, 460.0, 295.0, 172.0, 147.0, 86.0, 52.0, 34.0, 21.0, 10.0, 9.0, 7.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.625, -17.064453125, -16.50390625, -15.943359375, -15.3828125, -14.822265625, -14.26171875, -13.701171875, -13.140625, -12.580078125, -12.01953125, -11.458984375, -10.8984375, -10.337890625, -9.77734375, -9.216796875, -8.65625, -8.095703125, -7.53515625, -6.974609375, -6.4140625, -5.853515625, -5.29296875, -4.732421875, -4.171875, -3.611328125, -3.05078125, -2.490234375, -1.9296875, -1.369140625, -0.80859375, -0.248046875, 0.3125, 0.873046875, 1.43359375, 1.994140625, 2.5546875, 3.115234375, 3.67578125, 4.236328125, 4.796875, 5.357421875, 5.91796875, 6.478515625, 7.0390625, 7.599609375, 8.16015625, 8.720703125, 9.28125, 9.841796875, 10.40234375, 10.962890625, 11.5234375, 12.083984375, 12.64453125, 13.205078125, 13.765625, 14.326171875, 14.88671875, 15.447265625, 16.0078125, 16.568359375, 17.12890625, 17.689453125, 18.25]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 0.0, 8.0, 9.0, 9.0, 16.0, 28.0, 17.0, 26.0, 25.0, 20.0, 30.0, 32.0, 40.0, 38.0, 41.0, 32.0, 46.0, 52.0, 40.0, 37.0, 50.0, 47.0, 43.0, 44.0, 41.0, 36.0, 21.0, 28.0, 30.0, 24.0, 13.0, 15.0, 10.0, 14.0, 9.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.96875, -6.74566650390625, -6.5225830078125, -6.29949951171875, -6.076416015625, -5.85333251953125, -5.6302490234375, -5.40716552734375, -5.18408203125, -4.96099853515625, -4.7379150390625, -4.51483154296875, -4.291748046875, -4.06866455078125, -3.8455810546875, -3.62249755859375, -3.3994140625, -3.17633056640625, -2.9532470703125, -2.73016357421875, -2.507080078125, -2.28399658203125, -2.0609130859375, -1.83782958984375, -1.61474609375, -1.39166259765625, -1.1685791015625, -0.94549560546875, -0.722412109375, -0.49932861328125, -0.2762451171875, -0.05316162109375, 0.169921875, 0.39300537109375, 0.6160888671875, 0.83917236328125, 1.062255859375, 1.28533935546875, 1.5084228515625, 1.73150634765625, 1.95458984375, 2.17767333984375, 2.4007568359375, 2.62384033203125, 2.846923828125, 3.07000732421875, 3.2930908203125, 3.51617431640625, 3.7392578125, 3.96234130859375, 4.1854248046875, 4.40850830078125, 4.631591796875, 4.85467529296875, 5.0777587890625, 5.30084228515625, 5.52392578125, 5.74700927734375, 5.9700927734375, 6.19317626953125, 6.416259765625, 6.63934326171875, 6.8624267578125, 7.08551025390625, 7.30859375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 9.0, 11.0, 23.0, 33.0, 42.0, 59.0, 80.0, 121.0, 180.0, 241.0, 435.0, 608.0, 929.0, 1432.0, 2306.0, 3708.0, 6371.0, 10787.0, 20271.0, 39550.0, 85802.0, 202852.0, 502566.0, 1054377.0, 1171566.0, 626973.0, 254277.0, 105829.0, 48092.0, 23749.0, 12544.0, 7074.0, 4201.0, 2608.0, 1602.0, 981.0, 644.0, 427.0, 274.0, 206.0, 134.0, 94.0, 57.0, 50.0, 38.0, 19.0, 19.0, 10.0, 6.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0], "bins": [-18.84375, -18.27490234375, -17.7060546875, -17.13720703125, -16.568359375, -15.99951171875, -15.4306640625, -14.86181640625, -14.29296875, -13.72412109375, -13.1552734375, -12.58642578125, -12.017578125, -11.44873046875, -10.8798828125, -10.31103515625, -9.7421875, -9.17333984375, -8.6044921875, -8.03564453125, -7.466796875, -6.89794921875, -6.3291015625, -5.76025390625, -5.19140625, -4.62255859375, -4.0537109375, -3.48486328125, -2.916015625, -2.34716796875, -1.7783203125, -1.20947265625, -0.640625, -0.07177734375, 0.4970703125, 1.06591796875, 1.634765625, 2.20361328125, 2.7724609375, 3.34130859375, 3.91015625, 4.47900390625, 5.0478515625, 5.61669921875, 6.185546875, 6.75439453125, 7.3232421875, 7.89208984375, 8.4609375, 9.02978515625, 9.5986328125, 10.16748046875, 10.736328125, 11.30517578125, 11.8740234375, 12.44287109375, 13.01171875, 13.58056640625, 14.1494140625, 14.71826171875, 15.287109375, 15.85595703125, 16.4248046875, 16.99365234375, 17.5625]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 7.0, 8.0, 8.0, 12.0, 23.0, 17.0, 42.0, 32.0, 47.0, 63.0, 89.0, 90.0, 131.0, 158.0, 199.0, 238.0, 261.0, 320.0, 313.0, 300.0, 281.0, 289.0, 239.0, 195.0, 164.0, 144.0, 89.0, 78.0, 62.0, 45.0, 21.0, 28.0, 20.0, 11.0, 9.0, 10.0, 12.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.8699951171875, -3.716552734375, -3.5631103515625, -3.40966796875, -3.2562255859375, -3.102783203125, -2.9493408203125, -2.7958984375, -2.6424560546875, -2.489013671875, -2.3355712890625, -2.18212890625, -2.0286865234375, -1.875244140625, -1.7218017578125, -1.568359375, -1.4149169921875, -1.261474609375, -1.1080322265625, -0.95458984375, -0.8011474609375, -0.647705078125, -0.4942626953125, -0.3408203125, -0.1873779296875, -0.033935546875, 0.1195068359375, 0.27294921875, 0.4263916015625, 0.579833984375, 0.7332763671875, 0.88671875, 1.0401611328125, 1.193603515625, 1.3470458984375, 1.50048828125, 1.6539306640625, 1.807373046875, 1.9608154296875, 2.1142578125, 2.2677001953125, 2.421142578125, 2.5745849609375, 2.72802734375, 2.8814697265625, 3.034912109375, 3.1883544921875, 3.341796875, 3.4952392578125, 3.648681640625, 3.8021240234375, 3.95556640625, 4.1090087890625, 4.262451171875, 4.4158935546875, 4.5693359375, 4.7227783203125, 4.876220703125, 5.0296630859375, 5.18310546875, 5.3365478515625, 5.489990234375, 5.6434326171875, 5.796875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 9.0, 13.0, 6.0, 8.0, 16.0, 19.0, 23.0, 31.0, 47.0, 59.0, 62.0, 74.0, 84.0, 61.0, 77.0, 67.0, 58.0, 54.0, 47.0, 35.0, 39.0, 20.0, 19.0, 17.0, 12.0, 9.0, 7.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.190109252929688, -15.663307189941406, -15.136505126953125, -14.609703063964844, -14.082901000976562, -13.556098937988281, -13.029295921325684, -12.502493858337402, -11.975691795349121, -11.44888973236084, -10.922087669372559, -10.395285606384277, -9.86848258972168, -9.341680526733398, -8.814878463745117, -8.288076400756836, -7.761274337768555, -7.234472274780273, -6.707670211791992, -6.180867671966553, -5.6540656089782715, -5.12726354598999, -4.600461006164551, -4.0736589431762695, -3.5468568801879883, -3.020054817199707, -2.4932525157928467, -1.9664503335952759, -1.439648151397705, -0.9128460884094238, -0.3860437870025635, 0.14075851440429688, 0.6675586700439453, 1.1943608522415161, 1.721163034439087, 2.2479653358459473, 2.7747673988342285, 3.3015694618225098, 3.82837176322937, 4.3551740646362305, 4.881976127624512, 5.408778190612793, 5.935580253601074, 6.462382793426514, 6.989184856414795, 7.515986919403076, 8.042789459228516, 8.569591522216797, 9.096393585205078, 9.62319564819336, 10.14999771118164, 10.676799774169922, 11.203601837158203, 11.730403900146484, 12.257206916809082, 12.784008979797363, 13.310811042785645, 13.837613105773926, 14.364415168762207, 14.891217231750488, 15.418020248413086, 15.944822311401367, 16.47162437438965, 16.99842643737793, 17.52522850036621]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 13.0, 15.0, 8.0, 18.0, 10.0, 19.0, 20.0, 24.0, 36.0, 24.0, 25.0, 32.0, 30.0, 36.0, 40.0, 40.0, 30.0, 36.0, 32.0, 34.0, 39.0, 36.0, 33.0, 32.0, 27.0, 35.0, 34.0, 20.0, 33.0, 35.0, 18.0, 23.0, 11.0, 18.0, 20.0, 9.0, 4.0, 7.0, 8.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.16486930847168, -7.919648170471191, -7.674427032470703, -7.429205417633057, -7.183984279632568, -6.93876314163208, -6.693541526794434, -6.448320388793945, -6.203099250793457, -5.957878112792969, -5.7126569747924805, -5.467435359954834, -5.222214221954346, -4.976993083953857, -4.731771469116211, -4.486550331115723, -4.241329193115234, -3.996108055114746, -3.7508866786956787, -3.5056653022766113, -3.260444164276123, -3.0152230262756348, -2.7700016498565674, -2.5247802734375, -2.2795591354370117, -2.0343379974365234, -1.789116621017456, -1.5438953638076782, -1.2986741065979004, -1.0534528493881226, -0.8082315921783447, -0.5630103349685669, -0.31778860092163086, -0.07256734371185303, 0.1726539134979248, 0.41787517070770264, 0.6630964279174805, 0.9083176851272583, 1.1535389423370361, 1.398760199546814, 1.6439814567565918, 1.8892027139663696, 2.1344239711761475, 2.379645347595215, 2.624866485595703, 2.8700876235961914, 3.115309000015259, 3.360530376434326, 3.6057515144348145, 3.8509726524353027, 4.096194267272949, 4.3414154052734375, 4.586636543273926, 4.831857681274414, 5.077078819274902, 5.322300434112549, 5.567521572113037, 5.812742710113525, 6.057964324951172, 6.30318546295166, 6.548406600952148, 6.793627738952637, 7.038848876953125, 7.2840704917907715, 7.52929162979126]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 10.0, 6.0, 11.0, 16.0, 19.0, 40.0, 72.0, 131.0, 176.0, 245.0, 372.0, 548.0, 855.0, 1322.0, 1950.0, 2984.0, 4623.0, 7352.0, 11225.0, 17387.0, 27151.0, 42128.0, 63870.0, 94320.0, 128353.0, 151210.0, 144360.0, 114445.0, 81215.0, 53951.0, 34857.0, 22511.0, 14499.0, 9255.0, 5872.0, 3943.0, 2462.0, 1652.0, 1044.0, 727.0, 448.0, 348.0, 214.0, 138.0, 88.0, 58.0, 40.0, 29.0, 16.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.11328125, -3.99505615234375, -3.8768310546875, -3.75860595703125, -3.640380859375, -3.52215576171875, -3.4039306640625, -3.28570556640625, -3.16748046875, -3.04925537109375, -2.9310302734375, -2.81280517578125, -2.694580078125, -2.57635498046875, -2.4581298828125, -2.33990478515625, -2.2216796875, -2.10345458984375, -1.9852294921875, -1.86700439453125, -1.748779296875, -1.63055419921875, -1.5123291015625, -1.39410400390625, -1.27587890625, -1.15765380859375, -1.0394287109375, -0.92120361328125, -0.802978515625, -0.68475341796875, -0.5665283203125, -0.44830322265625, -0.330078125, -0.21185302734375, -0.0936279296875, 0.02459716796875, 0.142822265625, 0.26104736328125, 0.3792724609375, 0.49749755859375, 0.61572265625, 0.73394775390625, 0.8521728515625, 0.97039794921875, 1.088623046875, 1.20684814453125, 1.3250732421875, 1.44329833984375, 1.5615234375, 1.67974853515625, 1.7979736328125, 1.91619873046875, 2.034423828125, 2.15264892578125, 2.2708740234375, 2.38909912109375, 2.50732421875, 2.62554931640625, 2.7437744140625, 2.86199951171875, 2.980224609375, 3.09844970703125, 3.2166748046875, 3.33489990234375, 3.453125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 0.0, 2.0, 4.0, 4.0, 10.0, 6.0, 12.0, 16.0, 16.0, 11.0, 12.0, 21.0, 16.0, 21.0, 19.0, 24.0, 34.0, 36.0, 27.0, 34.0, 37.0, 31.0, 28.0, 35.0, 46.0, 33.0, 32.0, 42.0, 38.0, 27.0, 32.0, 34.0, 28.0, 24.0, 36.0, 22.0, 19.0, 13.0, 25.0, 21.0, 6.0, 16.0, 13.0, 10.0, 8.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-8.671875, -8.408935546875, -8.14599609375, -7.883056640625, -7.6201171875, -7.357177734375, -7.09423828125, -6.831298828125, -6.568359375, -6.305419921875, -6.04248046875, -5.779541015625, -5.5166015625, -5.253662109375, -4.99072265625, -4.727783203125, -4.46484375, -4.201904296875, -3.93896484375, -3.676025390625, -3.4130859375, -3.150146484375, -2.88720703125, -2.624267578125, -2.361328125, -2.098388671875, -1.83544921875, -1.572509765625, -1.3095703125, -1.046630859375, -0.78369140625, -0.520751953125, -0.2578125, 0.005126953125, 0.26806640625, 0.531005859375, 0.7939453125, 1.056884765625, 1.31982421875, 1.582763671875, 1.845703125, 2.108642578125, 2.37158203125, 2.634521484375, 2.8974609375, 3.160400390625, 3.42333984375, 3.686279296875, 3.94921875, 4.212158203125, 4.47509765625, 4.738037109375, 5.0009765625, 5.263916015625, 5.52685546875, 5.789794921875, 6.052734375, 6.315673828125, 6.57861328125, 6.841552734375, 7.1044921875, 7.367431640625, 7.63037109375, 7.893310546875, 8.15625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 10.0, 15.0, 19.0, 17.0, 38.0, 72.0, 69.0, 117.0, 162.0, 227.0, 351.0, 520.0, 846.0, 1292.0, 1995.0, 3238.0, 5207.0, 9052.0, 15945.0, 28532.0, 53484.0, 102005.0, 181014.0, 236950.0, 182284.0, 102665.0, 54421.0, 28897.0, 15875.0, 9004.0, 5313.0, 3191.0, 1973.0, 1263.0, 839.0, 480.0, 343.0, 243.0, 214.0, 116.0, 82.0, 54.0, 39.0, 20.0, 22.0, 13.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.14453125, -5.95550537109375, -5.7664794921875, -5.57745361328125, -5.388427734375, -5.19940185546875, -5.0103759765625, -4.82135009765625, -4.63232421875, -4.44329833984375, -4.2542724609375, -4.06524658203125, -3.876220703125, -3.68719482421875, -3.4981689453125, -3.30914306640625, -3.1201171875, -2.93109130859375, -2.7420654296875, -2.55303955078125, -2.364013671875, -2.17498779296875, -1.9859619140625, -1.79693603515625, -1.60791015625, -1.41888427734375, -1.2298583984375, -1.04083251953125, -0.851806640625, -0.66278076171875, -0.4737548828125, -0.28472900390625, -0.095703125, 0.09332275390625, 0.2823486328125, 0.47137451171875, 0.660400390625, 0.84942626953125, 1.0384521484375, 1.22747802734375, 1.41650390625, 1.60552978515625, 1.7945556640625, 1.98358154296875, 2.172607421875, 2.36163330078125, 2.5506591796875, 2.73968505859375, 2.9287109375, 3.11773681640625, 3.3067626953125, 3.49578857421875, 3.684814453125, 3.87384033203125, 4.0628662109375, 4.25189208984375, 4.44091796875, 4.62994384765625, 4.8189697265625, 5.00799560546875, 5.197021484375, 5.38604736328125, 5.5750732421875, 5.76409912109375, 5.953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 7.0, 8.0, 9.0, 13.0, 19.0, 18.0, 16.0, 22.0, 19.0, 24.0, 31.0, 26.0, 39.0, 30.0, 36.0, 50.0, 51.0, 41.0, 37.0, 41.0, 44.0, 41.0, 49.0, 28.0, 31.0, 42.0, 28.0, 24.0, 20.0, 22.0, 20.0, 16.0, 19.0, 10.0, 12.0, 12.0, 9.0, 5.0, 3.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.796875, -4.631103515625, -4.46533203125, -4.299560546875, -4.1337890625, -3.968017578125, -3.80224609375, -3.636474609375, -3.470703125, -3.304931640625, -3.13916015625, -2.973388671875, -2.8076171875, -2.641845703125, -2.47607421875, -2.310302734375, -2.14453125, -1.978759765625, -1.81298828125, -1.647216796875, -1.4814453125, -1.315673828125, -1.14990234375, -0.984130859375, -0.818359375, -0.652587890625, -0.48681640625, -0.321044921875, -0.1552734375, 0.010498046875, 0.17626953125, 0.342041015625, 0.5078125, 0.673583984375, 0.83935546875, 1.005126953125, 1.1708984375, 1.336669921875, 1.50244140625, 1.668212890625, 1.833984375, 1.999755859375, 2.16552734375, 2.331298828125, 2.4970703125, 2.662841796875, 2.82861328125, 2.994384765625, 3.16015625, 3.325927734375, 3.49169921875, 3.657470703125, 3.8232421875, 3.989013671875, 4.15478515625, 4.320556640625, 4.486328125, 4.652099609375, 4.81787109375, 4.983642578125, 5.1494140625, 5.315185546875, 5.48095703125, 5.646728515625, 5.8125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 8.0, 6.0, 11.0, 18.0, 17.0, 32.0, 54.0, 64.0, 75.0, 152.0, 193.0, 300.0, 418.0, 667.0, 978.0, 1538.0, 2444.0, 4111.0, 7102.0, 13252.0, 25450.0, 53319.0, 119165.0, 245616.0, 282668.0, 152558.0, 68866.0, 32122.0, 16093.0, 8462.0, 4778.0, 2848.0, 1757.0, 1152.0, 772.0, 471.0, 320.0, 203.0, 152.0, 110.0, 69.0, 54.0, 38.0, 23.0, 16.0, 11.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.560546875, -3.453155517578125, -3.34576416015625, -3.238372802734375, -3.1309814453125, -3.023590087890625, -2.91619873046875, -2.808807373046875, -2.701416015625, -2.594024658203125, -2.48663330078125, -2.379241943359375, -2.2718505859375, -2.164459228515625, -2.05706787109375, -1.949676513671875, -1.84228515625, -1.734893798828125, -1.62750244140625, -1.520111083984375, -1.4127197265625, -1.305328369140625, -1.19793701171875, -1.090545654296875, -0.983154296875, -0.875762939453125, -0.76837158203125, -0.660980224609375, -0.5535888671875, -0.446197509765625, -0.33880615234375, -0.231414794921875, -0.1240234375, -0.016632080078125, 0.09075927734375, 0.198150634765625, 0.3055419921875, 0.412933349609375, 0.52032470703125, 0.627716064453125, 0.735107421875, 0.842498779296875, 0.94989013671875, 1.057281494140625, 1.1646728515625, 1.272064208984375, 1.37945556640625, 1.486846923828125, 1.59423828125, 1.701629638671875, 1.80902099609375, 1.916412353515625, 2.0238037109375, 2.131195068359375, 2.23858642578125, 2.345977783203125, 2.453369140625, 2.560760498046875, 2.66815185546875, 2.775543212890625, 2.8829345703125, 2.990325927734375, 3.09771728515625, 3.205108642578125, 3.3125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 10.0, 10.0, 14.0, 16.0, 14.0, 20.0, 26.0, 33.0, 35.0, 46.0, 54.0, 62.0, 55.0, 89.0, 66.0, 64.0, 64.0, 52.0, 57.0, 25.0, 36.0, 26.0, 23.0, 20.0, 18.0, 13.0, 8.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0001735687255859375, -0.00016891956329345703, -0.00016427040100097656, -0.0001596212387084961, -0.00015497207641601562, -0.00015032291412353516, -0.0001456737518310547, -0.00014102458953857422, -0.00013637542724609375, -0.00013172626495361328, -0.0001270771026611328, -0.00012242794036865234, -0.00011777877807617188, -0.0001131296157836914, -0.00010848045349121094, -0.00010383129119873047, -9.918212890625e-05, -9.453296661376953e-05, -8.988380432128906e-05, -8.52346420288086e-05, -8.058547973632812e-05, -7.593631744384766e-05, -7.128715515136719e-05, -6.663799285888672e-05, -6.198883056640625e-05, -5.733966827392578e-05, -5.269050598144531e-05, -4.8041343688964844e-05, -4.3392181396484375e-05, -3.8743019104003906e-05, -3.409385681152344e-05, -2.944469451904297e-05, -2.47955322265625e-05, -2.014636993408203e-05, -1.5497207641601562e-05, -1.0848045349121094e-05, -6.198883056640625e-06, -1.5497207641601562e-06, 3.0994415283203125e-06, 7.748603820800781e-06, 1.239776611328125e-05, 1.704692840576172e-05, 2.1696090698242188e-05, 2.6345252990722656e-05, 3.0994415283203125e-05, 3.5643577575683594e-05, 4.029273986816406e-05, 4.494190216064453e-05, 4.9591064453125e-05, 5.424022674560547e-05, 5.888938903808594e-05, 6.35385513305664e-05, 6.818771362304688e-05, 7.283687591552734e-05, 7.748603820800781e-05, 8.213520050048828e-05, 8.678436279296875e-05, 9.143352508544922e-05, 9.608268737792969e-05, 0.00010073184967041016, 0.00010538101196289062, 0.0001100301742553711, 0.00011467933654785156, 0.00011932849884033203, 0.0001239776611328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 9.0, 12.0, 12.0, 22.0, 32.0, 38.0, 69.0, 95.0, 150.0, 226.0, 318.0, 481.0, 767.0, 1195.0, 1863.0, 2965.0, 5014.0, 8238.0, 14033.0, 24676.0, 44883.0, 84927.0, 153369.0, 220018.0, 202260.0, 127621.0, 68410.0, 36766.0, 20302.0, 11576.0, 7017.0, 4034.0, 2593.0, 1625.0, 1032.0, 667.0, 414.0, 268.0, 168.0, 117.0, 73.0, 56.0, 47.0, 25.0, 25.0, 15.0, 12.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.140625, -3.041961669921875, -2.94329833984375, -2.844635009765625, -2.7459716796875, -2.647308349609375, -2.54864501953125, -2.449981689453125, -2.351318359375, -2.252655029296875, -2.15399169921875, -2.055328369140625, -1.9566650390625, -1.858001708984375, -1.75933837890625, -1.660675048828125, -1.56201171875, -1.463348388671875, -1.36468505859375, -1.266021728515625, -1.1673583984375, -1.068695068359375, -0.97003173828125, -0.871368408203125, -0.772705078125, -0.674041748046875, -0.57537841796875, -0.476715087890625, -0.3780517578125, -0.279388427734375, -0.18072509765625, -0.082061767578125, 0.0166015625, 0.115264892578125, 0.21392822265625, 0.312591552734375, 0.4112548828125, 0.509918212890625, 0.60858154296875, 0.707244873046875, 0.805908203125, 0.904571533203125, 1.00323486328125, 1.101898193359375, 1.2005615234375, 1.299224853515625, 1.39788818359375, 1.496551513671875, 1.59521484375, 1.693878173828125, 1.79254150390625, 1.891204833984375, 1.9898681640625, 2.088531494140625, 2.18719482421875, 2.285858154296875, 2.384521484375, 2.483184814453125, 2.58184814453125, 2.680511474609375, 2.7791748046875, 2.877838134765625, 2.97650146484375, 3.075164794921875, 3.173828125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 5.0, 1.0, 5.0, 5.0, 6.0, 9.0, 11.0, 10.0, 13.0, 13.0, 14.0, 17.0, 31.0, 27.0, 32.0, 52.0, 60.0, 62.0, 77.0, 60.0, 61.0, 66.0, 62.0, 56.0, 46.0, 46.0, 28.0, 28.0, 15.0, 12.0, 13.0, 17.0, 9.0, 5.0, 8.0, 5.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.015625, -0.9866485595703125, -0.957672119140625, -0.9286956787109375, -0.89971923828125, -0.8707427978515625, -0.841766357421875, -0.8127899169921875, -0.7838134765625, -0.7548370361328125, -0.725860595703125, -0.6968841552734375, -0.66790771484375, -0.6389312744140625, -0.609954833984375, -0.5809783935546875, -0.552001953125, -0.5230255126953125, -0.494049072265625, -0.4650726318359375, -0.43609619140625, -0.4071197509765625, -0.378143310546875, -0.3491668701171875, -0.3201904296875, -0.2912139892578125, -0.262237548828125, -0.2332611083984375, -0.20428466796875, -0.1753082275390625, -0.146331787109375, -0.1173553466796875, -0.08837890625, -0.0594024658203125, -0.030426025390625, -0.0014495849609375, 0.02752685546875, 0.0565032958984375, 0.085479736328125, 0.1144561767578125, 0.1434326171875, 0.1724090576171875, 0.201385498046875, 0.2303619384765625, 0.25933837890625, 0.2883148193359375, 0.317291259765625, 0.3462677001953125, 0.375244140625, 0.4042205810546875, 0.433197021484375, 0.4621734619140625, 0.49114990234375, 0.5201263427734375, 0.549102783203125, 0.5780792236328125, 0.6070556640625, 0.6360321044921875, 0.665008544921875, 0.6939849853515625, 0.72296142578125, 0.7519378662109375, 0.780914306640625, 0.8098907470703125, 0.8388671875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 9.0, 10.0, 9.0, 14.0, 18.0, 25.0, 26.0, 40.0, 63.0, 59.0, 62.0, 79.0, 71.0, 68.0, 77.0, 55.0, 54.0, 60.0, 29.0, 28.0, 34.0, 21.0, 13.0, 16.0, 11.0, 8.0, 8.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.306214332580566, -14.796100616455078, -14.28598690032959, -13.775873184204102, -13.26576042175293, -12.755645751953125, -12.245532989501953, -11.735419273376465, -11.225305557250977, -10.715191841125488, -10.205078125, -9.694964408874512, -9.184850692749023, -8.674737930297852, -8.164624214172363, -7.654510498046875, -7.144396781921387, -6.634283065795898, -6.12416934967041, -5.61405611038208, -5.103942394256592, -4.5938286781311035, -4.083715438842773, -3.573601722717285, -3.063488006591797, -2.5533742904663086, -2.0432608127593994, -1.5331472158432007, -1.023033618927002, -0.5129199028015137, -0.002806425094604492, 0.5073070526123047, 1.0174198150634766, 1.5275334119796753, 2.037647008895874, 2.547760486602783, 3.0578742027282715, 3.5679879188537598, 4.07810115814209, 4.588214874267578, 5.098328590393066, 5.608442306518555, 6.118556022644043, 6.628669261932373, 7.138782978057861, 7.64889669418335, 8.15900993347168, 8.669123649597168, 9.179237365722656, 9.689351081848145, 10.199464797973633, 10.709578514099121, 11.21969223022461, 11.729804992675781, 12.23991870880127, 12.750032424926758, 13.260146141052246, 13.770259857177734, 14.280373573303223, 14.790487289428711, 15.300600051879883, 15.810714721679688, 16.32082748413086, 16.83094024658203, 17.341054916381836]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 8.0, 15.0, 13.0, 9.0, 18.0, 15.0, 16.0, 22.0, 23.0, 29.0, 27.0, 27.0, 32.0, 31.0, 39.0, 27.0, 45.0, 24.0, 46.0, 35.0, 36.0, 31.0, 32.0, 41.0, 29.0, 31.0, 33.0, 29.0, 25.0, 35.0, 32.0, 17.0, 17.0, 14.0, 21.0, 13.0, 11.0, 6.0, 8.0, 7.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.075865745544434, -7.832607269287109, -7.589348793029785, -7.346090316772461, -7.102831840515137, -6.8595733642578125, -6.616314888000488, -6.373056411743164, -6.12979793548584, -5.886539459228516, -5.643280982971191, -5.400022506713867, -5.156764030456543, -4.913505554199219, -4.6702470779418945, -4.42698860168457, -4.183730125427246, -3.940471649169922, -3.6972131729125977, -3.4539546966552734, -3.210696220397949, -2.967437744140625, -2.724179267883301, -2.4809207916259766, -2.2376623153686523, -1.9944038391113281, -1.751145362854004, -1.5078868865966797, -1.2646284103393555, -1.0213699340820312, -0.778111457824707, -0.5348529815673828, -0.2915940284729004, -0.04833555221557617, 0.19492292404174805, 0.43818140029907227, 0.6814398765563965, 0.9246983528137207, 1.167956829071045, 1.4112153053283691, 1.6544737815856934, 1.8977322578430176, 2.140990734100342, 2.384249210357666, 2.6275076866149902, 2.8707661628723145, 3.1140246391296387, 3.357283115386963, 3.600541591644287, 3.8438000679016113, 4.0870585441589355, 4.33031702041626, 4.573575496673584, 4.816833972930908, 5.060092449188232, 5.303350925445557, 5.546609401702881, 5.789867877960205, 6.033126354217529, 6.2763848304748535, 6.519643306732178, 6.762901782989502, 7.006160259246826, 7.24941873550415, 7.492677211761475]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 16.0, 17.0, 18.0, 37.0, 58.0, 87.0, 142.0, 196.0, 338.0, 499.0, 758.0, 1254.0, 1999.0, 3346.0, 5420.0, 9005.0, 14803.0, 24114.0, 39183.0, 61630.0, 93147.0, 126140.0, 149337.0, 149143.0, 122839.0, 88903.0, 59439.0, 37412.0, 23198.0, 14025.0, 8449.0, 5153.0, 3171.0, 1929.0, 1181.0, 775.0, 514.0, 331.0, 193.0, 91.0, 77.0, 49.0, 40.0, 28.0, 22.0, 7.0, 8.0, 6.0, 5.0, 4.0, 3.0], "bins": [-8.015625, -7.79266357421875, -7.5697021484375, -7.34674072265625, -7.123779296875, -6.90081787109375, -6.6778564453125, -6.45489501953125, -6.23193359375, -6.00897216796875, -5.7860107421875, -5.56304931640625, -5.340087890625, -5.11712646484375, -4.8941650390625, -4.67120361328125, -4.4482421875, -4.22528076171875, -4.0023193359375, -3.77935791015625, -3.556396484375, -3.33343505859375, -3.1104736328125, -2.88751220703125, -2.66455078125, -2.44158935546875, -2.2186279296875, -1.99566650390625, -1.772705078125, -1.54974365234375, -1.3267822265625, -1.10382080078125, -0.880859375, -0.65789794921875, -0.4349365234375, -0.21197509765625, 0.010986328125, 0.23394775390625, 0.4569091796875, 0.67987060546875, 0.90283203125, 1.12579345703125, 1.3487548828125, 1.57171630859375, 1.794677734375, 2.01763916015625, 2.2406005859375, 2.46356201171875, 2.6865234375, 2.90948486328125, 3.1324462890625, 3.35540771484375, 3.578369140625, 3.80133056640625, 4.0242919921875, 4.24725341796875, 4.47021484375, 4.69317626953125, 4.9161376953125, 5.13909912109375, 5.362060546875, 5.58502197265625, 5.8079833984375, 6.03094482421875, 6.25390625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 13.0, 7.0, 9.0, 16.0, 24.0, 22.0, 35.0, 20.0, 21.0, 32.0, 35.0, 32.0, 24.0, 30.0, 40.0, 37.0, 34.0, 47.0, 39.0, 45.0, 39.0, 33.0, 38.0, 30.0, 28.0, 34.0, 29.0, 34.0, 29.0, 10.0, 17.0, 22.0, 10.0, 12.0, 15.0, 7.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-9.75, -9.4776611328125, -9.205322265625, -8.9329833984375, -8.66064453125, -8.3883056640625, -8.115966796875, -7.8436279296875, -7.5712890625, -7.2989501953125, -7.026611328125, -6.7542724609375, -6.48193359375, -6.2095947265625, -5.937255859375, -5.6649169921875, -5.392578125, -5.1202392578125, -4.847900390625, -4.5755615234375, -4.30322265625, -4.0308837890625, -3.758544921875, -3.4862060546875, -3.2138671875, -2.9415283203125, -2.669189453125, -2.3968505859375, -2.12451171875, -1.8521728515625, -1.579833984375, -1.3074951171875, -1.03515625, -0.7628173828125, -0.490478515625, -0.2181396484375, 0.05419921875, 0.3265380859375, 0.598876953125, 0.8712158203125, 1.1435546875, 1.4158935546875, 1.688232421875, 1.9605712890625, 2.23291015625, 2.5052490234375, 2.777587890625, 3.0499267578125, 3.322265625, 3.5946044921875, 3.866943359375, 4.1392822265625, 4.41162109375, 4.6839599609375, 4.956298828125, 5.2286376953125, 5.5009765625, 5.7733154296875, 6.045654296875, 6.3179931640625, 6.59033203125, 6.8626708984375, 7.135009765625, 7.4073486328125, 7.6796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 20.0, 27.0, 44.0, 67.0, 107.0, 150.0, 203.0, 345.0, 527.0, 785.0, 1141.0, 1668.0, 2545.0, 4005.0, 6092.0, 9300.0, 14585.0, 22278.0, 34087.0, 52027.0, 73683.0, 101061.0, 124619.0, 134528.0, 126330.0, 104474.0, 77069.0, 53934.0, 36077.0, 23594.0, 14882.0, 9703.0, 6365.0, 4206.0, 2772.0, 1756.0, 1108.0, 770.0, 520.0, 350.0, 250.0, 166.0, 95.0, 77.0, 53.0, 30.0, 30.0, 17.0, 7.0, 6.0, 5.0, 3.0, 4.0], "bins": [-6.8671875, -6.66845703125, -6.4697265625, -6.27099609375, -6.072265625, -5.87353515625, -5.6748046875, -5.47607421875, -5.27734375, -5.07861328125, -4.8798828125, -4.68115234375, -4.482421875, -4.28369140625, -4.0849609375, -3.88623046875, -3.6875, -3.48876953125, -3.2900390625, -3.09130859375, -2.892578125, -2.69384765625, -2.4951171875, -2.29638671875, -2.09765625, -1.89892578125, -1.7001953125, -1.50146484375, -1.302734375, -1.10400390625, -0.9052734375, -0.70654296875, -0.5078125, -0.30908203125, -0.1103515625, 0.08837890625, 0.287109375, 0.48583984375, 0.6845703125, 0.88330078125, 1.08203125, 1.28076171875, 1.4794921875, 1.67822265625, 1.876953125, 2.07568359375, 2.2744140625, 2.47314453125, 2.671875, 2.87060546875, 3.0693359375, 3.26806640625, 3.466796875, 3.66552734375, 3.8642578125, 4.06298828125, 4.26171875, 4.46044921875, 4.6591796875, 4.85791015625, 5.056640625, 5.25537109375, 5.4541015625, 5.65283203125, 5.8515625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 9.0, 10.0, 20.0, 15.0, 13.0, 28.0, 19.0, 17.0, 29.0, 39.0, 35.0, 43.0, 51.0, 43.0, 50.0, 58.0, 56.0, 45.0, 51.0, 44.0, 30.0, 36.0, 37.0, 28.0, 39.0, 24.0, 30.0, 19.0, 14.0, 14.0, 6.0, 13.0, 6.0, 7.0, 5.0, 2.0, 1.0, 0.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.796875, -6.593994140625, -6.39111328125, -6.188232421875, -5.9853515625, -5.782470703125, -5.57958984375, -5.376708984375, -5.173828125, -4.970947265625, -4.76806640625, -4.565185546875, -4.3623046875, -4.159423828125, -3.95654296875, -3.753662109375, -3.55078125, -3.347900390625, -3.14501953125, -2.942138671875, -2.7392578125, -2.536376953125, -2.33349609375, -2.130615234375, -1.927734375, -1.724853515625, -1.52197265625, -1.319091796875, -1.1162109375, -0.913330078125, -0.71044921875, -0.507568359375, -0.3046875, -0.101806640625, 0.10107421875, 0.303955078125, 0.5068359375, 0.709716796875, 0.91259765625, 1.115478515625, 1.318359375, 1.521240234375, 1.72412109375, 1.927001953125, 2.1298828125, 2.332763671875, 2.53564453125, 2.738525390625, 2.94140625, 3.144287109375, 3.34716796875, 3.550048828125, 3.7529296875, 3.955810546875, 4.15869140625, 4.361572265625, 4.564453125, 4.767333984375, 4.97021484375, 5.173095703125, 5.3759765625, 5.578857421875, 5.78173828125, 5.984619140625, 6.1875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 25.0, 21.0, 31.0, 50.0, 75.0, 146.0, 193.0, 332.0, 590.0, 1050.0, 1907.0, 3672.0, 7199.0, 15021.0, 31750.0, 68463.0, 138895.0, 223291.0, 237199.0, 160828.0, 82660.0, 38683.0, 18324.0, 8649.0, 4323.0, 2265.0, 1248.0, 694.0, 395.0, 222.0, 118.0, 79.0, 49.0, 31.0, 20.0, 13.0, 12.0, 6.0, 7.0, 4.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51953125, -6.3284912109375, -6.137451171875, -5.9464111328125, -5.75537109375, -5.5643310546875, -5.373291015625, -5.1822509765625, -4.9912109375, -4.8001708984375, -4.609130859375, -4.4180908203125, -4.22705078125, -4.0360107421875, -3.844970703125, -3.6539306640625, -3.462890625, -3.2718505859375, -3.080810546875, -2.8897705078125, -2.69873046875, -2.5076904296875, -2.316650390625, -2.1256103515625, -1.9345703125, -1.7435302734375, -1.552490234375, -1.3614501953125, -1.17041015625, -0.9793701171875, -0.788330078125, -0.5972900390625, -0.40625, -0.2152099609375, -0.024169921875, 0.1668701171875, 0.35791015625, 0.5489501953125, 0.739990234375, 0.9310302734375, 1.1220703125, 1.3131103515625, 1.504150390625, 1.6951904296875, 1.88623046875, 2.0772705078125, 2.268310546875, 2.4593505859375, 2.650390625, 2.8414306640625, 3.032470703125, 3.2235107421875, 3.41455078125, 3.6055908203125, 3.796630859375, 3.9876708984375, 4.1787109375, 4.3697509765625, 4.560791015625, 4.7518310546875, 4.94287109375, 5.1339111328125, 5.324951171875, 5.5159912109375, 5.70703125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 10.0, 1.0, 12.0, 25.0, 19.0, 29.0, 29.0, 50.0, 34.0, 61.0, 50.0, 60.0, 62.0, 61.0, 57.0, 55.0, 75.0, 48.0, 40.0, 37.0, 21.0, 23.0, 17.0, 29.0, 15.0, 10.0, 11.0, 7.0, 9.0, 8.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040340423583984375, -0.00038981810212135315, -0.00037623196840286255, -0.00036264583468437195, -0.00034905970096588135, -0.00033547356724739075, -0.00032188743352890015, -0.00030830129981040955, -0.00029471516609191895, -0.00028112903237342834, -0.00026754289865493774, -0.00025395676493644714, -0.00024037063121795654, -0.00022678449749946594, -0.00021319836378097534, -0.00019961223006248474, -0.00018602609634399414, -0.00017243996262550354, -0.00015885382890701294, -0.00014526769518852234, -0.00013168156147003174, -0.00011809542775154114, -0.00010450929403305054, -9.092316031455994e-05, -7.733702659606934e-05, -6.375089287757874e-05, -5.0164759159088135e-05, -3.6578625440597534e-05, -2.2992491722106934e-05, -9.406358003616333e-06, 4.179775714874268e-06, 1.7765909433364868e-05, 3.135204315185547e-05, 4.493817687034607e-05, 5.852431058883667e-05, 7.211044430732727e-05, 8.569657802581787e-05, 9.928271174430847e-05, 0.00011286884546279907, 0.00012645497918128967, 0.00014004111289978027, 0.00015362724661827087, 0.00016721338033676147, 0.00018079951405525208, 0.00019438564777374268, 0.00020797178149223328, 0.00022155791521072388, 0.00023514404892921448, 0.0002487301826477051, 0.0002623163163661957, 0.0002759024500846863, 0.0002894885838031769, 0.0003030747175216675, 0.0003166608512401581, 0.0003302469849586487, 0.0003438331186771393, 0.0003574192523956299, 0.0003710053861141205, 0.0003845915198326111, 0.0003981776535511017, 0.0004117637872695923, 0.0004253499209880829, 0.0004389360547065735, 0.0004525221884250641, 0.0004661083221435547]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 17.0, 12.0, 26.0, 42.0, 57.0, 76.0, 106.0, 167.0, 237.0, 431.0, 647.0, 1005.0, 1615.0, 2609.0, 4452.0, 7948.0, 14307.0, 26158.0, 49573.0, 90812.0, 151517.0, 200993.0, 191521.0, 133835.0, 77548.0, 41684.0, 22322.0, 12130.0, 6715.0, 3830.0, 2277.0, 1437.0, 844.0, 531.0, 382.0, 258.0, 133.0, 95.0, 77.0, 38.0, 22.0, 22.0, 14.0, 12.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.83203125, -4.67022705078125, -4.5084228515625, -4.34661865234375, -4.184814453125, -4.02301025390625, -3.8612060546875, -3.69940185546875, -3.53759765625, -3.37579345703125, -3.2139892578125, -3.05218505859375, -2.890380859375, -2.72857666015625, -2.5667724609375, -2.40496826171875, -2.2431640625, -2.08135986328125, -1.9195556640625, -1.75775146484375, -1.595947265625, -1.43414306640625, -1.2723388671875, -1.11053466796875, -0.94873046875, -0.78692626953125, -0.6251220703125, -0.46331787109375, -0.301513671875, -0.13970947265625, 0.0220947265625, 0.18389892578125, 0.345703125, 0.50750732421875, 0.6693115234375, 0.83111572265625, 0.992919921875, 1.15472412109375, 1.3165283203125, 1.47833251953125, 1.64013671875, 1.80194091796875, 1.9637451171875, 2.12554931640625, 2.287353515625, 2.44915771484375, 2.6109619140625, 2.77276611328125, 2.9345703125, 3.09637451171875, 3.2581787109375, 3.41998291015625, 3.581787109375, 3.74359130859375, 3.9053955078125, 4.06719970703125, 4.22900390625, 4.39080810546875, 4.5526123046875, 4.71441650390625, 4.876220703125, 5.03802490234375, 5.1998291015625, 5.36163330078125, 5.5234375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 5.0, 12.0, 12.0, 15.0, 27.0, 45.0, 35.0, 53.0, 61.0, 62.0, 59.0, 66.0, 59.0, 69.0, 70.0, 63.0, 49.0, 42.0, 40.0, 34.0, 25.0, 16.0, 13.0, 14.0, 10.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34375, -1.296356201171875, -1.24896240234375, -1.201568603515625, -1.1541748046875, -1.106781005859375, -1.05938720703125, -1.011993408203125, -0.964599609375, -0.917205810546875, -0.86981201171875, -0.822418212890625, -0.7750244140625, -0.727630615234375, -0.68023681640625, -0.632843017578125, -0.58544921875, -0.538055419921875, -0.49066162109375, -0.443267822265625, -0.3958740234375, -0.348480224609375, -0.30108642578125, -0.253692626953125, -0.206298828125, -0.158905029296875, -0.11151123046875, -0.064117431640625, -0.0167236328125, 0.030670166015625, 0.07806396484375, 0.125457763671875, 0.1728515625, 0.220245361328125, 0.26763916015625, 0.315032958984375, 0.3624267578125, 0.409820556640625, 0.45721435546875, 0.504608154296875, 0.552001953125, 0.599395751953125, 0.64678955078125, 0.694183349609375, 0.7415771484375, 0.788970947265625, 0.83636474609375, 0.883758544921875, 0.93115234375, 0.978546142578125, 1.02593994140625, 1.073333740234375, 1.1207275390625, 1.168121337890625, 1.21551513671875, 1.262908935546875, 1.310302734375, 1.357696533203125, 1.40509033203125, 1.452484130859375, 1.4998779296875, 1.547271728515625, 1.59466552734375, 1.642059326171875, 1.689453125]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 8.0, 11.0, 6.0, 15.0, 11.0, 19.0, 29.0, 34.0, 42.0, 49.0, 51.0, 66.0, 62.0, 67.0, 72.0, 71.0, 62.0, 45.0, 47.0, 39.0, 32.0, 27.0, 34.0, 18.0, 12.0, 15.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.118241310119629, -12.634806632995605, -12.151372909545898, -11.667938232421875, -11.184503555297852, -10.701068878173828, -10.217634201049805, -9.734200477600098, -9.250765800476074, -8.76733112335205, -8.283897399902344, -7.80046272277832, -7.317028045654297, -6.833593368530273, -6.350159168243408, -5.866724967956543, -5.3832902908325195, -4.899855613708496, -4.416421413421631, -3.9329869747161865, -3.449552536010742, -2.966118097305298, -2.4826836585998535, -1.9992492198944092, -1.5158147811889648, -1.0323803424835205, -0.5489459037780762, -0.06551146507263184, 0.4179229736328125, 0.9013574123382568, 1.3847918510437012, 1.8682262897491455, 2.3516597747802734, 2.8350942134857178, 3.318528652191162, 3.8019630908966064, 4.285397529602051, 4.768832206726074, 5.2522664070129395, 5.735700607299805, 6.219135284423828, 6.702569961547852, 7.186004161834717, 7.669438362121582, 8.152873039245605, 8.636307716369629, 9.119741439819336, 9.60317611694336, 10.086610794067383, 10.570045471191406, 11.05348014831543, 11.536913871765137, 12.02034854888916, 12.503783226013184, 12.98721694946289, 13.470651626586914, 13.954086303710938, 14.437520980834961, 14.920955657958984, 15.404389381408691, 15.887824058532715, 16.371257781982422, 16.854692459106445, 17.33812713623047, 17.821561813354492]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 2.0, 5.0, 13.0, 10.0, 7.0, 13.0, 16.0, 12.0, 15.0, 21.0, 17.0, 30.0, 29.0, 21.0, 32.0, 31.0, 27.0, 26.0, 40.0, 43.0, 38.0, 47.0, 31.0, 47.0, 37.0, 29.0, 35.0, 28.0, 20.0, 24.0, 33.0, 29.0, 27.0, 19.0, 20.0, 23.0, 25.0, 16.0, 12.0, 7.0, 10.0, 8.0, 4.0, 8.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.252270698547363, -7.994381427764893, -7.736492156982422, -7.478602886199951, -7.2207136154174805, -6.96282434463501, -6.704935073852539, -6.447045803070068, -6.189156532287598, -5.931267261505127, -5.673377990722656, -5.4154887199401855, -5.157599449157715, -4.899710178375244, -4.641820907592773, -4.383931636810303, -4.126042366027832, -3.8681530952453613, -3.6102638244628906, -3.35237455368042, -3.094485282897949, -2.8365960121154785, -2.578706741333008, -2.320817470550537, -2.0629281997680664, -1.8050389289855957, -1.547149658203125, -1.2892603874206543, -1.0313711166381836, -0.7734818458557129, -0.5155925750732422, -0.2577033042907715, 0.000186920166015625, 0.25807619094848633, 0.515965461730957, 0.7738547325134277, 1.0317440032958984, 1.2896332740783691, 1.5475225448608398, 1.8054118156433105, 2.0633010864257812, 2.321190357208252, 2.5790796279907227, 2.8369688987731934, 3.094858169555664, 3.3527474403381348, 3.6106367111206055, 3.868525981903076, 4.126415252685547, 4.384304523468018, 4.642193794250488, 4.900083065032959, 5.15797233581543, 5.4158616065979, 5.673750877380371, 5.931640148162842, 6.1895294189453125, 6.447418689727783, 6.705307960510254, 6.963197231292725, 7.221086502075195, 7.478975772857666, 7.736865043640137, 7.994754314422607, 8.252643585205078]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 5.0, 15.0, 18.0, 29.0, 38.0, 53.0, 54.0, 71.0, 108.0, 171.0, 225.0, 291.0, 461.0, 670.0, 957.0, 1439.0, 2238.0, 3444.0, 5649.0, 9395.0, 17330.0, 34018.0, 74596.0, 181946.0, 474161.0, 1040454.0, 1215048.0, 670022.0, 262634.0, 101560.0, 44472.0, 21406.0, 11832.0, 6996.0, 4272.0, 2670.0, 1807.0, 1172.0, 812.0, 542.0, 366.0, 274.0, 172.0, 130.0, 73.0, 56.0, 44.0, 29.0, 18.0, 12.0, 11.0, 11.0, 1.0, 2.0, 1.0, 1.0], "bins": [-20.109375, -19.521240234375, -18.93310546875, -18.344970703125, -17.7568359375, -17.168701171875, -16.58056640625, -15.992431640625, -15.404296875, -14.816162109375, -14.22802734375, -13.639892578125, -13.0517578125, -12.463623046875, -11.87548828125, -11.287353515625, -10.69921875, -10.111083984375, -9.52294921875, -8.934814453125, -8.3466796875, -7.758544921875, -7.17041015625, -6.582275390625, -5.994140625, -5.406005859375, -4.81787109375, -4.229736328125, -3.6416015625, -3.053466796875, -2.46533203125, -1.877197265625, -1.2890625, -0.700927734375, -0.11279296875, 0.475341796875, 1.0634765625, 1.651611328125, 2.23974609375, 2.827880859375, 3.416015625, 4.004150390625, 4.59228515625, 5.180419921875, 5.7685546875, 6.356689453125, 6.94482421875, 7.532958984375, 8.12109375, 8.709228515625, 9.29736328125, 9.885498046875, 10.4736328125, 11.061767578125, 11.64990234375, 12.238037109375, 12.826171875, 13.414306640625, 14.00244140625, 14.590576171875, 15.1787109375, 15.766845703125, 16.35498046875, 16.943115234375, 17.53125]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 6.0, 8.0, 9.0, 7.0, 14.0, 10.0, 15.0, 14.0, 21.0, 23.0, 29.0, 32.0, 29.0, 31.0, 37.0, 38.0, 24.0, 41.0, 47.0, 51.0, 43.0, 38.0, 32.0, 31.0, 39.0, 49.0, 30.0, 32.0, 20.0, 31.0, 33.0, 24.0, 25.0, 20.0, 12.0, 9.0, 9.0, 10.0, 8.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.5625, -8.31329345703125, -8.0640869140625, -7.81488037109375, -7.565673828125, -7.31646728515625, -7.0672607421875, -6.81805419921875, -6.56884765625, -6.31964111328125, -6.0704345703125, -5.82122802734375, -5.572021484375, -5.32281494140625, -5.0736083984375, -4.82440185546875, -4.5751953125, -4.32598876953125, -4.0767822265625, -3.82757568359375, -3.578369140625, -3.32916259765625, -3.0799560546875, -2.83074951171875, -2.58154296875, -2.33233642578125, -2.0831298828125, -1.83392333984375, -1.584716796875, -1.33551025390625, -1.0863037109375, -0.83709716796875, -0.587890625, -0.33868408203125, -0.0894775390625, 0.15972900390625, 0.408935546875, 0.65814208984375, 0.9073486328125, 1.15655517578125, 1.40576171875, 1.65496826171875, 1.9041748046875, 2.15338134765625, 2.402587890625, 2.65179443359375, 2.9010009765625, 3.15020751953125, 3.3994140625, 3.64862060546875, 3.8978271484375, 4.14703369140625, 4.396240234375, 4.64544677734375, 4.8946533203125, 5.14385986328125, 5.39306640625, 5.64227294921875, 5.8914794921875, 6.14068603515625, 6.389892578125, 6.63909912109375, 6.8883056640625, 7.13751220703125, 7.38671875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 6.0, 7.0, 18.0, 24.0, 29.0, 47.0, 68.0, 111.0, 192.0, 307.0, 472.0, 837.0, 1437.0, 2535.0, 4242.0, 8010.0, 15069.0, 30941.0, 68509.0, 165720.0, 436001.0, 1023164.0, 1278235.0, 693838.0, 267722.0, 104799.0, 45880.0, 21604.0, 10842.0, 5864.0, 3281.0, 1829.0, 1036.0, 607.0, 373.0, 234.0, 156.0, 84.0, 61.0, 41.0, 19.0, 14.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.28125, -23.5283203125, -22.775390625, -22.0224609375, -21.26953125, -20.5166015625, -19.763671875, -19.0107421875, -18.2578125, -17.5048828125, -16.751953125, -15.9990234375, -15.24609375, -14.4931640625, -13.740234375, -12.9873046875, -12.234375, -11.4814453125, -10.728515625, -9.9755859375, -9.22265625, -8.4697265625, -7.716796875, -6.9638671875, -6.2109375, -5.4580078125, -4.705078125, -3.9521484375, -3.19921875, -2.4462890625, -1.693359375, -0.9404296875, -0.1875, 0.5654296875, 1.318359375, 2.0712890625, 2.82421875, 3.5771484375, 4.330078125, 5.0830078125, 5.8359375, 6.5888671875, 7.341796875, 8.0947265625, 8.84765625, 9.6005859375, 10.353515625, 11.1064453125, 11.859375, 12.6123046875, 13.365234375, 14.1181640625, 14.87109375, 15.6240234375, 16.376953125, 17.1298828125, 17.8828125, 18.6357421875, 19.388671875, 20.1416015625, 20.89453125, 21.6474609375, 22.400390625, 23.1533203125, 23.90625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 4.0, 7.0, 12.0, 12.0, 15.0, 22.0, 29.0, 43.0, 40.0, 62.0, 78.0, 89.0, 102.0, 129.0, 156.0, 190.0, 236.0, 252.0, 281.0, 313.0, 297.0, 260.0, 244.0, 221.0, 184.0, 184.0, 122.0, 95.0, 80.0, 70.0, 57.0, 42.0, 38.0, 26.0, 21.0, 17.0, 18.0, 7.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.859375, -5.686767578125, -5.51416015625, -5.341552734375, -5.1689453125, -4.996337890625, -4.82373046875, -4.651123046875, -4.478515625, -4.305908203125, -4.13330078125, -3.960693359375, -3.7880859375, -3.615478515625, -3.44287109375, -3.270263671875, -3.09765625, -2.925048828125, -2.75244140625, -2.579833984375, -2.4072265625, -2.234619140625, -2.06201171875, -1.889404296875, -1.716796875, -1.544189453125, -1.37158203125, -1.198974609375, -1.0263671875, -0.853759765625, -0.68115234375, -0.508544921875, -0.3359375, -0.163330078125, 0.00927734375, 0.181884765625, 0.3544921875, 0.527099609375, 0.69970703125, 0.872314453125, 1.044921875, 1.217529296875, 1.39013671875, 1.562744140625, 1.7353515625, 1.907958984375, 2.08056640625, 2.253173828125, 2.42578125, 2.598388671875, 2.77099609375, 2.943603515625, 3.1162109375, 3.288818359375, 3.46142578125, 3.634033203125, 3.806640625, 3.979248046875, 4.15185546875, 4.324462890625, 4.4970703125, 4.669677734375, 4.84228515625, 5.014892578125, 5.1875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 3.0, 6.0, 10.0, 9.0, 17.0, 12.0, 17.0, 23.0, 40.0, 29.0, 43.0, 49.0, 47.0, 63.0, 73.0, 58.0, 68.0, 73.0, 62.0, 46.0, 56.0, 21.0, 33.0, 26.0, 16.0, 20.0, 18.0, 10.0, 9.0, 10.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-21.823322296142578, -21.2429256439209, -20.66252899169922, -20.08213233947754, -19.50173568725586, -18.92133903503418, -18.3409423828125, -17.76054573059082, -17.18014907836914, -16.59975242614746, -16.01935577392578, -15.438959121704102, -14.858562469482422, -14.278165817260742, -13.697769165039062, -13.117372512817383, -12.53697681427002, -11.95658016204834, -11.37618350982666, -10.79578685760498, -10.2153902053833, -9.634993553161621, -9.054597854614258, -8.474201202392578, -7.89380407333374, -7.3134074211120605, -6.733010768890381, -6.152614593505859, -5.57221794128418, -4.9918212890625, -4.41142463684082, -3.8310279846191406, -3.250631332397461, -2.6702346801757812, -2.0898380279541016, -1.509441614151001, -0.9290449619293213, -0.3486483097076416, 0.23174810409545898, 0.8121447563171387, 1.3925414085388184, 1.972938060760498, 2.5533347129821777, 3.1337311267852783, 3.714127779006958, 4.294524192810059, 4.874920845031738, 5.455317497253418, 6.035714149475098, 6.616110801696777, 7.196507453918457, 7.776904106140137, 8.357300758361816, 8.937697410583496, 9.51809310913086, 10.098489761352539, 10.678886413574219, 11.259283065795898, 11.839679718017578, 12.420076370239258, 13.000473022460938, 13.580869674682617, 14.161266326904297, 14.741662979125977, 15.322059631347656]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 5.0, 5.0, 8.0, 6.0, 10.0, 11.0, 10.0, 17.0, 18.0, 22.0, 21.0, 26.0, 18.0, 28.0, 26.0, 28.0, 23.0, 24.0, 25.0, 35.0, 43.0, 44.0, 37.0, 38.0, 36.0, 42.0, 32.0, 45.0, 33.0, 26.0, 29.0, 32.0, 40.0, 20.0, 20.0, 17.0, 11.0, 16.0, 16.0, 12.0, 9.0, 9.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.544527053833008, -9.252277374267578, -8.960027694702148, -8.667778015136719, -8.375528335571289, -8.083277702331543, -7.791028022766113, -7.498778343200684, -7.206528663635254, -6.914278984069824, -6.6220293045043945, -6.329779148101807, -6.037529468536377, -5.745279788970947, -5.453029632568359, -5.16077995300293, -4.8685302734375, -4.57628059387207, -4.284030914306641, -3.9917807579040527, -3.699531078338623, -3.4072813987731934, -3.1150314807891846, -2.822781562805176, -2.530531883239746, -2.2382822036743164, -1.9460322856903076, -1.6537824869155884, -1.3615326881408691, -1.06928288936615, -0.7770330905914307, -0.4847831726074219, -0.19253253936767578, 0.09971725940704346, 0.3919670581817627, 0.6842168569564819, 0.9764666557312012, 1.2687164545059204, 1.5609662532806396, 1.8532161712646484, 2.145465850830078, 2.437715530395508, 2.7299654483795166, 3.0222153663635254, 3.314465045928955, 3.6067147254943848, 3.8989646434783936, 4.191214561462402, 4.483464241027832, 4.775713920593262, 5.067963600158691, 5.360213756561279, 5.652463436126709, 5.944713115692139, 6.236963272094727, 6.529212951660156, 6.821462631225586, 7.113712310791016, 7.405961990356445, 7.698212146759033, 7.990461826324463, 8.28271198272705, 8.57496166229248, 8.86721134185791, 9.15946102142334]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 10.0, 10.0, 12.0, 29.0, 40.0, 60.0, 88.0, 138.0, 178.0, 243.0, 401.0, 597.0, 912.0, 1385.0, 2170.0, 3391.0, 5123.0, 8321.0, 13289.0, 21004.0, 33787.0, 53293.0, 80650.0, 114548.0, 144007.0, 151825.0, 131105.0, 98671.0, 66650.0, 43067.0, 27612.0, 16978.0, 10487.0, 6511.0, 4127.0, 2791.0, 1656.0, 1123.0, 749.0, 500.0, 327.0, 236.0, 128.0, 121.0, 56.0, 51.0, 34.0, 13.0, 16.0, 16.0, 6.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.5625, -4.41656494140625, -4.2706298828125, -4.12469482421875, -3.978759765625, -3.83282470703125, -3.6868896484375, -3.54095458984375, -3.39501953125, -3.24908447265625, -3.1031494140625, -2.95721435546875, -2.811279296875, -2.66534423828125, -2.5194091796875, -2.37347412109375, -2.2275390625, -2.08160400390625, -1.9356689453125, -1.78973388671875, -1.643798828125, -1.49786376953125, -1.3519287109375, -1.20599365234375, -1.06005859375, -0.91412353515625, -0.7681884765625, -0.62225341796875, -0.476318359375, -0.33038330078125, -0.1844482421875, -0.03851318359375, 0.107421875, 0.25335693359375, 0.3992919921875, 0.54522705078125, 0.691162109375, 0.83709716796875, 0.9830322265625, 1.12896728515625, 1.27490234375, 1.42083740234375, 1.5667724609375, 1.71270751953125, 1.858642578125, 2.00457763671875, 2.1505126953125, 2.29644775390625, 2.4423828125, 2.58831787109375, 2.7342529296875, 2.88018798828125, 3.026123046875, 3.17205810546875, 3.3179931640625, 3.46392822265625, 3.60986328125, 3.75579833984375, 3.9017333984375, 4.04766845703125, 4.193603515625, 4.33953857421875, 4.4854736328125, 4.63140869140625, 4.77734375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 5.0, 5.0, 12.0, 11.0, 15.0, 13.0, 22.0, 18.0, 31.0, 27.0, 25.0, 29.0, 28.0, 33.0, 28.0, 39.0, 43.0, 42.0, 41.0, 45.0, 50.0, 33.0, 47.0, 33.0, 24.0, 40.0, 35.0, 25.0, 27.0, 26.0, 27.0, 19.0, 14.0, 16.0, 12.0, 10.0, 4.0, 10.0, 6.0, 8.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.703125, -10.359375, -10.015625, -9.671875, -9.328125, -8.984375, -8.640625, -8.296875, -7.953125, -7.609375, -7.265625, -6.921875, -6.578125, -6.234375, -5.890625, -5.546875, -5.203125, -4.859375, -4.515625, -4.171875, -3.828125, -3.484375, -3.140625, -2.796875, -2.453125, -2.109375, -1.765625, -1.421875, -1.078125, -0.734375, -0.390625, -0.046875, 0.296875, 0.640625, 0.984375, 1.328125, 1.671875, 2.015625, 2.359375, 2.703125, 3.046875, 3.390625, 3.734375, 4.078125, 4.421875, 4.765625, 5.109375, 5.453125, 5.796875, 6.140625, 6.484375, 6.828125, 7.171875, 7.515625, 7.859375, 8.203125, 8.546875, 8.890625, 9.234375, 9.578125, 9.921875, 10.265625, 10.609375, 10.953125, 11.296875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 4.0, 6.0, 12.0, 18.0, 21.0, 33.0, 45.0, 69.0, 76.0, 140.0, 200.0, 264.0, 433.0, 604.0, 981.0, 1423.0, 2194.0, 3418.0, 5632.0, 9102.0, 15163.0, 25778.0, 44972.0, 79186.0, 133407.0, 193336.0, 196838.0, 138453.0, 81851.0, 46632.0, 26742.0, 15693.0, 9502.0, 5873.0, 3600.0, 2311.0, 1445.0, 1037.0, 639.0, 467.0, 295.0, 200.0, 148.0, 86.0, 76.0, 41.0, 37.0, 27.0, 14.0, 14.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-6.49609375, -6.2994384765625, -6.102783203125, -5.9061279296875, -5.70947265625, -5.5128173828125, -5.316162109375, -5.1195068359375, -4.9228515625, -4.7261962890625, -4.529541015625, -4.3328857421875, -4.13623046875, -3.9395751953125, -3.742919921875, -3.5462646484375, -3.349609375, -3.1529541015625, -2.956298828125, -2.7596435546875, -2.56298828125, -2.3663330078125, -2.169677734375, -1.9730224609375, -1.7763671875, -1.5797119140625, -1.383056640625, -1.1864013671875, -0.98974609375, -0.7930908203125, -0.596435546875, -0.3997802734375, -0.203125, -0.0064697265625, 0.190185546875, 0.3868408203125, 0.58349609375, 0.7801513671875, 0.976806640625, 1.1734619140625, 1.3701171875, 1.5667724609375, 1.763427734375, 1.9600830078125, 2.15673828125, 2.3533935546875, 2.550048828125, 2.7467041015625, 2.943359375, 3.1400146484375, 3.336669921875, 3.5333251953125, 3.72998046875, 3.9266357421875, 4.123291015625, 4.3199462890625, 4.5166015625, 4.7132568359375, 4.909912109375, 5.1065673828125, 5.30322265625, 5.4998779296875, 5.696533203125, 5.8931884765625, 6.08984375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 9.0, 14.0, 11.0, 18.0, 20.0, 20.0, 23.0, 21.0, 21.0, 28.0, 36.0, 31.0, 29.0, 40.0, 45.0, 32.0, 31.0, 35.0, 39.0, 32.0, 35.0, 27.0, 35.0, 41.0, 37.0, 25.0, 36.0, 23.0, 24.0, 28.0, 25.0, 26.0, 12.0, 12.0, 10.0, 12.0, 8.0, 11.0, 5.0, 3.0, 4.0, 5.0, 5.0, 0.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8984375, -5.71002197265625, -5.5216064453125, -5.33319091796875, -5.144775390625, -4.95635986328125, -4.7679443359375, -4.57952880859375, -4.39111328125, -4.20269775390625, -4.0142822265625, -3.82586669921875, -3.637451171875, -3.44903564453125, -3.2606201171875, -3.07220458984375, -2.8837890625, -2.69537353515625, -2.5069580078125, -2.31854248046875, -2.130126953125, -1.94171142578125, -1.7532958984375, -1.56488037109375, -1.37646484375, -1.18804931640625, -0.9996337890625, -0.81121826171875, -0.622802734375, -0.43438720703125, -0.2459716796875, -0.05755615234375, 0.130859375, 0.31927490234375, 0.5076904296875, 0.69610595703125, 0.884521484375, 1.07293701171875, 1.2613525390625, 1.44976806640625, 1.63818359375, 1.82659912109375, 2.0150146484375, 2.20343017578125, 2.391845703125, 2.58026123046875, 2.7686767578125, 2.95709228515625, 3.1455078125, 3.33392333984375, 3.5223388671875, 3.71075439453125, 3.899169921875, 4.08758544921875, 4.2760009765625, 4.46441650390625, 4.65283203125, 4.84124755859375, 5.0296630859375, 5.21807861328125, 5.406494140625, 5.59490966796875, 5.7833251953125, 5.97174072265625, 6.16015625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 7.0, 6.0, 7.0, 4.0, 19.0, 19.0, 31.0, 44.0, 42.0, 101.0, 121.0, 164.0, 248.0, 334.0, 516.0, 734.0, 1112.0, 1656.0, 2536.0, 3851.0, 5913.0, 9762.0, 15977.0, 27028.0, 47516.0, 83835.0, 146839.0, 214292.0, 195513.0, 122614.0, 69070.0, 39075.0, 22508.0, 13808.0, 8186.0, 5152.0, 3308.0, 2123.0, 1461.0, 987.0, 635.0, 439.0, 268.0, 208.0, 150.0, 108.0, 71.0, 45.0, 39.0, 24.0, 17.0, 20.0, 7.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.072265625, -2.972625732421875, -2.87298583984375, -2.773345947265625, -2.6737060546875, -2.574066162109375, -2.47442626953125, -2.374786376953125, -2.275146484375, -2.175506591796875, -2.07586669921875, -1.976226806640625, -1.8765869140625, -1.776947021484375, -1.67730712890625, -1.577667236328125, -1.47802734375, -1.378387451171875, -1.27874755859375, -1.179107666015625, -1.0794677734375, -0.979827880859375, -0.88018798828125, -0.780548095703125, -0.680908203125, -0.581268310546875, -0.48162841796875, -0.381988525390625, -0.2823486328125, -0.182708740234375, -0.08306884765625, 0.016571044921875, 0.1162109375, 0.215850830078125, 0.31549072265625, 0.415130615234375, 0.5147705078125, 0.614410400390625, 0.71405029296875, 0.813690185546875, 0.913330078125, 1.012969970703125, 1.11260986328125, 1.212249755859375, 1.3118896484375, 1.411529541015625, 1.51116943359375, 1.610809326171875, 1.71044921875, 1.810089111328125, 1.90972900390625, 2.009368896484375, 2.1090087890625, 2.208648681640625, 2.30828857421875, 2.407928466796875, 2.507568359375, 2.607208251953125, 2.70684814453125, 2.806488037109375, 2.9061279296875, 3.005767822265625, 3.10540771484375, 3.205047607421875, 3.3046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 8.0, 5.0, 4.0, 5.0, 13.0, 11.0, 15.0, 18.0, 30.0, 49.0, 53.0, 57.0, 77.0, 63.0, 92.0, 76.0, 77.0, 59.0, 46.0, 62.0, 27.0, 30.0, 27.0, 17.0, 14.0, 15.0, 12.0, 11.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023162364959716797, -0.00022459588944911957, -0.00021756812930107117, -0.00021054036915302277, -0.00020351260900497437, -0.00019648484885692596, -0.00018945708870887756, -0.00018242932856082916, -0.00017540156841278076, -0.00016837380826473236, -0.00016134604811668396, -0.00015431828796863556, -0.00014729052782058716, -0.00014026276767253876, -0.00013323500752449036, -0.00012620724737644196, -0.00011917948722839355, -0.00011215172708034515, -0.00010512396693229675, -9.809620678424835e-05, -9.106844663619995e-05, -8.404068648815155e-05, -7.701292634010315e-05, -6.998516619205475e-05, -6.295740604400635e-05, -5.592964589595795e-05, -4.8901885747909546e-05, -4.1874125599861145e-05, -3.4846365451812744e-05, -2.7818605303764343e-05, -2.0790845155715942e-05, -1.3763085007667542e-05, -6.735324859619141e-06, 2.9243528842926025e-07, 7.320195436477661e-06, 1.4347955584526062e-05, 2.1375715732574463e-05, 2.8403475880622864e-05, 3.5431236028671265e-05, 4.2458996176719666e-05, 4.9486756324768066e-05, 5.651451647281647e-05, 6.354227662086487e-05, 7.057003676891327e-05, 7.759779691696167e-05, 8.462555706501007e-05, 9.165331721305847e-05, 9.868107736110687e-05, 0.00010570883750915527, 0.00011273659765720367, 0.00011976435780525208, 0.00012679211795330048, 0.00013381987810134888, 0.00014084763824939728, 0.00014787539839744568, 0.00015490315854549408, 0.00016193091869354248, 0.00016895867884159088, 0.00017598643898963928, 0.00018301419913768768, 0.00019004195928573608, 0.00019706971943378448, 0.00020409747958183289, 0.0002111252397298813, 0.0002181529998779297]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 10.0, 7.0, 14.0, 20.0, 33.0, 59.0, 86.0, 129.0, 216.0, 327.0, 556.0, 937.0, 1577.0, 2860.0, 5049.0, 8943.0, 16995.0, 32888.0, 65403.0, 129592.0, 219790.0, 239460.0, 156938.0, 80926.0, 40414.0, 20580.0, 10817.0, 5812.0, 3226.0, 1980.0, 1098.0, 687.0, 425.0, 244.0, 161.0, 104.0, 68.0, 37.0, 28.0, 22.0, 14.0, 8.0, 9.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41796875, -4.26641845703125, -4.1148681640625, -3.96331787109375, -3.811767578125, -3.66021728515625, -3.5086669921875, -3.35711669921875, -3.20556640625, -3.05401611328125, -2.9024658203125, -2.75091552734375, -2.599365234375, -2.44781494140625, -2.2962646484375, -2.14471435546875, -1.9931640625, -1.84161376953125, -1.6900634765625, -1.53851318359375, -1.386962890625, -1.23541259765625, -1.0838623046875, -0.93231201171875, -0.78076171875, -0.62921142578125, -0.4776611328125, -0.32611083984375, -0.174560546875, -0.02301025390625, 0.1285400390625, 0.28009033203125, 0.431640625, 0.58319091796875, 0.7347412109375, 0.88629150390625, 1.037841796875, 1.18939208984375, 1.3409423828125, 1.49249267578125, 1.64404296875, 1.79559326171875, 1.9471435546875, 2.09869384765625, 2.250244140625, 2.40179443359375, 2.5533447265625, 2.70489501953125, 2.8564453125, 3.00799560546875, 3.1595458984375, 3.31109619140625, 3.462646484375, 3.61419677734375, 3.7657470703125, 3.91729736328125, 4.06884765625, 4.22039794921875, 4.3719482421875, 4.52349853515625, 4.675048828125, 4.82659912109375, 4.9781494140625, 5.12969970703125, 5.28125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 7.0, 5.0, 7.0, 8.0, 8.0, 11.0, 22.0, 18.0, 15.0, 21.0, 34.0, 32.0, 44.0, 36.0, 42.0, 42.0, 31.0, 39.0, 45.0, 43.0, 50.0, 48.0, 34.0, 42.0, 31.0, 37.0, 31.0, 21.0, 34.0, 18.0, 24.0, 23.0, 9.0, 11.0, 7.0, 8.0, 8.0, 12.0, 7.0, 5.0, 2.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.7216796875, -0.6961517333984375, -0.670623779296875, -0.6450958251953125, -0.61956787109375, -0.5940399169921875, -0.568511962890625, -0.5429840087890625, -0.5174560546875, -0.4919281005859375, -0.466400146484375, -0.4408721923828125, -0.41534423828125, -0.3898162841796875, -0.364288330078125, -0.3387603759765625, -0.313232421875, -0.2877044677734375, -0.262176513671875, -0.2366485595703125, -0.21112060546875, -0.1855926513671875, -0.160064697265625, -0.1345367431640625, -0.1090087890625, -0.0834808349609375, -0.057952880859375, -0.0324249267578125, -0.00689697265625, 0.0186309814453125, 0.044158935546875, 0.0696868896484375, 0.09521484375, 0.1207427978515625, 0.146270751953125, 0.1717987060546875, 0.19732666015625, 0.2228546142578125, 0.248382568359375, 0.2739105224609375, 0.2994384765625, 0.3249664306640625, 0.350494384765625, 0.3760223388671875, 0.40155029296875, 0.4270782470703125, 0.452606201171875, 0.4781341552734375, 0.503662109375, 0.5291900634765625, 0.554718017578125, 0.5802459716796875, 0.60577392578125, 0.6313018798828125, 0.656829833984375, 0.6823577880859375, 0.7078857421875, 0.7334136962890625, 0.758941650390625, 0.7844696044921875, 0.80999755859375, 0.8355255126953125, 0.861053466796875, 0.8865814208984375, 0.912109375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 3.0, 12.0, 12.0, 12.0, 8.0, 10.0, 16.0, 40.0, 32.0, 42.0, 36.0, 61.0, 51.0, 65.0, 62.0, 61.0, 79.0, 75.0, 43.0, 49.0, 43.0, 28.0, 26.0, 24.0, 19.0, 20.0, 20.0, 9.0, 6.0, 7.0, 8.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-21.74443244934082, -21.160507202148438, -20.576580047607422, -19.99265480041504, -19.408729553222656, -18.82480239868164, -18.240877151489258, -17.656951904296875, -17.07302474975586, -16.489099502563477, -15.905172348022461, -15.321247100830078, -14.737320899963379, -14.15339469909668, -13.569469451904297, -12.985543251037598, -12.401617050170898, -11.8176908493042, -11.2337646484375, -10.649839401245117, -10.065913200378418, -9.481986999511719, -8.898061752319336, -8.314135551452637, -7.7302093505859375, -7.146283149719238, -6.562357425689697, -5.978431701660156, -5.394505500793457, -4.810579299926758, -4.226653575897217, -3.642727851867676, -3.0587997436523438, -2.4748737812042236, -1.8909478187561035, -1.3070218563079834, -0.7230958938598633, -0.13916993141174316, 0.44475603103637695, 1.028681755065918, 1.6126079559326172, 2.1965339183807373, 2.7804598808288574, 3.3643858432769775, 3.9483118057250977, 4.532238006591797, 5.116163730621338, 5.700089454650879, 6.284015655517578, 6.867941856384277, 7.451867580413818, 8.03579330444336, 8.619719505310059, 9.203645706176758, 9.78757095336914, 10.37149715423584, 10.955423355102539, 11.539349555969238, 12.123275756835938, 12.70720100402832, 13.29112720489502, 13.875053405761719, 14.458978652954102, 15.0429048538208, 15.6268310546875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 6.0, 6.0, 4.0, 5.0, 4.0, 10.0, 11.0, 11.0, 11.0, 15.0, 13.0, 26.0, 20.0, 24.0, 20.0, 20.0, 27.0, 34.0, 27.0, 19.0, 31.0, 39.0, 36.0, 33.0, 44.0, 34.0, 38.0, 45.0, 36.0, 40.0, 33.0, 31.0, 26.0, 29.0, 32.0, 24.0, 25.0, 14.0, 17.0, 14.0, 14.0, 17.0, 9.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.4180908203125, -9.128936767578125, -8.839781761169434, -8.550627708435059, -8.261472702026367, -7.972318649291992, -7.683164119720459, -7.394009590148926, -7.104855060577393, -6.815700531005859, -6.526546001434326, -6.237391471862793, -5.948237419128418, -5.659082412719727, -5.369928359985352, -5.080773830413818, -4.791619300842285, -4.502464771270752, -4.213310241699219, -3.9241559505462646, -3.6350014209747314, -3.3458468914031982, -3.056692600250244, -2.767538070678711, -2.4783835411071777, -2.1892290115356445, -1.9000746011734009, -1.6109201908111572, -1.321765661239624, -1.0326111316680908, -0.7434567213058472, -0.4543023109436035, -0.16514873504638672, 0.12400573492050171, 0.41316020488739014, 0.7023146748542786, 0.991469144821167, 1.2806236743927002, 1.5697780847549438, 1.8589324951171875, 2.1480870246887207, 2.437241554260254, 2.726396083831787, 3.015550374984741, 3.3047049045562744, 3.5938594341278076, 3.8830137252807617, 4.172168254852295, 4.461322784423828, 4.750477313995361, 5.0396318435668945, 5.328786373138428, 5.617940902709961, 5.907094955444336, 6.196249485015869, 6.485404014587402, 6.7745585441589355, 7.063713073730469, 7.352867603302002, 7.642022132873535, 7.93117618560791, 8.220331192016602, 8.509485244750977, 8.798639297485352, 9.087794303894043]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 7.0, 7.0, 7.0, 10.0, 20.0, 15.0, 24.0, 39.0, 59.0, 107.0, 132.0, 222.0, 316.0, 492.0, 731.0, 1111.0, 1627.0, 2589.0, 3845.0, 6070.0, 9146.0, 14523.0, 22195.0, 34412.0, 52319.0, 75577.0, 102914.0, 126312.0, 135792.0, 126188.0, 103888.0, 76421.0, 52480.0, 34736.0, 22575.0, 14698.0, 9358.0, 6018.0, 3968.0, 2592.0, 1653.0, 1091.0, 781.0, 511.0, 332.0, 197.0, 167.0, 100.0, 55.0, 42.0, 26.0, 25.0, 18.0, 10.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0], "bins": [-7.3046875, -7.08001708984375, -6.8553466796875, -6.63067626953125, -6.406005859375, -6.18133544921875, -5.9566650390625, -5.73199462890625, -5.50732421875, -5.28265380859375, -5.0579833984375, -4.83331298828125, -4.608642578125, -4.38397216796875, -4.1593017578125, -3.93463134765625, -3.7099609375, -3.48529052734375, -3.2606201171875, -3.03594970703125, -2.811279296875, -2.58660888671875, -2.3619384765625, -2.13726806640625, -1.91259765625, -1.68792724609375, -1.4632568359375, -1.23858642578125, -1.013916015625, -0.78924560546875, -0.5645751953125, -0.33990478515625, -0.115234375, 0.10943603515625, 0.3341064453125, 0.55877685546875, 0.783447265625, 1.00811767578125, 1.2327880859375, 1.45745849609375, 1.68212890625, 1.90679931640625, 2.1314697265625, 2.35614013671875, 2.580810546875, 2.80548095703125, 3.0301513671875, 3.25482177734375, 3.4794921875, 3.70416259765625, 3.9288330078125, 4.15350341796875, 4.378173828125, 4.60284423828125, 4.8275146484375, 5.05218505859375, 5.27685546875, 5.50152587890625, 5.7261962890625, 5.95086669921875, 6.175537109375, 6.40020751953125, 6.6248779296875, 6.84954833984375, 7.07421875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 10.0, 11.0, 12.0, 13.0, 16.0, 20.0, 22.0, 25.0, 23.0, 24.0, 29.0, 24.0, 28.0, 34.0, 38.0, 38.0, 39.0, 39.0, 32.0, 36.0, 34.0, 51.0, 27.0, 46.0, 30.0, 31.0, 33.0, 28.0, 28.0, 25.0, 20.0, 13.0, 17.0, 13.0, 10.0, 11.0, 13.0, 8.0, 8.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.640625, -10.3143310546875, -9.988037109375, -9.6617431640625, -9.33544921875, -9.0091552734375, -8.682861328125, -8.3565673828125, -8.0302734375, -7.7039794921875, -7.377685546875, -7.0513916015625, -6.72509765625, -6.3988037109375, -6.072509765625, -5.7462158203125, -5.419921875, -5.0936279296875, -4.767333984375, -4.4410400390625, -4.11474609375, -3.7884521484375, -3.462158203125, -3.1358642578125, -2.8095703125, -2.4832763671875, -2.156982421875, -1.8306884765625, -1.50439453125, -1.1781005859375, -0.851806640625, -0.5255126953125, -0.19921875, 0.1270751953125, 0.453369140625, 0.7796630859375, 1.10595703125, 1.4322509765625, 1.758544921875, 2.0848388671875, 2.4111328125, 2.7374267578125, 3.063720703125, 3.3900146484375, 3.71630859375, 4.0426025390625, 4.368896484375, 4.6951904296875, 5.021484375, 5.3477783203125, 5.674072265625, 6.0003662109375, 6.32666015625, 6.6529541015625, 6.979248046875, 7.3055419921875, 7.6318359375, 7.9581298828125, 8.284423828125, 8.6107177734375, 8.93701171875, 9.2633056640625, 9.589599609375, 9.9158935546875, 10.2421875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 9.0, 14.0, 19.0, 35.0, 52.0, 81.0, 136.0, 208.0, 343.0, 563.0, 909.0, 1552.0, 2496.0, 4200.0, 6919.0, 11430.0, 18986.0, 30039.0, 47891.0, 71701.0, 101440.0, 130042.0, 144221.0, 136666.0, 111622.0, 81290.0, 54347.0, 35030.0, 21905.0, 13464.0, 8315.0, 4871.0, 3020.0, 1883.0, 1073.0, 668.0, 441.0, 269.0, 139.0, 101.0, 57.0, 41.0, 25.0, 17.0, 10.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8828125, -7.625732421875, -7.36865234375, -7.111572265625, -6.8544921875, -6.597412109375, -6.34033203125, -6.083251953125, -5.826171875, -5.569091796875, -5.31201171875, -5.054931640625, -4.7978515625, -4.540771484375, -4.28369140625, -4.026611328125, -3.76953125, -3.512451171875, -3.25537109375, -2.998291015625, -2.7412109375, -2.484130859375, -2.22705078125, -1.969970703125, -1.712890625, -1.455810546875, -1.19873046875, -0.941650390625, -0.6845703125, -0.427490234375, -0.17041015625, 0.086669921875, 0.34375, 0.600830078125, 0.85791015625, 1.114990234375, 1.3720703125, 1.629150390625, 1.88623046875, 2.143310546875, 2.400390625, 2.657470703125, 2.91455078125, 3.171630859375, 3.4287109375, 3.685791015625, 3.94287109375, 4.199951171875, 4.45703125, 4.714111328125, 4.97119140625, 5.228271484375, 5.4853515625, 5.742431640625, 5.99951171875, 6.256591796875, 6.513671875, 6.770751953125, 7.02783203125, 7.284912109375, 7.5419921875, 7.799072265625, 8.05615234375, 8.313232421875, 8.5703125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 8.0, 11.0, 12.0, 10.0, 18.0, 13.0, 18.0, 22.0, 18.0, 32.0, 19.0, 28.0, 31.0, 42.0, 37.0, 42.0, 48.0, 31.0, 41.0, 44.0, 41.0, 34.0, 49.0, 32.0, 35.0, 31.0, 23.0, 27.0, 26.0, 25.0, 21.0, 15.0, 18.0, 18.0, 15.0, 16.0, 13.0, 4.0, 7.0, 9.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.55078125, -6.3321533203125, -6.113525390625, -5.8948974609375, -5.67626953125, -5.4576416015625, -5.239013671875, -5.0203857421875, -4.8017578125, -4.5831298828125, -4.364501953125, -4.1458740234375, -3.92724609375, -3.7086181640625, -3.489990234375, -3.2713623046875, -3.052734375, -2.8341064453125, -2.615478515625, -2.3968505859375, -2.17822265625, -1.9595947265625, -1.740966796875, -1.5223388671875, -1.3037109375, -1.0850830078125, -0.866455078125, -0.6478271484375, -0.42919921875, -0.2105712890625, 0.008056640625, 0.2266845703125, 0.4453125, 0.6639404296875, 0.882568359375, 1.1011962890625, 1.31982421875, 1.5384521484375, 1.757080078125, 1.9757080078125, 2.1943359375, 2.4129638671875, 2.631591796875, 2.8502197265625, 3.06884765625, 3.2874755859375, 3.506103515625, 3.7247314453125, 3.943359375, 4.1619873046875, 4.380615234375, 4.5992431640625, 4.81787109375, 5.0364990234375, 5.255126953125, 5.4737548828125, 5.6923828125, 5.9110107421875, 6.129638671875, 6.3482666015625, 6.56689453125, 6.7855224609375, 7.004150390625, 7.2227783203125, 7.44140625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 10.0, 23.0, 15.0, 19.0, 48.0, 55.0, 65.0, 105.0, 176.0, 253.0, 363.0, 550.0, 801.0, 1236.0, 1814.0, 2775.0, 4121.0, 6431.0, 9965.0, 15581.0, 24470.0, 37525.0, 56805.0, 81659.0, 110301.0, 132815.0, 138728.0, 123439.0, 97380.0, 68928.0, 46568.0, 30613.0, 19531.0, 12202.0, 8022.0, 5117.0, 3372.0, 2234.0, 1476.0, 934.0, 648.0, 469.0, 311.0, 203.0, 117.0, 95.0, 59.0, 43.0, 36.0, 17.0, 13.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0], "bins": [-4.015625, -3.894866943359375, -3.77410888671875, -3.653350830078125, -3.5325927734375, -3.411834716796875, -3.29107666015625, -3.170318603515625, -3.049560546875, -2.928802490234375, -2.80804443359375, -2.687286376953125, -2.5665283203125, -2.445770263671875, -2.32501220703125, -2.204254150390625, -2.08349609375, -1.962738037109375, -1.84197998046875, -1.721221923828125, -1.6004638671875, -1.479705810546875, -1.35894775390625, -1.238189697265625, -1.117431640625, -0.996673583984375, -0.87591552734375, -0.755157470703125, -0.6343994140625, -0.513641357421875, -0.39288330078125, -0.272125244140625, -0.1513671875, -0.030609130859375, 0.09014892578125, 0.210906982421875, 0.3316650390625, 0.452423095703125, 0.57318115234375, 0.693939208984375, 0.814697265625, 0.935455322265625, 1.05621337890625, 1.176971435546875, 1.2977294921875, 1.418487548828125, 1.53924560546875, 1.660003662109375, 1.78076171875, 1.901519775390625, 2.02227783203125, 2.143035888671875, 2.2637939453125, 2.384552001953125, 2.50531005859375, 2.626068115234375, 2.746826171875, 2.867584228515625, 2.98834228515625, 3.109100341796875, 3.2298583984375, 3.350616455078125, 3.47137451171875, 3.592132568359375, 3.712890625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 9.0, 8.0, 10.0, 16.0, 14.0, 20.0, 29.0, 24.0, 25.0, 40.0, 64.0, 64.0, 62.0, 64.0, 55.0, 55.0, 61.0, 56.0, 40.0, 40.0, 40.0, 29.0, 26.0, 28.0, 28.0, 14.0, 17.0, 10.0, 11.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00044417381286621094, -0.0004293955862522125, -0.0004146173596382141, -0.0003998391330242157, -0.0003850609064102173, -0.00037028267979621887, -0.00035550445318222046, -0.00034072622656822205, -0.00032594799995422363, -0.0003111697733402252, -0.0002963915467262268, -0.0002816133201122284, -0.00026683509349823, -0.00025205686688423157, -0.00023727864027023315, -0.00022250041365623474, -0.00020772218704223633, -0.00019294396042823792, -0.0001781657338142395, -0.0001633875072002411, -0.00014860928058624268, -0.00013383105397224426, -0.00011905282735824585, -0.00010427460074424744, -8.949637413024902e-05, -7.471814751625061e-05, -5.99399209022522e-05, -4.5161694288253784e-05, -3.038346767425537e-05, -1.5605241060256958e-05, -8.270144462585449e-07, 1.3951212167739868e-05, 2.872943878173828e-05, 4.3507665395736694e-05, 5.828589200973511e-05, 7.306411862373352e-05, 8.784234523773193e-05, 0.00010262057185173035, 0.00011739879846572876, 0.00013217702507972717, 0.00014695525169372559, 0.000161733478307724, 0.0001765117049217224, 0.00019128993153572083, 0.00020606815814971924, 0.00022084638476371765, 0.00023562461137771606, 0.0002504028379917145, 0.0002651810646057129, 0.0002799592912197113, 0.0002947375178337097, 0.00030951574444770813, 0.00032429397106170654, 0.00033907219767570496, 0.00035385042428970337, 0.0003686286509037018, 0.0003834068775177002, 0.0003981851041316986, 0.000412963330745697, 0.00042774155735969543, 0.00044251978397369385, 0.00045729801058769226, 0.0004720762372016907, 0.0004868544638156891, 0.0005016326904296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 14.0, 22.0, 25.0, 42.0, 81.0, 121.0, 194.0, 285.0, 415.0, 673.0, 1024.0, 1704.0, 2648.0, 4267.0, 7200.0, 11879.0, 19626.0, 33703.0, 57155.0, 93053.0, 137695.0, 171923.0, 166631.0, 128869.0, 83975.0, 50570.0, 29787.0, 17515.0, 10362.0, 6361.0, 3957.0, 2448.0, 1578.0, 983.0, 647.0, 380.0, 263.0, 156.0, 115.0, 70.0, 49.0, 27.0, 24.0, 10.0, 5.0, 9.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.109375, -4.94915771484375, -4.7889404296875, -4.62872314453125, -4.468505859375, -4.30828857421875, -4.1480712890625, -3.98785400390625, -3.82763671875, -3.66741943359375, -3.5072021484375, -3.34698486328125, -3.186767578125, -3.02655029296875, -2.8663330078125, -2.70611572265625, -2.5458984375, -2.38568115234375, -2.2254638671875, -2.06524658203125, -1.905029296875, -1.74481201171875, -1.5845947265625, -1.42437744140625, -1.26416015625, -1.10394287109375, -0.9437255859375, -0.78350830078125, -0.623291015625, -0.46307373046875, -0.3028564453125, -0.14263916015625, 0.017578125, 0.17779541015625, 0.3380126953125, 0.49822998046875, 0.658447265625, 0.81866455078125, 0.9788818359375, 1.13909912109375, 1.29931640625, 1.45953369140625, 1.6197509765625, 1.77996826171875, 1.940185546875, 2.10040283203125, 2.2606201171875, 2.42083740234375, 2.5810546875, 2.74127197265625, 2.9014892578125, 3.06170654296875, 3.221923828125, 3.38214111328125, 3.5423583984375, 3.70257568359375, 3.86279296875, 4.02301025390625, 4.1832275390625, 4.34344482421875, 4.503662109375, 4.66387939453125, 4.8240966796875, 4.98431396484375, 5.14453125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 7.0, 8.0, 13.0, 12.0, 25.0, 35.0, 24.0, 45.0, 37.0, 48.0, 36.0, 48.0, 51.0, 49.0, 53.0, 64.0, 58.0, 59.0, 53.0, 43.0, 41.0, 38.0, 31.0, 30.0, 22.0, 9.0, 11.0, 4.0, 7.0, 8.0, 5.0, 2.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3818359375, -1.3379058837890625, -1.293975830078125, -1.2500457763671875, -1.20611572265625, -1.1621856689453125, -1.118255615234375, -1.0743255615234375, -1.0303955078125, -0.9864654541015625, -0.942535400390625, -0.8986053466796875, -0.85467529296875, -0.8107452392578125, -0.766815185546875, -0.7228851318359375, -0.678955078125, -0.6350250244140625, -0.591094970703125, -0.5471649169921875, -0.50323486328125, -0.4593048095703125, -0.415374755859375, -0.3714447021484375, -0.3275146484375, -0.2835845947265625, -0.239654541015625, -0.1957244873046875, -0.15179443359375, -0.1078643798828125, -0.063934326171875, -0.0200042724609375, 0.02392578125, 0.0678558349609375, 0.111785888671875, 0.1557159423828125, 0.19964599609375, 0.2435760498046875, 0.287506103515625, 0.3314361572265625, 0.3753662109375, 0.4192962646484375, 0.463226318359375, 0.5071563720703125, 0.55108642578125, 0.5950164794921875, 0.638946533203125, 0.6828765869140625, 0.726806640625, 0.7707366943359375, 0.814666748046875, 0.8585968017578125, 0.90252685546875, 0.9464569091796875, 0.990386962890625, 1.0343170166015625, 1.0782470703125, 1.1221771240234375, 1.166107177734375, 1.2100372314453125, 1.25396728515625, 1.2978973388671875, 1.341827392578125, 1.3857574462890625, 1.4296875]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 11.0, 9.0, 10.0, 14.0, 17.0, 9.0, 22.0, 33.0, 29.0, 49.0, 47.0, 61.0, 51.0, 52.0, 64.0, 66.0, 75.0, 59.0, 56.0, 37.0, 39.0, 28.0, 22.0, 28.0, 20.0, 22.0, 8.0, 15.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.807313919067383, -19.240148544311523, -18.672983169555664, -18.105819702148438, -17.538654327392578, -16.97148895263672, -16.40432357788086, -15.837158203125, -15.269993782043457, -14.702828407287598, -14.135663986206055, -13.568498611450195, -13.001333236694336, -12.434168815612793, -11.867003440856934, -11.29983901977539, -10.732673645019531, -10.165508270263672, -9.598343849182129, -9.03117847442627, -8.464014053344727, -7.896848678588867, -7.329683303833008, -6.762518405914307, -6.1953535079956055, -5.628188610076904, -5.061023712158203, -4.493858337402344, -3.9266934394836426, -3.3595285415649414, -2.792363405227661, -2.225198268890381, -1.6580314636230469, -1.0908664464950562, -0.5237014293670654, 0.04346358776092529, 0.610628604888916, 1.1777935028076172, 1.7449586391448975, 2.3121237754821777, 2.879288673400879, 3.44645357131958, 4.013618469238281, 4.580783843994141, 5.147948741912842, 5.715113639831543, 6.282279014587402, 6.8494439125061035, 7.416608810424805, 7.983773708343506, 8.550938606262207, 9.118103981018066, 9.68526840209961, 10.252433776855469, 10.819599151611328, 11.386764526367188, 11.95392894744873, 12.52109432220459, 13.088258743286133, 13.655424118041992, 14.222589492797852, 14.789753913879395, 15.356919288635254, 15.924083709716797, 16.491249084472656]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 7.0, 3.0, 9.0, 9.0, 12.0, 5.0, 15.0, 13.0, 22.0, 19.0, 27.0, 29.0, 24.0, 24.0, 22.0, 31.0, 41.0, 37.0, 42.0, 48.0, 37.0, 41.0, 36.0, 36.0, 41.0, 41.0, 42.0, 23.0, 43.0, 34.0, 33.0, 23.0, 20.0, 19.0, 17.0, 14.0, 16.0, 12.0, 9.0, 8.0, 6.0, 4.0, 7.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.244494438171387, -9.893935203552246, -9.543375968933105, -9.192816734313965, -8.842257499694824, -8.491697311401367, -8.141138076782227, -7.790578842163086, -7.440019607543945, -7.089460372924805, -6.738901138305664, -6.388341903686523, -6.037782192230225, -5.687222957611084, -5.336663722991943, -4.9861040115356445, -4.635545253753662, -4.2849860191345215, -3.9344265460968018, -3.583867311477661, -3.2333078384399414, -2.882748603820801, -2.53218936920166, -2.1816298961639404, -1.8310706615447998, -1.4805113077163696, -1.1299519538879395, -0.7793927192687988, -0.42883336544036865, -0.07827401161193848, 0.27228522300720215, 0.6228446960449219, 0.9734039306640625, 1.3239632844924927, 1.6745226383209229, 2.0250818729400635, 2.375641345977783, 2.726200580596924, 3.0767598152160645, 3.427319288253784, 3.777878522872925, 4.1284379959106445, 4.478997230529785, 4.829556465148926, 5.180115699768066, 5.530674934387207, 5.881234169006348, 6.2317938804626465, 6.582353115081787, 6.932912349700928, 7.283471584320068, 7.634031295776367, 7.984590530395508, 8.335149765014648, 8.685708999633789, 9.03626823425293, 9.38682746887207, 9.737386703491211, 10.087945938110352, 10.438505172729492, 10.789064407348633, 11.139623641967773, 11.490182876586914, 11.840743064880371, 12.191302299499512]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 12.0, 7.0, 16.0, 22.0, 35.0, 44.0, 82.0, 110.0, 145.0, 261.0, 405.0, 648.0, 1028.0, 1616.0, 2689.0, 4948.0, 9112.0, 18598.0, 41480.0, 109493.0, 333596.0, 976617.0, 1491960.0, 790325.0, 256893.0, 85761.0, 34045.0, 15805.0, 8134.0, 4362.0, 2469.0, 1396.0, 829.0, 541.0, 270.0, 179.0, 121.0, 68.0, 55.0, 40.0, 24.0, 15.0, 8.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-31.171875, -30.265380859375, -29.35888671875, -28.452392578125, -27.5458984375, -26.639404296875, -25.73291015625, -24.826416015625, -23.919921875, -23.013427734375, -22.10693359375, -21.200439453125, -20.2939453125, -19.387451171875, -18.48095703125, -17.574462890625, -16.66796875, -15.761474609375, -14.85498046875, -13.948486328125, -13.0419921875, -12.135498046875, -11.22900390625, -10.322509765625, -9.416015625, -8.509521484375, -7.60302734375, -6.696533203125, -5.7900390625, -4.883544921875, -3.97705078125, -3.070556640625, -2.1640625, -1.257568359375, -0.35107421875, 0.555419921875, 1.4619140625, 2.368408203125, 3.27490234375, 4.181396484375, 5.087890625, 5.994384765625, 6.90087890625, 7.807373046875, 8.7138671875, 9.620361328125, 10.52685546875, 11.433349609375, 12.33984375, 13.246337890625, 14.15283203125, 15.059326171875, 15.9658203125, 16.872314453125, 17.77880859375, 18.685302734375, 19.591796875, 20.498291015625, 21.40478515625, 22.311279296875, 23.2177734375, 24.124267578125, 25.03076171875, 25.937255859375, 26.84375]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 6.0, 5.0, 10.0, 9.0, 15.0, 10.0, 11.0, 18.0, 18.0, 26.0, 14.0, 25.0, 23.0, 27.0, 32.0, 20.0, 32.0, 38.0, 49.0, 39.0, 35.0, 41.0, 41.0, 36.0, 30.0, 39.0, 37.0, 27.0, 34.0, 29.0, 39.0, 24.0, 24.0, 15.0, 23.0, 21.0, 12.0, 10.0, 12.0, 6.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.715576171875, -8.40771484375, -8.099853515625, -7.7919921875, -7.484130859375, -7.17626953125, -6.868408203125, -6.560546875, -6.252685546875, -5.94482421875, -5.636962890625, -5.3291015625, -5.021240234375, -4.71337890625, -4.405517578125, -4.09765625, -3.789794921875, -3.48193359375, -3.174072265625, -2.8662109375, -2.558349609375, -2.25048828125, -1.942626953125, -1.634765625, -1.326904296875, -1.01904296875, -0.711181640625, -0.4033203125, -0.095458984375, 0.21240234375, 0.520263671875, 0.828125, 1.135986328125, 1.44384765625, 1.751708984375, 2.0595703125, 2.367431640625, 2.67529296875, 2.983154296875, 3.291015625, 3.598876953125, 3.90673828125, 4.214599609375, 4.5224609375, 4.830322265625, 5.13818359375, 5.446044921875, 5.75390625, 6.061767578125, 6.36962890625, 6.677490234375, 6.9853515625, 7.293212890625, 7.60107421875, 7.908935546875, 8.216796875, 8.524658203125, 8.83251953125, 9.140380859375, 9.4482421875, 9.756103515625, 10.06396484375, 10.371826171875, 10.6796875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 11.0, 18.0, 12.0, 18.0, 34.0, 46.0, 98.0, 171.0, 233.0, 448.0, 723.0, 1234.0, 2021.0, 3574.0, 6007.0, 11052.0, 21441.0, 42555.0, 90706.0, 209454.0, 498209.0, 1004084.0, 1137695.0, 652965.0, 279056.0, 119080.0, 54280.0, 27078.0, 14131.0, 7517.0, 4228.0, 2448.0, 1399.0, 882.0, 545.0, 326.0, 197.0, 125.0, 70.0, 33.0, 28.0, 18.0, 7.0, 12.0, 10.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.546875, -25.63671875, -24.7265625, -23.81640625, -22.90625, -21.99609375, -21.0859375, -20.17578125, -19.265625, -18.35546875, -17.4453125, -16.53515625, -15.625, -14.71484375, -13.8046875, -12.89453125, -11.984375, -11.07421875, -10.1640625, -9.25390625, -8.34375, -7.43359375, -6.5234375, -5.61328125, -4.703125, -3.79296875, -2.8828125, -1.97265625, -1.0625, -0.15234375, 0.7578125, 1.66796875, 2.578125, 3.48828125, 4.3984375, 5.30859375, 6.21875, 7.12890625, 8.0390625, 8.94921875, 9.859375, 10.76953125, 11.6796875, 12.58984375, 13.5, 14.41015625, 15.3203125, 16.23046875, 17.140625, 18.05078125, 18.9609375, 19.87109375, 20.78125, 21.69140625, 22.6015625, 23.51171875, 24.421875, 25.33203125, 26.2421875, 27.15234375, 28.0625, 28.97265625, 29.8828125, 30.79296875, 31.703125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 10.0, 24.0, 23.0, 30.0, 40.0, 47.0, 78.0, 70.0, 99.0, 133.0, 154.0, 190.0, 258.0, 265.0, 277.0, 314.0, 327.0, 297.0, 282.0, 235.0, 203.0, 159.0, 138.0, 94.0, 94.0, 50.0, 48.0, 36.0, 29.0, 11.0, 12.0, 15.0, 11.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.749267578125, -8.49853515625, -8.247802734375, -7.9970703125, -7.746337890625, -7.49560546875, -7.244873046875, -6.994140625, -6.743408203125, -6.49267578125, -6.241943359375, -5.9912109375, -5.740478515625, -5.48974609375, -5.239013671875, -4.98828125, -4.737548828125, -4.48681640625, -4.236083984375, -3.9853515625, -3.734619140625, -3.48388671875, -3.233154296875, -2.982421875, -2.731689453125, -2.48095703125, -2.230224609375, -1.9794921875, -1.728759765625, -1.47802734375, -1.227294921875, -0.9765625, -0.725830078125, -0.47509765625, -0.224365234375, 0.0263671875, 0.277099609375, 0.52783203125, 0.778564453125, 1.029296875, 1.280029296875, 1.53076171875, 1.781494140625, 2.0322265625, 2.282958984375, 2.53369140625, 2.784423828125, 3.03515625, 3.285888671875, 3.53662109375, 3.787353515625, 4.0380859375, 4.288818359375, 4.53955078125, 4.790283203125, 5.041015625, 5.291748046875, 5.54248046875, 5.793212890625, 6.0439453125, 6.294677734375, 6.54541015625, 6.796142578125, 7.046875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 3.0, 11.0, 7.0, 10.0, 12.0, 18.0, 13.0, 22.0, 29.0, 37.0, 37.0, 47.0, 61.0, 65.0, 64.0, 54.0, 59.0, 60.0, 60.0, 44.0, 46.0, 47.0, 37.0, 33.0, 23.0, 26.0, 20.0, 7.0, 8.0, 6.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.552993774414062, -21.752286911010742, -20.951581954956055, -20.150875091552734, -19.350170135498047, -18.549463272094727, -17.748756408691406, -16.94805145263672, -16.14734649658203, -15.346640586853027, -14.545934677124023, -13.745227813720703, -12.944522857666016, -12.143815994262695, -11.343110084533691, -10.542404174804688, -9.741697311401367, -8.940991401672363, -8.14028549194336, -7.339579105377197, -6.538873195648193, -5.7381672859191895, -4.937460899353027, -4.136754989624023, -3.3360490798950195, -2.5353431701660156, -1.7346370220184326, -0.9339308738708496, -0.1332249641418457, 0.6674809455871582, 1.4681873321533203, 2.268893241882324, 3.069601058959961, 3.870306968688965, 4.671012878417969, 5.471719264984131, 6.272425174713135, 7.073131084442139, 7.873837471008301, 8.674543380737305, 9.475249290466309, 10.275955200195312, 11.076661109924316, 11.87736701965332, 12.67807388305664, 13.478778839111328, 14.279485702514648, 15.080191612243652, 15.880897521972656, 16.681604385375977, 17.482309341430664, 18.283016204833984, 19.083721160888672, 19.884428024291992, 20.685134887695312, 21.48583984375, 22.286544799804688, 23.087251663208008, 23.887956619262695, 24.688663482666016, 25.489368438720703, 26.290075302124023, 27.090782165527344, 27.89148712158203, 28.69219398498535]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 2.0, 8.0, 8.0, 6.0, 3.0, 9.0, 8.0, 11.0, 16.0, 15.0, 23.0, 18.0, 23.0, 23.0, 22.0, 39.0, 29.0, 27.0, 32.0, 47.0, 37.0, 46.0, 39.0, 66.0, 51.0, 37.0, 33.0, 31.0, 38.0, 39.0, 34.0, 29.0, 29.0, 24.0, 26.0, 7.0, 15.0, 14.0, 9.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.265556335449219, -13.828651428222656, -13.391746520996094, -12.954841613769531, -12.517937660217285, -12.081032752990723, -11.64412784576416, -11.207222938537598, -10.770318984985352, -10.333414077758789, -9.896509170532227, -9.459604263305664, -9.022700309753418, -8.585795402526855, -8.148890495300293, -7.7119855880737305, -7.275080680847168, -6.8381757736206055, -6.401271343231201, -5.964366436004639, -5.527462005615234, -5.090557098388672, -4.653652191162109, -4.216747283935547, -3.7798428535461426, -3.342938184738159, -2.906033515930176, -2.4691286087036133, -2.03222393989563, -1.5953192710876465, -1.158414363861084, -0.7215096950531006, -0.2846059799194336, 0.15229874849319458, 0.5892034769058228, 1.0261082649230957, 1.463012933731079, 1.8999176025390625, 2.336822509765625, 2.7737271785736084, 3.210631847381592, 3.647536516189575, 4.084441184997559, 4.521346092224121, 4.958250999450684, 5.395155429840088, 5.83206033706665, 6.268964767456055, 6.705869674682617, 7.14277458190918, 7.579679012298584, 8.016584396362305, 8.45348834991455, 8.890393257141113, 9.327298164367676, 9.764203071594238, 10.201107025146484, 10.638011932373047, 11.07491683959961, 11.511821746826172, 11.948725700378418, 12.38563060760498, 12.822535514831543, 13.259440422058105, 13.696345329284668]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 8.0, 4.0, 6.0, 11.0, 10.0, 30.0, 36.0, 58.0, 96.0, 145.0, 274.0, 571.0, 1082.0, 2323.0, 5339.0, 11805.0, 28068.0, 68746.0, 161561.0, 293300.0, 258309.0, 125620.0, 52538.0, 21503.0, 9309.0, 4042.0, 1821.0, 899.0, 440.0, 230.0, 135.0, 84.0, 40.0, 31.0, 19.0, 13.0, 14.0, 6.0, 8.0, 6.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.2734375, -12.8431396484375, -12.412841796875, -11.9825439453125, -11.55224609375, -11.1219482421875, -10.691650390625, -10.2613525390625, -9.8310546875, -9.4007568359375, -8.970458984375, -8.5401611328125, -8.10986328125, -7.6795654296875, -7.249267578125, -6.8189697265625, -6.388671875, -5.9583740234375, -5.528076171875, -5.0977783203125, -4.66748046875, -4.2371826171875, -3.806884765625, -3.3765869140625, -2.9462890625, -2.5159912109375, -2.085693359375, -1.6553955078125, -1.22509765625, -0.7947998046875, -0.364501953125, 0.0657958984375, 0.49609375, 0.9263916015625, 1.356689453125, 1.7869873046875, 2.21728515625, 2.6475830078125, 3.077880859375, 3.5081787109375, 3.9384765625, 4.3687744140625, 4.799072265625, 5.2293701171875, 5.65966796875, 6.0899658203125, 6.520263671875, 6.9505615234375, 7.380859375, 7.8111572265625, 8.241455078125, 8.6717529296875, 9.10205078125, 9.5323486328125, 9.962646484375, 10.3929443359375, 10.8232421875, 11.2535400390625, 11.683837890625, 12.1141357421875, 12.54443359375, 12.9747314453125, 13.405029296875, 13.8353271484375, 14.265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 2.0, 10.0, 5.0, 8.0, 13.0, 22.0, 14.0, 19.0, 22.0, 21.0, 23.0, 37.0, 26.0, 42.0, 33.0, 36.0, 45.0, 45.0, 52.0, 52.0, 34.0, 44.0, 45.0, 35.0, 36.0, 32.0, 38.0, 32.0, 31.0, 26.0, 16.0, 17.0, 13.0, 12.0, 12.0, 6.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.0, -15.5155029296875, -15.031005859375, -14.5465087890625, -14.06201171875, -13.5775146484375, -13.093017578125, -12.6085205078125, -12.1240234375, -11.6395263671875, -11.155029296875, -10.6705322265625, -10.18603515625, -9.7015380859375, -9.217041015625, -8.7325439453125, -8.248046875, -7.7635498046875, -7.279052734375, -6.7945556640625, -6.31005859375, -5.8255615234375, -5.341064453125, -4.8565673828125, -4.3720703125, -3.8875732421875, -3.403076171875, -2.9185791015625, -2.43408203125, -1.9495849609375, -1.465087890625, -0.9805908203125, -0.49609375, -0.0115966796875, 0.472900390625, 0.9573974609375, 1.44189453125, 1.9263916015625, 2.410888671875, 2.8953857421875, 3.3798828125, 3.8643798828125, 4.348876953125, 4.8333740234375, 5.31787109375, 5.8023681640625, 6.286865234375, 6.7713623046875, 7.255859375, 7.7403564453125, 8.224853515625, 8.7093505859375, 9.19384765625, 9.6783447265625, 10.162841796875, 10.6473388671875, 11.1318359375, 11.6163330078125, 12.100830078125, 12.5853271484375, 13.06982421875, 13.5543212890625, 14.038818359375, 14.5233154296875, 15.0078125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 6.0, 6.0, 19.0, 20.0, 26.0, 32.0, 60.0, 100.0, 155.0, 233.0, 393.0, 702.0, 1232.0, 2248.0, 4129.0, 8035.0, 17368.0, 38406.0, 91707.0, 213398.0, 319092.0, 198201.0, 84289.0, 35915.0, 16113.0, 7857.0, 3960.0, 2019.0, 1132.0, 668.0, 402.0, 223.0, 149.0, 93.0, 51.0, 44.0, 21.0, 18.0, 8.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.1484375, -13.683837890625, -13.21923828125, -12.754638671875, -12.2900390625, -11.825439453125, -11.36083984375, -10.896240234375, -10.431640625, -9.967041015625, -9.50244140625, -9.037841796875, -8.5732421875, -8.108642578125, -7.64404296875, -7.179443359375, -6.71484375, -6.250244140625, -5.78564453125, -5.321044921875, -4.8564453125, -4.391845703125, -3.92724609375, -3.462646484375, -2.998046875, -2.533447265625, -2.06884765625, -1.604248046875, -1.1396484375, -0.675048828125, -0.21044921875, 0.254150390625, 0.71875, 1.183349609375, 1.64794921875, 2.112548828125, 2.5771484375, 3.041748046875, 3.50634765625, 3.970947265625, 4.435546875, 4.900146484375, 5.36474609375, 5.829345703125, 6.2939453125, 6.758544921875, 7.22314453125, 7.687744140625, 8.15234375, 8.616943359375, 9.08154296875, 9.546142578125, 10.0107421875, 10.475341796875, 10.93994140625, 11.404541015625, 11.869140625, 12.333740234375, 12.79833984375, 13.262939453125, 13.7275390625, 14.192138671875, 14.65673828125, 15.121337890625, 15.5859375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 5.0, 11.0, 14.0, 12.0, 11.0, 14.0, 16.0, 29.0, 23.0, 28.0, 27.0, 38.0, 38.0, 30.0, 28.0, 29.0, 53.0, 34.0, 42.0, 44.0, 37.0, 26.0, 28.0, 31.0, 41.0, 40.0, 36.0, 33.0, 22.0, 24.0, 22.0, 19.0, 11.0, 17.0, 10.0, 13.0, 14.0, 6.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.125, -8.8516845703125, -8.578369140625, -8.3050537109375, -8.03173828125, -7.7584228515625, -7.485107421875, -7.2117919921875, -6.9384765625, -6.6651611328125, -6.391845703125, -6.1185302734375, -5.84521484375, -5.5718994140625, -5.298583984375, -5.0252685546875, -4.751953125, -4.4786376953125, -4.205322265625, -3.9320068359375, -3.65869140625, -3.3853759765625, -3.112060546875, -2.8387451171875, -2.5654296875, -2.2921142578125, -2.018798828125, -1.7454833984375, -1.47216796875, -1.1988525390625, -0.925537109375, -0.6522216796875, -0.37890625, -0.1055908203125, 0.167724609375, 0.4410400390625, 0.71435546875, 0.9876708984375, 1.260986328125, 1.5343017578125, 1.8076171875, 2.0809326171875, 2.354248046875, 2.6275634765625, 2.90087890625, 3.1741943359375, 3.447509765625, 3.7208251953125, 3.994140625, 4.2674560546875, 4.540771484375, 4.8140869140625, 5.08740234375, 5.3607177734375, 5.634033203125, 5.9073486328125, 6.1806640625, 6.4539794921875, 6.727294921875, 7.0006103515625, 7.27392578125, 7.5472412109375, 7.820556640625, 8.0938720703125, 8.3671875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 15.0, 15.0, 32.0, 45.0, 58.0, 78.0, 95.0, 166.0, 228.0, 368.0, 522.0, 809.0, 1139.0, 1786.0, 2960.0, 4720.0, 8246.0, 14682.0, 26791.0, 52190.0, 102072.0, 193308.0, 257209.0, 181418.0, 93585.0, 47658.0, 24917.0, 13532.0, 7649.0, 4527.0, 2777.0, 1722.0, 1102.0, 692.0, 454.0, 299.0, 203.0, 150.0, 99.0, 71.0, 62.0, 39.0, 18.0, 18.0, 7.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.33984375, -5.17523193359375, -5.0106201171875, -4.84600830078125, -4.681396484375, -4.51678466796875, -4.3521728515625, -4.18756103515625, -4.02294921875, -3.85833740234375, -3.6937255859375, -3.52911376953125, -3.364501953125, -3.19989013671875, -3.0352783203125, -2.87066650390625, -2.7060546875, -2.54144287109375, -2.3768310546875, -2.21221923828125, -2.047607421875, -1.88299560546875, -1.7183837890625, -1.55377197265625, -1.38916015625, -1.22454833984375, -1.0599365234375, -0.89532470703125, -0.730712890625, -0.56610107421875, -0.4014892578125, -0.23687744140625, -0.072265625, 0.09234619140625, 0.2569580078125, 0.42156982421875, 0.586181640625, 0.75079345703125, 0.9154052734375, 1.08001708984375, 1.24462890625, 1.40924072265625, 1.5738525390625, 1.73846435546875, 1.903076171875, 2.06768798828125, 2.2322998046875, 2.39691162109375, 2.5615234375, 2.72613525390625, 2.8907470703125, 3.05535888671875, 3.219970703125, 3.38458251953125, 3.5491943359375, 3.71380615234375, 3.87841796875, 4.04302978515625, 4.2076416015625, 4.37225341796875, 4.536865234375, 4.70147705078125, 4.8660888671875, 5.03070068359375, 5.1953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 8.0, 6.0, 9.0, 11.0, 12.0, 16.0, 21.0, 30.0, 37.0, 39.0, 40.0, 68.0, 70.0, 73.0, 64.0, 70.0, 73.0, 57.0, 52.0, 42.0, 49.0, 24.0, 31.0, 22.0, 20.0, 13.0, 11.0, 9.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002281665802001953, -0.00022015348076820374, -0.00021214038133621216, -0.00020412728190422058, -0.000196114182472229, -0.00018810108304023743, -0.00018008798360824585, -0.00017207488417625427, -0.0001640617847442627, -0.00015604868531227112, -0.00014803558588027954, -0.00014002248644828796, -0.0001320093870162964, -0.0001239962875843048, -0.00011598318815231323, -0.00010797008872032166, -9.995698928833008e-05, -9.19438898563385e-05, -8.393079042434692e-05, -7.591769099235535e-05, -6.790459156036377e-05, -5.989149212837219e-05, -5.1878392696380615e-05, -4.386529326438904e-05, -3.585219383239746e-05, -2.7839094400405884e-05, -1.9825994968414307e-05, -1.181289553642273e-05, -3.7997961044311523e-06, 4.213303327560425e-06, 1.2226402759552002e-05, 2.023950219154358e-05, 2.8252601623535156e-05, 3.6265701055526733e-05, 4.427880048751831e-05, 5.229189991950989e-05, 6.0304999351501465e-05, 6.831809878349304e-05, 7.633119821548462e-05, 8.43442976474762e-05, 9.235739707946777e-05, 0.00010037049651145935, 0.00010838359594345093, 0.0001163966953754425, 0.00012440979480743408, 0.00013242289423942566, 0.00014043599367141724, 0.0001484490931034088, 0.0001564621925354004, 0.00016447529196739197, 0.00017248839139938354, 0.00018050149083137512, 0.0001885145902633667, 0.00019652768969535828, 0.00020454078912734985, 0.00021255388855934143, 0.000220566987991333, 0.00022858008742332458, 0.00023659318685531616, 0.00024460628628730774, 0.0002526193857192993, 0.0002606324851512909, 0.00026864558458328247, 0.00027665868401527405, 0.0002846717834472656]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 14.0, 16.0, 25.0, 40.0, 44.0, 81.0, 126.0, 193.0, 290.0, 455.0, 695.0, 1081.0, 1727.0, 3005.0, 5038.0, 8915.0, 16625.0, 32341.0, 63861.0, 126721.0, 219086.0, 240968.0, 158064.0, 81463.0, 40902.0, 20770.0, 10889.0, 6069.0, 3490.0, 2025.0, 1266.0, 769.0, 509.0, 331.0, 211.0, 155.0, 77.0, 61.0, 53.0, 31.0, 23.0, 13.0, 10.0, 5.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.96875, -6.75213623046875, -6.5355224609375, -6.31890869140625, -6.102294921875, -5.88568115234375, -5.6690673828125, -5.45245361328125, -5.23583984375, -5.01922607421875, -4.8026123046875, -4.58599853515625, -4.369384765625, -4.15277099609375, -3.9361572265625, -3.71954345703125, -3.5029296875, -3.28631591796875, -3.0697021484375, -2.85308837890625, -2.636474609375, -2.41986083984375, -2.2032470703125, -1.98663330078125, -1.77001953125, -1.55340576171875, -1.3367919921875, -1.12017822265625, -0.903564453125, -0.68695068359375, -0.4703369140625, -0.25372314453125, -0.037109375, 0.17950439453125, 0.3961181640625, 0.61273193359375, 0.829345703125, 1.04595947265625, 1.2625732421875, 1.47918701171875, 1.69580078125, 1.91241455078125, 2.1290283203125, 2.34564208984375, 2.562255859375, 2.77886962890625, 2.9954833984375, 3.21209716796875, 3.4287109375, 3.64532470703125, 3.8619384765625, 4.07855224609375, 4.295166015625, 4.51177978515625, 4.7283935546875, 4.94500732421875, 5.16162109375, 5.37823486328125, 5.5948486328125, 5.81146240234375, 6.028076171875, 6.24468994140625, 6.4613037109375, 6.67791748046875, 6.89453125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 10.0, 10.0, 14.0, 14.0, 26.0, 30.0, 39.0, 49.0, 64.0, 67.0, 64.0, 82.0, 91.0, 76.0, 58.0, 55.0, 56.0, 37.0, 36.0, 34.0, 22.0, 18.0, 8.0, 8.0, 6.0, 4.0, 6.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.94921875, -1.888427734375, -1.82763671875, -1.766845703125, -1.7060546875, -1.645263671875, -1.58447265625, -1.523681640625, -1.462890625, -1.402099609375, -1.34130859375, -1.280517578125, -1.2197265625, -1.158935546875, -1.09814453125, -1.037353515625, -0.9765625, -0.915771484375, -0.85498046875, -0.794189453125, -0.7333984375, -0.672607421875, -0.61181640625, -0.551025390625, -0.490234375, -0.429443359375, -0.36865234375, -0.307861328125, -0.2470703125, -0.186279296875, -0.12548828125, -0.064697265625, -0.00390625, 0.056884765625, 0.11767578125, 0.178466796875, 0.2392578125, 0.300048828125, 0.36083984375, 0.421630859375, 0.482421875, 0.543212890625, 0.60400390625, 0.664794921875, 0.7255859375, 0.786376953125, 0.84716796875, 0.907958984375, 0.96875, 1.029541015625, 1.09033203125, 1.151123046875, 1.2119140625, 1.272705078125, 1.33349609375, 1.394287109375, 1.455078125, 1.515869140625, 1.57666015625, 1.637451171875, 1.6982421875, 1.759033203125, 1.81982421875, 1.880615234375, 1.94140625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 0.0, 8.0, 6.0, 5.0, 8.0, 20.0, 15.0, 15.0, 14.0, 26.0, 30.0, 42.0, 33.0, 66.0, 70.0, 63.0, 52.0, 59.0, 72.0, 55.0, 46.0, 51.0, 47.0, 38.0, 34.0, 27.0, 20.0, 20.0, 15.0, 6.0, 7.0, 6.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.030563354492188, -23.214033126831055, -22.397502899169922, -21.580974578857422, -20.76444435119629, -19.947914123535156, -19.131383895874023, -18.31485366821289, -17.49832534790039, -16.681795120239258, -15.865265846252441, -15.048735618591309, -14.232206344604492, -13.41567611694336, -12.599145889282227, -11.782615661621094, -10.966085433959961, -10.149555206298828, -9.333025932312012, -8.516495704650879, -7.699965953826904, -6.88343620300293, -6.066905975341797, -5.250376224517822, -4.433846473693848, -3.617316722869873, -2.8007867336273193, -1.9842567443847656, -1.167726993560791, -0.3511972427368164, 0.4653329849243164, 1.281862735748291, 2.0983943939208984, 2.914924144744873, 3.7314541339874268, 4.5479841232299805, 5.364513874053955, 6.18104362487793, 6.9975738525390625, 7.814103603363037, 8.630633354187012, 9.447163581848145, 10.263692855834961, 11.080223083496094, 11.896753311157227, 12.713282585144043, 13.529812812805176, 14.346342086791992, 15.162872314453125, 15.979402542114258, 16.79593276977539, 17.61246109008789, 18.428991317749023, 19.245521545410156, 20.06205177307129, 20.878582000732422, 21.695110321044922, 22.511640548706055, 23.328170776367188, 24.144699096679688, 24.96122932434082, 25.777759552001953, 26.594289779663086, 27.41082000732422, 28.22735023498535]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 6.0, 6.0, 4.0, 4.0, 11.0, 13.0, 10.0, 15.0, 18.0, 22.0, 17.0, 23.0, 26.0, 32.0, 29.0, 26.0, 28.0, 36.0, 33.0, 37.0, 54.0, 46.0, 57.0, 50.0, 30.0, 36.0, 32.0, 34.0, 47.0, 34.0, 29.0, 24.0, 34.0, 14.0, 6.0, 15.0, 19.0, 9.0, 6.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.910043716430664, -13.482439041137695, -13.054834365844727, -12.627229690551758, -12.199624061584473, -11.772019386291504, -11.344414710998535, -10.916810035705566, -10.489204406738281, -10.061599731445312, -9.633995056152344, -9.206390380859375, -8.77878475189209, -8.351180076599121, -7.923575401306152, -7.495970726013184, -7.068366050720215, -6.640761375427246, -6.213156223297119, -5.78555154800415, -5.357946395874023, -4.930341720581055, -4.502737045288086, -4.075132369995117, -3.6475272178649902, -3.2199223041534424, -2.7923173904418945, -2.364712715148926, -1.937107801437378, -1.50950288772583, -1.0818982124328613, -0.6542932987213135, -0.22668743133544922, 0.20091742277145386, 0.6285222768783569, 1.0561270713806152, 1.483731985092163, 1.911336898803711, 2.3389415740966797, 2.7665464878082275, 3.1941514015197754, 3.6217563152313232, 4.049361228942871, 4.47696590423584, 4.904570579528809, 5.3321757316589355, 5.759780406951904, 6.187385559082031, 6.614990234375, 7.042594909667969, 7.470200061798096, 7.8978047370910645, 8.325409889221191, 8.75301456451416, 9.180619239807129, 9.608223915100098, 10.035829544067383, 10.463434219360352, 10.89103889465332, 11.318643569946289, 11.746249198913574, 12.173853874206543, 12.601458549499512, 13.02906322479248, 13.45666790008545]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 7.0, 10.0, 15.0, 15.0, 29.0, 41.0, 51.0, 66.0, 110.0, 145.0, 218.0, 281.0, 401.0, 584.0, 879.0, 1407.0, 2390.0, 4755.0, 10112.0, 24230.0, 58902.0, 137670.0, 252460.0, 268970.0, 160655.0, 70718.0, 28511.0, 12007.0, 5427.0, 2797.0, 1613.0, 992.0, 624.0, 437.0, 295.0, 207.0, 138.0, 113.0, 80.0, 39.0, 35.0, 30.0, 34.0, 16.0, 12.0, 3.0, 13.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.084716796875, -18.45068359375, -17.816650390625, -17.1826171875, -16.548583984375, -15.91455078125, -15.280517578125, -14.646484375, -14.012451171875, -13.37841796875, -12.744384765625, -12.1103515625, -11.476318359375, -10.84228515625, -10.208251953125, -9.57421875, -8.940185546875, -8.30615234375, -7.672119140625, -7.0380859375, -6.404052734375, -5.77001953125, -5.135986328125, -4.501953125, -3.867919921875, -3.23388671875, -2.599853515625, -1.9658203125, -1.331787109375, -0.69775390625, -0.063720703125, 0.5703125, 1.204345703125, 1.83837890625, 2.472412109375, 3.1064453125, 3.740478515625, 4.37451171875, 5.008544921875, 5.642578125, 6.276611328125, 6.91064453125, 7.544677734375, 8.1787109375, 8.812744140625, 9.44677734375, 10.080810546875, 10.71484375, 11.348876953125, 11.98291015625, 12.616943359375, 13.2509765625, 13.885009765625, 14.51904296875, 15.153076171875, 15.787109375, 16.421142578125, 17.05517578125, 17.689208984375, 18.3232421875, 18.957275390625, 19.59130859375, 20.225341796875, 20.859375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 9.0, 2.0, 4.0, 8.0, 7.0, 11.0, 14.0, 15.0, 20.0, 12.0, 10.0, 25.0, 28.0, 27.0, 22.0, 24.0, 28.0, 42.0, 35.0, 47.0, 42.0, 39.0, 49.0, 47.0, 51.0, 35.0, 33.0, 42.0, 38.0, 33.0, 28.0, 35.0, 20.0, 20.0, 14.0, 17.0, 11.0, 10.0, 10.0, 6.0, 9.0, 7.0, 6.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-14.1171875, -13.6663818359375, -13.215576171875, -12.7647705078125, -12.31396484375, -11.8631591796875, -11.412353515625, -10.9615478515625, -10.5107421875, -10.0599365234375, -9.609130859375, -9.1583251953125, -8.70751953125, -8.2567138671875, -7.805908203125, -7.3551025390625, -6.904296875, -6.4534912109375, -6.002685546875, -5.5518798828125, -5.10107421875, -4.6502685546875, -4.199462890625, -3.7486572265625, -3.2978515625, -2.8470458984375, -2.396240234375, -1.9454345703125, -1.49462890625, -1.0438232421875, -0.593017578125, -0.1422119140625, 0.30859375, 0.7593994140625, 1.210205078125, 1.6610107421875, 2.11181640625, 2.5626220703125, 3.013427734375, 3.4642333984375, 3.9150390625, 4.3658447265625, 4.816650390625, 5.2674560546875, 5.71826171875, 6.1690673828125, 6.619873046875, 7.0706787109375, 7.521484375, 7.9722900390625, 8.423095703125, 8.8739013671875, 9.32470703125, 9.7755126953125, 10.226318359375, 10.6771240234375, 11.1279296875, 11.5787353515625, 12.029541015625, 12.4803466796875, 12.93115234375, 13.3819580078125, 13.832763671875, 14.2835693359375, 14.734375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 6.0, 14.0, 11.0, 9.0, 14.0, 29.0, 35.0, 55.0, 75.0, 100.0, 116.0, 158.0, 218.0, 307.0, 441.0, 642.0, 924.0, 1612.0, 3275.0, 7983.0, 24496.0, 88112.0, 276177.0, 385076.0, 180332.0, 51890.0, 14883.0, 5256.0, 2344.0, 1214.0, 815.0, 535.0, 380.0, 273.0, 217.0, 159.0, 98.0, 70.0, 47.0, 47.0, 27.0, 26.0, 16.0, 21.0, 8.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.609375, -29.598876953125, -28.58837890625, -27.577880859375, -26.5673828125, -25.556884765625, -24.54638671875, -23.535888671875, -22.525390625, -21.514892578125, -20.50439453125, -19.493896484375, -18.4833984375, -17.472900390625, -16.46240234375, -15.451904296875, -14.44140625, -13.430908203125, -12.42041015625, -11.409912109375, -10.3994140625, -9.388916015625, -8.37841796875, -7.367919921875, -6.357421875, -5.346923828125, -4.33642578125, -3.325927734375, -2.3154296875, -1.304931640625, -0.29443359375, 0.716064453125, 1.7265625, 2.737060546875, 3.74755859375, 4.758056640625, 5.7685546875, 6.779052734375, 7.78955078125, 8.800048828125, 9.810546875, 10.821044921875, 11.83154296875, 12.842041015625, 13.8525390625, 14.863037109375, 15.87353515625, 16.884033203125, 17.89453125, 18.905029296875, 19.91552734375, 20.926025390625, 21.9365234375, 22.947021484375, 23.95751953125, 24.968017578125, 25.978515625, 26.989013671875, 27.99951171875, 29.010009765625, 30.0205078125, 31.031005859375, 32.04150390625, 33.052001953125, 34.0625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 5.0, 13.0, 11.0, 13.0, 17.0, 27.0, 22.0, 21.0, 24.0, 15.0, 23.0, 22.0, 32.0, 38.0, 34.0, 39.0, 39.0, 34.0, 35.0, 44.0, 33.0, 48.0, 42.0, 37.0, 46.0, 34.0, 38.0, 32.0, 24.0, 28.0, 18.0, 15.0, 14.0, 12.0, 10.0, 10.0, 8.0, 7.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.0390625, -8.7491455078125, -8.459228515625, -8.1693115234375, -7.87939453125, -7.5894775390625, -7.299560546875, -7.0096435546875, -6.7197265625, -6.4298095703125, -6.139892578125, -5.8499755859375, -5.56005859375, -5.2701416015625, -4.980224609375, -4.6903076171875, -4.400390625, -4.1104736328125, -3.820556640625, -3.5306396484375, -3.24072265625, -2.9508056640625, -2.660888671875, -2.3709716796875, -2.0810546875, -1.7911376953125, -1.501220703125, -1.2113037109375, -0.92138671875, -0.6314697265625, -0.341552734375, -0.0516357421875, 0.23828125, 0.5281982421875, 0.818115234375, 1.1080322265625, 1.39794921875, 1.6878662109375, 1.977783203125, 2.2677001953125, 2.5576171875, 2.8475341796875, 3.137451171875, 3.4273681640625, 3.71728515625, 4.0072021484375, 4.297119140625, 4.5870361328125, 4.876953125, 5.1668701171875, 5.456787109375, 5.7467041015625, 6.03662109375, 6.3265380859375, 6.616455078125, 6.9063720703125, 7.1962890625, 7.4862060546875, 7.776123046875, 8.0660400390625, 8.35595703125, 8.6458740234375, 8.935791015625, 9.2257080078125, 9.515625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 9.0, 3.0, 13.0, 10.0, 22.0, 32.0, 43.0, 68.0, 97.0, 157.0, 260.0, 378.0, 491.0, 743.0, 1174.0, 1709.0, 2770.0, 4517.0, 8036.0, 16660.0, 40474.0, 101668.0, 222223.0, 293501.0, 198566.0, 87248.0, 34253.0, 14537.0, 7286.0, 4142.0, 2547.0, 1638.0, 1056.0, 733.0, 517.0, 316.0, 208.0, 136.0, 103.0, 73.0, 39.0, 30.0, 25.0, 20.0, 12.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71875, -9.376708984375, -9.03466796875, -8.692626953125, -8.3505859375, -8.008544921875, -7.66650390625, -7.324462890625, -6.982421875, -6.640380859375, -6.29833984375, -5.956298828125, -5.6142578125, -5.272216796875, -4.93017578125, -4.588134765625, -4.24609375, -3.904052734375, -3.56201171875, -3.219970703125, -2.8779296875, -2.535888671875, -2.19384765625, -1.851806640625, -1.509765625, -1.167724609375, -0.82568359375, -0.483642578125, -0.1416015625, 0.200439453125, 0.54248046875, 0.884521484375, 1.2265625, 1.568603515625, 1.91064453125, 2.252685546875, 2.5947265625, 2.936767578125, 3.27880859375, 3.620849609375, 3.962890625, 4.304931640625, 4.64697265625, 4.989013671875, 5.3310546875, 5.673095703125, 6.01513671875, 6.357177734375, 6.69921875, 7.041259765625, 7.38330078125, 7.725341796875, 8.0673828125, 8.409423828125, 8.75146484375, 9.093505859375, 9.435546875, 9.777587890625, 10.11962890625, 10.461669921875, 10.8037109375, 11.145751953125, 11.48779296875, 11.829833984375, 12.171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 7.0, 13.0, 16.0, 19.0, 31.0, 26.0, 55.0, 69.0, 67.0, 63.0, 107.0, 89.0, 73.0, 68.0, 66.0, 59.0, 33.0, 22.0, 16.0, 18.0, 17.0, 14.0, 7.0, 6.0, 7.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007643699645996094, -0.0007371082901954651, -0.0007098466157913208, -0.0006825849413871765, -0.0006553232669830322, -0.0006280615925788879, -0.0006007999181747437, -0.0005735382437705994, -0.0005462765693664551, -0.0005190148949623108, -0.0004917532205581665, -0.0004644915461540222, -0.00043722987174987793, -0.00040996819734573364, -0.00038270652294158936, -0.00035544484853744507, -0.0003281831741333008, -0.0003009214997291565, -0.0002736598253250122, -0.0002463981509208679, -0.00021913647651672363, -0.00019187480211257935, -0.00016461312770843506, -0.00013735145330429077, -0.00011008977890014648, -8.28281044960022e-05, -5.556643009185791e-05, -2.8304755687713623e-05, -1.043081283569336e-06, 2.621859312057495e-05, 5.348026752471924e-05, 8.074194192886353e-05, 0.00010800361633300781, 0.0001352652907371521, 0.0001625269651412964, 0.00018978863954544067, 0.00021705031394958496, 0.00024431198835372925, 0.00027157366275787354, 0.0002988353371620178, 0.0003260970115661621, 0.0003533586859703064, 0.0003806203603744507, 0.00040788203477859497, 0.00043514370918273926, 0.00046240538358688354, 0.0004896670579910278, 0.0005169287323951721, 0.0005441904067993164, 0.0005714520812034607, 0.000598713755607605, 0.0006259754300117493, 0.0006532371044158936, 0.0006804987788200378, 0.0007077604532241821, 0.0007350221276283264, 0.0007622838020324707, 0.000789545476436615, 0.0008168071508407593, 0.0008440688252449036, 0.0008713304996490479, 0.0008985921740531921, 0.0009258538484573364, 0.0009531155228614807, 0.000980377197265625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 10.0, 7.0, 16.0, 24.0, 39.0, 44.0, 77.0, 126.0, 169.0, 290.0, 466.0, 805.0, 1319.0, 2457.0, 4849.0, 10333.0, 27546.0, 93489.0, 291335.0, 378064.0, 161703.0, 45774.0, 15454.0, 6571.0, 3323.0, 1689.0, 951.0, 576.0, 373.0, 203.0, 142.0, 97.0, 64.0, 44.0, 35.0, 24.0, 22.0, 10.0, 12.0, 5.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.296875, -12.808349609375, -12.31982421875, -11.831298828125, -11.3427734375, -10.854248046875, -10.36572265625, -9.877197265625, -9.388671875, -8.900146484375, -8.41162109375, -7.923095703125, -7.4345703125, -6.946044921875, -6.45751953125, -5.968994140625, -5.48046875, -4.991943359375, -4.50341796875, -4.014892578125, -3.5263671875, -3.037841796875, -2.54931640625, -2.060791015625, -1.572265625, -1.083740234375, -0.59521484375, -0.106689453125, 0.3818359375, 0.870361328125, 1.35888671875, 1.847412109375, 2.3359375, 2.824462890625, 3.31298828125, 3.801513671875, 4.2900390625, 4.778564453125, 5.26708984375, 5.755615234375, 6.244140625, 6.732666015625, 7.22119140625, 7.709716796875, 8.1982421875, 8.686767578125, 9.17529296875, 9.663818359375, 10.15234375, 10.640869140625, 11.12939453125, 11.617919921875, 12.1064453125, 12.594970703125, 13.08349609375, 13.572021484375, 14.060546875, 14.549072265625, 15.03759765625, 15.526123046875, 16.0146484375, 16.503173828125, 16.99169921875, 17.480224609375, 17.96875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 8.0, 6.0, 8.0, 12.0, 19.0, 26.0, 32.0, 41.0, 51.0, 75.0, 61.0, 66.0, 80.0, 94.0, 78.0, 66.0, 66.0, 45.0, 46.0, 35.0, 26.0, 11.0, 6.0, 11.0, 10.0, 2.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.8984375, -2.808074951171875, -2.71771240234375, -2.627349853515625, -2.5369873046875, -2.446624755859375, -2.35626220703125, -2.265899658203125, -2.175537109375, -2.085174560546875, -1.99481201171875, -1.904449462890625, -1.8140869140625, -1.723724365234375, -1.63336181640625, -1.542999267578125, -1.45263671875, -1.362274169921875, -1.27191162109375, -1.181549072265625, -1.0911865234375, -1.000823974609375, -0.91046142578125, -0.820098876953125, -0.729736328125, -0.639373779296875, -0.54901123046875, -0.458648681640625, -0.3682861328125, -0.277923583984375, -0.18756103515625, -0.097198486328125, -0.0068359375, 0.083526611328125, 0.17388916015625, 0.264251708984375, 0.3546142578125, 0.444976806640625, 0.53533935546875, 0.625701904296875, 0.716064453125, 0.806427001953125, 0.89678955078125, 0.987152099609375, 1.0775146484375, 1.167877197265625, 1.25823974609375, 1.348602294921875, 1.43896484375, 1.529327392578125, 1.61968994140625, 1.710052490234375, 1.8004150390625, 1.890777587890625, 1.98114013671875, 2.071502685546875, 2.161865234375, 2.252227783203125, 2.34259033203125, 2.432952880859375, 2.5233154296875, 2.613677978515625, 2.70404052734375, 2.794403076171875, 2.884765625]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 9.0, 12.0, 14.0, 9.0, 20.0, 26.0, 28.0, 44.0, 30.0, 59.0, 50.0, 63.0, 49.0, 61.0, 59.0, 73.0, 52.0, 40.0, 46.0, 44.0, 40.0, 38.0, 24.0, 19.0, 12.0, 15.0, 16.0, 6.0, 6.0, 5.0, 2.0, 7.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.312686920166016, -21.490901947021484, -20.66911506652832, -19.84733009338379, -19.025543212890625, -18.203758239746094, -17.381973266601562, -16.5601863861084, -15.73840045928955, -14.916614532470703, -14.094828605651855, -13.273042678833008, -12.451257705688477, -11.629470825195312, -10.807685852050781, -9.985899925231934, -9.164113998413086, -8.342328071594238, -7.520542144775391, -6.698756694793701, -5.8769707679748535, -5.055184841156006, -4.233399391174316, -3.4116134643554688, -2.589827537536621, -1.768041729927063, -0.9462559223175049, -0.12447023391723633, 0.6973156929016113, 1.519101619720459, 2.3408870697021484, 3.162672996520996, 3.9844589233398438, 4.806244850158691, 5.628030776977539, 6.4498162269592285, 7.271602153778076, 8.093387603759766, 8.915173530578613, 9.736959457397461, 10.558745384216309, 11.380531311035156, 12.202317237854004, 13.024103164672852, 13.845888137817383, 14.667675018310547, 15.489459991455078, 16.31124496459961, 17.133031845092773, 17.954816818237305, 18.77660369873047, 19.598388671875, 20.420175552368164, 21.241960525512695, 22.06374740600586, 22.88553237915039, 23.707317352294922, 24.529102325439453, 25.350889205932617, 26.17267417907715, 26.994461059570312, 27.816246032714844, 28.638031005859375, 29.45981788635254, 30.281604766845703]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 6.0, 7.0, 6.0, 6.0, 8.0, 10.0, 10.0, 17.0, 20.0, 20.0, 17.0, 37.0, 20.0, 23.0, 33.0, 38.0, 40.0, 48.0, 39.0, 50.0, 40.0, 53.0, 39.0, 51.0, 36.0, 36.0, 31.0, 29.0, 34.0, 35.0, 31.0, 22.0, 16.0, 22.0, 12.0, 17.0, 13.0, 8.0, 5.0, 6.0, 3.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-16.957361221313477, -16.446117401123047, -15.934871673583984, -15.423626899719238, -14.912382125854492, -14.401137351989746, -13.889892578125, -13.37864875793457, -12.867403030395508, -12.356158256530762, -11.844913482666016, -11.33366870880127, -10.822423934936523, -10.311179161071777, -9.799934387207031, -9.288690567016602, -8.777445793151855, -8.26620101928711, -7.754956245422363, -7.243711471557617, -6.732466697692871, -6.221221923828125, -5.709977626800537, -5.198732852935791, -4.687488079071045, -4.176243305206299, -3.6649985313415527, -3.1537539958953857, -2.6425092220306396, -2.1312644481658936, -1.6200199127197266, -1.1087751388549805, -0.5975313186645508, -0.08628660440444946, 0.42495810985565186, 0.9362027645111084, 1.4474475383758545, 1.9586923122406006, 2.4699368476867676, 2.9811816215515137, 3.4924263954162598, 4.003671169281006, 4.514915943145752, 5.02616024017334, 5.537405014038086, 6.048649787902832, 6.559894561767578, 7.071139335632324, 7.58238410949707, 8.093628883361816, 8.604873657226562, 9.116118431091309, 9.627363204956055, 10.1386079788208, 10.649852752685547, 11.161096572875977, 11.672342300415039, 12.183587074279785, 12.694831848144531, 13.206076622009277, 13.717321395874023, 14.22856616973877, 14.739810943603516, 15.251054763793945, 15.762299537658691]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 16.0, 14.0, 26.0, 33.0, 57.0, 83.0, 138.0, 260.0, 370.0, 649.0, 1196.0, 2262.0, 4414.0, 8551.0, 18965.0, 46038.0, 126947.0, 407608.0, 1227535.0, 1491336.0, 576063.0, 174162.0, 60209.0, 24070.0, 11067.0, 5476.0, 2821.0, 1582.0, 894.0, 520.0, 341.0, 208.0, 139.0, 67.0, 58.0, 40.0, 15.0, 12.0, 12.0, 8.0, 7.0, 5.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.1875, -41.80078125, -40.4140625, -39.02734375, -37.640625, -36.25390625, -34.8671875, -33.48046875, -32.09375, -30.70703125, -29.3203125, -27.93359375, -26.546875, -25.16015625, -23.7734375, -22.38671875, -21.0, -19.61328125, -18.2265625, -16.83984375, -15.453125, -14.06640625, -12.6796875, -11.29296875, -9.90625, -8.51953125, -7.1328125, -5.74609375, -4.359375, -2.97265625, -1.5859375, -0.19921875, 1.1875, 2.57421875, 3.9609375, 5.34765625, 6.734375, 8.12109375, 9.5078125, 10.89453125, 12.28125, 13.66796875, 15.0546875, 16.44140625, 17.828125, 19.21484375, 20.6015625, 21.98828125, 23.375, 24.76171875, 26.1484375, 27.53515625, 28.921875, 30.30859375, 31.6953125, 33.08203125, 34.46875, 35.85546875, 37.2421875, 38.62890625, 40.015625, 41.40234375, 42.7890625, 44.17578125, 45.5625]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 4.0, 3.0, 9.0, 7.0, 11.0, 8.0, 8.0, 14.0, 17.0, 18.0, 18.0, 27.0, 19.0, 33.0, 36.0, 27.0, 37.0, 48.0, 50.0, 44.0, 58.0, 40.0, 48.0, 38.0, 40.0, 54.0, 27.0, 39.0, 25.0, 17.0, 30.0, 32.0, 10.0, 23.0, 15.0, 16.0, 12.0, 7.0, 7.0, 4.0, 3.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.296875, -15.77392578125, -15.2509765625, -14.72802734375, -14.205078125, -13.68212890625, -13.1591796875, -12.63623046875, -12.11328125, -11.59033203125, -11.0673828125, -10.54443359375, -10.021484375, -9.49853515625, -8.9755859375, -8.45263671875, -7.9296875, -7.40673828125, -6.8837890625, -6.36083984375, -5.837890625, -5.31494140625, -4.7919921875, -4.26904296875, -3.74609375, -3.22314453125, -2.7001953125, -2.17724609375, -1.654296875, -1.13134765625, -0.6083984375, -0.08544921875, 0.4375, 0.96044921875, 1.4833984375, 2.00634765625, 2.529296875, 3.05224609375, 3.5751953125, 4.09814453125, 4.62109375, 5.14404296875, 5.6669921875, 6.18994140625, 6.712890625, 7.23583984375, 7.7587890625, 8.28173828125, 8.8046875, 9.32763671875, 9.8505859375, 10.37353515625, 10.896484375, 11.41943359375, 11.9423828125, 12.46533203125, 12.98828125, 13.51123046875, 14.0341796875, 14.55712890625, 15.080078125, 15.60302734375, 16.1259765625, 16.64892578125, 17.171875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 12.0, 13.0, 24.0, 46.0, 48.0, 99.0, 167.0, 240.0, 385.0, 648.0, 968.0, 1573.0, 2479.0, 4277.0, 7340.0, 12860.0, 23348.0, 44071.0, 86189.0, 178233.0, 380332.0, 777814.0, 1109075.0, 795358.0, 394644.0, 184388.0, 88447.0, 44999.0, 24063.0, 13267.0, 7614.0, 4431.0, 2598.0, 1552.0, 951.0, 623.0, 388.0, 247.0, 186.0, 105.0, 66.0, 37.0, 23.0, 17.0, 13.0, 8.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.15625, -38.88232421875, -37.6083984375, -36.33447265625, -35.060546875, -33.78662109375, -32.5126953125, -31.23876953125, -29.96484375, -28.69091796875, -27.4169921875, -26.14306640625, -24.869140625, -23.59521484375, -22.3212890625, -21.04736328125, -19.7734375, -18.49951171875, -17.2255859375, -15.95166015625, -14.677734375, -13.40380859375, -12.1298828125, -10.85595703125, -9.58203125, -8.30810546875, -7.0341796875, -5.76025390625, -4.486328125, -3.21240234375, -1.9384765625, -0.66455078125, 0.609375, 1.88330078125, 3.1572265625, 4.43115234375, 5.705078125, 6.97900390625, 8.2529296875, 9.52685546875, 10.80078125, 12.07470703125, 13.3486328125, 14.62255859375, 15.896484375, 17.17041015625, 18.4443359375, 19.71826171875, 20.9921875, 22.26611328125, 23.5400390625, 24.81396484375, 26.087890625, 27.36181640625, 28.6357421875, 29.90966796875, 31.18359375, 32.45751953125, 33.7314453125, 35.00537109375, 36.279296875, 37.55322265625, 38.8271484375, 40.10107421875, 41.375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 10.0, 4.0, 13.0, 14.0, 19.0, 25.0, 41.0, 42.0, 49.0, 65.0, 89.0, 101.0, 119.0, 135.0, 152.0, 193.0, 230.0, 237.0, 251.0, 257.0, 286.0, 279.0, 241.0, 233.0, 167.0, 161.0, 129.0, 116.0, 81.0, 71.0, 66.0, 40.0, 26.0, 29.0, 22.0, 22.0, 11.0, 13.0, 10.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.443603515625, -9.11376953125, -8.783935546875, -8.4541015625, -8.124267578125, -7.79443359375, -7.464599609375, -7.134765625, -6.804931640625, -6.47509765625, -6.145263671875, -5.8154296875, -5.485595703125, -5.15576171875, -4.825927734375, -4.49609375, -4.166259765625, -3.83642578125, -3.506591796875, -3.1767578125, -2.846923828125, -2.51708984375, -2.187255859375, -1.857421875, -1.527587890625, -1.19775390625, -0.867919921875, -0.5380859375, -0.208251953125, 0.12158203125, 0.451416015625, 0.78125, 1.111083984375, 1.44091796875, 1.770751953125, 2.1005859375, 2.430419921875, 2.76025390625, 3.090087890625, 3.419921875, 3.749755859375, 4.07958984375, 4.409423828125, 4.7392578125, 5.069091796875, 5.39892578125, 5.728759765625, 6.05859375, 6.388427734375, 6.71826171875, 7.048095703125, 7.3779296875, 7.707763671875, 8.03759765625, 8.367431640625, 8.697265625, 9.027099609375, 9.35693359375, 9.686767578125, 10.0166015625, 10.346435546875, 10.67626953125, 11.006103515625, 11.3359375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 3.0, 4.0, 4.0, 10.0, 13.0, 16.0, 24.0, 31.0, 21.0, 33.0, 44.0, 59.0, 78.0, 85.0, 73.0, 76.0, 79.0, 72.0, 58.0, 36.0, 46.0, 32.0, 20.0, 13.0, 18.0, 14.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.13146209716797, -44.4886589050293, -42.84585189819336, -41.20304870605469, -39.56024169921875, -37.91743850708008, -36.274635314941406, -34.63182830810547, -32.98902130126953, -31.346216201782227, -29.703411102294922, -28.06060791015625, -26.417800903320312, -24.77499771118164, -23.132192611694336, -21.48938751220703, -19.84658432006836, -18.203779220581055, -16.56097412109375, -14.918169975280762, -13.275364875793457, -11.632559776306152, -9.989755630493164, -8.34695053100586, -6.704145431518555, -5.06134033203125, -3.4185357093811035, -1.775731086730957, -0.13292598724365234, 1.5098791122436523, 3.1526832580566406, 4.795488357543945, 6.438289642333984, 8.081094741821289, 9.723899841308594, 11.366703987121582, 13.009509086608887, 14.652314186096191, 16.29511833190918, 17.937923431396484, 19.58072853088379, 21.223533630371094, 22.8663387298584, 24.509143829345703, 26.151947021484375, 27.794754028320312, 29.437557220458984, 31.08036231994629, 32.723167419433594, 34.365970611572266, 36.0087776184082, 37.651580810546875, 39.29438781738281, 40.937191009521484, 42.579994201660156, 44.222801208496094, 45.86560821533203, 47.5084114074707, 49.15121841430664, 50.79402160644531, 52.43682861328125, 54.07963180541992, 55.722434997558594, 57.36524200439453, 59.0080451965332]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 11.0, 7.0, 9.0, 10.0, 11.0, 15.0, 28.0, 29.0, 21.0, 29.0, 29.0, 37.0, 44.0, 44.0, 40.0, 50.0, 40.0, 35.0, 59.0, 41.0, 48.0, 47.0, 49.0, 37.0, 32.0, 26.0, 19.0, 26.0, 20.0, 16.0, 21.0, 6.0, 14.0, 9.0, 10.0, 10.0, 3.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.20033836364746, -23.439237594604492, -22.67813491821289, -21.917034149169922, -21.155933380126953, -20.394832611083984, -19.633731842041016, -18.872629165649414, -18.111528396606445, -17.350427627563477, -16.589324951171875, -15.828224182128906, -15.067123413085938, -14.306022644042969, -13.544920921325684, -12.783819198608398, -12.02271842956543, -11.261617660522461, -10.500515937805176, -9.73941421508789, -8.978313446044922, -8.217212677001953, -7.456110954284668, -6.695009708404541, -5.933908462524414, -5.172807216644287, -4.41170597076416, -3.650604724884033, -2.8895034790039062, -2.1284022331237793, -1.3673009872436523, -0.6061997413635254, 0.15489959716796875, 0.9160008430480957, 1.6771020889282227, 2.4382033348083496, 3.1993045806884766, 3.9604058265686035, 4.7215070724487305, 5.482608318328857, 6.243709564208984, 7.004810810089111, 7.765912055969238, 8.527013778686523, 9.288114547729492, 10.049215316772461, 10.810317039489746, 11.571418762207031, 12.33251953125, 13.093620300292969, 13.854722023010254, 14.615823745727539, 15.376924514770508, 16.138025283813477, 16.899127960205078, 17.660228729248047, 18.421329498291016, 19.182430267333984, 19.943531036376953, 20.704633712768555, 21.465734481811523, 22.226835250854492, 22.987937927246094, 23.749038696289062, 24.51013946533203]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 14.0, 6.0, 17.0, 35.0, 46.0, 73.0, 121.0, 195.0, 303.0, 482.0, 793.0, 1258.0, 2049.0, 3299.0, 5425.0, 9223.0, 15195.0, 25505.0, 43007.0, 70647.0, 111380.0, 156347.0, 177733.0, 151480.0, 105377.0, 67288.0, 40828.0, 24234.0, 14553.0, 8452.0, 5090.0, 3100.0, 1872.0, 1193.0, 708.0, 460.0, 286.0, 175.0, 117.0, 70.0, 51.0, 29.0, 14.0, 12.0, 3.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.671875, -12.303955078125, -11.93603515625, -11.568115234375, -11.2001953125, -10.832275390625, -10.46435546875, -10.096435546875, -9.728515625, -9.360595703125, -8.99267578125, -8.624755859375, -8.2568359375, -7.888916015625, -7.52099609375, -7.153076171875, -6.78515625, -6.417236328125, -6.04931640625, -5.681396484375, -5.3134765625, -4.945556640625, -4.57763671875, -4.209716796875, -3.841796875, -3.473876953125, -3.10595703125, -2.738037109375, -2.3701171875, -2.002197265625, -1.63427734375, -1.266357421875, -0.8984375, -0.530517578125, -0.16259765625, 0.205322265625, 0.5732421875, 0.941162109375, 1.30908203125, 1.677001953125, 2.044921875, 2.412841796875, 2.78076171875, 3.148681640625, 3.5166015625, 3.884521484375, 4.25244140625, 4.620361328125, 4.98828125, 5.356201171875, 5.72412109375, 6.092041015625, 6.4599609375, 6.827880859375, 7.19580078125, 7.563720703125, 7.931640625, 8.299560546875, 8.66748046875, 9.035400390625, 9.4033203125, 9.771240234375, 10.13916015625, 10.507080078125, 10.875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 13.0, 3.0, 10.0, 8.0, 8.0, 15.0, 23.0, 22.0, 29.0, 26.0, 29.0, 38.0, 39.0, 39.0, 37.0, 36.0, 57.0, 47.0, 40.0, 51.0, 48.0, 47.0, 43.0, 53.0, 30.0, 29.0, 28.0, 22.0, 26.0, 23.0, 8.0, 17.0, 18.0, 6.0, 10.0, 7.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.90625, -29.03662109375, -28.1669921875, -27.29736328125, -26.427734375, -25.55810546875, -24.6884765625, -23.81884765625, -22.94921875, -22.07958984375, -21.2099609375, -20.34033203125, -19.470703125, -18.60107421875, -17.7314453125, -16.86181640625, -15.9921875, -15.12255859375, -14.2529296875, -13.38330078125, -12.513671875, -11.64404296875, -10.7744140625, -9.90478515625, -9.03515625, -8.16552734375, -7.2958984375, -6.42626953125, -5.556640625, -4.68701171875, -3.8173828125, -2.94775390625, -2.078125, -1.20849609375, -0.3388671875, 0.53076171875, 1.400390625, 2.27001953125, 3.1396484375, 4.00927734375, 4.87890625, 5.74853515625, 6.6181640625, 7.48779296875, 8.357421875, 9.22705078125, 10.0966796875, 10.96630859375, 11.8359375, 12.70556640625, 13.5751953125, 14.44482421875, 15.314453125, 16.18408203125, 17.0537109375, 17.92333984375, 18.79296875, 19.66259765625, 20.5322265625, 21.40185546875, 22.271484375, 23.14111328125, 24.0107421875, 24.88037109375, 25.75]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 7.0, 11.0, 10.0, 27.0, 42.0, 54.0, 58.0, 107.0, 148.0, 211.0, 335.0, 472.0, 692.0, 1157.0, 1574.0, 2516.0, 4096.0, 6577.0, 10978.0, 18558.0, 31409.0, 55874.0, 95678.0, 153777.0, 201669.0, 178595.0, 116642.0, 69103.0, 39902.0, 22928.0, 13408.0, 8262.0, 4821.0, 3121.0, 1935.0, 1248.0, 846.0, 529.0, 388.0, 225.0, 165.0, 114.0, 92.0, 61.0, 37.0, 20.0, 21.0, 15.0, 5.0, 8.0, 8.0, 2.0, 2.0, 4.0, 3.0], "bins": [-13.640625, -13.23583984375, -12.8310546875, -12.42626953125, -12.021484375, -11.61669921875, -11.2119140625, -10.80712890625, -10.40234375, -9.99755859375, -9.5927734375, -9.18798828125, -8.783203125, -8.37841796875, -7.9736328125, -7.56884765625, -7.1640625, -6.75927734375, -6.3544921875, -5.94970703125, -5.544921875, -5.14013671875, -4.7353515625, -4.33056640625, -3.92578125, -3.52099609375, -3.1162109375, -2.71142578125, -2.306640625, -1.90185546875, -1.4970703125, -1.09228515625, -0.6875, -0.28271484375, 0.1220703125, 0.52685546875, 0.931640625, 1.33642578125, 1.7412109375, 2.14599609375, 2.55078125, 2.95556640625, 3.3603515625, 3.76513671875, 4.169921875, 4.57470703125, 4.9794921875, 5.38427734375, 5.7890625, 6.19384765625, 6.5986328125, 7.00341796875, 7.408203125, 7.81298828125, 8.2177734375, 8.62255859375, 9.02734375, 9.43212890625, 9.8369140625, 10.24169921875, 10.646484375, 11.05126953125, 11.4560546875, 11.86083984375, 12.265625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 0.0, 5.0, 4.0, 4.0, 9.0, 7.0, 10.0, 14.0, 5.0, 9.0, 12.0, 7.0, 11.0, 21.0, 17.0, 26.0, 31.0, 26.0, 26.0, 24.0, 37.0, 19.0, 36.0, 42.0, 29.0, 40.0, 36.0, 32.0, 48.0, 39.0, 38.0, 30.0, 30.0, 32.0, 27.0, 31.0, 25.0, 22.0, 11.0, 15.0, 29.0, 17.0, 14.0, 12.0, 6.0, 12.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.0546875, -12.6634521484375, -12.272216796875, -11.8809814453125, -11.48974609375, -11.0985107421875, -10.707275390625, -10.3160400390625, -9.9248046875, -9.5335693359375, -9.142333984375, -8.7510986328125, -8.35986328125, -7.9686279296875, -7.577392578125, -7.1861572265625, -6.794921875, -6.4036865234375, -6.012451171875, -5.6212158203125, -5.22998046875, -4.8387451171875, -4.447509765625, -4.0562744140625, -3.6650390625, -3.2738037109375, -2.882568359375, -2.4913330078125, -2.10009765625, -1.7088623046875, -1.317626953125, -0.9263916015625, -0.53515625, -0.1439208984375, 0.247314453125, 0.6385498046875, 1.02978515625, 1.4210205078125, 1.812255859375, 2.2034912109375, 2.5947265625, 2.9859619140625, 3.377197265625, 3.7684326171875, 4.15966796875, 4.5509033203125, 4.942138671875, 5.3333740234375, 5.724609375, 6.1158447265625, 6.507080078125, 6.8983154296875, 7.28955078125, 7.6807861328125, 8.072021484375, 8.4632568359375, 8.8544921875, 9.2457275390625, 9.636962890625, 10.0281982421875, 10.41943359375, 10.8106689453125, 11.201904296875, 11.5931396484375, 11.984375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 6.0, 1.0, 6.0, 9.0, 14.0, 19.0, 32.0, 36.0, 69.0, 67.0, 96.0, 192.0, 257.0, 388.0, 607.0, 961.0, 1467.0, 2269.0, 3671.0, 6106.0, 10475.0, 18559.0, 33853.0, 65014.0, 123691.0, 209028.0, 233622.0, 155084.0, 83230.0, 43791.0, 23270.0, 13000.0, 7484.0, 4512.0, 2768.0, 1763.0, 1075.0, 674.0, 471.0, 288.0, 193.0, 144.0, 92.0, 67.0, 44.0, 27.0, 21.0, 16.0, 13.0, 6.0, 1.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-6.5390625, -6.32940673828125, -6.1197509765625, -5.91009521484375, -5.700439453125, -5.49078369140625, -5.2811279296875, -5.07147216796875, -4.86181640625, -4.65216064453125, -4.4425048828125, -4.23284912109375, -4.023193359375, -3.81353759765625, -3.6038818359375, -3.39422607421875, -3.1845703125, -2.97491455078125, -2.7652587890625, -2.55560302734375, -2.345947265625, -2.13629150390625, -1.9266357421875, -1.71697998046875, -1.50732421875, -1.29766845703125, -1.0880126953125, -0.87835693359375, -0.668701171875, -0.45904541015625, -0.2493896484375, -0.03973388671875, 0.169921875, 0.37957763671875, 0.5892333984375, 0.79888916015625, 1.008544921875, 1.21820068359375, 1.4278564453125, 1.63751220703125, 1.84716796875, 2.05682373046875, 2.2664794921875, 2.47613525390625, 2.685791015625, 2.89544677734375, 3.1051025390625, 3.31475830078125, 3.5244140625, 3.73406982421875, 3.9437255859375, 4.15338134765625, 4.363037109375, 4.57269287109375, 4.7823486328125, 4.99200439453125, 5.20166015625, 5.41131591796875, 5.6209716796875, 5.83062744140625, 6.040283203125, 6.24993896484375, 6.4595947265625, 6.66925048828125, 6.87890625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 13.0, 13.0, 10.0, 18.0, 23.0, 17.0, 33.0, 41.0, 46.0, 61.0, 62.0, 64.0, 62.0, 63.0, 72.0, 76.0, 65.0, 48.0, 28.0, 42.0, 32.0, 27.0, 16.0, 15.0, 17.0, 4.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003056526184082031, -0.00029353052377700806, -0.000281408429145813, -0.0002692863345146179, -0.00025716423988342285, -0.0002450421452522278, -0.00023292005062103271, -0.00022079795598983765, -0.00020867586135864258, -0.0001965537667274475, -0.00018443167209625244, -0.00017230957746505737, -0.0001601874828338623, -0.00014806538820266724, -0.00013594329357147217, -0.0001238211989402771, -0.00011169910430908203, -9.957700967788696e-05, -8.74549150466919e-05, -7.533282041549683e-05, -6.321072578430176e-05, -5.108863115310669e-05, -3.896653652191162e-05, -2.6844441890716553e-05, -1.4722347259521484e-05, -2.600252628326416e-06, 9.521842002868652e-06, 2.164393663406372e-05, 3.376603126525879e-05, 4.588812589645386e-05, 5.8010220527648926e-05, 7.0132315158844e-05, 8.225440979003906e-05, 9.437650442123413e-05, 0.0001064985990524292, 0.00011862069368362427, 0.00013074278831481934, 0.0001428648829460144, 0.00015498697757720947, 0.00016710907220840454, 0.0001792311668395996, 0.00019135326147079468, 0.00020347535610198975, 0.00021559745073318481, 0.00022771954536437988, 0.00023984163999557495, 0.00025196373462677, 0.0002640858292579651, 0.00027620792388916016, 0.0002883300185203552, 0.0003004521131515503, 0.00031257420778274536, 0.00032469630241394043, 0.0003368183970451355, 0.00034894049167633057, 0.00036106258630752563, 0.0003731846809387207, 0.00038530677556991577, 0.00039742887020111084, 0.0004095509648323059, 0.000421673059463501, 0.00043379515409469604, 0.0004459172487258911, 0.0004580393433570862, 0.00047016143798828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 10.0, 11.0, 16.0, 25.0, 40.0, 65.0, 76.0, 140.0, 176.0, 282.0, 359.0, 519.0, 844.0, 1180.0, 1820.0, 2567.0, 3877.0, 6211.0, 9707.0, 15499.0, 24421.0, 39734.0, 64272.0, 99759.0, 144216.0, 172115.0, 155357.0, 111346.0, 72703.0, 44825.0, 27838.0, 17123.0, 10846.0, 6982.0, 4487.0, 3048.0, 1979.0, 1247.0, 878.0, 602.0, 437.0, 286.0, 174.0, 143.0, 88.0, 79.0, 43.0, 34.0, 17.0, 19.0, 11.0, 13.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0], "bins": [-6.203125, -6.00701904296875, -5.8109130859375, -5.61480712890625, -5.418701171875, -5.22259521484375, -5.0264892578125, -4.83038330078125, -4.63427734375, -4.43817138671875, -4.2420654296875, -4.04595947265625, -3.849853515625, -3.65374755859375, -3.4576416015625, -3.26153564453125, -3.0654296875, -2.86932373046875, -2.6732177734375, -2.47711181640625, -2.281005859375, -2.08489990234375, -1.8887939453125, -1.69268798828125, -1.49658203125, -1.30047607421875, -1.1043701171875, -0.90826416015625, -0.712158203125, -0.51605224609375, -0.3199462890625, -0.12384033203125, 0.072265625, 0.26837158203125, 0.4644775390625, 0.66058349609375, 0.856689453125, 1.05279541015625, 1.2489013671875, 1.44500732421875, 1.64111328125, 1.83721923828125, 2.0333251953125, 2.22943115234375, 2.425537109375, 2.62164306640625, 2.8177490234375, 3.01385498046875, 3.2099609375, 3.40606689453125, 3.6021728515625, 3.79827880859375, 3.994384765625, 4.19049072265625, 4.3865966796875, 4.58270263671875, 4.77880859375, 4.97491455078125, 5.1710205078125, 5.36712646484375, 5.563232421875, 5.75933837890625, 5.9554443359375, 6.15155029296875, 6.34765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 1.0, 7.0, 9.0, 9.0, 16.0, 12.0, 19.0, 27.0, 26.0, 30.0, 36.0, 42.0, 50.0, 56.0, 59.0, 65.0, 69.0, 55.0, 69.0, 51.0, 62.0, 55.0, 36.0, 24.0, 24.0, 23.0, 18.0, 6.0, 18.0, 6.0, 7.0, 4.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9228515625, -1.8580169677734375, -1.793182373046875, -1.7283477783203125, -1.66351318359375, -1.5986785888671875, -1.533843994140625, -1.4690093994140625, -1.4041748046875, -1.3393402099609375, -1.274505615234375, -1.2096710205078125, -1.14483642578125, -1.0800018310546875, -1.015167236328125, -0.9503326416015625, -0.885498046875, -0.8206634521484375, -0.755828857421875, -0.6909942626953125, -0.62615966796875, -0.5613250732421875, -0.496490478515625, -0.4316558837890625, -0.3668212890625, -0.3019866943359375, -0.237152099609375, -0.1723175048828125, -0.10748291015625, -0.0426483154296875, 0.022186279296875, 0.0870208740234375, 0.15185546875, 0.2166900634765625, 0.281524658203125, 0.3463592529296875, 0.41119384765625, 0.4760284423828125, 0.540863037109375, 0.6056976318359375, 0.6705322265625, 0.7353668212890625, 0.800201416015625, 0.8650360107421875, 0.92987060546875, 0.9947052001953125, 1.059539794921875, 1.1243743896484375, 1.189208984375, 1.2540435791015625, 1.318878173828125, 1.3837127685546875, 1.44854736328125, 1.5133819580078125, 1.578216552734375, 1.6430511474609375, 1.7078857421875, 1.7727203369140625, 1.837554931640625, 1.9023895263671875, 1.96722412109375, 2.0320587158203125, 2.096893310546875, 2.1617279052734375, 2.2265625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 5.0, 13.0, 18.0, 14.0, 27.0, 30.0, 22.0, 39.0, 46.0, 71.0, 72.0, 70.0, 76.0, 74.0, 88.0, 60.0, 53.0, 42.0, 38.0, 26.0, 22.0, 16.0, 18.0, 11.0, 6.0, 9.0, 5.0, 7.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.864013671875, -43.24891662597656, -41.63382339477539, -40.01872634887695, -38.40363311767578, -36.788536071777344, -35.173439025878906, -33.558345794677734, -31.94325065612793, -30.328155517578125, -28.71306037902832, -27.097965240478516, -25.482868194580078, -23.867774963378906, -22.25267791748047, -20.637582778930664, -19.02248764038086, -17.407392501831055, -15.79229736328125, -14.177201271057129, -12.562106132507324, -10.94701099395752, -9.331914901733398, -7.716819763183594, -6.101724624633789, -4.486629486083984, -2.8715338706970215, -1.2564382553100586, 0.3586568832397461, 1.9737520217895508, 3.588848114013672, 5.203943252563477, 6.819042205810547, 8.434137344360352, 10.049232482910156, 11.664328575134277, 13.279423713684082, 14.894518852233887, 16.509614944458008, 18.124710083007812, 19.739805221557617, 21.354900360107422, 22.969995498657227, 24.58509063720703, 26.20018768310547, 27.81528091430664, 29.430377960205078, 31.045473098754883, 32.66056823730469, 34.275665283203125, 35.8907585144043, 37.505855560302734, 39.120948791503906, 40.736045837402344, 42.35114288330078, 43.96623611450195, 45.581329345703125, 47.19642639160156, 48.811519622802734, 50.42661666870117, 52.041709899902344, 53.65680694580078, 55.27190399169922, 56.88699722290039, 58.50209426879883]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 10.0, 6.0, 8.0, 9.0, 13.0, 15.0, 23.0, 23.0, 22.0, 30.0, 30.0, 38.0, 32.0, 53.0, 39.0, 45.0, 46.0, 40.0, 43.0, 43.0, 53.0, 50.0, 53.0, 38.0, 31.0, 23.0, 35.0, 18.0, 22.0, 20.0, 13.0, 13.0, 12.0, 12.0, 9.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.110742568969727, -23.335065841674805, -22.559389114379883, -21.78371238708496, -21.00803565979004, -20.232358932495117, -19.456684112548828, -18.681007385253906, -17.905330657958984, -17.129653930664062, -16.35397720336914, -15.578300476074219, -14.802623748779297, -14.026947021484375, -13.25127124786377, -12.475594520568848, -11.69991683959961, -10.924240112304688, -10.148563385009766, -9.372886657714844, -8.597209930419922, -7.821533679962158, -7.0458574295043945, -6.270180702209473, -5.494503974914551, -4.718827247619629, -3.943150758743286, -3.1674742698669434, -2.3917975425720215, -1.6161208152770996, -0.8404445648193359, -0.06476783752441406, 0.7109088897705078, 1.4865854978561401, 2.2622621059417725, 3.0379385948181152, 3.813615322113037, 4.589292049407959, 5.364968299865723, 6.1406450271606445, 6.916321754455566, 7.691998481750488, 8.46767520904541, 9.243350982666016, 10.019027709960938, 10.79470443725586, 11.570381164550781, 12.346057891845703, 13.121734619140625, 13.897411346435547, 14.673088073730469, 15.44876480102539, 16.224441528320312, 17.000118255615234, 17.775794982910156, 18.551471710205078, 19.3271484375, 20.102825164794922, 20.878501892089844, 21.654178619384766, 22.429855346679688, 23.20553207397461, 23.98120880126953, 24.756885528564453, 25.532560348510742]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 9.0, 5.0, 9.0, 16.0, 29.0, 29.0, 52.0, 69.0, 95.0, 131.0, 231.0, 348.0, 478.0, 847.0, 1372.0, 2251.0, 3959.0, 7105.0, 13813.0, 25747.0, 50346.0, 96637.0, 171220.0, 228868.0, 195814.0, 118230.0, 61782.0, 31944.0, 16502.0, 8936.0, 4743.0, 2741.0, 1577.0, 941.0, 617.0, 350.0, 226.0, 163.0, 105.0, 70.0, 51.0, 37.0, 20.0, 13.0, 13.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -24.896728515625, -23.99658203125, -23.096435546875, -22.1962890625, -21.296142578125, -20.39599609375, -19.495849609375, -18.595703125, -17.695556640625, -16.79541015625, -15.895263671875, -14.9951171875, -14.094970703125, -13.19482421875, -12.294677734375, -11.39453125, -10.494384765625, -9.59423828125, -8.694091796875, -7.7939453125, -6.893798828125, -5.99365234375, -5.093505859375, -4.193359375, -3.293212890625, -2.39306640625, -1.492919921875, -0.5927734375, 0.307373046875, 1.20751953125, 2.107666015625, 3.0078125, 3.907958984375, 4.80810546875, 5.708251953125, 6.6083984375, 7.508544921875, 8.40869140625, 9.308837890625, 10.208984375, 11.109130859375, 12.00927734375, 12.909423828125, 13.8095703125, 14.709716796875, 15.60986328125, 16.510009765625, 17.41015625, 18.310302734375, 19.21044921875, 20.110595703125, 21.0107421875, 21.910888671875, 22.81103515625, 23.711181640625, 24.611328125, 25.511474609375, 26.41162109375, 27.311767578125, 28.2119140625, 29.112060546875, 30.01220703125, 30.912353515625, 31.8125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 8.0, 8.0, 3.0, 12.0, 9.0, 14.0, 17.0, 26.0, 34.0, 30.0, 33.0, 36.0, 46.0, 30.0, 48.0, 34.0, 41.0, 47.0, 53.0, 43.0, 48.0, 55.0, 48.0, 35.0, 34.0, 22.0, 24.0, 23.0, 25.0, 19.0, 11.0, 5.0, 24.0, 13.0, 7.0, 9.0, 2.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.21875, -26.36767578125, -25.5166015625, -24.66552734375, -23.814453125, -22.96337890625, -22.1123046875, -21.26123046875, -20.41015625, -19.55908203125, -18.7080078125, -17.85693359375, -17.005859375, -16.15478515625, -15.3037109375, -14.45263671875, -13.6015625, -12.75048828125, -11.8994140625, -11.04833984375, -10.197265625, -9.34619140625, -8.4951171875, -7.64404296875, -6.79296875, -5.94189453125, -5.0908203125, -4.23974609375, -3.388671875, -2.53759765625, -1.6865234375, -0.83544921875, 0.015625, 0.86669921875, 1.7177734375, 2.56884765625, 3.419921875, 4.27099609375, 5.1220703125, 5.97314453125, 6.82421875, 7.67529296875, 8.5263671875, 9.37744140625, 10.228515625, 11.07958984375, 11.9306640625, 12.78173828125, 13.6328125, 14.48388671875, 15.3349609375, 16.18603515625, 17.037109375, 17.88818359375, 18.7392578125, 19.59033203125, 20.44140625, 21.29248046875, 22.1435546875, 22.99462890625, 23.845703125, 24.69677734375, 25.5478515625, 26.39892578125, 27.25]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 6.0, 3.0, 12.0, 23.0, 25.0, 33.0, 53.0, 86.0, 124.0, 195.0, 245.0, 402.0, 655.0, 933.0, 1411.0, 2251.0, 3514.0, 5687.0, 9314.0, 15940.0, 26994.0, 46817.0, 82358.0, 137563.0, 196647.0, 194190.0, 133377.0, 79101.0, 45430.0, 25578.0, 15156.0, 9098.0, 5619.0, 3359.0, 2199.0, 1446.0, 934.0, 600.0, 376.0, 260.0, 187.0, 139.0, 73.0, 41.0, 39.0, 13.0, 16.0, 10.0, 14.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.25732421875, -30.1396484375, -29.02197265625, -27.904296875, -26.78662109375, -25.6689453125, -24.55126953125, -23.43359375, -22.31591796875, -21.1982421875, -20.08056640625, -18.962890625, -17.84521484375, -16.7275390625, -15.60986328125, -14.4921875, -13.37451171875, -12.2568359375, -11.13916015625, -10.021484375, -8.90380859375, -7.7861328125, -6.66845703125, -5.55078125, -4.43310546875, -3.3154296875, -2.19775390625, -1.080078125, 0.03759765625, 1.1552734375, 2.27294921875, 3.390625, 4.50830078125, 5.6259765625, 6.74365234375, 7.861328125, 8.97900390625, 10.0966796875, 11.21435546875, 12.33203125, 13.44970703125, 14.5673828125, 15.68505859375, 16.802734375, 17.92041015625, 19.0380859375, 20.15576171875, 21.2734375, 22.39111328125, 23.5087890625, 24.62646484375, 25.744140625, 26.86181640625, 27.9794921875, 29.09716796875, 30.21484375, 31.33251953125, 32.4501953125, 33.56787109375, 34.685546875, 35.80322265625, 36.9208984375, 38.03857421875, 39.15625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 11.0, 10.0, 16.0, 19.0, 27.0, 30.0, 31.0, 34.0, 29.0, 28.0, 33.0, 38.0, 29.0, 34.0, 43.0, 44.0, 48.0, 41.0, 37.0, 27.0, 31.0, 35.0, 34.0, 39.0, 34.0, 28.0, 22.0, 15.0, 21.0, 18.0, 14.0, 12.0, 8.0, 11.0, 8.0, 1.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.8984375, -14.4100341796875, -13.921630859375, -13.4332275390625, -12.94482421875, -12.4564208984375, -11.968017578125, -11.4796142578125, -10.9912109375, -10.5028076171875, -10.014404296875, -9.5260009765625, -9.03759765625, -8.5491943359375, -8.060791015625, -7.5723876953125, -7.083984375, -6.5955810546875, -6.107177734375, -5.6187744140625, -5.13037109375, -4.6419677734375, -4.153564453125, -3.6651611328125, -3.1767578125, -2.6883544921875, -2.199951171875, -1.7115478515625, -1.22314453125, -0.7347412109375, -0.246337890625, 0.2420654296875, 0.73046875, 1.2188720703125, 1.707275390625, 2.1956787109375, 2.68408203125, 3.1724853515625, 3.660888671875, 4.1492919921875, 4.6376953125, 5.1260986328125, 5.614501953125, 6.1029052734375, 6.59130859375, 7.0797119140625, 7.568115234375, 8.0565185546875, 8.544921875, 9.0333251953125, 9.521728515625, 10.0101318359375, 10.49853515625, 10.9869384765625, 11.475341796875, 11.9637451171875, 12.4521484375, 12.9405517578125, 13.428955078125, 13.9173583984375, 14.40576171875, 14.8941650390625, 15.382568359375, 15.8709716796875, 16.359375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 5.0, 9.0, 10.0, 16.0, 24.0, 46.0, 68.0, 97.0, 139.0, 248.0, 334.0, 616.0, 1026.0, 2013.0, 4352.0, 10522.0, 27846.0, 77723.0, 197642.0, 320983.0, 240492.0, 102394.0, 37139.0, 13823.0, 5480.0, 2446.0, 1179.0, 679.0, 412.0, 262.0, 186.0, 105.0, 72.0, 56.0, 23.0, 32.0, 20.0, 11.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.421875, -22.7255859375, -22.029296875, -21.3330078125, -20.63671875, -19.9404296875, -19.244140625, -18.5478515625, -17.8515625, -17.1552734375, -16.458984375, -15.7626953125, -15.06640625, -14.3701171875, -13.673828125, -12.9775390625, -12.28125, -11.5849609375, -10.888671875, -10.1923828125, -9.49609375, -8.7998046875, -8.103515625, -7.4072265625, -6.7109375, -6.0146484375, -5.318359375, -4.6220703125, -3.92578125, -3.2294921875, -2.533203125, -1.8369140625, -1.140625, -0.4443359375, 0.251953125, 0.9482421875, 1.64453125, 2.3408203125, 3.037109375, 3.7333984375, 4.4296875, 5.1259765625, 5.822265625, 6.5185546875, 7.21484375, 7.9111328125, 8.607421875, 9.3037109375, 10.0, 10.6962890625, 11.392578125, 12.0888671875, 12.78515625, 13.4814453125, 14.177734375, 14.8740234375, 15.5703125, 16.2666015625, 16.962890625, 17.6591796875, 18.35546875, 19.0517578125, 19.748046875, 20.4443359375, 21.140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 3.0, 5.0, 8.0, 9.0, 15.0, 21.0, 25.0, 27.0, 30.0, 41.0, 52.0, 78.0, 74.0, 96.0, 82.0, 83.0, 69.0, 66.0, 46.0, 39.0, 32.0, 20.0, 19.0, 8.0, 9.0, 7.0, 4.0, 4.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002193450927734375, -0.0021353960037231445, -0.002077341079711914, -0.0020192861557006836, -0.001961231231689453, -0.0019031763076782227, -0.0018451213836669922, -0.0017870664596557617, -0.0017290115356445312, -0.0016709566116333008, -0.0016129016876220703, -0.0015548467636108398, -0.0014967918395996094, -0.001438736915588379, -0.0013806819915771484, -0.001322627067565918, -0.0012645721435546875, -0.001206517219543457, -0.0011484622955322266, -0.001090407371520996, -0.0010323524475097656, -0.0009742975234985352, -0.0009162425994873047, -0.0008581876754760742, -0.0008001327514648438, -0.0007420778274536133, -0.0006840229034423828, -0.0006259679794311523, -0.0005679130554199219, -0.0005098581314086914, -0.00045180320739746094, -0.00039374828338623047, -0.000335693359375, -0.00027763843536376953, -0.00021958351135253906, -0.0001615285873413086, -0.00010347366333007812, -4.5418739318847656e-05, 1.2636184692382812e-05, 7.069110870361328e-05, 0.00012874603271484375, 0.00018680095672607422, 0.0002448558807373047, 0.00030291080474853516, 0.0003609657287597656, 0.0004190206527709961, 0.00047707557678222656, 0.000535130500793457, 0.0005931854248046875, 0.000651240348815918, 0.0007092952728271484, 0.0007673501968383789, 0.0008254051208496094, 0.0008834600448608398, 0.0009415149688720703, 0.0009995698928833008, 0.0010576248168945312, 0.0011156797409057617, 0.0011737346649169922, 0.0012317895889282227, 0.0012898445129394531, 0.0013478994369506836, 0.001405954360961914, 0.0014640092849731445, 0.001522064208984375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 10.0, 22.0, 32.0, 35.0, 57.0, 78.0, 137.0, 237.0, 366.0, 574.0, 870.0, 1438.0, 2468.0, 4233.0, 8086.0, 14993.0, 29194.0, 56448.0, 106427.0, 175558.0, 218944.0, 184485.0, 114148.0, 61612.0, 31657.0, 16245.0, 8589.0, 4764.0, 2668.0, 1552.0, 1013.0, 563.0, 367.0, 236.0, 141.0, 102.0, 69.0, 46.0, 33.0, 15.0, 13.0, 11.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.9453125, -12.5074462890625, -12.069580078125, -11.6317138671875, -11.19384765625, -10.7559814453125, -10.318115234375, -9.8802490234375, -9.4423828125, -9.0045166015625, -8.566650390625, -8.1287841796875, -7.69091796875, -7.2530517578125, -6.815185546875, -6.3773193359375, -5.939453125, -5.5015869140625, -5.063720703125, -4.6258544921875, -4.18798828125, -3.7501220703125, -3.312255859375, -2.8743896484375, -2.4365234375, -1.9986572265625, -1.560791015625, -1.1229248046875, -0.68505859375, -0.2471923828125, 0.190673828125, 0.6285400390625, 1.06640625, 1.5042724609375, 1.942138671875, 2.3800048828125, 2.81787109375, 3.2557373046875, 3.693603515625, 4.1314697265625, 4.5693359375, 5.0072021484375, 5.445068359375, 5.8829345703125, 6.32080078125, 6.7586669921875, 7.196533203125, 7.6343994140625, 8.072265625, 8.5101318359375, 8.947998046875, 9.3858642578125, 9.82373046875, 10.2615966796875, 10.699462890625, 11.1373291015625, 11.5751953125, 12.0130615234375, 12.450927734375, 12.8887939453125, 13.32666015625, 13.7645263671875, 14.202392578125, 14.6402587890625, 15.078125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 8.0, 17.0, 16.0, 19.0, 17.0, 22.0, 29.0, 33.0, 52.0, 43.0, 54.0, 72.0, 69.0, 61.0, 61.0, 62.0, 51.0, 34.0, 38.0, 41.0, 45.0, 28.0, 24.0, 17.0, 12.0, 20.0, 8.0, 6.0, 8.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.080078125, -2.9742431640625, -2.868408203125, -2.7625732421875, -2.65673828125, -2.5509033203125, -2.445068359375, -2.3392333984375, -2.2333984375, -2.1275634765625, -2.021728515625, -1.9158935546875, -1.81005859375, -1.7042236328125, -1.598388671875, -1.4925537109375, -1.38671875, -1.2808837890625, -1.175048828125, -1.0692138671875, -0.96337890625, -0.8575439453125, -0.751708984375, -0.6458740234375, -0.5400390625, -0.4342041015625, -0.328369140625, -0.2225341796875, -0.11669921875, -0.0108642578125, 0.094970703125, 0.2008056640625, 0.306640625, 0.4124755859375, 0.518310546875, 0.6241455078125, 0.72998046875, 0.8358154296875, 0.941650390625, 1.0474853515625, 1.1533203125, 1.2591552734375, 1.364990234375, 1.4708251953125, 1.57666015625, 1.6824951171875, 1.788330078125, 1.8941650390625, 2.0, 2.1058349609375, 2.211669921875, 2.3175048828125, 2.42333984375, 2.5291748046875, 2.635009765625, 2.7408447265625, 2.8466796875, 2.9525146484375, 3.058349609375, 3.1641845703125, 3.27001953125, 3.3758544921875, 3.481689453125, 3.5875244140625, 3.693359375]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 4.0, 5.0, 3.0, 10.0, 13.0, 11.0, 27.0, 24.0, 26.0, 37.0, 46.0, 46.0, 76.0, 60.0, 71.0, 77.0, 72.0, 72.0, 53.0, 41.0, 42.0, 42.0, 28.0, 20.0, 18.0, 19.0, 12.0, 15.0, 6.0, 6.0, 4.0, 0.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.69246292114258, -41.01814270019531, -39.34382629394531, -37.66950988769531, -35.99518966674805, -34.32086944580078, -32.64655303955078, -30.97223472595215, -29.297916412353516, -27.623598098754883, -25.94927978515625, -24.274961471557617, -22.600643157958984, -20.92632484436035, -19.25200653076172, -17.577688217163086, -15.903369903564453, -14.22905158996582, -12.554733276367188, -10.880414962768555, -9.206096649169922, -7.531778335571289, -5.857460021972656, -4.183141708374023, -2.5088233947753906, -0.8345050811767578, 0.839813232421875, 2.514131546020508, 4.188449859619141, 5.862768173217773, 7.537086486816406, 9.211404800415039, 10.885726928710938, 12.56004524230957, 14.234363555908203, 15.908681869506836, 17.58300018310547, 19.2573184967041, 20.931636810302734, 22.605955123901367, 24.2802734375, 25.954591751098633, 27.628910064697266, 29.3032283782959, 30.97754669189453, 32.65186309814453, 34.3261833190918, 36.00050354003906, 37.67481994628906, 39.34913635253906, 41.02345657348633, 42.697776794433594, 44.372093200683594, 46.046409606933594, 47.72072982788086, 49.395050048828125, 51.069366455078125, 52.743682861328125, 54.41800308227539, 56.092323303222656, 57.766639709472656, 59.440956115722656, 61.11527633666992, 62.78959655761719, 64.46391296386719]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 9.0, 1.0, 12.0, 15.0, 8.0, 18.0, 18.0, 24.0, 31.0, 32.0, 35.0, 46.0, 46.0, 49.0, 40.0, 39.0, 60.0, 43.0, 50.0, 61.0, 50.0, 43.0, 44.0, 34.0, 38.0, 29.0, 22.0, 26.0, 9.0, 14.0, 13.0, 9.0, 11.0, 4.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.47378158569336, -34.3286018371582, -33.18342208862305, -32.03824234008789, -30.893062591552734, -29.747882843017578, -28.60270118713379, -27.457521438598633, -26.312341690063477, -25.16716194152832, -24.021982192993164, -22.876802444458008, -21.73162078857422, -20.586441040039062, -19.441261291503906, -18.29608154296875, -17.150901794433594, -16.005722045898438, -14.860542297363281, -13.715361595153809, -12.570181846618652, -11.425002098083496, -10.279821395874023, -9.134641647338867, -7.989461898803711, -6.844282150268555, -5.69910192489624, -4.553921699523926, -3.4087419509887695, -2.2635622024536133, -1.1183819770812988, 0.026798248291015625, 1.1719818115234375, 2.317161798477173, 3.462341785430908, 4.607522010803223, 5.752701759338379, 6.897881507873535, 8.043062210083008, 9.188241958618164, 10.33342170715332, 11.478601455688477, 12.623781204223633, 13.768961906433105, 14.914141654968262, 16.059322357177734, 17.20450210571289, 18.349681854248047, 19.494861602783203, 20.64004135131836, 21.785221099853516, 22.930400848388672, 24.075580596923828, 25.220760345458984, 26.365942001342773, 27.51112174987793, 28.656301498413086, 29.801481246948242, 30.9466609954834, 32.09184265136719, 33.237022399902344, 34.3822021484375, 35.527381896972656, 36.67256164550781, 37.81774139404297]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 8.0, 7.0, 14.0, 12.0, 18.0, 23.0, 39.0, 51.0, 56.0, 47.0, 86.0, 111.0, 181.0, 229.0, 385.0, 588.0, 1023.0, 2112.0, 5848.0, 499078.0, 8256.0, 2775.0, 1200.0, 698.0, 420.0, 256.0, 170.0, 141.0, 94.0, 75.0, 54.0, 41.0, 37.0, 26.0, 22.0, 14.0, 12.0, 13.0, 7.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-657.5618286132812, -635.3809204101562, -613.199951171875, -591.01904296875, -568.838134765625, -546.6572265625, -524.4762573242188, -502.29534912109375, -480.1144104003906, -457.9334716796875, -435.7525634765625, -413.5716247558594, -391.39068603515625, -369.20977783203125, -347.0288391113281, -324.847900390625, -302.6669921875, -280.4860534667969, -258.3051452636719, -236.12420654296875, -213.9432830810547, -191.76235961914062, -169.5814208984375, -147.40049743652344, -125.21957397460938, -103.03865051269531, -80.85771942138672, -58.676788330078125, -36.49586486816406, -14.31494140625, 7.865997314453125, 30.046920776367188, 52.22784423828125, 74.40876770019531, 96.5896987915039, 118.7706298828125, 140.95155334472656, 163.13247680664062, 185.31341552734375, 207.4943389892578, 229.67526245117188, 251.85618591308594, 274.037109375, 296.2180480957031, 318.39898681640625, 340.57989501953125, 362.7608337402344, 384.9417724609375, 407.1226806640625, 429.3036193847656, 451.4845275878906, 473.66546630859375, 495.84637451171875, 518.02734375, 540.208251953125, 562.38916015625, 584.570068359375, 606.7509765625, 628.9319458007812, 651.1128540039062, 673.2937622070312, 695.4747314453125, 717.6556396484375, 739.8365478515625, 762.0175170898438]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 15.0, 11.0, 8.0, 23.0, 15.0, 23.0, 33.0, 37.0, 32.0, 45.0, 60.0, 36.0, 40.0, 48.0, 1080.0, 45.0, 41.0, 62.0, 52.0, 46.0, 40.0, 30.0, 40.0, 29.0, 20.0, 21.0, 12.0, 12.0, 18.0, 4.0, 12.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1096.271728515625, -1060.7425537109375, -1025.21337890625, -989.6842041015625, -954.1550903320312, -918.6259155273438, -883.0967407226562, -847.5675659179688, -812.0384521484375, -776.50927734375, -740.9801025390625, -705.450927734375, -669.9218139648438, -634.3926391601562, -598.8634643554688, -563.3342895507812, -527.8051147460938, -492.27593994140625, -456.7467956542969, -421.2176208496094, -385.6884765625, -350.1593017578125, -314.630126953125, -279.1009521484375, -243.57180786132812, -208.0426483154297, -172.51348876953125, -136.98431396484375, -101.45515441894531, -65.92599487304688, -30.396820068359375, 5.1323394775390625, 40.6614990234375, 76.19065856933594, 111.7198257446289, 147.24899291992188, 182.7781524658203, 218.30731201171875, 253.83648681640625, 289.36566162109375, 324.8948059082031, 360.4239807128906, 395.953125, 431.4822998046875, 467.011474609375, 502.5406188964844, 538.06982421875, 573.5989379882812, 609.1281127929688, 644.6572875976562, 680.1864624023438, 715.715576171875, 751.2447509765625, 786.77392578125, 822.3031005859375, 857.832275390625, 893.3614501953125, 928.890625, 964.4197998046875, 999.948974609375, 1035.4781494140625, 1071.00732421875, 1106.536376953125, 1142.0655517578125, 1177.5947265625]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 2.0, 9.0, 13.0, 7.0, 13.0, 13.0, 15.0, 32.0, 44.0, 66.0, 56.0, 66.0, 117.0, 157.0, 237.0, 458.0, 1001.0, 2305.0, 5516.0, 11046.0, 20476.0, 31079760.0, 99038.0, 27229.0, 3810.0, 1166.0, 606.0, 372.0, 223.0, 161.0, 113.0, 86.0, 57.0, 43.0, 44.0, 22.0, 29.0, 19.0, 22.0, 5.0, 10.0, 6.0, 11.0, 3.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-708.4880981445312, -685.5228271484375, -662.5575561523438, -639.59228515625, -616.6270141601562, -593.6617431640625, -570.6964721679688, -547.731201171875, -524.7659301757812, -501.8006591796875, -478.83538818359375, -455.8701171875, -432.90484619140625, -409.9395751953125, -386.97430419921875, -364.009033203125, -341.0437927246094, -318.0785217285156, -295.1132507324219, -272.1479797363281, -249.18270874023438, -226.21743774414062, -203.25218200683594, -180.2869110107422, -157.32164001464844, -134.3563690185547, -111.39109802246094, -88.42583465576172, -65.46056365966797, -42.49529266357422, -19.530029296875, 3.43524169921875, 26.4005126953125, 49.36578369140625, 72.3310546875, 95.29631805419922, 118.26158905029297, 141.22686767578125, 164.19212341308594, 187.1573944091797, 210.12266540527344, 233.0879364013672, 256.0531921386719, 279.0184631347656, 301.9837341308594, 324.9490051269531, 347.9142761230469, 370.8795471191406, 393.8448181152344, 416.8100891113281, 439.7753601074219, 462.7406311035156, 485.7059020996094, 508.6711730957031, 531.6364135742188, 554.6016845703125, 577.5669555664062, 600.5322265625, 623.4974975585938, 646.4627685546875, 669.4280395507812, 692.393310546875, 715.3585815429688, 738.3238525390625, 761.2891235351562]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 12.0, 18.0, 40.0, 47.0, 59.0, 98.0, 158.0, 210.0, 329.0, 515.0, 860.0, 1310.0, 2168.0, 3581.0, 6264.0, 10968.0, 20173.0, 38774.0, 79661.0, 174501.0, 430603.0, 1210587.0, 2462732.0, 1124170.0, 404186.0, 164573.0, 74661.0, 36170.0, 19091.0, 10264.0, 5843.0, 3394.0, 2002.0, 1246.0, 737.0, 508.0, 337.0, 186.0, 123.0, 91.0, 55.0, 39.0, 27.0, 17.0, 14.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-62.625, -60.75341796875, -58.8818359375, -57.01025390625, -55.138671875, -53.26708984375, -51.3955078125, -49.52392578125, -47.65234375, -45.78076171875, -43.9091796875, -42.03759765625, -40.166015625, -38.29443359375, -36.4228515625, -34.55126953125, -32.6796875, -30.80810546875, -28.9365234375, -27.06494140625, -25.193359375, -23.32177734375, -21.4501953125, -19.57861328125, -17.70703125, -15.83544921875, -13.9638671875, -12.09228515625, -10.220703125, -8.34912109375, -6.4775390625, -4.60595703125, -2.734375, -0.86279296875, 1.0087890625, 2.88037109375, 4.751953125, 6.62353515625, 8.4951171875, 10.36669921875, 12.23828125, 14.10986328125, 15.9814453125, 17.85302734375, 19.724609375, 21.59619140625, 23.4677734375, 25.33935546875, 27.2109375, 29.08251953125, 30.9541015625, 32.82568359375, 34.697265625, 36.56884765625, 38.4404296875, 40.31201171875, 42.18359375, 44.05517578125, 45.9267578125, 47.79833984375, 49.669921875, 51.54150390625, 53.4130859375, 55.28466796875, 57.15625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 10.0, 4.0, 11.0, 15.0, 15.0, 20.0, 17.0, 32.0, 34.0, 33.0, 56.0, 49.0, 63.0, 63.0, 87.0, 121.0, 125.0, 147.0, 134.0, 141.0, 109.0, 108.0, 82.0, 93.0, 61.0, 66.0, 67.0, 47.0, 27.0, 28.0, 19.0, 22.0, 30.0, 14.0, 11.0, 12.0, 11.0, 5.0, 9.0, 5.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.265625, -17.69189453125, -17.1181640625, -16.54443359375, -15.970703125, -15.39697265625, -14.8232421875, -14.24951171875, -13.67578125, -13.10205078125, -12.5283203125, -11.95458984375, -11.380859375, -10.80712890625, -10.2333984375, -9.65966796875, -9.0859375, -8.51220703125, -7.9384765625, -7.36474609375, -6.791015625, -6.21728515625, -5.6435546875, -5.06982421875, -4.49609375, -3.92236328125, -3.3486328125, -2.77490234375, -2.201171875, -1.62744140625, -1.0537109375, -0.47998046875, 0.09375, 0.66748046875, 1.2412109375, 1.81494140625, 2.388671875, 2.96240234375, 3.5361328125, 4.10986328125, 4.68359375, 5.25732421875, 5.8310546875, 6.40478515625, 6.978515625, 7.55224609375, 8.1259765625, 8.69970703125, 9.2734375, 9.84716796875, 10.4208984375, 10.99462890625, 11.568359375, 12.14208984375, 12.7158203125, 13.28955078125, 13.86328125, 14.43701171875, 15.0107421875, 15.58447265625, 16.158203125, 16.73193359375, 17.3056640625, 17.87939453125, 18.453125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 18.0, 28.0, 39.0, 43.0, 86.0, 126.0, 210.0, 325.0, 533.0, 785.0, 1276.0, 2041.0, 3355.0, 5410.0, 8656.0, 14526.0, 24435.0, 41532.0, 69397.0, 116905.0, 193796.0, 326586.0, 589135.0, 1200580.0, 1632651.0, 922947.0, 467526.0, 266899.0, 160622.0, 96176.0, 57655.0, 34537.0, 20410.0, 12493.0, 7486.0, 4571.0, 2812.0, 1695.0, 1109.0, 699.0, 477.0, 307.0, 171.0, 131.0, 72.0, 54.0, 33.0, 29.0, 17.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.265625, -19.61865234375, -18.9716796875, -18.32470703125, -17.677734375, -17.03076171875, -16.3837890625, -15.73681640625, -15.08984375, -14.44287109375, -13.7958984375, -13.14892578125, -12.501953125, -11.85498046875, -11.2080078125, -10.56103515625, -9.9140625, -9.26708984375, -8.6201171875, -7.97314453125, -7.326171875, -6.67919921875, -6.0322265625, -5.38525390625, -4.73828125, -4.09130859375, -3.4443359375, -2.79736328125, -2.150390625, -1.50341796875, -0.8564453125, -0.20947265625, 0.4375, 1.08447265625, 1.7314453125, 2.37841796875, 3.025390625, 3.67236328125, 4.3193359375, 4.96630859375, 5.61328125, 6.26025390625, 6.9072265625, 7.55419921875, 8.201171875, 8.84814453125, 9.4951171875, 10.14208984375, 10.7890625, 11.43603515625, 12.0830078125, 12.72998046875, 13.376953125, 14.02392578125, 14.6708984375, 15.31787109375, 15.96484375, 16.61181640625, 17.2587890625, 17.90576171875, 18.552734375, 19.19970703125, 19.8466796875, 20.49365234375, 21.140625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 5.0, 10.0, 11.0, 12.0, 9.0, 19.0, 19.0, 38.0, 24.0, 37.0, 56.0, 71.0, 66.0, 103.0, 142.0, 149.0, 195.0, 173.0, 164.0, 131.0, 100.0, 101.0, 76.0, 55.0, 61.0, 34.0, 34.0, 24.0, 23.0, 16.0, 15.0, 16.0, 4.0, 10.0, 5.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.33740234375, -20.5185546875, -19.69970703125, -18.880859375, -18.06201171875, -17.2431640625, -16.42431640625, -15.60546875, -14.78662109375, -13.9677734375, -13.14892578125, -12.330078125, -11.51123046875, -10.6923828125, -9.87353515625, -9.0546875, -8.23583984375, -7.4169921875, -6.59814453125, -5.779296875, -4.96044921875, -4.1416015625, -3.32275390625, -2.50390625, -1.68505859375, -0.8662109375, -0.04736328125, 0.771484375, 1.59033203125, 2.4091796875, 3.22802734375, 4.046875, 4.86572265625, 5.6845703125, 6.50341796875, 7.322265625, 8.14111328125, 8.9599609375, 9.77880859375, 10.59765625, 11.41650390625, 12.2353515625, 13.05419921875, 13.873046875, 14.69189453125, 15.5107421875, 16.32958984375, 17.1484375, 17.96728515625, 18.7861328125, 19.60498046875, 20.423828125, 21.24267578125, 22.0615234375, 22.88037109375, 23.69921875, 24.51806640625, 25.3369140625, 26.15576171875, 26.974609375, 27.79345703125, 28.6123046875, 29.43115234375, 30.25]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 5.0, 14.0, 10.0, 18.0, 45.0, 55.0, 96.0, 143.0, 235.0, 319.0, 445.0, 693.0, 1071.0, 1596.0, 2353.0, 3725.0, 5685.0, 9229.0, 14846.0, 24145.0, 41164.0, 79397.0, 235142.0, 5508615.0, 192854.0, 71799.0, 37762.0, 22115.0, 13343.0, 8472.0, 5426.0, 3527.0, 2301.0, 1611.0, 928.0, 689.0, 497.0, 344.0, 234.0, 168.0, 107.0, 72.0, 57.0, 32.0, 22.0, 10.0, 11.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.47705078125, -45.6103515625, -43.74365234375, -41.876953125, -40.01025390625, -38.1435546875, -36.27685546875, -34.41015625, -32.54345703125, -30.6767578125, -28.81005859375, -26.943359375, -25.07666015625, -23.2099609375, -21.34326171875, -19.4765625, -17.60986328125, -15.7431640625, -13.87646484375, -12.009765625, -10.14306640625, -8.2763671875, -6.40966796875, -4.54296875, -2.67626953125, -0.8095703125, 1.05712890625, 2.923828125, 4.79052734375, 6.6572265625, 8.52392578125, 10.390625, 12.25732421875, 14.1240234375, 15.99072265625, 17.857421875, 19.72412109375, 21.5908203125, 23.45751953125, 25.32421875, 27.19091796875, 29.0576171875, 30.92431640625, 32.791015625, 34.65771484375, 36.5244140625, 38.39111328125, 40.2578125, 42.12451171875, 43.9912109375, 45.85791015625, 47.724609375, 49.59130859375, 51.4580078125, 53.32470703125, 55.19140625, 57.05810546875, 58.9248046875, 60.79150390625, 62.658203125, 64.52490234375, 66.3916015625, 68.25830078125, 70.125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 9.0, 8.0, 17.0, 17.0, 17.0, 20.0, 18.0, 21.0, 24.0, 30.0, 32.0, 44.0, 46.0, 63.0, 94.0, 153.0, 201.0, 221.0, 213.0, 158.0, 137.0, 89.0, 54.0, 64.0, 43.0, 31.0, 28.0, 20.0, 28.0, 23.0, 15.0, 14.0, 9.0, 5.0, 8.0, 7.0, 4.0, 3.0, 6.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.46630859375, -33.4013671875, -32.33642578125, -31.271484375, -30.20654296875, -29.1416015625, -28.07666015625, -27.01171875, -25.94677734375, -24.8818359375, -23.81689453125, -22.751953125, -21.68701171875, -20.6220703125, -19.55712890625, -18.4921875, -17.42724609375, -16.3623046875, -15.29736328125, -14.232421875, -13.16748046875, -12.1025390625, -11.03759765625, -9.97265625, -8.90771484375, -7.8427734375, -6.77783203125, -5.712890625, -4.64794921875, -3.5830078125, -2.51806640625, -1.453125, -0.38818359375, 0.6767578125, 1.74169921875, 2.806640625, 3.87158203125, 4.9365234375, 6.00146484375, 7.06640625, 8.13134765625, 9.1962890625, 10.26123046875, 11.326171875, 12.39111328125, 13.4560546875, 14.52099609375, 15.5859375, 16.65087890625, 17.7158203125, 18.78076171875, 19.845703125, 20.91064453125, 21.9755859375, 23.04052734375, 24.10546875, 25.17041015625, 26.2353515625, 27.30029296875, 28.365234375, 29.43017578125, 30.4951171875, 31.56005859375, 32.625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 9.0, 14.0, 20.0, 47.0, 95.0, 490.0, 189.0, 60.0, 27.0, 21.0, 7.0, 9.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4114.9453125, -3985.138427734375, -3855.33154296875, -3725.5244140625, -3595.717529296875, -3465.91064453125, -3336.103515625, -3206.296630859375, -3076.48974609375, -2946.682861328125, -2816.8759765625, -2687.06884765625, -2557.261962890625, -2427.455078125, -2297.64794921875, -2167.841064453125, -2038.0341796875, -1908.227294921875, -1778.4202880859375, -1648.61328125, -1518.806396484375, -1388.99951171875, -1259.1925048828125, -1129.385498046875, -999.57861328125, -869.7716674804688, -739.9647216796875, -610.1577758789062, -480.350830078125, -350.54388427734375, -220.7369384765625, -90.92999267578125, 38.87646484375, 168.68341064453125, 298.4903564453125, 428.29730224609375, 558.104248046875, 687.9111938476562, 817.7181396484375, 947.5250854492188, 1077.33203125, 1207.138916015625, 1336.9459228515625, 1466.7529296875, 1596.559814453125, 1726.36669921875, 1856.1737060546875, 1985.980712890625, 2115.78759765625, 2245.594482421875, 2375.4013671875, 2505.20849609375, 2635.015380859375, 2764.822265625, 2894.62939453125, 3024.436279296875, 3154.2431640625, 3284.050048828125, 3413.85693359375, 3543.6640625, 3673.470947265625, 3803.27783203125, 3933.0849609375, 4062.891845703125, 4192.69873046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 7.0, 7.0, 10.0, 6.0, 5.0, 11.0, 5.0, 10.0, 8.0, 11.0, 13.0, 21.0, 16.0, 20.0, 43.0, 58.0, 102.0, 279.0, 114.0, 48.0, 30.0, 27.0, 22.0, 16.0, 21.0, 12.0, 7.0, 8.0, 14.0, 9.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-948.9963989257812, -918.8461303710938, -888.6958618164062, -858.5455322265625, -828.395263671875, -798.2449951171875, -768.0947265625, -737.9444580078125, -707.794189453125, -677.6439208984375, -647.49365234375, -617.3433837890625, -587.1930541992188, -557.0427856445312, -526.8925170898438, -496.74224853515625, -466.5919189453125, -436.441650390625, -406.2913513183594, -376.1410827636719, -345.99078369140625, -315.84051513671875, -285.69024658203125, -255.5399627685547, -225.38967895507812, -195.23939514160156, -165.089111328125, -134.9388427734375, -104.78855895996094, -74.63827514648438, -44.488006591796875, -14.337722778320312, 15.8126220703125, 45.9629020690918, 76.1131820678711, 106.26345825195312, 136.4137420654297, 166.56402587890625, 196.71429443359375, 226.8645782470703, 257.0148620605469, 287.1651306152344, 317.3154296875, 347.4656982421875, 377.615966796875, 407.7662658691406, 437.9165344238281, 468.06683349609375, 498.21710205078125, 528.3673706054688, 558.5176391601562, 588.66796875, 618.8182373046875, 648.968505859375, 679.1187744140625, 709.26904296875, 739.4193115234375, 769.569580078125, 799.7198486328125, 829.8701171875, 860.0204467773438, 890.1707153320312, 920.3209838867188, 950.4712524414062, 980.62158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 11.0, 14.0, 18.0, 21.0, 24.0, 44.0, 81.0, 116.0, 142.0, 195.0, 328.0, 477.0, 777.0, 1177.0, 2027.0, 3293.0, 5508.0, 10284.0, 20106.0, 44471.0, 137221.0, 2326453.0, 1425456.0, 128088.0, 43830.0, 19737.0, 10094.0, 5495.0, 3254.0, 1990.0, 1211.0, 781.0, 561.0, 323.0, 213.0, 155.0, 84.0, 56.0, 53.0, 35.0, 20.0, 17.0, 12.0, 6.0, 8.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.171875, -10.7861328125, -10.400390625, -10.0146484375, -9.62890625, -9.2431640625, -8.857421875, -8.4716796875, -8.0859375, -7.7001953125, -7.314453125, -6.9287109375, -6.54296875, -6.1572265625, -5.771484375, -5.3857421875, -5.0, -4.6142578125, -4.228515625, -3.8427734375, -3.45703125, -3.0712890625, -2.685546875, -2.2998046875, -1.9140625, -1.5283203125, -1.142578125, -0.7568359375, -0.37109375, 0.0146484375, 0.400390625, 0.7861328125, 1.171875, 1.5576171875, 1.943359375, 2.3291015625, 2.71484375, 3.1005859375, 3.486328125, 3.8720703125, 4.2578125, 4.6435546875, 5.029296875, 5.4150390625, 5.80078125, 6.1865234375, 6.572265625, 6.9580078125, 7.34375, 7.7294921875, 8.115234375, 8.5009765625, 8.88671875, 9.2724609375, 9.658203125, 10.0439453125, 10.4296875, 10.8154296875, 11.201171875, 11.5869140625, 11.97265625, 12.3583984375, 12.744140625, 13.1298828125, 13.515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 8.0, 10.0, 10.0, 10.0, 23.0, 25.0, 69.0, 93.0, 167.0, 179.0, 143.0, 94.0, 42.0, 29.0, 15.0, 11.0, 13.0, 10.0, 8.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.173828125, -1.1352081298828125, -1.096588134765625, -1.0579681396484375, -1.01934814453125, -0.9807281494140625, -0.942108154296875, -0.9034881591796875, -0.8648681640625, -0.8262481689453125, -0.787628173828125, -0.7490081787109375, -0.71038818359375, -0.6717681884765625, -0.633148193359375, -0.5945281982421875, -0.555908203125, -0.5172882080078125, -0.478668212890625, -0.4400482177734375, -0.40142822265625, -0.3628082275390625, -0.324188232421875, -0.2855682373046875, -0.2469482421875, -0.2083282470703125, -0.169708251953125, -0.1310882568359375, -0.09246826171875, -0.0538482666015625, -0.015228271484375, 0.0233917236328125, 0.06201171875, 0.1006317138671875, 0.139251708984375, 0.1778717041015625, 0.21649169921875, 0.2551116943359375, 0.293731689453125, 0.3323516845703125, 0.3709716796875, 0.4095916748046875, 0.448211669921875, 0.4868316650390625, 0.52545166015625, 0.5640716552734375, 0.602691650390625, 0.6413116455078125, 0.679931640625, 0.7185516357421875, 0.757171630859375, 0.7957916259765625, 0.83441162109375, 0.8730316162109375, 0.911651611328125, 0.9502716064453125, 0.9888916015625, 1.0275115966796875, 1.066131591796875, 1.1047515869140625, 1.14337158203125, 1.1819915771484375, 1.220611572265625, 1.2592315673828125, 1.2978515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 23.0, 31.0, 41.0, 84.0, 70.0, 160.0, 253.0, 436.0, 764.0, 1411.0, 2812.0, 5616.0, 12034.0, 28885.0, 78273.0, 243477.0, 950784.0, 2099949.0, 530714.0, 151094.0, 50820.0, 19911.0, 8365.0, 3900.0, 1850.0, 1002.0, 606.0, 307.0, 188.0, 125.0, 76.0, 63.0, 40.0, 34.0, 11.0, 16.0, 14.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -11.9654541015625, -11.594970703125, -11.2244873046875, -10.85400390625, -10.4835205078125, -10.113037109375, -9.7425537109375, -9.3720703125, -9.0015869140625, -8.631103515625, -8.2606201171875, -7.89013671875, -7.5196533203125, -7.149169921875, -6.7786865234375, -6.408203125, -6.0377197265625, -5.667236328125, -5.2967529296875, -4.92626953125, -4.5557861328125, -4.185302734375, -3.8148193359375, -3.4443359375, -3.0738525390625, -2.703369140625, -2.3328857421875, -1.96240234375, -1.5919189453125, -1.221435546875, -0.8509521484375, -0.48046875, -0.1099853515625, 0.260498046875, 0.6309814453125, 1.00146484375, 1.3719482421875, 1.742431640625, 2.1129150390625, 2.4833984375, 2.8538818359375, 3.224365234375, 3.5948486328125, 3.96533203125, 4.3358154296875, 4.706298828125, 5.0767822265625, 5.447265625, 5.8177490234375, 6.188232421875, 6.5587158203125, 6.92919921875, 7.2996826171875, 7.670166015625, 8.0406494140625, 8.4111328125, 8.7816162109375, 9.152099609375, 9.5225830078125, 9.89306640625, 10.2635498046875, 10.634033203125, 11.0045166015625, 11.375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 8.0, 9.0, 10.0, 11.0, 11.0, 23.0, 20.0, 31.0, 27.0, 40.0, 29.0, 53.0, 57.0, 92.0, 100.0, 107.0, 114.0, 165.0, 181.0, 258.0, 266.0, 340.0, 399.0, 276.0, 258.0, 209.0, 169.0, 131.0, 125.0, 90.0, 73.0, 77.0, 51.0, 53.0, 42.0, 25.0, 24.0, 31.0, 14.0, 16.0, 8.0, 6.0, 5.0, 9.0, 6.0, 3.0, 3.0, 4.0, 6.0, 0.0, 2.0], "bins": [-2.751953125, -2.673614501953125, -2.59527587890625, -2.516937255859375, -2.4385986328125, -2.360260009765625, -2.28192138671875, -2.203582763671875, -2.125244140625, -2.046905517578125, -1.96856689453125, -1.890228271484375, -1.8118896484375, -1.733551025390625, -1.65521240234375, -1.576873779296875, -1.49853515625, -1.420196533203125, -1.34185791015625, -1.263519287109375, -1.1851806640625, -1.106842041015625, -1.02850341796875, -0.950164794921875, -0.871826171875, -0.793487548828125, -0.71514892578125, -0.636810302734375, -0.5584716796875, -0.480133056640625, -0.40179443359375, -0.323455810546875, -0.2451171875, -0.166778564453125, -0.08843994140625, -0.010101318359375, 0.0682373046875, 0.146575927734375, 0.22491455078125, 0.303253173828125, 0.381591796875, 0.459930419921875, 0.53826904296875, 0.616607666015625, 0.6949462890625, 0.773284912109375, 0.85162353515625, 0.929962158203125, 1.00830078125, 1.086639404296875, 1.16497802734375, 1.243316650390625, 1.3216552734375, 1.399993896484375, 1.47833251953125, 1.556671142578125, 1.635009765625, 1.713348388671875, 1.79168701171875, 1.870025634765625, 1.9483642578125, 2.026702880859375, 2.10504150390625, 2.183380126953125, 2.26171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 13.0, 26.0, 59.0, 80.0, 116.0, 188.0, 193.0, 161.0, 79.0, 36.0, 17.0, 16.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-88.87611389160156, -86.59979248046875, -84.32347106933594, -82.04714965820312, -79.77082824707031, -77.4945068359375, -75.21818542480469, -72.9418716430664, -70.6655502319336, -68.38922882080078, -66.11290740966797, -63.836585998535156, -61.56026840209961, -59.2839469909668, -57.007625579833984, -54.73130416870117, -52.45498275756836, -50.17866134643555, -47.902339935302734, -45.62602233886719, -43.349700927734375, -41.07337951660156, -38.79705810546875, -36.52073669433594, -34.244415283203125, -31.968093872070312, -29.691774368286133, -27.41545295715332, -25.13913345336914, -22.862812042236328, -20.586490631103516, -18.310169219970703, -16.033851623535156, -13.75753116607666, -11.481210708618164, -9.204889297485352, -6.9285688400268555, -4.652248382568359, -2.375926971435547, -0.09960651397705078, 2.1767139434814453, 4.453034400939941, 6.729355335235596, 9.00567626953125, 11.281996726989746, 13.558317184448242, 15.834638595581055, 18.110958099365234, 20.387279510498047, 22.66360092163086, 24.93992042541504, 27.21624183654785, 29.49256134033203, 31.768882751464844, 34.045204162597656, 36.32152557373047, 38.59784698486328, 40.874168395996094, 43.150489807128906, 45.42681121826172, 47.703128814697266, 49.97945022583008, 52.25577163696289, 54.5320930480957, 56.80841064453125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 5.0, 7.0, 13.0, 10.0, 31.0, 21.0, 38.0, 44.0, 48.0, 42.0, 50.0, 61.0, 50.0, 47.0, 52.0, 48.0, 72.0, 47.0, 54.0, 35.0, 40.0, 28.0, 25.0, 28.0, 26.0, 16.0, 20.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-29.659461975097656, -28.878816604614258, -28.098173141479492, -27.317527770996094, -26.536882400512695, -25.756237030029297, -24.97559356689453, -24.194948196411133, -23.414302825927734, -22.633657455444336, -21.85301399230957, -21.072368621826172, -20.291723251342773, -19.511077880859375, -18.73043441772461, -17.94978904724121, -17.169145584106445, -16.388500213623047, -15.607855796813965, -14.827211380004883, -14.046566009521484, -13.265921592712402, -12.48527717590332, -11.704631805419922, -10.92398738861084, -10.143342971801758, -9.36269760131836, -8.582053184509277, -7.801408290863037, -7.020763397216797, -6.240118980407715, -5.459474086761475, -4.678831100463867, -3.898186206817627, -3.117541551589966, -2.3368968963623047, -1.5562520027160645, -0.7756071090698242, 0.0050373077392578125, 0.785682201385498, 1.5663270950317383, 2.3469719886779785, 3.1276166439056396, 3.908261299133301, 4.688906192779541, 5.469551086425781, 6.250195503234863, 7.0308403968811035, 7.811485290527344, 8.592129707336426, 9.372775077819824, 10.153419494628906, 10.934064865112305, 11.714709281921387, 12.495353698730469, 13.275999069213867, 14.05664348602295, 14.837287902832031, 15.61793327331543, 16.398578643798828, 17.179222106933594, 17.959867477416992, 18.74051284790039, 19.521156311035156, 20.301801681518555]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 9.0, 10.0, 24.0, 31.0, 49.0, 80.0, 92.0, 164.0, 254.0, 382.0, 682.0, 1149.0, 1864.0, 3700.0, 7424.0, 17842.0, 52885.0, 227400.0, 536797.0, 135087.0, 36270.0, 13213.0, 5961.0, 3064.0, 1580.0, 940.0, 540.0, 346.0, 229.0, 146.0, 104.0, 63.0, 47.0, 27.0, 20.0, 17.0, 17.0, 9.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.1640625, -7.92633056640625, -7.6885986328125, -7.45086669921875, -7.213134765625, -6.97540283203125, -6.7376708984375, -6.49993896484375, -6.26220703125, -6.02447509765625, -5.7867431640625, -5.54901123046875, -5.311279296875, -5.07354736328125, -4.8358154296875, -4.59808349609375, -4.3603515625, -4.12261962890625, -3.8848876953125, -3.64715576171875, -3.409423828125, -3.17169189453125, -2.9339599609375, -2.69622802734375, -2.45849609375, -2.22076416015625, -1.9830322265625, -1.74530029296875, -1.507568359375, -1.26983642578125, -1.0321044921875, -0.79437255859375, -0.556640625, -0.31890869140625, -0.0811767578125, 0.15655517578125, 0.394287109375, 0.63201904296875, 0.8697509765625, 1.10748291015625, 1.34521484375, 1.58294677734375, 1.8206787109375, 2.05841064453125, 2.296142578125, 2.53387451171875, 2.7716064453125, 3.00933837890625, 3.2470703125, 3.48480224609375, 3.7225341796875, 3.96026611328125, 4.197998046875, 4.43572998046875, 4.6734619140625, 4.91119384765625, 5.14892578125, 5.38665771484375, 5.6243896484375, 5.86212158203125, 6.099853515625, 6.33758544921875, 6.5753173828125, 6.81304931640625, 7.05078125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 13.0, 17.0, 23.0, 33.0, 74.0, 85.0, 90.0, 105.0, 87.0, 127.0, 90.0, 59.0, 52.0, 37.0, 24.0, 16.0, 11.0, 8.0, 3.0, 5.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1623382568359375, -1.112762451171875, -1.0631866455078125, -1.01361083984375, -0.9640350341796875, -0.914459228515625, -0.8648834228515625, -0.8153076171875, -0.7657318115234375, -0.716156005859375, -0.6665802001953125, -0.61700439453125, -0.5674285888671875, -0.517852783203125, -0.4682769775390625, -0.418701171875, -0.3691253662109375, -0.319549560546875, -0.2699737548828125, -0.22039794921875, -0.1708221435546875, -0.121246337890625, -0.0716705322265625, -0.0220947265625, 0.0274810791015625, 0.077056884765625, 0.1266326904296875, 0.17620849609375, 0.2257843017578125, 0.275360107421875, 0.3249359130859375, 0.37451171875, 0.4240875244140625, 0.473663330078125, 0.5232391357421875, 0.57281494140625, 0.6223907470703125, 0.671966552734375, 0.7215423583984375, 0.7711181640625, 0.8206939697265625, 0.870269775390625, 0.9198455810546875, 0.96942138671875, 1.0189971923828125, 1.068572998046875, 1.1181488037109375, 1.167724609375, 1.2173004150390625, 1.266876220703125, 1.3164520263671875, 1.36602783203125, 1.4156036376953125, 1.465179443359375, 1.5147552490234375, 1.5643310546875, 1.6139068603515625, 1.663482666015625, 1.7130584716796875, 1.76263427734375, 1.8122100830078125, 1.861785888671875, 1.9113616943359375, 1.9609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 5.0, 9.0, 12.0, 9.0, 14.0, 23.0, 25.0, 46.0, 58.0, 76.0, 115.0, 200.0, 275.0, 389.0, 634.0, 986.0, 1646.0, 2846.0, 5288.0, 9717.0, 19221.0, 40968.0, 99352.0, 262071.0, 350337.0, 143967.0, 56635.0, 25654.0, 12350.0, 6491.0, 3677.0, 2041.0, 1241.0, 724.0, 503.0, 316.0, 180.0, 119.0, 115.0, 67.0, 35.0, 40.0, 20.0, 19.0, 13.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.046875, -4.88507080078125, -4.7232666015625, -4.56146240234375, -4.399658203125, -4.23785400390625, -4.0760498046875, -3.91424560546875, -3.75244140625, -3.59063720703125, -3.4288330078125, -3.26702880859375, -3.105224609375, -2.94342041015625, -2.7816162109375, -2.61981201171875, -2.4580078125, -2.29620361328125, -2.1343994140625, -1.97259521484375, -1.810791015625, -1.64898681640625, -1.4871826171875, -1.32537841796875, -1.16357421875, -1.00177001953125, -0.8399658203125, -0.67816162109375, -0.516357421875, -0.35455322265625, -0.1927490234375, -0.03094482421875, 0.130859375, 0.29266357421875, 0.4544677734375, 0.61627197265625, 0.778076171875, 0.93988037109375, 1.1016845703125, 1.26348876953125, 1.42529296875, 1.58709716796875, 1.7489013671875, 1.91070556640625, 2.072509765625, 2.23431396484375, 2.3961181640625, 2.55792236328125, 2.7197265625, 2.88153076171875, 3.0433349609375, 3.20513916015625, 3.366943359375, 3.52874755859375, 3.6905517578125, 3.85235595703125, 4.01416015625, 4.17596435546875, 4.3377685546875, 4.49957275390625, 4.661376953125, 4.82318115234375, 4.9849853515625, 5.14678955078125, 5.30859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 5.0, 2.0, 7.0, 5.0, 7.0, 8.0, 10.0, 15.0, 14.0, 22.0, 23.0, 20.0, 21.0, 21.0, 24.0, 42.0, 37.0, 27.0, 28.0, 36.0, 31.0, 41.0, 37.0, 42.0, 38.0, 37.0, 39.0, 32.0, 34.0, 24.0, 25.0, 22.0, 28.0, 27.0, 25.0, 25.0, 15.0, 14.0, 13.0, 12.0, 10.0, 9.0, 9.0, 9.0, 13.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.6953125, -4.5338134765625, -4.372314453125, -4.2108154296875, -4.04931640625, -3.8878173828125, -3.726318359375, -3.5648193359375, -3.4033203125, -3.2418212890625, -3.080322265625, -2.9188232421875, -2.75732421875, -2.5958251953125, -2.434326171875, -2.2728271484375, -2.111328125, -1.9498291015625, -1.788330078125, -1.6268310546875, -1.46533203125, -1.3038330078125, -1.142333984375, -0.9808349609375, -0.8193359375, -0.6578369140625, -0.496337890625, -0.3348388671875, -0.17333984375, -0.0118408203125, 0.149658203125, 0.3111572265625, 0.47265625, 0.6341552734375, 0.795654296875, 0.9571533203125, 1.11865234375, 1.2801513671875, 1.441650390625, 1.6031494140625, 1.7646484375, 1.9261474609375, 2.087646484375, 2.2491455078125, 2.41064453125, 2.5721435546875, 2.733642578125, 2.8951416015625, 3.056640625, 3.2181396484375, 3.379638671875, 3.5411376953125, 3.70263671875, 3.8641357421875, 4.025634765625, 4.1871337890625, 4.3486328125, 4.5101318359375, 4.671630859375, 4.8331298828125, 4.99462890625, 5.1561279296875, 5.317626953125, 5.4791259765625, 5.640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 3.0, 13.0, 27.0, 25.0, 50.0, 58.0, 109.0, 176.0, 278.0, 522.0, 1069.0, 2262.0, 5683.0, 17705.0, 83540.0, 614545.0, 267782.0, 37446.0, 10191.0, 3656.0, 1570.0, 775.0, 422.0, 223.0, 162.0, 99.0, 38.0, 31.0, 26.0, 16.0, 19.0, 7.0, 10.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1953125, -12.8157958984375, -12.436279296875, -12.0567626953125, -11.67724609375, -11.2977294921875, -10.918212890625, -10.5386962890625, -10.1591796875, -9.7796630859375, -9.400146484375, -9.0206298828125, -8.64111328125, -8.2615966796875, -7.882080078125, -7.5025634765625, -7.123046875, -6.7435302734375, -6.364013671875, -5.9844970703125, -5.60498046875, -5.2254638671875, -4.845947265625, -4.4664306640625, -4.0869140625, -3.7073974609375, -3.327880859375, -2.9483642578125, -2.56884765625, -2.1893310546875, -1.809814453125, -1.4302978515625, -1.05078125, -0.6712646484375, -0.291748046875, 0.0877685546875, 0.46728515625, 0.8468017578125, 1.226318359375, 1.6058349609375, 1.9853515625, 2.3648681640625, 2.744384765625, 3.1239013671875, 3.50341796875, 3.8829345703125, 4.262451171875, 4.6419677734375, 5.021484375, 5.4010009765625, 5.780517578125, 6.1600341796875, 6.53955078125, 6.9190673828125, 7.298583984375, 7.6781005859375, 8.0576171875, 8.4371337890625, 8.816650390625, 9.1961669921875, 9.57568359375, 9.9552001953125, 10.334716796875, 10.7142333984375, 11.09375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 8.0, 8.0, 10.0, 12.0, 18.0, 31.0, 54.0, 61.0, 74.0, 100.0, 93.0, 129.0, 93.0, 67.0, 60.0, 63.0, 39.0, 18.0, 17.0, 11.0, 7.0, 6.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044727325439453125, -0.0004345551133155823, -0.0004218369722366333, -0.0004091188311576843, -0.00039640069007873535, -0.0003836825489997864, -0.0003709644079208374, -0.00035824626684188843, -0.00034552812576293945, -0.0003328099846839905, -0.0003200918436050415, -0.00030737370252609253, -0.00029465556144714355, -0.0002819374203681946, -0.0002692192792892456, -0.00025650113821029663, -0.00024378299713134766, -0.00023106485605239868, -0.0002183467149734497, -0.00020562857389450073, -0.00019291043281555176, -0.00018019229173660278, -0.0001674741506576538, -0.00015475600957870483, -0.00014203786849975586, -0.00012931972742080688, -0.00011660158634185791, -0.00010388344526290894, -9.116530418395996e-05, -7.844716310501099e-05, -6.572902202606201e-05, -5.301088094711304e-05, -4.029273986816406e-05, -2.7574598789215088e-05, -1.4856457710266113e-05, -2.1383166313171387e-06, 1.0579824447631836e-05, 2.329796552658081e-05, 3.6016106605529785e-05, 4.873424768447876e-05, 6.145238876342773e-05, 7.417052984237671e-05, 8.688867092132568e-05, 9.960681200027466e-05, 0.00011232495307922363, 0.0001250430941581726, 0.00013776123523712158, 0.00015047937631607056, 0.00016319751739501953, 0.0001759156584739685, 0.00018863379955291748, 0.00020135194063186646, 0.00021407008171081543, 0.0002267882227897644, 0.00023950636386871338, 0.00025222450494766235, 0.00026494264602661133, 0.0002776607871055603, 0.0002903789281845093, 0.00030309706926345825, 0.0003158152103424072, 0.0003285333514213562, 0.0003412514925003052, 0.00035396963357925415, 0.0003666877746582031]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 6.0, 13.0, 17.0, 25.0, 36.0, 60.0, 65.0, 132.0, 216.0, 393.0, 762.0, 1630.0, 3767.0, 9880.0, 32453.0, 159182.0, 610948.0, 176374.0, 34871.0, 10371.0, 3940.0, 1626.0, 773.0, 383.0, 241.0, 145.0, 107.0, 54.0, 27.0, 18.0, 12.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.3203125, -10.982666015625, -10.64501953125, -10.307373046875, -9.9697265625, -9.632080078125, -9.29443359375, -8.956787109375, -8.619140625, -8.281494140625, -7.94384765625, -7.606201171875, -7.2685546875, -6.930908203125, -6.59326171875, -6.255615234375, -5.91796875, -5.580322265625, -5.24267578125, -4.905029296875, -4.5673828125, -4.229736328125, -3.89208984375, -3.554443359375, -3.216796875, -2.879150390625, -2.54150390625, -2.203857421875, -1.8662109375, -1.528564453125, -1.19091796875, -0.853271484375, -0.515625, -0.177978515625, 0.15966796875, 0.497314453125, 0.8349609375, 1.172607421875, 1.51025390625, 1.847900390625, 2.185546875, 2.523193359375, 2.86083984375, 3.198486328125, 3.5361328125, 3.873779296875, 4.21142578125, 4.549072265625, 4.88671875, 5.224365234375, 5.56201171875, 5.899658203125, 6.2373046875, 6.574951171875, 6.91259765625, 7.250244140625, 7.587890625, 7.925537109375, 8.26318359375, 8.600830078125, 8.9384765625, 9.276123046875, 9.61376953125, 9.951416015625, 10.2890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 10.0, 13.0, 13.0, 19.0, 18.0, 37.0, 35.0, 43.0, 40.0, 53.0, 78.0, 81.0, 70.0, 82.0, 74.0, 60.0, 54.0, 38.0, 40.0, 24.0, 20.0, 15.0, 13.0, 19.0, 12.0, 9.0, 9.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0546875, -4.86639404296875, -4.6781005859375, -4.48980712890625, -4.301513671875, -4.11322021484375, -3.9249267578125, -3.73663330078125, -3.54833984375, -3.36004638671875, -3.1717529296875, -2.98345947265625, -2.795166015625, -2.60687255859375, -2.4185791015625, -2.23028564453125, -2.0419921875, -1.85369873046875, -1.6654052734375, -1.47711181640625, -1.288818359375, -1.10052490234375, -0.9122314453125, -0.72393798828125, -0.53564453125, -0.34735107421875, -0.1590576171875, 0.02923583984375, 0.217529296875, 0.40582275390625, 0.5941162109375, 0.78240966796875, 0.970703125, 1.15899658203125, 1.3472900390625, 1.53558349609375, 1.723876953125, 1.91217041015625, 2.1004638671875, 2.28875732421875, 2.47705078125, 2.66534423828125, 2.8536376953125, 3.04193115234375, 3.230224609375, 3.41851806640625, 3.6068115234375, 3.79510498046875, 3.9833984375, 4.17169189453125, 4.3599853515625, 4.54827880859375, 4.736572265625, 4.92486572265625, 5.1131591796875, 5.30145263671875, 5.48974609375, 5.67803955078125, 5.8663330078125, 6.05462646484375, 6.242919921875, 6.43121337890625, 6.6195068359375, 6.80780029296875, 6.99609375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 12.0, 32.0, 59.0, 194.0, 312.0, 218.0, 80.0, 31.0, 15.0, 13.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.64065551757812, -134.39913940429688, -130.15762329101562, -125.9161148071289, -121.67460632324219, -117.43309020996094, -113.19157409667969, -108.95005798339844, -104.70854949951172, -100.46703338623047, -96.22552490234375, -91.9840087890625, -87.74249267578125, -83.50098419189453, -79.25946807861328, -75.01795959472656, -70.77644348144531, -66.53492736816406, -62.293418884277344, -58.051902770996094, -53.81039047241211, -49.568878173828125, -45.327362060546875, -41.08584976196289, -36.844337463378906, -32.60282516479492, -28.361310958862305, -24.119796752929688, -19.878284454345703, -15.636772155761719, -11.395257949829102, -7.153743743896484, -2.9122314453125, 1.3292818069458008, 5.570795059204102, 9.812308311462402, 14.053821563720703, 18.295333862304688, 22.536848068237305, 26.778362274169922, 31.019874572753906, 35.26138687133789, 39.502899169921875, 43.744415283203125, 47.98592758178711, 52.227439880371094, 56.468955993652344, 60.71046829223633, 64.95198059082031, 69.19349670410156, 73.43500518798828, 77.67652130126953, 81.91802978515625, 86.1595458984375, 90.40106201171875, 94.642578125, 98.88408660888672, 103.12560272216797, 107.36711120605469, 111.60862731933594, 115.85014343261719, 120.0916519165039, 124.33316802978516, 128.57467651367188, 132.81619262695312]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 5.0, 17.0, 12.0, 24.0, 37.0, 78.0, 131.0, 188.0, 154.0, 126.0, 79.0, 46.0, 33.0, 10.0, 12.0, 8.0, 5.0, 4.0, 2.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.78155517578125, -139.55946350097656, -135.33738708496094, -131.11529541015625, -126.89320373535156, -122.6711196899414, -118.44903564453125, -114.22694396972656, -110.0048599243164, -105.78277587890625, -101.56068420410156, -97.3386001586914, -93.11651611328125, -88.89442443847656, -84.6723403930664, -80.45025634765625, -76.22816467285156, -72.0060806274414, -67.78398895263672, -63.56190490722656, -59.33981704711914, -55.11772918701172, -50.89564514160156, -46.67355728149414, -42.45146942138672, -38.2293815612793, -34.007293701171875, -29.78520965576172, -25.563121795654297, -21.341033935546875, -17.118947982788086, -12.896862030029297, -8.674789428710938, -4.452702522277832, -0.23061561584472656, 3.991471290588379, 8.213558197021484, 12.435646057128906, 16.657732009887695, 20.879817962646484, 25.101905822753906, 29.323993682861328, 33.54608154296875, 37.768165588378906, 41.99025344848633, 46.21234130859375, 50.434425354003906, 54.65651321411133, 58.87860107421875, 63.10068893432617, 67.3227767944336, 71.54486083984375, 75.76695251464844, 79.9890365600586, 84.21112060546875, 88.43321228027344, 92.6552963256836, 96.87738037109375, 101.09947204589844, 105.3215560913086, 109.54364013671875, 113.76573181152344, 117.9878158569336, 122.20989990234375, 126.43199157714844]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 7.0, 14.0, 15.0, 39.0, 46.0, 82.0, 108.0, 176.0, 302.0, 462.0, 861.0, 1494.0, 3088.0, 6604.0, 16966.0, 59366.0, 564421.0, 3381351.0, 114517.0, 26177.0, 9377.0, 4099.0, 2041.0, 1094.0, 583.0, 343.0, 223.0, 135.0, 97.0, 51.0, 37.0, 26.0, 19.0, 11.0, 19.0, 4.0, 1.0, 3.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.421875, -20.634033203125, -19.84619140625, -19.058349609375, -18.2705078125, -17.482666015625, -16.69482421875, -15.906982421875, -15.119140625, -14.331298828125, -13.54345703125, -12.755615234375, -11.9677734375, -11.179931640625, -10.39208984375, -9.604248046875, -8.81640625, -8.028564453125, -7.24072265625, -6.452880859375, -5.6650390625, -4.877197265625, -4.08935546875, -3.301513671875, -2.513671875, -1.725830078125, -0.93798828125, -0.150146484375, 0.6376953125, 1.425537109375, 2.21337890625, 3.001220703125, 3.7890625, 4.576904296875, 5.36474609375, 6.152587890625, 6.9404296875, 7.728271484375, 8.51611328125, 9.303955078125, 10.091796875, 10.879638671875, 11.66748046875, 12.455322265625, 13.2431640625, 14.031005859375, 14.81884765625, 15.606689453125, 16.39453125, 17.182373046875, 17.97021484375, 18.758056640625, 19.5458984375, 20.333740234375, 21.12158203125, 21.909423828125, 22.697265625, 23.485107421875, 24.27294921875, 25.060791015625, 25.8486328125, 26.636474609375, 27.42431640625, 28.212158203125, 29.0]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 21.0, 16.0, 25.0, 38.0, 50.0, 76.0, 86.0, 113.0, 100.0, 91.0, 107.0, 73.0, 45.0, 31.0, 35.0, 17.0, 10.0, 19.0, 6.0, 4.0, 3.0, 9.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.3835296630859375, -1.331512451171875, -1.2794952392578125, -1.22747802734375, -1.1754608154296875, -1.123443603515625, -1.0714263916015625, -1.0194091796875, -0.9673919677734375, -0.915374755859375, -0.8633575439453125, -0.81134033203125, -0.7593231201171875, -0.707305908203125, -0.6552886962890625, -0.603271484375, -0.5512542724609375, -0.499237060546875, -0.4472198486328125, -0.39520263671875, -0.3431854248046875, -0.291168212890625, -0.2391510009765625, -0.1871337890625, -0.1351165771484375, -0.083099365234375, -0.0310821533203125, 0.02093505859375, 0.0729522705078125, 0.124969482421875, 0.1769866943359375, 0.22900390625, 0.2810211181640625, 0.333038330078125, 0.3850555419921875, 0.43707275390625, 0.4890899658203125, 0.541107177734375, 0.5931243896484375, 0.6451416015625, 0.6971588134765625, 0.749176025390625, 0.8011932373046875, 0.85321044921875, 0.9052276611328125, 0.957244873046875, 1.0092620849609375, 1.061279296875, 1.1132965087890625, 1.165313720703125, 1.2173309326171875, 1.26934814453125, 1.3213653564453125, 1.373382568359375, 1.4253997802734375, 1.4774169921875, 1.5294342041015625, 1.581451416015625, 1.6334686279296875, 1.68548583984375, 1.7375030517578125, 1.789520263671875, 1.8415374755859375, 1.8935546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 11.0, 14.0, 16.0, 22.0, 45.0, 59.0, 71.0, 124.0, 209.0, 321.0, 509.0, 811.0, 1438.0, 2533.0, 4581.0, 8796.0, 18435.0, 41620.0, 109276.0, 388045.0, 2684178.0, 675498.0, 155870.0, 54884.0, 22998.0, 10996.0, 5551.0, 3070.0, 1721.0, 1009.0, 583.0, 345.0, 215.0, 144.0, 104.0, 57.0, 39.0, 25.0, 16.0, 12.0, 5.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4765625, -14.9718017578125, -14.467041015625, -13.9622802734375, -13.45751953125, -12.9527587890625, -12.447998046875, -11.9432373046875, -11.4384765625, -10.9337158203125, -10.428955078125, -9.9241943359375, -9.41943359375, -8.9146728515625, -8.409912109375, -7.9051513671875, -7.400390625, -6.8956298828125, -6.390869140625, -5.8861083984375, -5.38134765625, -4.8765869140625, -4.371826171875, -3.8670654296875, -3.3623046875, -2.8575439453125, -2.352783203125, -1.8480224609375, -1.34326171875, -0.8385009765625, -0.333740234375, 0.1710205078125, 0.67578125, 1.1805419921875, 1.685302734375, 2.1900634765625, 2.69482421875, 3.1995849609375, 3.704345703125, 4.2091064453125, 4.7138671875, 5.2186279296875, 5.723388671875, 6.2281494140625, 6.73291015625, 7.2376708984375, 7.742431640625, 8.2471923828125, 8.751953125, 9.2567138671875, 9.761474609375, 10.2662353515625, 10.77099609375, 11.2757568359375, 11.780517578125, 12.2852783203125, 12.7900390625, 13.2947998046875, 13.799560546875, 14.3043212890625, 14.80908203125, 15.3138427734375, 15.818603515625, 16.3233642578125, 16.828125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 5.0, 11.0, 10.0, 13.0, 22.0, 27.0, 27.0, 32.0, 39.0, 62.0, 90.0, 113.0, 175.0, 254.0, 460.0, 1185.0, 570.0, 309.0, 213.0, 119.0, 92.0, 67.0, 41.0, 43.0, 22.0, 14.0, 11.0, 11.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55078125, -2.4552001953125, -2.359619140625, -2.2640380859375, -2.16845703125, -2.0728759765625, -1.977294921875, -1.8817138671875, -1.7861328125, -1.6905517578125, -1.594970703125, -1.4993896484375, -1.40380859375, -1.3082275390625, -1.212646484375, -1.1170654296875, -1.021484375, -0.9259033203125, -0.830322265625, -0.7347412109375, -0.63916015625, -0.5435791015625, -0.447998046875, -0.3524169921875, -0.2568359375, -0.1612548828125, -0.065673828125, 0.0299072265625, 0.12548828125, 0.2210693359375, 0.316650390625, 0.4122314453125, 0.5078125, 0.6033935546875, 0.698974609375, 0.7945556640625, 0.89013671875, 0.9857177734375, 1.081298828125, 1.1768798828125, 1.2724609375, 1.3680419921875, 1.463623046875, 1.5592041015625, 1.65478515625, 1.7503662109375, 1.845947265625, 1.9415283203125, 2.037109375, 2.1326904296875, 2.228271484375, 2.3238525390625, 2.41943359375, 2.5150146484375, 2.610595703125, 2.7061767578125, 2.8017578125, 2.8973388671875, 2.992919921875, 3.0885009765625, 3.18408203125, 3.2796630859375, 3.375244140625, 3.4708251953125, 3.56640625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 12.0, 19.0, 42.0, 68.0, 138.0, 191.0, 215.0, 152.0, 79.0, 41.0, 22.0, 8.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.28657531738281, -61.82771682739258, -60.36885452270508, -58.909996032714844, -57.451133728027344, -55.99227523803711, -54.533416748046875, -53.074554443359375, -51.61569595336914, -50.156837463378906, -48.697975158691406, -47.23911666870117, -45.78025436401367, -44.32139587402344, -42.86253356933594, -41.4036750793457, -39.94481658935547, -38.485958099365234, -37.027095794677734, -35.5682373046875, -34.109375, -32.650516510009766, -31.1916561126709, -29.73279571533203, -28.27393341064453, -26.815073013305664, -25.356212615966797, -23.897354125976562, -22.438493728637695, -20.979633331298828, -19.52077293395996, -18.061912536621094, -16.60305404663086, -15.144193649291992, -13.685334205627441, -12.226473808288574, -10.767614364624023, -9.308753967285156, -7.849893569946289, -6.391034126281738, -4.932173728942871, -3.473313808441162, -2.014453649520874, -0.5555934906005859, 0.903266429901123, 2.362126350402832, 3.820986747741699, 5.27984619140625, 6.738706588745117, 8.197566986083984, 9.656426429748535, 11.115286827087402, 12.574146270751953, 14.03300666809082, 15.491867065429688, 16.950725555419922, 18.409587860107422, 19.86844825744629, 21.327308654785156, 22.78616714477539, 24.245027542114258, 25.703887939453125, 27.162748336791992, 28.62160873413086, 30.080467224121094]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 2.0, 4.0, 10.0, 8.0, 13.0, 24.0, 22.0, 25.0, 33.0, 47.0, 52.0, 52.0, 44.0, 70.0, 64.0, 81.0, 54.0, 59.0, 65.0, 46.0, 47.0, 41.0, 44.0, 27.0, 14.0, 17.0, 10.0, 12.0, 3.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.258581161499023, -25.616727828979492, -24.974876403808594, -24.333023071289062, -23.69116973876953, -23.04931640625, -22.4074649810791, -21.76561164855957, -21.123760223388672, -20.48190689086914, -19.840055465698242, -19.19820213317871, -18.55634880065918, -17.91449737548828, -17.27264404296875, -16.63079071044922, -15.988937377929688, -15.347084999084473, -14.705231666564941, -14.063379287719727, -13.421525955200195, -12.77967357635498, -12.137821197509766, -11.495967864990234, -10.85411548614502, -10.212263107299805, -9.570409774780273, -8.928557395935059, -8.286705017089844, -7.6448516845703125, -7.002999305725098, -6.361146450042725, -5.719295501708984, -5.077442646026611, -4.435589790344238, -3.7937374114990234, -3.1518845558166504, -2.5100317001342773, -1.8681790828704834, -1.2263264656066895, -0.5844736099243164, 0.05737912654876709, 0.6992318630218506, 1.341084599494934, 1.9829373359680176, 2.6247901916503906, 3.2666428089141846, 3.9084954261779785, 4.550348281860352, 5.192201137542725, 5.834053993225098, 6.4759063720703125, 7.1177592277526855, 7.759612083435059, 8.401464462280273, 9.043317794799805, 9.68517017364502, 10.327022552490234, 10.968875885009766, 11.61072826385498, 12.252580642700195, 12.894433975219727, 13.536286354064941, 14.178138732910156, 14.819992065429688]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 6.0, 8.0, 5.0, 13.0, 21.0, 28.0, 39.0, 73.0, 299.0, 1467.0, 16729.0, 833914.0, 188932.0, 5804.0, 805.0, 186.0, 75.0, 47.0, 25.0, 20.0, 11.0, 9.0, 5.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.125, -45.3671875, -43.609375, -41.8515625, -40.09375, -38.3359375, -36.578125, -34.8203125, -33.0625, -31.3046875, -29.546875, -27.7890625, -26.03125, -24.2734375, -22.515625, -20.7578125, -19.0, -17.2421875, -15.484375, -13.7265625, -11.96875, -10.2109375, -8.453125, -6.6953125, -4.9375, -3.1796875, -1.421875, 0.3359375, 2.09375, 3.8515625, 5.609375, 7.3671875, 9.125, 10.8828125, 12.640625, 14.3984375, 16.15625, 17.9140625, 19.671875, 21.4296875, 23.1875, 24.9453125, 26.703125, 28.4609375, 30.21875, 31.9765625, 33.734375, 35.4921875, 37.25, 39.0078125, 40.765625, 42.5234375, 44.28125, 46.0390625, 47.796875, 49.5546875, 51.3125, 53.0703125, 54.828125, 56.5859375, 58.34375, 60.1015625, 61.859375, 63.6171875, 65.375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 10.0, 22.0, 31.0, 55.0, 75.0, 121.0, 153.0, 147.0, 129.0, 99.0, 64.0, 47.0, 21.0, 11.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.66796875, -4.576690673828125, -4.48541259765625, -4.394134521484375, -4.3028564453125, -4.211578369140625, -4.12030029296875, -4.029022216796875, -3.937744140625, -3.846466064453125, -3.75518798828125, -3.663909912109375, -3.5726318359375, -3.481353759765625, -3.39007568359375, -3.298797607421875, -3.20751953125, -3.116241455078125, -3.02496337890625, -2.933685302734375, -2.8424072265625, -2.751129150390625, -2.65985107421875, -2.568572998046875, -2.477294921875, -2.386016845703125, -2.29473876953125, -2.203460693359375, -2.1121826171875, -2.020904541015625, -1.92962646484375, -1.838348388671875, -1.7470703125, -1.655792236328125, -1.56451416015625, -1.473236083984375, -1.3819580078125, -1.290679931640625, -1.19940185546875, -1.108123779296875, -1.016845703125, -0.925567626953125, -0.83428955078125, -0.743011474609375, -0.6517333984375, -0.560455322265625, -0.46917724609375, -0.377899169921875, -0.28662109375, -0.195343017578125, -0.10406494140625, -0.012786865234375, 0.0784912109375, 0.169769287109375, 0.26104736328125, 0.352325439453125, 0.443603515625, 0.534881591796875, 0.62615966796875, 0.717437744140625, 0.8087158203125, 0.899993896484375, 0.99127197265625, 1.082550048828125, 1.173828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 16.0, 14.0, 26.0, 44.0, 59.0, 103.0, 158.0, 297.0, 560.0, 1083.0, 2075.0, 4706.0, 11608.0, 32771.0, 109503.0, 389548.0, 350134.0, 96682.0, 29717.0, 10757.0, 4466.0, 2019.0, 976.0, 523.0, 304.0, 152.0, 74.0, 59.0, 41.0, 18.0, 14.0, 8.0, 7.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.765625, -11.3973388671875, -11.029052734375, -10.6607666015625, -10.29248046875, -9.9241943359375, -9.555908203125, -9.1876220703125, -8.8193359375, -8.4510498046875, -8.082763671875, -7.7144775390625, -7.34619140625, -6.9779052734375, -6.609619140625, -6.2413330078125, -5.873046875, -5.5047607421875, -5.136474609375, -4.7681884765625, -4.39990234375, -4.0316162109375, -3.663330078125, -3.2950439453125, -2.9267578125, -2.5584716796875, -2.190185546875, -1.8218994140625, -1.45361328125, -1.0853271484375, -0.717041015625, -0.3487548828125, 0.01953125, 0.3878173828125, 0.756103515625, 1.1243896484375, 1.49267578125, 1.8609619140625, 2.229248046875, 2.5975341796875, 2.9658203125, 3.3341064453125, 3.702392578125, 4.0706787109375, 4.43896484375, 4.8072509765625, 5.175537109375, 5.5438232421875, 5.912109375, 6.2803955078125, 6.648681640625, 7.0169677734375, 7.38525390625, 7.7535400390625, 8.121826171875, 8.4901123046875, 8.8583984375, 9.2266845703125, 9.594970703125, 9.9632568359375, 10.33154296875, 10.6998291015625, 11.068115234375, 11.4364013671875, 11.8046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 5.0, 8.0, 11.0, 12.0, 13.0, 14.0, 16.0, 19.0, 24.0, 20.0, 25.0, 29.0, 38.0, 36.0, 36.0, 41.0, 50.0, 37.0, 52.0, 43.0, 47.0, 38.0, 45.0, 34.0, 36.0, 28.0, 29.0, 32.0, 26.0, 25.0, 20.0, 18.0, 23.0, 11.0, 10.0, 11.0, 5.0, 12.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.30230712890625, -5.1358642578125, -4.96942138671875, -4.802978515625, -4.63653564453125, -4.4700927734375, -4.30364990234375, -4.13720703125, -3.97076416015625, -3.8043212890625, -3.63787841796875, -3.471435546875, -3.30499267578125, -3.1385498046875, -2.97210693359375, -2.8056640625, -2.63922119140625, -2.4727783203125, -2.30633544921875, -2.139892578125, -1.97344970703125, -1.8070068359375, -1.64056396484375, -1.47412109375, -1.30767822265625, -1.1412353515625, -0.97479248046875, -0.808349609375, -0.64190673828125, -0.4754638671875, -0.30902099609375, -0.142578125, 0.02386474609375, 0.1903076171875, 0.35675048828125, 0.523193359375, 0.68963623046875, 0.8560791015625, 1.02252197265625, 1.18896484375, 1.35540771484375, 1.5218505859375, 1.68829345703125, 1.854736328125, 2.02117919921875, 2.1876220703125, 2.35406494140625, 2.5205078125, 2.68695068359375, 2.8533935546875, 3.01983642578125, 3.186279296875, 3.35272216796875, 3.5191650390625, 3.68560791015625, 3.85205078125, 4.01849365234375, 4.1849365234375, 4.35137939453125, 4.517822265625, 4.68426513671875, 4.8507080078125, 5.01715087890625, 5.18359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 15.0, 24.0, 51.0, 130.0, 393.0, 1281.0, 4884.0, 28871.0, 278891.0, 633766.0, 85636.0, 11174.0, 2410.0, 654.0, 225.0, 81.0, 30.0, 21.0, 10.0, 8.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -15.909912109375, -15.19482421875, -14.479736328125, -13.7646484375, -13.049560546875, -12.33447265625, -11.619384765625, -10.904296875, -10.189208984375, -9.47412109375, -8.759033203125, -8.0439453125, -7.328857421875, -6.61376953125, -5.898681640625, -5.18359375, -4.468505859375, -3.75341796875, -3.038330078125, -2.3232421875, -1.608154296875, -0.89306640625, -0.177978515625, 0.537109375, 1.252197265625, 1.96728515625, 2.682373046875, 3.3974609375, 4.112548828125, 4.82763671875, 5.542724609375, 6.2578125, 6.972900390625, 7.68798828125, 8.403076171875, 9.1181640625, 9.833251953125, 10.54833984375, 11.263427734375, 11.978515625, 12.693603515625, 13.40869140625, 14.123779296875, 14.8388671875, 15.553955078125, 16.26904296875, 16.984130859375, 17.69921875, 18.414306640625, 19.12939453125, 19.844482421875, 20.5595703125, 21.274658203125, 21.98974609375, 22.704833984375, 23.419921875, 24.135009765625, 24.85009765625, 25.565185546875, 26.2802734375, 26.995361328125, 27.71044921875, 28.425537109375, 29.140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 8.0, 10.0, 11.0, 30.0, 64.0, 108.0, 212.0, 227.0, 143.0, 65.0, 30.0, 31.0, 16.0, 14.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001377105712890625, -0.001331329345703125, -0.001285552978515625, -0.001239776611328125, -0.001194000244140625, -0.001148223876953125, -0.001102447509765625, -0.001056671142578125, -0.001010894775390625, -0.000965118408203125, -0.000919342041015625, -0.000873565673828125, -0.000827789306640625, -0.000782012939453125, -0.000736236572265625, -0.000690460205078125, -0.000644683837890625, -0.000598907470703125, -0.000553131103515625, -0.000507354736328125, -0.000461578369140625, -0.000415802001953125, -0.000370025634765625, -0.000324249267578125, -0.000278472900390625, -0.000232696533203125, -0.000186920166015625, -0.000141143798828125, -9.5367431640625e-05, -4.9591064453125e-05, -3.814697265625e-06, 4.1961669921875e-05, 8.7738037109375e-05, 0.000133514404296875, 0.000179290771484375, 0.000225067138671875, 0.000270843505859375, 0.000316619873046875, 0.000362396240234375, 0.000408172607421875, 0.000453948974609375, 0.000499725341796875, 0.000545501708984375, 0.000591278076171875, 0.000637054443359375, 0.000682830810546875, 0.000728607177734375, 0.000774383544921875, 0.000820159912109375, 0.000865936279296875, 0.000911712646484375, 0.000957489013671875, 0.001003265380859375, 0.001049041748046875, 0.001094818115234375, 0.001140594482421875, 0.001186370849609375, 0.001232147216796875, 0.001277923583984375, 0.001323699951171875, 0.001369476318359375, 0.001415252685546875, 0.001461029052734375, 0.001506805419921875, 0.001552581787109375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 9.0, 18.0, 20.0, 48.0, 66.0, 96.0, 181.0, 308.0, 518.0, 937.0, 1780.0, 3207.0, 6472.0, 14050.0, 32179.0, 76121.0, 175795.0, 296560.0, 238996.0, 113636.0, 47679.0, 20488.0, 9390.0, 4633.0, 2386.0, 1270.0, 697.0, 413.0, 230.0, 136.0, 82.0, 46.0, 42.0, 19.0, 10.0, 12.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5390625, -9.2720947265625, -9.005126953125, -8.7381591796875, -8.47119140625, -8.2042236328125, -7.937255859375, -7.6702880859375, -7.4033203125, -7.1363525390625, -6.869384765625, -6.6024169921875, -6.33544921875, -6.0684814453125, -5.801513671875, -5.5345458984375, -5.267578125, -5.0006103515625, -4.733642578125, -4.4666748046875, -4.19970703125, -3.9327392578125, -3.665771484375, -3.3988037109375, -3.1318359375, -2.8648681640625, -2.597900390625, -2.3309326171875, -2.06396484375, -1.7969970703125, -1.530029296875, -1.2630615234375, -0.99609375, -0.7291259765625, -0.462158203125, -0.1951904296875, 0.07177734375, 0.3387451171875, 0.605712890625, 0.8726806640625, 1.1396484375, 1.4066162109375, 1.673583984375, 1.9405517578125, 2.20751953125, 2.4744873046875, 2.741455078125, 3.0084228515625, 3.275390625, 3.5423583984375, 3.809326171875, 4.0762939453125, 4.34326171875, 4.6102294921875, 4.877197265625, 5.1441650390625, 5.4111328125, 5.6781005859375, 5.945068359375, 6.2120361328125, 6.47900390625, 6.7459716796875, 7.012939453125, 7.2799072265625, 7.546875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 5.0, 2.0, 3.0, 7.0, 5.0, 5.0, 12.0, 10.0, 22.0, 17.0, 23.0, 29.0, 29.0, 36.0, 30.0, 39.0, 35.0, 37.0, 36.0, 53.0, 37.0, 50.0, 57.0, 49.0, 47.0, 37.0, 34.0, 36.0, 25.0, 23.0, 21.0, 32.0, 24.0, 23.0, 8.0, 14.0, 10.0, 9.0, 6.0, 4.0, 8.0, 5.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.12890625, -3.99749755859375, -3.8660888671875, -3.73468017578125, -3.603271484375, -3.47186279296875, -3.3404541015625, -3.20904541015625, -3.07763671875, -2.94622802734375, -2.8148193359375, -2.68341064453125, -2.552001953125, -2.42059326171875, -2.2891845703125, -2.15777587890625, -2.0263671875, -1.89495849609375, -1.7635498046875, -1.63214111328125, -1.500732421875, -1.36932373046875, -1.2379150390625, -1.10650634765625, -0.97509765625, -0.84368896484375, -0.7122802734375, -0.58087158203125, -0.449462890625, -0.31805419921875, -0.1866455078125, -0.05523681640625, 0.076171875, 0.20758056640625, 0.3389892578125, 0.47039794921875, 0.601806640625, 0.73321533203125, 0.8646240234375, 0.99603271484375, 1.12744140625, 1.25885009765625, 1.3902587890625, 1.52166748046875, 1.653076171875, 1.78448486328125, 1.9158935546875, 2.04730224609375, 2.1787109375, 2.31011962890625, 2.4415283203125, 2.57293701171875, 2.704345703125, 2.83575439453125, 2.9671630859375, 3.09857177734375, 3.22998046875, 3.36138916015625, 3.4927978515625, 3.62420654296875, 3.755615234375, 3.88702392578125, 4.0184326171875, 4.14984130859375, 4.28125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 12.0, 9.0, 29.0, 36.0, 54.0, 91.0, 132.0, 195.0, 148.0, 113.0, 85.0, 39.0, 26.0, 13.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-123.0362548828125, -120.19639587402344, -117.35653686523438, -114.51667785644531, -111.67681884765625, -108.83695983886719, -105.99710083007812, -103.15724182128906, -100.3173828125, -97.47752380371094, -94.63766479492188, -91.79780578613281, -88.95794677734375, -86.11808776855469, -83.27822875976562, -80.43836975097656, -77.59851837158203, -74.75865936279297, -71.9188003540039, -69.07894134521484, -66.23908233642578, -63.39922332763672, -60.55936813354492, -57.71950912475586, -54.8796501159668, -52.039791107177734, -49.19993209838867, -46.360076904296875, -43.52021789550781, -40.68035888671875, -37.84049987792969, -35.000640869140625, -32.16078186035156, -29.3209228515625, -26.481063842773438, -23.641206741333008, -20.801347732543945, -17.961488723754883, -15.121631622314453, -12.28177261352539, -9.441913604736328, -6.602055072784424, -3.7621965408325195, -0.9223384857177734, 1.917520523071289, 4.757379531860352, 7.597236633300781, 10.437095642089844, 13.276954650878906, 16.11681365966797, 18.95667266845703, 21.79652976989746, 24.636388778686523, 27.476247787475586, 30.316104888916016, 33.15596389770508, 35.99582290649414, 38.8356819152832, 41.675540924072266, 44.51539611816406, 47.355255126953125, 50.19511413574219, 53.03497314453125, 55.87483215332031, 58.714691162109375]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 7.0, 16.0, 14.0, 35.0, 47.0, 71.0, 88.0, 97.0, 123.0, 108.0, 103.0, 81.0, 64.0, 58.0, 32.0, 28.0, 13.0, 9.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.49119567871094, -69.84510803222656, -67.19901275634766, -64.55292510986328, -61.906837463378906, -59.260746002197266, -56.614654541015625, -53.96856689453125, -51.322479248046875, -48.676387786865234, -46.03030014038086, -43.38420867919922, -40.738121032714844, -38.0920295715332, -35.44593811035156, -32.79985046386719, -30.153759002685547, -27.50766944885254, -24.86157989501953, -22.21548843383789, -19.569400787353516, -16.923309326171875, -14.277219772338867, -11.63113021850586, -8.985040664672852, -6.338951110839844, -3.6928610801696777, -1.0467710494995117, 1.599318504333496, 4.245408058166504, 6.891498565673828, 9.537588119506836, 12.183677673339844, 14.829767227172852, 17.47585678100586, 20.1219482421875, 22.768035888671875, 25.414127349853516, 28.060216903686523, 30.70630645751953, 33.352394104003906, 35.99848556518555, 38.64457321166992, 41.29066467285156, 43.93675231933594, 46.58284378051758, 49.22893524169922, 51.875022888183594, 54.521114349365234, 57.167205810546875, 59.81329345703125, 62.45938491821289, 65.10547637939453, 67.7515640258789, 70.39765167236328, 73.04374694824219, 75.68983459472656, 78.33592224121094, 80.98201751708984, 83.62810516357422, 86.2741928100586, 88.92028045654297, 91.56637573242188, 94.21246337890625, 96.85855102539062]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 7.0, 10.0, 9.0, 6.0, 13.0, 15.0, 11.0, 16.0, 29.0, 30.0, 46.0, 72.0, 162.0, 385.0, 905.0, 2910.0, 12490.0, 115480.0, 3945689.0, 100393.0, 11708.0, 2649.0, 785.0, 268.0, 77.0, 46.0, 20.0, 15.0, 11.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-100.9375, -98.7177734375, -96.498046875, -94.2783203125, -92.05859375, -89.8388671875, -87.619140625, -85.3994140625, -83.1796875, -80.9599609375, -78.740234375, -76.5205078125, -74.30078125, -72.0810546875, -69.861328125, -67.6416015625, -65.421875, -63.2021484375, -60.982421875, -58.7626953125, -56.54296875, -54.3232421875, -52.103515625, -49.8837890625, -47.6640625, -45.4443359375, -43.224609375, -41.0048828125, -38.78515625, -36.5654296875, -34.345703125, -32.1259765625, -29.90625, -27.6865234375, -25.466796875, -23.2470703125, -21.02734375, -18.8076171875, -16.587890625, -14.3681640625, -12.1484375, -9.9287109375, -7.708984375, -5.4892578125, -3.26953125, -1.0498046875, 1.169921875, 3.3896484375, 5.609375, 7.8291015625, 10.048828125, 12.2685546875, 14.48828125, 16.7080078125, 18.927734375, 21.1474609375, 23.3671875, 25.5869140625, 27.806640625, 30.0263671875, 32.24609375, 34.4658203125, 36.685546875, 38.9052734375, 41.125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 4.0, 9.0, 13.0, 11.0, 10.0, 20.0, 19.0, 24.0, 29.0, 33.0, 35.0, 46.0, 43.0, 42.0, 62.0, 50.0, 45.0, 53.0, 50.0, 49.0, 44.0, 47.0, 35.0, 35.0, 25.0, 30.0, 22.0, 15.0, 16.0, 15.0, 12.0, 12.0, 8.0, 5.0, 4.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9345703125, -0.9020538330078125, -0.869537353515625, -0.8370208740234375, -0.80450439453125, -0.7719879150390625, -0.739471435546875, -0.7069549560546875, -0.6744384765625, -0.6419219970703125, -0.609405517578125, -0.5768890380859375, -0.54437255859375, -0.5118560791015625, -0.479339599609375, -0.4468231201171875, -0.414306640625, -0.3817901611328125, -0.349273681640625, -0.3167572021484375, -0.28424072265625, -0.2517242431640625, -0.219207763671875, -0.1866912841796875, -0.1541748046875, -0.1216583251953125, -0.089141845703125, -0.0566253662109375, -0.02410888671875, 0.0084075927734375, 0.040924072265625, 0.0734405517578125, 0.10595703125, 0.1384735107421875, 0.170989990234375, 0.2035064697265625, 0.23602294921875, 0.2685394287109375, 0.301055908203125, 0.3335723876953125, 0.3660888671875, 0.3986053466796875, 0.431121826171875, 0.4636383056640625, 0.49615478515625, 0.5286712646484375, 0.561187744140625, 0.5937042236328125, 0.626220703125, 0.6587371826171875, 0.691253662109375, 0.7237701416015625, 0.75628662109375, 0.7888031005859375, 0.821319580078125, 0.8538360595703125, 0.8863525390625, 0.9188690185546875, 0.951385498046875, 0.9839019775390625, 1.01641845703125, 1.0489349365234375, 1.081451416015625, 1.1139678955078125, 1.146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 11.0, 11.0, 17.0, 18.0, 32.0, 39.0, 94.0, 141.0, 350.0, 1395.0, 15823.0, 3539656.0, 626797.0, 8273.0, 959.0, 288.0, 124.0, 89.0, 52.0, 24.0, 24.0, 16.0, 15.0, 7.0, 8.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.0, -122.3896484375, -118.779296875, -115.1689453125, -111.55859375, -107.9482421875, -104.337890625, -100.7275390625, -97.1171875, -93.5068359375, -89.896484375, -86.2861328125, -82.67578125, -79.0654296875, -75.455078125, -71.8447265625, -68.234375, -64.6240234375, -61.013671875, -57.4033203125, -53.79296875, -50.1826171875, -46.572265625, -42.9619140625, -39.3515625, -35.7412109375, -32.130859375, -28.5205078125, -24.91015625, -21.2998046875, -17.689453125, -14.0791015625, -10.46875, -6.8583984375, -3.248046875, 0.3623046875, 3.97265625, 7.5830078125, 11.193359375, 14.8037109375, 18.4140625, 22.0244140625, 25.634765625, 29.2451171875, 32.85546875, 36.4658203125, 40.076171875, 43.6865234375, 47.296875, 50.9072265625, 54.517578125, 58.1279296875, 61.73828125, 65.3486328125, 68.958984375, 72.5693359375, 76.1796875, 79.7900390625, 83.400390625, 87.0107421875, 90.62109375, 94.2314453125, 97.841796875, 101.4521484375, 105.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 8.0, 6.0, 12.0, 20.0, 23.0, 20.0, 29.0, 63.0, 61.0, 90.0, 147.0, 231.0, 416.0, 1345.0, 690.0, 336.0, 187.0, 122.0, 86.0, 51.0, 24.0, 24.0, 14.0, 12.0, 16.0, 6.0, 10.0, 8.0, 4.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.97943115234375, -3.8455810546875, -3.71173095703125, -3.577880859375, -3.44403076171875, -3.3101806640625, -3.17633056640625, -3.04248046875, -2.90863037109375, -2.7747802734375, -2.64093017578125, -2.507080078125, -2.37322998046875, -2.2393798828125, -2.10552978515625, -1.9716796875, -1.83782958984375, -1.7039794921875, -1.57012939453125, -1.436279296875, -1.30242919921875, -1.1685791015625, -1.03472900390625, -0.90087890625, -0.76702880859375, -0.6331787109375, -0.49932861328125, -0.365478515625, -0.23162841796875, -0.0977783203125, 0.03607177734375, 0.169921875, 0.30377197265625, 0.4376220703125, 0.57147216796875, 0.705322265625, 0.83917236328125, 0.9730224609375, 1.10687255859375, 1.24072265625, 1.37457275390625, 1.5084228515625, 1.64227294921875, 1.776123046875, 1.90997314453125, 2.0438232421875, 2.17767333984375, 2.3115234375, 2.44537353515625, 2.5792236328125, 2.71307373046875, 2.846923828125, 2.98077392578125, 3.1146240234375, 3.24847412109375, 3.38232421875, 3.51617431640625, 3.6500244140625, 3.78387451171875, 3.917724609375, 4.05157470703125, 4.1854248046875, 4.31927490234375, 4.453125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 3.0, 8.0, 11.0, 17.0, 13.0, 22.0, 26.0, 37.0, 38.0, 52.0, 68.0, 79.0, 87.0, 79.0, 79.0, 82.0, 85.0, 46.0, 40.0, 31.0, 24.0, 13.0, 14.0, 12.0, 5.0, 4.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.251728057861328, -15.519047737121582, -14.786367416381836, -14.053686141967773, -13.321006774902344, -12.588325500488281, -11.855645179748535, -11.122964859008789, -10.390284538269043, -9.657604217529297, -8.92492389678955, -8.192243576049805, -7.4595627784729, -6.726882457733154, -5.99420166015625, -5.261521339416504, -4.528841018676758, -3.7961606979370117, -3.0634801387786865, -2.3307995796203613, -1.5981192588806152, -0.8654389381408691, -0.13275814056396484, 0.5999221801757812, 1.3326025009155273, 2.0652828216552734, 2.7979633808135986, 3.530643939971924, 4.26332426071167, 4.996004581451416, 5.72868537902832, 6.461365699768066, 7.194047927856445, 7.926728248596191, 8.659408569335938, 9.39208984375, 10.12476921081543, 10.857450485229492, 11.590130805969238, 12.322811126708984, 13.05549144744873, 13.788171768188477, 14.520852088928223, 15.253532409667969, 15.986213684082031, 16.71889305114746, 17.451574325561523, 18.184253692626953, 18.916934967041016, 19.649616241455078, 20.382295608520508, 21.11497688293457, 21.84765625, 22.580337524414062, 23.313018798828125, 24.045698165893555, 24.778377532958984, 25.511058807373047, 26.243738174438477, 26.97641944885254, 27.70909881591797, 28.44178009033203, 29.174461364746094, 29.907140731811523, 30.639822006225586]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 12.0, 4.0, 10.0, 12.0, 19.0, 27.0, 22.0, 31.0, 26.0, 26.0, 37.0, 33.0, 35.0, 32.0, 47.0, 58.0, 58.0, 41.0, 43.0, 44.0, 44.0, 37.0, 36.0, 31.0, 24.0, 31.0, 25.0, 19.0, 20.0, 22.0, 16.0, 12.0, 17.0, 13.0, 6.0, 9.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.285501480102539, -12.823211669921875, -12.360921859741211, -11.898632049560547, -11.436342239379883, -10.974052429199219, -10.511762619018555, -10.049471855163574, -9.58718204498291, -9.124892234802246, -8.662602424621582, -8.200312614440918, -7.738022327423096, -7.275732517242432, -6.813442707061768, -6.351152420043945, -5.8888630867004395, -5.426573276519775, -4.964283466339111, -4.501993179321289, -4.039703369140625, -3.577413558959961, -3.115123748779297, -2.6528337001800537, -2.1905438899993896, -1.728253960609436, -1.2659640312194824, -0.8036742210388184, -0.34138429164886475, 0.12090563774108887, 0.5831954479217529, 1.045485496520996, 1.5077753067016602, 1.9700652360916138, 2.4323551654815674, 2.8946449756622314, 3.3569350242614746, 3.8192248344421387, 4.281514644622803, 4.743804931640625, 5.206094741821289, 5.668384552001953, 6.130674362182617, 6.592964172363281, 7.0552544593811035, 7.517544269561768, 7.979834079742432, 8.442124366760254, 8.904413223266602, 9.366703033447266, 9.82899284362793, 10.291282653808594, 10.753572463989258, 11.215862274169922, 11.678152084350586, 12.140442848205566, 12.60273265838623, 13.065022468566895, 13.527312278747559, 13.989602088928223, 14.451891899108887, 14.914182662963867, 15.376472473144531, 15.838762283325195, 16.30105209350586]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 4.0, 6.0, 4.0, 15.0, 21.0, 23.0, 28.0, 49.0, 81.0, 110.0, 163.0, 315.0, 512.0, 888.0, 1508.0, 2829.0, 5354.0, 10768.0, 21689.0, 44064.0, 89099.0, 166830.0, 243063.0, 211792.0, 123830.0, 62996.0, 30561.0, 15218.0, 7732.0, 3857.0, 2137.0, 1209.0, 674.0, 406.0, 212.0, 154.0, 102.0, 78.0, 46.0, 39.0, 27.0, 12.0, 18.0, 9.0, 8.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.9609375, -11.584228515625, -11.20751953125, -10.830810546875, -10.4541015625, -10.077392578125, -9.70068359375, -9.323974609375, -8.947265625, -8.570556640625, -8.19384765625, -7.817138671875, -7.4404296875, -7.063720703125, -6.68701171875, -6.310302734375, -5.93359375, -5.556884765625, -5.18017578125, -4.803466796875, -4.4267578125, -4.050048828125, -3.67333984375, -3.296630859375, -2.919921875, -2.543212890625, -2.16650390625, -1.789794921875, -1.4130859375, -1.036376953125, -0.65966796875, -0.282958984375, 0.09375, 0.470458984375, 0.84716796875, 1.223876953125, 1.6005859375, 1.977294921875, 2.35400390625, 2.730712890625, 3.107421875, 3.484130859375, 3.86083984375, 4.237548828125, 4.6142578125, 4.990966796875, 5.36767578125, 5.744384765625, 6.12109375, 6.497802734375, 6.87451171875, 7.251220703125, 7.6279296875, 8.004638671875, 8.38134765625, 8.758056640625, 9.134765625, 9.511474609375, 9.88818359375, 10.264892578125, 10.6416015625, 11.018310546875, 11.39501953125, 11.771728515625, 12.1484375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 10.0, 12.0, 13.0, 19.0, 18.0, 34.0, 37.0, 41.0, 45.0, 75.0, 69.0, 76.0, 59.0, 65.0, 64.0, 54.0, 42.0, 50.0, 46.0, 27.0, 33.0, 22.0, 20.0, 19.0, 12.0, 9.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7763671875, -1.7316741943359375, -1.686981201171875, -1.6422882080078125, -1.59759521484375, -1.5529022216796875, -1.508209228515625, -1.4635162353515625, -1.4188232421875, -1.3741302490234375, -1.329437255859375, -1.2847442626953125, -1.24005126953125, -1.1953582763671875, -1.150665283203125, -1.1059722900390625, -1.061279296875, -1.0165863037109375, -0.971893310546875, -0.9272003173828125, -0.88250732421875, -0.8378143310546875, -0.793121337890625, -0.7484283447265625, -0.7037353515625, -0.6590423583984375, -0.614349365234375, -0.5696563720703125, -0.52496337890625, -0.4802703857421875, -0.435577392578125, -0.3908843994140625, -0.34619140625, -0.3014984130859375, -0.256805419921875, -0.2121124267578125, -0.16741943359375, -0.1227264404296875, -0.078033447265625, -0.0333404541015625, 0.0113525390625, 0.0560455322265625, 0.100738525390625, 0.1454315185546875, 0.19012451171875, 0.2348175048828125, 0.279510498046875, 0.3242034912109375, 0.368896484375, 0.4135894775390625, 0.458282470703125, 0.5029754638671875, 0.54766845703125, 0.5923614501953125, 0.637054443359375, 0.6817474365234375, 0.7264404296875, 0.7711334228515625, 0.815826416015625, 0.8605194091796875, 0.90521240234375, 0.9499053955078125, 0.994598388671875, 1.0392913818359375, 1.083984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 12.0, 20.0, 24.0, 35.0, 49.0, 58.0, 100.0, 128.0, 198.0, 273.0, 432.0, 677.0, 1086.0, 2051.0, 4229.0, 10064.0, 27076.0, 77830.0, 202458.0, 341179.0, 233457.0, 92812.0, 32236.0, 11692.0, 4828.0, 2279.0, 1183.0, 729.0, 434.0, 277.0, 199.0, 130.0, 95.0, 72.0, 46.0, 21.0, 27.0, 18.0, 14.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.359375, -18.799560546875, -18.23974609375, -17.679931640625, -17.1201171875, -16.560302734375, -16.00048828125, -15.440673828125, -14.880859375, -14.321044921875, -13.76123046875, -13.201416015625, -12.6416015625, -12.081787109375, -11.52197265625, -10.962158203125, -10.40234375, -9.842529296875, -9.28271484375, -8.722900390625, -8.1630859375, -7.603271484375, -7.04345703125, -6.483642578125, -5.923828125, -5.364013671875, -4.80419921875, -4.244384765625, -3.6845703125, -3.124755859375, -2.56494140625, -2.005126953125, -1.4453125, -0.885498046875, -0.32568359375, 0.234130859375, 0.7939453125, 1.353759765625, 1.91357421875, 2.473388671875, 3.033203125, 3.593017578125, 4.15283203125, 4.712646484375, 5.2724609375, 5.832275390625, 6.39208984375, 6.951904296875, 7.51171875, 8.071533203125, 8.63134765625, 9.191162109375, 9.7509765625, 10.310791015625, 10.87060546875, 11.430419921875, 11.990234375, 12.550048828125, 13.10986328125, 13.669677734375, 14.2294921875, 14.789306640625, 15.34912109375, 15.908935546875, 16.46875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 11.0, 10.0, 5.0, 7.0, 5.0, 17.0, 18.0, 24.0, 20.0, 15.0, 31.0, 26.0, 34.0, 40.0, 48.0, 31.0, 46.0, 37.0, 37.0, 29.0, 29.0, 40.0, 44.0, 46.0, 46.0, 34.0, 35.0, 43.0, 31.0, 25.0, 16.0, 24.0, 18.0, 16.0, 9.0, 11.0, 5.0, 6.0, 5.0, 2.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.18359375, -6.9678955078125, -6.752197265625, -6.5364990234375, -6.32080078125, -6.1051025390625, -5.889404296875, -5.6737060546875, -5.4580078125, -5.2423095703125, -5.026611328125, -4.8109130859375, -4.59521484375, -4.3795166015625, -4.163818359375, -3.9481201171875, -3.732421875, -3.5167236328125, -3.301025390625, -3.0853271484375, -2.86962890625, -2.6539306640625, -2.438232421875, -2.2225341796875, -2.0068359375, -1.7911376953125, -1.575439453125, -1.3597412109375, -1.14404296875, -0.9283447265625, -0.712646484375, -0.4969482421875, -0.28125, -0.0655517578125, 0.150146484375, 0.3658447265625, 0.58154296875, 0.7972412109375, 1.012939453125, 1.2286376953125, 1.4443359375, 1.6600341796875, 1.875732421875, 2.0914306640625, 2.30712890625, 2.5228271484375, 2.738525390625, 2.9542236328125, 3.169921875, 3.3856201171875, 3.601318359375, 3.8170166015625, 4.03271484375, 4.2484130859375, 4.464111328125, 4.6798095703125, 4.8955078125, 5.1112060546875, 5.326904296875, 5.5426025390625, 5.75830078125, 5.9739990234375, 6.189697265625, 6.4053955078125, 6.62109375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 9.0, 14.0, 33.0, 46.0, 71.0, 106.0, 189.0, 265.0, 524.0, 870.0, 1709.0, 3662.0, 8293.0, 21956.0, 68802.0, 222268.0, 398449.0, 216787.0, 67338.0, 21786.0, 8044.0, 3557.0, 1642.0, 842.0, 470.0, 317.0, 156.0, 109.0, 69.0, 54.0, 35.0, 19.0, 22.0, 10.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.294921875, -11.84765625, -11.400390625, -10.953125, -10.505859375, -10.05859375, -9.611328125, -9.1640625, -8.716796875, -8.26953125, -7.822265625, -7.375, -6.927734375, -6.48046875, -6.033203125, -5.5859375, -5.138671875, -4.69140625, -4.244140625, -3.796875, -3.349609375, -2.90234375, -2.455078125, -2.0078125, -1.560546875, -1.11328125, -0.666015625, -0.21875, 0.228515625, 0.67578125, 1.123046875, 1.5703125, 2.017578125, 2.46484375, 2.912109375, 3.359375, 3.806640625, 4.25390625, 4.701171875, 5.1484375, 5.595703125, 6.04296875, 6.490234375, 6.9375, 7.384765625, 7.83203125, 8.279296875, 8.7265625, 9.173828125, 9.62109375, 10.068359375, 10.515625, 10.962890625, 11.41015625, 11.857421875, 12.3046875, 12.751953125, 13.19921875, 13.646484375, 14.09375, 14.541015625, 14.98828125, 15.435546875, 15.8828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 3.0, 7.0, 17.0, 21.0, 24.0, 39.0, 50.0, 86.0, 87.0, 122.0, 109.0, 109.0, 104.0, 72.0, 37.0, 38.0, 20.0, 17.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018520355224609375, -0.0017689168453216553, -0.001685798168182373, -0.0016026794910430908, -0.0015195608139038086, -0.0014364421367645264, -0.0013533234596252441, -0.001270204782485962, -0.0011870861053466797, -0.0011039674282073975, -0.0010208487510681152, -0.000937730073928833, -0.0008546113967895508, -0.0007714927196502686, -0.0006883740425109863, -0.0006052553653717041, -0.0005221366882324219, -0.00043901801109313965, -0.0003558993339538574, -0.0002727806568145752, -0.00018966197967529297, -0.00010654330253601074, -2.3424625396728516e-05, 5.969405174255371e-05, 0.00014281272888183594, 0.00022593140602111816, 0.0003090500831604004, 0.0003921687602996826, 0.00047528743743896484, 0.0005584061145782471, 0.0006415247917175293, 0.0007246434688568115, 0.0008077621459960938, 0.000890880823135376, 0.0009739995002746582, 0.0010571181774139404, 0.0011402368545532227, 0.0012233555316925049, 0.0013064742088317871, 0.0013895928859710693, 0.0014727115631103516, 0.0015558302402496338, 0.001638948917388916, 0.0017220675945281982, 0.0018051862716674805, 0.0018883049488067627, 0.001971423625946045, 0.002054542303085327, 0.0021376609802246094, 0.0022207796573638916, 0.002303898334503174, 0.002387017011642456, 0.0024701356887817383, 0.0025532543659210205, 0.0026363730430603027, 0.002719491720199585, 0.002802610397338867, 0.0028857290744781494, 0.0029688477516174316, 0.003051966428756714, 0.003135085105895996, 0.0032182037830352783, 0.0033013224601745605, 0.0033844411373138428, 0.003467559814453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 10.0, 15.0, 18.0, 25.0, 40.0, 53.0, 78.0, 135.0, 182.0, 319.0, 527.0, 963.0, 1964.0, 4159.0, 10503.0, 29785.0, 93503.0, 274610.0, 375550.0, 170946.0, 53797.0, 18185.0, 6919.0, 2909.0, 1414.0, 763.0, 436.0, 241.0, 162.0, 116.0, 67.0, 42.0, 25.0, 21.0, 17.0, 15.0, 8.0, 9.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3046875, -11.8841552734375, -11.463623046875, -11.0430908203125, -10.62255859375, -10.2020263671875, -9.781494140625, -9.3609619140625, -8.9404296875, -8.5198974609375, -8.099365234375, -7.6788330078125, -7.25830078125, -6.8377685546875, -6.417236328125, -5.9967041015625, -5.576171875, -5.1556396484375, -4.735107421875, -4.3145751953125, -3.89404296875, -3.4735107421875, -3.052978515625, -2.6324462890625, -2.2119140625, -1.7913818359375, -1.370849609375, -0.9503173828125, -0.52978515625, -0.1092529296875, 0.311279296875, 0.7318115234375, 1.15234375, 1.5728759765625, 1.993408203125, 2.4139404296875, 2.83447265625, 3.2550048828125, 3.675537109375, 4.0960693359375, 4.5166015625, 4.9371337890625, 5.357666015625, 5.7781982421875, 6.19873046875, 6.6192626953125, 7.039794921875, 7.4603271484375, 7.880859375, 8.3013916015625, 8.721923828125, 9.1424560546875, 9.56298828125, 9.9835205078125, 10.404052734375, 10.8245849609375, 11.2451171875, 11.6656494140625, 12.086181640625, 12.5067138671875, 12.92724609375, 13.3477783203125, 13.768310546875, 14.1888427734375, 14.609375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 6.0, 8.0, 12.0, 7.0, 13.0, 12.0, 16.0, 23.0, 19.0, 24.0, 32.0, 42.0, 45.0, 59.0, 51.0, 61.0, 68.0, 47.0, 62.0, 51.0, 55.0, 37.0, 36.0, 31.0, 33.0, 33.0, 22.0, 21.0, 12.0, 14.0, 11.0, 13.0, 7.0, 7.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5546875, -5.38043212890625, -5.2061767578125, -5.03192138671875, -4.857666015625, -4.68341064453125, -4.5091552734375, -4.33489990234375, -4.16064453125, -3.98638916015625, -3.8121337890625, -3.63787841796875, -3.463623046875, -3.28936767578125, -3.1151123046875, -2.94085693359375, -2.7666015625, -2.59234619140625, -2.4180908203125, -2.24383544921875, -2.069580078125, -1.89532470703125, -1.7210693359375, -1.54681396484375, -1.37255859375, -1.19830322265625, -1.0240478515625, -0.84979248046875, -0.675537109375, -0.50128173828125, -0.3270263671875, -0.15277099609375, 0.021484375, 0.19573974609375, 0.3699951171875, 0.54425048828125, 0.718505859375, 0.89276123046875, 1.0670166015625, 1.24127197265625, 1.41552734375, 1.58978271484375, 1.7640380859375, 1.93829345703125, 2.112548828125, 2.28680419921875, 2.4610595703125, 2.63531494140625, 2.8095703125, 2.98382568359375, 3.1580810546875, 3.33233642578125, 3.506591796875, 3.68084716796875, 3.8551025390625, 4.02935791015625, 4.20361328125, 4.37786865234375, 4.5521240234375, 4.72637939453125, 4.900634765625, 5.07489013671875, 5.2491455078125, 5.42340087890625, 5.59765625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 15.0, 10.0, 18.0, 31.0, 68.0, 105.0, 175.0, 156.0, 168.0, 102.0, 61.0, 37.0, 15.0, 17.0, 8.0, 3.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.0747833251953, -165.66006469726562, -160.245361328125, -154.8306427001953, -149.41592407226562, -144.001220703125, -138.5865020751953, -133.17178344726562, -127.75707244873047, -122.34236145019531, -116.92764282226562, -111.51293182373047, -106.09822082519531, -100.68350219726562, -95.26879119873047, -89.85408020019531, -84.43936157226562, -79.02465057373047, -73.60993194580078, -68.19522094726562, -62.7805061340332, -57.36579132080078, -51.951080322265625, -46.5363655090332, -41.12165069580078, -35.70693588256836, -30.29222297668457, -24.87751007080078, -19.46279525756836, -14.048080444335938, -8.633369445800781, -3.2186546325683594, 2.196075439453125, 7.6107892990112305, 13.025503158569336, 18.440216064453125, 23.854930877685547, 29.26964569091797, 34.684356689453125, 40.09907150268555, 45.51378631591797, 50.92850112915039, 56.34321594238281, 61.75792694091797, 67.17263793945312, 72.58735656738281, 78.00206756591797, 83.41677856445312, 88.83149719238281, 94.24620819091797, 99.66092681884766, 105.07563781738281, 110.4903564453125, 115.90506744384766, 121.31977844238281, 126.7344970703125, 132.14920043945312, 137.5639190673828, 142.97862243652344, 148.39334106445312, 153.8080596923828, 159.2227783203125, 164.63748168945312, 170.0522003173828, 175.4669189453125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 6.0, 16.0, 11.0, 15.0, 18.0, 33.0, 41.0, 34.0, 43.0, 50.0, 44.0, 58.0, 62.0, 57.0, 53.0, 63.0, 59.0, 46.0, 55.0, 38.0, 35.0, 33.0, 24.0, 20.0, 15.0, 16.0, 8.0, 11.0, 8.0, 5.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.20414733886719, -79.92383575439453, -77.64352416992188, -75.36321258544922, -73.08290100097656, -70.8025894165039, -68.52227783203125, -66.24197387695312, -63.9616584777832, -61.68134689331055, -59.40103530883789, -57.120723724365234, -54.840415954589844, -52.56010437011719, -50.27979278564453, -47.999481201171875, -45.71916961669922, -43.43885803222656, -41.158546447753906, -38.87823486328125, -36.597923278808594, -34.31761169433594, -32.03730392456055, -29.75699234008789, -27.476680755615234, -25.196369171142578, -22.916057586669922, -20.6357479095459, -18.355436325073242, -16.075124740600586, -13.794814109802246, -11.514503479003906, -9.234184265136719, -6.953873157501221, -4.673562049865723, -2.3932509422302246, -0.11293983459472656, 2.1673717498779297, 4.4476823806762695, 6.727993011474609, 9.008304595947266, 11.288616180419922, 13.568926811218262, 15.849237442016602, 18.129549026489258, 20.409860610961914, 22.690170288085938, 24.970481872558594, 27.25079345703125, 29.531105041503906, 31.811416625976562, 34.09172821044922, 36.372039794921875, 38.65235137939453, 40.93265914916992, 43.21297073364258, 45.493282318115234, 47.77359390258789, 50.05390548706055, 52.3342170715332, 54.614524841308594, 56.89483642578125, 59.175148010253906, 61.45545959472656, 63.73577117919922]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 11.0, 12.0, 24.0, 32.0, 53.0, 95.0, 135.0, 249.0, 565.0, 1492.0, 6250.0, 39249.0, 2761268.0, 1340776.0, 36684.0, 5605.0, 1153.0, 314.0, 114.0, 57.0, 37.0, 26.0, 23.0, 15.0, 12.0, 9.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.875, -90.36328125, -87.8515625, -85.33984375, -82.828125, -80.31640625, -77.8046875, -75.29296875, -72.78125, -70.26953125, -67.7578125, -65.24609375, -62.734375, -60.22265625, -57.7109375, -55.19921875, -52.6875, -50.17578125, -47.6640625, -45.15234375, -42.640625, -40.12890625, -37.6171875, -35.10546875, -32.59375, -30.08203125, -27.5703125, -25.05859375, -22.546875, -20.03515625, -17.5234375, -15.01171875, -12.5, -9.98828125, -7.4765625, -4.96484375, -2.453125, 0.05859375, 2.5703125, 5.08203125, 7.59375, 10.10546875, 12.6171875, 15.12890625, 17.640625, 20.15234375, 22.6640625, 25.17578125, 27.6875, 30.19921875, 32.7109375, 35.22265625, 37.734375, 40.24609375, 42.7578125, 45.26953125, 47.78125, 50.29296875, 52.8046875, 55.31640625, 57.828125, 60.33984375, 62.8515625, 65.36328125, 67.875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 23.0, 25.0, 28.0, 22.0, 50.0, 60.0, 67.0, 83.0, 74.0, 67.0, 74.0, 69.0, 65.0, 46.0, 43.0, 46.0, 27.0, 32.0, 14.0, 19.0, 12.0, 10.0, 7.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.74609375, -2.6749267578125, -2.603759765625, -2.5325927734375, -2.46142578125, -2.3902587890625, -2.319091796875, -2.2479248046875, -2.1767578125, -2.1055908203125, -2.034423828125, -1.9632568359375, -1.89208984375, -1.8209228515625, -1.749755859375, -1.6785888671875, -1.607421875, -1.5362548828125, -1.465087890625, -1.3939208984375, -1.32275390625, -1.2515869140625, -1.180419921875, -1.1092529296875, -1.0380859375, -0.9669189453125, -0.895751953125, -0.8245849609375, -0.75341796875, -0.6822509765625, -0.611083984375, -0.5399169921875, -0.46875, -0.3975830078125, -0.326416015625, -0.2552490234375, -0.18408203125, -0.1129150390625, -0.041748046875, 0.0294189453125, 0.1005859375, 0.1717529296875, 0.242919921875, 0.3140869140625, 0.38525390625, 0.4564208984375, 0.527587890625, 0.5987548828125, 0.669921875, 0.7410888671875, 0.812255859375, 0.8834228515625, 0.95458984375, 1.0257568359375, 1.096923828125, 1.1680908203125, 1.2392578125, 1.3104248046875, 1.381591796875, 1.4527587890625, 1.52392578125, 1.5950927734375, 1.666259765625, 1.7374267578125, 1.80859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 7.0, 5.0, 1.0, 4.0, 4.0, 17.0, 14.0, 12.0, 16.0, 29.0, 25.0, 56.0, 73.0, 162.0, 283.0, 753.0, 2592.0, 10330.0, 62120.0, 965665.0, 3030253.0, 101999.0, 15009.0, 3193.0, 877.0, 327.0, 155.0, 97.0, 58.0, 41.0, 23.0, 21.0, 16.0, 15.0, 10.0, 9.0, 5.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.59375, -42.74462890625, -40.8955078125, -39.04638671875, -37.197265625, -35.34814453125, -33.4990234375, -31.64990234375, -29.80078125, -27.95166015625, -26.1025390625, -24.25341796875, -22.404296875, -20.55517578125, -18.7060546875, -16.85693359375, -15.0078125, -13.15869140625, -11.3095703125, -9.46044921875, -7.611328125, -5.76220703125, -3.9130859375, -2.06396484375, -0.21484375, 1.63427734375, 3.4833984375, 5.33251953125, 7.181640625, 9.03076171875, 10.8798828125, 12.72900390625, 14.578125, 16.42724609375, 18.2763671875, 20.12548828125, 21.974609375, 23.82373046875, 25.6728515625, 27.52197265625, 29.37109375, 31.22021484375, 33.0693359375, 34.91845703125, 36.767578125, 38.61669921875, 40.4658203125, 42.31494140625, 44.1640625, 46.01318359375, 47.8623046875, 49.71142578125, 51.560546875, 53.40966796875, 55.2587890625, 57.10791015625, 58.95703125, 60.80615234375, 62.6552734375, 64.50439453125, 66.353515625, 68.20263671875, 70.0517578125, 71.90087890625, 73.75]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 6.0, 4.0, 6.0, 11.0, 14.0, 20.0, 25.0, 21.0, 38.0, 74.0, 96.0, 188.0, 282.0, 622.0, 1408.0, 534.0, 275.0, 146.0, 104.0, 67.0, 44.0, 22.0, 15.0, 14.0, 13.0, 9.0, 7.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55859375, -6.32781982421875, -6.0970458984375, -5.86627197265625, -5.635498046875, -5.40472412109375, -5.1739501953125, -4.94317626953125, -4.71240234375, -4.48162841796875, -4.2508544921875, -4.02008056640625, -3.789306640625, -3.55853271484375, -3.3277587890625, -3.09698486328125, -2.8662109375, -2.63543701171875, -2.4046630859375, -2.17388916015625, -1.943115234375, -1.71234130859375, -1.4815673828125, -1.25079345703125, -1.02001953125, -0.78924560546875, -0.5584716796875, -0.32769775390625, -0.096923828125, 0.13385009765625, 0.3646240234375, 0.59539794921875, 0.826171875, 1.05694580078125, 1.2877197265625, 1.51849365234375, 1.749267578125, 1.98004150390625, 2.2108154296875, 2.44158935546875, 2.67236328125, 2.90313720703125, 3.1339111328125, 3.36468505859375, 3.595458984375, 3.82623291015625, 4.0570068359375, 4.28778076171875, 4.5185546875, 4.74932861328125, 4.9801025390625, 5.21087646484375, 5.441650390625, 5.67242431640625, 5.9031982421875, 6.13397216796875, 6.36474609375, 6.59552001953125, 6.8262939453125, 7.05706787109375, 7.287841796875, 7.51861572265625, 7.7493896484375, 7.98016357421875, 8.2109375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 11.0, 10.0, 10.0, 33.0, 39.0, 72.0, 106.0, 110.0, 148.0, 139.0, 108.0, 84.0, 54.0, 24.0, 20.0, 11.0, 10.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.40202331542969, -75.40481567382812, -73.4076156616211, -71.41040802001953, -69.41320037841797, -67.41600036621094, -65.41879272460938, -63.42158889770508, -61.42438507080078, -59.427181243896484, -57.42997360229492, -55.432769775390625, -53.43556594848633, -51.43836212158203, -49.44115447998047, -47.44395065307617, -45.44674301147461, -43.44953918457031, -41.45233154296875, -39.45512771606445, -37.457923889160156, -35.460716247558594, -33.4635124206543, -31.46630859375, -29.46910285949707, -27.47189712524414, -25.474693298339844, -23.477487564086914, -21.480281829833984, -19.483078002929688, -17.485872268676758, -15.488667488098145, -13.491462707519531, -11.494257926940918, -9.497053146362305, -7.499847412109375, -5.502642631530762, -3.5054378509521484, -1.5082321166992188, 0.48897266387939453, 2.486177444458008, 4.483382225036621, 6.480587482452393, 8.477792739868164, 10.474997520446777, 12.47220230102539, 14.46940803527832, 16.46661376953125, 18.463817596435547, 20.461023330688477, 22.458227157592773, 24.455432891845703, 26.45263671875, 28.44984245300293, 30.44704818725586, 32.444252014160156, 34.44145965576172, 36.438663482666016, 38.43587112426758, 40.433074951171875, 42.43027877807617, 44.42748260498047, 46.42469024658203, 48.42189407348633, 50.419097900390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 7.0, 2.0, 6.0, 7.0, 15.0, 19.0, 14.0, 26.0, 22.0, 38.0, 32.0, 27.0, 23.0, 34.0, 37.0, 33.0, 44.0, 49.0, 49.0, 42.0, 46.0, 49.0, 55.0, 32.0, 39.0, 32.0, 30.0, 32.0, 33.0, 25.0, 22.0, 16.0, 18.0, 10.0, 8.0, 9.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.50879669189453, -22.656274795532227, -21.803754806518555, -20.95123291015625, -20.098712921142578, -19.246191024780273, -18.39366912841797, -17.541149139404297, -16.688629150390625, -15.836108207702637, -14.983587265014648, -14.131065368652344, -13.278545379638672, -12.426023483276367, -11.573502540588379, -10.72098159790039, -9.868459701538086, -9.015938758850098, -8.16341781616211, -7.310896396636963, -6.458375453948975, -5.605854511260986, -4.75333309173584, -3.9008121490478516, -3.0482912063598633, -2.195770263671875, -1.3432490825653076, -0.49072790145874023, 0.36179304122924805, 1.2143139839172363, 2.066835403442383, 2.919356346130371, 3.771879196166992, 4.6244001388549805, 5.476921081542969, 6.329442501068115, 7.1819634437561035, 8.03448486328125, 8.887005805969238, 9.739526748657227, 10.592047691345215, 11.444568634033203, 12.297089576721191, 13.14961051940918, 14.002132415771484, 14.854652404785156, 15.707174301147461, 16.559696197509766, 17.412216186523438, 18.264738082885742, 19.117258071899414, 19.96977996826172, 20.82229995727539, 21.674821853637695, 22.52734375, 23.379863739013672, 24.232383728027344, 25.08490562438965, 25.93742561340332, 26.789947509765625, 27.642467498779297, 28.4949893951416, 29.347511291503906, 30.200031280517578, 31.052553176879883]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 0.0, 5.0, 5.0, 9.0, 8.0, 17.0, 16.0, 27.0, 54.0, 66.0, 95.0, 138.0, 202.0, 249.0, 423.0, 576.0, 958.0, 1786.0, 3721.0, 8773.0, 24107.0, 69050.0, 180749.0, 322013.0, 257312.0, 112466.0, 40408.0, 14004.0, 5420.0, 2476.0, 1264.0, 703.0, 398.0, 285.0, 214.0, 152.0, 91.0, 83.0, 71.0, 40.0, 33.0, 28.0, 14.0, 13.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-19.015625, -18.434814453125, -17.85400390625, -17.273193359375, -16.6923828125, -16.111572265625, -15.53076171875, -14.949951171875, -14.369140625, -13.788330078125, -13.20751953125, -12.626708984375, -12.0458984375, -11.465087890625, -10.88427734375, -10.303466796875, -9.72265625, -9.141845703125, -8.56103515625, -7.980224609375, -7.3994140625, -6.818603515625, -6.23779296875, -5.656982421875, -5.076171875, -4.495361328125, -3.91455078125, -3.333740234375, -2.7529296875, -2.172119140625, -1.59130859375, -1.010498046875, -0.4296875, 0.151123046875, 0.73193359375, 1.312744140625, 1.8935546875, 2.474365234375, 3.05517578125, 3.635986328125, 4.216796875, 4.797607421875, 5.37841796875, 5.959228515625, 6.5400390625, 7.120849609375, 7.70166015625, 8.282470703125, 8.86328125, 9.444091796875, 10.02490234375, 10.605712890625, 11.1865234375, 11.767333984375, 12.34814453125, 12.928955078125, 13.509765625, 14.090576171875, 14.67138671875, 15.252197265625, 15.8330078125, 16.413818359375, 16.99462890625, 17.575439453125, 18.15625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 7.0, 10.0, 17.0, 25.0, 34.0, 36.0, 68.0, 73.0, 83.0, 105.0, 72.0, 89.0, 72.0, 64.0, 68.0, 47.0, 45.0, 30.0, 14.0, 14.0, 6.0, 8.0, 7.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.505859375, -3.4100341796875, -3.314208984375, -3.2183837890625, -3.12255859375, -3.0267333984375, -2.930908203125, -2.8350830078125, -2.7392578125, -2.6434326171875, -2.547607421875, -2.4517822265625, -2.35595703125, -2.2601318359375, -2.164306640625, -2.0684814453125, -1.97265625, -1.8768310546875, -1.781005859375, -1.6851806640625, -1.58935546875, -1.4935302734375, -1.397705078125, -1.3018798828125, -1.2060546875, -1.1102294921875, -1.014404296875, -0.9185791015625, -0.82275390625, -0.7269287109375, -0.631103515625, -0.5352783203125, -0.439453125, -0.3436279296875, -0.247802734375, -0.1519775390625, -0.05615234375, 0.0396728515625, 0.135498046875, 0.2313232421875, 0.3271484375, 0.4229736328125, 0.518798828125, 0.6146240234375, 0.71044921875, 0.8062744140625, 0.902099609375, 0.9979248046875, 1.09375, 1.1895751953125, 1.285400390625, 1.3812255859375, 1.47705078125, 1.5728759765625, 1.668701171875, 1.7645263671875, 1.8603515625, 1.9561767578125, 2.052001953125, 2.1478271484375, 2.24365234375, 2.3394775390625, 2.435302734375, 2.5311279296875, 2.626953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 6.0, 15.0, 13.0, 23.0, 44.0, 58.0, 90.0, 133.0, 172.0, 248.0, 405.0, 717.0, 1161.0, 2222.0, 4920.0, 13536.0, 45617.0, 165341.0, 403871.0, 285200.0, 85612.0, 24264.0, 7777.0, 3092.0, 1609.0, 859.0, 522.0, 341.0, 213.0, 175.0, 88.0, 48.0, 49.0, 32.0, 20.0, 15.0, 8.0, 15.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.234375, -24.486572265625, -23.73876953125, -22.990966796875, -22.2431640625, -21.495361328125, -20.74755859375, -19.999755859375, -19.251953125, -18.504150390625, -17.75634765625, -17.008544921875, -16.2607421875, -15.512939453125, -14.76513671875, -14.017333984375, -13.26953125, -12.521728515625, -11.77392578125, -11.026123046875, -10.2783203125, -9.530517578125, -8.78271484375, -8.034912109375, -7.287109375, -6.539306640625, -5.79150390625, -5.043701171875, -4.2958984375, -3.548095703125, -2.80029296875, -2.052490234375, -1.3046875, -0.556884765625, 0.19091796875, 0.938720703125, 1.6865234375, 2.434326171875, 3.18212890625, 3.929931640625, 4.677734375, 5.425537109375, 6.17333984375, 6.921142578125, 7.6689453125, 8.416748046875, 9.16455078125, 9.912353515625, 10.66015625, 11.407958984375, 12.15576171875, 12.903564453125, 13.6513671875, 14.399169921875, 15.14697265625, 15.894775390625, 16.642578125, 17.390380859375, 18.13818359375, 18.885986328125, 19.6337890625, 20.381591796875, 21.12939453125, 21.877197265625, 22.625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 10.0, 10.0, 11.0, 18.0, 27.0, 32.0, 26.0, 34.0, 45.0, 38.0, 49.0, 49.0, 37.0, 52.0, 47.0, 50.0, 45.0, 47.0, 60.0, 47.0, 49.0, 44.0, 26.0, 26.0, 26.0, 15.0, 19.0, 12.0, 11.0, 7.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5625, -14.1451416015625, -13.727783203125, -13.3104248046875, -12.89306640625, -12.4757080078125, -12.058349609375, -11.6409912109375, -11.2236328125, -10.8062744140625, -10.388916015625, -9.9715576171875, -9.55419921875, -9.1368408203125, -8.719482421875, -8.3021240234375, -7.884765625, -7.4674072265625, -7.050048828125, -6.6326904296875, -6.21533203125, -5.7979736328125, -5.380615234375, -4.9632568359375, -4.5458984375, -4.1285400390625, -3.711181640625, -3.2938232421875, -2.87646484375, -2.4591064453125, -2.041748046875, -1.6243896484375, -1.20703125, -0.7896728515625, -0.372314453125, 0.0450439453125, 0.46240234375, 0.8797607421875, 1.297119140625, 1.7144775390625, 2.1318359375, 2.5491943359375, 2.966552734375, 3.3839111328125, 3.80126953125, 4.2186279296875, 4.635986328125, 5.0533447265625, 5.470703125, 5.8880615234375, 6.305419921875, 6.7227783203125, 7.14013671875, 7.5574951171875, 7.974853515625, 8.3922119140625, 8.8095703125, 9.2269287109375, 9.644287109375, 10.0616455078125, 10.47900390625, 10.8963623046875, 11.313720703125, 11.7310791015625, 12.1484375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 12.0, 14.0, 46.0, 97.0, 212.0, 520.0, 1563.0, 8117.0, 143068.0, 827432.0, 60673.0, 4914.0, 1118.0, 383.0, 183.0, 91.0, 32.0, 24.0, 16.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.8828125, -33.734375, -32.5859375, -31.4375, -30.2890625, -29.140625, -27.9921875, -26.84375, -25.6953125, -24.546875, -23.3984375, -22.25, -21.1015625, -19.953125, -18.8046875, -17.65625, -16.5078125, -15.359375, -14.2109375, -13.0625, -11.9140625, -10.765625, -9.6171875, -8.46875, -7.3203125, -6.171875, -5.0234375, -3.875, -2.7265625, -1.578125, -0.4296875, 0.71875, 1.8671875, 3.015625, 4.1640625, 5.3125, 6.4609375, 7.609375, 8.7578125, 9.90625, 11.0546875, 12.203125, 13.3515625, 14.5, 15.6484375, 16.796875, 17.9453125, 19.09375, 20.2421875, 21.390625, 22.5390625, 23.6875, 24.8359375, 25.984375, 27.1328125, 28.28125, 29.4296875, 30.578125, 31.7265625, 32.875, 34.0234375, 35.171875, 36.3203125, 37.46875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 10.0, 5.0, 12.0, 11.0, 14.0, 27.0, 35.0, 34.0, 61.0, 52.0, 84.0, 79.0, 100.0, 86.0, 71.0, 67.0, 49.0, 41.0, 36.0, 27.0, 15.0, 12.0, 8.0, 10.0, 10.0, 6.0, 7.0, 3.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.002193450927734375, -0.002135351300239563, -0.002077251672744751, -0.002019152045249939, -0.001961052417755127, -0.001902952790260315, -0.001844853162765503, -0.001786753535270691, -0.001728653907775879, -0.001670554280281067, -0.0016124546527862549, -0.0015543550252914429, -0.0014962553977966309, -0.0014381557703018188, -0.0013800561428070068, -0.0013219565153121948, -0.0012638568878173828, -0.0012057572603225708, -0.0011476576328277588, -0.0010895580053329468, -0.0010314583778381348, -0.0009733587503433228, -0.0009152591228485107, -0.0008571594953536987, -0.0007990598678588867, -0.0007409602403640747, -0.0006828606128692627, -0.0006247609853744507, -0.0005666613578796387, -0.0005085617303848267, -0.00045046210289001465, -0.00039236247539520264, -0.0003342628479003906, -0.0002761632204055786, -0.0002180635929107666, -0.0001599639654159546, -0.00010186433792114258, -4.3764710426330566e-05, 1.4334917068481445e-05, 7.243454456329346e-05, 0.00013053417205810547, 0.00018863379955291748, 0.0002467334270477295, 0.0003048330545425415, 0.0003629326820373535, 0.00042103230953216553, 0.00047913193702697754, 0.0005372315645217896, 0.0005953311920166016, 0.0006534308195114136, 0.0007115304470062256, 0.0007696300745010376, 0.0008277297019958496, 0.0008858293294906616, 0.0009439289569854736, 0.0010020285844802856, 0.0010601282119750977, 0.0011182278394699097, 0.0011763274669647217, 0.0012344270944595337, 0.0012925267219543457, 0.0013506263494491577, 0.0014087259769439697, 0.0014668256044387817, 0.0015249252319335938]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 6.0, 4.0, 9.0, 18.0, 19.0, 32.0, 37.0, 91.0, 163.0, 256.0, 518.0, 994.0, 2340.0, 6880.0, 29146.0, 188219.0, 601217.0, 179322.0, 28068.0, 6725.0, 2335.0, 1021.0, 474.0, 238.0, 168.0, 95.0, 64.0, 37.0, 28.0, 9.0, 11.0, 6.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.8603515625, -18.220703125, -17.5810546875, -16.94140625, -16.3017578125, -15.662109375, -15.0224609375, -14.3828125, -13.7431640625, -13.103515625, -12.4638671875, -11.82421875, -11.1845703125, -10.544921875, -9.9052734375, -9.265625, -8.6259765625, -7.986328125, -7.3466796875, -6.70703125, -6.0673828125, -5.427734375, -4.7880859375, -4.1484375, -3.5087890625, -2.869140625, -2.2294921875, -1.58984375, -0.9501953125, -0.310546875, 0.3291015625, 0.96875, 1.6083984375, 2.248046875, 2.8876953125, 3.52734375, 4.1669921875, 4.806640625, 5.4462890625, 6.0859375, 6.7255859375, 7.365234375, 8.0048828125, 8.64453125, 9.2841796875, 9.923828125, 10.5634765625, 11.203125, 11.8427734375, 12.482421875, 13.1220703125, 13.76171875, 14.4013671875, 15.041015625, 15.6806640625, 16.3203125, 16.9599609375, 17.599609375, 18.2392578125, 18.87890625, 19.5185546875, 20.158203125, 20.7978515625, 21.4375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 9.0, 11.0, 12.0, 22.0, 25.0, 36.0, 36.0, 63.0, 70.0, 93.0, 106.0, 89.0, 78.0, 50.0, 58.0, 52.0, 42.0, 38.0, 30.0, 26.0, 15.0, 8.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.5626220703125, -6.265869140625, -5.9691162109375, -5.67236328125, -5.3756103515625, -5.078857421875, -4.7821044921875, -4.4853515625, -4.1885986328125, -3.891845703125, -3.5950927734375, -3.29833984375, -3.0015869140625, -2.704833984375, -2.4080810546875, -2.111328125, -1.8145751953125, -1.517822265625, -1.2210693359375, -0.92431640625, -0.6275634765625, -0.330810546875, -0.0340576171875, 0.2626953125, 0.5594482421875, 0.856201171875, 1.1529541015625, 1.44970703125, 1.7464599609375, 2.043212890625, 2.3399658203125, 2.63671875, 2.9334716796875, 3.230224609375, 3.5269775390625, 3.82373046875, 4.1204833984375, 4.417236328125, 4.7139892578125, 5.0107421875, 5.3074951171875, 5.604248046875, 5.9010009765625, 6.19775390625, 6.4945068359375, 6.791259765625, 7.0880126953125, 7.384765625, 7.6815185546875, 7.978271484375, 8.2750244140625, 8.57177734375, 8.8685302734375, 9.165283203125, 9.4620361328125, 9.7587890625, 10.0555419921875, 10.352294921875, 10.6490478515625, 10.94580078125, 11.2425537109375, 11.539306640625, 11.8360595703125, 12.1328125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 17.0, 22.0, 53.0, 77.0, 134.0, 172.0, 169.0, 140.0, 89.0, 56.0, 31.0, 10.0, 10.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.27069091796875, -200.38583374023438, -194.5009765625, -188.61611938476562, -182.73126220703125, -176.84640502929688, -170.9615478515625, -165.0767059326172, -159.1918487548828, -153.30699157714844, -147.42213439941406, -141.5372772216797, -135.6524200439453, -129.767578125, -123.8827133178711, -117.99786376953125, -112.11299896240234, -106.22814178466797, -100.3432846069336, -94.45843505859375, -88.57357788085938, -82.688720703125, -76.80386352539062, -70.91900634765625, -65.03414916992188, -59.1492919921875, -53.26443862915039, -47.379581451416016, -41.494728088378906, -35.60987091064453, -29.725013732910156, -23.840160369873047, -17.955307006835938, -12.070451736450195, -6.185595512390137, -0.3007392883300781, 5.584115982055664, 11.468971252441406, 17.35382843017578, 23.23868179321289, 29.123538970947266, 35.00839614868164, 40.89324951171875, 46.778106689453125, 52.6629638671875, 58.54781723022461, 64.43267822265625, 70.3175277709961, 76.20238494873047, 82.08724212646484, 87.97209930419922, 93.85694885253906, 99.74180603027344, 105.62666320800781, 111.51152038574219, 117.39637756347656, 123.28123474121094, 129.1660919189453, 135.0509490966797, 140.93580627441406, 146.82066345214844, 152.70550537109375, 158.59036254882812, 164.4752197265625, 170.36007690429688]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 8.0, 12.0, 10.0, 10.0, 29.0, 30.0, 19.0, 27.0, 28.0, 43.0, 47.0, 38.0, 46.0, 56.0, 51.0, 55.0, 55.0, 60.0, 62.0, 50.0, 40.0, 40.0, 30.0, 36.0, 21.0, 27.0, 21.0, 17.0, 4.0, 7.0, 8.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-106.69535827636719, -103.6173324584961, -100.53931427001953, -97.46128845214844, -94.38327026367188, -91.30524444580078, -88.22721862792969, -85.14920043945312, -82.07118225097656, -78.99315643310547, -75.9151382446289, -72.83711242675781, -69.75909423828125, -66.68106842041016, -63.60304641723633, -60.5250244140625, -57.446998596191406, -54.36897659301758, -51.29095458984375, -48.212928771972656, -45.134910583496094, -42.056884765625, -38.97886276245117, -35.900840759277344, -32.822818756103516, -29.744796752929688, -26.66677474975586, -23.5887508392334, -20.51072883605957, -17.432706832885742, -14.354682922363281, -11.276660919189453, -8.198646545410156, -5.12062406539917, -2.0426015853881836, 1.035421371459961, 4.113443374633789, 7.191465377807617, 10.269489288330078, 13.347511291503906, 16.425533294677734, 19.503555297851562, 22.58157730102539, 25.65960121154785, 28.73762321472168, 31.815645217895508, 34.89366912841797, 37.9716911315918, 41.049713134765625, 44.12773513793945, 47.20575714111328, 50.283782958984375, 53.36180114746094, 56.43982696533203, 59.51784896850586, 62.59587097167969, 65.67388916015625, 68.75191497802734, 71.8299331665039, 74.907958984375, 77.98597717285156, 81.06400299072266, 84.14202880859375, 87.22004699707031, 90.2980728149414]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 8.0, 9.0, 11.0, 10.0, 12.0, 23.0, 32.0, 50.0, 62.0, 130.0, 194.0, 472.0, 1226.0, 3736.0, 14035.0, 83615.0, 3769360.0, 284324.0, 27181.0, 6395.0, 2040.0, 703.0, 295.0, 149.0, 71.0, 42.0, 27.0, 23.0, 15.0, 12.0, 8.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-68.0625, -66.4306640625, -64.798828125, -63.1669921875, -61.53515625, -59.9033203125, -58.271484375, -56.6396484375, -55.0078125, -53.3759765625, -51.744140625, -50.1123046875, -48.48046875, -46.8486328125, -45.216796875, -43.5849609375, -41.953125, -40.3212890625, -38.689453125, -37.0576171875, -35.42578125, -33.7939453125, -32.162109375, -30.5302734375, -28.8984375, -27.2666015625, -25.634765625, -24.0029296875, -22.37109375, -20.7392578125, -19.107421875, -17.4755859375, -15.84375, -14.2119140625, -12.580078125, -10.9482421875, -9.31640625, -7.6845703125, -6.052734375, -4.4208984375, -2.7890625, -1.1572265625, 0.474609375, 2.1064453125, 3.73828125, 5.3701171875, 7.001953125, 8.6337890625, 10.265625, 11.8974609375, 13.529296875, 15.1611328125, 16.79296875, 18.4248046875, 20.056640625, 21.6884765625, 23.3203125, 24.9521484375, 26.583984375, 28.2158203125, 29.84765625, 31.4794921875, 33.111328125, 34.7431640625, 36.375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 6.0, 11.0, 9.0, 8.0, 15.0, 10.0, 20.0, 30.0, 26.0, 31.0, 31.0, 46.0, 40.0, 61.0, 53.0, 46.0, 60.0, 51.0, 57.0, 40.0, 55.0, 35.0, 39.0, 39.0, 39.0, 30.0, 24.0, 24.0, 12.0, 15.0, 6.0, 14.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.9453125, -2.8698883056640625, -2.794464111328125, -2.7190399169921875, -2.64361572265625, -2.5681915283203125, -2.492767333984375, -2.4173431396484375, -2.3419189453125, -2.2664947509765625, -2.191070556640625, -2.1156463623046875, -2.04022216796875, -1.9647979736328125, -1.889373779296875, -1.8139495849609375, -1.738525390625, -1.6631011962890625, -1.587677001953125, -1.5122528076171875, -1.43682861328125, -1.3614044189453125, -1.285980224609375, -1.2105560302734375, -1.1351318359375, -1.0597076416015625, -0.984283447265625, -0.9088592529296875, -0.83343505859375, -0.7580108642578125, -0.682586669921875, -0.6071624755859375, -0.53173828125, -0.4563140869140625, -0.380889892578125, -0.3054656982421875, -0.23004150390625, -0.1546173095703125, -0.079193115234375, -0.0037689208984375, 0.0716552734375, 0.1470794677734375, 0.222503662109375, 0.2979278564453125, 0.37335205078125, 0.4487762451171875, 0.524200439453125, 0.5996246337890625, 0.675048828125, 0.7504730224609375, 0.825897216796875, 0.9013214111328125, 0.97674560546875, 1.0521697998046875, 1.127593994140625, 1.2030181884765625, 1.2784423828125, 1.3538665771484375, 1.429290771484375, 1.5047149658203125, 1.58013916015625, 1.6555633544921875, 1.730987548828125, 1.8064117431640625, 1.8818359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 12.0, 15.0, 29.0, 39.0, 58.0, 97.0, 138.0, 293.0, 508.0, 913.0, 1727.0, 3637.0, 8416.0, 23120.0, 82072.0, 527860.0, 3187616.0, 270410.0, 55532.0, 17730.0, 6959.0, 3220.0, 1599.0, 876.0, 552.0, 281.0, 208.0, 124.0, 54.0, 56.0, 37.0, 23.0, 16.0, 9.0, 9.0, 9.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-29.6875, -28.8232421875, -27.958984375, -27.0947265625, -26.23046875, -25.3662109375, -24.501953125, -23.6376953125, -22.7734375, -21.9091796875, -21.044921875, -20.1806640625, -19.31640625, -18.4521484375, -17.587890625, -16.7236328125, -15.859375, -14.9951171875, -14.130859375, -13.2666015625, -12.40234375, -11.5380859375, -10.673828125, -9.8095703125, -8.9453125, -8.0810546875, -7.216796875, -6.3525390625, -5.48828125, -4.6240234375, -3.759765625, -2.8955078125, -2.03125, -1.1669921875, -0.302734375, 0.5615234375, 1.42578125, 2.2900390625, 3.154296875, 4.0185546875, 4.8828125, 5.7470703125, 6.611328125, 7.4755859375, 8.33984375, 9.2041015625, 10.068359375, 10.9326171875, 11.796875, 12.6611328125, 13.525390625, 14.3896484375, 15.25390625, 16.1181640625, 16.982421875, 17.8466796875, 18.7109375, 19.5751953125, 20.439453125, 21.3037109375, 22.16796875, 23.0322265625, 23.896484375, 24.7607421875, 25.625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 4.0, 8.0, 16.0, 18.0, 24.0, 34.0, 42.0, 81.0, 112.0, 186.0, 333.0, 819.0, 1229.0, 444.0, 237.0, 139.0, 95.0, 58.0, 36.0, 42.0, 20.0, 22.0, 14.0, 6.0, 10.0, 5.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.3087158203125, -5.113525390625, -4.9183349609375, -4.72314453125, -4.5279541015625, -4.332763671875, -4.1375732421875, -3.9423828125, -3.7471923828125, -3.552001953125, -3.3568115234375, -3.16162109375, -2.9664306640625, -2.771240234375, -2.5760498046875, -2.380859375, -2.1856689453125, -1.990478515625, -1.7952880859375, -1.60009765625, -1.4049072265625, -1.209716796875, -1.0145263671875, -0.8193359375, -0.6241455078125, -0.428955078125, -0.2337646484375, -0.03857421875, 0.1566162109375, 0.351806640625, 0.5469970703125, 0.7421875, 0.9373779296875, 1.132568359375, 1.3277587890625, 1.52294921875, 1.7181396484375, 1.913330078125, 2.1085205078125, 2.3037109375, 2.4989013671875, 2.694091796875, 2.8892822265625, 3.08447265625, 3.2796630859375, 3.474853515625, 3.6700439453125, 3.865234375, 4.0604248046875, 4.255615234375, 4.4508056640625, 4.64599609375, 4.8411865234375, 5.036376953125, 5.2315673828125, 5.4267578125, 5.6219482421875, 5.817138671875, 6.0123291015625, 6.20751953125, 6.4027099609375, 6.597900390625, 6.7930908203125, 6.98828125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 6.0, 11.0, 21.0, 36.0, 81.0, 119.0, 172.0, 195.0, 148.0, 85.0, 59.0, 23.0, 19.0, 7.0, 10.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.731101989746094, -35.66511535644531, -33.59912872314453, -31.533143997192383, -29.4671573638916, -27.40117073059082, -25.335186004638672, -23.26919937133789, -21.20321273803711, -19.137226104736328, -17.071239471435547, -15.005254745483398, -12.939268112182617, -10.873281478881836, -8.807295799255371, -6.741310119628906, -4.675323486328125, -2.609337329864502, -0.5433511734008789, 1.5226349830627441, 3.588621139526367, 5.654607772827148, 7.720593452453613, 9.786579132080078, 11.85256576538086, 13.91855239868164, 15.984538078308105, 18.05052375793457, 20.11651039123535, 22.182497024536133, 24.24848175048828, 26.314468383789062, 28.380447387695312, 30.446434020996094, 32.512420654296875, 34.578407287597656, 36.64439392089844, 38.71038055419922, 40.776363372802734, 42.842350006103516, 44.9083366394043, 46.97432327270508, 49.04030990600586, 51.10629653930664, 53.172279357910156, 55.23826599121094, 57.30425262451172, 59.3702392578125, 61.43622589111328, 63.50221252441406, 65.56819915771484, 67.63418579101562, 69.7001724243164, 71.76615905761719, 73.83214569091797, 75.89813232421875, 77.964111328125, 80.03009796142578, 82.09608459472656, 84.16207122802734, 86.22805786132812, 88.2940444946289, 90.36003112792969, 92.42601013183594, 94.49200439453125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 9.0, 14.0, 19.0, 23.0, 33.0, 29.0, 41.0, 48.0, 57.0, 60.0, 64.0, 81.0, 66.0, 63.0, 51.0, 51.0, 55.0, 45.0, 46.0, 41.0, 28.0, 23.0, 16.0, 11.0, 12.0, 10.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.18926239013672, -40.104164123535156, -39.01906204223633, -37.933963775634766, -36.84886169433594, -35.763763427734375, -34.67866134643555, -33.593563079833984, -32.508460998535156, -31.42336082458496, -30.338260650634766, -29.25316047668457, -28.168060302734375, -27.082962036132812, -25.997861862182617, -24.912761688232422, -23.82766342163086, -22.742563247680664, -21.65746307373047, -20.572362899780273, -19.487262725830078, -18.402164459228516, -17.31706428527832, -16.231964111328125, -15.14686393737793, -14.061763763427734, -12.976663589477539, -11.89156436920166, -10.806464195251465, -9.72136402130127, -8.63626480102539, -7.551164627075195, -6.466068267822266, -5.38096809387207, -4.295868396759033, -3.210768461227417, -2.125668525695801, -1.0405683517456055, 0.04453134536743164, 1.1296310424804688, 2.214731216430664, 3.2998311519622803, 4.3849310874938965, 5.470030784606934, 6.555130958557129, 7.640231132507324, 8.725330352783203, 9.810430526733398, 10.895530700683594, 11.980630874633789, 13.065731048583984, 14.150830268859863, 15.235930442810059, 16.321029663085938, 17.406129837036133, 18.491230010986328, 19.576330184936523, 20.66143035888672, 21.746530532836914, 22.83163070678711, 23.916728973388672, 25.0018310546875, 26.086929321289062, 27.172029495239258, 28.257129669189453]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 9.0, 9.0, 10.0, 14.0, 19.0, 29.0, 33.0, 43.0, 75.0, 108.0, 157.0, 233.0, 364.0, 616.0, 1026.0, 1845.0, 3269.0, 6709.0, 14389.0, 31663.0, 70512.0, 146909.0, 255062.0, 248845.0, 140850.0, 67712.0, 30357.0, 13731.0, 6346.0, 3225.0, 1695.0, 992.0, 578.0, 366.0, 244.0, 154.0, 105.0, 78.0, 52.0, 36.0, 20.0, 19.0, 15.0, 8.0, 7.0, 5.0, 2.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.734375, -12.3360595703125, -11.937744140625, -11.5394287109375, -11.14111328125, -10.7427978515625, -10.344482421875, -9.9461669921875, -9.5478515625, -9.1495361328125, -8.751220703125, -8.3529052734375, -7.95458984375, -7.5562744140625, -7.157958984375, -6.7596435546875, -6.361328125, -5.9630126953125, -5.564697265625, -5.1663818359375, -4.76806640625, -4.3697509765625, -3.971435546875, -3.5731201171875, -3.1748046875, -2.7764892578125, -2.378173828125, -1.9798583984375, -1.58154296875, -1.1832275390625, -0.784912109375, -0.3865966796875, 0.01171875, 0.4100341796875, 0.808349609375, 1.2066650390625, 1.60498046875, 2.0032958984375, 2.401611328125, 2.7999267578125, 3.1982421875, 3.5965576171875, 3.994873046875, 4.3931884765625, 4.79150390625, 5.1898193359375, 5.588134765625, 5.9864501953125, 6.384765625, 6.7830810546875, 7.181396484375, 7.5797119140625, 7.97802734375, 8.3763427734375, 8.774658203125, 9.1729736328125, 9.5712890625, 9.9696044921875, 10.367919921875, 10.7662353515625, 11.16455078125, 11.5628662109375, 11.961181640625, 12.3594970703125, 12.7578125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 6.0, 10.0, 15.0, 14.0, 23.0, 23.0, 35.0, 40.0, 44.0, 54.0, 61.0, 59.0, 52.0, 78.0, 63.0, 50.0, 63.0, 44.0, 50.0, 47.0, 32.0, 30.0, 23.0, 20.0, 15.0, 17.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.13671875, -3.051513671875, -2.96630859375, -2.881103515625, -2.7958984375, -2.710693359375, -2.62548828125, -2.540283203125, -2.455078125, -2.369873046875, -2.28466796875, -2.199462890625, -2.1142578125, -2.029052734375, -1.94384765625, -1.858642578125, -1.7734375, -1.688232421875, -1.60302734375, -1.517822265625, -1.4326171875, -1.347412109375, -1.26220703125, -1.177001953125, -1.091796875, -1.006591796875, -0.92138671875, -0.836181640625, -0.7509765625, -0.665771484375, -0.58056640625, -0.495361328125, -0.41015625, -0.324951171875, -0.23974609375, -0.154541015625, -0.0693359375, 0.015869140625, 0.10107421875, 0.186279296875, 0.271484375, 0.356689453125, 0.44189453125, 0.527099609375, 0.6123046875, 0.697509765625, 0.78271484375, 0.867919921875, 0.953125, 1.038330078125, 1.12353515625, 1.208740234375, 1.2939453125, 1.379150390625, 1.46435546875, 1.549560546875, 1.634765625, 1.719970703125, 1.80517578125, 1.890380859375, 1.9755859375, 2.060791015625, 2.14599609375, 2.231201171875, 2.31640625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 8.0, 18.0, 19.0, 42.0, 34.0, 56.0, 80.0, 91.0, 139.0, 171.0, 262.0, 338.0, 545.0, 816.0, 1415.0, 2554.0, 5199.0, 11915.0, 29149.0, 73051.0, 173344.0, 307364.0, 245502.0, 114596.0, 46579.0, 18538.0, 8037.0, 3572.0, 1863.0, 1043.0, 666.0, 434.0, 271.0, 227.0, 143.0, 133.0, 79.0, 65.0, 39.0, 34.0, 28.0, 18.0, 18.0, 11.0, 10.0, 11.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0], "bins": [-13.921875, -13.5093994140625, -13.096923828125, -12.6844482421875, -12.27197265625, -11.8594970703125, -11.447021484375, -11.0345458984375, -10.6220703125, -10.2095947265625, -9.797119140625, -9.3846435546875, -8.97216796875, -8.5596923828125, -8.147216796875, -7.7347412109375, -7.322265625, -6.9097900390625, -6.497314453125, -6.0848388671875, -5.67236328125, -5.2598876953125, -4.847412109375, -4.4349365234375, -4.0224609375, -3.6099853515625, -3.197509765625, -2.7850341796875, -2.37255859375, -1.9600830078125, -1.547607421875, -1.1351318359375, -0.72265625, -0.3101806640625, 0.102294921875, 0.5147705078125, 0.92724609375, 1.3397216796875, 1.752197265625, 2.1646728515625, 2.5771484375, 2.9896240234375, 3.402099609375, 3.8145751953125, 4.22705078125, 4.6395263671875, 5.052001953125, 5.4644775390625, 5.876953125, 6.2894287109375, 6.701904296875, 7.1143798828125, 7.52685546875, 7.9393310546875, 8.351806640625, 8.7642822265625, 9.1767578125, 9.5892333984375, 10.001708984375, 10.4141845703125, 10.82666015625, 11.2391357421875, 11.651611328125, 12.0640869140625, 12.4765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 11.0, 8.0, 6.0, 8.0, 14.0, 13.0, 24.0, 17.0, 19.0, 31.0, 22.0, 23.0, 28.0, 33.0, 42.0, 35.0, 39.0, 35.0, 32.0, 48.0, 35.0, 41.0, 27.0, 50.0, 43.0, 40.0, 40.0, 41.0, 23.0, 34.0, 23.0, 18.0, 14.0, 17.0, 15.0, 10.0, 7.0, 3.0, 2.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8260498046875, -8.519287109375, -8.2125244140625, -7.90576171875, -7.5989990234375, -7.292236328125, -6.9854736328125, -6.6787109375, -6.3719482421875, -6.065185546875, -5.7584228515625, -5.45166015625, -5.1448974609375, -4.838134765625, -4.5313720703125, -4.224609375, -3.9178466796875, -3.611083984375, -3.3043212890625, -2.99755859375, -2.6907958984375, -2.384033203125, -2.0772705078125, -1.7705078125, -1.4637451171875, -1.156982421875, -0.8502197265625, -0.54345703125, -0.2366943359375, 0.070068359375, 0.3768310546875, 0.68359375, 0.9903564453125, 1.297119140625, 1.6038818359375, 1.91064453125, 2.2174072265625, 2.524169921875, 2.8309326171875, 3.1376953125, 3.4444580078125, 3.751220703125, 4.0579833984375, 4.36474609375, 4.6715087890625, 4.978271484375, 5.2850341796875, 5.591796875, 5.8985595703125, 6.205322265625, 6.5120849609375, 6.81884765625, 7.1256103515625, 7.432373046875, 7.7391357421875, 8.0458984375, 8.3526611328125, 8.659423828125, 8.9661865234375, 9.27294921875, 9.5797119140625, 9.886474609375, 10.1932373046875, 10.5]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 5.0, 9.0, 8.0, 20.0, 22.0, 29.0, 46.0, 56.0, 82.0, 127.0, 218.0, 369.0, 738.0, 1640.0, 4698.0, 16792.0, 84487.0, 449611.0, 397034.0, 70501.0, 14664.0, 4172.0, 1614.0, 655.0, 332.0, 211.0, 133.0, 81.0, 53.0, 41.0, 25.0, 23.0, 13.0, 13.0, 6.0, 6.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.59375, -12.2333984375, -11.873046875, -11.5126953125, -11.15234375, -10.7919921875, -10.431640625, -10.0712890625, -9.7109375, -9.3505859375, -8.990234375, -8.6298828125, -8.26953125, -7.9091796875, -7.548828125, -7.1884765625, -6.828125, -6.4677734375, -6.107421875, -5.7470703125, -5.38671875, -5.0263671875, -4.666015625, -4.3056640625, -3.9453125, -3.5849609375, -3.224609375, -2.8642578125, -2.50390625, -2.1435546875, -1.783203125, -1.4228515625, -1.0625, -0.7021484375, -0.341796875, 0.0185546875, 0.37890625, 0.7392578125, 1.099609375, 1.4599609375, 1.8203125, 2.1806640625, 2.541015625, 2.9013671875, 3.26171875, 3.6220703125, 3.982421875, 4.3427734375, 4.703125, 5.0634765625, 5.423828125, 5.7841796875, 6.14453125, 6.5048828125, 6.865234375, 7.2255859375, 7.5859375, 7.9462890625, 8.306640625, 8.6669921875, 9.02734375, 9.3876953125, 9.748046875, 10.1083984375, 10.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 9.0, 11.0, 12.0, 17.0, 18.0, 38.0, 39.0, 46.0, 60.0, 67.0, 91.0, 90.0, 110.0, 75.0, 58.0, 63.0, 40.0, 33.0, 26.0, 21.0, 17.0, 14.0, 8.0, 6.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012025833129882812, -0.0011607706546783447, -0.0011189579963684082, -0.0010771453380584717, -0.0010353326797485352, -0.0009935200214385986, -0.0009517073631286621, -0.0009098947048187256, -0.0008680820465087891, -0.0008262693881988525, -0.000784456729888916, -0.0007426440715789795, -0.000700831413269043, -0.0006590187549591064, -0.0006172060966491699, -0.0005753934383392334, -0.0005335807800292969, -0.0004917681217193604, -0.00044995546340942383, -0.0004081428050994873, -0.0003663301467895508, -0.00032451748847961426, -0.00028270483016967773, -0.0002408921718597412, -0.0001990795135498047, -0.00015726685523986816, -0.00011545419692993164, -7.364153861999512e-05, -3.1828880310058594e-05, 9.98377799987793e-06, 5.179643630981445e-05, 9.360909461975098e-05, 0.0001354217529296875, 0.00017723441123962402, 0.00021904706954956055, 0.00026085972785949707, 0.0003026723861694336, 0.0003444850444793701, 0.00038629770278930664, 0.00042811036109924316, 0.0004699230194091797, 0.0005117356777191162, 0.0005535483360290527, 0.0005953609943389893, 0.0006371736526489258, 0.0006789863109588623, 0.0007207989692687988, 0.0007626116275787354, 0.0008044242858886719, 0.0008462369441986084, 0.0008880496025085449, 0.0009298622608184814, 0.000971674919128418, 0.0010134875774383545, 0.001055300235748291, 0.0010971128940582275, 0.001138925552368164, 0.0011807382106781006, 0.0012225508689880371, 0.0012643635272979736, 0.0013061761856079102, 0.0013479888439178467, 0.0013898015022277832, 0.0014316141605377197, 0.0014734268188476562]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 3.0, 4.0, 6.0, 8.0, 17.0, 16.0, 23.0, 36.0, 48.0, 75.0, 123.0, 165.0, 320.0, 589.0, 1089.0, 2268.0, 5623.0, 16530.0, 61690.0, 279208.0, 482501.0, 146995.0, 33672.0, 10128.0, 3749.0, 1669.0, 837.0, 449.0, 247.0, 153.0, 97.0, 57.0, 55.0, 34.0, 23.0, 16.0, 8.0, 6.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.375, -10.0723876953125, -9.769775390625, -9.4671630859375, -9.16455078125, -8.8619384765625, -8.559326171875, -8.2567138671875, -7.9541015625, -7.6514892578125, -7.348876953125, -7.0462646484375, -6.74365234375, -6.4410400390625, -6.138427734375, -5.8358154296875, -5.533203125, -5.2305908203125, -4.927978515625, -4.6253662109375, -4.32275390625, -4.0201416015625, -3.717529296875, -3.4149169921875, -3.1123046875, -2.8096923828125, -2.507080078125, -2.2044677734375, -1.90185546875, -1.5992431640625, -1.296630859375, -0.9940185546875, -0.69140625, -0.3887939453125, -0.086181640625, 0.2164306640625, 0.51904296875, 0.8216552734375, 1.124267578125, 1.4268798828125, 1.7294921875, 2.0321044921875, 2.334716796875, 2.6373291015625, 2.93994140625, 3.2425537109375, 3.545166015625, 3.8477783203125, 4.150390625, 4.4530029296875, 4.755615234375, 5.0582275390625, 5.36083984375, 5.6634521484375, 5.966064453125, 6.2686767578125, 6.5712890625, 6.8739013671875, 7.176513671875, 7.4791259765625, 7.78173828125, 8.0843505859375, 8.386962890625, 8.6895751953125, 8.9921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 5.0, 8.0, 7.0, 5.0, 11.0, 15.0, 22.0, 16.0, 26.0, 39.0, 38.0, 48.0, 73.0, 63.0, 63.0, 64.0, 62.0, 60.0, 78.0, 50.0, 50.0, 40.0, 32.0, 20.0, 18.0, 16.0, 14.0, 10.0, 10.0, 7.0, 9.0, 6.0, 6.0, 0.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.63421630859375, -4.4793701171875, -4.32452392578125, -4.169677734375, -4.01483154296875, -3.8599853515625, -3.70513916015625, -3.55029296875, -3.39544677734375, -3.2406005859375, -3.08575439453125, -2.930908203125, -2.77606201171875, -2.6212158203125, -2.46636962890625, -2.3115234375, -2.15667724609375, -2.0018310546875, -1.84698486328125, -1.692138671875, -1.53729248046875, -1.3824462890625, -1.22760009765625, -1.07275390625, -0.91790771484375, -0.7630615234375, -0.60821533203125, -0.453369140625, -0.29852294921875, -0.1436767578125, 0.01116943359375, 0.166015625, 0.32086181640625, 0.4757080078125, 0.63055419921875, 0.785400390625, 0.94024658203125, 1.0950927734375, 1.24993896484375, 1.40478515625, 1.55963134765625, 1.7144775390625, 1.86932373046875, 2.024169921875, 2.17901611328125, 2.3338623046875, 2.48870849609375, 2.6435546875, 2.79840087890625, 2.9532470703125, 3.10809326171875, 3.262939453125, 3.41778564453125, 3.5726318359375, 3.72747802734375, 3.88232421875, 4.03717041015625, 4.1920166015625, 4.34686279296875, 4.501708984375, 4.65655517578125, 4.8114013671875, 4.96624755859375, 5.12109375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 5.0, 5.0, 9.0, 25.0, 32.0, 45.0, 67.0, 81.0, 112.0, 145.0, 114.0, 92.0, 97.0, 47.0, 44.0, 26.0, 23.0, 14.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-127.5039291381836, -123.97856903076172, -120.45320129394531, -116.92784118652344, -113.40248107910156, -109.87712097167969, -106.35176086425781, -102.8263931274414, -99.30103302001953, -95.77567291259766, -92.25030517578125, -88.72494506835938, -85.1995849609375, -81.67422485351562, -78.14886474609375, -74.62349700927734, -71.09813690185547, -67.5727767944336, -64.04740905761719, -60.52204895019531, -56.99668884277344, -53.47132873535156, -49.94596481323242, -46.42060089111328, -42.895240783691406, -39.36988067626953, -35.84451675415039, -32.31915283203125, -28.793792724609375, -25.268430709838867, -21.74306869506836, -18.21770668029785, -14.692344665527344, -11.166982650756836, -7.641620635986328, -4.11625862121582, -0.5908966064453125, 2.9344654083251953, 6.459827423095703, 9.985189437866211, 13.510551452636719, 17.035913467407227, 20.561275482177734, 24.086637496948242, 27.61199951171875, 31.137361526489258, 34.662723541259766, 38.188087463378906, 41.71344757080078, 45.238807678222656, 48.7641716003418, 52.28953552246094, 55.81489562988281, 59.34025573730469, 62.86561965942383, 66.39098358154297, 69.91634368896484, 73.44170379638672, 76.96707153320312, 80.492431640625, 84.01779174804688, 87.54315185546875, 91.06851196289062, 94.59387969970703, 98.1192398071289]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 8.0, 7.0, 5.0, 5.0, 8.0, 15.0, 9.0, 14.0, 20.0, 19.0, 14.0, 32.0, 26.0, 39.0, 40.0, 36.0, 47.0, 50.0, 46.0, 44.0, 37.0, 51.0, 49.0, 45.0, 41.0, 40.0, 38.0, 37.0, 24.0, 30.0, 26.0, 16.0, 8.0, 13.0, 9.0, 12.0, 5.0, 8.0, 6.0, 7.0, 3.0, 1.0, 3.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-74.10862731933594, -72.0201187133789, -69.93160247802734, -67.84309387207031, -65.75458526611328, -63.666072845458984, -61.57756042480469, -59.489051818847656, -57.40053939819336, -55.31202697753906, -53.22351837158203, -51.135005950927734, -49.04649353027344, -46.957984924316406, -44.86947250366211, -42.78096008300781, -40.69245147705078, -38.603939056396484, -36.51543045043945, -34.426918029785156, -32.338409423828125, -30.249897003173828, -28.16138458251953, -26.072874069213867, -23.984363555908203, -21.89585304260254, -19.807342529296875, -17.718830108642578, -15.630319595336914, -13.54180908203125, -11.45329761505127, -9.364786148071289, -7.276271820068359, -5.187760829925537, -3.099249839782715, -1.0107388496398926, 1.0777721405029297, 3.1662826538085938, 5.254794120788574, 7.343305587768555, 9.431816101074219, 11.520326614379883, 13.608838081359863, 15.697349548339844, 17.785860061645508, 19.874370574951172, 21.96288299560547, 24.051393508911133, 26.139904022216797, 28.22841453552246, 30.316925048828125, 32.40543746948242, 34.49394989013672, 36.58245849609375, 38.67097091674805, 40.759483337402344, 42.847991943359375, 44.93650436401367, 47.0250129699707, 49.113525390625, 51.20203399658203, 53.29054641723633, 55.379058837890625, 57.467567443847656, 59.55607986450195]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 12.0, 14.0, 15.0, 24.0, 29.0, 61.0, 94.0, 137.0, 192.0, 353.0, 721.0, 1340.0, 2843.0, 6856.0, 19921.0, 81763.0, 2975604.0, 1009488.0, 65868.0, 17144.0, 6195.0, 2655.0, 1310.0, 727.0, 364.0, 210.0, 121.0, 66.0, 53.0, 32.0, 19.0, 12.0, 12.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.24951171875, -17.5458984375, -16.84228515625, -16.138671875, -15.43505859375, -14.7314453125, -14.02783203125, -13.32421875, -12.62060546875, -11.9169921875, -11.21337890625, -10.509765625, -9.80615234375, -9.1025390625, -8.39892578125, -7.6953125, -6.99169921875, -6.2880859375, -5.58447265625, -4.880859375, -4.17724609375, -3.4736328125, -2.77001953125, -2.06640625, -1.36279296875, -0.6591796875, 0.04443359375, 0.748046875, 1.45166015625, 2.1552734375, 2.85888671875, 3.5625, 4.26611328125, 4.9697265625, 5.67333984375, 6.376953125, 7.08056640625, 7.7841796875, 8.48779296875, 9.19140625, 9.89501953125, 10.5986328125, 11.30224609375, 12.005859375, 12.70947265625, 13.4130859375, 14.11669921875, 14.8203125, 15.52392578125, 16.2275390625, 16.93115234375, 17.634765625, 18.33837890625, 19.0419921875, 19.74560546875, 20.44921875, 21.15283203125, 21.8564453125, 22.56005859375, 23.263671875, 23.96728515625, 24.6708984375, 25.37451171875, 26.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 8.0, 15.0, 14.0, 17.0, 27.0, 36.0, 32.0, 38.0, 35.0, 44.0, 50.0, 58.0, 52.0, 49.0, 57.0, 48.0, 52.0, 40.0, 47.0, 33.0, 33.0, 36.0, 22.0, 22.0, 32.0, 20.0, 11.0, 9.0, 18.0, 7.0, 9.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.3984375, -2.326812744140625, -2.25518798828125, -2.183563232421875, -2.1119384765625, -2.040313720703125, -1.96868896484375, -1.897064208984375, -1.825439453125, -1.753814697265625, -1.68218994140625, -1.610565185546875, -1.5389404296875, -1.467315673828125, -1.39569091796875, -1.324066162109375, -1.25244140625, -1.180816650390625, -1.10919189453125, -1.037567138671875, -0.9659423828125, -0.894317626953125, -0.82269287109375, -0.751068115234375, -0.679443359375, -0.607818603515625, -0.53619384765625, -0.464569091796875, -0.3929443359375, -0.321319580078125, -0.24969482421875, -0.178070068359375, -0.1064453125, -0.034820556640625, 0.03680419921875, 0.108428955078125, 0.1800537109375, 0.251678466796875, 0.32330322265625, 0.394927978515625, 0.466552734375, 0.538177490234375, 0.60980224609375, 0.681427001953125, 0.7530517578125, 0.824676513671875, 0.89630126953125, 0.967926025390625, 1.03955078125, 1.111175537109375, 1.18280029296875, 1.254425048828125, 1.3260498046875, 1.397674560546875, 1.46929931640625, 1.540924072265625, 1.612548828125, 1.684173583984375, 1.75579833984375, 1.827423095703125, 1.8990478515625, 1.970672607421875, 2.04229736328125, 2.113922119140625, 2.185546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 7.0, 9.0, 13.0, 18.0, 35.0, 45.0, 77.0, 124.0, 211.0, 307.0, 532.0, 920.0, 1913.0, 4306.0, 10687.0, 31239.0, 122346.0, 1564899.0, 2272359.0, 131818.0, 32805.0, 11078.0, 4298.0, 1905.0, 937.0, 524.0, 330.0, 168.0, 119.0, 83.0, 45.0, 36.0, 28.0, 13.0, 12.0, 10.0, 7.0, 8.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.171875, -17.586181640625, -17.00048828125, -16.414794921875, -15.8291015625, -15.243408203125, -14.65771484375, -14.072021484375, -13.486328125, -12.900634765625, -12.31494140625, -11.729248046875, -11.1435546875, -10.557861328125, -9.97216796875, -9.386474609375, -8.80078125, -8.215087890625, -7.62939453125, -7.043701171875, -6.4580078125, -5.872314453125, -5.28662109375, -4.700927734375, -4.115234375, -3.529541015625, -2.94384765625, -2.358154296875, -1.7724609375, -1.186767578125, -0.60107421875, -0.015380859375, 0.5703125, 1.156005859375, 1.74169921875, 2.327392578125, 2.9130859375, 3.498779296875, 4.08447265625, 4.670166015625, 5.255859375, 5.841552734375, 6.42724609375, 7.012939453125, 7.5986328125, 8.184326171875, 8.77001953125, 9.355712890625, 9.94140625, 10.527099609375, 11.11279296875, 11.698486328125, 12.2841796875, 12.869873046875, 13.45556640625, 14.041259765625, 14.626953125, 15.212646484375, 15.79833984375, 16.384033203125, 16.9697265625, 17.555419921875, 18.14111328125, 18.726806640625, 19.3125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 10.0, 9.0, 15.0, 22.0, 36.0, 50.0, 81.0, 126.0, 194.0, 465.0, 1559.0, 783.0, 292.0, 135.0, 100.0, 52.0, 37.0, 26.0, 23.0, 11.0, 9.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8671875, -4.691650390625, -4.51611328125, -4.340576171875, -4.1650390625, -3.989501953125, -3.81396484375, -3.638427734375, -3.462890625, -3.287353515625, -3.11181640625, -2.936279296875, -2.7607421875, -2.585205078125, -2.40966796875, -2.234130859375, -2.05859375, -1.883056640625, -1.70751953125, -1.531982421875, -1.3564453125, -1.180908203125, -1.00537109375, -0.829833984375, -0.654296875, -0.478759765625, -0.30322265625, -0.127685546875, 0.0478515625, 0.223388671875, 0.39892578125, 0.574462890625, 0.75, 0.925537109375, 1.10107421875, 1.276611328125, 1.4521484375, 1.627685546875, 1.80322265625, 1.978759765625, 2.154296875, 2.329833984375, 2.50537109375, 2.680908203125, 2.8564453125, 3.031982421875, 3.20751953125, 3.383056640625, 3.55859375, 3.734130859375, 3.90966796875, 4.085205078125, 4.2607421875, 4.436279296875, 4.61181640625, 4.787353515625, 4.962890625, 5.138427734375, 5.31396484375, 5.489501953125, 5.6650390625, 5.840576171875, 6.01611328125, 6.191650390625, 6.3671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 12.0, 11.0, 21.0, 26.0, 39.0, 70.0, 99.0, 133.0, 145.0, 127.0, 102.0, 70.0, 57.0, 36.0, 21.0, 11.0, 10.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.837711334228516, -42.76536178588867, -41.69300842285156, -40.62065887451172, -39.548309326171875, -38.47595977783203, -37.40360641479492, -36.33125686645508, -35.25890350341797, -34.186553955078125, -33.114200592041016, -32.04185104370117, -30.969501495361328, -29.89715003967285, -28.824798583984375, -27.75244903564453, -26.680099487304688, -25.60774803161621, -24.535398483276367, -23.46304702758789, -22.390697479248047, -21.31834602355957, -20.245994567871094, -19.17364501953125, -18.101293563842773, -17.028942108154297, -15.956592559814453, -14.884241104125977, -13.811890602111816, -12.739540100097656, -11.66718864440918, -10.59483814239502, -9.522483825683594, -8.450133323669434, -7.377782344818115, -6.305431365966797, -5.233080863952637, -4.160730361938477, -3.088379383087158, -2.01602840423584, -0.9436779022216797, 0.12867283821105957, 1.2010235786437988, 2.273374319076538, 3.3457250595092773, 4.4180755615234375, 5.490426540374756, 6.562777519226074, 7.635128021240234, 8.707478523254395, 9.779829025268555, 10.852180480957031, 11.924530982971191, 12.996881484985352, 14.069232940673828, 15.141583442687988, 16.21393394470215, 17.286285400390625, 18.35863494873047, 19.430986404418945, 20.503337860107422, 21.575687408447266, 22.648038864135742, 23.72039031982422, 24.792739868164062]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 15.0, 9.0, 12.0, 14.0, 16.0, 27.0, 28.0, 33.0, 48.0, 46.0, 47.0, 58.0, 45.0, 28.0, 51.0, 61.0, 72.0, 48.0, 49.0, 49.0, 45.0, 32.0, 36.0, 27.0, 17.0, 18.0, 16.0, 12.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.641159057617188, -19.009654998779297, -18.378150939941406, -17.74664878845215, -17.115144729614258, -16.483640670776367, -15.852137565612793, -15.220634460449219, -14.589130401611328, -13.957626342773438, -13.326123237609863, -12.694620132446289, -12.063116073608398, -11.431612014770508, -10.800108909606934, -10.16860580444336, -9.537101745605469, -8.905597686767578, -8.274094581604004, -7.6425909996032715, -7.011087417602539, -6.379583835601807, -5.748080253601074, -5.116576671600342, -4.485073089599609, -3.853569507598877, -3.2220659255981445, -2.590562343597412, -1.9590587615966797, -1.3275551795959473, -0.6960515975952148, -0.06454801559448242, 0.5669536590576172, 1.1984572410583496, 1.829960823059082, 2.4614644050598145, 3.092967987060547, 3.7244715690612793, 4.355975151062012, 4.987478733062744, 5.618982315063477, 6.250485897064209, 6.881989479064941, 7.513493061065674, 8.144996643066406, 8.776500701904297, 9.408003807067871, 10.039506912231445, 10.671010971069336, 11.302515029907227, 11.9340181350708, 12.565521240234375, 13.197025299072266, 13.828529357910156, 14.46003246307373, 15.091535568237305, 15.723039627075195, 16.354543685913086, 16.986045837402344, 17.617549896240234, 18.249053955078125, 18.880558013916016, 19.512062072753906, 20.143564224243164, 20.775068283081055]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 5.0, 4.0, 12.0, 12.0, 17.0, 18.0, 27.0, 41.0, 91.0, 112.0, 176.0, 270.0, 454.0, 796.0, 1475.0, 2824.0, 6439.0, 16585.0, 46385.0, 128303.0, 299141.0, 317150.0, 143912.0, 51859.0, 18350.0, 7260.0, 3153.0, 1549.0, 885.0, 468.0, 252.0, 165.0, 100.0, 61.0, 50.0, 38.0, 29.0, 18.0, 19.0, 9.0, 9.0, 8.0, 11.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-17.015625, -16.543701171875, -16.07177734375, -15.599853515625, -15.1279296875, -14.656005859375, -14.18408203125, -13.712158203125, -13.240234375, -12.768310546875, -12.29638671875, -11.824462890625, -11.3525390625, -10.880615234375, -10.40869140625, -9.936767578125, -9.46484375, -8.992919921875, -8.52099609375, -8.049072265625, -7.5771484375, -7.105224609375, -6.63330078125, -6.161376953125, -5.689453125, -5.217529296875, -4.74560546875, -4.273681640625, -3.8017578125, -3.329833984375, -2.85791015625, -2.385986328125, -1.9140625, -1.442138671875, -0.97021484375, -0.498291015625, -0.0263671875, 0.445556640625, 0.91748046875, 1.389404296875, 1.861328125, 2.333251953125, 2.80517578125, 3.277099609375, 3.7490234375, 4.220947265625, 4.69287109375, 5.164794921875, 5.63671875, 6.108642578125, 6.58056640625, 7.052490234375, 7.5244140625, 7.996337890625, 8.46826171875, 8.940185546875, 9.412109375, 9.884033203125, 10.35595703125, 10.827880859375, 11.2998046875, 11.771728515625, 12.24365234375, 12.715576171875, 13.1875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 6.0, 7.0, 11.0, 13.0, 13.0, 22.0, 36.0, 34.0, 42.0, 46.0, 38.0, 50.0, 48.0, 55.0, 47.0, 58.0, 55.0, 51.0, 45.0, 46.0, 37.0, 33.0, 23.0, 29.0, 24.0, 29.0, 15.0, 19.0, 12.0, 8.0, 9.0, 9.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.48046875, -2.4106597900390625, -2.340850830078125, -2.2710418701171875, -2.20123291015625, -2.1314239501953125, -2.061614990234375, -1.9918060302734375, -1.9219970703125, -1.8521881103515625, -1.782379150390625, -1.7125701904296875, -1.64276123046875, -1.5729522705078125, -1.503143310546875, -1.4333343505859375, -1.363525390625, -1.2937164306640625, -1.223907470703125, -1.1540985107421875, -1.08428955078125, -1.0144805908203125, -0.944671630859375, -0.8748626708984375, -0.8050537109375, -0.7352447509765625, -0.665435791015625, -0.5956268310546875, -0.52581787109375, -0.4560089111328125, -0.386199951171875, -0.3163909912109375, -0.24658203125, -0.1767730712890625, -0.106964111328125, -0.0371551513671875, 0.03265380859375, 0.1024627685546875, 0.172271728515625, 0.2420806884765625, 0.3118896484375, 0.3816986083984375, 0.451507568359375, 0.5213165283203125, 0.59112548828125, 0.6609344482421875, 0.730743408203125, 0.8005523681640625, 0.870361328125, 0.9401702880859375, 1.009979248046875, 1.0797882080078125, 1.14959716796875, 1.2194061279296875, 1.289215087890625, 1.3590240478515625, 1.4288330078125, 1.4986419677734375, 1.568450927734375, 1.6382598876953125, 1.70806884765625, 1.7778778076171875, 1.847686767578125, 1.9174957275390625, 1.9873046875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 15.0, 15.0, 21.0, 22.0, 32.0, 49.0, 71.0, 126.0, 144.0, 239.0, 338.0, 518.0, 822.0, 1351.0, 2664.0, 6030.0, 15432.0, 44825.0, 133364.0, 313828.0, 317931.0, 136342.0, 46132.0, 15692.0, 6061.0, 2650.0, 1367.0, 815.0, 487.0, 361.0, 248.0, 148.0, 119.0, 92.0, 54.0, 44.0, 35.0, 20.0, 18.0, 7.0, 9.0, 10.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.2401123046875, -10.823974609375, -10.4078369140625, -9.99169921875, -9.5755615234375, -9.159423828125, -8.7432861328125, -8.3271484375, -7.9110107421875, -7.494873046875, -7.0787353515625, -6.66259765625, -6.2464599609375, -5.830322265625, -5.4141845703125, -4.998046875, -4.5819091796875, -4.165771484375, -3.7496337890625, -3.33349609375, -2.9173583984375, -2.501220703125, -2.0850830078125, -1.6689453125, -1.2528076171875, -0.836669921875, -0.4205322265625, -0.00439453125, 0.4117431640625, 0.827880859375, 1.2440185546875, 1.66015625, 2.0762939453125, 2.492431640625, 2.9085693359375, 3.32470703125, 3.7408447265625, 4.156982421875, 4.5731201171875, 4.9892578125, 5.4053955078125, 5.821533203125, 6.2376708984375, 6.65380859375, 7.0699462890625, 7.486083984375, 7.9022216796875, 8.318359375, 8.7344970703125, 9.150634765625, 9.5667724609375, 9.98291015625, 10.3990478515625, 10.815185546875, 11.2313232421875, 11.6474609375, 12.0635986328125, 12.479736328125, 12.8958740234375, 13.31201171875, 13.7281494140625, 14.144287109375, 14.5604248046875, 14.9765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 1.0, 6.0, 1.0, 9.0, 9.0, 8.0, 7.0, 15.0, 10.0, 11.0, 30.0, 11.0, 32.0, 26.0, 32.0, 35.0, 43.0, 43.0, 33.0, 33.0, 49.0, 45.0, 46.0, 49.0, 52.0, 45.0, 42.0, 36.0, 24.0, 30.0, 20.0, 35.0, 32.0, 21.0, 22.0, 9.0, 12.0, 5.0, 8.0, 13.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8828125, -8.5869140625, -8.291015625, -7.9951171875, -7.69921875, -7.4033203125, -7.107421875, -6.8115234375, -6.515625, -6.2197265625, -5.923828125, -5.6279296875, -5.33203125, -5.0361328125, -4.740234375, -4.4443359375, -4.1484375, -3.8525390625, -3.556640625, -3.2607421875, -2.96484375, -2.6689453125, -2.373046875, -2.0771484375, -1.78125, -1.4853515625, -1.189453125, -0.8935546875, -0.59765625, -0.3017578125, -0.005859375, 0.2900390625, 0.5859375, 0.8818359375, 1.177734375, 1.4736328125, 1.76953125, 2.0654296875, 2.361328125, 2.6572265625, 2.953125, 3.2490234375, 3.544921875, 3.8408203125, 4.13671875, 4.4326171875, 4.728515625, 5.0244140625, 5.3203125, 5.6162109375, 5.912109375, 6.2080078125, 6.50390625, 6.7998046875, 7.095703125, 7.3916015625, 7.6875, 7.9833984375, 8.279296875, 8.5751953125, 8.87109375, 9.1669921875, 9.462890625, 9.7587890625, 10.0546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 10.0, 6.0, 9.0, 15.0, 15.0, 29.0, 45.0, 76.0, 141.0, 249.0, 565.0, 1604.0, 5643.0, 50968.0, 845903.0, 130874.0, 8835.0, 2111.0, 734.0, 322.0, 162.0, 73.0, 46.0, 38.0, 18.0, 18.0, 9.0, 5.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-23.90625, -23.27099609375, -22.6357421875, -22.00048828125, -21.365234375, -20.72998046875, -20.0947265625, -19.45947265625, -18.82421875, -18.18896484375, -17.5537109375, -16.91845703125, -16.283203125, -15.64794921875, -15.0126953125, -14.37744140625, -13.7421875, -13.10693359375, -12.4716796875, -11.83642578125, -11.201171875, -10.56591796875, -9.9306640625, -9.29541015625, -8.66015625, -8.02490234375, -7.3896484375, -6.75439453125, -6.119140625, -5.48388671875, -4.8486328125, -4.21337890625, -3.578125, -2.94287109375, -2.3076171875, -1.67236328125, -1.037109375, -0.40185546875, 0.2333984375, 0.86865234375, 1.50390625, 2.13916015625, 2.7744140625, 3.40966796875, 4.044921875, 4.68017578125, 5.3154296875, 5.95068359375, 6.5859375, 7.22119140625, 7.8564453125, 8.49169921875, 9.126953125, 9.76220703125, 10.3974609375, 11.03271484375, 11.66796875, 12.30322265625, 12.9384765625, 13.57373046875, 14.208984375, 14.84423828125, 15.4794921875, 16.11474609375, 16.75]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 3.0, 12.0, 7.0, 14.0, 11.0, 24.0, 27.0, 35.0, 46.0, 65.0, 79.0, 102.0, 103.0, 95.0, 91.0, 53.0, 37.0, 38.0, 31.0, 23.0, 26.0, 11.0, 7.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013828277587890625, -0.001345023512840271, -0.0013072192668914795, -0.001269415020942688, -0.0012316107749938965, -0.001193806529045105, -0.0011560022830963135, -0.001118198037147522, -0.0010803937911987305, -0.001042589545249939, -0.0010047852993011475, -0.000966981053352356, -0.0009291768074035645, -0.000891372561454773, -0.0008535683155059814, -0.0008157640695571899, -0.0007779598236083984, -0.0007401555776596069, -0.0007023513317108154, -0.0006645470857620239, -0.0006267428398132324, -0.0005889385938644409, -0.0005511343479156494, -0.0005133301019668579, -0.0004755258560180664, -0.0004377216100692749, -0.0003999173641204834, -0.0003621131181716919, -0.0003243088722229004, -0.0002865046262741089, -0.0002487003803253174, -0.00021089613437652588, -0.00017309188842773438, -0.00013528764247894287, -9.748339653015137e-05, -5.967915058135986e-05, -2.187490463256836e-05, 1.5929341316223145e-05, 5.373358726501465e-05, 9.153783321380615e-05, 0.00012934207916259766, 0.00016714632511138916, 0.00020495057106018066, 0.00024275481700897217, 0.00028055906295776367, 0.0003183633089065552, 0.0003561675548553467, 0.0003939718008041382, 0.0004317760467529297, 0.0004695802927017212, 0.0005073845386505127, 0.0005451887845993042, 0.0005829930305480957, 0.0006207972764968872, 0.0006586015224456787, 0.0006964057683944702, 0.0007342100143432617, 0.0007720142602920532, 0.0008098185062408447, 0.0008476227521896362, 0.0008854269981384277, 0.0009232312440872192, 0.0009610354900360107, 0.0009988397359848022, 0.0010366439819335938]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 5.0, 2.0, 10.0, 14.0, 21.0, 23.0, 33.0, 51.0, 108.0, 167.0, 292.0, 717.0, 1912.0, 6492.0, 58248.0, 931631.0, 40134.0, 5591.0, 1798.0, 650.0, 276.0, 157.0, 73.0, 61.0, 26.0, 23.0, 19.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -21.97607421875, -21.0771484375, -20.17822265625, -19.279296875, -18.38037109375, -17.4814453125, -16.58251953125, -15.68359375, -14.78466796875, -13.8857421875, -12.98681640625, -12.087890625, -11.18896484375, -10.2900390625, -9.39111328125, -8.4921875, -7.59326171875, -6.6943359375, -5.79541015625, -4.896484375, -3.99755859375, -3.0986328125, -2.19970703125, -1.30078125, -0.40185546875, 0.4970703125, 1.39599609375, 2.294921875, 3.19384765625, 4.0927734375, 4.99169921875, 5.890625, 6.78955078125, 7.6884765625, 8.58740234375, 9.486328125, 10.38525390625, 11.2841796875, 12.18310546875, 13.08203125, 13.98095703125, 14.8798828125, 15.77880859375, 16.677734375, 17.57666015625, 18.4755859375, 19.37451171875, 20.2734375, 21.17236328125, 22.0712890625, 22.97021484375, 23.869140625, 24.76806640625, 25.6669921875, 26.56591796875, 27.46484375, 28.36376953125, 29.2626953125, 30.16162109375, 31.060546875, 31.95947265625, 32.8583984375, 33.75732421875, 34.65625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 2.0, 2.0, 6.0, 7.0, 15.0, 25.0, 68.0, 159.0, 282.0, 241.0, 95.0, 46.0, 20.0, 8.0, 4.0, 7.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.5291748046875, -10.972412109375, -10.4156494140625, -9.85888671875, -9.3021240234375, -8.745361328125, -8.1885986328125, -7.6318359375, -7.0750732421875, -6.518310546875, -5.9615478515625, -5.40478515625, -4.8480224609375, -4.291259765625, -3.7344970703125, -3.177734375, -2.6209716796875, -2.064208984375, -1.5074462890625, -0.95068359375, -0.3939208984375, 0.162841796875, 0.7196044921875, 1.2763671875, 1.8331298828125, 2.389892578125, 2.9466552734375, 3.50341796875, 4.0601806640625, 4.616943359375, 5.1737060546875, 5.73046875, 6.2872314453125, 6.843994140625, 7.4007568359375, 7.95751953125, 8.5142822265625, 9.071044921875, 9.6278076171875, 10.1845703125, 10.7413330078125, 11.298095703125, 11.8548583984375, 12.41162109375, 12.9683837890625, 13.525146484375, 14.0819091796875, 14.638671875, 15.1954345703125, 15.752197265625, 16.3089599609375, 16.86572265625, 17.4224853515625, 17.979248046875, 18.5360107421875, 19.0927734375, 19.6495361328125, 20.206298828125, 20.7630615234375, 21.31982421875, 21.8765869140625, 22.433349609375, 22.9901123046875, 23.546875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 12.0, 10.0, 27.0, 64.0, 106.0, 207.0, 225.0, 163.0, 107.0, 43.0, 19.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-129.01022338867188, -123.25325775146484, -117.49628448486328, -111.73931884765625, -105.98235321044922, -100.22538757324219, -94.46841430664062, -88.7114486694336, -82.95448303222656, -77.19751739501953, -71.44054412841797, -65.68357849121094, -59.926612854003906, -54.16964340209961, -48.41267395019531, -42.65570831298828, -36.89873504638672, -31.141767501831055, -25.38479995727539, -19.627830505371094, -13.87086296081543, -8.113895416259766, -2.3569259643554688, 3.4000396728515625, 9.15700912475586, 14.913976669311523, 20.670944213867188, 26.427913665771484, 32.18488311767578, 37.94184875488281, 43.69881820678711, 49.45578384399414, 55.21275329589844, 60.969722747802734, 66.72669219970703, 72.48365783691406, 78.2406234741211, 83.99758911132812, 89.75456237792969, 95.51152801513672, 101.26849365234375, 107.02545928955078, 112.78243255615234, 118.53939819335938, 124.2963638305664, 130.05332946777344, 135.810302734375, 141.5672607421875, 147.32424926757812, 153.0812225341797, 158.8381805419922, 164.59515380859375, 170.3521270751953, 176.1090850830078, 181.86605834960938, 187.62301635742188, 193.37998962402344, 199.136962890625, 204.8939208984375, 210.65089416503906, 216.40786743164062, 222.16482543945312, 227.9217987060547, 233.67877197265625, 239.43572998046875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 5.0, 3.0, 1.0, 6.0, 8.0, 10.0, 13.0, 13.0, 21.0, 16.0, 21.0, 29.0, 34.0, 31.0, 32.0, 55.0, 58.0, 51.0, 62.0, 72.0, 57.0, 48.0, 53.0, 47.0, 44.0, 28.0, 39.0, 20.0, 29.0, 27.0, 23.0, 12.0, 11.0, 7.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-75.6527099609375, -73.4660873413086, -71.27947235107422, -69.09284973144531, -66.90623474121094, -64.71961212158203, -62.53299331665039, -60.34637451171875, -58.15975570678711, -55.97313690185547, -53.78651809692383, -51.59989929199219, -49.41327667236328, -47.226661682128906, -45.0400390625, -42.85342025756836, -40.66680145263672, -38.48018264770508, -36.29356384277344, -34.1069450378418, -31.920324325561523, -29.733705520629883, -27.54708480834961, -25.36046600341797, -23.173847198486328, -20.987228393554688, -18.800609588623047, -16.613988876342773, -14.427370071411133, -12.240751266479492, -10.054131507873535, -7.867511749267578, -5.680885314941406, -3.4942660331726074, -1.3076467514038086, 0.8789725303649902, 3.065591812133789, 5.25221061706543, 7.438830375671387, 9.625450134277344, 11.812068939208984, 13.998687744140625, 16.185306549072266, 18.37192726135254, 20.55854606628418, 22.74516487121582, 24.931785583496094, 27.118404388427734, 29.305023193359375, 31.491641998291016, 33.678260803222656, 35.8648796081543, 38.05149841308594, 40.238121032714844, 42.424739837646484, 44.611358642578125, 46.797977447509766, 48.984596252441406, 51.17121505737305, 53.35783386230469, 55.544456481933594, 57.73107147216797, 59.917694091796875, 62.104312896728516, 64.29093170166016]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 6.0, 2.0, 3.0, 8.0, 6.0, 16.0, 13.0, 23.0, 25.0, 34.0, 36.0, 64.0, 69.0, 96.0, 123.0, 162.0, 254.0, 380.0, 599.0, 945.0, 1548.0, 2520.0, 4681.0, 9193.0, 19874.0, 50802.0, 174799.0, 2464975.0, 1238593.0, 143552.0, 44114.0, 17748.0, 8300.0, 4327.0, 2385.0, 1351.0, 850.0, 570.0, 376.0, 265.0, 163.0, 132.0, 83.0, 51.0, 38.0, 28.0, 23.0, 19.0, 22.0, 13.0, 10.0, 2.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.6796875, -13.2374267578125, -12.795166015625, -12.3529052734375, -11.91064453125, -11.4683837890625, -11.026123046875, -10.5838623046875, -10.1416015625, -9.6993408203125, -9.257080078125, -8.8148193359375, -8.37255859375, -7.9302978515625, -7.488037109375, -7.0457763671875, -6.603515625, -6.1612548828125, -5.718994140625, -5.2767333984375, -4.83447265625, -4.3922119140625, -3.949951171875, -3.5076904296875, -3.0654296875, -2.6231689453125, -2.180908203125, -1.7386474609375, -1.29638671875, -0.8541259765625, -0.411865234375, 0.0303955078125, 0.47265625, 0.9149169921875, 1.357177734375, 1.7994384765625, 2.24169921875, 2.6839599609375, 3.126220703125, 3.5684814453125, 4.0107421875, 4.4530029296875, 4.895263671875, 5.3375244140625, 5.77978515625, 6.2220458984375, 6.664306640625, 7.1065673828125, 7.548828125, 7.9910888671875, 8.433349609375, 8.8756103515625, 9.31787109375, 9.7601318359375, 10.202392578125, 10.6446533203125, 11.0869140625, 11.5291748046875, 11.971435546875, 12.4136962890625, 12.85595703125, 13.2982177734375, 13.740478515625, 14.1827392578125, 14.625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 9.0, 12.0, 14.0, 17.0, 24.0, 27.0, 23.0, 43.0, 48.0, 45.0, 57.0, 45.0, 54.0, 54.0, 68.0, 51.0, 48.0, 56.0, 46.0, 33.0, 34.0, 30.0, 24.0, 31.0, 16.0, 17.0, 14.0, 20.0, 11.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.267578125, -2.193145751953125, -2.11871337890625, -2.044281005859375, -1.9698486328125, -1.895416259765625, -1.82098388671875, -1.746551513671875, -1.672119140625, -1.597686767578125, -1.52325439453125, -1.448822021484375, -1.3743896484375, -1.299957275390625, -1.22552490234375, -1.151092529296875, -1.07666015625, -1.002227783203125, -0.92779541015625, -0.853363037109375, -0.7789306640625, -0.704498291015625, -0.63006591796875, -0.555633544921875, -0.481201171875, -0.406768798828125, -0.33233642578125, -0.257904052734375, -0.1834716796875, -0.109039306640625, -0.03460693359375, 0.039825439453125, 0.1142578125, 0.188690185546875, 0.26312255859375, 0.337554931640625, 0.4119873046875, 0.486419677734375, 0.56085205078125, 0.635284423828125, 0.709716796875, 0.784149169921875, 0.85858154296875, 0.933013916015625, 1.0074462890625, 1.081878662109375, 1.15631103515625, 1.230743408203125, 1.30517578125, 1.379608154296875, 1.45404052734375, 1.528472900390625, 1.6029052734375, 1.677337646484375, 1.75177001953125, 1.826202392578125, 1.900634765625, 1.975067138671875, 2.04949951171875, 2.123931884765625, 2.1983642578125, 2.272796630859375, 2.34722900390625, 2.421661376953125, 2.49609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 9.0, 11.0, 17.0, 19.0, 35.0, 59.0, 105.0, 179.0, 312.0, 483.0, 889.0, 1681.0, 3446.0, 9158.0, 38310.0, 402666.0, 3509349.0, 189940.0, 25025.0, 6821.0, 2722.0, 1371.0, 688.0, 395.0, 241.0, 130.0, 58.0, 54.0, 29.0, 23.0, 17.0, 10.0, 6.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.125, -21.316650390625, -20.50830078125, -19.699951171875, -18.8916015625, -18.083251953125, -17.27490234375, -16.466552734375, -15.658203125, -14.849853515625, -14.04150390625, -13.233154296875, -12.4248046875, -11.616455078125, -10.80810546875, -9.999755859375, -9.19140625, -8.383056640625, -7.57470703125, -6.766357421875, -5.9580078125, -5.149658203125, -4.34130859375, -3.532958984375, -2.724609375, -1.916259765625, -1.10791015625, -0.299560546875, 0.5087890625, 1.317138671875, 2.12548828125, 2.933837890625, 3.7421875, 4.550537109375, 5.35888671875, 6.167236328125, 6.9755859375, 7.783935546875, 8.59228515625, 9.400634765625, 10.208984375, 11.017333984375, 11.82568359375, 12.634033203125, 13.4423828125, 14.250732421875, 15.05908203125, 15.867431640625, 16.67578125, 17.484130859375, 18.29248046875, 19.100830078125, 19.9091796875, 20.717529296875, 21.52587890625, 22.334228515625, 23.142578125, 23.950927734375, 24.75927734375, 25.567626953125, 26.3759765625, 27.184326171875, 27.99267578125, 28.801025390625, 29.609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 6.0, 13.0, 17.0, 26.0, 39.0, 96.0, 138.0, 253.0, 602.0, 1461.0, 727.0, 296.0, 168.0, 85.0, 46.0, 27.0, 18.0, 13.0, 11.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0859375, -9.81036376953125, -9.5347900390625, -9.25921630859375, -8.983642578125, -8.70806884765625, -8.4324951171875, -8.15692138671875, -7.88134765625, -7.60577392578125, -7.3302001953125, -7.05462646484375, -6.779052734375, -6.50347900390625, -6.2279052734375, -5.95233154296875, -5.6767578125, -5.40118408203125, -5.1256103515625, -4.85003662109375, -4.574462890625, -4.29888916015625, -4.0233154296875, -3.74774169921875, -3.47216796875, -3.19659423828125, -2.9210205078125, -2.64544677734375, -2.369873046875, -2.09429931640625, -1.8187255859375, -1.54315185546875, -1.267578125, -0.99200439453125, -0.7164306640625, -0.44085693359375, -0.165283203125, 0.11029052734375, 0.3858642578125, 0.66143798828125, 0.93701171875, 1.21258544921875, 1.4881591796875, 1.76373291015625, 2.039306640625, 2.31488037109375, 2.5904541015625, 2.86602783203125, 3.1416015625, 3.41717529296875, 3.6927490234375, 3.96832275390625, 4.243896484375, 4.51947021484375, 4.7950439453125, 5.07061767578125, 5.34619140625, 5.62176513671875, 5.8973388671875, 6.17291259765625, 6.448486328125, 6.72406005859375, 6.9996337890625, 7.27520751953125, 7.55078125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 6.0, 15.0, 25.0, 43.0, 56.0, 91.0, 103.0, 126.0, 113.0, 111.0, 91.0, 61.0, 45.0, 37.0, 21.0, 9.0, 14.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.82662582397461, -45.31364440917969, -43.8006591796875, -42.28767776489258, -40.774696350097656, -39.26171112060547, -37.74872970581055, -36.235748291015625, -34.72276306152344, -33.209781646728516, -31.696796417236328, -30.183815002441406, -28.67083168029785, -27.157848358154297, -25.644866943359375, -24.13188362121582, -22.618900299072266, -21.10591697692871, -19.592933654785156, -18.079952239990234, -16.56696891784668, -15.053985595703125, -13.541003227233887, -12.028020858764648, -10.515037536621094, -9.002054214477539, -7.489071846008301, -5.976089000701904, -4.463106155395508, -2.9501233100891113, -1.4371404647827148, 0.07584190368652344, 1.5888252258300781, 3.1018080711364746, 4.614790916442871, 6.127773761749268, 7.640756607055664, 9.153739929199219, 10.666722297668457, 12.179704666137695, 13.69268798828125, 15.205671310424805, 16.71865463256836, 18.23163604736328, 19.744619369506836, 21.25760269165039, 22.770584106445312, 24.283567428588867, 25.796550750732422, 27.309534072875977, 28.82251739501953, 30.335498809814453, 31.848482131958008, 33.36146545410156, 34.874446868896484, 36.387428283691406, 37.900413513183594, 39.413394927978516, 40.9263801574707, 42.439361572265625, 43.95234680175781, 45.465328216552734, 46.978309631347656, 48.491294860839844, 50.004276275634766]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 11.0, 12.0, 14.0, 24.0, 23.0, 30.0, 42.0, 40.0, 50.0, 61.0, 77.0, 65.0, 74.0, 75.0, 64.0, 64.0, 59.0, 47.0, 44.0, 36.0, 34.0, 20.0, 13.0, 6.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-46.41676330566406, -45.2458381652832, -44.07490921020508, -42.90398406982422, -41.733055114746094, -40.562129974365234, -39.391204833984375, -38.22027587890625, -37.04935073852539, -35.87842559814453, -34.707496643066406, -33.53657150268555, -32.36564254760742, -31.194717407226562, -30.02379035949707, -28.852863311767578, -27.681936264038086, -26.511009216308594, -25.3400821685791, -24.16915512084961, -22.99822998046875, -21.827302932739258, -20.656375885009766, -19.485450744628906, -18.31452178955078, -17.14359474182129, -15.972668647766113, -14.801741600036621, -13.630815505981445, -12.459888458251953, -11.288961410522461, -10.118035316467285, -8.94710922241211, -7.776182651519775, -6.605256080627441, -5.434329032897949, -4.263402462005615, -3.0924758911132812, -1.921548843383789, -0.7506227493286133, 0.4203042984008789, 1.5912309885025024, 2.762157678604126, 3.933084487915039, 5.104011058807373, 6.274937629699707, 7.445864677429199, 8.616790771484375, 9.787717819213867, 10.95864486694336, 12.129570960998535, 13.300498008728027, 14.471424102783203, 15.642351150512695, 16.813278198242188, 17.984203338623047, 19.155132293701172, 20.326059341430664, 21.496986389160156, 22.667911529541016, 23.838838577270508, 25.009765625, 26.180692672729492, 27.351619720458984, 28.522544860839844]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 4.0, 13.0, 19.0, 21.0, 39.0, 55.0, 105.0, 185.0, 309.0, 570.0, 1132.0, 2835.0, 10280.0, 56091.0, 346075.0, 514976.0, 93185.0, 15775.0, 3951.0, 1370.0, 705.0, 339.0, 211.0, 130.0, 67.0, 49.0, 21.0, 17.0, 13.0, 8.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.53125, -28.6123046875, -27.693359375, -26.7744140625, -25.85546875, -24.9365234375, -24.017578125, -23.0986328125, -22.1796875, -21.2607421875, -20.341796875, -19.4228515625, -18.50390625, -17.5849609375, -16.666015625, -15.7470703125, -14.828125, -13.9091796875, -12.990234375, -12.0712890625, -11.15234375, -10.2333984375, -9.314453125, -8.3955078125, -7.4765625, -6.5576171875, -5.638671875, -4.7197265625, -3.80078125, -2.8818359375, -1.962890625, -1.0439453125, -0.125, 0.7939453125, 1.712890625, 2.6318359375, 3.55078125, 4.4697265625, 5.388671875, 6.3076171875, 7.2265625, 8.1455078125, 9.064453125, 9.9833984375, 10.90234375, 11.8212890625, 12.740234375, 13.6591796875, 14.578125, 15.4970703125, 16.416015625, 17.3349609375, 18.25390625, 19.1728515625, 20.091796875, 21.0107421875, 21.9296875, 22.8486328125, 23.767578125, 24.6865234375, 25.60546875, 26.5244140625, 27.443359375, 28.3623046875, 29.28125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 20.0, 18.0, 31.0, 47.0, 58.0, 68.0, 74.0, 57.0, 79.0, 83.0, 72.0, 63.0, 60.0, 50.0, 42.0, 46.0, 33.0, 25.0, 13.0, 14.0, 9.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-4.1875, -4.083953857421875, -3.98040771484375, -3.876861572265625, -3.7733154296875, -3.669769287109375, -3.56622314453125, -3.462677001953125, -3.359130859375, -3.255584716796875, -3.15203857421875, -3.048492431640625, -2.9449462890625, -2.841400146484375, -2.73785400390625, -2.634307861328125, -2.53076171875, -2.427215576171875, -2.32366943359375, -2.220123291015625, -2.1165771484375, -2.013031005859375, -1.90948486328125, -1.805938720703125, -1.702392578125, -1.598846435546875, -1.49530029296875, -1.391754150390625, -1.2882080078125, -1.184661865234375, -1.08111572265625, -0.977569580078125, -0.8740234375, -0.770477294921875, -0.66693115234375, -0.563385009765625, -0.4598388671875, -0.356292724609375, -0.25274658203125, -0.149200439453125, -0.045654296875, 0.057891845703125, 0.16143798828125, 0.264984130859375, 0.3685302734375, 0.472076416015625, 0.57562255859375, 0.679168701171875, 0.78271484375, 0.886260986328125, 0.98980712890625, 1.093353271484375, 1.1968994140625, 1.300445556640625, 1.40399169921875, 1.507537841796875, 1.611083984375, 1.714630126953125, 1.81817626953125, 1.921722412109375, 2.0252685546875, 2.128814697265625, 2.23236083984375, 2.335906982421875, 2.439453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 10.0, 13.0, 22.0, 23.0, 48.0, 61.0, 103.0, 176.0, 261.0, 379.0, 572.0, 951.0, 1858.0, 3812.0, 9061.0, 23771.0, 62824.0, 158437.0, 336690.0, 266393.0, 110795.0, 43055.0, 16291.0, 6466.0, 2885.0, 1433.0, 769.0, 542.0, 269.0, 197.0, 123.0, 83.0, 65.0, 41.0, 24.0, 22.0, 11.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3359375, -9.9891357421875, -9.642333984375, -9.2955322265625, -8.94873046875, -8.6019287109375, -8.255126953125, -7.9083251953125, -7.5615234375, -7.2147216796875, -6.867919921875, -6.5211181640625, -6.17431640625, -5.8275146484375, -5.480712890625, -5.1339111328125, -4.787109375, -4.4403076171875, -4.093505859375, -3.7467041015625, -3.39990234375, -3.0531005859375, -2.706298828125, -2.3594970703125, -2.0126953125, -1.6658935546875, -1.319091796875, -0.9722900390625, -0.62548828125, -0.2786865234375, 0.068115234375, 0.4149169921875, 0.76171875, 1.1085205078125, 1.455322265625, 1.8021240234375, 2.14892578125, 2.4957275390625, 2.842529296875, 3.1893310546875, 3.5361328125, 3.8829345703125, 4.229736328125, 4.5765380859375, 4.92333984375, 5.2701416015625, 5.616943359375, 5.9637451171875, 6.310546875, 6.6573486328125, 7.004150390625, 7.3509521484375, 7.69775390625, 8.0445556640625, 8.391357421875, 8.7381591796875, 9.0849609375, 9.4317626953125, 9.778564453125, 10.1253662109375, 10.47216796875, 10.8189697265625, 11.165771484375, 11.5125732421875, 11.859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 7.0, 7.0, 9.0, 13.0, 16.0, 19.0, 19.0, 27.0, 27.0, 36.0, 31.0, 35.0, 54.0, 42.0, 43.0, 41.0, 31.0, 43.0, 54.0, 52.0, 40.0, 57.0, 45.0, 37.0, 24.0, 22.0, 31.0, 30.0, 21.0, 15.0, 10.0, 7.0, 8.0, 10.0, 10.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.21875, -9.9368896484375, -9.655029296875, -9.3731689453125, -9.09130859375, -8.8094482421875, -8.527587890625, -8.2457275390625, -7.9638671875, -7.6820068359375, -7.400146484375, -7.1182861328125, -6.83642578125, -6.5545654296875, -6.272705078125, -5.9908447265625, -5.708984375, -5.4271240234375, -5.145263671875, -4.8634033203125, -4.58154296875, -4.2996826171875, -4.017822265625, -3.7359619140625, -3.4541015625, -3.1722412109375, -2.890380859375, -2.6085205078125, -2.32666015625, -2.0447998046875, -1.762939453125, -1.4810791015625, -1.19921875, -0.9173583984375, -0.635498046875, -0.3536376953125, -0.07177734375, 0.2100830078125, 0.491943359375, 0.7738037109375, 1.0556640625, 1.3375244140625, 1.619384765625, 1.9012451171875, 2.18310546875, 2.4649658203125, 2.746826171875, 3.0286865234375, 3.310546875, 3.5924072265625, 3.874267578125, 4.1561279296875, 4.43798828125, 4.7198486328125, 5.001708984375, 5.2835693359375, 5.5654296875, 5.8472900390625, 6.129150390625, 6.4110107421875, 6.69287109375, 6.9747314453125, 7.256591796875, 7.5384521484375, 7.8203125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 6.0, 12.0, 13.0, 19.0, 21.0, 33.0, 48.0, 77.0, 117.0, 176.0, 338.0, 598.0, 1081.0, 2142.0, 4616.0, 11911.0, 37946.0, 159020.0, 460728.0, 273803.0, 65277.0, 18114.0, 6507.0, 2757.0, 1373.0, 701.0, 403.0, 223.0, 154.0, 97.0, 56.0, 52.0, 29.0, 26.0, 17.0, 12.0, 8.0, 13.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.1484375, -7.9066162109375, -7.664794921875, -7.4229736328125, -7.18115234375, -6.9393310546875, -6.697509765625, -6.4556884765625, -6.2138671875, -5.9720458984375, -5.730224609375, -5.4884033203125, -5.24658203125, -5.0047607421875, -4.762939453125, -4.5211181640625, -4.279296875, -4.0374755859375, -3.795654296875, -3.5538330078125, -3.31201171875, -3.0701904296875, -2.828369140625, -2.5865478515625, -2.3447265625, -2.1029052734375, -1.861083984375, -1.6192626953125, -1.37744140625, -1.1356201171875, -0.893798828125, -0.6519775390625, -0.41015625, -0.1683349609375, 0.073486328125, 0.3153076171875, 0.55712890625, 0.7989501953125, 1.040771484375, 1.2825927734375, 1.5244140625, 1.7662353515625, 2.008056640625, 2.2498779296875, 2.49169921875, 2.7335205078125, 2.975341796875, 3.2171630859375, 3.458984375, 3.7008056640625, 3.942626953125, 4.1844482421875, 4.42626953125, 4.6680908203125, 4.909912109375, 5.1517333984375, 5.3935546875, 5.6353759765625, 5.877197265625, 6.1190185546875, 6.36083984375, 6.6026611328125, 6.844482421875, 7.0863037109375, 7.328125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 1.0, 6.0, 12.0, 10.0, 12.0, 7.0, 15.0, 21.0, 24.0, 34.0, 41.0, 55.0, 76.0, 87.0, 106.0, 107.0, 77.0, 54.0, 56.0, 45.0, 20.0, 26.0, 15.0, 21.0, 9.0, 9.0, 14.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0009660720825195312, -0.0009374544024467468, -0.0009088367223739624, -0.000880219042301178, -0.0008516013622283936, -0.0008229836821556091, -0.0007943660020828247, -0.0007657483220100403, -0.0007371306419372559, -0.0007085129618644714, -0.000679895281791687, -0.0006512776017189026, -0.0006226599216461182, -0.0005940422415733337, -0.0005654245615005493, -0.0005368068814277649, -0.0005081892013549805, -0.00047957152128219604, -0.0004509538412094116, -0.0004223361611366272, -0.0003937184810638428, -0.00036510080099105835, -0.0003364831209182739, -0.0003078654408454895, -0.0002792477607727051, -0.00025063008069992065, -0.00022201240062713623, -0.0001933947205543518, -0.00016477704048156738, -0.00013615936040878296, -0.00010754168033599854, -7.892400026321411e-05, -5.030632019042969e-05, -2.1688640117645264e-05, 6.92903995513916e-06, 3.5546720027923584e-05, 6.416440010070801e-05, 9.278208017349243e-05, 0.00012139976024627686, 0.00015001744031906128, 0.0001786351203918457, 0.00020725280046463013, 0.00023587048053741455, 0.000264488160610199, 0.0002931058406829834, 0.0003217235207557678, 0.00035034120082855225, 0.00037895888090133667, 0.0004075765609741211, 0.0004361942410469055, 0.00046481192111968994, 0.0004934296011924744, 0.0005220472812652588, 0.0005506649613380432, 0.0005792826414108276, 0.0006079003214836121, 0.0006365180015563965, 0.0006651356816291809, 0.0006937533617019653, 0.0007223710417747498, 0.0007509887218475342, 0.0007796064019203186, 0.000808224081993103, 0.0008368417620658875, 0.0008654594421386719]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 7.0, 11.0, 10.0, 15.0, 28.0, 39.0, 43.0, 80.0, 130.0, 227.0, 457.0, 814.0, 1694.0, 4008.0, 12047.0, 53305.0, 359675.0, 505001.0, 84697.0, 16630.0, 5285.0, 2179.0, 974.0, 524.0, 255.0, 138.0, 76.0, 63.0, 49.0, 33.0, 23.0, 18.0, 4.0, 9.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.310791015625, -10.98876953125, -10.666748046875, -10.3447265625, -10.022705078125, -9.70068359375, -9.378662109375, -9.056640625, -8.734619140625, -8.41259765625, -8.090576171875, -7.7685546875, -7.446533203125, -7.12451171875, -6.802490234375, -6.48046875, -6.158447265625, -5.83642578125, -5.514404296875, -5.1923828125, -4.870361328125, -4.54833984375, -4.226318359375, -3.904296875, -3.582275390625, -3.26025390625, -2.938232421875, -2.6162109375, -2.294189453125, -1.97216796875, -1.650146484375, -1.328125, -1.006103515625, -0.68408203125, -0.362060546875, -0.0400390625, 0.281982421875, 0.60400390625, 0.926025390625, 1.248046875, 1.570068359375, 1.89208984375, 2.214111328125, 2.5361328125, 2.858154296875, 3.18017578125, 3.502197265625, 3.82421875, 4.146240234375, 4.46826171875, 4.790283203125, 5.1123046875, 5.434326171875, 5.75634765625, 6.078369140625, 6.400390625, 6.722412109375, 7.04443359375, 7.366455078125, 7.6884765625, 8.010498046875, 8.33251953125, 8.654541015625, 8.9765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 7.0, 8.0, 10.0, 18.0, 30.0, 56.0, 94.0, 130.0, 142.0, 129.0, 128.0, 81.0, 62.0, 41.0, 27.0, 11.0, 5.0, 5.0, 1.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.28125, -10.999755859375, -10.71826171875, -10.436767578125, -10.1552734375, -9.873779296875, -9.59228515625, -9.310791015625, -9.029296875, -8.747802734375, -8.46630859375, -8.184814453125, -7.9033203125, -7.621826171875, -7.34033203125, -7.058837890625, -6.77734375, -6.495849609375, -6.21435546875, -5.932861328125, -5.6513671875, -5.369873046875, -5.08837890625, -4.806884765625, -4.525390625, -4.243896484375, -3.96240234375, -3.680908203125, -3.3994140625, -3.117919921875, -2.83642578125, -2.554931640625, -2.2734375, -1.991943359375, -1.71044921875, -1.428955078125, -1.1474609375, -0.865966796875, -0.58447265625, -0.302978515625, -0.021484375, 0.260009765625, 0.54150390625, 0.822998046875, 1.1044921875, 1.385986328125, 1.66748046875, 1.948974609375, 2.23046875, 2.511962890625, 2.79345703125, 3.074951171875, 3.3564453125, 3.637939453125, 3.91943359375, 4.200927734375, 4.482421875, 4.763916015625, 5.04541015625, 5.326904296875, 5.6083984375, 5.889892578125, 6.17138671875, 6.452880859375, 6.734375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 1.0, 3.0, 10.0, 20.0, 26.0, 39.0, 61.0, 78.0, 102.0, 144.0, 123.0, 110.0, 101.0, 67.0, 35.0, 29.0, 18.0, 11.0, 10.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.7868881225586, -77.857421875, -74.9279556274414, -71.99848175048828, -69.06901550292969, -66.1395492553711, -63.2100830078125, -60.28061294555664, -57.35114288330078, -54.42167663574219, -51.49220657348633, -48.562740325927734, -45.633270263671875, -42.70380401611328, -39.77433776855469, -36.84486770629883, -33.915401458740234, -30.985933303833008, -28.05646514892578, -25.126998901367188, -22.197528839111328, -19.268062591552734, -16.338594436645508, -13.409126281738281, -10.479658126831055, -7.550189971923828, -4.62072229385376, -1.6912546157836914, 1.2382135391235352, 4.167681694030762, 7.097148895263672, 10.026617050170898, 12.956085205078125, 15.885553359985352, 18.815021514892578, 21.744487762451172, 24.67395782470703, 27.603424072265625, 30.53289222717285, 33.46236038208008, 36.39183044433594, 39.32129669189453, 42.25076675415039, 45.180233001708984, 48.109703063964844, 51.03916931152344, 53.96863555908203, 56.89810562133789, 59.827571868896484, 62.75703811645508, 65.68650817871094, 68.61597442626953, 71.54544067382812, 74.47491455078125, 77.40438079833984, 80.33384704589844, 83.26331329345703, 86.19277954101562, 89.12224578857422, 92.05171966552734, 94.98118591308594, 97.91065216064453, 100.84011840820312, 103.76959228515625, 106.69905853271484]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 9.0, 14.0, 12.0, 21.0, 19.0, 37.0, 39.0, 23.0, 32.0, 51.0, 48.0, 35.0, 51.0, 46.0, 45.0, 70.0, 56.0, 48.0, 45.0, 25.0, 36.0, 31.0, 35.0, 28.0, 23.0, 13.0, 23.0, 8.0, 11.0, 13.0, 6.0, 4.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-62.6007080078125, -60.938514709472656, -59.27631759643555, -57.61412048339844, -55.951927185058594, -54.28973388671875, -52.62753677368164, -50.96533966064453, -49.30314636230469, -47.640953063964844, -45.978755950927734, -44.316558837890625, -42.65436553955078, -40.99217224121094, -39.32997512817383, -37.66777801513672, -36.005584716796875, -34.34339141845703, -32.68119430541992, -31.018999099731445, -29.35680389404297, -27.694608688354492, -26.032413482666016, -24.37021827697754, -22.708023071289062, -21.045827865600586, -19.38363265991211, -17.721437454223633, -16.059242248535156, -14.39704704284668, -12.734851837158203, -11.072656631469727, -9.41046142578125, -7.748266220092773, -6.086071014404297, -4.42387580871582, -2.7616806030273438, -1.0994853973388672, 0.5627098083496094, 2.224905014038086, 3.8871002197265625, 5.549295425415039, 7.211490631103516, 8.873685836791992, 10.535881042480469, 12.198076248168945, 13.860271453857422, 15.522466659545898, 17.184661865234375, 18.84685707092285, 20.509052276611328, 22.171247482299805, 23.83344268798828, 25.495637893676758, 27.157833099365234, 28.82002830505371, 30.482223510742188, 32.14441680908203, 33.80661392211914, 35.46881103515625, 37.131004333496094, 38.79319763183594, 40.45539474487305, 42.117591857910156, 43.77978515625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 4.0, 9.0, 4.0, 11.0, 5.0, 12.0, 26.0, 11.0, 27.0, 52.0, 67.0, 81.0, 133.0, 194.0, 315.0, 563.0, 1144.0, 2426.0, 6155.0, 21184.0, 142978.0, 3818468.0, 166207.0, 22676.0, 6497.0, 2519.0, 1120.0, 561.0, 311.0, 145.0, 135.0, 68.0, 47.0, 36.0, 13.0, 11.0, 16.0, 14.0, 11.0, 6.0, 7.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.9375, -23.1533203125, -22.369140625, -21.5849609375, -20.80078125, -20.0166015625, -19.232421875, -18.4482421875, -17.6640625, -16.8798828125, -16.095703125, -15.3115234375, -14.52734375, -13.7431640625, -12.958984375, -12.1748046875, -11.390625, -10.6064453125, -9.822265625, -9.0380859375, -8.25390625, -7.4697265625, -6.685546875, -5.9013671875, -5.1171875, -4.3330078125, -3.548828125, -2.7646484375, -1.98046875, -1.1962890625, -0.412109375, 0.3720703125, 1.15625, 1.9404296875, 2.724609375, 3.5087890625, 4.29296875, 5.0771484375, 5.861328125, 6.6455078125, 7.4296875, 8.2138671875, 8.998046875, 9.7822265625, 10.56640625, 11.3505859375, 12.134765625, 12.9189453125, 13.703125, 14.4873046875, 15.271484375, 16.0556640625, 16.83984375, 17.6240234375, 18.408203125, 19.1923828125, 19.9765625, 20.7607421875, 21.544921875, 22.3291015625, 23.11328125, 23.8974609375, 24.681640625, 25.4658203125, 26.25]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 13.0, 14.0, 9.0, 25.0, 30.0, 59.0, 62.0, 72.0, 78.0, 70.0, 84.0, 85.0, 75.0, 73.0, 49.0, 49.0, 40.0, 36.0, 18.0, 19.0, 14.0, 8.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.1563720703125, -4.043212890625, -3.9300537109375, -3.81689453125, -3.7037353515625, -3.590576171875, -3.4774169921875, -3.3642578125, -3.2510986328125, -3.137939453125, -3.0247802734375, -2.91162109375, -2.7984619140625, -2.685302734375, -2.5721435546875, -2.458984375, -2.3458251953125, -2.232666015625, -2.1195068359375, -2.00634765625, -1.8931884765625, -1.780029296875, -1.6668701171875, -1.5537109375, -1.4405517578125, -1.327392578125, -1.2142333984375, -1.10107421875, -0.9879150390625, -0.874755859375, -0.7615966796875, -0.6484375, -0.5352783203125, -0.422119140625, -0.3089599609375, -0.19580078125, -0.0826416015625, 0.030517578125, 0.1436767578125, 0.2568359375, 0.3699951171875, 0.483154296875, 0.5963134765625, 0.70947265625, 0.8226318359375, 0.935791015625, 1.0489501953125, 1.162109375, 1.2752685546875, 1.388427734375, 1.5015869140625, 1.61474609375, 1.7279052734375, 1.841064453125, 1.9542236328125, 2.0673828125, 2.1805419921875, 2.293701171875, 2.4068603515625, 2.52001953125, 2.6331787109375, 2.746337890625, 2.8594970703125, 2.97265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 6.0, 9.0, 15.0, 16.0, 20.0, 23.0, 28.0, 26.0, 45.0, 56.0, 86.0, 157.0, 388.0, 1004.0, 3430.0, 14201.0, 98551.0, 3437615.0, 586633.0, 40405.0, 7800.0, 2104.0, 788.0, 381.0, 159.0, 112.0, 53.0, 44.0, 29.0, 22.0, 15.0, 8.0, 10.0, 8.0, 9.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.390625, -24.660888671875, -23.93115234375, -23.201416015625, -22.4716796875, -21.741943359375, -21.01220703125, -20.282470703125, -19.552734375, -18.822998046875, -18.09326171875, -17.363525390625, -16.6337890625, -15.904052734375, -15.17431640625, -14.444580078125, -13.71484375, -12.985107421875, -12.25537109375, -11.525634765625, -10.7958984375, -10.066162109375, -9.33642578125, -8.606689453125, -7.876953125, -7.147216796875, -6.41748046875, -5.687744140625, -4.9580078125, -4.228271484375, -3.49853515625, -2.768798828125, -2.0390625, -1.309326171875, -0.57958984375, 0.150146484375, 0.8798828125, 1.609619140625, 2.33935546875, 3.069091796875, 3.798828125, 4.528564453125, 5.25830078125, 5.988037109375, 6.7177734375, 7.447509765625, 8.17724609375, 8.906982421875, 9.63671875, 10.366455078125, 11.09619140625, 11.825927734375, 12.5556640625, 13.285400390625, 14.01513671875, 14.744873046875, 15.474609375, 16.204345703125, 16.93408203125, 17.663818359375, 18.3935546875, 19.123291015625, 19.85302734375, 20.582763671875, 21.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 9.0, 13.0, 29.0, 47.0, 82.0, 179.0, 587.0, 2112.0, 642.0, 207.0, 78.0, 45.0, 16.0, 13.0, 11.0, 3.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.90625, -12.60986328125, -12.3134765625, -12.01708984375, -11.720703125, -11.42431640625, -11.1279296875, -10.83154296875, -10.53515625, -10.23876953125, -9.9423828125, -9.64599609375, -9.349609375, -9.05322265625, -8.7568359375, -8.46044921875, -8.1640625, -7.86767578125, -7.5712890625, -7.27490234375, -6.978515625, -6.68212890625, -6.3857421875, -6.08935546875, -5.79296875, -5.49658203125, -5.2001953125, -4.90380859375, -4.607421875, -4.31103515625, -4.0146484375, -3.71826171875, -3.421875, -3.12548828125, -2.8291015625, -2.53271484375, -2.236328125, -1.93994140625, -1.6435546875, -1.34716796875, -1.05078125, -0.75439453125, -0.4580078125, -0.16162109375, 0.134765625, 0.43115234375, 0.7275390625, 1.02392578125, 1.3203125, 1.61669921875, 1.9130859375, 2.20947265625, 2.505859375, 2.80224609375, 3.0986328125, 3.39501953125, 3.69140625, 3.98779296875, 4.2841796875, 4.58056640625, 4.876953125, 5.17333984375, 5.4697265625, 5.76611328125, 6.0625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 15.0, 12.0, 20.0, 54.0, 85.0, 125.0, 134.0, 149.0, 144.0, 93.0, 79.0, 30.0, 26.0, 17.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.16429138183594, -47.81736755371094, -46.47044372558594, -45.12351989746094, -43.77659606933594, -42.42967224121094, -41.08274841308594, -39.73582458496094, -38.38890075683594, -37.04197692871094, -35.69505310058594, -34.34812927246094, -33.00120544433594, -31.654281616210938, -30.307357788085938, -28.960433959960938, -27.613508224487305, -26.266584396362305, -24.919660568237305, -23.572736740112305, -22.225812911987305, -20.878889083862305, -19.531963348388672, -18.185039520263672, -16.838115692138672, -15.491191864013672, -14.144268035888672, -12.797344207763672, -11.450420379638672, -10.103496551513672, -8.756571769714355, -7.4096479415893555, -6.062725067138672, -4.715801239013672, -3.3688771724700928, -2.0219531059265137, -0.6750292778015137, 0.6718945503234863, 2.0188188552856445, 3.3657426834106445, 4.7126665115356445, 6.0595903396606445, 7.4065141677856445, 8.753438949584961, 10.100362777709961, 11.447286605834961, 12.794210433959961, 14.141134262084961, 15.488058090209961, 16.83498191833496, 18.18190574645996, 19.52882957458496, 20.87575340270996, 22.22267723083496, 23.569602966308594, 24.916526794433594, 26.263450622558594, 27.610374450683594, 28.957298278808594, 30.304222106933594, 31.651145935058594, 32.998069763183594, 34.344993591308594, 35.691917419433594, 37.038841247558594]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 12.0, 16.0, 18.0, 26.0, 29.0, 45.0, 37.0, 45.0, 43.0, 53.0, 60.0, 64.0, 68.0, 54.0, 63.0, 56.0, 49.0, 27.0, 46.0, 43.0, 29.0, 25.0, 19.0, 18.0, 8.0, 6.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.060779571533203, -17.35297203063965, -16.645164489746094, -15.937358856201172, -15.229551315307617, -14.521743774414062, -13.813937187194824, -13.106130599975586, -12.398323059082031, -11.690515518188477, -10.982708930969238, -10.27490234375, -9.567094802856445, -8.85928726196289, -8.151480674743652, -7.443673610687256, -6.735866546630859, -6.028059482574463, -5.320252418518066, -4.61244535446167, -3.9046382904052734, -3.196831226348877, -2.4890241622924805, -1.781217098236084, -1.0734100341796875, -0.365602970123291, 0.34220409393310547, 1.050011157989502, 1.7578182220458984, 2.465625286102295, 3.1734323501586914, 3.881239414215088, 4.589046478271484, 5.296853542327881, 6.004660606384277, 6.712467670440674, 7.42027473449707, 8.128082275390625, 8.835888862609863, 9.543695449829102, 10.251502990722656, 10.959310531616211, 11.66711711883545, 12.374923706054688, 13.082731246948242, 13.790538787841797, 14.498345375061035, 15.206151962280273, 15.913959503173828, 16.621767044067383, 17.329574584960938, 18.03738021850586, 18.745187759399414, 19.45299530029297, 20.16080093383789, 20.868608474731445, 21.576416015625, 22.284223556518555, 22.99203109741211, 23.69983673095703, 24.407644271850586, 25.11545181274414, 25.823257446289062, 26.531064987182617, 27.238872528076172]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 2.0, 13.0, 14.0, 17.0, 25.0, 37.0, 52.0, 89.0, 129.0, 252.0, 460.0, 919.0, 1963.0, 5473.0, 20059.0, 104402.0, 507515.0, 329703.0, 58200.0, 12350.0, 3778.0, 1434.0, 690.0, 381.0, 210.0, 146.0, 86.0, 46.0, 33.0, 13.0, 19.0, 8.0, 12.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.875, -25.97412109375, -25.0732421875, -24.17236328125, -23.271484375, -22.37060546875, -21.4697265625, -20.56884765625, -19.66796875, -18.76708984375, -17.8662109375, -16.96533203125, -16.064453125, -15.16357421875, -14.2626953125, -13.36181640625, -12.4609375, -11.56005859375, -10.6591796875, -9.75830078125, -8.857421875, -7.95654296875, -7.0556640625, -6.15478515625, -5.25390625, -4.35302734375, -3.4521484375, -2.55126953125, -1.650390625, -0.74951171875, 0.1513671875, 1.05224609375, 1.953125, 2.85400390625, 3.7548828125, 4.65576171875, 5.556640625, 6.45751953125, 7.3583984375, 8.25927734375, 9.16015625, 10.06103515625, 10.9619140625, 11.86279296875, 12.763671875, 13.66455078125, 14.5654296875, 15.46630859375, 16.3671875, 17.26806640625, 18.1689453125, 19.06982421875, 19.970703125, 20.87158203125, 21.7724609375, 22.67333984375, 23.57421875, 24.47509765625, 25.3759765625, 26.27685546875, 27.177734375, 28.07861328125, 28.9794921875, 29.88037109375, 30.78125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 7.0, 21.0, 16.0, 35.0, 44.0, 49.0, 57.0, 78.0, 69.0, 81.0, 75.0, 77.0, 70.0, 58.0, 48.0, 50.0, 42.0, 36.0, 24.0, 13.0, 16.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.056610107421875, -3.94525146484375, -3.833892822265625, -3.7225341796875, -3.611175537109375, -3.49981689453125, -3.388458251953125, -3.277099609375, -3.165740966796875, -3.05438232421875, -2.943023681640625, -2.8316650390625, -2.720306396484375, -2.60894775390625, -2.497589111328125, -2.38623046875, -2.274871826171875, -2.16351318359375, -2.052154541015625, -1.9407958984375, -1.829437255859375, -1.71807861328125, -1.606719970703125, -1.495361328125, -1.384002685546875, -1.27264404296875, -1.161285400390625, -1.0499267578125, -0.938568115234375, -0.82720947265625, -0.715850830078125, -0.6044921875, -0.493133544921875, -0.38177490234375, -0.270416259765625, -0.1590576171875, -0.047698974609375, 0.06365966796875, 0.175018310546875, 0.286376953125, 0.397735595703125, 0.50909423828125, 0.620452880859375, 0.7318115234375, 0.843170166015625, 0.95452880859375, 1.065887451171875, 1.17724609375, 1.288604736328125, 1.39996337890625, 1.511322021484375, 1.6226806640625, 1.734039306640625, 1.84539794921875, 1.956756591796875, 2.068115234375, 2.179473876953125, 2.29083251953125, 2.402191162109375, 2.5135498046875, 2.624908447265625, 2.73626708984375, 2.847625732421875, 2.958984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 20.0, 15.0, 51.0, 65.0, 75.0, 128.0, 190.0, 344.0, 522.0, 963.0, 2188.0, 6292.0, 25450.0, 120642.0, 464069.0, 330088.0, 73438.0, 15902.0, 4409.0, 1681.0, 785.0, 458.0, 237.0, 173.0, 123.0, 70.0, 45.0, 37.0, 17.0, 13.0, 18.0, 9.0, 4.0, 4.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.546875, -18.98583984375, -18.4248046875, -17.86376953125, -17.302734375, -16.74169921875, -16.1806640625, -15.61962890625, -15.05859375, -14.49755859375, -13.9365234375, -13.37548828125, -12.814453125, -12.25341796875, -11.6923828125, -11.13134765625, -10.5703125, -10.00927734375, -9.4482421875, -8.88720703125, -8.326171875, -7.76513671875, -7.2041015625, -6.64306640625, -6.08203125, -5.52099609375, -4.9599609375, -4.39892578125, -3.837890625, -3.27685546875, -2.7158203125, -2.15478515625, -1.59375, -1.03271484375, -0.4716796875, 0.08935546875, 0.650390625, 1.21142578125, 1.7724609375, 2.33349609375, 2.89453125, 3.45556640625, 4.0166015625, 4.57763671875, 5.138671875, 5.69970703125, 6.2607421875, 6.82177734375, 7.3828125, 7.94384765625, 8.5048828125, 9.06591796875, 9.626953125, 10.18798828125, 10.7490234375, 11.31005859375, 11.87109375, 12.43212890625, 12.9931640625, 13.55419921875, 14.115234375, 14.67626953125, 15.2373046875, 15.79833984375, 16.359375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 9.0, 2.0, 4.0, 5.0, 10.0, 11.0, 21.0, 15.0, 27.0, 25.0, 30.0, 40.0, 41.0, 31.0, 31.0, 43.0, 31.0, 56.0, 37.0, 45.0, 35.0, 41.0, 39.0, 50.0, 45.0, 30.0, 36.0, 39.0, 17.0, 24.0, 27.0, 22.0, 9.0, 18.0, 9.0, 9.0, 7.0, 9.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.4140625, -9.14239501953125, -8.8707275390625, -8.59906005859375, -8.327392578125, -8.05572509765625, -7.7840576171875, -7.51239013671875, -7.24072265625, -6.96905517578125, -6.6973876953125, -6.42572021484375, -6.154052734375, -5.88238525390625, -5.6107177734375, -5.33905029296875, -5.0673828125, -4.79571533203125, -4.5240478515625, -4.25238037109375, -3.980712890625, -3.70904541015625, -3.4373779296875, -3.16571044921875, -2.89404296875, -2.62237548828125, -2.3507080078125, -2.07904052734375, -1.807373046875, -1.53570556640625, -1.2640380859375, -0.99237060546875, -0.720703125, -0.44903564453125, -0.1773681640625, 0.09429931640625, 0.365966796875, 0.63763427734375, 0.9093017578125, 1.18096923828125, 1.45263671875, 1.72430419921875, 1.9959716796875, 2.26763916015625, 2.539306640625, 2.81097412109375, 3.0826416015625, 3.35430908203125, 3.6259765625, 3.89764404296875, 4.1693115234375, 4.44097900390625, 4.712646484375, 4.98431396484375, 5.2559814453125, 5.52764892578125, 5.79931640625, 6.07098388671875, 6.3426513671875, 6.61431884765625, 6.885986328125, 7.15765380859375, 7.4293212890625, 7.70098876953125, 7.97265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 8.0, 5.0, 4.0, 11.0, 24.0, 27.0, 41.0, 81.0, 98.0, 164.0, 296.0, 471.0, 845.0, 1619.0, 3532.0, 10066.0, 38545.0, 224298.0, 589595.0, 138786.0, 26312.0, 7592.0, 2906.0, 1427.0, 731.0, 408.0, 248.0, 147.0, 90.0, 59.0, 41.0, 22.0, 16.0, 13.0, 9.0, 10.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-11.6953125, -11.373779296875, -11.05224609375, -10.730712890625, -10.4091796875, -10.087646484375, -9.76611328125, -9.444580078125, -9.123046875, -8.801513671875, -8.47998046875, -8.158447265625, -7.8369140625, -7.515380859375, -7.19384765625, -6.872314453125, -6.55078125, -6.229248046875, -5.90771484375, -5.586181640625, -5.2646484375, -4.943115234375, -4.62158203125, -4.300048828125, -3.978515625, -3.656982421875, -3.33544921875, -3.013916015625, -2.6923828125, -2.370849609375, -2.04931640625, -1.727783203125, -1.40625, -1.084716796875, -0.76318359375, -0.441650390625, -0.1201171875, 0.201416015625, 0.52294921875, 0.844482421875, 1.166015625, 1.487548828125, 1.80908203125, 2.130615234375, 2.4521484375, 2.773681640625, 3.09521484375, 3.416748046875, 3.73828125, 4.059814453125, 4.38134765625, 4.702880859375, 5.0244140625, 5.345947265625, 5.66748046875, 5.989013671875, 6.310546875, 6.632080078125, 6.95361328125, 7.275146484375, 7.5966796875, 7.918212890625, 8.23974609375, 8.561279296875, 8.8828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 6.0, 6.0, 7.0, 20.0, 21.0, 33.0, 43.0, 64.0, 60.0, 93.0, 127.0, 142.0, 117.0, 70.0, 62.0, 35.0, 19.0, 28.0, 13.0, 10.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001220703125, -0.0011721402406692505, -0.001123577356338501, -0.0010750144720077515, -0.001026451587677002, -0.0009778887033462524, -0.0009293258190155029, -0.0008807629346847534, -0.0008322000503540039, -0.0007836371660232544, -0.0007350742816925049, -0.0006865113973617554, -0.0006379485130310059, -0.0005893856287002563, -0.0005408227443695068, -0.0004922598600387573, -0.0004436969757080078, -0.0003951340913772583, -0.0003465712070465088, -0.0002980083227157593, -0.00024944543838500977, -0.00020088255405426025, -0.00015231966972351074, -0.00010375678539276123, -5.519390106201172e-05, -6.631016731262207e-06, 4.1931867599487305e-05, 9.049475193023682e-05, 0.00013905763626098633, 0.00018762052059173584, 0.00023618340492248535, 0.00028474628925323486, 0.0003333091735839844, 0.0003818720579147339, 0.0004304349422454834, 0.0004789978265762329, 0.0005275607109069824, 0.0005761235952377319, 0.0006246864795684814, 0.000673249363899231, 0.0007218122482299805, 0.00077037513256073, 0.0008189380168914795, 0.000867500901222229, 0.0009160637855529785, 0.000964626669883728, 0.0010131895542144775, 0.001061752438545227, 0.0011103153228759766, 0.001158878207206726, 0.0012074410915374756, 0.001256003975868225, 0.0013045668601989746, 0.0013531297445297241, 0.0014016926288604736, 0.0014502555131912231, 0.0014988183975219727, 0.0015473812818527222, 0.0015959441661834717, 0.0016445070505142212, 0.0016930699348449707, 0.0017416328191757202, 0.0017901957035064697, 0.0018387585878372192, 0.0018873214721679688]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 6.0, 3.0, 11.0, 13.0, 14.0, 22.0, 45.0, 86.0, 160.0, 288.0, 511.0, 1076.0, 3058.0, 12962.0, 133436.0, 794380.0, 87717.0, 10112.0, 2634.0, 949.0, 503.0, 250.0, 117.0, 75.0, 35.0, 31.0, 14.0, 12.0, 7.0, 3.0, 7.0, 4.0, 7.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.25, -17.73486328125, -17.2197265625, -16.70458984375, -16.189453125, -15.67431640625, -15.1591796875, -14.64404296875, -14.12890625, -13.61376953125, -13.0986328125, -12.58349609375, -12.068359375, -11.55322265625, -11.0380859375, -10.52294921875, -10.0078125, -9.49267578125, -8.9775390625, -8.46240234375, -7.947265625, -7.43212890625, -6.9169921875, -6.40185546875, -5.88671875, -5.37158203125, -4.8564453125, -4.34130859375, -3.826171875, -3.31103515625, -2.7958984375, -2.28076171875, -1.765625, -1.25048828125, -0.7353515625, -0.22021484375, 0.294921875, 0.81005859375, 1.3251953125, 1.84033203125, 2.35546875, 2.87060546875, 3.3857421875, 3.90087890625, 4.416015625, 4.93115234375, 5.4462890625, 5.96142578125, 6.4765625, 6.99169921875, 7.5068359375, 8.02197265625, 8.537109375, 9.05224609375, 9.5673828125, 10.08251953125, 10.59765625, 11.11279296875, 11.6279296875, 12.14306640625, 12.658203125, 13.17333984375, 13.6884765625, 14.20361328125, 14.71875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 13.0, 8.0, 19.0, 35.0, 52.0, 117.0, 140.0, 167.0, 154.0, 98.0, 61.0, 48.0, 22.0, 22.0, 11.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.1953125, -11.8780517578125, -11.560791015625, -11.2435302734375, -10.92626953125, -10.6090087890625, -10.291748046875, -9.9744873046875, -9.6572265625, -9.3399658203125, -9.022705078125, -8.7054443359375, -8.38818359375, -8.0709228515625, -7.753662109375, -7.4364013671875, -7.119140625, -6.8018798828125, -6.484619140625, -6.1673583984375, -5.85009765625, -5.5328369140625, -5.215576171875, -4.8983154296875, -4.5810546875, -4.2637939453125, -3.946533203125, -3.6292724609375, -3.31201171875, -2.9947509765625, -2.677490234375, -2.3602294921875, -2.04296875, -1.7257080078125, -1.408447265625, -1.0911865234375, -0.77392578125, -0.4566650390625, -0.139404296875, 0.1778564453125, 0.4951171875, 0.8123779296875, 1.129638671875, 1.4468994140625, 1.76416015625, 2.0814208984375, 2.398681640625, 2.7159423828125, 3.033203125, 3.3504638671875, 3.667724609375, 3.9849853515625, 4.30224609375, 4.6195068359375, 4.936767578125, 5.2540283203125, 5.5712890625, 5.8885498046875, 6.205810546875, 6.5230712890625, 6.84033203125, 7.1575927734375, 7.474853515625, 7.7921142578125, 8.109375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 13.0, 23.0, 22.0, 64.0, 88.0, 115.0, 125.0, 169.0, 141.0, 86.0, 71.0, 37.0, 20.0, 11.0, 9.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.7540283203125, -65.89045715332031, -62.026885986328125, -58.16331100463867, -54.299739837646484, -50.4361686706543, -46.572593688964844, -42.709022521972656, -38.84545135498047, -34.98188018798828, -31.11830711364746, -27.25473403930664, -23.391162872314453, -19.527591705322266, -15.664018630981445, -11.800445556640625, -7.9368743896484375, -4.073302268981934, -0.2097301483154297, 3.653841972351074, 7.517414093017578, 11.380985260009766, 15.244558334350586, 19.108131408691406, 22.971702575683594, 26.83527374267578, 30.6988468170166, 34.56241989135742, 38.42599105834961, 42.2895622253418, 46.15313720703125, 50.01670837402344, 53.880279541015625, 57.74385070800781, 61.607421875, 65.47099304199219, 69.33456420898438, 73.19813537597656, 77.06171417236328, 80.92528533935547, 84.78885650634766, 88.65242767333984, 92.51599884033203, 96.37957000732422, 100.24314880371094, 104.10671997070312, 107.97029113769531, 111.8338623046875, 115.69743347167969, 119.56100463867188, 123.42457580566406, 127.28814697265625, 131.15171813964844, 135.01528930664062, 138.8788604736328, 142.742431640625, 146.60601806640625, 150.46958923339844, 154.33316040039062, 158.1967315673828, 162.060302734375, 165.9238739013672, 169.78744506835938, 173.65103149414062, 177.51458740234375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 11.0, 14.0, 15.0, 14.0, 12.0, 11.0, 15.0, 26.0, 22.0, 28.0, 34.0, 28.0, 33.0, 47.0, 51.0, 37.0, 49.0, 49.0, 42.0, 38.0, 47.0, 51.0, 43.0, 35.0, 42.0, 38.0, 29.0, 25.0, 28.0, 18.0, 15.0, 12.0, 8.0, 7.0, 8.0, 7.0, 2.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.45842742919922, -43.83392333984375, -42.20941925048828, -40.58491134643555, -38.96040725708008, -37.33590316772461, -35.71139907836914, -34.086891174316406, -32.46238708496094, -30.83788299560547, -29.213376998901367, -27.5888729095459, -25.964366912841797, -24.339862823486328, -22.71535873413086, -21.090852737426758, -19.46634864807129, -17.84184455871582, -16.21733856201172, -14.59283447265625, -12.968328475952148, -11.34382438659668, -9.719319343566895, -8.09481430053711, -6.470309257507324, -4.845804214477539, -3.221299409866333, -1.596794605255127, 0.027710437774658203, 1.6522150039672852, 3.2767200469970703, 4.9012250900268555, 6.525730133056641, 8.150235176086426, 9.774740219116211, 11.39924430847168, 13.023750305175781, 14.64825439453125, 16.27275848388672, 17.89726448059082, 19.521770477294922, 21.14627456665039, 22.770780563354492, 24.39528465270996, 26.019790649414062, 27.64429473876953, 29.268798828125, 30.8933048248291, 32.51780700683594, 34.142311096191406, 35.766815185546875, 37.39132308959961, 39.01582717895508, 40.64033126831055, 42.264835357666016, 43.88934326171875, 45.51384735107422, 47.13835144042969, 48.762855529785156, 50.38736343383789, 52.01186752319336, 53.63637161254883, 55.2608757019043, 56.88538360595703, 58.5098876953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 8.0, 10.0, 9.0, 20.0, 24.0, 33.0, 44.0, 62.0, 115.0, 141.0, 235.0, 374.0, 685.0, 1445.0, 3420.0, 11170.0, 52950.0, 1643128.0, 2406025.0, 56311.0, 11596.0, 3595.0, 1346.0, 694.0, 332.0, 190.0, 112.0, 61.0, 57.0, 26.0, 21.0, 13.0, 8.0, 9.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.640625, -25.722412109375, -24.80419921875, -23.885986328125, -22.9677734375, -22.049560546875, -21.13134765625, -20.213134765625, -19.294921875, -18.376708984375, -17.45849609375, -16.540283203125, -15.6220703125, -14.703857421875, -13.78564453125, -12.867431640625, -11.94921875, -11.031005859375, -10.11279296875, -9.194580078125, -8.2763671875, -7.358154296875, -6.43994140625, -5.521728515625, -4.603515625, -3.685302734375, -2.76708984375, -1.848876953125, -0.9306640625, -0.012451171875, 0.90576171875, 1.823974609375, 2.7421875, 3.660400390625, 4.57861328125, 5.496826171875, 6.4150390625, 7.333251953125, 8.25146484375, 9.169677734375, 10.087890625, 11.006103515625, 11.92431640625, 12.842529296875, 13.7607421875, 14.678955078125, 15.59716796875, 16.515380859375, 17.43359375, 18.351806640625, 19.27001953125, 20.188232421875, 21.1064453125, 22.024658203125, 22.94287109375, 23.861083984375, 24.779296875, 25.697509765625, 26.61572265625, 27.533935546875, 28.4521484375, 29.370361328125, 30.28857421875, 31.206787109375, 32.125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 9.0, 19.0, 17.0, 18.0, 43.0, 47.0, 58.0, 47.0, 83.0, 84.0, 73.0, 88.0, 72.0, 65.0, 63.0, 43.0, 44.0, 38.0, 19.0, 16.0, 18.0, 10.0, 6.0, 5.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.092681884765625, -3.97833251953125, -3.863983154296875, -3.7496337890625, -3.635284423828125, -3.52093505859375, -3.406585693359375, -3.292236328125, -3.177886962890625, -3.06353759765625, -2.949188232421875, -2.8348388671875, -2.720489501953125, -2.60614013671875, -2.491790771484375, -2.37744140625, -2.263092041015625, -2.14874267578125, -2.034393310546875, -1.9200439453125, -1.805694580078125, -1.69134521484375, -1.576995849609375, -1.462646484375, -1.348297119140625, -1.23394775390625, -1.119598388671875, -1.0052490234375, -0.890899658203125, -0.77655029296875, -0.662200927734375, -0.5478515625, -0.433502197265625, -0.31915283203125, -0.204803466796875, -0.0904541015625, 0.023895263671875, 0.13824462890625, 0.252593994140625, 0.366943359375, 0.481292724609375, 0.59564208984375, 0.709991455078125, 0.8243408203125, 0.938690185546875, 1.05303955078125, 1.167388916015625, 1.28173828125, 1.396087646484375, 1.51043701171875, 1.624786376953125, 1.7391357421875, 1.853485107421875, 1.96783447265625, 2.082183837890625, 2.196533203125, 2.310882568359375, 2.42523193359375, 2.539581298828125, 2.6539306640625, 2.768280029296875, 2.88262939453125, 2.996978759765625, 3.111328125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 6.0, 14.0, 6.0, 11.0, 18.0, 31.0, 41.0, 48.0, 77.0, 98.0, 138.0, 258.0, 448.0, 892.0, 2093.0, 5456.0, 18866.0, 95647.0, 1811424.0, 2126760.0, 101907.0, 20079.0, 5783.0, 2063.0, 911.0, 447.0, 243.0, 157.0, 106.0, 73.0, 52.0, 23.0, 20.0, 16.0, 16.0, 11.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.890625, -18.281494140625, -17.67236328125, -17.063232421875, -16.4541015625, -15.844970703125, -15.23583984375, -14.626708984375, -14.017578125, -13.408447265625, -12.79931640625, -12.190185546875, -11.5810546875, -10.971923828125, -10.36279296875, -9.753662109375, -9.14453125, -8.535400390625, -7.92626953125, -7.317138671875, -6.7080078125, -6.098876953125, -5.48974609375, -4.880615234375, -4.271484375, -3.662353515625, -3.05322265625, -2.444091796875, -1.8349609375, -1.225830078125, -0.61669921875, -0.007568359375, 0.6015625, 1.210693359375, 1.81982421875, 2.428955078125, 3.0380859375, 3.647216796875, 4.25634765625, 4.865478515625, 5.474609375, 6.083740234375, 6.69287109375, 7.302001953125, 7.9111328125, 8.520263671875, 9.12939453125, 9.738525390625, 10.34765625, 10.956787109375, 11.56591796875, 12.175048828125, 12.7841796875, 13.393310546875, 14.00244140625, 14.611572265625, 15.220703125, 15.829833984375, 16.43896484375, 17.048095703125, 17.6572265625, 18.266357421875, 18.87548828125, 19.484619140625, 20.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 7.0, 5.0, 12.0, 20.0, 35.0, 46.0, 74.0, 129.0, 232.0, 627.0, 1503.0, 710.0, 265.0, 138.0, 87.0, 55.0, 42.0, 30.0, 19.0, 8.0, 8.0, 7.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-11.234375, -10.9876708984375, -10.740966796875, -10.4942626953125, -10.24755859375, -10.0008544921875, -9.754150390625, -9.5074462890625, -9.2607421875, -9.0140380859375, -8.767333984375, -8.5206298828125, -8.27392578125, -8.0272216796875, -7.780517578125, -7.5338134765625, -7.287109375, -7.0404052734375, -6.793701171875, -6.5469970703125, -6.30029296875, -6.0535888671875, -5.806884765625, -5.5601806640625, -5.3134765625, -5.0667724609375, -4.820068359375, -4.5733642578125, -4.32666015625, -4.0799560546875, -3.833251953125, -3.5865478515625, -3.33984375, -3.0931396484375, -2.846435546875, -2.5997314453125, -2.35302734375, -2.1063232421875, -1.859619140625, -1.6129150390625, -1.3662109375, -1.1195068359375, -0.872802734375, -0.6260986328125, -0.37939453125, -0.1326904296875, 0.114013671875, 0.3607177734375, 0.607421875, 0.8541259765625, 1.100830078125, 1.3475341796875, 1.59423828125, 1.8409423828125, 2.087646484375, 2.3343505859375, 2.5810546875, 2.8277587890625, 3.074462890625, 3.3211669921875, 3.56787109375, 3.8145751953125, 4.061279296875, 4.3079833984375, 4.5546875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 13.0, 16.0, 33.0, 73.0, 112.0, 137.0, 155.0, 136.0, 136.0, 81.0, 43.0, 35.0, 14.0, 9.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.05807495117188, -66.18486785888672, -64.31166076660156, -62.43845748901367, -60.565250396728516, -58.692047119140625, -56.81884002685547, -54.94563293457031, -53.072425842285156, -51.19921875, -49.32601547241211, -47.45280838012695, -45.5796012878418, -43.706398010253906, -41.83319091796875, -39.959983825683594, -38.0867805480957, -36.21357345581055, -34.340370178222656, -32.4671630859375, -30.593955993652344, -28.72075080871582, -26.847545623779297, -24.97433853149414, -23.101133346557617, -21.227928161621094, -19.354721069335938, -17.481515884399414, -15.608309745788574, -13.735103607177734, -11.861898422241211, -9.988692283630371, -8.115486145019531, -6.242280006408691, -4.36907434463501, -2.495868682861328, -0.6226625442504883, 1.2505435943603516, 3.123748779296875, 4.996954917907715, 6.870161056518555, 8.743367195129395, 10.616573333740234, 12.489778518676758, 14.362984657287598, 16.236190795898438, 18.10939598083496, 19.982601165771484, 21.85580825805664, 23.729013442993164, 25.60222053527832, 27.475425720214844, 29.3486328125, 31.221837997436523, 33.09504318237305, 34.9682502746582, 36.841453552246094, 38.71466064453125, 40.58786392211914, 42.4610710144043, 44.33427810668945, 46.207481384277344, 48.0806884765625, 49.953895568847656, 51.82710266113281]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 5.0, 14.0, 15.0, 14.0, 18.0, 14.0, 11.0, 19.0, 24.0, 37.0, 31.0, 30.0, 38.0, 35.0, 40.0, 46.0, 42.0, 50.0, 39.0, 44.0, 45.0, 50.0, 37.0, 29.0, 42.0, 22.0, 29.0, 26.0, 26.0, 19.0, 25.0, 13.0, 17.0, 11.0, 10.0, 3.0, 7.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-22.42424774169922, -21.78011703491211, -21.135986328125, -20.49185562133789, -19.84772491455078, -19.203596115112305, -18.559465408325195, -17.915334701538086, -17.271203994750977, -16.627073287963867, -15.982942581176758, -15.338812828063965, -14.694682121276855, -14.050551414489746, -13.406421661376953, -12.762290954589844, -12.118160247802734, -11.474029541015625, -10.829898834228516, -10.185769081115723, -9.541638374328613, -8.897507667541504, -8.253377914428711, -7.609247207641602, -6.965116500854492, -6.320985794067383, -5.676855564117432, -5.0327253341674805, -4.388594627380371, -3.744464159011841, -3.1003336906433105, -2.4562034606933594, -1.81207275390625, -1.1679422855377197, -0.5238118171691895, 0.12031865119934082, 0.7644491195678711, 1.4085795879364014, 2.0527100563049316, 2.696840286254883, 3.340970993041992, 3.9851014614105225, 4.629231929779053, 5.273362159729004, 5.917492866516113, 6.561623573303223, 7.205753803253174, 7.849884033203125, 8.494014739990234, 9.138145446777344, 9.782276153564453, 10.426405906677246, 11.070536613464355, 11.714667320251465, 12.358797073364258, 13.002927780151367, 13.647058486938477, 14.291189193725586, 14.935319900512695, 15.579449653625488, 16.22357940673828, 16.86771011352539, 17.5118408203125, 18.15597152709961, 18.80010223388672]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 5.0, 8.0, 8.0, 16.0, 13.0, 21.0, 25.0, 43.0, 52.0, 87.0, 118.0, 200.0, 327.0, 481.0, 981.0, 2025.0, 5024.0, 14078.0, 49829.0, 241917.0, 581678.0, 109386.0, 27177.0, 8550.0, 3156.0, 1420.0, 739.0, 432.0, 244.0, 164.0, 105.0, 69.0, 49.0, 26.0, 32.0, 16.0, 14.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.40625, -21.666015625, -20.92578125, -20.185546875, -19.4453125, -18.705078125, -17.96484375, -17.224609375, -16.484375, -15.744140625, -15.00390625, -14.263671875, -13.5234375, -12.783203125, -12.04296875, -11.302734375, -10.5625, -9.822265625, -9.08203125, -8.341796875, -7.6015625, -6.861328125, -6.12109375, -5.380859375, -4.640625, -3.900390625, -3.16015625, -2.419921875, -1.6796875, -0.939453125, -0.19921875, 0.541015625, 1.28125, 2.021484375, 2.76171875, 3.501953125, 4.2421875, 4.982421875, 5.72265625, 6.462890625, 7.203125, 7.943359375, 8.68359375, 9.423828125, 10.1640625, 10.904296875, 11.64453125, 12.384765625, 13.125, 13.865234375, 14.60546875, 15.345703125, 16.0859375, 16.826171875, 17.56640625, 18.306640625, 19.046875, 19.787109375, 20.52734375, 21.267578125, 22.0078125, 22.748046875, 23.48828125, 24.228515625, 24.96875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 12.0, 16.0, 17.0, 16.0, 33.0, 48.0, 50.0, 50.0, 79.0, 66.0, 90.0, 74.0, 83.0, 75.0, 68.0, 43.0, 40.0, 38.0, 32.0, 11.0, 17.0, 16.0, 5.0, 2.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.946807861328125, -3.83111572265625, -3.715423583984375, -3.5997314453125, -3.484039306640625, -3.36834716796875, -3.252655029296875, -3.136962890625, -3.021270751953125, -2.90557861328125, -2.789886474609375, -2.6741943359375, -2.558502197265625, -2.44281005859375, -2.327117919921875, -2.21142578125, -2.095733642578125, -1.98004150390625, -1.864349365234375, -1.7486572265625, -1.632965087890625, -1.51727294921875, -1.401580810546875, -1.285888671875, -1.170196533203125, -1.05450439453125, -0.938812255859375, -0.8231201171875, -0.707427978515625, -0.59173583984375, -0.476043701171875, -0.3603515625, -0.244659423828125, -0.12896728515625, -0.013275146484375, 0.1024169921875, 0.218109130859375, 0.33380126953125, 0.449493408203125, 0.565185546875, 0.680877685546875, 0.79656982421875, 0.912261962890625, 1.0279541015625, 1.143646240234375, 1.25933837890625, 1.375030517578125, 1.49072265625, 1.606414794921875, 1.72210693359375, 1.837799072265625, 1.9534912109375, 2.069183349609375, 2.18487548828125, 2.300567626953125, 2.416259765625, 2.531951904296875, 2.64764404296875, 2.763336181640625, 2.8790283203125, 2.994720458984375, 3.11041259765625, 3.226104736328125, 3.341796875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 13.0, 13.0, 16.0, 22.0, 22.0, 45.0, 64.0, 80.0, 142.0, 167.0, 261.0, 434.0, 729.0, 1389.0, 3326.0, 9969.0, 36520.0, 166304.0, 615558.0, 161228.0, 35705.0, 9996.0, 3293.0, 1368.0, 700.0, 389.0, 228.0, 159.0, 101.0, 71.0, 71.0, 49.0, 36.0, 21.0, 18.0, 13.0, 4.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.609375, -21.00048828125, -20.3916015625, -19.78271484375, -19.173828125, -18.56494140625, -17.9560546875, -17.34716796875, -16.73828125, -16.12939453125, -15.5205078125, -14.91162109375, -14.302734375, -13.69384765625, -13.0849609375, -12.47607421875, -11.8671875, -11.25830078125, -10.6494140625, -10.04052734375, -9.431640625, -8.82275390625, -8.2138671875, -7.60498046875, -6.99609375, -6.38720703125, -5.7783203125, -5.16943359375, -4.560546875, -3.95166015625, -3.3427734375, -2.73388671875, -2.125, -1.51611328125, -0.9072265625, -0.29833984375, 0.310546875, 0.91943359375, 1.5283203125, 2.13720703125, 2.74609375, 3.35498046875, 3.9638671875, 4.57275390625, 5.181640625, 5.79052734375, 6.3994140625, 7.00830078125, 7.6171875, 8.22607421875, 8.8349609375, 9.44384765625, 10.052734375, 10.66162109375, 11.2705078125, 11.87939453125, 12.48828125, 13.09716796875, 13.7060546875, 14.31494140625, 14.923828125, 15.53271484375, 16.1416015625, 16.75048828125, 17.359375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 3.0, 6.0, 5.0, 11.0, 8.0, 8.0, 11.0, 18.0, 20.0, 18.0, 23.0, 27.0, 30.0, 23.0, 32.0, 39.0, 26.0, 46.0, 36.0, 48.0, 43.0, 40.0, 42.0, 42.0, 39.0, 43.0, 47.0, 32.0, 27.0, 29.0, 27.0, 28.0, 13.0, 26.0, 10.0, 20.0, 8.0, 8.0, 16.0, 3.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6097412109375, -8.313232421875, -8.0167236328125, -7.72021484375, -7.4237060546875, -7.127197265625, -6.8306884765625, -6.5341796875, -6.2376708984375, -5.941162109375, -5.6446533203125, -5.34814453125, -5.0516357421875, -4.755126953125, -4.4586181640625, -4.162109375, -3.8656005859375, -3.569091796875, -3.2725830078125, -2.97607421875, -2.6795654296875, -2.383056640625, -2.0865478515625, -1.7900390625, -1.4935302734375, -1.197021484375, -0.9005126953125, -0.60400390625, -0.3074951171875, -0.010986328125, 0.2855224609375, 0.58203125, 0.8785400390625, 1.175048828125, 1.4715576171875, 1.76806640625, 2.0645751953125, 2.361083984375, 2.6575927734375, 2.9541015625, 3.2506103515625, 3.547119140625, 3.8436279296875, 4.14013671875, 4.4366455078125, 4.733154296875, 5.0296630859375, 5.326171875, 5.6226806640625, 5.919189453125, 6.2156982421875, 6.51220703125, 6.8087158203125, 7.105224609375, 7.4017333984375, 7.6982421875, 7.9947509765625, 8.291259765625, 8.5877685546875, 8.88427734375, 9.1807861328125, 9.477294921875, 9.7738037109375, 10.0703125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 0.0, 5.0, 7.0, 5.0, 10.0, 13.0, 14.0, 18.0, 34.0, 36.0, 58.0, 116.0, 238.0, 628.0, 2188.0, 16276.0, 843572.0, 176421.0, 6802.0, 1268.0, 409.0, 169.0, 92.0, 52.0, 29.0, 23.0, 20.0, 11.0, 7.0, 4.0, 5.0, 6.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.296875, -27.407470703125, -26.51806640625, -25.628662109375, -24.7392578125, -23.849853515625, -22.96044921875, -22.071044921875, -21.181640625, -20.292236328125, -19.40283203125, -18.513427734375, -17.6240234375, -16.734619140625, -15.84521484375, -14.955810546875, -14.06640625, -13.177001953125, -12.28759765625, -11.398193359375, -10.5087890625, -9.619384765625, -8.72998046875, -7.840576171875, -6.951171875, -6.061767578125, -5.17236328125, -4.282958984375, -3.3935546875, -2.504150390625, -1.61474609375, -0.725341796875, 0.1640625, 1.053466796875, 1.94287109375, 2.832275390625, 3.7216796875, 4.611083984375, 5.50048828125, 6.389892578125, 7.279296875, 8.168701171875, 9.05810546875, 9.947509765625, 10.8369140625, 11.726318359375, 12.61572265625, 13.505126953125, 14.39453125, 15.283935546875, 16.17333984375, 17.062744140625, 17.9521484375, 18.841552734375, 19.73095703125, 20.620361328125, 21.509765625, 22.399169921875, 23.28857421875, 24.177978515625, 25.0673828125, 25.956787109375, 26.84619140625, 27.735595703125, 28.625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 10.0, 13.0, 14.0, 22.0, 17.0, 33.0, 52.0, 103.0, 155.0, 198.0, 132.0, 62.0, 43.0, 29.0, 18.0, 19.0, 17.0, 9.0, 10.0, 9.0, 4.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011167526245117188, -0.0010707974433898926, -0.0010248422622680664, -0.0009788870811462402, -0.0009329319000244141, -0.0008869767189025879, -0.0008410215377807617, -0.0007950663566589355, -0.0007491111755371094, -0.0007031559944152832, -0.000657200813293457, -0.0006112456321716309, -0.0005652904510498047, -0.0005193352699279785, -0.00047338008880615234, -0.00042742490768432617, -0.0003814697265625, -0.00033551454544067383, -0.00028955936431884766, -0.00024360418319702148, -0.0001976490020751953, -0.00015169382095336914, -0.00010573863983154297, -5.97834587097168e-05, -1.3828277587890625e-05, 3.212690353393555e-05, 7.808208465576172e-05, 0.0001240372657775879, 0.00016999244689941406, 0.00021594762802124023, 0.0002619028091430664, 0.0003078579902648926, 0.00035381317138671875, 0.0003997683525085449, 0.0004457235336303711, 0.0004916787147521973, 0.0005376338958740234, 0.0005835890769958496, 0.0006295442581176758, 0.000675499439239502, 0.0007214546203613281, 0.0007674098014831543, 0.0008133649826049805, 0.0008593201637268066, 0.0009052753448486328, 0.000951230525970459, 0.0009971857070922852, 0.0010431408882141113, 0.0010890960693359375, 0.0011350512504577637, 0.0011810064315795898, 0.001226961612701416, 0.0012729167938232422, 0.0013188719749450684, 0.0013648271560668945, 0.0014107823371887207, 0.0014567375183105469, 0.001502692699432373, 0.0015486478805541992, 0.0015946030616760254, 0.0016405582427978516, 0.0016865134239196777, 0.001732468605041504, 0.00177842378616333, 0.0018243789672851562]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 2.0, 4.0, 6.0, 13.0, 11.0, 21.0, 24.0, 57.0, 123.0, 209.0, 474.0, 1263.0, 4917.0, 90316.0, 938915.0, 8955.0, 1974.0, 659.0, 300.0, 135.0, 73.0, 28.0, 29.0, 10.0, 12.0, 4.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.50146484375, -36.9716796875, -35.44189453125, -33.912109375, -32.38232421875, -30.8525390625, -29.32275390625, -27.79296875, -26.26318359375, -24.7333984375, -23.20361328125, -21.673828125, -20.14404296875, -18.6142578125, -17.08447265625, -15.5546875, -14.02490234375, -12.4951171875, -10.96533203125, -9.435546875, -7.90576171875, -6.3759765625, -4.84619140625, -3.31640625, -1.78662109375, -0.2568359375, 1.27294921875, 2.802734375, 4.33251953125, 5.8623046875, 7.39208984375, 8.921875, 10.45166015625, 11.9814453125, 13.51123046875, 15.041015625, 16.57080078125, 18.1005859375, 19.63037109375, 21.16015625, 22.68994140625, 24.2197265625, 25.74951171875, 27.279296875, 28.80908203125, 30.3388671875, 31.86865234375, 33.3984375, 34.92822265625, 36.4580078125, 37.98779296875, 39.517578125, 41.04736328125, 42.5771484375, 44.10693359375, 45.63671875, 47.16650390625, 48.6962890625, 50.22607421875, 51.755859375, 53.28564453125, 54.8154296875, 56.34521484375, 57.875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 13.0, 29.0, 63.0, 358.0, 369.0, 78.0, 30.0, 12.0, 13.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.640625, -23.819091796875, -22.99755859375, -22.176025390625, -21.3544921875, -20.532958984375, -19.71142578125, -18.889892578125, -18.068359375, -17.246826171875, -16.42529296875, -15.603759765625, -14.7822265625, -13.960693359375, -13.13916015625, -12.317626953125, -11.49609375, -10.674560546875, -9.85302734375, -9.031494140625, -8.2099609375, -7.388427734375, -6.56689453125, -5.745361328125, -4.923828125, -4.102294921875, -3.28076171875, -2.459228515625, -1.6376953125, -0.816162109375, 0.00537109375, 0.826904296875, 1.6484375, 2.469970703125, 3.29150390625, 4.113037109375, 4.9345703125, 5.756103515625, 6.57763671875, 7.399169921875, 8.220703125, 9.042236328125, 9.86376953125, 10.685302734375, 11.5068359375, 12.328369140625, 13.14990234375, 13.971435546875, 14.79296875, 15.614501953125, 16.43603515625, 17.257568359375, 18.0791015625, 18.900634765625, 19.72216796875, 20.543701171875, 21.365234375, 22.186767578125, 23.00830078125, 23.829833984375, 24.6513671875, 25.472900390625, 26.29443359375, 27.115966796875, 27.9375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 49.0, 276.0, 489.0, 153.0, 25.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-273.4330139160156, -259.2737731933594, -245.11451721191406, -230.95526123046875, -216.7960205078125, -202.63677978515625, -188.47752380371094, -174.31826782226562, -160.15902709960938, -145.99978637695312, -131.8405303955078, -117.68128204345703, -103.52203369140625, -89.36278533935547, -75.20353698730469, -61.044288635253906, -46.885040283203125, -32.725791931152344, -18.566543579101562, -4.407295227050781, 9.751953125, 23.91120147705078, 38.07044982910156, 52.229698181152344, 66.38894653320312, 80.5481948852539, 94.70744323730469, 108.86669158935547, 123.02593994140625, 137.1851806640625, 151.3444366455078, 165.50369262695312, 179.6629638671875, 193.82220458984375, 207.98146057128906, 222.14071655273438, 236.29995727539062, 250.45919799804688, 264.61846923828125, 278.7777099609375, 292.93695068359375, 307.09619140625, 321.25543212890625, 335.4147033691406, 349.5739440917969, 363.7331848144531, 377.8924560546875, 392.05169677734375, 406.2109375, 420.37017822265625, 434.5294189453125, 448.6886901855469, 462.8479309082031, 477.0071716308594, 491.16644287109375, 505.32568359375, 519.4849243164062, 533.6441650390625, 547.8034057617188, 561.962646484375, 576.1219482421875, 590.2811889648438, 604.4404296875, 618.5996704101562, 632.7589111328125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 11.0, 9.0, 2.0, 8.0, 20.0, 33.0, 44.0, 29.0, 43.0, 64.0, 83.0, 65.0, 71.0, 58.0, 57.0, 68.0, 65.0, 50.0, 44.0, 41.0, 36.0, 32.0, 25.0, 15.0, 3.0, 11.0, 6.0, 5.0, 3.0, 5.0, 0.0, 1.0, 1.0], "bins": [-119.6133804321289, -116.91424560546875, -114.2151107788086, -111.51597595214844, -108.81684112548828, -106.11770629882812, -103.41856384277344, -100.71943664550781, -98.02029418945312, -95.32115936279297, -92.62202453613281, -89.92288970947266, -87.2237548828125, -84.52462005615234, -81.82548522949219, -79.1263427734375, -76.42721557617188, -73.72808074951172, -71.02894592285156, -68.3298110961914, -65.63067626953125, -62.931541442871094, -60.23240280151367, -57.533267974853516, -54.83413314819336, -52.1349983215332, -49.43586349487305, -46.736724853515625, -44.03759002685547, -41.33845520019531, -38.639320373535156, -35.940185546875, -33.24104690551758, -30.541912078857422, -27.842777252197266, -25.143640518188477, -22.44450569152832, -19.745370864868164, -17.046234130859375, -14.347099304199219, -11.647964477539062, -8.948829650878906, -6.249693870544434, -3.550558090209961, -0.8514232635498047, 1.8477115631103516, 4.546848297119141, 7.245983123779297, 9.945117950439453, 12.64425277709961, 15.343388557434082, 18.042524337768555, 20.74165916442871, 23.440793991088867, 26.139930725097656, 28.839065551757812, 31.53820037841797, 34.237335205078125, 36.93647003173828, 39.63560485839844, 42.334739685058594, 45.03387451171875, 47.73301315307617, 50.43214797973633, 53.131282806396484]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 3.0, 10.0, 10.0, 14.0, 20.0, 17.0, 27.0, 37.0, 45.0, 58.0, 81.0, 101.0, 136.0, 160.0, 215.0, 346.0, 629.0, 1107.0, 2470.0, 5424.0, 14726.0, 55974.0, 689430.0, 3299828.0, 89832.0, 20557.0, 6955.0, 2929.0, 1331.0, 703.0, 397.0, 208.0, 145.0, 116.0, 81.0, 29.0, 34.0, 23.0, 18.0, 13.0, 11.0, 10.0, 4.0, 7.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.859375, -24.034423828125, -23.20947265625, -22.384521484375, -21.5595703125, -20.734619140625, -19.90966796875, -19.084716796875, -18.259765625, -17.434814453125, -16.60986328125, -15.784912109375, -14.9599609375, -14.135009765625, -13.31005859375, -12.485107421875, -11.66015625, -10.835205078125, -10.01025390625, -9.185302734375, -8.3603515625, -7.535400390625, -6.71044921875, -5.885498046875, -5.060546875, -4.235595703125, -3.41064453125, -2.585693359375, -1.7607421875, -0.935791015625, -0.11083984375, 0.714111328125, 1.5390625, 2.364013671875, 3.18896484375, 4.013916015625, 4.8388671875, 5.663818359375, 6.48876953125, 7.313720703125, 8.138671875, 8.963623046875, 9.78857421875, 10.613525390625, 11.4384765625, 12.263427734375, 13.08837890625, 13.913330078125, 14.73828125, 15.563232421875, 16.38818359375, 17.213134765625, 18.0380859375, 18.863037109375, 19.68798828125, 20.512939453125, 21.337890625, 22.162841796875, 22.98779296875, 23.812744140625, 24.6376953125, 25.462646484375, 26.28759765625, 27.112548828125, 27.9375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 10.0, 9.0, 14.0, 15.0, 31.0, 37.0, 40.0, 51.0, 69.0, 70.0, 72.0, 72.0, 81.0, 78.0, 62.0, 51.0, 49.0, 45.0, 34.0, 31.0, 22.0, 16.0, 15.0, 7.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.13671875, -4.01837158203125, -3.9000244140625, -3.78167724609375, -3.663330078125, -3.54498291015625, -3.4266357421875, -3.30828857421875, -3.18994140625, -3.07159423828125, -2.9532470703125, -2.83489990234375, -2.716552734375, -2.59820556640625, -2.4798583984375, -2.36151123046875, -2.2431640625, -2.12481689453125, -2.0064697265625, -1.88812255859375, -1.769775390625, -1.65142822265625, -1.5330810546875, -1.41473388671875, -1.29638671875, -1.17803955078125, -1.0596923828125, -0.94134521484375, -0.822998046875, -0.70465087890625, -0.5863037109375, -0.46795654296875, -0.349609375, -0.23126220703125, -0.1129150390625, 0.00543212890625, 0.123779296875, 0.24212646484375, 0.3604736328125, 0.47882080078125, 0.59716796875, 0.71551513671875, 0.8338623046875, 0.95220947265625, 1.070556640625, 1.18890380859375, 1.3072509765625, 1.42559814453125, 1.5439453125, 1.66229248046875, 1.7806396484375, 1.89898681640625, 2.017333984375, 2.13568115234375, 2.2540283203125, 2.37237548828125, 2.49072265625, 2.60906982421875, 2.7274169921875, 2.84576416015625, 2.964111328125, 3.08245849609375, 3.2008056640625, 3.31915283203125, 3.4375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 11.0, 11.0, 17.0, 21.0, 32.0, 61.0, 67.0, 118.0, 177.0, 295.0, 514.0, 944.0, 1947.0, 4085.0, 9961.0, 27616.0, 114249.0, 2078846.0, 1799501.0, 110955.0, 27242.0, 9783.0, 3883.0, 1821.0, 861.0, 505.0, 266.0, 165.0, 113.0, 75.0, 41.0, 34.0, 27.0, 12.0, 11.0, 6.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.2725830078125, -15.763916015625, -15.2552490234375, -14.74658203125, -14.2379150390625, -13.729248046875, -13.2205810546875, -12.7119140625, -12.2032470703125, -11.694580078125, -11.1859130859375, -10.67724609375, -10.1685791015625, -9.659912109375, -9.1512451171875, -8.642578125, -8.1339111328125, -7.625244140625, -7.1165771484375, -6.60791015625, -6.0992431640625, -5.590576171875, -5.0819091796875, -4.5732421875, -4.0645751953125, -3.555908203125, -3.0472412109375, -2.53857421875, -2.0299072265625, -1.521240234375, -1.0125732421875, -0.50390625, 0.0047607421875, 0.513427734375, 1.0220947265625, 1.53076171875, 2.0394287109375, 2.548095703125, 3.0567626953125, 3.5654296875, 4.0740966796875, 4.582763671875, 5.0914306640625, 5.60009765625, 6.1087646484375, 6.617431640625, 7.1260986328125, 7.634765625, 8.1434326171875, 8.652099609375, 9.1607666015625, 9.66943359375, 10.1781005859375, 10.686767578125, 11.1954345703125, 11.7041015625, 12.2127685546875, 12.721435546875, 13.2301025390625, 13.73876953125, 14.2474365234375, 14.756103515625, 15.2647705078125, 15.7734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 4.0, 3.0, 8.0, 5.0, 12.0, 13.0, 21.0, 29.0, 56.0, 90.0, 197.0, 452.0, 1456.0, 994.0, 348.0, 144.0, 89.0, 50.0, 32.0, 23.0, 17.0, 9.0, 3.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.3817138671875, -7.150146484375, -6.9185791015625, -6.68701171875, -6.4554443359375, -6.223876953125, -5.9923095703125, -5.7607421875, -5.5291748046875, -5.297607421875, -5.0660400390625, -4.83447265625, -4.6029052734375, -4.371337890625, -4.1397705078125, -3.908203125, -3.6766357421875, -3.445068359375, -3.2135009765625, -2.98193359375, -2.7503662109375, -2.518798828125, -2.2872314453125, -2.0556640625, -1.8240966796875, -1.592529296875, -1.3609619140625, -1.12939453125, -0.8978271484375, -0.666259765625, -0.4346923828125, -0.203125, 0.0284423828125, 0.260009765625, 0.4915771484375, 0.72314453125, 0.9547119140625, 1.186279296875, 1.4178466796875, 1.6494140625, 1.8809814453125, 2.112548828125, 2.3441162109375, 2.57568359375, 2.8072509765625, 3.038818359375, 3.2703857421875, 3.501953125, 3.7335205078125, 3.965087890625, 4.1966552734375, 4.42822265625, 4.6597900390625, 4.891357421875, 5.1229248046875, 5.3544921875, 5.5860595703125, 5.817626953125, 6.0491943359375, 6.28076171875, 6.5123291015625, 6.743896484375, 6.9754638671875, 7.20703125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 7.0, 17.0, 18.0, 25.0, 46.0, 88.0, 127.0, 127.0, 157.0, 133.0, 90.0, 69.0, 41.0, 24.0, 13.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.59861373901367, -57.10755920410156, -55.61650466918945, -54.125450134277344, -52.6343994140625, -51.14334487915039, -49.65229034423828, -48.16123580932617, -46.67018127441406, -45.17912673950195, -43.688072204589844, -42.197017669677734, -40.705963134765625, -39.21491241455078, -37.72385787963867, -36.23280334472656, -34.74174880981445, -33.250694274902344, -31.759639739990234, -30.268587112426758, -28.77753257751465, -27.28647804260254, -25.795425415039062, -24.304370880126953, -22.813316345214844, -21.322261810302734, -19.831207275390625, -18.34015464782715, -16.84910011291504, -15.35804557800293, -13.866991996765137, -12.375938415527344, -10.884883880615234, -9.393829345703125, -7.902775764465332, -6.411721706390381, -4.92066764831543, -3.4296135902404785, -1.9385595321655273, -0.4475059509277344, 1.043548583984375, 2.534602642059326, 4.025656700134277, 5.5167107582092285, 7.00776481628418, 8.498819351196289, 9.989872932434082, 11.480926513671875, 12.971981048583984, 14.463035583496094, 15.954089164733887, 17.44514274597168, 18.93619728088379, 20.4272518157959, 21.918304443359375, 23.409358978271484, 24.900413513183594, 26.391468048095703, 27.882522583007812, 29.37357521057129, 30.8646297454834, 32.355682373046875, 33.846736907958984, 35.337791442871094, 36.8288459777832]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 7.0, 10.0, 9.0, 12.0, 17.0, 21.0, 28.0, 52.0, 46.0, 43.0, 59.0, 62.0, 60.0, 81.0, 75.0, 82.0, 70.0, 48.0, 47.0, 46.0, 31.0, 23.0, 20.0, 18.0, 12.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.358570098876953, -30.502370834350586, -29.646169662475586, -28.78997039794922, -27.93376922607422, -27.07756996154785, -26.221370697021484, -25.365169525146484, -24.508968353271484, -23.652769088745117, -22.796567916870117, -21.94036865234375, -21.08416748046875, -20.227968215942383, -19.371768951416016, -18.515567779541016, -17.65936851501465, -16.80316925048828, -15.946968078613281, -15.090768814086914, -14.234567642211914, -13.378368377685547, -12.522168159484863, -11.66596794128418, -10.809767723083496, -9.953567504882812, -9.097367286682129, -8.241167068481445, -7.38496732711792, -6.528767108917236, -5.672567367553711, -4.816367149353027, -3.960165023803711, -3.1039648056030273, -2.247764825820923, -1.3915648460388184, -0.5353646278381348, 0.32083559036254883, 1.1770353317260742, 2.033235549926758, 2.8894357681274414, 3.745635986328125, 4.601836204528809, 5.458035945892334, 6.314236164093018, 7.170436382293701, 8.026636123657227, 8.88283634185791, 9.739036560058594, 10.595236778259277, 11.451436996459961, 12.307636260986328, 13.163837432861328, 14.020036697387695, 14.876236915588379, 15.732437133789062, 16.588638305664062, 17.44483757019043, 18.30103874206543, 19.157238006591797, 20.013439178466797, 20.869638442993164, 21.72583770751953, 22.58203887939453, 23.4382381439209]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 10.0, 10.0, 19.0, 23.0, 36.0, 47.0, 84.0, 131.0, 220.0, 344.0, 588.0, 1214.0, 3084.0, 9930.0, 39117.0, 208120.0, 645837.0, 105324.0, 23598.0, 6437.0, 2199.0, 917.0, 486.0, 288.0, 177.0, 107.0, 78.0, 38.0, 28.0, 14.0, 15.0, 12.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.046875, -26.2587890625, -25.470703125, -24.6826171875, -23.89453125, -23.1064453125, -22.318359375, -21.5302734375, -20.7421875, -19.9541015625, -19.166015625, -18.3779296875, -17.58984375, -16.8017578125, -16.013671875, -15.2255859375, -14.4375, -13.6494140625, -12.861328125, -12.0732421875, -11.28515625, -10.4970703125, -9.708984375, -8.9208984375, -8.1328125, -7.3447265625, -6.556640625, -5.7685546875, -4.98046875, -4.1923828125, -3.404296875, -2.6162109375, -1.828125, -1.0400390625, -0.251953125, 0.5361328125, 1.32421875, 2.1123046875, 2.900390625, 3.6884765625, 4.4765625, 5.2646484375, 6.052734375, 6.8408203125, 7.62890625, 8.4169921875, 9.205078125, 9.9931640625, 10.78125, 11.5693359375, 12.357421875, 13.1455078125, 13.93359375, 14.7216796875, 15.509765625, 16.2978515625, 17.0859375, 17.8740234375, 18.662109375, 19.4501953125, 20.23828125, 21.0263671875, 21.814453125, 22.6025390625, 23.390625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 13.0, 27.0, 21.0, 25.0, 32.0, 47.0, 61.0, 75.0, 66.0, 75.0, 69.0, 95.0, 71.0, 44.0, 49.0, 46.0, 48.0, 32.0, 22.0, 20.0, 17.0, 12.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.03607177734375, -3.9119873046875, -3.78790283203125, -3.663818359375, -3.53973388671875, -3.4156494140625, -3.29156494140625, -3.16748046875, -3.04339599609375, -2.9193115234375, -2.79522705078125, -2.671142578125, -2.54705810546875, -2.4229736328125, -2.29888916015625, -2.1748046875, -2.05072021484375, -1.9266357421875, -1.80255126953125, -1.678466796875, -1.55438232421875, -1.4302978515625, -1.30621337890625, -1.18212890625, -1.05804443359375, -0.9339599609375, -0.80987548828125, -0.685791015625, -0.56170654296875, -0.4376220703125, -0.31353759765625, -0.189453125, -0.06536865234375, 0.0587158203125, 0.18280029296875, 0.306884765625, 0.43096923828125, 0.5550537109375, 0.67913818359375, 0.80322265625, 0.92730712890625, 1.0513916015625, 1.17547607421875, 1.299560546875, 1.42364501953125, 1.5477294921875, 1.67181396484375, 1.7958984375, 1.91998291015625, 2.0440673828125, 2.16815185546875, 2.292236328125, 2.41632080078125, 2.5404052734375, 2.66448974609375, 2.78857421875, 2.91265869140625, 3.0367431640625, 3.16082763671875, 3.284912109375, 3.40899658203125, 3.5330810546875, 3.65716552734375, 3.78125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 15.0, 12.0, 29.0, 34.0, 57.0, 71.0, 114.0, 145.0, 289.0, 470.0, 1012.0, 2266.0, 5529.0, 14565.0, 39315.0, 124923.0, 499911.0, 256082.0, 65260.0, 23178.0, 8760.0, 3381.0, 1475.0, 700.0, 319.0, 218.0, 141.0, 89.0, 52.0, 32.0, 27.0, 21.0, 16.0, 8.0, 3.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-13.25, -12.83251953125, -12.4150390625, -11.99755859375, -11.580078125, -11.16259765625, -10.7451171875, -10.32763671875, -9.91015625, -9.49267578125, -9.0751953125, -8.65771484375, -8.240234375, -7.82275390625, -7.4052734375, -6.98779296875, -6.5703125, -6.15283203125, -5.7353515625, -5.31787109375, -4.900390625, -4.48291015625, -4.0654296875, -3.64794921875, -3.23046875, -2.81298828125, -2.3955078125, -1.97802734375, -1.560546875, -1.14306640625, -0.7255859375, -0.30810546875, 0.109375, 0.52685546875, 0.9443359375, 1.36181640625, 1.779296875, 2.19677734375, 2.6142578125, 3.03173828125, 3.44921875, 3.86669921875, 4.2841796875, 4.70166015625, 5.119140625, 5.53662109375, 5.9541015625, 6.37158203125, 6.7890625, 7.20654296875, 7.6240234375, 8.04150390625, 8.458984375, 8.87646484375, 9.2939453125, 9.71142578125, 10.12890625, 10.54638671875, 10.9638671875, 11.38134765625, 11.798828125, 12.21630859375, 12.6337890625, 13.05126953125, 13.46875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 5.0, 9.0, 9.0, 14.0, 7.0, 16.0, 15.0, 19.0, 26.0, 24.0, 32.0, 33.0, 32.0, 32.0, 43.0, 36.0, 32.0, 43.0, 43.0, 45.0, 40.0, 36.0, 38.0, 31.0, 36.0, 32.0, 39.0, 25.0, 21.0, 25.0, 19.0, 21.0, 18.0, 11.0, 4.0, 7.0, 10.0, 11.0, 7.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0], "bins": [-9.640625, -9.3623046875, -9.083984375, -8.8056640625, -8.52734375, -8.2490234375, -7.970703125, -7.6923828125, -7.4140625, -7.1357421875, -6.857421875, -6.5791015625, -6.30078125, -6.0224609375, -5.744140625, -5.4658203125, -5.1875, -4.9091796875, -4.630859375, -4.3525390625, -4.07421875, -3.7958984375, -3.517578125, -3.2392578125, -2.9609375, -2.6826171875, -2.404296875, -2.1259765625, -1.84765625, -1.5693359375, -1.291015625, -1.0126953125, -0.734375, -0.4560546875, -0.177734375, 0.1005859375, 0.37890625, 0.6572265625, 0.935546875, 1.2138671875, 1.4921875, 1.7705078125, 2.048828125, 2.3271484375, 2.60546875, 2.8837890625, 3.162109375, 3.4404296875, 3.71875, 3.9970703125, 4.275390625, 4.5537109375, 4.83203125, 5.1103515625, 5.388671875, 5.6669921875, 5.9453125, 6.2236328125, 6.501953125, 6.7802734375, 7.05859375, 7.3369140625, 7.615234375, 7.8935546875, 8.171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 23.0, 25.0, 29.0, 59.0, 91.0, 121.0, 202.0, 382.0, 770.0, 1789.0, 5011.0, 14403.0, 46850.0, 206716.0, 548339.0, 164702.0, 39265.0, 12432.0, 4174.0, 1620.0, 667.0, 351.0, 176.0, 107.0, 65.0, 47.0, 38.0, 19.0, 16.0, 13.0, 13.0, 10.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.724609375, -3.550811767578125, -3.37701416015625, -3.203216552734375, -3.0294189453125, -2.855621337890625, -2.68182373046875, -2.508026123046875, -2.334228515625, -2.160430908203125, -1.98663330078125, -1.812835693359375, -1.6390380859375, -1.465240478515625, -1.29144287109375, -1.117645263671875, -0.94384765625, -0.770050048828125, -0.59625244140625, -0.422454833984375, -0.2486572265625, -0.074859619140625, 0.09893798828125, 0.272735595703125, 0.446533203125, 0.620330810546875, 0.79412841796875, 0.967926025390625, 1.1417236328125, 1.315521240234375, 1.48931884765625, 1.663116455078125, 1.8369140625, 2.010711669921875, 2.18450927734375, 2.358306884765625, 2.5321044921875, 2.705902099609375, 2.87969970703125, 3.053497314453125, 3.227294921875, 3.401092529296875, 3.57489013671875, 3.748687744140625, 3.9224853515625, 4.096282958984375, 4.27008056640625, 4.443878173828125, 4.61767578125, 4.791473388671875, 4.96527099609375, 5.139068603515625, 5.3128662109375, 5.486663818359375, 5.66046142578125, 5.834259033203125, 6.008056640625, 6.181854248046875, 6.35565185546875, 6.529449462890625, 6.7032470703125, 6.877044677734375, 7.05084228515625, 7.224639892578125, 7.3984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 3.0, 3.0, 11.0, 4.0, 14.0, 6.0, 12.0, 18.0, 10.0, 15.0, 31.0, 61.0, 115.0, 190.0, 204.0, 103.0, 54.0, 34.0, 17.0, 20.0, 16.0, 11.0, 13.0, 10.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0014553070068359375, -0.0014198347926139832, -0.0013843625783920288, -0.0013488903641700745, -0.0013134181499481201, -0.0012779459357261658, -0.0012424737215042114, -0.001207001507282257, -0.0011715292930603027, -0.0011360570788383484, -0.001100584864616394, -0.0010651126503944397, -0.0010296404361724854, -0.000994168221950531, -0.0009586960077285767, -0.0009232237935066223, -0.000887751579284668, -0.0008522793650627136, -0.0008168071508407593, -0.0007813349366188049, -0.0007458627223968506, -0.0007103905081748962, -0.0006749182939529419, -0.0006394460797309875, -0.0006039738655090332, -0.0005685016512870789, -0.0005330294370651245, -0.0004975572228431702, -0.0004620850086212158, -0.0004266127943992615, -0.00039114058017730713, -0.0003556683659553528, -0.00032019615173339844, -0.0002847239375114441, -0.00024925172328948975, -0.0002137795090675354, -0.00017830729484558105, -0.0001428350806236267, -0.00010736286640167236, -7.189065217971802e-05, -3.641843795776367e-05, -9.462237358093262e-07, 3.452599048614502e-05, 6.999820470809937e-05, 0.00010547041893005371, 0.00014094263315200806, 0.0001764148473739624, 0.00021188706159591675, 0.0002473592758178711, 0.00028283149003982544, 0.0003183037042617798, 0.00035377591848373413, 0.0003892481327056885, 0.0004247203469276428, 0.00046019256114959717, 0.0004956647753715515, 0.0005311369895935059, 0.0005666092038154602, 0.0006020814180374146, 0.0006375536322593689, 0.0006730258464813232, 0.0007084980607032776, 0.0007439702749252319, 0.0007794424891471863, 0.0008149147033691406]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 11.0, 15.0, 35.0, 39.0, 90.0, 147.0, 309.0, 600.0, 1585.0, 5553.0, 24556.0, 147404.0, 703635.0, 133823.0, 22859.0, 5208.0, 1433.0, 544.0, 306.0, 174.0, 87.0, 52.0, 27.0, 19.0, 19.0, 9.0, 2.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -8.03143310546875, -7.8050537109375, -7.57867431640625, -7.352294921875, -7.12591552734375, -6.8995361328125, -6.67315673828125, -6.44677734375, -6.22039794921875, -5.9940185546875, -5.76763916015625, -5.541259765625, -5.31488037109375, -5.0885009765625, -4.86212158203125, -4.6357421875, -4.40936279296875, -4.1829833984375, -3.95660400390625, -3.730224609375, -3.50384521484375, -3.2774658203125, -3.05108642578125, -2.82470703125, -2.59832763671875, -2.3719482421875, -2.14556884765625, -1.919189453125, -1.69281005859375, -1.4664306640625, -1.24005126953125, -1.013671875, -0.78729248046875, -0.5609130859375, -0.33453369140625, -0.108154296875, 0.11822509765625, 0.3446044921875, 0.57098388671875, 0.79736328125, 1.02374267578125, 1.2501220703125, 1.47650146484375, 1.702880859375, 1.92926025390625, 2.1556396484375, 2.38201904296875, 2.6083984375, 2.83477783203125, 3.0611572265625, 3.28753662109375, 3.513916015625, 3.74029541015625, 3.9666748046875, 4.19305419921875, 4.41943359375, 4.64581298828125, 4.8721923828125, 5.09857177734375, 5.324951171875, 5.55133056640625, 5.7777099609375, 6.00408935546875, 6.23046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 17.0, 13.0, 26.0, 28.0, 39.0, 49.0, 58.0, 80.0, 93.0, 117.0, 111.0, 73.0, 55.0, 48.0, 40.0, 18.0, 21.0, 16.0, 12.0, 10.0, 11.0, 9.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.21875, -4.10247802734375, -3.9862060546875, -3.86993408203125, -3.753662109375, -3.63739013671875, -3.5211181640625, -3.40484619140625, -3.28857421875, -3.17230224609375, -3.0560302734375, -2.93975830078125, -2.823486328125, -2.70721435546875, -2.5909423828125, -2.47467041015625, -2.3583984375, -2.24212646484375, -2.1258544921875, -2.00958251953125, -1.893310546875, -1.77703857421875, -1.6607666015625, -1.54449462890625, -1.42822265625, -1.31195068359375, -1.1956787109375, -1.07940673828125, -0.963134765625, -0.84686279296875, -0.7305908203125, -0.61431884765625, -0.498046875, -0.38177490234375, -0.2655029296875, -0.14923095703125, -0.032958984375, 0.08331298828125, 0.1995849609375, 0.31585693359375, 0.43212890625, 0.54840087890625, 0.6646728515625, 0.78094482421875, 0.897216796875, 1.01348876953125, 1.1297607421875, 1.24603271484375, 1.3623046875, 1.47857666015625, 1.5948486328125, 1.71112060546875, 1.827392578125, 1.94366455078125, 2.0599365234375, 2.17620849609375, 2.29248046875, 2.40875244140625, 2.5250244140625, 2.64129638671875, 2.757568359375, 2.87384033203125, 2.9901123046875, 3.10638427734375, 3.22265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 13.0, 18.0, 46.0, 60.0, 79.0, 137.0, 160.0, 164.0, 137.0, 79.0, 48.0, 28.0, 18.0, 10.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.22698974609375, -73.6961669921875, -70.16534423828125, -66.634521484375, -63.10369873046875, -59.5728759765625, -56.042057037353516, -52.511234283447266, -48.980411529541016, -45.449588775634766, -41.918766021728516, -38.38794708251953, -34.85712432861328, -31.3262996673584, -27.79547882080078, -24.26465606689453, -20.73383331298828, -17.20301055908203, -13.672188758850098, -10.141366958618164, -6.610544204711914, -3.079721450805664, 0.4510993957519531, 3.981922149658203, 7.512744903564453, 11.043567657470703, 14.574389457702637, 18.10521125793457, 21.63603401184082, 25.16685676574707, 28.697677612304688, 32.22850036621094, 35.75932312011719, 39.29014587402344, 42.82096862792969, 46.35179138183594, 49.88261413574219, 53.41343688964844, 56.94425582885742, 60.47507858276367, 64.00590515136719, 67.53672790527344, 71.06755065917969, 74.59837341308594, 78.12919616699219, 81.66001892089844, 85.19084167480469, 88.72166442871094, 92.25247955322266, 95.7833023071289, 99.31412506103516, 102.8449478149414, 106.37577056884766, 109.9065933227539, 113.43740844726562, 116.96823120117188, 120.49905395507812, 124.02987670898438, 127.56069946289062, 131.09152221679688, 134.62234497070312, 138.15316772460938, 141.68399047851562, 145.21481323242188, 148.74563598632812]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 12.0, 14.0, 13.0, 13.0, 22.0, 29.0, 30.0, 24.0, 26.0, 30.0, 29.0, 34.0, 47.0, 61.0, 34.0, 47.0, 34.0, 45.0, 34.0, 44.0, 43.0, 39.0, 38.0, 42.0, 25.0, 23.0, 19.0, 20.0, 24.0, 15.0, 14.0, 15.0, 11.0, 8.0, 9.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.173648834228516, -44.74121856689453, -43.30878829956055, -41.87635803222656, -40.44392395019531, -39.01149368286133, -37.579063415527344, -36.14663314819336, -34.714202880859375, -33.28177261352539, -31.849342346191406, -30.41691017150879, -28.984479904174805, -27.55204963684082, -26.119617462158203, -24.68718719482422, -23.254756927490234, -21.82232666015625, -20.389896392822266, -18.95746421813965, -17.525033950805664, -16.09260368347168, -14.660172462463379, -13.227741241455078, -11.795310974121094, -10.36288070678711, -8.930449485778809, -7.498018741607666, -6.065587997436523, -4.633157253265381, -3.2007265090942383, -1.7682952880859375, -0.3358612060546875, 1.096569538116455, 2.5290002822875977, 3.9614310264587402, 5.393861770629883, 6.826292514801025, 8.258723258972168, 9.691154479980469, 11.123584747314453, 12.556015014648438, 13.988446235656738, 15.420877456665039, 16.853307723999023, 18.285737991333008, 19.718170166015625, 21.15060043334961, 22.583030700683594, 24.015460968017578, 25.447891235351562, 26.88032341003418, 28.312753677368164, 29.74518394470215, 31.177616119384766, 32.61004638671875, 34.042476654052734, 35.47490692138672, 36.9073371887207, 38.33976745605469, 39.77220153808594, 41.20463180541992, 42.637062072753906, 44.06949234008789, 45.501922607421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 10.0, 13.0, 20.0, 28.0, 46.0, 67.0, 85.0, 135.0, 158.0, 259.0, 391.0, 717.0, 1466.0, 3344.0, 9662.0, 35301.0, 289809.0, 3707505.0, 112113.0, 21821.0, 6638.0, 2461.0, 1054.0, 524.0, 242.0, 138.0, 82.0, 61.0, 29.0, 30.0, 21.0, 12.0, 13.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.28125, -30.21435546875, -29.1474609375, -28.08056640625, -27.013671875, -25.94677734375, -24.8798828125, -23.81298828125, -22.74609375, -21.67919921875, -20.6123046875, -19.54541015625, -18.478515625, -17.41162109375, -16.3447265625, -15.27783203125, -14.2109375, -13.14404296875, -12.0771484375, -11.01025390625, -9.943359375, -8.87646484375, -7.8095703125, -6.74267578125, -5.67578125, -4.60888671875, -3.5419921875, -2.47509765625, -1.408203125, -0.34130859375, 0.7255859375, 1.79248046875, 2.859375, 3.92626953125, 4.9931640625, 6.06005859375, 7.126953125, 8.19384765625, 9.2607421875, 10.32763671875, 11.39453125, 12.46142578125, 13.5283203125, 14.59521484375, 15.662109375, 16.72900390625, 17.7958984375, 18.86279296875, 19.9296875, 20.99658203125, 22.0634765625, 23.13037109375, 24.197265625, 25.26416015625, 26.3310546875, 27.39794921875, 28.46484375, 29.53173828125, 30.5986328125, 31.66552734375, 32.732421875, 33.79931640625, 34.8662109375, 35.93310546875, 37.0]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 12.0, 16.0, 22.0, 28.0, 23.0, 40.0, 51.0, 49.0, 57.0, 64.0, 74.0, 80.0, 76.0, 70.0, 56.0, 55.0, 43.0, 40.0, 28.0, 32.0, 20.0, 11.0, 9.0, 14.0, 9.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16796875, -4.0472412109375, -3.926513671875, -3.8057861328125, -3.68505859375, -3.5643310546875, -3.443603515625, -3.3228759765625, -3.2021484375, -3.0814208984375, -2.960693359375, -2.8399658203125, -2.71923828125, -2.5985107421875, -2.477783203125, -2.3570556640625, -2.236328125, -2.1156005859375, -1.994873046875, -1.8741455078125, -1.75341796875, -1.6326904296875, -1.511962890625, -1.3912353515625, -1.2705078125, -1.1497802734375, -1.029052734375, -0.9083251953125, -0.78759765625, -0.6668701171875, -0.546142578125, -0.4254150390625, -0.3046875, -0.1839599609375, -0.063232421875, 0.0574951171875, 0.17822265625, 0.2989501953125, 0.419677734375, 0.5404052734375, 0.6611328125, 0.7818603515625, 0.902587890625, 1.0233154296875, 1.14404296875, 1.2647705078125, 1.385498046875, 1.5062255859375, 1.626953125, 1.7476806640625, 1.868408203125, 1.9891357421875, 2.10986328125, 2.2305908203125, 2.351318359375, 2.4720458984375, 2.5927734375, 2.7135009765625, 2.834228515625, 2.9549560546875, 3.07568359375, 3.1964111328125, 3.317138671875, 3.4378662109375, 3.55859375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 11.0, 8.0, 18.0, 19.0, 22.0, 29.0, 39.0, 71.0, 103.0, 144.0, 229.0, 329.0, 483.0, 831.0, 1368.0, 2440.0, 4247.0, 8198.0, 16017.0, 36032.0, 98599.0, 501727.0, 3102140.0, 290089.0, 72813.0, 28927.0, 13417.0, 6817.0, 3714.0, 2075.0, 1232.0, 752.0, 456.0, 281.0, 182.0, 143.0, 86.0, 58.0, 36.0, 26.0, 25.0, 21.0, 7.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-13.5390625, -13.13330078125, -12.7275390625, -12.32177734375, -11.916015625, -11.51025390625, -11.1044921875, -10.69873046875, -10.29296875, -9.88720703125, -9.4814453125, -9.07568359375, -8.669921875, -8.26416015625, -7.8583984375, -7.45263671875, -7.046875, -6.64111328125, -6.2353515625, -5.82958984375, -5.423828125, -5.01806640625, -4.6123046875, -4.20654296875, -3.80078125, -3.39501953125, -2.9892578125, -2.58349609375, -2.177734375, -1.77197265625, -1.3662109375, -0.96044921875, -0.5546875, -0.14892578125, 0.2568359375, 0.66259765625, 1.068359375, 1.47412109375, 1.8798828125, 2.28564453125, 2.69140625, 3.09716796875, 3.5029296875, 3.90869140625, 4.314453125, 4.72021484375, 5.1259765625, 5.53173828125, 5.9375, 6.34326171875, 6.7490234375, 7.15478515625, 7.560546875, 7.96630859375, 8.3720703125, 8.77783203125, 9.18359375, 9.58935546875, 9.9951171875, 10.40087890625, 10.806640625, 11.21240234375, 11.6181640625, 12.02392578125, 12.4296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 7.0, 9.0, 13.0, 20.0, 20.0, 26.0, 22.0, 55.0, 70.0, 107.0, 173.0, 326.0, 947.0, 1304.0, 377.0, 217.0, 96.0, 66.0, 52.0, 34.0, 27.0, 14.0, 15.0, 20.0, 5.0, 5.0, 5.0, 7.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.8359375, -5.65936279296875, -5.4827880859375, -5.30621337890625, -5.129638671875, -4.95306396484375, -4.7764892578125, -4.59991455078125, -4.42333984375, -4.24676513671875, -4.0701904296875, -3.89361572265625, -3.717041015625, -3.54046630859375, -3.3638916015625, -3.18731689453125, -3.0107421875, -2.83416748046875, -2.6575927734375, -2.48101806640625, -2.304443359375, -2.12786865234375, -1.9512939453125, -1.77471923828125, -1.59814453125, -1.42156982421875, -1.2449951171875, -1.06842041015625, -0.891845703125, -0.71527099609375, -0.5386962890625, -0.36212158203125, -0.185546875, -0.00897216796875, 0.1676025390625, 0.34417724609375, 0.520751953125, 0.69732666015625, 0.8739013671875, 1.05047607421875, 1.22705078125, 1.40362548828125, 1.5802001953125, 1.75677490234375, 1.933349609375, 2.10992431640625, 2.2864990234375, 2.46307373046875, 2.6396484375, 2.81622314453125, 2.9927978515625, 3.16937255859375, 3.345947265625, 3.52252197265625, 3.6990966796875, 3.87567138671875, 4.05224609375, 4.22882080078125, 4.4053955078125, 4.58197021484375, 4.758544921875, 4.93511962890625, 5.1116943359375, 5.28826904296875, 5.46484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 13.0, 34.0, 159.0, 414.0, 297.0, 69.0, 20.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-222.7930908203125, -218.32656860351562, -213.8600311279297, -209.3935089111328, -204.92697143554688, -200.46044921875, -195.99391174316406, -191.5273895263672, -187.06085205078125, -182.59432983398438, -178.12779235839844, -173.66127014160156, -169.19473266601562, -164.72821044921875, -160.2616729736328, -155.79515075683594, -151.32862854003906, -146.8621063232422, -142.39556884765625, -137.92904663085938, -133.46250915527344, -128.99598693847656, -124.52945709228516, -120.06292724609375, -115.59639739990234, -111.12986755371094, -106.66333770751953, -102.19680786132812, -97.73028564453125, -93.26374816894531, -88.79722595214844, -84.33069610595703, -79.86416625976562, -75.39763641357422, -70.93110656738281, -66.4645767211914, -61.998050689697266, -57.53152084350586, -53.06499481201172, -48.59846496582031, -44.13193893432617, -39.665409088134766, -35.198883056640625, -30.73235321044922, -26.265823364257812, -21.799293518066406, -17.332765579223633, -12.86623764038086, -8.399707794189453, -3.9331789016723633, 0.5333499908447266, 4.999878883361816, 9.466407775878906, 13.932937622070312, 18.399465560913086, 22.86599349975586, 27.332523345947266, 31.799053192138672, 36.26557922363281, 40.73210906982422, 45.198638916015625, 49.66516876220703, 54.13169860839844, 58.59822463989258, 63.064754486083984]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 12.0, 7.0, 10.0, 16.0, 15.0, 14.0, 20.0, 25.0, 24.0, 36.0, 30.0, 47.0, 32.0, 48.0, 37.0, 46.0, 49.0, 61.0, 49.0, 43.0, 53.0, 47.0, 32.0, 51.0, 32.0, 43.0, 22.0, 28.0, 21.0, 12.0, 8.0, 7.0, 7.0, 3.0, 6.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.829288482666016, -26.098031997680664, -25.366775512695312, -24.63551902770996, -23.90426254272461, -23.173004150390625, -22.441749572753906, -21.710491180419922, -20.97923469543457, -20.24797821044922, -19.516721725463867, -18.785465240478516, -18.054208755493164, -17.322952270507812, -16.591693878173828, -15.860437393188477, -15.129181861877441, -14.39792537689209, -13.666668891906738, -12.93541145324707, -12.204154968261719, -11.472898483276367, -10.741641998291016, -10.010385513305664, -9.279129028320312, -8.547872543334961, -7.816615581512451, -7.0853590965271, -6.35410213470459, -5.622845649719238, -4.891589164733887, -4.160332202911377, -3.429075241088867, -2.6978185176849365, -1.9665619134902954, -1.2353053092956543, -0.5040485858917236, 0.22720813751220703, 0.9584646224975586, 1.6897215843200684, 2.42097806930542, 3.1522347927093506, 3.8834915161132812, 4.614748001098633, 5.346004486083984, 6.077261447906494, 6.808517932891846, 7.5397748947143555, 8.271031379699707, 9.002287864685059, 9.73354434967041, 10.464801788330078, 11.19605827331543, 11.927314758300781, 12.658571243286133, 13.389827728271484, 14.121084213256836, 14.852340698242188, 15.583597183227539, 16.31485366821289, 17.046110153198242, 17.777366638183594, 18.508625030517578, 19.23988151550293, 19.97113800048828]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 5.0, 6.0, 7.0, 19.0, 27.0, 35.0, 68.0, 88.0, 128.0, 211.0, 315.0, 544.0, 988.0, 1898.0, 4363.0, 13428.0, 49298.0, 187004.0, 530693.0, 188168.0, 49159.0, 13415.0, 4449.0, 1925.0, 875.0, 526.0, 325.0, 177.0, 122.0, 100.0, 59.0, 42.0, 30.0, 16.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.359375, -19.64501953125, -18.9306640625, -18.21630859375, -17.501953125, -16.78759765625, -16.0732421875, -15.35888671875, -14.64453125, -13.93017578125, -13.2158203125, -12.50146484375, -11.787109375, -11.07275390625, -10.3583984375, -9.64404296875, -8.9296875, -8.21533203125, -7.5009765625, -6.78662109375, -6.072265625, -5.35791015625, -4.6435546875, -3.92919921875, -3.21484375, -2.50048828125, -1.7861328125, -1.07177734375, -0.357421875, 0.35693359375, 1.0712890625, 1.78564453125, 2.5, 3.21435546875, 3.9287109375, 4.64306640625, 5.357421875, 6.07177734375, 6.7861328125, 7.50048828125, 8.21484375, 8.92919921875, 9.6435546875, 10.35791015625, 11.072265625, 11.78662109375, 12.5009765625, 13.21533203125, 13.9296875, 14.64404296875, 15.3583984375, 16.07275390625, 16.787109375, 17.50146484375, 18.2158203125, 18.93017578125, 19.64453125, 20.35888671875, 21.0732421875, 21.78759765625, 22.501953125, 23.21630859375, 23.9306640625, 24.64501953125, 25.359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 6.0, 13.0, 13.0, 39.0, 33.0, 37.0, 47.0, 52.0, 56.0, 64.0, 77.0, 76.0, 76.0, 58.0, 64.0, 39.0, 54.0, 48.0, 36.0, 33.0, 17.0, 12.0, 15.0, 4.0, 9.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3125, -4.187713623046875, -4.06292724609375, -3.938140869140625, -3.8133544921875, -3.688568115234375, -3.56378173828125, -3.438995361328125, -3.314208984375, -3.189422607421875, -3.06463623046875, -2.939849853515625, -2.8150634765625, -2.690277099609375, -2.56549072265625, -2.440704345703125, -2.31591796875, -2.191131591796875, -2.06634521484375, -1.941558837890625, -1.8167724609375, -1.691986083984375, -1.56719970703125, -1.442413330078125, -1.317626953125, -1.192840576171875, -1.06805419921875, -0.943267822265625, -0.8184814453125, -0.693695068359375, -0.56890869140625, -0.444122314453125, -0.3193359375, -0.194549560546875, -0.06976318359375, 0.055023193359375, 0.1798095703125, 0.304595947265625, 0.42938232421875, 0.554168701171875, 0.678955078125, 0.803741455078125, 0.92852783203125, 1.053314208984375, 1.1781005859375, 1.302886962890625, 1.42767333984375, 1.552459716796875, 1.67724609375, 1.802032470703125, 1.92681884765625, 2.051605224609375, 2.1763916015625, 2.301177978515625, 2.42596435546875, 2.550750732421875, 2.675537109375, 2.800323486328125, 2.92510986328125, 3.049896240234375, 3.1746826171875, 3.299468994140625, 3.42425537109375, 3.549041748046875, 3.673828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 3.0, 9.0, 11.0, 17.0, 22.0, 21.0, 32.0, 40.0, 51.0, 67.0, 65.0, 107.0, 136.0, 199.0, 279.0, 432.0, 655.0, 1405.0, 3756.0, 11971.0, 45308.0, 176334.0, 525904.0, 206292.0, 53416.0, 13988.0, 4169.0, 1534.0, 767.0, 467.0, 294.0, 221.0, 148.0, 111.0, 90.0, 66.0, 58.0, 24.0, 29.0, 15.0, 14.0, 6.0, 12.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2109375, -12.7135009765625, -12.216064453125, -11.7186279296875, -11.22119140625, -10.7237548828125, -10.226318359375, -9.7288818359375, -9.2314453125, -8.7340087890625, -8.236572265625, -7.7391357421875, -7.24169921875, -6.7442626953125, -6.246826171875, -5.7493896484375, -5.251953125, -4.7545166015625, -4.257080078125, -3.7596435546875, -3.26220703125, -2.7647705078125, -2.267333984375, -1.7698974609375, -1.2724609375, -0.7750244140625, -0.277587890625, 0.2198486328125, 0.71728515625, 1.2147216796875, 1.712158203125, 2.2095947265625, 2.70703125, 3.2044677734375, 3.701904296875, 4.1993408203125, 4.69677734375, 5.1942138671875, 5.691650390625, 6.1890869140625, 6.6865234375, 7.1839599609375, 7.681396484375, 8.1788330078125, 8.67626953125, 9.1737060546875, 9.671142578125, 10.1685791015625, 10.666015625, 11.1634521484375, 11.660888671875, 12.1583251953125, 12.65576171875, 13.1531982421875, 13.650634765625, 14.1480712890625, 14.6455078125, 15.1429443359375, 15.640380859375, 16.1378173828125, 16.63525390625, 17.1326904296875, 17.630126953125, 18.1275634765625, 18.625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 3.0, 7.0, 12.0, 6.0, 25.0, 19.0, 24.0, 38.0, 26.0, 37.0, 44.0, 38.0, 36.0, 46.0, 45.0, 54.0, 42.0, 58.0, 50.0, 62.0, 46.0, 37.0, 40.0, 31.0, 30.0, 38.0, 24.0, 23.0, 15.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.78125, -12.375732421875, -11.97021484375, -11.564697265625, -11.1591796875, -10.753662109375, -10.34814453125, -9.942626953125, -9.537109375, -9.131591796875, -8.72607421875, -8.320556640625, -7.9150390625, -7.509521484375, -7.10400390625, -6.698486328125, -6.29296875, -5.887451171875, -5.48193359375, -5.076416015625, -4.6708984375, -4.265380859375, -3.85986328125, -3.454345703125, -3.048828125, -2.643310546875, -2.23779296875, -1.832275390625, -1.4267578125, -1.021240234375, -0.61572265625, -0.210205078125, 0.1953125, 0.600830078125, 1.00634765625, 1.411865234375, 1.8173828125, 2.222900390625, 2.62841796875, 3.033935546875, 3.439453125, 3.844970703125, 4.25048828125, 4.656005859375, 5.0615234375, 5.467041015625, 5.87255859375, 6.278076171875, 6.68359375, 7.089111328125, 7.49462890625, 7.900146484375, 8.3056640625, 8.711181640625, 9.11669921875, 9.522216796875, 9.927734375, 10.333251953125, 10.73876953125, 11.144287109375, 11.5498046875, 11.955322265625, 12.36083984375, 12.766357421875, 13.171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 10.0, 13.0, 13.0, 23.0, 46.0, 53.0, 126.0, 244.0, 557.0, 1156.0, 2919.0, 8514.0, 28333.0, 102194.0, 496694.0, 308627.0, 69141.0, 19686.0, 6263.0, 2216.0, 871.0, 406.0, 208.0, 98.0, 73.0, 35.0, 17.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1171875, -6.8787841796875, -6.640380859375, -6.4019775390625, -6.16357421875, -5.9251708984375, -5.686767578125, -5.4483642578125, -5.2099609375, -4.9715576171875, -4.733154296875, -4.4947509765625, -4.25634765625, -4.0179443359375, -3.779541015625, -3.5411376953125, -3.302734375, -3.0643310546875, -2.825927734375, -2.5875244140625, -2.34912109375, -2.1107177734375, -1.872314453125, -1.6339111328125, -1.3955078125, -1.1571044921875, -0.918701171875, -0.6802978515625, -0.44189453125, -0.2034912109375, 0.034912109375, 0.2733154296875, 0.51171875, 0.7501220703125, 0.988525390625, 1.2269287109375, 1.46533203125, 1.7037353515625, 1.942138671875, 2.1805419921875, 2.4189453125, 2.6573486328125, 2.895751953125, 3.1341552734375, 3.37255859375, 3.6109619140625, 3.849365234375, 4.0877685546875, 4.326171875, 4.5645751953125, 4.802978515625, 5.0413818359375, 5.27978515625, 5.5181884765625, 5.756591796875, 5.9949951171875, 6.2333984375, 6.4718017578125, 6.710205078125, 6.9486083984375, 7.18701171875, 7.4254150390625, 7.663818359375, 7.9022216796875, 8.140625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 6.0, 12.0, 12.0, 12.0, 21.0, 16.0, 26.0, 23.0, 35.0, 41.0, 66.0, 85.0, 151.0, 130.0, 76.0, 66.0, 39.0, 31.0, 37.0, 15.0, 26.0, 12.0, 19.0, 11.0, 7.0, 7.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007977485656738281, -0.000764213502407074, -0.0007306784391403198, -0.0006971433758735657, -0.0006636083126068115, -0.0006300732493400574, -0.0005965381860733032, -0.0005630031228065491, -0.0005294680595397949, -0.0004959329962730408, -0.0004623979330062866, -0.00042886286973953247, -0.0003953278064727783, -0.00036179274320602417, -0.00032825767993927, -0.00029472261667251587, -0.0002611875534057617, -0.00022765249013900757, -0.00019411742687225342, -0.00016058236360549927, -0.00012704730033874512, -9.351223707199097e-05, -5.9977173805236816e-05, -2.6442110538482666e-05, 7.092952728271484e-06, 4.0628015995025635e-05, 7.416307926177979e-05, 0.00010769814252853394, 0.00014123320579528809, 0.00017476826906204224, 0.0002083033323287964, 0.00024183839559555054, 0.0002753734588623047, 0.00030890852212905884, 0.000342443585395813, 0.00037597864866256714, 0.0004095137119293213, 0.00044304877519607544, 0.0004765838384628296, 0.0005101189017295837, 0.0005436539649963379, 0.000577189028263092, 0.0006107240915298462, 0.0006442591547966003, 0.0006777942180633545, 0.0007113292813301086, 0.0007448643445968628, 0.0007783994078636169, 0.0008119344711303711, 0.0008454695343971252, 0.0008790045976638794, 0.0009125396609306335, 0.0009460747241973877, 0.0009796097874641418, 0.001013144850730896, 0.0010466799139976501, 0.0010802149772644043, 0.0011137500405311584, 0.0011472851037979126, 0.0011808201670646667, 0.001214355230331421, 0.001247890293598175, 0.0012814253568649292, 0.0013149604201316833, 0.0013484954833984375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 13.0, 18.0, 28.0, 49.0, 103.0, 164.0, 295.0, 601.0, 1568.0, 6227.0, 45090.0, 547376.0, 404750.0, 34643.0, 5106.0, 1337.0, 562.0, 271.0, 134.0, 87.0, 55.0, 25.0, 26.0, 12.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.8134765625, -8.392578125, -7.9716796875, -7.55078125, -7.1298828125, -6.708984375, -6.2880859375, -5.8671875, -5.4462890625, -5.025390625, -4.6044921875, -4.18359375, -3.7626953125, -3.341796875, -2.9208984375, -2.5, -2.0791015625, -1.658203125, -1.2373046875, -0.81640625, -0.3955078125, 0.025390625, 0.4462890625, 0.8671875, 1.2880859375, 1.708984375, 2.1298828125, 2.55078125, 2.9716796875, 3.392578125, 3.8134765625, 4.234375, 4.6552734375, 5.076171875, 5.4970703125, 5.91796875, 6.3388671875, 6.759765625, 7.1806640625, 7.6015625, 8.0224609375, 8.443359375, 8.8642578125, 9.28515625, 9.7060546875, 10.126953125, 10.5478515625, 10.96875, 11.3896484375, 11.810546875, 12.2314453125, 12.65234375, 13.0732421875, 13.494140625, 13.9150390625, 14.3359375, 14.7568359375, 15.177734375, 15.5986328125, 16.01953125, 16.4404296875, 16.861328125, 17.2822265625, 17.703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 16.0, 16.0, 20.0, 22.0, 34.0, 52.0, 55.0, 81.0, 94.0, 149.0, 115.0, 79.0, 53.0, 42.0, 32.0, 27.0, 18.0, 20.0, 5.0, 12.0, 9.0, 5.0, 7.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.92999267578125, -4.6998291015625, -4.46966552734375, -4.239501953125, -4.00933837890625, -3.7791748046875, -3.54901123046875, -3.31884765625, -3.08868408203125, -2.8585205078125, -2.62835693359375, -2.398193359375, -2.16802978515625, -1.9378662109375, -1.70770263671875, -1.4775390625, -1.24737548828125, -1.0172119140625, -0.78704833984375, -0.556884765625, -0.32672119140625, -0.0965576171875, 0.13360595703125, 0.36376953125, 0.59393310546875, 0.8240966796875, 1.05426025390625, 1.284423828125, 1.51458740234375, 1.7447509765625, 1.97491455078125, 2.205078125, 2.43524169921875, 2.6654052734375, 2.89556884765625, 3.125732421875, 3.35589599609375, 3.5860595703125, 3.81622314453125, 4.04638671875, 4.27655029296875, 4.5067138671875, 4.73687744140625, 4.967041015625, 5.19720458984375, 5.4273681640625, 5.65753173828125, 5.8876953125, 6.11785888671875, 6.3480224609375, 6.57818603515625, 6.808349609375, 7.03851318359375, 7.2686767578125, 7.49884033203125, 7.72900390625, 7.95916748046875, 8.1893310546875, 8.41949462890625, 8.649658203125, 8.87982177734375, 9.1099853515625, 9.34014892578125, 9.5703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 14.0, 9.0, 25.0, 45.0, 69.0, 61.0, 86.0, 98.0, 111.0, 96.0, 89.0, 88.0, 58.0, 36.0, 35.0, 18.0, 16.0, 12.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.94291687011719, -72.98637390136719, -70.02982330322266, -67.07328033447266, -64.11672973632812, -61.160186767578125, -58.20363998413086, -55.247093200683594, -52.29054641723633, -49.33399963378906, -46.3774528503418, -43.42090606689453, -40.46436309814453, -37.5078125, -34.55126953125, -31.594722747802734, -28.63817596435547, -25.681629180908203, -22.725082397460938, -19.768537521362305, -16.81199073791504, -13.855443954467773, -10.89889907836914, -7.942352294921875, -4.985805511474609, -2.029259204864502, 0.9272871017456055, 3.8838329315185547, 6.84037971496582, 9.796926498413086, 12.753471374511719, 15.710018157958984, 18.66656494140625, 21.623111724853516, 24.57965850830078, 27.536203384399414, 30.49275016784668, 33.44929504394531, 36.40584182739258, 39.362388610839844, 42.31893539428711, 45.275482177734375, 48.23202896118164, 51.188575744628906, 54.145118713378906, 57.10166931152344, 60.05821228027344, 63.0147590637207, 65.97130584716797, 68.92784881591797, 71.8843994140625, 74.8409423828125, 77.79749298095703, 80.75403594970703, 83.71058654785156, 86.66712951660156, 89.62367248535156, 92.58021545410156, 95.5367660522461, 98.4933090209961, 101.44985961914062, 104.40640258789062, 107.36294555664062, 110.31949615478516, 113.27604675292969]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 6.0, 4.0, 10.0, 12.0, 8.0, 9.0, 17.0, 20.0, 20.0, 27.0, 20.0, 25.0, 27.0, 34.0, 45.0, 32.0, 38.0, 47.0, 38.0, 39.0, 41.0, 28.0, 44.0, 40.0, 41.0, 33.0, 35.0, 37.0, 29.0, 32.0, 20.0, 25.0, 18.0, 11.0, 11.0, 12.0, 5.0, 6.0, 14.0, 2.0, 6.0, 5.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-55.7684440612793, -54.07344436645508, -52.37844467163086, -50.68344497680664, -48.988441467285156, -47.29344177246094, -45.59844207763672, -43.9034423828125, -42.20844268798828, -40.51344299316406, -38.818443298339844, -37.123443603515625, -35.428443908691406, -33.73344421386719, -32.0384407043457, -30.343441009521484, -28.648441314697266, -26.953441619873047, -25.258441925048828, -23.563440322875977, -21.868440628051758, -20.17344093322754, -18.478439331054688, -16.78343963623047, -15.08843994140625, -13.393440246582031, -11.698439598083496, -10.003438949584961, -8.308439254760742, -6.613439559936523, -4.918438911437988, -3.223438262939453, -1.5284347534179688, 0.1665654182434082, 1.8615655899047852, 3.556565761566162, 5.251565933227539, 6.946565628051758, 8.641566276550293, 10.336566925048828, 12.031566619873047, 13.726566314697266, 15.4215669631958, 17.116567611694336, 18.811567306518555, 20.506567001342773, 22.201568603515625, 23.896568298339844, 25.591567993164062, 27.28656768798828, 28.9815673828125, 30.67656898498535, 32.37156677246094, 34.066566467285156, 35.76156997680664, 37.45656967163086, 39.15156936645508, 40.8465690612793, 42.541568756103516, 44.236568450927734, 45.93157196044922, 47.62657165527344, 49.321571350097656, 51.016571044921875, 52.711570739746094]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 10.0, 11.0, 24.0, 20.0, 37.0, 34.0, 79.0, 91.0, 196.0, 293.0, 572.0, 1149.0, 2903.0, 9999.0, 60796.0, 3335408.0, 735454.0, 36531.0, 7035.0, 2080.0, 755.0, 342.0, 188.0, 102.0, 42.0, 45.0, 28.0, 19.0, 7.0, 10.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.78125, -33.57666015625, -32.3720703125, -31.16748046875, -29.962890625, -28.75830078125, -27.5537109375, -26.34912109375, -25.14453125, -23.93994140625, -22.7353515625, -21.53076171875, -20.326171875, -19.12158203125, -17.9169921875, -16.71240234375, -15.5078125, -14.30322265625, -13.0986328125, -11.89404296875, -10.689453125, -9.48486328125, -8.2802734375, -7.07568359375, -5.87109375, -4.66650390625, -3.4619140625, -2.25732421875, -1.052734375, 0.15185546875, 1.3564453125, 2.56103515625, 3.765625, 4.97021484375, 6.1748046875, 7.37939453125, 8.583984375, 9.78857421875, 10.9931640625, 12.19775390625, 13.40234375, 14.60693359375, 15.8115234375, 17.01611328125, 18.220703125, 19.42529296875, 20.6298828125, 21.83447265625, 23.0390625, 24.24365234375, 25.4482421875, 26.65283203125, 27.857421875, 29.06201171875, 30.2666015625, 31.47119140625, 32.67578125, 33.88037109375, 35.0849609375, 36.28955078125, 37.494140625, 38.69873046875, 39.9033203125, 41.10791015625, 42.3125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 15.0, 9.0, 14.0, 23.0, 24.0, 39.0, 40.0, 64.0, 62.0, 61.0, 69.0, 69.0, 70.0, 77.0, 57.0, 54.0, 49.0, 56.0, 30.0, 21.0, 21.0, 16.0, 24.0, 10.0, 7.0, 9.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -4.158782958984375, -4.03240966796875, -3.906036376953125, -3.7796630859375, -3.653289794921875, -3.52691650390625, -3.400543212890625, -3.274169921875, -3.147796630859375, -3.02142333984375, -2.895050048828125, -2.7686767578125, -2.642303466796875, -2.51593017578125, -2.389556884765625, -2.26318359375, -2.136810302734375, -2.01043701171875, -1.884063720703125, -1.7576904296875, -1.631317138671875, -1.50494384765625, -1.378570556640625, -1.252197265625, -1.125823974609375, -0.99945068359375, -0.873077392578125, -0.7467041015625, -0.620330810546875, -0.49395751953125, -0.367584228515625, -0.2412109375, -0.114837646484375, 0.01153564453125, 0.137908935546875, 0.2642822265625, 0.390655517578125, 0.51702880859375, 0.643402099609375, 0.769775390625, 0.896148681640625, 1.02252197265625, 1.148895263671875, 1.2752685546875, 1.401641845703125, 1.52801513671875, 1.654388427734375, 1.78076171875, 1.907135009765625, 2.03350830078125, 2.159881591796875, 2.2862548828125, 2.412628173828125, 2.53900146484375, 2.665374755859375, 2.791748046875, 2.918121337890625, 3.04449462890625, 3.170867919921875, 3.2972412109375, 3.423614501953125, 3.54998779296875, 3.676361083984375, 3.802734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 8.0, 8.0, 4.0, 12.0, 9.0, 17.0, 18.0, 20.0, 32.0, 46.0, 66.0, 105.0, 128.0, 211.0, 341.0, 589.0, 1200.0, 3057.0, 9957.0, 49391.0, 657196.0, 3316561.0, 127380.0, 19159.0, 5001.0, 1723.0, 774.0, 451.0, 261.0, 166.0, 122.0, 69.0, 50.0, 36.0, 29.0, 19.0, 19.0, 9.0, 5.0, 11.0, 5.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0], "bins": [-24.890625, -24.163330078125, -23.43603515625, -22.708740234375, -21.9814453125, -21.254150390625, -20.52685546875, -19.799560546875, -19.072265625, -18.344970703125, -17.61767578125, -16.890380859375, -16.1630859375, -15.435791015625, -14.70849609375, -13.981201171875, -13.25390625, -12.526611328125, -11.79931640625, -11.072021484375, -10.3447265625, -9.617431640625, -8.89013671875, -8.162841796875, -7.435546875, -6.708251953125, -5.98095703125, -5.253662109375, -4.5263671875, -3.799072265625, -3.07177734375, -2.344482421875, -1.6171875, -0.889892578125, -0.16259765625, 0.564697265625, 1.2919921875, 2.019287109375, 2.74658203125, 3.473876953125, 4.201171875, 4.928466796875, 5.65576171875, 6.383056640625, 7.1103515625, 7.837646484375, 8.56494140625, 9.292236328125, 10.01953125, 10.746826171875, 11.47412109375, 12.201416015625, 12.9287109375, 13.656005859375, 14.38330078125, 15.110595703125, 15.837890625, 16.565185546875, 17.29248046875, 18.019775390625, 18.7470703125, 19.474365234375, 20.20166015625, 20.928955078125, 21.65625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 15.0, 35.0, 77.0, 107.0, 289.0, 1065.0, 1694.0, 452.0, 174.0, 72.0, 35.0, 23.0, 16.0, 7.0, 8.0, 3.0, 3.0, 1.0], "bins": [-22.8125, -22.37506103515625, -21.9376220703125, -21.50018310546875, -21.062744140625, -20.62530517578125, -20.1878662109375, -19.75042724609375, -19.31298828125, -18.87554931640625, -18.4381103515625, -18.00067138671875, -17.563232421875, -17.12579345703125, -16.6883544921875, -16.25091552734375, -15.8134765625, -15.37603759765625, -14.9385986328125, -14.50115966796875, -14.063720703125, -13.62628173828125, -13.1888427734375, -12.75140380859375, -12.31396484375, -11.87652587890625, -11.4390869140625, -11.00164794921875, -10.564208984375, -10.12677001953125, -9.6893310546875, -9.25189208984375, -8.814453125, -8.37701416015625, -7.9395751953125, -7.50213623046875, -7.064697265625, -6.62725830078125, -6.1898193359375, -5.75238037109375, -5.31494140625, -4.87750244140625, -4.4400634765625, -4.00262451171875, -3.565185546875, -3.12774658203125, -2.6903076171875, -2.25286865234375, -1.8154296875, -1.37799072265625, -0.9405517578125, -0.50311279296875, -0.065673828125, 0.37176513671875, 0.8092041015625, 1.24664306640625, 1.68408203125, 2.12152099609375, 2.5589599609375, 2.99639892578125, 3.433837890625, 3.87127685546875, 4.3087158203125, 4.74615478515625, 5.18359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 19.0, 36.0, 68.0, 154.0, 241.0, 204.0, 143.0, 76.0, 36.0, 9.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-152.61488342285156, -149.49111938476562, -146.3673553466797, -143.24359130859375, -140.11981201171875, -136.9960479736328, -133.87228393554688, -130.74851989746094, -127.624755859375, -124.50099182128906, -121.3772201538086, -118.25345611572266, -115.12969207763672, -112.00592803955078, -108.88215637207031, -105.75839233398438, -102.63462829589844, -99.5108642578125, -96.38709259033203, -93.2633285522461, -90.13956451416016, -87.01580047607422, -83.89202880859375, -80.76826477050781, -77.64449310302734, -74.5207290649414, -71.39695739746094, -68.273193359375, -65.14942932128906, -62.02566146850586, -58.901893615722656, -55.77812957763672, -52.65436935424805, -49.530601501464844, -46.406837463378906, -43.2830696105957, -40.159305572509766, -37.03553771972656, -33.911773681640625, -30.788005828857422, -27.66423988342285, -24.54047393798828, -21.41670799255371, -18.29294204711914, -15.169175148010254, -12.045409202575684, -8.921642303466797, -5.797876358032227, -2.6741104125976562, 0.44965577125549316, 3.5734219551086426, 6.697188377380371, 9.820954322814941, 12.944720268249512, 16.0684871673584, 19.19225311279297, 22.31601905822754, 25.43978500366211, 28.56355094909668, 31.68731689453125, 34.81108474731445, 37.93484878540039, 41.058616638183594, 44.18238067626953, 47.306148529052734]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 15.0, 15.0, 20.0, 33.0, 27.0, 42.0, 58.0, 76.0, 61.0, 83.0, 77.0, 97.0, 71.0, 77.0, 62.0, 42.0, 43.0, 42.0, 20.0, 12.0, 17.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.415626525878906, -26.04025650024414, -24.664886474609375, -23.289518356323242, -21.914148330688477, -20.53877830505371, -19.163410186767578, -17.788040161132812, -16.412670135498047, -15.037300109863281, -13.661931037902832, -12.286561965942383, -10.911191940307617, -9.535821914672852, -8.160452842712402, -6.785083770751953, -5.4097137451171875, -4.03434419631958, -2.6589746475219727, -1.2836050987243652, 0.09176445007324219, 1.4671339988708496, 2.842503547668457, 4.217872619628906, 5.593242645263672, 6.968612194061279, 8.343981742858887, 9.719350814819336, 11.094720840454102, 12.470090866088867, 13.845459938049316, 15.220829010009766, 16.596195220947266, 17.97156524658203, 19.346935272216797, 20.72230339050293, 22.097673416137695, 23.47304344177246, 24.848411560058594, 26.22378158569336, 27.599151611328125, 28.97452163696289, 30.349891662597656, 31.72525978088379, 33.10063171386719, 34.47599792480469, 35.85136795043945, 37.22673797607422, 38.602108001708984, 39.97747802734375, 41.352848052978516, 42.72821807861328, 44.10358428955078, 45.47895431518555, 46.85432434082031, 48.22969436645508, 49.605064392089844, 50.98043441772461, 52.355804443359375, 53.73117446899414, 55.106544494628906, 56.481910705566406, 57.85728073120117, 59.23265075683594, 60.6080207824707]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 8.0, 9.0, 8.0, 14.0, 24.0, 26.0, 48.0, 50.0, 71.0, 98.0, 136.0, 218.0, 317.0, 441.0, 748.0, 1276.0, 2513.0, 5088.0, 12145.0, 34439.0, 109573.0, 308991.0, 357219.0, 142421.0, 44428.0, 15284.0, 6076.0, 2909.0, 1527.0, 844.0, 519.0, 340.0, 218.0, 155.0, 102.0, 70.0, 52.0, 38.0, 35.0, 16.0, 17.0, 17.0, 9.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0], "bins": [-19.078125, -18.5347900390625, -17.991455078125, -17.4481201171875, -16.90478515625, -16.3614501953125, -15.818115234375, -15.2747802734375, -14.7314453125, -14.1881103515625, -13.644775390625, -13.1014404296875, -12.55810546875, -12.0147705078125, -11.471435546875, -10.9281005859375, -10.384765625, -9.8414306640625, -9.298095703125, -8.7547607421875, -8.21142578125, -7.6680908203125, -7.124755859375, -6.5814208984375, -6.0380859375, -5.4947509765625, -4.951416015625, -4.4080810546875, -3.86474609375, -3.3214111328125, -2.778076171875, -2.2347412109375, -1.69140625, -1.1480712890625, -0.604736328125, -0.0614013671875, 0.48193359375, 1.0252685546875, 1.568603515625, 2.1119384765625, 2.6552734375, 3.1986083984375, 3.741943359375, 4.2852783203125, 4.82861328125, 5.3719482421875, 5.915283203125, 6.4586181640625, 7.001953125, 7.5452880859375, 8.088623046875, 8.6319580078125, 9.17529296875, 9.7186279296875, 10.261962890625, 10.8052978515625, 11.3486328125, 11.8919677734375, 12.435302734375, 12.9786376953125, 13.52197265625, 14.0653076171875, 14.608642578125, 15.1519775390625, 15.6953125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 7.0, 8.0, 9.0, 14.0, 15.0, 12.0, 28.0, 33.0, 48.0, 55.0, 62.0, 59.0, 73.0, 66.0, 72.0, 63.0, 64.0, 68.0, 45.0, 38.0, 34.0, 30.0, 29.0, 13.0, 18.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.12847900390625, -3.9991455078125, -3.86981201171875, -3.740478515625, -3.61114501953125, -3.4818115234375, -3.35247802734375, -3.22314453125, -3.09381103515625, -2.9644775390625, -2.83514404296875, -2.705810546875, -2.57647705078125, -2.4471435546875, -2.31781005859375, -2.1884765625, -2.05914306640625, -1.9298095703125, -1.80047607421875, -1.671142578125, -1.54180908203125, -1.4124755859375, -1.28314208984375, -1.15380859375, -1.02447509765625, -0.8951416015625, -0.76580810546875, -0.636474609375, -0.50714111328125, -0.3778076171875, -0.24847412109375, -0.119140625, 0.01019287109375, 0.1395263671875, 0.26885986328125, 0.398193359375, 0.52752685546875, 0.6568603515625, 0.78619384765625, 0.91552734375, 1.04486083984375, 1.1741943359375, 1.30352783203125, 1.432861328125, 1.56219482421875, 1.6915283203125, 1.82086181640625, 1.9501953125, 2.07952880859375, 2.2088623046875, 2.33819580078125, 2.467529296875, 2.59686279296875, 2.7261962890625, 2.85552978515625, 2.98486328125, 3.11419677734375, 3.2435302734375, 3.37286376953125, 3.502197265625, 3.63153076171875, 3.7608642578125, 3.89019775390625, 4.01953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 9.0, 17.0, 9.0, 15.0, 15.0, 37.0, 56.0, 79.0, 180.0, 429.0, 1117.0, 5293.0, 114156.0, 885142.0, 37493.0, 3034.0, 772.0, 289.0, 125.0, 96.0, 57.0, 40.0, 14.0, 23.0, 10.0, 12.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -49.95458984375, -48.2529296875, -46.55126953125, -44.849609375, -43.14794921875, -41.4462890625, -39.74462890625, -38.04296875, -36.34130859375, -34.6396484375, -32.93798828125, -31.236328125, -29.53466796875, -27.8330078125, -26.13134765625, -24.4296875, -22.72802734375, -21.0263671875, -19.32470703125, -17.623046875, -15.92138671875, -14.2197265625, -12.51806640625, -10.81640625, -9.11474609375, -7.4130859375, -5.71142578125, -4.009765625, -2.30810546875, -0.6064453125, 1.09521484375, 2.796875, 4.49853515625, 6.2001953125, 7.90185546875, 9.603515625, 11.30517578125, 13.0068359375, 14.70849609375, 16.41015625, 18.11181640625, 19.8134765625, 21.51513671875, 23.216796875, 24.91845703125, 26.6201171875, 28.32177734375, 30.0234375, 31.72509765625, 33.4267578125, 35.12841796875, 36.830078125, 38.53173828125, 40.2333984375, 41.93505859375, 43.63671875, 45.33837890625, 47.0400390625, 48.74169921875, 50.443359375, 52.14501953125, 53.8466796875, 55.54833984375, 57.25]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 1.0, 8.0, 6.0, 8.0, 12.0, 10.0, 14.0, 22.0, 23.0, 36.0, 37.0, 45.0, 46.0, 56.0, 56.0, 57.0, 79.0, 60.0, 57.0, 63.0, 46.0, 43.0, 43.0, 30.0, 29.0, 24.0, 18.0, 15.0, 8.0, 11.0, 11.0, 3.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.140625, -19.564208984375, -18.98779296875, -18.411376953125, -17.8349609375, -17.258544921875, -16.68212890625, -16.105712890625, -15.529296875, -14.952880859375, -14.37646484375, -13.800048828125, -13.2236328125, -12.647216796875, -12.07080078125, -11.494384765625, -10.91796875, -10.341552734375, -9.76513671875, -9.188720703125, -8.6123046875, -8.035888671875, -7.45947265625, -6.883056640625, -6.306640625, -5.730224609375, -5.15380859375, -4.577392578125, -4.0009765625, -3.424560546875, -2.84814453125, -2.271728515625, -1.6953125, -1.118896484375, -0.54248046875, 0.033935546875, 0.6103515625, 1.186767578125, 1.76318359375, 2.339599609375, 2.916015625, 3.492431640625, 4.06884765625, 4.645263671875, 5.2216796875, 5.798095703125, 6.37451171875, 6.950927734375, 7.52734375, 8.103759765625, 8.68017578125, 9.256591796875, 9.8330078125, 10.409423828125, 10.98583984375, 11.562255859375, 12.138671875, 12.715087890625, 13.29150390625, 13.867919921875, 14.4443359375, 15.020751953125, 15.59716796875, 16.173583984375, 16.75]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 8.0, 6.0, 9.0, 12.0, 10.0, 23.0, 33.0, 41.0, 56.0, 100.0, 243.0, 597.0, 1598.0, 5985.0, 52833.0, 779664.0, 191166.0, 11967.0, 2607.0, 875.0, 313.0, 150.0, 95.0, 32.0, 31.0, 17.0, 15.0, 11.0, 11.0, 12.0, 5.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.645263671875, -16.10302734375, -15.560791015625, -15.0185546875, -14.476318359375, -13.93408203125, -13.391845703125, -12.849609375, -12.307373046875, -11.76513671875, -11.222900390625, -10.6806640625, -10.138427734375, -9.59619140625, -9.053955078125, -8.51171875, -7.969482421875, -7.42724609375, -6.885009765625, -6.3427734375, -5.800537109375, -5.25830078125, -4.716064453125, -4.173828125, -3.631591796875, -3.08935546875, -2.547119140625, -2.0048828125, -1.462646484375, -0.92041015625, -0.378173828125, 0.1640625, 0.706298828125, 1.24853515625, 1.790771484375, 2.3330078125, 2.875244140625, 3.41748046875, 3.959716796875, 4.501953125, 5.044189453125, 5.58642578125, 6.128662109375, 6.6708984375, 7.213134765625, 7.75537109375, 8.297607421875, 8.83984375, 9.382080078125, 9.92431640625, 10.466552734375, 11.0087890625, 11.551025390625, 12.09326171875, 12.635498046875, 13.177734375, 13.719970703125, 14.26220703125, 14.804443359375, 15.3466796875, 15.888916015625, 16.43115234375, 16.973388671875, 17.515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 11.0, 14.0, 12.0, 22.0, 27.0, 43.0, 61.0, 94.0, 106.0, 118.0, 103.0, 101.0, 98.0, 58.0, 43.0, 25.0, 25.0, 9.0, 12.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014820098876953125, -0.0014367848634719849, -0.0013915598392486572, -0.0013463348150253296, -0.001301109790802002, -0.0012558847665786743, -0.0012106597423553467, -0.001165434718132019, -0.0011202096939086914, -0.0010749846696853638, -0.0010297596454620361, -0.0009845346212387085, -0.0009393095970153809, -0.0008940845727920532, -0.0008488595485687256, -0.000803634524345398, -0.0007584095001220703, -0.0007131844758987427, -0.000667959451675415, -0.0006227344274520874, -0.0005775094032287598, -0.0005322843790054321, -0.0004870593547821045, -0.00044183433055877686, -0.0003966093063354492, -0.0003513842821121216, -0.00030615925788879395, -0.0002609342336654663, -0.00021570920944213867, -0.00017048418521881104, -0.0001252591609954834, -8.003413677215576e-05, -3.4809112548828125e-05, 1.0415911674499512e-05, 5.564093589782715e-05, 0.00010086596012115479, 0.00014609098434448242, 0.00019131600856781006, 0.0002365410327911377, 0.00028176605701446533, 0.00032699108123779297, 0.0003722161054611206, 0.00041744112968444824, 0.0004626661539077759, 0.0005078911781311035, 0.0005531162023544312, 0.0005983412265777588, 0.0006435662508010864, 0.0006887912750244141, 0.0007340162992477417, 0.0007792413234710693, 0.000824466347694397, 0.0008696913719177246, 0.0009149163961410522, 0.0009601414203643799, 0.0010053664445877075, 0.0010505914688110352, 0.0010958164930343628, 0.0011410415172576904, 0.001186266541481018, 0.0012314915657043457, 0.0012767165899276733, 0.001321941614151001, 0.0013671666383743286, 0.0014123916625976562]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 2.0, 18.0, 10.0, 19.0, 26.0, 32.0, 52.0, 73.0, 112.0, 200.0, 326.0, 599.0, 1231.0, 2791.0, 7870.0, 36554.0, 531655.0, 424168.0, 30635.0, 7092.0, 2498.0, 1139.0, 556.0, 326.0, 169.0, 110.0, 74.0, 57.0, 41.0, 23.0, 17.0, 14.0, 10.0, 5.0, 2.0, 9.0, 4.0, 1.0, 1.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.21875, -15.711181640625, -15.20361328125, -14.696044921875, -14.1884765625, -13.680908203125, -13.17333984375, -12.665771484375, -12.158203125, -11.650634765625, -11.14306640625, -10.635498046875, -10.1279296875, -9.620361328125, -9.11279296875, -8.605224609375, -8.09765625, -7.590087890625, -7.08251953125, -6.574951171875, -6.0673828125, -5.559814453125, -5.05224609375, -4.544677734375, -4.037109375, -3.529541015625, -3.02197265625, -2.514404296875, -2.0068359375, -1.499267578125, -0.99169921875, -0.484130859375, 0.0234375, 0.531005859375, 1.03857421875, 1.546142578125, 2.0537109375, 2.561279296875, 3.06884765625, 3.576416015625, 4.083984375, 4.591552734375, 5.09912109375, 5.606689453125, 6.1142578125, 6.621826171875, 7.12939453125, 7.636962890625, 8.14453125, 8.652099609375, 9.15966796875, 9.667236328125, 10.1748046875, 10.682373046875, 11.18994140625, 11.697509765625, 12.205078125, 12.712646484375, 13.22021484375, 13.727783203125, 14.2353515625, 14.742919921875, 15.25048828125, 15.758056640625, 16.265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 7.0, 6.0, 5.0, 7.0, 5.0, 16.0, 30.0, 46.0, 75.0, 115.0, 129.0, 155.0, 149.0, 87.0, 57.0, 28.0, 12.0, 25.0, 11.0, 3.0, 6.0, 5.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4453125, -13.04248046875, -12.6396484375, -12.23681640625, -11.833984375, -11.43115234375, -11.0283203125, -10.62548828125, -10.22265625, -9.81982421875, -9.4169921875, -9.01416015625, -8.611328125, -8.20849609375, -7.8056640625, -7.40283203125, -7.0, -6.59716796875, -6.1943359375, -5.79150390625, -5.388671875, -4.98583984375, -4.5830078125, -4.18017578125, -3.77734375, -3.37451171875, -2.9716796875, -2.56884765625, -2.166015625, -1.76318359375, -1.3603515625, -0.95751953125, -0.5546875, -0.15185546875, 0.2509765625, 0.65380859375, 1.056640625, 1.45947265625, 1.8623046875, 2.26513671875, 2.66796875, 3.07080078125, 3.4736328125, 3.87646484375, 4.279296875, 4.68212890625, 5.0849609375, 5.48779296875, 5.890625, 6.29345703125, 6.6962890625, 7.09912109375, 7.501953125, 7.90478515625, 8.3076171875, 8.71044921875, 9.11328125, 9.51611328125, 9.9189453125, 10.32177734375, 10.724609375, 11.12744140625, 11.5302734375, 11.93310546875, 12.3359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 23.0, 154.0, 375.0, 314.0, 105.0, 23.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.13784790039062, -121.69703674316406, -108.2562255859375, -94.8154067993164, -81.37459564208984, -67.93378448486328, -54.49296569824219, -41.052154541015625, -27.611343383789062, -14.170530319213867, -0.7297172546386719, 12.711097717285156, 26.15190887451172, 39.59272003173828, 53.033538818359375, 66.47434997558594, 79.9151611328125, 93.35597229003906, 106.79678344726562, 120.23760223388672, 133.67840576171875, 147.11923217773438, 160.56004333496094, 174.0008544921875, 187.44166564941406, 200.88247680664062, 214.3232879638672, 227.76409912109375, 241.20492553710938, 254.64572143554688, 268.0865478515625, 281.52734375, 294.9681396484375, 308.4089660644531, 321.8497619628906, 335.29058837890625, 348.73138427734375, 362.1722106933594, 375.613037109375, 389.0538330078125, 402.49462890625, 415.9354553222656, 429.3762512207031, 442.81707763671875, 456.25787353515625, 469.6986999511719, 483.1395263671875, 496.580322265625, 510.0211486816406, 523.4619750976562, 536.9027709960938, 550.3435668945312, 563.784423828125, 577.2252197265625, 590.666015625, 604.1068115234375, 617.5476684570312, 630.9884643554688, 644.4293212890625, 657.8701171875, 671.3109130859375, 684.751708984375, 698.1925659179688, 711.6333618164062, 725.0741577148438]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 7.0, 12.0, 10.0, 20.0, 16.0, 24.0, 21.0, 23.0, 21.0, 22.0, 38.0, 46.0, 33.0, 34.0, 45.0, 49.0, 51.0, 39.0, 31.0, 46.0, 32.0, 38.0, 30.0, 39.0, 33.0, 26.0, 28.0, 34.0, 32.0, 21.0, 18.0, 16.0, 15.0, 11.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-74.07373046875, -71.78854370117188, -69.50334930419922, -67.2181625366211, -64.93297576904297, -62.64778518676758, -60.36259460449219, -58.07740783691406, -55.79221725463867, -53.50702667236328, -51.221839904785156, -48.936649322509766, -46.651458740234375, -44.36627197265625, -42.08108139038086, -39.79589080810547, -37.510704040527344, -35.22551345825195, -32.94032669067383, -30.655136108398438, -28.36994743347168, -26.084758758544922, -23.79956817626953, -21.514379501342773, -19.229190826416016, -16.944002151489258, -14.658812522888184, -12.37362289428711, -10.088434219360352, -7.803245544433594, -5.5180559158325195, -3.2328662872314453, -0.9476776123046875, 1.3375115394592285, 3.6227006912231445, 5.9078898429870605, 8.193078994750977, 10.478267669677734, 12.763457298278809, 15.048646926879883, 17.33383560180664, 19.6190242767334, 21.904212951660156, 24.189403533935547, 26.474592208862305, 28.759780883789062, 31.044971466064453, 33.330162048339844, 35.61534881591797, 37.90053939819336, 40.185726165771484, 42.470916748046875, 44.756103515625, 47.04129409790039, 49.32648468017578, 51.611671447753906, 53.8968620300293, 56.18205261230469, 58.46723937988281, 60.7524299621582, 63.037620544433594, 65.32280731201172, 67.60799407958984, 69.8931884765625, 72.17837524414062]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 5.0, 9.0, 20.0, 17.0, 25.0, 55.0, 108.0, 179.0, 354.0, 759.0, 1869.0, 9147.0, 273170.0, 3890646.0, 13847.0, 2356.0, 858.0, 386.0, 216.0, 93.0, 55.0, 25.0, 25.0, 13.0, 6.0, 6.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.125, -46.470703125, -44.81640625, -43.162109375, -41.5078125, -39.853515625, -38.19921875, -36.544921875, -34.890625, -33.236328125, -31.58203125, -29.927734375, -28.2734375, -26.619140625, -24.96484375, -23.310546875, -21.65625, -20.001953125, -18.34765625, -16.693359375, -15.0390625, -13.384765625, -11.73046875, -10.076171875, -8.421875, -6.767578125, -5.11328125, -3.458984375, -1.8046875, -0.150390625, 1.50390625, 3.158203125, 4.8125, 6.466796875, 8.12109375, 9.775390625, 11.4296875, 13.083984375, 14.73828125, 16.392578125, 18.046875, 19.701171875, 21.35546875, 23.009765625, 24.6640625, 26.318359375, 27.97265625, 29.626953125, 31.28125, 32.935546875, 34.58984375, 36.244140625, 37.8984375, 39.552734375, 41.20703125, 42.861328125, 44.515625, 46.169921875, 47.82421875, 49.478515625, 51.1328125, 52.787109375, 54.44140625, 56.095703125, 57.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 3.0, 9.0, 14.0, 26.0, 30.0, 36.0, 51.0, 50.0, 58.0, 72.0, 67.0, 71.0, 78.0, 69.0, 72.0, 60.0, 47.0, 49.0, 32.0, 27.0, 19.0, 10.0, 11.0, 11.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.328125, -5.16070556640625, -4.9932861328125, -4.82586669921875, -4.658447265625, -4.49102783203125, -4.3236083984375, -4.15618896484375, -3.98876953125, -3.82135009765625, -3.6539306640625, -3.48651123046875, -3.319091796875, -3.15167236328125, -2.9842529296875, -2.81683349609375, -2.6494140625, -2.48199462890625, -2.3145751953125, -2.14715576171875, -1.979736328125, -1.81231689453125, -1.6448974609375, -1.47747802734375, -1.31005859375, -1.14263916015625, -0.9752197265625, -0.80780029296875, -0.640380859375, -0.47296142578125, -0.3055419921875, -0.13812255859375, 0.029296875, 0.19671630859375, 0.3641357421875, 0.53155517578125, 0.698974609375, 0.86639404296875, 1.0338134765625, 1.20123291015625, 1.36865234375, 1.53607177734375, 1.7034912109375, 1.87091064453125, 2.038330078125, 2.20574951171875, 2.3731689453125, 2.54058837890625, 2.7080078125, 2.87542724609375, 3.0428466796875, 3.21026611328125, 3.377685546875, 3.54510498046875, 3.7125244140625, 3.87994384765625, 4.04736328125, 4.21478271484375, 4.3822021484375, 4.54962158203125, 4.717041015625, 4.88446044921875, 5.0518798828125, 5.21929931640625, 5.38671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 11.0, 18.0, 12.0, 23.0, 26.0, 43.0, 56.0, 68.0, 106.0, 137.0, 212.0, 347.0, 538.0, 1005.0, 2040.0, 4972.0, 18397.0, 214571.0, 3882961.0, 52882.0, 9226.0, 3100.0, 1454.0, 744.0, 417.0, 254.0, 193.0, 133.0, 89.0, 58.0, 51.0, 39.0, 22.0, 19.0, 11.0, 8.0, 6.0, 10.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.734375, -21.0810546875, -20.427734375, -19.7744140625, -19.12109375, -18.4677734375, -17.814453125, -17.1611328125, -16.5078125, -15.8544921875, -15.201171875, -14.5478515625, -13.89453125, -13.2412109375, -12.587890625, -11.9345703125, -11.28125, -10.6279296875, -9.974609375, -9.3212890625, -8.66796875, -8.0146484375, -7.361328125, -6.7080078125, -6.0546875, -5.4013671875, -4.748046875, -4.0947265625, -3.44140625, -2.7880859375, -2.134765625, -1.4814453125, -0.828125, -0.1748046875, 0.478515625, 1.1318359375, 1.78515625, 2.4384765625, 3.091796875, 3.7451171875, 4.3984375, 5.0517578125, 5.705078125, 6.3583984375, 7.01171875, 7.6650390625, 8.318359375, 8.9716796875, 9.625, 10.2783203125, 10.931640625, 11.5849609375, 12.23828125, 12.8916015625, 13.544921875, 14.1982421875, 14.8515625, 15.5048828125, 16.158203125, 16.8115234375, 17.46484375, 18.1181640625, 18.771484375, 19.4248046875, 20.078125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 5.0, 11.0, 16.0, 28.0, 63.0, 118.0, 272.0, 2840.0, 420.0, 130.0, 60.0, 36.0, 22.0, 13.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.943359375, -3.83880615234375, -3.7342529296875, -3.62969970703125, -3.525146484375, -3.42059326171875, -3.3160400390625, -3.21148681640625, -3.10693359375, -3.00238037109375, -2.8978271484375, -2.79327392578125, -2.688720703125, -2.58416748046875, -2.4796142578125, -2.37506103515625, -2.2705078125, -2.16595458984375, -2.0614013671875, -1.95684814453125, -1.852294921875, -1.74774169921875, -1.6431884765625, -1.53863525390625, -1.43408203125, -1.32952880859375, -1.2249755859375, -1.12042236328125, -1.015869140625, -0.91131591796875, -0.8067626953125, -0.70220947265625, -0.59765625, -0.49310302734375, -0.3885498046875, -0.28399658203125, -0.179443359375, -0.07489013671875, 0.0296630859375, 0.13421630859375, 0.23876953125, 0.34332275390625, 0.4478759765625, 0.55242919921875, 0.656982421875, 0.76153564453125, 0.8660888671875, 0.97064208984375, 1.0751953125, 1.17974853515625, 1.2843017578125, 1.38885498046875, 1.493408203125, 1.59796142578125, 1.7025146484375, 1.80706787109375, 1.91162109375, 2.01617431640625, 2.1207275390625, 2.22528076171875, 2.329833984375, 2.43438720703125, 2.5389404296875, 2.64349365234375, 2.748046875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 8.0, 3.0, 9.0, 17.0, 24.0, 28.0, 62.0, 73.0, 118.0, 153.0, 177.0, 147.0, 95.0, 41.0, 31.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.301677703857422, -27.589229583740234, -26.876781463623047, -26.16433334350586, -25.451885223388672, -24.739437103271484, -24.026988983154297, -23.31454086303711, -22.602092742919922, -21.889644622802734, -21.177196502685547, -20.46474838256836, -19.752300262451172, -19.039852142333984, -18.327404022216797, -17.61495590209961, -16.902507781982422, -16.190059661865234, -15.477611541748047, -14.76516342163086, -14.052715301513672, -13.340267181396484, -12.627819061279297, -11.91537094116211, -11.202922821044922, -10.490474700927734, -9.778026580810547, -9.06557846069336, -8.353130340576172, -7.640682220458984, -6.928234100341797, -6.215785980224609, -5.503335952758789, -4.790887832641602, -4.078439712524414, -3.3659915924072266, -2.653543472290039, -1.9410953521728516, -1.228647232055664, -0.5161991119384766, 0.19624900817871094, 0.9086971282958984, 1.621145248413086, 2.3335933685302734, 3.046041488647461, 3.7584896087646484, 4.470937728881836, 5.183385848999023, 5.895833969116211, 6.608282089233398, 7.320730209350586, 8.033178329467773, 8.745626449584961, 9.458074569702148, 10.170522689819336, 10.882970809936523, 11.595418930053711, 12.307867050170898, 13.020315170288086, 13.732763290405273, 14.445211410522461, 15.157659530639648, 15.870107650756836, 16.582555770874023, 17.29500389099121]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 4.0, 12.0, 9.0, 11.0, 17.0, 23.0, 23.0, 18.0, 29.0, 31.0, 38.0, 31.0, 42.0, 35.0, 35.0, 28.0, 42.0, 48.0, 46.0, 43.0, 43.0, 39.0, 50.0, 36.0, 43.0, 16.0, 32.0, 26.0, 35.0, 22.0, 18.0, 13.0, 16.0, 13.0, 9.0, 10.0, 2.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34560775756836, -9.046968460083008, -8.748330116271973, -8.449690818786621, -8.151052474975586, -7.852413177490234, -7.553774356842041, -7.255135536193848, -6.956496238708496, -6.657857418060303, -6.359218597412109, -6.060579299926758, -5.7619404792785645, -5.463301658630371, -5.164662837982178, -4.866024017333984, -4.567385196685791, -4.268746376037598, -3.970107316970825, -3.671468496322632, -3.3728294372558594, -3.074190616607666, -2.7755517959594727, -2.4769127368927, -2.178273916244507, -1.879634976387024, -1.580996036529541, -1.2823572158813477, -0.9837182760238647, -0.6850793361663818, -0.3864405155181885, -0.08780145645141602, 0.21083736419677734, 0.5094763040542603, 0.8081151843070984, 1.1067540645599365, 1.4053930044174194, 1.7040319442749023, 2.0026707649230957, 2.301309823989868, 2.5999486446380615, 2.898587465286255, 3.1972265243530273, 3.4958653450012207, 3.794504165649414, 4.093143463134766, 4.391781806945801, 4.690421104431152, 4.989059925079346, 5.287698745727539, 5.586337566375732, 5.884976387023926, 6.183615684509277, 6.482254505157471, 6.780893325805664, 7.079532623291016, 7.378170967102051, 7.676809787750244, 7.9754486083984375, 8.274087905883789, 8.572726249694824, 8.871365547180176, 9.170003890991211, 9.468643188476562, 9.767282485961914]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 4.0, 11.0, 21.0, 26.0, 28.0, 43.0, 37.0, 72.0, 110.0, 179.0, 209.0, 316.0, 472.0, 760.0, 1244.0, 2249.0, 4579.0, 9953.0, 24078.0, 61300.0, 153601.0, 303859.0, 273324.0, 125654.0, 49525.0, 19638.0, 8215.0, 3916.0, 1959.0, 1090.0, 693.0, 438.0, 253.0, 210.0, 129.0, 94.0, 64.0, 48.0, 37.0, 28.0, 25.0, 7.0, 15.0, 9.0, 4.0, 4.0, 9.0, 6.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.25, -11.825927734375, -11.40185546875, -10.977783203125, -10.5537109375, -10.129638671875, -9.70556640625, -9.281494140625, -8.857421875, -8.433349609375, -8.00927734375, -7.585205078125, -7.1611328125, -6.737060546875, -6.31298828125, -5.888916015625, -5.46484375, -5.040771484375, -4.61669921875, -4.192626953125, -3.7685546875, -3.344482421875, -2.92041015625, -2.496337890625, -2.072265625, -1.648193359375, -1.22412109375, -0.800048828125, -0.3759765625, 0.048095703125, 0.47216796875, 0.896240234375, 1.3203125, 1.744384765625, 2.16845703125, 2.592529296875, 3.0166015625, 3.440673828125, 3.86474609375, 4.288818359375, 4.712890625, 5.136962890625, 5.56103515625, 5.985107421875, 6.4091796875, 6.833251953125, 7.25732421875, 7.681396484375, 8.10546875, 8.529541015625, 8.95361328125, 9.377685546875, 9.8017578125, 10.225830078125, 10.64990234375, 11.073974609375, 11.498046875, 11.922119140625, 12.34619140625, 12.770263671875, 13.1943359375, 13.618408203125, 14.04248046875, 14.466552734375, 14.890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 4.0, 12.0, 15.0, 19.0, 20.0, 37.0, 47.0, 41.0, 42.0, 70.0, 54.0, 60.0, 70.0, 59.0, 69.0, 65.0, 54.0, 53.0, 40.0, 35.0, 35.0, 23.0, 21.0, 9.0, 12.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.293212890625, -5.12158203125, -4.949951171875, -4.7783203125, -4.606689453125, -4.43505859375, -4.263427734375, -4.091796875, -3.920166015625, -3.74853515625, -3.576904296875, -3.4052734375, -3.233642578125, -3.06201171875, -2.890380859375, -2.71875, -2.547119140625, -2.37548828125, -2.203857421875, -2.0322265625, -1.860595703125, -1.68896484375, -1.517333984375, -1.345703125, -1.174072265625, -1.00244140625, -0.830810546875, -0.6591796875, -0.487548828125, -0.31591796875, -0.144287109375, 0.02734375, 0.198974609375, 0.37060546875, 0.542236328125, 0.7138671875, 0.885498046875, 1.05712890625, 1.228759765625, 1.400390625, 1.572021484375, 1.74365234375, 1.915283203125, 2.0869140625, 2.258544921875, 2.43017578125, 2.601806640625, 2.7734375, 2.945068359375, 3.11669921875, 3.288330078125, 3.4599609375, 3.631591796875, 3.80322265625, 3.974853515625, 4.146484375, 4.318115234375, 4.48974609375, 4.661376953125, 4.8330078125, 5.004638671875, 5.17626953125, 5.347900390625, 5.51953125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 9.0, 13.0, 9.0, 16.0, 17.0, 31.0, 42.0, 45.0, 62.0, 107.0, 168.0, 281.0, 707.0, 2160.0, 16796.0, 866958.0, 153329.0, 5490.0, 1172.0, 426.0, 217.0, 126.0, 94.0, 78.0, 49.0, 31.0, 21.0, 15.0, 12.0, 9.0, 12.0, 6.0, 10.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0, -62.9541015625, -60.908203125, -58.8623046875, -56.81640625, -54.7705078125, -52.724609375, -50.6787109375, -48.6328125, -46.5869140625, -44.541015625, -42.4951171875, -40.44921875, -38.4033203125, -36.357421875, -34.3115234375, -32.265625, -30.2197265625, -28.173828125, -26.1279296875, -24.08203125, -22.0361328125, -19.990234375, -17.9443359375, -15.8984375, -13.8525390625, -11.806640625, -9.7607421875, -7.71484375, -5.6689453125, -3.623046875, -1.5771484375, 0.46875, 2.5146484375, 4.560546875, 6.6064453125, 8.65234375, 10.6982421875, 12.744140625, 14.7900390625, 16.8359375, 18.8818359375, 20.927734375, 22.9736328125, 25.01953125, 27.0654296875, 29.111328125, 31.1572265625, 33.203125, 35.2490234375, 37.294921875, 39.3408203125, 41.38671875, 43.4326171875, 45.478515625, 47.5244140625, 49.5703125, 51.6162109375, 53.662109375, 55.7080078125, 57.75390625, 59.7998046875, 61.845703125, 63.8916015625, 65.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 10.0, 6.0, 13.0, 20.0, 19.0, 24.0, 45.0, 62.0, 60.0, 89.0, 93.0, 94.0, 82.0, 73.0, 74.0, 56.0, 39.0, 50.0, 20.0, 18.0, 9.0, 10.0, 3.0, 7.0, 3.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.71875, -41.548828125, -40.37890625, -39.208984375, -38.0390625, -36.869140625, -35.69921875, -34.529296875, -33.359375, -32.189453125, -31.01953125, -29.849609375, -28.6796875, -27.509765625, -26.33984375, -25.169921875, -24.0, -22.830078125, -21.66015625, -20.490234375, -19.3203125, -18.150390625, -16.98046875, -15.810546875, -14.640625, -13.470703125, -12.30078125, -11.130859375, -9.9609375, -8.791015625, -7.62109375, -6.451171875, -5.28125, -4.111328125, -2.94140625, -1.771484375, -0.6015625, 0.568359375, 1.73828125, 2.908203125, 4.078125, 5.248046875, 6.41796875, 7.587890625, 8.7578125, 9.927734375, 11.09765625, 12.267578125, 13.4375, 14.607421875, 15.77734375, 16.947265625, 18.1171875, 19.287109375, 20.45703125, 21.626953125, 22.796875, 23.966796875, 25.13671875, 26.306640625, 27.4765625, 28.646484375, 29.81640625, 30.986328125, 32.15625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 7.0, 17.0, 9.0, 15.0, 31.0, 40.0, 71.0, 59.0, 136.0, 314.0, 779.0, 3605.0, 29202.0, 535484.0, 448905.0, 25272.0, 3154.0, 732.0, 311.0, 120.0, 74.0, 45.0, 43.0, 24.0, 16.0, 21.0, 6.0, 9.0, 6.0, 4.0, 7.0, 2.0, 5.0, 10.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.9393310546875, -16.425537109375, -15.9117431640625, -15.39794921875, -14.8841552734375, -14.370361328125, -13.8565673828125, -13.3427734375, -12.8289794921875, -12.315185546875, -11.8013916015625, -11.28759765625, -10.7738037109375, -10.260009765625, -9.7462158203125, -9.232421875, -8.7186279296875, -8.204833984375, -7.6910400390625, -7.17724609375, -6.6634521484375, -6.149658203125, -5.6358642578125, -5.1220703125, -4.6082763671875, -4.094482421875, -3.5806884765625, -3.06689453125, -2.5531005859375, -2.039306640625, -1.5255126953125, -1.01171875, -0.4979248046875, 0.015869140625, 0.5296630859375, 1.04345703125, 1.5572509765625, 2.071044921875, 2.5848388671875, 3.0986328125, 3.6124267578125, 4.126220703125, 4.6400146484375, 5.15380859375, 5.6676025390625, 6.181396484375, 6.6951904296875, 7.208984375, 7.7227783203125, 8.236572265625, 8.7503662109375, 9.26416015625, 9.7779541015625, 10.291748046875, 10.8055419921875, 11.3193359375, 11.8331298828125, 12.346923828125, 12.8607177734375, 13.37451171875, 13.8883056640625, 14.402099609375, 14.9158935546875, 15.4296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 6.0, 6.0, 8.0, 8.0, 15.0, 11.0, 17.0, 25.0, 21.0, 39.0, 39.0, 39.0, 48.0, 50.0, 66.0, 60.0, 62.0, 54.0, 60.0, 60.0, 40.0, 32.0, 43.0, 30.0, 16.0, 31.0, 20.0, 16.0, 8.0, 13.0, 8.0, 5.0, 7.0, 9.0, 3.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.000843048095703125, -0.0008190125226974487, -0.0007949769496917725, -0.0007709413766860962, -0.0007469058036804199, -0.0007228702306747437, -0.0006988346576690674, -0.0006747990846633911, -0.0006507635116577148, -0.0006267279386520386, -0.0006026923656463623, -0.000578656792640686, -0.0005546212196350098, -0.0005305856466293335, -0.0005065500736236572, -0.00048251450061798096, -0.0004584789276123047, -0.0004344433546066284, -0.00041040778160095215, -0.0003863722085952759, -0.0003623366355895996, -0.00033830106258392334, -0.00031426548957824707, -0.0002902299165725708, -0.00026619434356689453, -0.00024215877056121826, -0.000218123197555542, -0.00019408762454986572, -0.00017005205154418945, -0.00014601647853851318, -0.00012198090553283691, -9.794533252716064e-05, -7.390975952148438e-05, -4.9874186515808105e-05, -2.5838613510131836e-05, -1.8030405044555664e-06, 2.2232532501220703e-05, 4.626810550689697e-05, 7.030367851257324e-05, 9.433925151824951e-05, 0.00011837482452392578, 0.00014241039752960205, 0.00016644597053527832, 0.0001904815435409546, 0.00021451711654663086, 0.00023855268955230713, 0.0002625882625579834, 0.00028662383556365967, 0.00031065940856933594, 0.0003346949815750122, 0.0003587305545806885, 0.00038276612758636475, 0.000406801700592041, 0.0004308372735977173, 0.00045487284660339355, 0.0004789084196090698, 0.0005029439926147461, 0.0005269795656204224, 0.0005510151386260986, 0.0005750507116317749, 0.0005990862846374512, 0.0006231218576431274, 0.0006471574306488037, 0.00067119300365448, 0.0006952285766601562]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 7.0, 4.0, 13.0, 18.0, 26.0, 67.0, 140.0, 363.0, 1273.0, 10484.0, 894015.0, 137225.0, 3759.0, 703.0, 232.0, 107.0, 42.0, 27.0, 15.0, 8.0, 9.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.5625, -31.5048828125, -30.447265625, -29.3896484375, -28.33203125, -27.2744140625, -26.216796875, -25.1591796875, -24.1015625, -23.0439453125, -21.986328125, -20.9287109375, -19.87109375, -18.8134765625, -17.755859375, -16.6982421875, -15.640625, -14.5830078125, -13.525390625, -12.4677734375, -11.41015625, -10.3525390625, -9.294921875, -8.2373046875, -7.1796875, -6.1220703125, -5.064453125, -4.0068359375, -2.94921875, -1.8916015625, -0.833984375, 0.2236328125, 1.28125, 2.3388671875, 3.396484375, 4.4541015625, 5.51171875, 6.5693359375, 7.626953125, 8.6845703125, 9.7421875, 10.7998046875, 11.857421875, 12.9150390625, 13.97265625, 15.0302734375, 16.087890625, 17.1455078125, 18.203125, 19.2607421875, 20.318359375, 21.3759765625, 22.43359375, 23.4912109375, 24.548828125, 25.6064453125, 26.6640625, 27.7216796875, 28.779296875, 29.8369140625, 30.89453125, 31.9521484375, 33.009765625, 34.0673828125, 35.125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 4.0, 8.0, 9.0, 17.0, 33.0, 54.0, 81.0, 109.0, 124.0, 142.0, 120.0, 95.0, 66.0, 46.0, 23.0, 20.0, 15.0, 8.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.1221923828125, -12.642822265625, -12.1634521484375, -11.68408203125, -11.2047119140625, -10.725341796875, -10.2459716796875, -9.7666015625, -9.2872314453125, -8.807861328125, -8.3284912109375, -7.84912109375, -7.3697509765625, -6.890380859375, -6.4110107421875, -5.931640625, -5.4522705078125, -4.972900390625, -4.4935302734375, -4.01416015625, -3.5347900390625, -3.055419921875, -2.5760498046875, -2.0966796875, -1.6173095703125, -1.137939453125, -0.6585693359375, -0.17919921875, 0.3001708984375, 0.779541015625, 1.2589111328125, 1.73828125, 2.2176513671875, 2.697021484375, 3.1763916015625, 3.65576171875, 4.1351318359375, 4.614501953125, 5.0938720703125, 5.5732421875, 6.0526123046875, 6.531982421875, 7.0113525390625, 7.49072265625, 7.9700927734375, 8.449462890625, 8.9288330078125, 9.408203125, 9.8875732421875, 10.366943359375, 10.8463134765625, 11.32568359375, 11.8050537109375, 12.284423828125, 12.7637939453125, 13.2431640625, 13.7225341796875, 14.201904296875, 14.6812744140625, 15.16064453125, 15.6400146484375, 16.119384765625, 16.5987548828125, 17.078125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 10.0, 14.0, 23.0, 61.0, 129.0, 175.0, 219.0, 174.0, 111.0, 46.0, 30.0, 9.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-247.31735229492188, -239.45172119140625, -231.58609008789062, -223.720458984375, -215.8548126220703, -207.9891815185547, -200.12355041503906, -192.25791931152344, -184.3922882080078, -176.5266571044922, -168.66102600097656, -160.79537963867188, -152.92974853515625, -145.06411743164062, -137.198486328125, -129.33285522460938, -121.46721649169922, -113.6015853881836, -105.73594665527344, -97.87031555175781, -90.00468444824219, -82.13905334472656, -74.2734146118164, -66.40778350830078, -58.54214859008789, -50.676513671875, -42.810882568359375, -34.945247650146484, -27.079614639282227, -19.21398162841797, -11.348346710205078, -3.482715606689453, 4.3829193115234375, 12.248552322387695, 20.114185333251953, 27.979820251464844, 35.84545135498047, 43.71108627319336, 51.57672119140625, 59.442352294921875, 67.3079833984375, 75.17361450195312, 83.03925323486328, 90.9048843383789, 98.77051544189453, 106.63615417480469, 114.50178527832031, 122.36741638183594, 130.23306274414062, 138.09869384765625, 145.96432495117188, 153.8299560546875, 161.6956024169922, 169.5612335205078, 177.42686462402344, 185.29249572753906, 193.1581268310547, 201.0237579345703, 208.88938903808594, 216.75503540039062, 224.62066650390625, 232.48629760742188, 240.3519287109375, 248.21755981445312, 256.08319091796875]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 3.0, 6.0, 3.0, 13.0, 10.0, 23.0, 12.0, 21.0, 33.0, 31.0, 29.0, 30.0, 56.0, 37.0, 44.0, 36.0, 44.0, 49.0, 55.0, 50.0, 50.0, 53.0, 47.0, 41.0, 40.0, 38.0, 21.0, 32.0, 20.0, 16.0, 9.0, 10.0, 6.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-115.8680648803711, -112.44839477539062, -109.02872467041016, -105.60905456542969, -102.18938446044922, -98.76971435546875, -95.35003662109375, -91.93037414550781, -88.51069641113281, -85.09102630615234, -81.67135620117188, -78.2516860961914, -74.83201599121094, -71.41234588623047, -67.99267578125, -64.572998046875, -61.15333557128906, -57.733665466308594, -54.313995361328125, -50.894325256347656, -47.47465515136719, -44.05498504638672, -40.635311126708984, -37.215641021728516, -33.79597091674805, -30.376300811767578, -26.95663070678711, -23.536958694458008, -20.11728858947754, -16.69761848449707, -13.277946472167969, -9.8582763671875, -6.4385986328125, -3.018928050994873, 0.4007425308227539, 3.820413589477539, 7.240083694458008, 10.659753799438477, 14.079425811767578, 17.499095916748047, 20.918766021728516, 24.338436126708984, 27.758106231689453, 31.177778244018555, 34.597450256347656, 38.017120361328125, 41.436790466308594, 44.85646057128906, 48.27613067626953, 51.69580078125, 55.11547088623047, 58.53514099121094, 61.954811096191406, 65.37448120117188, 68.79415893554688, 72.21382141113281, 75.63349914550781, 79.05316925048828, 82.47283935546875, 85.89250946044922, 89.31217956542969, 92.73184967041016, 96.15151977539062, 99.57119750976562, 102.99085998535156]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 11.0, 17.0, 28.0, 17.0, 50.0, 82.0, 134.0, 212.0, 477.0, 1103.0, 3450.0, 15570.0, 3540646.0, 612445.0, 14571.0, 3377.0, 1148.0, 456.0, 210.0, 98.0, 54.0, 28.0, 21.0, 11.0, 16.0, 8.0, 10.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -38.8310546875, -37.443359375, -36.0556640625, -34.66796875, -33.2802734375, -31.892578125, -30.5048828125, -29.1171875, -27.7294921875, -26.341796875, -24.9541015625, -23.56640625, -22.1787109375, -20.791015625, -19.4033203125, -18.015625, -16.6279296875, -15.240234375, -13.8525390625, -12.46484375, -11.0771484375, -9.689453125, -8.3017578125, -6.9140625, -5.5263671875, -4.138671875, -2.7509765625, -1.36328125, 0.0244140625, 1.412109375, 2.7998046875, 4.1875, 5.5751953125, 6.962890625, 8.3505859375, 9.73828125, 11.1259765625, 12.513671875, 13.9013671875, 15.2890625, 16.6767578125, 18.064453125, 19.4521484375, 20.83984375, 22.2275390625, 23.615234375, 25.0029296875, 26.390625, 27.7783203125, 29.166015625, 30.5537109375, 31.94140625, 33.3291015625, 34.716796875, 36.1044921875, 37.4921875, 38.8798828125, 40.267578125, 41.6552734375, 43.04296875, 44.4306640625, 45.818359375, 47.2060546875, 48.59375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 2.0, 6.0, 6.0, 14.0, 17.0, 29.0, 43.0, 49.0, 61.0, 62.0, 81.0, 95.0, 78.0, 86.0, 69.0, 81.0, 61.0, 51.0, 36.0, 15.0, 17.0, 13.0, 17.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.06768798828125, -5.8463134765625, -5.62493896484375, -5.403564453125, -5.18218994140625, -4.9608154296875, -4.73944091796875, -4.51806640625, -4.29669189453125, -4.0753173828125, -3.85394287109375, -3.632568359375, -3.41119384765625, -3.1898193359375, -2.96844482421875, -2.7470703125, -2.52569580078125, -2.3043212890625, -2.08294677734375, -1.861572265625, -1.64019775390625, -1.4188232421875, -1.19744873046875, -0.97607421875, -0.75469970703125, -0.5333251953125, -0.31195068359375, -0.090576171875, 0.13079833984375, 0.3521728515625, 0.57354736328125, 0.794921875, 1.01629638671875, 1.2376708984375, 1.45904541015625, 1.680419921875, 1.90179443359375, 2.1231689453125, 2.34454345703125, 2.56591796875, 2.78729248046875, 3.0086669921875, 3.23004150390625, 3.451416015625, 3.67279052734375, 3.8941650390625, 4.11553955078125, 4.3369140625, 4.55828857421875, 4.7796630859375, 5.00103759765625, 5.222412109375, 5.44378662109375, 5.6651611328125, 5.88653564453125, 6.10791015625, 6.32928466796875, 6.5506591796875, 6.77203369140625, 6.993408203125, 7.21478271484375, 7.4361572265625, 7.65753173828125, 7.87890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 7.0, 6.0, 12.0, 6.0, 14.0, 22.0, 25.0, 33.0, 49.0, 55.0, 85.0, 92.0, 134.0, 174.0, 294.0, 399.0, 571.0, 837.0, 1351.0, 2341.0, 4690.0, 10785.0, 32241.0, 213794.0, 3776625.0, 108751.0, 22895.0, 8312.0, 3834.0, 2058.0, 1254.0, 766.0, 477.0, 338.0, 230.0, 182.0, 142.0, 112.0, 72.0, 48.0, 42.0, 28.0, 24.0, 23.0, 22.0, 7.0, 10.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.7109375, -14.27001953125, -13.8291015625, -13.38818359375, -12.947265625, -12.50634765625, -12.0654296875, -11.62451171875, -11.18359375, -10.74267578125, -10.3017578125, -9.86083984375, -9.419921875, -8.97900390625, -8.5380859375, -8.09716796875, -7.65625, -7.21533203125, -6.7744140625, -6.33349609375, -5.892578125, -5.45166015625, -5.0107421875, -4.56982421875, -4.12890625, -3.68798828125, -3.2470703125, -2.80615234375, -2.365234375, -1.92431640625, -1.4833984375, -1.04248046875, -0.6015625, -0.16064453125, 0.2802734375, 0.72119140625, 1.162109375, 1.60302734375, 2.0439453125, 2.48486328125, 2.92578125, 3.36669921875, 3.8076171875, 4.24853515625, 4.689453125, 5.13037109375, 5.5712890625, 6.01220703125, 6.453125, 6.89404296875, 7.3349609375, 7.77587890625, 8.216796875, 8.65771484375, 9.0986328125, 9.53955078125, 9.98046875, 10.42138671875, 10.8623046875, 11.30322265625, 11.744140625, 12.18505859375, 12.6259765625, 13.06689453125, 13.5078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 7.0, 3.0, 9.0, 8.0, 8.0, 11.0, 27.0, 27.0, 52.0, 99.0, 249.0, 2600.0, 518.0, 187.0, 93.0, 43.0, 35.0, 22.0, 14.0, 11.0, 4.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0], "bins": [-3.919921875, -3.8189697265625, -3.718017578125, -3.6170654296875, -3.51611328125, -3.4151611328125, -3.314208984375, -3.2132568359375, -3.1123046875, -3.0113525390625, -2.910400390625, -2.8094482421875, -2.70849609375, -2.6075439453125, -2.506591796875, -2.4056396484375, -2.3046875, -2.2037353515625, -2.102783203125, -2.0018310546875, -1.90087890625, -1.7999267578125, -1.698974609375, -1.5980224609375, -1.4970703125, -1.3961181640625, -1.295166015625, -1.1942138671875, -1.09326171875, -0.9923095703125, -0.891357421875, -0.7904052734375, -0.689453125, -0.5885009765625, -0.487548828125, -0.3865966796875, -0.28564453125, -0.1846923828125, -0.083740234375, 0.0172119140625, 0.1181640625, 0.2191162109375, 0.320068359375, 0.4210205078125, 0.52197265625, 0.6229248046875, 0.723876953125, 0.8248291015625, 0.92578125, 1.0267333984375, 1.127685546875, 1.2286376953125, 1.32958984375, 1.4305419921875, 1.531494140625, 1.6324462890625, 1.7333984375, 1.8343505859375, 1.935302734375, 2.0362548828125, 2.13720703125, 2.2381591796875, 2.339111328125, 2.4400634765625, 2.541015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 10.0, 7.0, 17.0, 21.0, 32.0, 61.0, 99.0, 136.0, 165.0, 165.0, 131.0, 68.0, 33.0, 22.0, 10.0, 10.0, 8.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.878122329711914, -21.056169509887695, -20.23421859741211, -19.41226577758789, -18.590312957763672, -17.768362045288086, -16.946409225463867, -16.12445831298828, -15.302505493164062, -14.48055362701416, -13.658601760864258, -12.836648941040039, -12.014697074890137, -11.192745208740234, -10.370792388916016, -9.548840522766113, -8.726888656616211, -7.904936790466309, -7.082984447479248, -6.2610321044921875, -5.439080238342285, -4.617128372192383, -3.7951760292053223, -2.9732236862182617, -2.1512718200683594, -1.329319715499878, -0.5073676109313965, 0.31458449363708496, 1.1365365982055664, 1.9584884643554688, 2.7804408073425293, 3.60239315032959, 4.424346923828125, 5.246298789978027, 6.068251132965088, 6.890203475952148, 7.712155342102051, 8.534107208251953, 9.356060028076172, 10.178011894226074, 10.999963760375977, 11.821915626525879, 12.643867492675781, 13.4658203125, 14.287772178649902, 15.109724044799805, 15.931676864624023, 16.75362777709961, 17.575580596923828, 18.397533416748047, 19.219484329223633, 20.04143714904785, 20.863388061523438, 21.685340881347656, 22.507293701171875, 23.329246520996094, 24.15119743347168, 24.9731502532959, 25.795101165771484, 26.617053985595703, 27.439006805419922, 28.260957717895508, 29.082910537719727, 29.904861450195312, 30.72681427001953]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 7.0, 2.0, 7.0, 10.0, 7.0, 8.0, 17.0, 16.0, 29.0, 25.0, 27.0, 38.0, 47.0, 48.0, 55.0, 60.0, 59.0, 67.0, 47.0, 43.0, 43.0, 50.0, 44.0, 35.0, 41.0, 35.0, 26.0, 21.0, 16.0, 25.0, 10.0, 11.0, 11.0, 6.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.751505851745605, -10.385904312133789, -10.020303726196289, -9.654702186584473, -9.289101600646973, -8.923500061035156, -8.557899475097656, -8.19229793548584, -7.826696872711182, -7.461095809936523, -7.095494747161865, -6.729893684387207, -6.364292144775391, -5.998691558837891, -5.633090019226074, -5.267488956451416, -4.901887893676758, -4.5362868309021, -4.170685768127441, -3.805084466934204, -3.439483404159546, -3.0738823413848877, -2.7082810401916504, -2.342679977416992, -1.977078914642334, -1.6114778518676758, -1.245876669883728, -0.8802754878997803, -0.5146744251251221, -0.14907336235046387, 0.21652793884277344, 0.5821290016174316, 0.9477291107177734, 1.3133301734924316, 1.6789313554763794, 2.044532537460327, 2.4101336002349854, 2.7757346630096436, 3.141335964202881, 3.506937026977539, 3.8725380897521973, 4.2381391525268555, 4.603740215301514, 4.969341278076172, 5.334942817687988, 5.700543403625488, 6.066144943237305, 6.431746006011963, 6.797347068786621, 7.162948131561279, 7.5285491943359375, 7.894150733947754, 8.259751319885254, 8.62535285949707, 8.99095344543457, 9.356554985046387, 9.722156524658203, 10.08775806427002, 10.45335865020752, 10.818960189819336, 11.184560775756836, 11.550162315368652, 11.915763854980469, 12.281364440917969, 12.646965026855469]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 4.0, 7.0, 9.0, 18.0, 18.0, 42.0, 49.0, 67.0, 115.0, 156.0, 244.0, 418.0, 693.0, 1249.0, 2390.0, 5114.0, 12445.0, 34604.0, 111348.0, 309614.0, 353147.0, 144243.0, 44684.0, 15416.0, 6103.0, 2813.0, 1399.0, 761.0, 450.0, 305.0, 182.0, 132.0, 91.0, 53.0, 45.0, 39.0, 18.0, 19.0, 9.0, 9.0, 12.0, 4.0, 2.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0], "bins": [-16.96875, -16.4854736328125, -16.002197265625, -15.5189208984375, -15.03564453125, -14.5523681640625, -14.069091796875, -13.5858154296875, -13.1025390625, -12.6192626953125, -12.135986328125, -11.6527099609375, -11.16943359375, -10.6861572265625, -10.202880859375, -9.7196044921875, -9.236328125, -8.7530517578125, -8.269775390625, -7.7864990234375, -7.30322265625, -6.8199462890625, -6.336669921875, -5.8533935546875, -5.3701171875, -4.8868408203125, -4.403564453125, -3.9202880859375, -3.43701171875, -2.9537353515625, -2.470458984375, -1.9871826171875, -1.50390625, -1.0206298828125, -0.537353515625, -0.0540771484375, 0.42919921875, 0.9124755859375, 1.395751953125, 1.8790283203125, 2.3623046875, 2.8455810546875, 3.328857421875, 3.8121337890625, 4.29541015625, 4.7786865234375, 5.261962890625, 5.7452392578125, 6.228515625, 6.7117919921875, 7.195068359375, 7.6783447265625, 8.16162109375, 8.6448974609375, 9.128173828125, 9.6114501953125, 10.0947265625, 10.5780029296875, 11.061279296875, 11.5445556640625, 12.02783203125, 12.5111083984375, 12.994384765625, 13.4776611328125, 13.9609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 9.0, 11.0, 20.0, 14.0, 27.0, 34.0, 51.0, 65.0, 79.0, 82.0, 73.0, 94.0, 70.0, 78.0, 62.0, 66.0, 42.0, 40.0, 28.0, 16.0, 16.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.58367919921875, -6.3509521484375, -6.11822509765625, -5.885498046875, -5.65277099609375, -5.4200439453125, -5.18731689453125, -4.95458984375, -4.72186279296875, -4.4891357421875, -4.25640869140625, -4.023681640625, -3.79095458984375, -3.5582275390625, -3.32550048828125, -3.0927734375, -2.86004638671875, -2.6273193359375, -2.39459228515625, -2.161865234375, -1.92913818359375, -1.6964111328125, -1.46368408203125, -1.23095703125, -0.99822998046875, -0.7655029296875, -0.53277587890625, -0.300048828125, -0.06732177734375, 0.1654052734375, 0.39813232421875, 0.630859375, 0.86358642578125, 1.0963134765625, 1.32904052734375, 1.561767578125, 1.79449462890625, 2.0272216796875, 2.25994873046875, 2.49267578125, 2.72540283203125, 2.9581298828125, 3.19085693359375, 3.423583984375, 3.65631103515625, 3.8890380859375, 4.12176513671875, 4.3544921875, 4.58721923828125, 4.8199462890625, 5.05267333984375, 5.285400390625, 5.51812744140625, 5.7508544921875, 5.98358154296875, 6.21630859375, 6.44903564453125, 6.6817626953125, 6.91448974609375, 7.147216796875, 7.37994384765625, 7.6126708984375, 7.84539794921875, 8.078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 10.0, 8.0, 25.0, 17.0, 28.0, 42.0, 51.0, 99.0, 226.0, 477.0, 1310.0, 6941.0, 458157.0, 571209.0, 7479.0, 1433.0, 462.0, 209.0, 109.0, 58.0, 38.0, 42.0, 25.0, 17.0, 13.0, 12.0, 7.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.9375, -74.607421875, -72.27734375, -69.947265625, -67.6171875, -65.287109375, -62.95703125, -60.626953125, -58.296875, -55.966796875, -53.63671875, -51.306640625, -48.9765625, -46.646484375, -44.31640625, -41.986328125, -39.65625, -37.326171875, -34.99609375, -32.666015625, -30.3359375, -28.005859375, -25.67578125, -23.345703125, -21.015625, -18.685546875, -16.35546875, -14.025390625, -11.6953125, -9.365234375, -7.03515625, -4.705078125, -2.375, -0.044921875, 2.28515625, 4.615234375, 6.9453125, 9.275390625, 11.60546875, 13.935546875, 16.265625, 18.595703125, 20.92578125, 23.255859375, 25.5859375, 27.916015625, 30.24609375, 32.576171875, 34.90625, 37.236328125, 39.56640625, 41.896484375, 44.2265625, 46.556640625, 48.88671875, 51.216796875, 53.546875, 55.876953125, 58.20703125, 60.537109375, 62.8671875, 65.197265625, 67.52734375, 69.857421875, 72.1875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 8.0, 4.0, 4.0, 3.0, 8.0, 6.0, 13.0, 10.0, 25.0, 31.0, 42.0, 51.0, 57.0, 77.0, 95.0, 92.0, 95.0, 86.0, 76.0, 44.0, 48.0, 31.0, 33.0, 11.0, 10.0, 15.0, 6.0, 3.0, 5.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-50.09375, -48.83447265625, -47.5751953125, -46.31591796875, -45.056640625, -43.79736328125, -42.5380859375, -41.27880859375, -40.01953125, -38.76025390625, -37.5009765625, -36.24169921875, -34.982421875, -33.72314453125, -32.4638671875, -31.20458984375, -29.9453125, -28.68603515625, -27.4267578125, -26.16748046875, -24.908203125, -23.64892578125, -22.3896484375, -21.13037109375, -19.87109375, -18.61181640625, -17.3525390625, -16.09326171875, -14.833984375, -13.57470703125, -12.3154296875, -11.05615234375, -9.796875, -8.53759765625, -7.2783203125, -6.01904296875, -4.759765625, -3.50048828125, -2.2412109375, -0.98193359375, 0.27734375, 1.53662109375, 2.7958984375, 4.05517578125, 5.314453125, 6.57373046875, 7.8330078125, 9.09228515625, 10.3515625, 11.61083984375, 12.8701171875, 14.12939453125, 15.388671875, 16.64794921875, 17.9072265625, 19.16650390625, 20.42578125, 21.68505859375, 22.9443359375, 24.20361328125, 25.462890625, 26.72216796875, 27.9814453125, 29.24072265625, 30.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 7.0, 5.0, 8.0, 8.0, 12.0, 28.0, 20.0, 40.0, 43.0, 49.0, 91.0, 160.0, 269.0, 575.0, 2232.0, 27639.0, 931751.0, 80108.0, 3867.0, 805.0, 336.0, 189.0, 82.0, 67.0, 49.0, 36.0, 15.0, 15.0, 11.0, 10.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.34375, -22.581787109375, -21.81982421875, -21.057861328125, -20.2958984375, -19.533935546875, -18.77197265625, -18.010009765625, -17.248046875, -16.486083984375, -15.72412109375, -14.962158203125, -14.2001953125, -13.438232421875, -12.67626953125, -11.914306640625, -11.15234375, -10.390380859375, -9.62841796875, -8.866455078125, -8.1044921875, -7.342529296875, -6.58056640625, -5.818603515625, -5.056640625, -4.294677734375, -3.53271484375, -2.770751953125, -2.0087890625, -1.246826171875, -0.48486328125, 0.277099609375, 1.0390625, 1.801025390625, 2.56298828125, 3.324951171875, 4.0869140625, 4.848876953125, 5.61083984375, 6.372802734375, 7.134765625, 7.896728515625, 8.65869140625, 9.420654296875, 10.1826171875, 10.944580078125, 11.70654296875, 12.468505859375, 13.23046875, 13.992431640625, 14.75439453125, 15.516357421875, 16.2783203125, 17.040283203125, 17.80224609375, 18.564208984375, 19.326171875, 20.088134765625, 20.85009765625, 21.612060546875, 22.3740234375, 23.135986328125, 23.89794921875, 24.659912109375, 25.421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 9.0, 6.0, 11.0, 16.0, 31.0, 50.0, 76.0, 149.0, 200.0, 169.0, 125.0, 68.0, 34.0, 19.0, 16.0, 8.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0028228759765625, -0.002751663327217102, -0.002680450677871704, -0.002609238028526306, -0.002538025379180908, -0.0024668127298355103, -0.0023956000804901123, -0.0023243874311447144, -0.0022531747817993164, -0.0021819621324539185, -0.0021107494831085205, -0.0020395368337631226, -0.0019683241844177246, -0.0018971115350723267, -0.0018258988857269287, -0.0017546862363815308, -0.0016834735870361328, -0.0016122609376907349, -0.001541048288345337, -0.001469835638999939, -0.001398622989654541, -0.001327410340309143, -0.0012561976909637451, -0.0011849850416183472, -0.0011137723922729492, -0.0010425597429275513, -0.0009713470935821533, -0.0009001344442367554, -0.0008289217948913574, -0.0007577091455459595, -0.0006864964962005615, -0.0006152838468551636, -0.0005440711975097656, -0.0004728585481643677, -0.0004016458988189697, -0.0003304332494735718, -0.00025922060012817383, -0.00018800795078277588, -0.00011679530143737793, -4.558265209197998e-05, 2.562999725341797e-05, 9.684264659881592e-05, 0.00016805529594421387, 0.00023926794528961182, 0.00031048059463500977, 0.0003816932439804077, 0.00045290589332580566, 0.0005241185426712036, 0.0005953311920166016, 0.0006665438413619995, 0.0007377564907073975, 0.0008089691400527954, 0.0008801817893981934, 0.0009513944387435913, 0.0010226070880889893, 0.0010938197374343872, 0.0011650323867797852, 0.001236245036125183, 0.001307457685470581, 0.001378670334815979, 0.001449882984161377, 0.001521095633506775, 0.0015923082828521729, 0.0016635209321975708, 0.0017347335815429688]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 5.0, 2.0, 9.0, 6.0, 14.0, 17.0, 21.0, 35.0, 45.0, 98.0, 151.0, 286.0, 722.0, 3110.0, 38561.0, 951414.0, 48957.0, 3570.0, 816.0, 323.0, 155.0, 75.0, 53.0, 27.0, 25.0, 17.0, 13.0, 10.0, 7.0, 1.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.90625, -28.114990234375, -27.32373046875, -26.532470703125, -25.7412109375, -24.949951171875, -24.15869140625, -23.367431640625, -22.576171875, -21.784912109375, -20.99365234375, -20.202392578125, -19.4111328125, -18.619873046875, -17.82861328125, -17.037353515625, -16.24609375, -15.454833984375, -14.66357421875, -13.872314453125, -13.0810546875, -12.289794921875, -11.49853515625, -10.707275390625, -9.916015625, -9.124755859375, -8.33349609375, -7.542236328125, -6.7509765625, -5.959716796875, -5.16845703125, -4.377197265625, -3.5859375, -2.794677734375, -2.00341796875, -1.212158203125, -0.4208984375, 0.370361328125, 1.16162109375, 1.952880859375, 2.744140625, 3.535400390625, 4.32666015625, 5.117919921875, 5.9091796875, 6.700439453125, 7.49169921875, 8.282958984375, 9.07421875, 9.865478515625, 10.65673828125, 11.447998046875, 12.2392578125, 13.030517578125, 13.82177734375, 14.613037109375, 15.404296875, 16.195556640625, 16.98681640625, 17.778076171875, 18.5693359375, 19.360595703125, 20.15185546875, 20.943115234375, 21.734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 6.0, 1.0, 6.0, 3.0, 10.0, 10.0, 15.0, 10.0, 18.0, 24.0, 41.0, 63.0, 96.0, 123.0, 131.0, 129.0, 97.0, 62.0, 33.0, 28.0, 24.0, 13.0, 14.0, 5.0, 5.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.484375, -11.0792236328125, -10.674072265625, -10.2689208984375, -9.86376953125, -9.4586181640625, -9.053466796875, -8.6483154296875, -8.2431640625, -7.8380126953125, -7.432861328125, -7.0277099609375, -6.62255859375, -6.2174072265625, -5.812255859375, -5.4071044921875, -5.001953125, -4.5968017578125, -4.191650390625, -3.7864990234375, -3.38134765625, -2.9761962890625, -2.571044921875, -2.1658935546875, -1.7607421875, -1.3555908203125, -0.950439453125, -0.5452880859375, -0.14013671875, 0.2650146484375, 0.670166015625, 1.0753173828125, 1.48046875, 1.8856201171875, 2.290771484375, 2.6959228515625, 3.10107421875, 3.5062255859375, 3.911376953125, 4.3165283203125, 4.7216796875, 5.1268310546875, 5.531982421875, 5.9371337890625, 6.34228515625, 6.7474365234375, 7.152587890625, 7.5577392578125, 7.962890625, 8.3680419921875, 8.773193359375, 9.1783447265625, 9.58349609375, 9.9886474609375, 10.393798828125, 10.7989501953125, 11.2041015625, 11.6092529296875, 12.014404296875, 12.4195556640625, 12.82470703125, 13.2298583984375, 13.635009765625, 14.0401611328125, 14.4453125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 23.0, 35.0, 92.0, 164.0, 210.0, 199.0, 134.0, 62.0, 35.0, 20.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.58497619628906, -163.07998657226562, -155.57498168945312, -148.0699920654297, -140.56500244140625, -133.05999755859375, -125.55500793457031, -118.05001068115234, -110.54501342773438, -103.0400161743164, -95.53501892089844, -88.030029296875, -80.52503204345703, -73.02003479003906, -65.51504516601562, -58.010047912597656, -50.50505065917969, -43.00005340576172, -35.495059967041016, -27.99006462097168, -20.485069274902344, -12.980072021484375, -5.475078582763672, 2.0299148559570312, 9.534912109375, 17.039907455444336, 24.544902801513672, 32.049896240234375, 39.554893493652344, 47.05989074707031, 54.564884185791016, 62.06987762451172, 69.57485961914062, 77.0798568725586, 84.58485412597656, 92.08984375, 99.59484100341797, 107.09983825683594, 114.60482788085938, 122.10982513427734, 129.6148223876953, 137.11981201171875, 144.62481689453125, 152.1298065185547, 159.63479614257812, 167.13980102539062, 174.64479064941406, 182.1497802734375, 189.65478515625, 197.15977478027344, 204.66477966308594, 212.16976928710938, 219.67477416992188, 227.1797637939453, 234.68475341796875, 242.18975830078125, 249.6947479248047, 257.1997375488281, 264.7047424316406, 272.2097473144531, 279.7147216796875, 287.2197265625, 294.7247314453125, 302.2297058105469, 309.7347106933594]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 11.0, 10.0, 10.0, 13.0, 10.0, 18.0, 16.0, 18.0, 31.0, 24.0, 23.0, 43.0, 38.0, 28.0, 43.0, 33.0, 41.0, 39.0, 38.0, 53.0, 25.0, 37.0, 35.0, 32.0, 33.0, 36.0, 30.0, 24.0, 23.0, 28.0, 20.0, 20.0, 16.0, 14.0, 14.0, 11.0, 6.0, 8.0, 9.0, 4.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.84262084960938, -72.40647888183594, -69.9703369140625, -67.53418731689453, -65.0980453491211, -62.661903381347656, -60.22576141357422, -57.789615631103516, -55.35346984863281, -52.917327880859375, -50.48118209838867, -48.045040130615234, -45.60889434814453, -43.172752380371094, -40.736610412597656, -38.30046463012695, -35.864322662353516, -33.42818069458008, -30.992034912109375, -28.555892944335938, -26.119747161865234, -23.683605194091797, -21.247461318969727, -18.811317443847656, -16.375173568725586, -13.939029693603516, -11.502885818481445, -9.066742897033691, -6.630599021911621, -4.194455146789551, -1.7583122253417969, 0.6778316497802734, 3.1139755249023438, 5.550119400024414, 7.986262798309326, 10.422406196594238, 12.858550071716309, 15.294693946838379, 17.730836868286133, 20.166980743408203, 22.603124618530273, 25.039268493652344, 27.475412368774414, 29.911556243896484, 32.34769821166992, 34.783843994140625, 37.21998596191406, 39.6561279296875, 42.0922737121582, 44.52841567993164, 46.964561462402344, 49.40070343017578, 51.836849212646484, 54.27299118041992, 56.709136962890625, 59.14527893066406, 61.5814208984375, 64.01756286621094, 66.45370483398438, 68.88985443115234, 71.32599639892578, 73.76213836669922, 76.19828033447266, 78.63442993164062, 81.07057189941406]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 8.0, 10.0, 19.0, 17.0, 29.0, 35.0, 79.0, 150.0, 267.0, 569.0, 1408.0, 4090.0, 36041.0, 4122154.0, 23625.0, 3482.0, 1245.0, 525.0, 222.0, 114.0, 77.0, 34.0, 22.0, 15.0, 9.0, 14.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.15625, -43.7197265625, -42.283203125, -40.8466796875, -39.41015625, -37.9736328125, -36.537109375, -35.1005859375, -33.6640625, -32.2275390625, -30.791015625, -29.3544921875, -27.91796875, -26.4814453125, -25.044921875, -23.6083984375, -22.171875, -20.7353515625, -19.298828125, -17.8623046875, -16.42578125, -14.9892578125, -13.552734375, -12.1162109375, -10.6796875, -9.2431640625, -7.806640625, -6.3701171875, -4.93359375, -3.4970703125, -2.060546875, -0.6240234375, 0.8125, 2.2490234375, 3.685546875, 5.1220703125, 6.55859375, 7.9951171875, 9.431640625, 10.8681640625, 12.3046875, 13.7412109375, 15.177734375, 16.6142578125, 18.05078125, 19.4873046875, 20.923828125, 22.3603515625, 23.796875, 25.2333984375, 26.669921875, 28.1064453125, 29.54296875, 30.9794921875, 32.416015625, 33.8525390625, 35.2890625, 36.7255859375, 38.162109375, 39.5986328125, 41.03515625, 42.4716796875, 43.908203125, 45.3447265625, 46.78125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 5.0, 10.0, 11.0, 18.0, 20.0, 38.0, 56.0, 72.0, 73.0, 90.0, 101.0, 107.0, 92.0, 89.0, 76.0, 54.0, 26.0, 27.0, 14.0, 13.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9765625, -7.6802978515625, -7.384033203125, -7.0877685546875, -6.79150390625, -6.4952392578125, -6.198974609375, -5.9027099609375, -5.6064453125, -5.3101806640625, -5.013916015625, -4.7176513671875, -4.42138671875, -4.1251220703125, -3.828857421875, -3.5325927734375, -3.236328125, -2.9400634765625, -2.643798828125, -2.3475341796875, -2.05126953125, -1.7550048828125, -1.458740234375, -1.1624755859375, -0.8662109375, -0.5699462890625, -0.273681640625, 0.0225830078125, 0.31884765625, 0.6151123046875, 0.911376953125, 1.2076416015625, 1.50390625, 1.8001708984375, 2.096435546875, 2.3927001953125, 2.68896484375, 2.9852294921875, 3.281494140625, 3.5777587890625, 3.8740234375, 4.1702880859375, 4.466552734375, 4.7628173828125, 5.05908203125, 5.3553466796875, 5.651611328125, 5.9478759765625, 6.244140625, 6.5404052734375, 6.836669921875, 7.1329345703125, 7.42919921875, 7.7254638671875, 8.021728515625, 8.3179931640625, 8.6142578125, 8.9105224609375, 9.206787109375, 9.5030517578125, 9.79931640625, 10.0955810546875, 10.391845703125, 10.6881103515625, 10.984375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 11.0, 17.0, 14.0, 15.0, 20.0, 18.0, 34.0, 23.0, 43.0, 67.0, 113.0, 380.0, 1400.0, 6417.0, 3948057.0, 230404.0, 5315.0, 1210.0, 298.0, 113.0, 52.0, 44.0, 28.0, 27.0, 34.0, 19.0, 15.0, 11.0, 14.0, 12.0, 11.0, 7.0, 5.0, 0.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-60.59375, -59.03759765625, -57.4814453125, -55.92529296875, -54.369140625, -52.81298828125, -51.2568359375, -49.70068359375, -48.14453125, -46.58837890625, -45.0322265625, -43.47607421875, -41.919921875, -40.36376953125, -38.8076171875, -37.25146484375, -35.6953125, -34.13916015625, -32.5830078125, -31.02685546875, -29.470703125, -27.91455078125, -26.3583984375, -24.80224609375, -23.24609375, -21.68994140625, -20.1337890625, -18.57763671875, -17.021484375, -15.46533203125, -13.9091796875, -12.35302734375, -10.796875, -9.24072265625, -7.6845703125, -6.12841796875, -4.572265625, -3.01611328125, -1.4599609375, 0.09619140625, 1.65234375, 3.20849609375, 4.7646484375, 6.32080078125, 7.876953125, 9.43310546875, 10.9892578125, 12.54541015625, 14.1015625, 15.65771484375, 17.2138671875, 18.77001953125, 20.326171875, 21.88232421875, 23.4384765625, 24.99462890625, 26.55078125, 28.10693359375, 29.6630859375, 31.21923828125, 32.775390625, 34.33154296875, 35.8876953125, 37.44384765625, 39.0]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 39.0, 168.0, 3617.0, 159.0, 35.0, 15.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.140625, -11.89044189453125, -11.6402587890625, -11.39007568359375, -11.139892578125, -10.88970947265625, -10.6395263671875, -10.38934326171875, -10.13916015625, -9.88897705078125, -9.6387939453125, -9.38861083984375, -9.138427734375, -8.88824462890625, -8.6380615234375, -8.38787841796875, -8.1376953125, -7.88751220703125, -7.6373291015625, -7.38714599609375, -7.136962890625, -6.88677978515625, -6.6365966796875, -6.38641357421875, -6.13623046875, -5.88604736328125, -5.6358642578125, -5.38568115234375, -5.135498046875, -4.88531494140625, -4.6351318359375, -4.38494873046875, -4.134765625, -3.88458251953125, -3.6343994140625, -3.38421630859375, -3.134033203125, -2.88385009765625, -2.6336669921875, -2.38348388671875, -2.13330078125, -1.88311767578125, -1.6329345703125, -1.38275146484375, -1.132568359375, -0.88238525390625, -0.6322021484375, -0.38201904296875, -0.1318359375, 0.11834716796875, 0.3685302734375, 0.61871337890625, 0.868896484375, 1.11907958984375, 1.3692626953125, 1.61944580078125, 1.86962890625, 2.11981201171875, 2.3699951171875, 2.62017822265625, 2.870361328125, 3.12054443359375, 3.3707275390625, 3.62091064453125, 3.87109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 22.0, 36.0, 58.0, 72.0, 116.0, 199.0, 173.0, 123.0, 64.0, 44.0, 26.0, 11.0, 13.0, 2.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.56570053100586, -23.767024993896484, -22.968351364135742, -22.169675827026367, -21.371002197265625, -20.57232666015625, -19.773651123046875, -18.974977493286133, -18.176301956176758, -17.377626419067383, -16.57895278930664, -15.780277252197266, -14.981602668762207, -14.182928085327148, -13.38425350189209, -12.585578918457031, -11.786904335021973, -10.988229751586914, -10.189555168151855, -9.390880584716797, -8.592205047607422, -7.793530464172363, -6.994855880737305, -6.196180820465088, -5.397506237030029, -4.598831653594971, -3.800156593322754, -3.0014820098876953, -2.2028071880340576, -1.40413236618042, -0.6054577827453613, 0.19321727752685547, 0.9918918609619141, 1.7905666828155518, 2.5892415046691895, 3.387916088104248, 4.186591148376465, 4.985265731811523, 5.783940315246582, 6.582615375518799, 7.381289958953857, 8.179965019226074, 8.978639602661133, 9.777314186096191, 10.57598876953125, 11.374664306640625, 12.173337936401367, 12.972013473510742, 13.7706880569458, 14.56936264038086, 15.368037223815918, 16.166711807250977, 16.96538734436035, 17.764060974121094, 18.56273651123047, 19.361412048339844, 20.160085678100586, 20.95876121520996, 21.757434844970703, 22.556110382080078, 23.35478401184082, 24.153459548950195, 24.952133178710938, 25.750808715820312, 26.549484252929688]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 11.0, 12.0, 7.0, 13.0, 16.0, 14.0, 18.0, 23.0, 31.0, 24.0, 30.0, 25.0, 24.0, 41.0, 35.0, 38.0, 36.0, 29.0, 50.0, 34.0, 48.0, 43.0, 34.0, 36.0, 23.0, 29.0, 26.0, 32.0, 32.0, 25.0, 19.0, 22.0, 11.0, 16.0, 15.0, 14.0, 4.0, 12.0, 9.0, 5.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-8.252778053283691, -8.00320816040039, -7.75363826751709, -7.504068374633789, -7.254498481750488, -7.0049285888671875, -6.755358695983887, -6.505788326263428, -6.256218433380127, -6.006648540496826, -5.757078647613525, -5.507508754730225, -5.257938861846924, -5.008368492126465, -4.758798599243164, -4.509228706359863, -4.2596588134765625, -4.010088920593262, -3.760519027709961, -3.51094913482666, -3.2613790035247803, -3.0118091106414795, -2.7622392177581787, -2.512669086456299, -2.2630996704101562, -2.0135297775268555, -1.7639597654342651, -1.5143898725509644, -1.264819860458374, -1.0152499675750732, -0.7656800746917725, -0.5161100625991821, -0.2665400505065918, -0.016970112919807434, 0.23259982466697693, 0.4821697473526001, 0.7317396998405457, 0.9813096523284912, 1.230879545211792, 1.4804495573043823, 1.730019450187683, 1.9795893430709839, 2.229159355163574, 2.478729248046875, 2.728299140930176, 2.9778690338134766, 3.2274389266967773, 3.4770090579986572, 3.726578950881958, 3.976148843765259, 4.225718975067139, 4.4752888679504395, 4.72485876083374, 4.974428653717041, 5.223998546600342, 5.473568439483643, 5.723138332366943, 5.972708225250244, 6.222278118133545, 6.471848011016846, 6.7214179039001465, 6.9709882736206055, 7.220558166503906, 7.470128059387207, 7.719697952270508]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 14.0, 18.0, 30.0, 55.0, 58.0, 99.0, 171.0, 330.0, 608.0, 1389.0, 3408.0, 11301.0, 54135.0, 296777.0, 520699.0, 126087.0, 23497.0, 5847.0, 2086.0, 865.0, 477.0, 237.0, 129.0, 76.0, 47.0, 36.0, 20.0, 17.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.0625, -21.418212890625, -20.77392578125, -20.129638671875, -19.4853515625, -18.841064453125, -18.19677734375, -17.552490234375, -16.908203125, -16.263916015625, -15.61962890625, -14.975341796875, -14.3310546875, -13.686767578125, -13.04248046875, -12.398193359375, -11.75390625, -11.109619140625, -10.46533203125, -9.821044921875, -9.1767578125, -8.532470703125, -7.88818359375, -7.243896484375, -6.599609375, -5.955322265625, -5.31103515625, -4.666748046875, -4.0224609375, -3.378173828125, -2.73388671875, -2.089599609375, -1.4453125, -0.801025390625, -0.15673828125, 0.487548828125, 1.1318359375, 1.776123046875, 2.42041015625, 3.064697265625, 3.708984375, 4.353271484375, 4.99755859375, 5.641845703125, 6.2861328125, 6.930419921875, 7.57470703125, 8.218994140625, 8.86328125, 9.507568359375, 10.15185546875, 10.796142578125, 11.4404296875, 12.084716796875, 12.72900390625, 13.373291015625, 14.017578125, 14.661865234375, 15.30615234375, 15.950439453125, 16.5947265625, 17.239013671875, 17.88330078125, 18.527587890625, 19.171875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 9.0, 5.0, 9.0, 19.0, 35.0, 33.0, 53.0, 72.0, 89.0, 69.0, 108.0, 92.0, 96.0, 75.0, 81.0, 55.0, 37.0, 14.0, 18.0, 14.0, 8.0, 9.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.86083984375, -7.5576171875, -7.25439453125, -6.951171875, -6.64794921875, -6.3447265625, -6.04150390625, -5.73828125, -5.43505859375, -5.1318359375, -4.82861328125, -4.525390625, -4.22216796875, -3.9189453125, -3.61572265625, -3.3125, -3.00927734375, -2.7060546875, -2.40283203125, -2.099609375, -1.79638671875, -1.4931640625, -1.18994140625, -0.88671875, -0.58349609375, -0.2802734375, 0.02294921875, 0.326171875, 0.62939453125, 0.9326171875, 1.23583984375, 1.5390625, 1.84228515625, 2.1455078125, 2.44873046875, 2.751953125, 3.05517578125, 3.3583984375, 3.66162109375, 3.96484375, 4.26806640625, 4.5712890625, 4.87451171875, 5.177734375, 5.48095703125, 5.7841796875, 6.08740234375, 6.390625, 6.69384765625, 6.9970703125, 7.30029296875, 7.603515625, 7.90673828125, 8.2099609375, 8.51318359375, 8.81640625, 9.11962890625, 9.4228515625, 9.72607421875, 10.029296875, 10.33251953125, 10.6357421875, 10.93896484375, 11.2421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 13.0, 9.0, 15.0, 20.0, 48.0, 69.0, 110.0, 206.0, 440.0, 1180.0, 4682.0, 176166.0, 853914.0, 8768.0, 1656.0, 589.0, 276.0, 159.0, 91.0, 49.0, 27.0, 26.0, 17.0, 8.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.8125, -73.119140625, -70.42578125, -67.732421875, -65.0390625, -62.345703125, -59.65234375, -56.958984375, -54.265625, -51.572265625, -48.87890625, -46.185546875, -43.4921875, -40.798828125, -38.10546875, -35.412109375, -32.71875, -30.025390625, -27.33203125, -24.638671875, -21.9453125, -19.251953125, -16.55859375, -13.865234375, -11.171875, -8.478515625, -5.78515625, -3.091796875, -0.3984375, 2.294921875, 4.98828125, 7.681640625, 10.375, 13.068359375, 15.76171875, 18.455078125, 21.1484375, 23.841796875, 26.53515625, 29.228515625, 31.921875, 34.615234375, 37.30859375, 40.001953125, 42.6953125, 45.388671875, 48.08203125, 50.775390625, 53.46875, 56.162109375, 58.85546875, 61.548828125, 64.2421875, 66.935546875, 69.62890625, 72.322265625, 75.015625, 77.708984375, 80.40234375, 83.095703125, 85.7890625, 88.482421875, 91.17578125, 93.869140625, 96.5625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 14.0, 15.0, 23.0, 39.0, 35.0, 60.0, 82.0, 107.0, 105.0, 122.0, 97.0, 73.0, 71.0, 52.0, 25.0, 19.0, 12.0, 10.0, 2.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.625, -63.5029296875, -61.380859375, -59.2587890625, -57.13671875, -55.0146484375, -52.892578125, -50.7705078125, -48.6484375, -46.5263671875, -44.404296875, -42.2822265625, -40.16015625, -38.0380859375, -35.916015625, -33.7939453125, -31.671875, -29.5498046875, -27.427734375, -25.3056640625, -23.18359375, -21.0615234375, -18.939453125, -16.8173828125, -14.6953125, -12.5732421875, -10.451171875, -8.3291015625, -6.20703125, -4.0849609375, -1.962890625, 0.1591796875, 2.28125, 4.4033203125, 6.525390625, 8.6474609375, 10.76953125, 12.8916015625, 15.013671875, 17.1357421875, 19.2578125, 21.3798828125, 23.501953125, 25.6240234375, 27.74609375, 29.8681640625, 31.990234375, 34.1123046875, 36.234375, 38.3564453125, 40.478515625, 42.6005859375, 44.72265625, 46.8447265625, 48.966796875, 51.0888671875, 53.2109375, 55.3330078125, 57.455078125, 59.5771484375, 61.69921875, 63.8212890625, 65.943359375, 68.0654296875, 70.1875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 10.0, 11.0, 12.0, 19.0, 26.0, 39.0, 47.0, 82.0, 147.0, 262.0, 706.0, 7922.0, 1021597.0, 16037.0, 877.0, 300.0, 162.0, 96.0, 72.0, 27.0, 33.0, 21.0, 17.0, 16.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -49.60791015625, -47.8720703125, -46.13623046875, -44.400390625, -42.66455078125, -40.9287109375, -39.19287109375, -37.45703125, -35.72119140625, -33.9853515625, -32.24951171875, -30.513671875, -28.77783203125, -27.0419921875, -25.30615234375, -23.5703125, -21.83447265625, -20.0986328125, -18.36279296875, -16.626953125, -14.89111328125, -13.1552734375, -11.41943359375, -9.68359375, -7.94775390625, -6.2119140625, -4.47607421875, -2.740234375, -1.00439453125, 0.7314453125, 2.46728515625, 4.203125, 5.93896484375, 7.6748046875, 9.41064453125, 11.146484375, 12.88232421875, 14.6181640625, 16.35400390625, 18.08984375, 19.82568359375, 21.5615234375, 23.29736328125, 25.033203125, 26.76904296875, 28.5048828125, 30.24072265625, 31.9765625, 33.71240234375, 35.4482421875, 37.18408203125, 38.919921875, 40.65576171875, 42.3916015625, 44.12744140625, 45.86328125, 47.59912109375, 49.3349609375, 51.07080078125, 52.806640625, 54.54248046875, 56.2783203125, 58.01416015625, 59.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 7.0, 11.0, 17.0, 7.0, 19.0, 30.0, 35.0, 46.0, 76.0, 115.0, 114.0, 118.0, 98.0, 64.0, 54.0, 36.0, 36.0, 24.0, 13.0, 14.0, 8.0, 7.0, 5.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0016698837280273438, -0.001623407006263733, -0.001576930284500122, -0.0015304535627365112, -0.0014839768409729004, -0.0014375001192092896, -0.0013910233974456787, -0.0013445466756820679, -0.001298069953918457, -0.0012515932321548462, -0.0012051165103912354, -0.0011586397886276245, -0.0011121630668640137, -0.0010656863451004028, -0.001019209623336792, -0.0009727329015731812, -0.0009262561798095703, -0.0008797794580459595, -0.0008333027362823486, -0.0007868260145187378, -0.000740349292755127, -0.0006938725709915161, -0.0006473958492279053, -0.0006009191274642944, -0.0005544424057006836, -0.0005079656839370728, -0.0004614889621734619, -0.0004150122404098511, -0.00036853551864624023, -0.0003220587968826294, -0.00027558207511901855, -0.00022910535335540771, -0.00018262863159179688, -0.00013615190982818604, -8.96751880645752e-05, -4.3198466300964355e-05, 3.2782554626464844e-06, 4.9754977226257324e-05, 9.623169898986816e-05, 0.000142708420753479, 0.00018918514251708984, 0.00023566186428070068, 0.0002821385860443115, 0.00032861530780792236, 0.0003750920295715332, 0.00042156875133514404, 0.0004680454730987549, 0.0005145221948623657, 0.0005609989166259766, 0.0006074756383895874, 0.0006539523601531982, 0.0007004290819168091, 0.0007469058036804199, 0.0007933825254440308, 0.0008398592472076416, 0.0008863359689712524, 0.0009328126907348633, 0.0009792894124984741, 0.001025766134262085, 0.0010722428560256958, 0.0011187195777893066, 0.0011651962995529175, 0.0012116730213165283, 0.0012581497430801392, 0.00130462646484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 10.0, 12.0, 12.0, 9.0, 30.0, 35.0, 54.0, 103.0, 189.0, 356.0, 932.0, 4847.0, 149219.0, 879976.0, 10188.0, 1599.0, 461.0, 207.0, 98.0, 72.0, 51.0, 15.0, 22.0, 16.0, 8.0, 9.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.875, -44.732666015625, -43.59033203125, -42.447998046875, -41.3056640625, -40.163330078125, -39.02099609375, -37.878662109375, -36.736328125, -35.593994140625, -34.45166015625, -33.309326171875, -32.1669921875, -31.024658203125, -29.88232421875, -28.739990234375, -27.59765625, -26.455322265625, -25.31298828125, -24.170654296875, -23.0283203125, -21.885986328125, -20.74365234375, -19.601318359375, -18.458984375, -17.316650390625, -16.17431640625, -15.031982421875, -13.8896484375, -12.747314453125, -11.60498046875, -10.462646484375, -9.3203125, -8.177978515625, -7.03564453125, -5.893310546875, -4.7509765625, -3.608642578125, -2.46630859375, -1.323974609375, -0.181640625, 0.960693359375, 2.10302734375, 3.245361328125, 4.3876953125, 5.530029296875, 6.67236328125, 7.814697265625, 8.95703125, 10.099365234375, 11.24169921875, 12.384033203125, 13.5263671875, 14.668701171875, 15.81103515625, 16.953369140625, 18.095703125, 19.238037109375, 20.38037109375, 21.522705078125, 22.6650390625, 23.807373046875, 24.94970703125, 26.092041015625, 27.234375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 10.0, 4.0, 9.0, 5.0, 26.0, 51.0, 119.0, 177.0, 240.0, 170.0, 79.0, 37.0, 22.0, 10.0, 6.0, 5.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.8125, -36.8984375, -35.984375, -35.0703125, -34.15625, -33.2421875, -32.328125, -31.4140625, -30.5, -29.5859375, -28.671875, -27.7578125, -26.84375, -25.9296875, -25.015625, -24.1015625, -23.1875, -22.2734375, -21.359375, -20.4453125, -19.53125, -18.6171875, -17.703125, -16.7890625, -15.875, -14.9609375, -14.046875, -13.1328125, -12.21875, -11.3046875, -10.390625, -9.4765625, -8.5625, -7.6484375, -6.734375, -5.8203125, -4.90625, -3.9921875, -3.078125, -2.1640625, -1.25, -0.3359375, 0.578125, 1.4921875, 2.40625, 3.3203125, 4.234375, 5.1484375, 6.0625, 6.9765625, 7.890625, 8.8046875, 9.71875, 10.6328125, 11.546875, 12.4609375, 13.375, 14.2890625, 15.203125, 16.1171875, 17.03125, 17.9453125, 18.859375, 19.7734375, 20.6875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 19.0, 73.0, 231.0, 359.0, 219.0, 64.0, 17.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-643.5451049804688, -629.9508056640625, -616.3564453125, -602.7621459960938, -589.1677856445312, -575.573486328125, -561.9791259765625, -548.3848266601562, -534.79052734375, -521.1962280273438, -507.60186767578125, -494.0075378417969, -480.4132080078125, -466.81890869140625, -453.2245788574219, -439.6302490234375, -426.035888671875, -412.4415588378906, -398.84722900390625, -385.2528991699219, -371.6585693359375, -358.06427001953125, -344.4699401855469, -330.8756103515625, -317.2812805175781, -303.68695068359375, -290.0926208496094, -276.498291015625, -262.90399169921875, -249.3096466064453, -235.71533203125, -222.12100219726562, -208.52670288085938, -194.932373046875, -181.33804321289062, -167.7437286376953, -154.14939880371094, -140.55506896972656, -126.96074676513672, -113.36642456054688, -99.7720947265625, -86.17776489257812, -72.58344268798828, -58.98911666870117, -45.39479064941406, -31.800460815429688, -18.206138610839844, -4.61181640625, 8.982513427734375, 22.576839447021484, 36.171165466308594, 49.7654914855957, 63.35981750488281, 76.95414733886719, 90.54846954345703, 104.14279174804688, 117.73712158203125, 131.33145141601562, 144.92578125, 158.5200958251953, 172.1144256591797, 185.70875549316406, 199.30307006835938, 212.89739990234375, 226.49172973632812]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 5.0, 10.0, 16.0, 7.0, 13.0, 13.0, 18.0, 14.0, 26.0, 30.0, 41.0, 35.0, 44.0, 36.0, 50.0, 50.0, 43.0, 56.0, 45.0, 44.0, 45.0, 49.0, 39.0, 41.0, 42.0, 28.0, 25.0, 19.0, 11.0, 23.0, 16.0, 12.0, 15.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-125.21125030517578, -121.36190795898438, -117.51256561279297, -113.66322326660156, -109.81388092041016, -105.96453857421875, -102.11518859863281, -98.26585388183594, -94.41650390625, -90.5671615600586, -86.71781921386719, -82.86847686767578, -79.01913452148438, -75.16979217529297, -71.32044982910156, -67.47109985351562, -63.62176513671875, -59.772422790527344, -55.92308044433594, -52.07373809814453, -48.224395751953125, -44.37505340576172, -40.52570724487305, -36.67636489868164, -32.827022552490234, -28.977680206298828, -25.128337860107422, -21.278993606567383, -17.429651260375977, -13.58030891418457, -9.730964660644531, -5.881622314453125, -2.0322723388671875, 1.817070484161377, 5.666413307189941, 9.515756607055664, 13.36509895324707, 17.214441299438477, 21.063785552978516, 24.913127899169922, 28.762470245361328, 32.611812591552734, 36.46115493774414, 40.31050109863281, 44.15984344482422, 48.009185791015625, 51.85852813720703, 55.70787048339844, 59.557212829589844, 63.40655517578125, 67.25589752197266, 71.10523986816406, 74.95458221435547, 78.80392456054688, 82.65327453613281, 86.50260925292969, 90.35195922851562, 94.20130157470703, 98.05064392089844, 101.89998626708984, 105.74932861328125, 109.59867095947266, 113.44801330566406, 117.29736328125, 121.14669799804688]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 11.0, 19.0, 49.0, 90.0, 161.0, 370.0, 967.0, 3169.0, 19725.0, 4001239.0, 157140.0, 8285.0, 1820.0, 674.0, 256.0, 123.0, 69.0, 38.0, 25.0, 13.0, 9.0, 9.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.555908203125, -25.43994140625, -24.323974609375, -23.2080078125, -22.092041015625, -20.97607421875, -19.860107421875, -18.744140625, -17.628173828125, -16.51220703125, -15.396240234375, -14.2802734375, -13.164306640625, -12.04833984375, -10.932373046875, -9.81640625, -8.700439453125, -7.58447265625, -6.468505859375, -5.3525390625, -4.236572265625, -3.12060546875, -2.004638671875, -0.888671875, 0.227294921875, 1.34326171875, 2.459228515625, 3.5751953125, 4.691162109375, 5.80712890625, 6.923095703125, 8.0390625, 9.155029296875, 10.27099609375, 11.386962890625, 12.5029296875, 13.618896484375, 14.73486328125, 15.850830078125, 16.966796875, 18.082763671875, 19.19873046875, 20.314697265625, 21.4306640625, 22.546630859375, 23.66259765625, 24.778564453125, 25.89453125, 27.010498046875, 28.12646484375, 29.242431640625, 30.3583984375, 31.474365234375, 32.59033203125, 33.706298828125, 34.822265625, 35.938232421875, 37.05419921875, 38.170166015625, 39.2861328125, 40.402099609375, 41.51806640625, 42.634033203125, 43.75]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 12.0, 21.0, 28.0, 34.0, 48.0, 51.0, 55.0, 92.0, 98.0, 85.0, 90.0, 83.0, 80.0, 70.0, 41.0, 30.0, 16.0, 9.0, 14.0, 4.0, 8.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8671875, -7.5694580078125, -7.271728515625, -6.9739990234375, -6.67626953125, -6.3785400390625, -6.080810546875, -5.7830810546875, -5.4853515625, -5.1876220703125, -4.889892578125, -4.5921630859375, -4.29443359375, -3.9967041015625, -3.698974609375, -3.4012451171875, -3.103515625, -2.8057861328125, -2.508056640625, -2.2103271484375, -1.91259765625, -1.6148681640625, -1.317138671875, -1.0194091796875, -0.7216796875, -0.4239501953125, -0.126220703125, 0.1715087890625, 0.46923828125, 0.7669677734375, 1.064697265625, 1.3624267578125, 1.66015625, 1.9578857421875, 2.255615234375, 2.5533447265625, 2.85107421875, 3.1488037109375, 3.446533203125, 3.7442626953125, 4.0419921875, 4.3397216796875, 4.637451171875, 4.9351806640625, 5.23291015625, 5.5306396484375, 5.828369140625, 6.1260986328125, 6.423828125, 6.7215576171875, 7.019287109375, 7.3170166015625, 7.61474609375, 7.9124755859375, 8.210205078125, 8.5079345703125, 8.8056640625, 9.1033935546875, 9.401123046875, 9.6988525390625, 9.99658203125, 10.2943115234375, 10.592041015625, 10.8897705078125, 11.1875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 10.0, 7.0, 8.0, 17.0, 23.0, 37.0, 36.0, 55.0, 73.0, 106.0, 142.0, 190.0, 305.0, 574.0, 1507.0, 5560.0, 42947.0, 4076205.0, 56760.0, 6483.0, 1616.0, 604.0, 293.0, 189.0, 145.0, 99.0, 80.0, 52.0, 34.0, 33.0, 24.0, 22.0, 10.0, 11.0, 9.0, 3.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.59375, -31.650146484375, -30.70654296875, -29.762939453125, -28.8193359375, -27.875732421875, -26.93212890625, -25.988525390625, -25.044921875, -24.101318359375, -23.15771484375, -22.214111328125, -21.2705078125, -20.326904296875, -19.38330078125, -18.439697265625, -17.49609375, -16.552490234375, -15.60888671875, -14.665283203125, -13.7216796875, -12.778076171875, -11.83447265625, -10.890869140625, -9.947265625, -9.003662109375, -8.06005859375, -7.116455078125, -6.1728515625, -5.229248046875, -4.28564453125, -3.342041015625, -2.3984375, -1.454833984375, -0.51123046875, 0.432373046875, 1.3759765625, 2.319580078125, 3.26318359375, 4.206787109375, 5.150390625, 6.093994140625, 7.03759765625, 7.981201171875, 8.9248046875, 9.868408203125, 10.81201171875, 11.755615234375, 12.69921875, 13.642822265625, 14.58642578125, 15.530029296875, 16.4736328125, 17.417236328125, 18.36083984375, 19.304443359375, 20.248046875, 21.191650390625, 22.13525390625, 23.078857421875, 24.0224609375, 24.966064453125, 25.90966796875, 26.853271484375, 27.796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 12.0, 10.0, 13.0, 24.0, 42.0, 149.0, 2008.0, 1551.0, 152.0, 51.0, 30.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9453125, -9.61376953125, -9.2822265625, -8.95068359375, -8.619140625, -8.28759765625, -7.9560546875, -7.62451171875, -7.29296875, -6.96142578125, -6.6298828125, -6.29833984375, -5.966796875, -5.63525390625, -5.3037109375, -4.97216796875, -4.640625, -4.30908203125, -3.9775390625, -3.64599609375, -3.314453125, -2.98291015625, -2.6513671875, -2.31982421875, -1.98828125, -1.65673828125, -1.3251953125, -0.99365234375, -0.662109375, -0.33056640625, 0.0009765625, 0.33251953125, 0.6640625, 0.99560546875, 1.3271484375, 1.65869140625, 1.990234375, 2.32177734375, 2.6533203125, 2.98486328125, 3.31640625, 3.64794921875, 3.9794921875, 4.31103515625, 4.642578125, 4.97412109375, 5.3056640625, 5.63720703125, 5.96875, 6.30029296875, 6.6318359375, 6.96337890625, 7.294921875, 7.62646484375, 7.9580078125, 8.28955078125, 8.62109375, 8.95263671875, 9.2841796875, 9.61572265625, 9.947265625, 10.27880859375, 10.6103515625, 10.94189453125, 11.2734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 9.0, 13.0, 25.0, 40.0, 84.0, 143.0, 195.0, 192.0, 126.0, 69.0, 39.0, 28.0, 12.0, 10.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.317665100097656, -45.959861755371094, -44.602054595947266, -43.2442512512207, -41.886444091796875, -40.52864074707031, -39.170833587646484, -37.81303024291992, -36.455223083496094, -35.09741973876953, -33.7396125793457, -32.38180923461914, -31.024002075195312, -29.666196823120117, -28.308391571044922, -26.95058822631836, -25.592782974243164, -24.23497772216797, -22.877172470092773, -21.519367218017578, -20.161561965942383, -18.803756713867188, -17.445953369140625, -16.088146209716797, -14.730341911315918, -13.372536659240723, -12.014731407165527, -10.656927108764648, -9.299121856689453, -7.9413161277771, -6.5835113525390625, -5.225706100463867, -3.867900848388672, -2.5100955963134766, -1.1522905826568604, 0.20551443099975586, 1.5633196830749512, 2.9211249351501465, 4.278929710388184, 5.636734962463379, 6.994540214538574, 8.35234546661377, 9.710150718688965, 11.067955017089844, 12.425760269165039, 13.783565521240234, 15.14137077331543, 16.499176025390625, 17.85698127746582, 19.214786529541016, 20.57259178161621, 21.930397033691406, 23.2882022857666, 24.646007537841797, 26.00381088256836, 27.361618041992188, 28.71942138671875, 30.077226638793945, 31.43503189086914, 32.7928352355957, 34.15064239501953, 35.508445739746094, 36.86625289916992, 38.224056243896484, 39.58186340332031]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 5.0, 8.0, 10.0, 18.0, 16.0, 28.0, 22.0, 26.0, 33.0, 40.0, 40.0, 45.0, 57.0, 62.0, 61.0, 51.0, 54.0, 46.0, 58.0, 40.0, 44.0, 29.0, 26.0, 36.0, 27.0, 19.0, 14.0, 29.0, 6.0, 5.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.488224029541016, -15.883613586425781, -15.279003143310547, -14.674392700195312, -14.069781303405762, -13.465170860290527, -12.860560417175293, -12.255949020385742, -11.651338577270508, -11.046728134155273, -10.442117691040039, -9.837507247924805, -9.232895851135254, -8.62828540802002, -8.023674964904785, -7.419064044952393, -6.814454078674316, -6.209843635559082, -5.6052327156066895, -5.000622272491455, -4.3960113525390625, -3.791400909423828, -3.1867904663085938, -2.582179546356201, -1.9775691032409668, -1.3729584217071533, -0.7683478593826294, -0.16373729705810547, 0.440873384475708, 1.0454840660095215, 1.6500945091247559, 2.2547054290771484, 2.859315872192383, 3.4639265537261963, 4.06853723526001, 4.673147678375244, 5.277758598327637, 5.882369041442871, 6.4869794845581055, 7.091590404510498, 7.696200847625732, 8.300811767578125, 8.90542221069336, 9.510032653808594, 10.114643096923828, 10.719253540039062, 11.323863983154297, 11.928475379943848, 12.533085823059082, 13.137696266174316, 13.74230670928955, 14.346918106079102, 14.951528549194336, 15.55613899230957, 16.160749435424805, 16.76535987854004, 17.369970321655273, 17.974580764770508, 18.579191207885742, 19.183801651000977, 19.78841209411621, 20.393024444580078, 20.997634887695312, 21.602245330810547, 22.20685577392578]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 10.0, 9.0, 20.0, 26.0, 52.0, 76.0, 110.0, 247.0, 532.0, 1228.0, 3895.0, 15979.0, 103154.0, 620606.0, 257729.0, 34396.0, 6892.0, 2089.0, 737.0, 354.0, 147.0, 101.0, 54.0, 40.0, 21.0, 10.0, 3.0, 12.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.75, -32.80517578125, -31.8603515625, -30.91552734375, -29.970703125, -29.02587890625, -28.0810546875, -27.13623046875, -26.19140625, -25.24658203125, -24.3017578125, -23.35693359375, -22.412109375, -21.46728515625, -20.5224609375, -19.57763671875, -18.6328125, -17.68798828125, -16.7431640625, -15.79833984375, -14.853515625, -13.90869140625, -12.9638671875, -12.01904296875, -11.07421875, -10.12939453125, -9.1845703125, -8.23974609375, -7.294921875, -6.35009765625, -5.4052734375, -4.46044921875, -3.515625, -2.57080078125, -1.6259765625, -0.68115234375, 0.263671875, 1.20849609375, 2.1533203125, 3.09814453125, 4.04296875, 4.98779296875, 5.9326171875, 6.87744140625, 7.822265625, 8.76708984375, 9.7119140625, 10.65673828125, 11.6015625, 12.54638671875, 13.4912109375, 14.43603515625, 15.380859375, 16.32568359375, 17.2705078125, 18.21533203125, 19.16015625, 20.10498046875, 21.0498046875, 21.99462890625, 22.939453125, 23.88427734375, 24.8291015625, 25.77392578125, 26.71875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 12.0, 18.0, 23.0, 22.0, 30.0, 36.0, 46.0, 49.0, 69.0, 86.0, 78.0, 83.0, 84.0, 69.0, 72.0, 49.0, 42.0, 33.0, 23.0, 15.0, 12.0, 9.0, 10.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4609375, -6.1937255859375, -5.926513671875, -5.6593017578125, -5.39208984375, -5.1248779296875, -4.857666015625, -4.5904541015625, -4.3232421875, -4.0560302734375, -3.788818359375, -3.5216064453125, -3.25439453125, -2.9871826171875, -2.719970703125, -2.4527587890625, -2.185546875, -1.9183349609375, -1.651123046875, -1.3839111328125, -1.11669921875, -0.8494873046875, -0.582275390625, -0.3150634765625, -0.0478515625, 0.2193603515625, 0.486572265625, 0.7537841796875, 1.02099609375, 1.2882080078125, 1.555419921875, 1.8226318359375, 2.08984375, 2.3570556640625, 2.624267578125, 2.8914794921875, 3.15869140625, 3.4259033203125, 3.693115234375, 3.9603271484375, 4.2275390625, 4.4947509765625, 4.761962890625, 5.0291748046875, 5.29638671875, 5.5635986328125, 5.830810546875, 6.0980224609375, 6.365234375, 6.6324462890625, 6.899658203125, 7.1668701171875, 7.43408203125, 7.7012939453125, 7.968505859375, 8.2357177734375, 8.5029296875, 8.7701416015625, 9.037353515625, 9.3045654296875, 9.57177734375, 9.8389892578125, 10.106201171875, 10.3734130859375, 10.640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 8.0, 8.0, 12.0, 14.0, 24.0, 25.0, 39.0, 59.0, 88.0, 116.0, 245.0, 441.0, 1190.0, 5618.0, 124900.0, 895564.0, 16590.0, 2186.0, 660.0, 304.0, 160.0, 77.0, 63.0, 25.0, 30.0, 37.0, 17.0, 6.0, 12.0, 7.0, 5.0, 2.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-78.75, -76.228515625, -73.70703125, -71.185546875, -68.6640625, -66.142578125, -63.62109375, -61.099609375, -58.578125, -56.056640625, -53.53515625, -51.013671875, -48.4921875, -45.970703125, -43.44921875, -40.927734375, -38.40625, -35.884765625, -33.36328125, -30.841796875, -28.3203125, -25.798828125, -23.27734375, -20.755859375, -18.234375, -15.712890625, -13.19140625, -10.669921875, -8.1484375, -5.626953125, -3.10546875, -0.583984375, 1.9375, 4.458984375, 6.98046875, 9.501953125, 12.0234375, 14.544921875, 17.06640625, 19.587890625, 22.109375, 24.630859375, 27.15234375, 29.673828125, 32.1953125, 34.716796875, 37.23828125, 39.759765625, 42.28125, 44.802734375, 47.32421875, 49.845703125, 52.3671875, 54.888671875, 57.41015625, 59.931640625, 62.453125, 64.974609375, 67.49609375, 70.017578125, 72.5390625, 75.060546875, 77.58203125, 80.103515625, 82.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 4.0, 8.0, 5.0, 9.0, 24.0, 39.0, 36.0, 47.0, 58.0, 86.0, 74.0, 83.0, 76.0, 82.0, 89.0, 70.0, 60.0, 35.0, 34.0, 22.0, 11.0, 11.0, 2.0, 6.0, 6.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.5625, -41.0576171875, -39.552734375, -38.0478515625, -36.54296875, -35.0380859375, -33.533203125, -32.0283203125, -30.5234375, -29.0185546875, -27.513671875, -26.0087890625, -24.50390625, -22.9990234375, -21.494140625, -19.9892578125, -18.484375, -16.9794921875, -15.474609375, -13.9697265625, -12.46484375, -10.9599609375, -9.455078125, -7.9501953125, -6.4453125, -4.9404296875, -3.435546875, -1.9306640625, -0.42578125, 1.0791015625, 2.583984375, 4.0888671875, 5.59375, 7.0986328125, 8.603515625, 10.1083984375, 11.61328125, 13.1181640625, 14.623046875, 16.1279296875, 17.6328125, 19.1376953125, 20.642578125, 22.1474609375, 23.65234375, 25.1572265625, 26.662109375, 28.1669921875, 29.671875, 31.1767578125, 32.681640625, 34.1865234375, 35.69140625, 37.1962890625, 38.701171875, 40.2060546875, 41.7109375, 43.2158203125, 44.720703125, 46.2255859375, 47.73046875, 49.2353515625, 50.740234375, 52.2451171875, 53.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 7.0, 10.0, 4.0, 6.0, 11.0, 13.0, 20.0, 20.0, 27.0, 32.0, 44.0, 62.0, 72.0, 139.0, 180.0, 304.0, 538.0, 1141.0, 3036.0, 10006.0, 62971.0, 774348.0, 169494.0, 18137.0, 4551.0, 1565.0, 741.0, 355.0, 227.0, 133.0, 102.0, 73.0, 43.0, 25.0, 25.0, 21.0, 10.0, 13.0, 16.0, 14.0, 7.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.7421875, -13.32177734375, -12.9013671875, -12.48095703125, -12.060546875, -11.64013671875, -11.2197265625, -10.79931640625, -10.37890625, -9.95849609375, -9.5380859375, -9.11767578125, -8.697265625, -8.27685546875, -7.8564453125, -7.43603515625, -7.015625, -6.59521484375, -6.1748046875, -5.75439453125, -5.333984375, -4.91357421875, -4.4931640625, -4.07275390625, -3.65234375, -3.23193359375, -2.8115234375, -2.39111328125, -1.970703125, -1.55029296875, -1.1298828125, -0.70947265625, -0.2890625, 0.13134765625, 0.5517578125, 0.97216796875, 1.392578125, 1.81298828125, 2.2333984375, 2.65380859375, 3.07421875, 3.49462890625, 3.9150390625, 4.33544921875, 4.755859375, 5.17626953125, 5.5966796875, 6.01708984375, 6.4375, 6.85791015625, 7.2783203125, 7.69873046875, 8.119140625, 8.53955078125, 8.9599609375, 9.38037109375, 9.80078125, 10.22119140625, 10.6416015625, 11.06201171875, 11.482421875, 11.90283203125, 12.3232421875, 12.74365234375, 13.1640625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 3.0, 6.0, 5.0, 6.0, 10.0, 24.0, 29.0, 30.0, 56.0, 77.0, 128.0, 259.0, 129.0, 79.0, 56.0, 27.0, 23.0, 10.0, 7.0, 12.0, 8.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022411346435546875, -0.0021535754203796387, -0.00206601619720459, -0.001978456974029541, -0.0018908977508544922, -0.0018033385276794434, -0.0017157793045043945, -0.0016282200813293457, -0.0015406608581542969, -0.001453101634979248, -0.0013655424118041992, -0.0012779831886291504, -0.0011904239654541016, -0.0011028647422790527, -0.001015305519104004, -0.0009277462959289551, -0.0008401870727539062, -0.0007526278495788574, -0.0006650686264038086, -0.0005775094032287598, -0.0004899501800537109, -0.0004023909568786621, -0.0003148317337036133, -0.00022727251052856445, -0.00013971328735351562, -5.21540641784668e-05, 3.540515899658203e-05, 0.00012296438217163086, 0.0002105236053466797, 0.0002980828285217285, 0.00038564205169677734, 0.00047320127487182617, 0.000560760498046875, 0.0006483197212219238, 0.0007358789443969727, 0.0008234381675720215, 0.0009109973907470703, 0.0009985566139221191, 0.001086115837097168, 0.0011736750602722168, 0.0012612342834472656, 0.0013487935066223145, 0.0014363527297973633, 0.0015239119529724121, 0.001611471176147461, 0.0016990303993225098, 0.0017865896224975586, 0.0018741488456726074, 0.0019617080688476562, 0.002049267292022705, 0.002136826515197754, 0.0022243857383728027, 0.0023119449615478516, 0.0023995041847229004, 0.0024870634078979492, 0.002574622631072998, 0.002662181854248047, 0.0027497410774230957, 0.0028373003005981445, 0.0029248595237731934, 0.003012418746948242, 0.003099977970123291, 0.00318753719329834, 0.0032750964164733887, 0.0033626556396484375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 13.0, 28.0, 30.0, 43.0, 62.0, 90.0, 183.0, 253.0, 446.0, 1108.0, 3742.0, 25355.0, 704943.0, 293368.0, 14258.0, 2654.0, 893.0, 422.0, 202.0, 141.0, 98.0, 46.0, 39.0, 24.0, 23.0, 22.0, 15.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.806640625, -19.26953125, -18.732421875, -18.1953125, -17.658203125, -17.12109375, -16.583984375, -16.046875, -15.509765625, -14.97265625, -14.435546875, -13.8984375, -13.361328125, -12.82421875, -12.287109375, -11.75, -11.212890625, -10.67578125, -10.138671875, -9.6015625, -9.064453125, -8.52734375, -7.990234375, -7.453125, -6.916015625, -6.37890625, -5.841796875, -5.3046875, -4.767578125, -4.23046875, -3.693359375, -3.15625, -2.619140625, -2.08203125, -1.544921875, -1.0078125, -0.470703125, 0.06640625, 0.603515625, 1.140625, 1.677734375, 2.21484375, 2.751953125, 3.2890625, 3.826171875, 4.36328125, 4.900390625, 5.4375, 5.974609375, 6.51171875, 7.048828125, 7.5859375, 8.123046875, 8.66015625, 9.197265625, 9.734375, 10.271484375, 10.80859375, 11.345703125, 11.8828125, 12.419921875, 12.95703125, 13.494140625, 14.03125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 7.0, 6.0, 10.0, 15.0, 20.0, 33.0, 51.0, 83.0, 95.0, 143.0, 165.0, 108.0, 76.0, 52.0, 54.0, 17.0, 13.0, 12.0, 8.0, 5.0, 2.0, 8.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2734375, -13.7987060546875, -13.323974609375, -12.8492431640625, -12.37451171875, -11.8997802734375, -11.425048828125, -10.9503173828125, -10.4755859375, -10.0008544921875, -9.526123046875, -9.0513916015625, -8.57666015625, -8.1019287109375, -7.627197265625, -7.1524658203125, -6.677734375, -6.2030029296875, -5.728271484375, -5.2535400390625, -4.77880859375, -4.3040771484375, -3.829345703125, -3.3546142578125, -2.8798828125, -2.4051513671875, -1.930419921875, -1.4556884765625, -0.98095703125, -0.5062255859375, -0.031494140625, 0.4432373046875, 0.91796875, 1.3927001953125, 1.867431640625, 2.3421630859375, 2.81689453125, 3.2916259765625, 3.766357421875, 4.2410888671875, 4.7158203125, 5.1905517578125, 5.665283203125, 6.1400146484375, 6.61474609375, 7.0894775390625, 7.564208984375, 8.0389404296875, 8.513671875, 8.9884033203125, 9.463134765625, 9.9378662109375, 10.41259765625, 10.8873291015625, 11.362060546875, 11.8367919921875, 12.3115234375, 12.7862548828125, 13.260986328125, 13.7357177734375, 14.21044921875, 14.6851806640625, 15.159912109375, 15.6346435546875, 16.109375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 10.0, 46.0, 241.0, 384.0, 241.0, 57.0, 12.0, 14.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-919.341064453125, -900.3383178710938, -881.3356323242188, -862.3328857421875, -843.3302001953125, -824.3274536132812, -805.3247680664062, -786.322021484375, -767.3193359375, -748.3165893554688, -729.3139038085938, -710.3111572265625, -691.3084716796875, -672.3057250976562, -653.3030395507812, -634.30029296875, -615.2975463867188, -596.2947998046875, -577.2921142578125, -558.2893676757812, -539.2866821289062, -520.283935546875, -501.2812194824219, -482.27850341796875, -463.2757873535156, -444.2730712890625, -425.2703552246094, -406.26763916015625, -387.264892578125, -368.26220703125, -349.25946044921875, -330.2567443847656, -311.2539978027344, -292.25128173828125, -273.2485656738281, -254.24583435058594, -235.2431182861328, -216.2404022216797, -197.2376708984375, -178.23495483398438, -159.23223876953125, -140.22952270507812, -121.22679901123047, -102.22407531738281, -83.22135925292969, -64.21864318847656, -45.215919494628906, -26.21319580078125, -7.210479736328125, 11.792240142822266, 30.794960021972656, 49.79767990112305, 68.80039978027344, 87.80311584472656, 106.80583953857422, 125.80856323242188, 144.811279296875, 163.81399536132812, 182.81671142578125, 201.81944274902344, 220.82215881347656, 239.8248748779297, 258.8276062011719, 277.830322265625, 296.8330383300781]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 9.0, 9.0, 13.0, 14.0, 9.0, 27.0, 18.0, 29.0, 39.0, 35.0, 50.0, 49.0, 62.0, 58.0, 62.0, 56.0, 53.0, 57.0, 36.0, 40.0, 38.0, 33.0, 36.0, 29.0, 22.0, 23.0, 13.0, 10.0, 11.0, 12.0, 4.0, 11.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.1280517578125, -136.09954833984375, -132.07106018066406, -128.04257202148438, -124.01406860351562, -119.9855728149414, -115.95707702636719, -111.92858123779297, -107.90008544921875, -103.87158966064453, -99.84309387207031, -95.8145980834961, -91.78610229492188, -87.75760650634766, -83.72911071777344, -79.70061492919922, -75.672119140625, -71.64362335205078, -67.61512756347656, -63.586631774902344, -59.558135986328125, -55.529640197753906, -51.50114440917969, -47.47264862060547, -43.44415283203125, -39.41565704345703, -35.38716125488281, -31.358665466308594, -27.330169677734375, -23.301673889160156, -19.273178100585938, -15.244682312011719, -11.216201782226562, -7.187705993652344, -3.159210205078125, 0.8692855834960938, 4.8977813720703125, 8.926277160644531, 12.95477294921875, 16.98326873779297, 21.011764526367188, 25.040260314941406, 29.068756103515625, 33.097251892089844, 37.12574768066406, 41.15424346923828, 45.1827392578125, 49.21123504638672, 53.23973083496094, 57.268226623535156, 61.296722412109375, 65.3252182006836, 69.35371398925781, 73.38220977783203, 77.41070556640625, 81.43920135498047, 85.46769714355469, 89.4961929321289, 93.52468872070312, 97.55318450927734, 101.58168029785156, 105.61017608642578, 109.638671875, 113.66716766357422, 117.69566345214844]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 4.0, 4.0, 7.0, 12.0, 18.0, 22.0, 39.0, 70.0, 113.0, 259.0, 469.0, 1166.0, 2684.0, 7762.0, 32221.0, 647965.0, 3417028.0, 65764.0, 12251.0, 3789.0, 1427.0, 615.0, 276.0, 136.0, 77.0, 33.0, 26.0, 13.0, 9.0, 11.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-27.421875, -26.755859375, -26.08984375, -25.423828125, -24.7578125, -24.091796875, -23.42578125, -22.759765625, -22.09375, -21.427734375, -20.76171875, -20.095703125, -19.4296875, -18.763671875, -18.09765625, -17.431640625, -16.765625, -16.099609375, -15.43359375, -14.767578125, -14.1015625, -13.435546875, -12.76953125, -12.103515625, -11.4375, -10.771484375, -10.10546875, -9.439453125, -8.7734375, -8.107421875, -7.44140625, -6.775390625, -6.109375, -5.443359375, -4.77734375, -4.111328125, -3.4453125, -2.779296875, -2.11328125, -1.447265625, -0.78125, -0.115234375, 0.55078125, 1.216796875, 1.8828125, 2.548828125, 3.21484375, 3.880859375, 4.546875, 5.212890625, 5.87890625, 6.544921875, 7.2109375, 7.876953125, 8.54296875, 9.208984375, 9.875, 10.541015625, 11.20703125, 11.873046875, 12.5390625, 13.205078125, 13.87109375, 14.537109375, 15.203125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 8.0, 16.0, 16.0, 31.0, 49.0, 57.0, 87.0, 92.0, 101.0, 133.0, 100.0, 87.0, 82.0, 47.0, 31.0, 17.0, 16.0, 4.0, 11.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.98486328125, -9.6416015625, -9.29833984375, -8.955078125, -8.61181640625, -8.2685546875, -7.92529296875, -7.58203125, -7.23876953125, -6.8955078125, -6.55224609375, -6.208984375, -5.86572265625, -5.5224609375, -5.17919921875, -4.8359375, -4.49267578125, -4.1494140625, -3.80615234375, -3.462890625, -3.11962890625, -2.7763671875, -2.43310546875, -2.08984375, -1.74658203125, -1.4033203125, -1.06005859375, -0.716796875, -0.37353515625, -0.0302734375, 0.31298828125, 0.65625, 0.99951171875, 1.3427734375, 1.68603515625, 2.029296875, 2.37255859375, 2.7158203125, 3.05908203125, 3.40234375, 3.74560546875, 4.0888671875, 4.43212890625, 4.775390625, 5.11865234375, 5.4619140625, 5.80517578125, 6.1484375, 6.49169921875, 6.8349609375, 7.17822265625, 7.521484375, 7.86474609375, 8.2080078125, 8.55126953125, 8.89453125, 9.23779296875, 9.5810546875, 9.92431640625, 10.267578125, 10.61083984375, 10.9541015625, 11.29736328125, 11.640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 11.0, 13.0, 15.0, 41.0, 79.0, 107.0, 196.0, 401.0, 918.0, 2791.0, 11505.0, 84784.0, 3812708.0, 253258.0, 21226.0, 4150.0, 1226.0, 421.0, 182.0, 94.0, 56.0, 24.0, 25.0, 10.0, 3.0, 4.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.52685546875, -17.7099609375, -16.89306640625, -16.076171875, -15.25927734375, -14.4423828125, -13.62548828125, -12.80859375, -11.99169921875, -11.1748046875, -10.35791015625, -9.541015625, -8.72412109375, -7.9072265625, -7.09033203125, -6.2734375, -5.45654296875, -4.6396484375, -3.82275390625, -3.005859375, -2.18896484375, -1.3720703125, -0.55517578125, 0.26171875, 1.07861328125, 1.8955078125, 2.71240234375, 3.529296875, 4.34619140625, 5.1630859375, 5.97998046875, 6.796875, 7.61376953125, 8.4306640625, 9.24755859375, 10.064453125, 10.88134765625, 11.6982421875, 12.51513671875, 13.33203125, 14.14892578125, 14.9658203125, 15.78271484375, 16.599609375, 17.41650390625, 18.2333984375, 19.05029296875, 19.8671875, 20.68408203125, 21.5009765625, 22.31787109375, 23.134765625, 23.95166015625, 24.7685546875, 25.58544921875, 26.40234375, 27.21923828125, 28.0361328125, 28.85302734375, 29.669921875, 30.48681640625, 31.3037109375, 32.12060546875, 32.9375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 19.0, 19.0, 23.0, 21.0, 45.0, 76.0, 109.0, 317.0, 1069.0, 1508.0, 479.0, 162.0, 69.0, 57.0, 27.0, 21.0, 19.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.5350341796875, -28.835693359375, -28.1363525390625, -27.43701171875, -26.7376708984375, -26.038330078125, -25.3389892578125, -24.6396484375, -23.9403076171875, -23.240966796875, -22.5416259765625, -21.84228515625, -21.1429443359375, -20.443603515625, -19.7442626953125, -19.044921875, -18.3455810546875, -17.646240234375, -16.9468994140625, -16.24755859375, -15.5482177734375, -14.848876953125, -14.1495361328125, -13.4501953125, -12.7508544921875, -12.051513671875, -11.3521728515625, -10.65283203125, -9.9534912109375, -9.254150390625, -8.5548095703125, -7.85546875, -7.1561279296875, -6.456787109375, -5.7574462890625, -5.05810546875, -4.3587646484375, -3.659423828125, -2.9600830078125, -2.2607421875, -1.5614013671875, -0.862060546875, -0.1627197265625, 0.53662109375, 1.2359619140625, 1.935302734375, 2.6346435546875, 3.333984375, 4.0333251953125, 4.732666015625, 5.4320068359375, 6.13134765625, 6.8306884765625, 7.530029296875, 8.2293701171875, 8.9287109375, 9.6280517578125, 10.327392578125, 11.0267333984375, 11.72607421875, 12.4254150390625, 13.124755859375, 13.8240966796875, 14.5234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 11.0, 11.0, 15.0, 20.0, 52.0, 99.0, 144.0, 171.0, 175.0, 137.0, 69.0, 45.0, 16.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.33547973632812, -142.62643432617188, -137.9174041748047, -133.20835876464844, -128.49932861328125, -123.790283203125, -119.08123779296875, -114.37220001220703, -109.66316223144531, -104.9541244506836, -100.24508666992188, -95.53604125976562, -90.8270034790039, -86.11796569824219, -81.40892028808594, -76.69988250732422, -71.9908447265625, -67.28180694580078, -62.5727653503418, -57.86372375488281, -53.154685974121094, -48.445648193359375, -43.73660659790039, -39.027565002441406, -34.31852722167969, -29.609487533569336, -24.900447845458984, -20.191408157348633, -15.482368469238281, -10.77332878112793, -6.064289093017578, -1.3552474975585938, 3.353790283203125, 8.062829971313477, 12.771869659423828, 17.48090934753418, 22.18994903564453, 26.898988723754883, 31.608028411865234, 36.31707000732422, 41.02610778808594, 45.735145568847656, 50.44418716430664, 55.153228759765625, 59.862266540527344, 64.57130432128906, 69.28034973144531, 73.98938751220703, 78.69842529296875, 83.40746307373047, 88.11650085449219, 92.82554626464844, 97.53458404541016, 102.24362182617188, 106.95266723632812, 111.66170501708984, 116.37074279785156, 121.07978057861328, 125.788818359375, 130.49786376953125, 135.2069091796875, 139.9159393310547, 144.62498474121094, 149.33401489257812, 154.04306030273438]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 9.0, 11.0, 16.0, 12.0, 22.0, 22.0, 23.0, 31.0, 43.0, 43.0, 41.0, 45.0, 54.0, 49.0, 57.0, 62.0, 49.0, 59.0, 57.0, 43.0, 40.0, 41.0, 41.0, 28.0, 22.0, 25.0, 22.0, 7.0, 8.0, 9.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.73100280761719, -65.34998321533203, -62.96896743774414, -60.587947845458984, -58.206932067871094, -55.82591247558594, -53.44489288330078, -51.063873291015625, -48.682857513427734, -46.30183792114258, -43.92082214355469, -41.53980255126953, -39.158782958984375, -36.777767181396484, -34.39674758911133, -32.01573181152344, -29.63471221923828, -27.253694534301758, -24.872676849365234, -22.491657257080078, -20.110639572143555, -17.72962188720703, -15.348603248596191, -12.967584609985352, -10.586566925048828, -8.205549240112305, -5.824530601501465, -3.443512439727783, -1.0624942779541016, 1.3185234069824219, 3.6995420455932617, 6.080560684204102, 8.461585998535156, 10.84260368347168, 13.22362232208252, 15.60464096069336, 17.985658645629883, 20.366676330566406, 22.747695922851562, 25.128713607788086, 27.50973129272461, 29.890748977661133, 32.271766662597656, 34.65278625488281, 37.03380584716797, 39.41482162475586, 41.795841217041016, 44.176856994628906, 46.55787658691406, 48.93889617919922, 51.31991195678711, 53.700931549072266, 56.081947326660156, 58.46296691894531, 60.84398651123047, 63.225006103515625, 65.60601806640625, 67.9870376586914, 70.36805725097656, 72.74906921386719, 75.13008880615234, 77.5111083984375, 79.89212799072266, 82.27314758300781, 84.65416717529297]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 9.0, 5.0, 12.0, 12.0, 19.0, 19.0, 30.0, 49.0, 71.0, 116.0, 181.0, 294.0, 474.0, 868.0, 1636.0, 3736.0, 9049.0, 26684.0, 93580.0, 403866.0, 378594.0, 87790.0, 25208.0, 8894.0, 3631.0, 1634.0, 823.0, 453.0, 285.0, 179.0, 97.0, 76.0, 50.0, 39.0, 25.0, 16.0, 11.0, 8.0, 6.0, 7.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.546875, -15.975830078125, -15.40478515625, -14.833740234375, -14.2626953125, -13.691650390625, -13.12060546875, -12.549560546875, -11.978515625, -11.407470703125, -10.83642578125, -10.265380859375, -9.6943359375, -9.123291015625, -8.55224609375, -7.981201171875, -7.41015625, -6.839111328125, -6.26806640625, -5.697021484375, -5.1259765625, -4.554931640625, -3.98388671875, -3.412841796875, -2.841796875, -2.270751953125, -1.69970703125, -1.128662109375, -0.5576171875, 0.013427734375, 0.58447265625, 1.155517578125, 1.7265625, 2.297607421875, 2.86865234375, 3.439697265625, 4.0107421875, 4.581787109375, 5.15283203125, 5.723876953125, 6.294921875, 6.865966796875, 7.43701171875, 8.008056640625, 8.5791015625, 9.150146484375, 9.72119140625, 10.292236328125, 10.86328125, 11.434326171875, 12.00537109375, 12.576416015625, 13.1474609375, 13.718505859375, 14.28955078125, 14.860595703125, 15.431640625, 16.002685546875, 16.57373046875, 17.144775390625, 17.7158203125, 18.286865234375, 18.85791015625, 19.428955078125, 20.0]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 11.0, 17.0, 16.0, 34.0, 38.0, 45.0, 81.0, 98.0, 121.0, 112.0, 103.0, 96.0, 82.0, 43.0, 38.0, 22.0, 15.0, 12.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2139892578125, -9.865478515625, -9.5169677734375, -9.16845703125, -8.8199462890625, -8.471435546875, -8.1229248046875, -7.7744140625, -7.4259033203125, -7.077392578125, -6.7288818359375, -6.38037109375, -6.0318603515625, -5.683349609375, -5.3348388671875, -4.986328125, -4.6378173828125, -4.289306640625, -3.9407958984375, -3.59228515625, -3.2437744140625, -2.895263671875, -2.5467529296875, -2.1982421875, -1.8497314453125, -1.501220703125, -1.1527099609375, -0.80419921875, -0.4556884765625, -0.107177734375, 0.2413330078125, 0.58984375, 0.9383544921875, 1.286865234375, 1.6353759765625, 1.98388671875, 2.3323974609375, 2.680908203125, 3.0294189453125, 3.3779296875, 3.7264404296875, 4.074951171875, 4.4234619140625, 4.77197265625, 5.1204833984375, 5.468994140625, 5.8175048828125, 6.166015625, 6.5145263671875, 6.863037109375, 7.2115478515625, 7.56005859375, 7.9085693359375, 8.257080078125, 8.6055908203125, 8.9541015625, 9.3026123046875, 9.651123046875, 9.9996337890625, 10.34814453125, 10.6966552734375, 11.045166015625, 11.3936767578125, 11.7421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 11.0, 18.0, 13.0, 19.0, 17.0, 32.0, 48.0, 90.0, 165.0, 263.0, 653.0, 1548.0, 6102.0, 110274.0, 906452.0, 18141.0, 2905.0, 875.0, 388.0, 195.0, 114.0, 70.0, 35.0, 30.0, 21.0, 17.0, 8.0, 8.0, 4.0, 6.0, 3.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-71.75, -69.525390625, -67.30078125, -65.076171875, -62.8515625, -60.626953125, -58.40234375, -56.177734375, -53.953125, -51.728515625, -49.50390625, -47.279296875, -45.0546875, -42.830078125, -40.60546875, -38.380859375, -36.15625, -33.931640625, -31.70703125, -29.482421875, -27.2578125, -25.033203125, -22.80859375, -20.583984375, -18.359375, -16.134765625, -13.91015625, -11.685546875, -9.4609375, -7.236328125, -5.01171875, -2.787109375, -0.5625, 1.662109375, 3.88671875, 6.111328125, 8.3359375, 10.560546875, 12.78515625, 15.009765625, 17.234375, 19.458984375, 21.68359375, 23.908203125, 26.1328125, 28.357421875, 30.58203125, 32.806640625, 35.03125, 37.255859375, 39.48046875, 41.705078125, 43.9296875, 46.154296875, 48.37890625, 50.603515625, 52.828125, 55.052734375, 57.27734375, 59.501953125, 61.7265625, 63.951171875, 66.17578125, 68.400390625, 70.625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 4.0, 3.0, 10.0, 16.0, 22.0, 36.0, 39.0, 77.0, 93.0, 92.0, 90.0, 109.0, 90.0, 93.0, 68.0, 40.0, 33.0, 26.0, 13.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.875, -46.22705078125, -44.5791015625, -42.93115234375, -41.283203125, -39.63525390625, -37.9873046875, -36.33935546875, -34.69140625, -33.04345703125, -31.3955078125, -29.74755859375, -28.099609375, -26.45166015625, -24.8037109375, -23.15576171875, -21.5078125, -19.85986328125, -18.2119140625, -16.56396484375, -14.916015625, -13.26806640625, -11.6201171875, -9.97216796875, -8.32421875, -6.67626953125, -5.0283203125, -3.38037109375, -1.732421875, -0.08447265625, 1.5634765625, 3.21142578125, 4.859375, 6.50732421875, 8.1552734375, 9.80322265625, 11.451171875, 13.09912109375, 14.7470703125, 16.39501953125, 18.04296875, 19.69091796875, 21.3388671875, 22.98681640625, 24.634765625, 26.28271484375, 27.9306640625, 29.57861328125, 31.2265625, 32.87451171875, 34.5224609375, 36.17041015625, 37.818359375, 39.46630859375, 41.1142578125, 42.76220703125, 44.41015625, 46.05810546875, 47.7060546875, 49.35400390625, 51.001953125, 52.64990234375, 54.2978515625, 55.94580078125, 57.59375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 4.0, 12.0, 11.0, 18.0, 28.0, 50.0, 68.0, 116.0, 254.0, 686.0, 2633.0, 34236.0, 997191.0, 10573.0, 1683.0, 480.0, 169.0, 113.0, 51.0, 44.0, 28.0, 17.0, 19.0, 7.0, 2.0, 11.0, 5.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84375, -31.7958984375, -30.748046875, -29.7001953125, -28.65234375, -27.6044921875, -26.556640625, -25.5087890625, -24.4609375, -23.4130859375, -22.365234375, -21.3173828125, -20.26953125, -19.2216796875, -18.173828125, -17.1259765625, -16.078125, -15.0302734375, -13.982421875, -12.9345703125, -11.88671875, -10.8388671875, -9.791015625, -8.7431640625, -7.6953125, -6.6474609375, -5.599609375, -4.5517578125, -3.50390625, -2.4560546875, -1.408203125, -0.3603515625, 0.6875, 1.7353515625, 2.783203125, 3.8310546875, 4.87890625, 5.9267578125, 6.974609375, 8.0224609375, 9.0703125, 10.1181640625, 11.166015625, 12.2138671875, 13.26171875, 14.3095703125, 15.357421875, 16.4052734375, 17.453125, 18.5009765625, 19.548828125, 20.5966796875, 21.64453125, 22.6923828125, 23.740234375, 24.7880859375, 25.8359375, 26.8837890625, 27.931640625, 28.9794921875, 30.02734375, 31.0751953125, 32.123046875, 33.1708984375, 34.21875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 11.0, 14.0, 45.0, 112.0, 317.0, 313.0, 99.0, 35.0, 22.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004207611083984375, -0.004057466983795166, -0.003907322883605957, -0.003757178783416748, -0.003607034683227539, -0.00345689058303833, -0.003306746482849121, -0.003156602382659912, -0.003006458282470703, -0.002856314182281494, -0.002706170082092285, -0.002556025981903076, -0.002405881881713867, -0.002255737781524658, -0.0021055936813354492, -0.0019554495811462402, -0.0018053054809570312, -0.0016551613807678223, -0.0015050172805786133, -0.0013548731803894043, -0.0012047290802001953, -0.0010545849800109863, -0.0009044408798217773, -0.0007542967796325684, -0.0006041526794433594, -0.0004540085792541504, -0.0003038644790649414, -0.00015372037887573242, -3.5762786865234375e-06, 0.00014656782150268555, 0.00029671192169189453, 0.0004468560218811035, 0.0005970001220703125, 0.0007471442222595215, 0.0008972883224487305, 0.0010474324226379395, 0.0011975765228271484, 0.0013477206230163574, 0.0014978647232055664, 0.0016480088233947754, 0.0017981529235839844, 0.0019482970237731934, 0.0020984411239624023, 0.0022485852241516113, 0.0023987293243408203, 0.0025488734245300293, 0.0026990175247192383, 0.0028491616249084473, 0.0029993057250976562, 0.0031494498252868652, 0.0032995939254760742, 0.003449738025665283, 0.003599882125854492, 0.003750026226043701, 0.00390017032623291, 0.004050314426422119, 0.004200458526611328, 0.004350602626800537, 0.004500746726989746, 0.004650890827178955, 0.004801034927368164, 0.004951179027557373, 0.005101323127746582, 0.005251467227935791, 0.005401611328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 16.0, 18.0, 16.0, 21.0, 31.0, 43.0, 79.0, 127.0, 274.0, 668.0, 2277.0, 12299.0, 937215.0, 88487.0, 4761.0, 1224.0, 451.0, 204.0, 101.0, 67.0, 42.0, 30.0, 16.0, 9.0, 12.0, 11.0, 5.0, 7.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.609375, -23.809326171875, -23.00927734375, -22.209228515625, -21.4091796875, -20.609130859375, -19.80908203125, -19.009033203125, -18.208984375, -17.408935546875, -16.60888671875, -15.808837890625, -15.0087890625, -14.208740234375, -13.40869140625, -12.608642578125, -11.80859375, -11.008544921875, -10.20849609375, -9.408447265625, -8.6083984375, -7.808349609375, -7.00830078125, -6.208251953125, -5.408203125, -4.608154296875, -3.80810546875, -3.008056640625, -2.2080078125, -1.407958984375, -0.60791015625, 0.192138671875, 0.9921875, 1.792236328125, 2.59228515625, 3.392333984375, 4.1923828125, 4.992431640625, 5.79248046875, 6.592529296875, 7.392578125, 8.192626953125, 8.99267578125, 9.792724609375, 10.5927734375, 11.392822265625, 12.19287109375, 12.992919921875, 13.79296875, 14.593017578125, 15.39306640625, 16.193115234375, 16.9931640625, 17.793212890625, 18.59326171875, 19.393310546875, 20.193359375, 20.993408203125, 21.79345703125, 22.593505859375, 23.3935546875, 24.193603515625, 24.99365234375, 25.793701171875, 26.59375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 14.0, 35.0, 51.0, 109.0, 182.0, 236.0, 156.0, 82.0, 54.0, 25.0, 5.0, 8.0, 5.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.734375, -16.142822265625, -15.55126953125, -14.959716796875, -14.3681640625, -13.776611328125, -13.18505859375, -12.593505859375, -12.001953125, -11.410400390625, -10.81884765625, -10.227294921875, -9.6357421875, -9.044189453125, -8.45263671875, -7.861083984375, -7.26953125, -6.677978515625, -6.08642578125, -5.494873046875, -4.9033203125, -4.311767578125, -3.72021484375, -3.128662109375, -2.537109375, -1.945556640625, -1.35400390625, -0.762451171875, -0.1708984375, 0.420654296875, 1.01220703125, 1.603759765625, 2.1953125, 2.786865234375, 3.37841796875, 3.969970703125, 4.5615234375, 5.153076171875, 5.74462890625, 6.336181640625, 6.927734375, 7.519287109375, 8.11083984375, 8.702392578125, 9.2939453125, 9.885498046875, 10.47705078125, 11.068603515625, 11.66015625, 12.251708984375, 12.84326171875, 13.434814453125, 14.0263671875, 14.617919921875, 15.20947265625, 15.801025390625, 16.392578125, 16.984130859375, 17.57568359375, 18.167236328125, 18.7587890625, 19.350341796875, 19.94189453125, 20.533447265625, 21.125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 19.0, 34.0, 194.0, 465.0, 240.0, 39.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-807.2546997070312, -790.6134033203125, -773.9721069335938, -757.330810546875, -740.6895141601562, -724.0482177734375, -707.4069213867188, -690.765625, -674.124267578125, -657.4829711914062, -640.8416748046875, -624.2003784179688, -607.55908203125, -590.9177856445312, -574.2764892578125, -557.6351318359375, -540.993896484375, -524.3526000976562, -507.7113037109375, -491.07000732421875, -474.4287109375, -457.78741455078125, -441.1460876464844, -424.5047912597656, -407.8634948730469, -391.2221984863281, -374.5809020996094, -357.9396057128906, -341.29827880859375, -324.656982421875, -308.01568603515625, -291.3743896484375, -274.733154296875, -258.09185791015625, -241.4505615234375, -224.8092498779297, -208.16795349121094, -191.5266571044922, -174.88534545898438, -158.24404907226562, -141.60275268554688, -124.96145629882812, -108.32015228271484, -91.67884826660156, -75.03755187988281, -58.39625549316406, -41.75495147705078, -25.1136474609375, -8.47235107421875, 8.168949127197266, 24.81024932861328, 41.4515495300293, 58.09284973144531, 74.73414611816406, 91.37545013427734, 108.01675415039062, 124.65805053710938, 141.29934692382812, 157.94064331054688, 174.5819549560547, 191.22325134277344, 207.8645477294922, 224.505859375, 241.14715576171875, 257.7884521484375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 13.0, 16.0, 16.0, 27.0, 24.0, 31.0, 39.0, 38.0, 47.0, 73.0, 73.0, 74.0, 70.0, 80.0, 75.0, 49.0, 47.0, 35.0, 36.0, 35.0, 30.0, 25.0, 15.0, 5.0, 11.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-146.8711700439453, -142.57101440429688, -138.27084350585938, -133.97068786621094, -129.6705322265625, -125.370361328125, -121.07020568847656, -116.7700424194336, -112.46987915039062, -108.16971588134766, -103.86955261230469, -99.56939697265625, -95.26923370361328, -90.96907043457031, -86.66891479492188, -82.3687515258789, -78.06858825683594, -73.76842498779297, -69.46826171875, -65.16810607910156, -60.867942810058594, -56.567779541015625, -52.26762008666992, -47.96746063232422, -43.66729736328125, -39.36713409423828, -35.06697463989258, -30.766813278198242, -26.466651916503906, -22.16649055480957, -17.866329193115234, -13.566167831420898, -9.266021728515625, -4.965860366821289, -0.6656990051269531, 3.634462356567383, 7.934623718261719, 12.234785079956055, 16.53494644165039, 20.835107803344727, 25.135269165039062, 29.4354305267334, 33.735591888427734, 38.03575134277344, 42.335914611816406, 46.636077880859375, 50.93623733520508, 55.23639678955078, 59.53656005859375, 63.83672332763672, 68.13688659667969, 72.43704223632812, 76.7372055053711, 81.03736877441406, 85.3375244140625, 89.63768768310547, 93.93785095214844, 98.2380142211914, 102.53817749023438, 106.83833312988281, 111.13849639892578, 115.43865966796875, 119.73881530761719, 124.03897857666016, 128.33914184570312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 9.0, 38.0, 64.0, 130.0, 419.0, 1794.0, 12020.0, 930025.0, 3228996.0, 17687.0, 2252.0, 526.0, 166.0, 66.0, 29.0, 16.0, 4.0, 10.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.328125, -19.363525390625, -18.39892578125, -17.434326171875, -16.4697265625, -15.505126953125, -14.54052734375, -13.575927734375, -12.611328125, -11.646728515625, -10.68212890625, -9.717529296875, -8.7529296875, -7.788330078125, -6.82373046875, -5.859130859375, -4.89453125, -3.929931640625, -2.96533203125, -2.000732421875, -1.0361328125, -0.071533203125, 0.89306640625, 1.857666015625, 2.822265625, 3.786865234375, 4.75146484375, 5.716064453125, 6.6806640625, 7.645263671875, 8.60986328125, 9.574462890625, 10.5390625, 11.503662109375, 12.46826171875, 13.432861328125, 14.3974609375, 15.362060546875, 16.32666015625, 17.291259765625, 18.255859375, 19.220458984375, 20.18505859375, 21.149658203125, 22.1142578125, 23.078857421875, 24.04345703125, 25.008056640625, 25.97265625, 26.937255859375, 27.90185546875, 28.866455078125, 29.8310546875, 30.795654296875, 31.76025390625, 32.724853515625, 33.689453125, 34.654052734375, 35.61865234375, 36.583251953125, 37.5478515625, 38.512451171875, 39.47705078125, 40.441650390625, 41.40625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 11.0, 14.0, 21.0, 24.0, 24.0, 38.0, 40.0, 61.0, 57.0, 65.0, 74.0, 68.0, 88.0, 76.0, 66.0, 60.0, 51.0, 39.0, 30.0, 35.0, 11.0, 12.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.49066162109375, -4.2508544921875, -4.01104736328125, -3.771240234375, -3.53143310546875, -3.2916259765625, -3.05181884765625, -2.81201171875, -2.57220458984375, -2.3323974609375, -2.09259033203125, -1.852783203125, -1.61297607421875, -1.3731689453125, -1.13336181640625, -0.8935546875, -0.65374755859375, -0.4139404296875, -0.17413330078125, 0.065673828125, 0.30548095703125, 0.5452880859375, 0.78509521484375, 1.02490234375, 1.26470947265625, 1.5045166015625, 1.74432373046875, 1.984130859375, 2.22393798828125, 2.4637451171875, 2.70355224609375, 2.943359375, 3.18316650390625, 3.4229736328125, 3.66278076171875, 3.902587890625, 4.14239501953125, 4.3822021484375, 4.62200927734375, 4.86181640625, 5.10162353515625, 5.3414306640625, 5.58123779296875, 5.821044921875, 6.06085205078125, 6.3006591796875, 6.54046630859375, 6.7802734375, 7.02008056640625, 7.2598876953125, 7.49969482421875, 7.739501953125, 7.97930908203125, 8.2191162109375, 8.45892333984375, 8.69873046875, 8.93853759765625, 9.1783447265625, 9.41815185546875, 9.657958984375, 9.89776611328125, 10.1375732421875, 10.37738037109375, 10.6171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 11.0, 28.0, 44.0, 78.0, 115.0, 213.0, 464.0, 901.0, 2109.0, 5627.0, 19596.0, 105030.0, 3259506.0, 733368.0, 49406.0, 11544.0, 3617.0, 1351.0, 604.0, 305.0, 152.0, 81.0, 52.0, 23.0, 17.0, 6.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2890625, -12.7532958984375, -12.217529296875, -11.6817626953125, -11.14599609375, -10.6102294921875, -10.074462890625, -9.5386962890625, -9.0029296875, -8.4671630859375, -7.931396484375, -7.3956298828125, -6.85986328125, -6.3240966796875, -5.788330078125, -5.2525634765625, -4.716796875, -4.1810302734375, -3.645263671875, -3.1094970703125, -2.57373046875, -2.0379638671875, -1.502197265625, -0.9664306640625, -0.4306640625, 0.1051025390625, 0.640869140625, 1.1766357421875, 1.71240234375, 2.2481689453125, 2.783935546875, 3.3197021484375, 3.85546875, 4.3912353515625, 4.927001953125, 5.4627685546875, 5.99853515625, 6.5343017578125, 7.070068359375, 7.6058349609375, 8.1416015625, 8.6773681640625, 9.213134765625, 9.7489013671875, 10.28466796875, 10.8204345703125, 11.356201171875, 11.8919677734375, 12.427734375, 12.9635009765625, 13.499267578125, 14.0350341796875, 14.57080078125, 15.1065673828125, 15.642333984375, 16.1781005859375, 16.7138671875, 17.2496337890625, 17.785400390625, 18.3211669921875, 18.85693359375, 19.3927001953125, 19.928466796875, 20.4642333984375, 21.0]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 18.0, 17.0, 19.0, 33.0, 60.0, 58.0, 149.0, 268.0, 674.0, 1257.0, 771.0, 340.0, 142.0, 83.0, 58.0, 32.0, 31.0, 15.0, 12.0, 6.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.625, -18.1295166015625, -17.634033203125, -17.1385498046875, -16.64306640625, -16.1475830078125, -15.652099609375, -15.1566162109375, -14.6611328125, -14.1656494140625, -13.670166015625, -13.1746826171875, -12.67919921875, -12.1837158203125, -11.688232421875, -11.1927490234375, -10.697265625, -10.2017822265625, -9.706298828125, -9.2108154296875, -8.71533203125, -8.2198486328125, -7.724365234375, -7.2288818359375, -6.7333984375, -6.2379150390625, -5.742431640625, -5.2469482421875, -4.75146484375, -4.2559814453125, -3.760498046875, -3.2650146484375, -2.76953125, -2.2740478515625, -1.778564453125, -1.2830810546875, -0.78759765625, -0.2921142578125, 0.203369140625, 0.6988525390625, 1.1943359375, 1.6898193359375, 2.185302734375, 2.6807861328125, 3.17626953125, 3.6717529296875, 4.167236328125, 4.6627197265625, 5.158203125, 5.6536865234375, 6.149169921875, 6.6446533203125, 7.14013671875, 7.6356201171875, 8.131103515625, 8.6265869140625, 9.1220703125, 9.6175537109375, 10.113037109375, 10.6085205078125, 11.10400390625, 11.5994873046875, 12.094970703125, 12.5904541015625, 13.0859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 14.0, 37.0, 151.0, 390.0, 284.0, 80.0, 20.0, 8.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-347.1724853515625, -339.01263427734375, -330.852783203125, -322.6929626464844, -314.5331115722656, -306.3732604980469, -298.2134094238281, -290.0535888671875, -281.89373779296875, -273.73388671875, -265.57403564453125, -257.4142150878906, -249.25436401367188, -241.09451293945312, -232.93466186523438, -224.7748260498047, -216.61497497558594, -208.4551239013672, -200.2952880859375, -192.13543701171875, -183.97560119628906, -175.8157501220703, -167.65591430664062, -159.49606323242188, -151.33621215820312, -143.17636108398438, -135.0165252685547, -126.85667419433594, -118.69683837890625, -110.5369873046875, -102.37714385986328, -94.21730041503906, -86.05746459960938, -77.89762115478516, -69.73777770996094, -61.57793045043945, -53.418087005615234, -45.258243560791016, -37.09839630126953, -28.938552856445312, -20.778709411621094, -12.618865013122559, -4.459020614624023, 3.700824737548828, 11.860668182373047, 20.020511627197266, 28.18035888671875, 36.34020233154297, 44.50004577636719, 52.659889221191406, 60.819732666015625, 68.97958374023438, 77.13941955566406, 85.29927062988281, 93.45911407470703, 101.61895751953125, 109.77880096435547, 117.93864440917969, 126.0984878540039, 134.25833129882812, 142.41818237304688, 150.57801818847656, 158.7378692626953, 166.897705078125, 175.05755615234375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 19.0, 10.0, 15.0, 16.0, 21.0, 35.0, 38.0, 29.0, 38.0, 63.0, 51.0, 48.0, 61.0, 62.0, 52.0, 63.0, 64.0, 48.0, 44.0, 45.0, 35.0, 35.0, 19.0, 18.0, 11.0, 13.0, 8.0, 5.0, 4.0, 8.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.07528305053711, -54.089576721191406, -52.10386657714844, -50.11815643310547, -48.132450103759766, -46.14674377441406, -44.161033630371094, -42.175323486328125, -40.18961715698242, -38.20391082763672, -36.21820068359375, -34.23249053955078, -32.24678421020508, -30.261075973510742, -28.275367736816406, -26.28965950012207, -24.303951263427734, -22.3182430267334, -20.332534790039062, -18.346826553344727, -16.36111831665039, -14.375410079956055, -12.389701843261719, -10.403993606567383, -8.418285369873047, -6.432577133178711, -4.446868896484375, -2.461160659790039, -0.4754524230957031, 1.5102558135986328, 3.4959640502929688, 5.481672286987305, 7.467376708984375, 9.453084945678711, 11.438793182373047, 13.424501419067383, 15.410209655761719, 17.395917892456055, 19.38162612915039, 21.367334365844727, 23.353042602539062, 25.3387508392334, 27.324459075927734, 29.31016731262207, 31.295875549316406, 33.281585693359375, 35.26729202270508, 37.25299835205078, 39.23870849609375, 41.22441864013672, 43.21012496948242, 45.195831298828125, 47.181541442871094, 49.16725158691406, 51.152957916259766, 53.13866424560547, 55.12437438964844, 57.110084533691406, 59.09579086303711, 61.08149719238281, 63.06720733642578, 65.05291748046875, 67.03861999511719, 69.02433013916016, 71.01004028320312]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 13.0, 9.0, 17.0, 19.0, 30.0, 68.0, 89.0, 148.0, 238.0, 412.0, 799.0, 1843.0, 3891.0, 9525.0, 26699.0, 83307.0, 303480.0, 430414.0, 126674.0, 38068.0, 13058.0, 5158.0, 2233.0, 1083.0, 535.0, 266.0, 183.0, 102.0, 62.0, 32.0, 23.0, 20.0, 19.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5703125, -14.102783203125, -13.63525390625, -13.167724609375, -12.7001953125, -12.232666015625, -11.76513671875, -11.297607421875, -10.830078125, -10.362548828125, -9.89501953125, -9.427490234375, -8.9599609375, -8.492431640625, -8.02490234375, -7.557373046875, -7.08984375, -6.622314453125, -6.15478515625, -5.687255859375, -5.2197265625, -4.752197265625, -4.28466796875, -3.817138671875, -3.349609375, -2.882080078125, -2.41455078125, -1.947021484375, -1.4794921875, -1.011962890625, -0.54443359375, -0.076904296875, 0.390625, 0.858154296875, 1.32568359375, 1.793212890625, 2.2607421875, 2.728271484375, 3.19580078125, 3.663330078125, 4.130859375, 4.598388671875, 5.06591796875, 5.533447265625, 6.0009765625, 6.468505859375, 6.93603515625, 7.403564453125, 7.87109375, 8.338623046875, 8.80615234375, 9.273681640625, 9.7412109375, 10.208740234375, 10.67626953125, 11.143798828125, 11.611328125, 12.078857421875, 12.54638671875, 13.013916015625, 13.4814453125, 13.948974609375, 14.41650390625, 14.884033203125, 15.3515625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 14.0, 9.0, 15.0, 20.0, 21.0, 18.0, 22.0, 27.0, 29.0, 36.0, 39.0, 34.0, 37.0, 53.0, 54.0, 49.0, 43.0, 35.0, 51.0, 50.0, 44.0, 37.0, 43.0, 35.0, 18.0, 30.0, 23.0, 25.0, 19.0, 14.0, 13.0, 10.0, 5.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.87109375, -4.71514892578125, -4.5592041015625, -4.40325927734375, -4.247314453125, -4.09136962890625, -3.9354248046875, -3.77947998046875, -3.62353515625, -3.46759033203125, -3.3116455078125, -3.15570068359375, -2.999755859375, -2.84381103515625, -2.6878662109375, -2.53192138671875, -2.3759765625, -2.22003173828125, -2.0640869140625, -1.90814208984375, -1.752197265625, -1.59625244140625, -1.4403076171875, -1.28436279296875, -1.12841796875, -0.97247314453125, -0.8165283203125, -0.66058349609375, -0.504638671875, -0.34869384765625, -0.1927490234375, -0.03680419921875, 0.119140625, 0.27508544921875, 0.4310302734375, 0.58697509765625, 0.742919921875, 0.89886474609375, 1.0548095703125, 1.21075439453125, 1.36669921875, 1.52264404296875, 1.6785888671875, 1.83453369140625, 1.990478515625, 2.14642333984375, 2.3023681640625, 2.45831298828125, 2.6142578125, 2.77020263671875, 2.9261474609375, 3.08209228515625, 3.238037109375, 3.39398193359375, 3.5499267578125, 3.70587158203125, 3.86181640625, 4.01776123046875, 4.1737060546875, 4.32965087890625, 4.485595703125, 4.64154052734375, 4.7974853515625, 4.95343017578125, 5.109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 5.0, 8.0, 14.0, 12.0, 21.0, 13.0, 28.0, 64.0, 73.0, 120.0, 240.0, 459.0, 902.0, 2246.0, 8007.0, 50135.0, 670115.0, 281432.0, 26343.0, 5071.0, 1662.0, 697.0, 330.0, 201.0, 109.0, 73.0, 53.0, 33.0, 26.0, 15.0, 6.0, 1.0, 12.0, 8.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.78125, -27.84814453125, -26.9150390625, -25.98193359375, -25.048828125, -24.11572265625, -23.1826171875, -22.24951171875, -21.31640625, -20.38330078125, -19.4501953125, -18.51708984375, -17.583984375, -16.65087890625, -15.7177734375, -14.78466796875, -13.8515625, -12.91845703125, -11.9853515625, -11.05224609375, -10.119140625, -9.18603515625, -8.2529296875, -7.31982421875, -6.38671875, -5.45361328125, -4.5205078125, -3.58740234375, -2.654296875, -1.72119140625, -0.7880859375, 0.14501953125, 1.078125, 2.01123046875, 2.9443359375, 3.87744140625, 4.810546875, 5.74365234375, 6.6767578125, 7.60986328125, 8.54296875, 9.47607421875, 10.4091796875, 11.34228515625, 12.275390625, 13.20849609375, 14.1416015625, 15.07470703125, 16.0078125, 16.94091796875, 17.8740234375, 18.80712890625, 19.740234375, 20.67333984375, 21.6064453125, 22.53955078125, 23.47265625, 24.40576171875, 25.3388671875, 26.27197265625, 27.205078125, 28.13818359375, 29.0712890625, 30.00439453125, 30.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 3.0, 5.0, 8.0, 6.0, 11.0, 16.0, 12.0, 19.0, 20.0, 25.0, 30.0, 33.0, 40.0, 37.0, 33.0, 42.0, 50.0, 50.0, 49.0, 53.0, 52.0, 35.0, 46.0, 38.0, 39.0, 36.0, 35.0, 34.0, 15.0, 18.0, 25.0, 29.0, 13.0, 9.0, 7.0, 2.0, 9.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -17.949462890625, -17.33642578125, -16.723388671875, -16.1103515625, -15.497314453125, -14.88427734375, -14.271240234375, -13.658203125, -13.045166015625, -12.43212890625, -11.819091796875, -11.2060546875, -10.593017578125, -9.97998046875, -9.366943359375, -8.75390625, -8.140869140625, -7.52783203125, -6.914794921875, -6.3017578125, -5.688720703125, -5.07568359375, -4.462646484375, -3.849609375, -3.236572265625, -2.62353515625, -2.010498046875, -1.3974609375, -0.784423828125, -0.17138671875, 0.441650390625, 1.0546875, 1.667724609375, 2.28076171875, 2.893798828125, 3.5068359375, 4.119873046875, 4.73291015625, 5.345947265625, 5.958984375, 6.572021484375, 7.18505859375, 7.798095703125, 8.4111328125, 9.024169921875, 9.63720703125, 10.250244140625, 10.86328125, 11.476318359375, 12.08935546875, 12.702392578125, 13.3154296875, 13.928466796875, 14.54150390625, 15.154541015625, 15.767578125, 16.380615234375, 16.99365234375, 17.606689453125, 18.2197265625, 18.832763671875, 19.44580078125, 20.058837890625, 20.671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 12.0, 11.0, 29.0, 52.0, 117.0, 368.0, 1774.0, 58438.0, 981286.0, 5342.0, 720.0, 228.0, 96.0, 30.0, 14.0, 14.0, 5.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.875, -41.723388671875, -40.57177734375, -39.420166015625, -38.2685546875, -37.116943359375, -35.96533203125, -34.813720703125, -33.662109375, -32.510498046875, -31.35888671875, -30.207275390625, -29.0556640625, -27.904052734375, -26.75244140625, -25.600830078125, -24.44921875, -23.297607421875, -22.14599609375, -20.994384765625, -19.8427734375, -18.691162109375, -17.53955078125, -16.387939453125, -15.236328125, -14.084716796875, -12.93310546875, -11.781494140625, -10.6298828125, -9.478271484375, -8.32666015625, -7.175048828125, -6.0234375, -4.871826171875, -3.72021484375, -2.568603515625, -1.4169921875, -0.265380859375, 0.88623046875, 2.037841796875, 3.189453125, 4.341064453125, 5.49267578125, 6.644287109375, 7.7958984375, 8.947509765625, 10.09912109375, 11.250732421875, 12.40234375, 13.553955078125, 14.70556640625, 15.857177734375, 17.0087890625, 18.160400390625, 19.31201171875, 20.463623046875, 21.615234375, 22.766845703125, 23.91845703125, 25.070068359375, 26.2216796875, 27.373291015625, 28.52490234375, 29.676513671875, 30.828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 7.0, 7.0, 11.0, 26.0, 16.0, 35.0, 36.0, 64.0, 108.0, 159.0, 200.0, 100.0, 64.0, 41.0, 29.0, 35.0, 11.0, 17.0, 13.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.002227783203125, -0.0021677911281585693, -0.0021077990531921387, -0.002047806978225708, -0.0019878149032592773, -0.0019278228282928467, -0.001867830753326416, -0.0018078386783599854, -0.0017478466033935547, -0.001687854528427124, -0.0016278624534606934, -0.0015678703784942627, -0.001507878303527832, -0.0014478862285614014, -0.0013878941535949707, -0.00132790207862854, -0.0012679100036621094, -0.0012079179286956787, -0.001147925853729248, -0.0010879337787628174, -0.0010279417037963867, -0.0009679496288299561, -0.0009079575538635254, -0.0008479654788970947, -0.0007879734039306641, -0.0007279813289642334, -0.0006679892539978027, -0.0006079971790313721, -0.0005480051040649414, -0.00048801302909851074, -0.0004280209541320801, -0.0003680288791656494, -0.00030803680419921875, -0.0002480447292327881, -0.00018805265426635742, -0.00012806057929992676, -6.80685043334961e-05, -8.07642936706543e-06, 5.1915645599365234e-05, 0.0001119077205657959, 0.00017189979553222656, 0.00023189187049865723, 0.0002918839454650879, 0.00035187602043151855, 0.0004118680953979492, 0.0004718601703643799, 0.0005318522453308105, 0.0005918443202972412, 0.0006518363952636719, 0.0007118284702301025, 0.0007718205451965332, 0.0008318126201629639, 0.0008918046951293945, 0.0009517967700958252, 0.0010117888450622559, 0.0010717809200286865, 0.0011317729949951172, 0.0011917650699615479, 0.0012517571449279785, 0.0013117492198944092, 0.0013717412948608398, 0.0014317333698272705, 0.0014917254447937012, 0.0015517175197601318, 0.0016117095947265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 2.0, 12.0, 15.0, 13.0, 24.0, 34.0, 43.0, 101.0, 174.0, 311.0, 794.0, 2122.0, 8077.0, 72049.0, 887544.0, 65930.0, 7702.0, 2081.0, 796.0, 342.0, 150.0, 81.0, 42.0, 34.0, 27.0, 17.0, 6.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.70458984375, -9.2529296875, -8.80126953125, -8.349609375, -7.89794921875, -7.4462890625, -6.99462890625, -6.54296875, -6.09130859375, -5.6396484375, -5.18798828125, -4.736328125, -4.28466796875, -3.8330078125, -3.38134765625, -2.9296875, -2.47802734375, -2.0263671875, -1.57470703125, -1.123046875, -0.67138671875, -0.2197265625, 0.23193359375, 0.68359375, 1.13525390625, 1.5869140625, 2.03857421875, 2.490234375, 2.94189453125, 3.3935546875, 3.84521484375, 4.296875, 4.74853515625, 5.2001953125, 5.65185546875, 6.103515625, 6.55517578125, 7.0068359375, 7.45849609375, 7.91015625, 8.36181640625, 8.8134765625, 9.26513671875, 9.716796875, 10.16845703125, 10.6201171875, 11.07177734375, 11.5234375, 11.97509765625, 12.4267578125, 12.87841796875, 13.330078125, 13.78173828125, 14.2333984375, 14.68505859375, 15.13671875, 15.58837890625, 16.0400390625, 16.49169921875, 16.943359375, 17.39501953125, 17.8466796875, 18.29833984375, 18.75]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 18.0, 26.0, 30.0, 43.0, 64.0, 93.0, 92.0, 118.0, 139.0, 90.0, 91.0, 53.0, 36.0, 26.0, 10.0, 14.0, 10.0, 2.0, 1.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.93359375, -5.63214111328125, -5.3306884765625, -5.02923583984375, -4.727783203125, -4.42633056640625, -4.1248779296875, -3.82342529296875, -3.52197265625, -3.22052001953125, -2.9190673828125, -2.61761474609375, -2.316162109375, -2.01470947265625, -1.7132568359375, -1.41180419921875, -1.1103515625, -0.80889892578125, -0.5074462890625, -0.20599365234375, 0.095458984375, 0.39691162109375, 0.6983642578125, 0.99981689453125, 1.30126953125, 1.60272216796875, 1.9041748046875, 2.20562744140625, 2.507080078125, 2.80853271484375, 3.1099853515625, 3.41143798828125, 3.712890625, 4.01434326171875, 4.3157958984375, 4.61724853515625, 4.918701171875, 5.22015380859375, 5.5216064453125, 5.82305908203125, 6.12451171875, 6.42596435546875, 6.7274169921875, 7.02886962890625, 7.330322265625, 7.63177490234375, 7.9332275390625, 8.23468017578125, 8.5361328125, 8.83758544921875, 9.1390380859375, 9.44049072265625, 9.741943359375, 10.04339599609375, 10.3448486328125, 10.64630126953125, 10.94775390625, 11.24920654296875, 11.5506591796875, 11.85211181640625, 12.153564453125, 12.45501708984375, 12.7564697265625, 13.05792236328125, 13.359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 12.0, 30.0, 128.0, 375.0, 300.0, 100.0, 29.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-378.58331298828125, -368.02154541015625, -357.4598083496094, -346.8980407714844, -336.3362731933594, -325.7745361328125, -315.2127685546875, -304.6510009765625, -294.0892333984375, -283.5274658203125, -272.9657287597656, -262.4039611816406, -251.84219360351562, -241.2804412841797, -230.71868896484375, -220.15692138671875, -209.59518432617188, -199.03343200683594, -188.47166442871094, -177.909912109375, -167.34814453125, -156.78639221191406, -146.22463989257812, -135.66287231445312, -125.10111999511719, -114.53936004638672, -103.97760009765625, -93.41584777832031, -82.85408782958984, -72.29232788085938, -61.73057174682617, -51.16881561279297, -40.6070556640625, -30.045297622680664, -19.483539581298828, -8.921781539916992, 1.6399765014648438, 12.201736450195312, 22.763492584228516, 33.32524871826172, 43.88700866699219, 54.448768615722656, 65.01052856445312, 75.57228088378906, 86.13404083251953, 96.69580078125, 107.25755310058594, 117.8193130493164, 128.38107299804688, 138.9428253173828, 149.5045928955078, 160.06634521484375, 170.62811279296875, 181.1898651123047, 191.75161743164062, 202.31338500976562, 212.87513732910156, 223.4368896484375, 233.9986572265625, 244.56040954589844, 255.12216186523438, 265.6839294433594, 276.2456970214844, 286.80743408203125, 297.36920166015625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 7.0, 11.0, 12.0, 11.0, 20.0, 24.0, 20.0, 31.0, 43.0, 36.0, 36.0, 34.0, 35.0, 54.0, 54.0, 63.0, 70.0, 47.0, 43.0, 35.0, 37.0, 38.0, 38.0, 24.0, 23.0, 20.0, 25.0, 14.0, 16.0, 11.0, 14.0, 7.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-89.90695190429688, -87.3105239868164, -84.71410369873047, -82.11767578125, -79.52125549316406, -76.9248275756836, -74.32839965820312, -71.73197937011719, -69.13555145263672, -66.53912353515625, -63.94270324707031, -61.346275329589844, -58.74985122680664, -56.15342712402344, -53.55699920654297, -50.960575103759766, -48.36415100097656, -45.76772689819336, -43.171302795410156, -40.57487487792969, -37.978450775146484, -35.38202667236328, -32.78559875488281, -30.18917465209961, -27.592750549316406, -24.996326446533203, -22.399900436401367, -19.80347442626953, -17.207050323486328, -14.610625267028809, -12.014200210571289, -9.417774200439453, -6.82135009765625, -4.2249250411987305, -1.628499984741211, 0.9679250717163086, 3.564350128173828, 6.160775184631348, 8.757200241088867, 11.353626251220703, 13.950050354003906, 16.54647445678711, 19.142900466918945, 21.73932647705078, 24.335750579833984, 26.932174682617188, 29.528600692749023, 32.12502670288086, 34.72145080566406, 37.317874908447266, 39.91429901123047, 42.51072692871094, 45.10715103149414, 47.703575134277344, 50.30000305175781, 52.896427154541016, 55.49285125732422, 58.08927536010742, 60.685699462890625, 63.282127380371094, 65.87855529785156, 68.4749755859375, 71.07140350341797, 73.66783142089844, 76.26425170898438]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 10.0, 17.0, 13.0, 29.0, 30.0, 68.0, 133.0, 267.0, 644.0, 1866.0, 7167.0, 39501.0, 608260.0, 3368869.0, 144042.0, 17760.0, 3789.0, 1072.0, 361.0, 141.0, 80.0, 39.0, 40.0, 16.0, 12.0, 13.0, 3.0, 6.0, 5.0, 2.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -11.8878173828125, -11.377197265625, -10.8665771484375, -10.35595703125, -9.8453369140625, -9.334716796875, -8.8240966796875, -8.3134765625, -7.8028564453125, -7.292236328125, -6.7816162109375, -6.27099609375, -5.7603759765625, -5.249755859375, -4.7391357421875, -4.228515625, -3.7178955078125, -3.207275390625, -2.6966552734375, -2.18603515625, -1.6754150390625, -1.164794921875, -0.6541748046875, -0.1435546875, 0.3670654296875, 0.877685546875, 1.3883056640625, 1.89892578125, 2.4095458984375, 2.920166015625, 3.4307861328125, 3.94140625, 4.4520263671875, 4.962646484375, 5.4732666015625, 5.98388671875, 6.4945068359375, 7.005126953125, 7.5157470703125, 8.0263671875, 8.5369873046875, 9.047607421875, 9.5582275390625, 10.06884765625, 10.5794677734375, 11.090087890625, 11.6007080078125, 12.111328125, 12.6219482421875, 13.132568359375, 13.6431884765625, 14.15380859375, 14.6644287109375, 15.175048828125, 15.6856689453125, 16.1962890625, 16.7069091796875, 17.217529296875, 17.7281494140625, 18.23876953125, 18.7493896484375, 19.260009765625, 19.7706298828125, 20.28125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 8.0, 6.0, 8.0, 8.0, 12.0, 11.0, 13.0, 14.0, 17.0, 30.0, 31.0, 34.0, 37.0, 40.0, 32.0, 37.0, 60.0, 45.0, 52.0, 50.0, 51.0, 49.0, 48.0, 35.0, 34.0, 21.0, 29.0, 35.0, 32.0, 24.0, 17.0, 15.0, 15.0, 7.0, 10.0, 12.0, 4.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.2340087890625, -4.096923828125, -3.9598388671875, -3.82275390625, -3.6856689453125, -3.548583984375, -3.4114990234375, -3.2744140625, -3.1373291015625, -3.000244140625, -2.8631591796875, -2.72607421875, -2.5889892578125, -2.451904296875, -2.3148193359375, -2.177734375, -2.0406494140625, -1.903564453125, -1.7664794921875, -1.62939453125, -1.4923095703125, -1.355224609375, -1.2181396484375, -1.0810546875, -0.9439697265625, -0.806884765625, -0.6697998046875, -0.53271484375, -0.3956298828125, -0.258544921875, -0.1214599609375, 0.015625, 0.1527099609375, 0.289794921875, 0.4268798828125, 0.56396484375, 0.7010498046875, 0.838134765625, 0.9752197265625, 1.1123046875, 1.2493896484375, 1.386474609375, 1.5235595703125, 1.66064453125, 1.7977294921875, 1.934814453125, 2.0718994140625, 2.208984375, 2.3460693359375, 2.483154296875, 2.6202392578125, 2.75732421875, 2.8944091796875, 3.031494140625, 3.1685791015625, 3.3056640625, 3.4427490234375, 3.579833984375, 3.7169189453125, 3.85400390625, 3.9910888671875, 4.128173828125, 4.2652587890625, 4.40234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 14.0, 12.0, 25.0, 34.0, 48.0, 75.0, 113.0, 238.0, 517.0, 1108.0, 2711.0, 8606.0, 31532.0, 165629.0, 2442358.0, 1394796.0, 112209.0, 23416.0, 6685.0, 2264.0, 911.0, 430.0, 212.0, 116.0, 72.0, 48.0, 22.0, 19.0, 17.0, 10.0, 5.0, 8.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.657958984375, -12.26123046875, -11.864501953125, -11.4677734375, -11.071044921875, -10.67431640625, -10.277587890625, -9.880859375, -9.484130859375, -9.08740234375, -8.690673828125, -8.2939453125, -7.897216796875, -7.50048828125, -7.103759765625, -6.70703125, -6.310302734375, -5.91357421875, -5.516845703125, -5.1201171875, -4.723388671875, -4.32666015625, -3.929931640625, -3.533203125, -3.136474609375, -2.73974609375, -2.343017578125, -1.9462890625, -1.549560546875, -1.15283203125, -0.756103515625, -0.359375, 0.037353515625, 0.43408203125, 0.830810546875, 1.2275390625, 1.624267578125, 2.02099609375, 2.417724609375, 2.814453125, 3.211181640625, 3.60791015625, 4.004638671875, 4.4013671875, 4.798095703125, 5.19482421875, 5.591552734375, 5.98828125, 6.385009765625, 6.78173828125, 7.178466796875, 7.5751953125, 7.971923828125, 8.36865234375, 8.765380859375, 9.162109375, 9.558837890625, 9.95556640625, 10.352294921875, 10.7490234375, 11.145751953125, 11.54248046875, 11.939208984375, 12.3359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 5.0, 6.0, 11.0, 8.0, 18.0, 23.0, 26.0, 27.0, 39.0, 68.0, 75.0, 95.0, 136.0, 187.0, 274.0, 421.0, 619.0, 600.0, 446.0, 272.0, 209.0, 130.0, 77.0, 70.0, 58.0, 38.0, 28.0, 25.0, 15.0, 15.0, 8.0, 6.0, 8.0, 4.0, 5.0, 5.0, 7.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8125, -10.4749755859375, -10.137451171875, -9.7999267578125, -9.46240234375, -9.1248779296875, -8.787353515625, -8.4498291015625, -8.1123046875, -7.7747802734375, -7.437255859375, -7.0997314453125, -6.76220703125, -6.4246826171875, -6.087158203125, -5.7496337890625, -5.412109375, -5.0745849609375, -4.737060546875, -4.3995361328125, -4.06201171875, -3.7244873046875, -3.386962890625, -3.0494384765625, -2.7119140625, -2.3743896484375, -2.036865234375, -1.6993408203125, -1.36181640625, -1.0242919921875, -0.686767578125, -0.3492431640625, -0.01171875, 0.3258056640625, 0.663330078125, 1.0008544921875, 1.33837890625, 1.6759033203125, 2.013427734375, 2.3509521484375, 2.6884765625, 3.0260009765625, 3.363525390625, 3.7010498046875, 4.03857421875, 4.3760986328125, 4.713623046875, 5.0511474609375, 5.388671875, 5.7261962890625, 6.063720703125, 6.4012451171875, 6.73876953125, 7.0762939453125, 7.413818359375, 7.7513427734375, 8.0888671875, 8.4263916015625, 8.763916015625, 9.1014404296875, 9.43896484375, 9.7764892578125, 10.114013671875, 10.4515380859375, 10.7890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 8.0, 14.0, 32.0, 68.0, 154.0, 215.0, 204.0, 162.0, 66.0, 26.0, 14.0, 5.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.7950439453125, -124.1967544555664, -118.59846496582031, -113.00017547607422, -107.40188598632812, -101.80359649658203, -96.20530700683594, -90.60701751708984, -85.00872802734375, -79.41043853759766, -73.81214904785156, -68.21385955810547, -62.615570068359375, -57.01728057861328, -51.41899108886719, -45.820701599121094, -40.222412109375, -34.624122619628906, -29.025833129882812, -23.42754364013672, -17.829254150390625, -12.230964660644531, -6.6326751708984375, -1.0343856811523438, 4.56390380859375, 10.162193298339844, 15.760482788085938, 21.35877227783203, 26.957061767578125, 32.55535125732422, 38.15364074707031, 43.751930236816406, 49.3502197265625, 54.948509216308594, 60.54679870605469, 66.14508819580078, 71.74337768554688, 77.34166717529297, 82.93995666503906, 88.53824615478516, 94.13653564453125, 99.73482513427734, 105.33311462402344, 110.93140411376953, 116.52969360351562, 122.12798309326172, 127.72627258300781, 133.32455444335938, 138.9228515625, 144.52114868164062, 150.1194305419922, 155.71771240234375, 161.31600952148438, 166.914306640625, 172.51258850097656, 178.11087036132812, 183.70916748046875, 189.30746459960938, 194.90574645996094, 200.5040283203125, 206.10232543945312, 211.70062255859375, 217.2989044189453, 222.89718627929688, 228.4954833984375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 3.0, 10.0, 14.0, 20.0, 15.0, 21.0, 23.0, 31.0, 35.0, 18.0, 27.0, 47.0, 39.0, 43.0, 49.0, 54.0, 51.0, 44.0, 45.0, 43.0, 50.0, 50.0, 31.0, 30.0, 33.0, 30.0, 26.0, 20.0, 14.0, 22.0, 11.0, 12.0, 7.0, 8.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.21015548706055, -58.33202362060547, -56.453887939453125, -54.57575607299805, -52.69762420654297, -50.81949234008789, -48.94136047363281, -47.06322479248047, -45.18509292602539, -43.30696105957031, -41.42882537841797, -39.55069351196289, -37.67256164550781, -35.794429779052734, -33.916297912597656, -32.03816223144531, -30.160030364990234, -28.281898498535156, -26.403764724731445, -24.525630950927734, -22.647499084472656, -20.769367218017578, -18.891233444213867, -17.013099670410156, -15.134967803955078, -13.256834983825684, -11.378702163696289, -9.500569343566895, -7.6224365234375, -5.7443037033081055, -3.866170883178711, -1.9880380630493164, -0.1099090576171875, 1.768223762512207, 3.6463565826416016, 5.524489402770996, 7.402622222900391, 9.280755043029785, 11.15888786315918, 13.037020683288574, 14.915153503417969, 16.793285369873047, 18.671419143676758, 20.54955291748047, 22.427684783935547, 24.305816650390625, 26.183950424194336, 28.062084197998047, 29.940216064453125, 31.818347930908203, 33.69647979736328, 35.574615478515625, 37.4527473449707, 39.33087921142578, 41.209014892578125, 43.0871467590332, 44.96527862548828, 46.84341049194336, 48.72154235839844, 50.59967803955078, 52.47780990600586, 54.35594177246094, 56.23407745361328, 58.11220932006836, 59.99034118652344]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 1.0, 6.0, 7.0, 6.0, 6.0, 14.0, 14.0, 21.0, 32.0, 48.0, 104.0, 135.0, 258.0, 454.0, 1024.0, 2326.0, 6576.0, 21979.0, 83647.0, 318753.0, 439683.0, 125516.0, 32892.0, 9201.0, 3208.0, 1336.0, 576.0, 282.0, 158.0, 95.0, 58.0, 47.0, 26.0, 24.0, 13.0, 9.0, 2.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.53125, -16.01708984375, -15.5029296875, -14.98876953125, -14.474609375, -13.96044921875, -13.4462890625, -12.93212890625, -12.41796875, -11.90380859375, -11.3896484375, -10.87548828125, -10.361328125, -9.84716796875, -9.3330078125, -8.81884765625, -8.3046875, -7.79052734375, -7.2763671875, -6.76220703125, -6.248046875, -5.73388671875, -5.2197265625, -4.70556640625, -4.19140625, -3.67724609375, -3.1630859375, -2.64892578125, -2.134765625, -1.62060546875, -1.1064453125, -0.59228515625, -0.078125, 0.43603515625, 0.9501953125, 1.46435546875, 1.978515625, 2.49267578125, 3.0068359375, 3.52099609375, 4.03515625, 4.54931640625, 5.0634765625, 5.57763671875, 6.091796875, 6.60595703125, 7.1201171875, 7.63427734375, 8.1484375, 8.66259765625, 9.1767578125, 9.69091796875, 10.205078125, 10.71923828125, 11.2333984375, 11.74755859375, 12.26171875, 12.77587890625, 13.2900390625, 13.80419921875, 14.318359375, 14.83251953125, 15.3466796875, 15.86083984375, 16.375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 5.0, 3.0, 6.0, 2.0, 5.0, 7.0, 9.0, 8.0, 13.0, 9.0, 13.0, 21.0, 22.0, 25.0, 28.0, 28.0, 41.0, 31.0, 39.0, 43.0, 40.0, 43.0, 48.0, 42.0, 39.0, 55.0, 43.0, 52.0, 43.0, 38.0, 33.0, 23.0, 23.0, 19.0, 18.0, 18.0, 15.0, 16.0, 9.0, 9.0, 8.0, 9.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.13641357421875, -4.0032958984375, -3.87017822265625, -3.737060546875, -3.60394287109375, -3.4708251953125, -3.33770751953125, -3.20458984375, -3.07147216796875, -2.9383544921875, -2.80523681640625, -2.672119140625, -2.53900146484375, -2.4058837890625, -2.27276611328125, -2.1396484375, -2.00653076171875, -1.8734130859375, -1.74029541015625, -1.607177734375, -1.47406005859375, -1.3409423828125, -1.20782470703125, -1.07470703125, -0.94158935546875, -0.8084716796875, -0.67535400390625, -0.542236328125, -0.40911865234375, -0.2760009765625, -0.14288330078125, -0.009765625, 0.12335205078125, 0.2564697265625, 0.38958740234375, 0.522705078125, 0.65582275390625, 0.7889404296875, 0.92205810546875, 1.05517578125, 1.18829345703125, 1.3214111328125, 1.45452880859375, 1.587646484375, 1.72076416015625, 1.8538818359375, 1.98699951171875, 2.1201171875, 2.25323486328125, 2.3863525390625, 2.51947021484375, 2.652587890625, 2.78570556640625, 2.9188232421875, 3.05194091796875, 3.18505859375, 3.31817626953125, 3.4512939453125, 3.58441162109375, 3.717529296875, 3.85064697265625, 3.9837646484375, 4.11688232421875, 4.25]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 21.0, 25.0, 26.0, 49.0, 80.0, 138.0, 263.0, 436.0, 873.0, 2041.0, 7720.0, 113225.0, 877504.0, 38205.0, 4793.0, 1570.0, 668.0, 360.0, 203.0, 106.0, 56.0, 45.0, 35.0, 16.0, 20.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-42.375, -41.02294921875, -39.6708984375, -38.31884765625, -36.966796875, -35.61474609375, -34.2626953125, -32.91064453125, -31.55859375, -30.20654296875, -28.8544921875, -27.50244140625, -26.150390625, -24.79833984375, -23.4462890625, -22.09423828125, -20.7421875, -19.39013671875, -18.0380859375, -16.68603515625, -15.333984375, -13.98193359375, -12.6298828125, -11.27783203125, -9.92578125, -8.57373046875, -7.2216796875, -5.86962890625, -4.517578125, -3.16552734375, -1.8134765625, -0.46142578125, 0.890625, 2.24267578125, 3.5947265625, 4.94677734375, 6.298828125, 7.65087890625, 9.0029296875, 10.35498046875, 11.70703125, 13.05908203125, 14.4111328125, 15.76318359375, 17.115234375, 18.46728515625, 19.8193359375, 21.17138671875, 22.5234375, 23.87548828125, 25.2275390625, 26.57958984375, 27.931640625, 29.28369140625, 30.6357421875, 31.98779296875, 33.33984375, 34.69189453125, 36.0439453125, 37.39599609375, 38.748046875, 40.10009765625, 41.4521484375, 42.80419921875, 44.15625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 8.0, 13.0, 16.0, 16.0, 19.0, 24.0, 19.0, 40.0, 44.0, 30.0, 49.0, 41.0, 66.0, 61.0, 68.0, 61.0, 71.0, 50.0, 41.0, 48.0, 40.0, 31.0, 28.0, 27.0, 16.0, 16.0, 15.0, 12.0, 9.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.19189453125, -19.4306640625, -18.66943359375, -17.908203125, -17.14697265625, -16.3857421875, -15.62451171875, -14.86328125, -14.10205078125, -13.3408203125, -12.57958984375, -11.818359375, -11.05712890625, -10.2958984375, -9.53466796875, -8.7734375, -8.01220703125, -7.2509765625, -6.48974609375, -5.728515625, -4.96728515625, -4.2060546875, -3.44482421875, -2.68359375, -1.92236328125, -1.1611328125, -0.39990234375, 0.361328125, 1.12255859375, 1.8837890625, 2.64501953125, 3.40625, 4.16748046875, 4.9287109375, 5.68994140625, 6.451171875, 7.21240234375, 7.9736328125, 8.73486328125, 9.49609375, 10.25732421875, 11.0185546875, 11.77978515625, 12.541015625, 13.30224609375, 14.0634765625, 14.82470703125, 15.5859375, 16.34716796875, 17.1083984375, 17.86962890625, 18.630859375, 19.39208984375, 20.1533203125, 20.91455078125, 21.67578125, 22.43701171875, 23.1982421875, 23.95947265625, 24.720703125, 25.48193359375, 26.2431640625, 27.00439453125, 27.765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 12.0, 8.0, 6.0, 7.0, 15.0, 20.0, 16.0, 29.0, 79.0, 108.0, 204.0, 560.0, 2611.0, 26913.0, 909966.0, 100956.0, 5455.0, 940.0, 312.0, 137.0, 63.0, 43.0, 25.0, 19.0, 13.0, 5.0, 4.0, 4.0, 2.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1875, -12.711181640625, -12.23486328125, -11.758544921875, -11.2822265625, -10.805908203125, -10.32958984375, -9.853271484375, -9.376953125, -8.900634765625, -8.42431640625, -7.947998046875, -7.4716796875, -6.995361328125, -6.51904296875, -6.042724609375, -5.56640625, -5.090087890625, -4.61376953125, -4.137451171875, -3.6611328125, -3.184814453125, -2.70849609375, -2.232177734375, -1.755859375, -1.279541015625, -0.80322265625, -0.326904296875, 0.1494140625, 0.625732421875, 1.10205078125, 1.578369140625, 2.0546875, 2.531005859375, 3.00732421875, 3.483642578125, 3.9599609375, 4.436279296875, 4.91259765625, 5.388916015625, 5.865234375, 6.341552734375, 6.81787109375, 7.294189453125, 7.7705078125, 8.246826171875, 8.72314453125, 9.199462890625, 9.67578125, 10.152099609375, 10.62841796875, 11.104736328125, 11.5810546875, 12.057373046875, 12.53369140625, 13.010009765625, 13.486328125, 13.962646484375, 14.43896484375, 14.915283203125, 15.3916015625, 15.867919921875, 16.34423828125, 16.820556640625, 17.296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 11.0, 4.0, 9.0, 16.0, 12.0, 19.0, 28.0, 34.0, 38.0, 45.0, 67.0, 85.0, 146.0, 130.0, 78.0, 49.0, 33.0, 34.0, 27.0, 23.0, 15.0, 15.0, 20.0, 7.0, 9.0, 7.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0018224716186523438, -0.0017727762460708618, -0.0017230808734893799, -0.001673385500907898, -0.001623690128326416, -0.001573994755744934, -0.0015242993831634521, -0.0014746040105819702, -0.0014249086380004883, -0.0013752132654190063, -0.0013255178928375244, -0.0012758225202560425, -0.0012261271476745605, -0.0011764317750930786, -0.0011267364025115967, -0.0010770410299301147, -0.0010273456573486328, -0.0009776502847671509, -0.0009279549121856689, -0.000878259539604187, -0.0008285641670227051, -0.0007788687944412231, -0.0007291734218597412, -0.0006794780492782593, -0.0006297826766967773, -0.0005800873041152954, -0.0005303919315338135, -0.00048069655895233154, -0.0004310011863708496, -0.0003813058137893677, -0.00033161044120788574, -0.0002819150686264038, -0.00023221969604492188, -0.00018252432346343994, -0.000132828950881958, -8.313357830047607e-05, -3.343820571899414e-05, 1.6257166862487793e-05, 6.595253944396973e-05, 0.00011564791202545166, 0.0001653432846069336, 0.00021503865718841553, 0.00026473402976989746, 0.0003144294023513794, 0.00036412477493286133, 0.00041382014751434326, 0.0004635155200958252, 0.0005132108926773071, 0.0005629062652587891, 0.000612601637840271, 0.0006622970104217529, 0.0007119923830032349, 0.0007616877555847168, 0.0008113831281661987, 0.0008610785007476807, 0.0009107738733291626, 0.0009604692459106445, 0.0010101646184921265, 0.0010598599910736084, 0.0011095553636550903, 0.0011592507362365723, 0.0012089461088180542, 0.0012586414813995361, 0.001308336853981018, 0.0013580322265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 10.0, 9.0, 8.0, 14.0, 26.0, 40.0, 73.0, 94.0, 144.0, 264.0, 494.0, 1081.0, 2598.0, 8852.0, 54876.0, 828631.0, 130613.0, 14125.0, 3809.0, 1317.0, 637.0, 299.0, 180.0, 111.0, 64.0, 41.0, 30.0, 32.0, 13.0, 15.0, 9.0, 5.0, 7.0, 6.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-10.9375, -10.6307373046875, -10.323974609375, -10.0172119140625, -9.71044921875, -9.4036865234375, -9.096923828125, -8.7901611328125, -8.4833984375, -8.1766357421875, -7.869873046875, -7.5631103515625, -7.25634765625, -6.9495849609375, -6.642822265625, -6.3360595703125, -6.029296875, -5.7225341796875, -5.415771484375, -5.1090087890625, -4.80224609375, -4.4954833984375, -4.188720703125, -3.8819580078125, -3.5751953125, -3.2684326171875, -2.961669921875, -2.6549072265625, -2.34814453125, -2.0413818359375, -1.734619140625, -1.4278564453125, -1.12109375, -0.8143310546875, -0.507568359375, -0.2008056640625, 0.10595703125, 0.4127197265625, 0.719482421875, 1.0262451171875, 1.3330078125, 1.6397705078125, 1.946533203125, 2.2532958984375, 2.56005859375, 2.8668212890625, 3.173583984375, 3.4803466796875, 3.787109375, 4.0938720703125, 4.400634765625, 4.7073974609375, 5.01416015625, 5.3209228515625, 5.627685546875, 5.9344482421875, 6.2412109375, 6.5479736328125, 6.854736328125, 7.1614990234375, 7.46826171875, 7.7750244140625, 8.081787109375, 8.3885498046875, 8.6953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 7.0, 15.0, 15.0, 27.0, 33.0, 43.0, 56.0, 64.0, 94.0, 131.0, 122.0, 106.0, 83.0, 49.0, 37.0, 33.0, 13.0, 15.0, 7.0, 6.0, 3.0, 7.0, 7.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.58984375, -6.34527587890625, -6.1007080078125, -5.85614013671875, -5.611572265625, -5.36700439453125, -5.1224365234375, -4.87786865234375, -4.63330078125, -4.38873291015625, -4.1441650390625, -3.89959716796875, -3.655029296875, -3.41046142578125, -3.1658935546875, -2.92132568359375, -2.6767578125, -2.43218994140625, -2.1876220703125, -1.94305419921875, -1.698486328125, -1.45391845703125, -1.2093505859375, -0.96478271484375, -0.72021484375, -0.47564697265625, -0.2310791015625, 0.01348876953125, 0.258056640625, 0.50262451171875, 0.7471923828125, 0.99176025390625, 1.236328125, 1.48089599609375, 1.7254638671875, 1.97003173828125, 2.214599609375, 2.45916748046875, 2.7037353515625, 2.94830322265625, 3.19287109375, 3.43743896484375, 3.6820068359375, 3.92657470703125, 4.171142578125, 4.41571044921875, 4.6602783203125, 4.90484619140625, 5.1494140625, 5.39398193359375, 5.6385498046875, 5.88311767578125, 6.127685546875, 6.37225341796875, 6.6168212890625, 6.86138916015625, 7.10595703125, 7.35052490234375, 7.5950927734375, 7.83966064453125, 8.084228515625, 8.32879638671875, 8.5733642578125, 8.81793212890625, 9.0625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 10.0, 21.0, 34.0, 63.0, 115.0, 204.0, 232.0, 134.0, 87.0, 40.0, 18.0, 10.0, 5.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.42556762695312, -152.39869689941406, -147.371826171875, -142.34495544433594, -137.31808471679688, -132.29119873046875, -127.26433563232422, -122.23745727539062, -117.21058654785156, -112.1837158203125, -107.15684509277344, -102.12997436523438, -97.10309600830078, -92.07622528076172, -87.04935455322266, -82.02247619628906, -76.99561309814453, -71.96874237060547, -66.9418716430664, -61.91499710083008, -56.88812255859375, -51.86125183105469, -46.834381103515625, -41.8075065612793, -36.780635833740234, -31.75376319885254, -26.726890563964844, -21.70001983642578, -16.673147201538086, -11.64627456665039, -6.619403839111328, -1.592529296875, 3.4343414306640625, 8.461214065551758, 13.488085746765137, 18.514957427978516, 23.54183006286621, 28.568702697753906, 33.59557342529297, 38.6224479675293, 43.64931869506836, 48.67618942260742, 53.70306396484375, 58.72993469238281, 63.756805419921875, 68.78367614746094, 73.810546875, 78.8374252319336, 83.86429595947266, 88.89116668701172, 93.91803741455078, 98.94491577148438, 103.97178649902344, 108.9986572265625, 114.02552795410156, 119.05239868164062, 124.07926940917969, 129.10614013671875, 134.1330108642578, 139.15988159179688, 144.18675231933594, 149.213623046875, 154.24050903320312, 159.2673797607422, 164.29425048828125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 12.0, 10.0, 11.0, 7.0, 18.0, 20.0, 32.0, 26.0, 28.0, 29.0, 30.0, 33.0, 37.0, 39.0, 49.0, 64.0, 55.0, 45.0, 56.0, 51.0, 44.0, 25.0, 36.0, 37.0, 24.0, 20.0, 20.0, 14.0, 14.0, 10.0, 16.0, 12.0, 8.0, 6.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-68.70359802246094, -66.64787292480469, -64.5921401977539, -62.53641128540039, -60.480682373046875, -58.42495346069336, -56.369224548339844, -54.31349563598633, -52.25776672363281, -50.2020378112793, -48.14630889892578, -46.090579986572266, -44.03485107421875, -41.979122161865234, -39.92339324951172, -37.8676643371582, -35.81193542480469, -33.75620651245117, -31.700477600097656, -29.64474868774414, -27.589019775390625, -25.53329086303711, -23.477561950683594, -21.421833038330078, -19.366104125976562, -17.310375213623047, -15.254646301269531, -13.198917388916016, -11.1431884765625, -9.087459564208984, -7.031730651855469, -4.976001739501953, -2.920276641845703, -0.8645477294921875, 1.1911811828613281, 3.2469100952148438, 5.302639007568359, 7.358367919921875, 9.41409683227539, 11.469825744628906, 13.525554656982422, 15.581283569335938, 17.637012481689453, 19.69274139404297, 21.748470306396484, 23.80419921875, 25.859928131103516, 27.91565704345703, 29.971385955810547, 32.02711486816406, 34.08284378051758, 36.138572692871094, 38.19430160522461, 40.250030517578125, 42.30575942993164, 44.361488342285156, 46.41721725463867, 48.47294616699219, 50.5286750793457, 52.58440399169922, 54.640132904052734, 56.69586181640625, 58.751590728759766, 60.80731964111328, 62.8630485534668]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 11.0, 27.0, 23.0, 68.0, 186.0, 597.0, 2652.0, 26282.0, 3200767.0, 946646.0, 14620.0, 1704.0, 407.0, 147.0, 62.0, 25.0, 19.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.5, -16.735595703125, -15.97119140625, -15.206787109375, -14.4423828125, -13.677978515625, -12.91357421875, -12.149169921875, -11.384765625, -10.620361328125, -9.85595703125, -9.091552734375, -8.3271484375, -7.562744140625, -6.79833984375, -6.033935546875, -5.26953125, -4.505126953125, -3.74072265625, -2.976318359375, -2.2119140625, -1.447509765625, -0.68310546875, 0.081298828125, 0.845703125, 1.610107421875, 2.37451171875, 3.138916015625, 3.9033203125, 4.667724609375, 5.43212890625, 6.196533203125, 6.9609375, 7.725341796875, 8.48974609375, 9.254150390625, 10.0185546875, 10.782958984375, 11.54736328125, 12.311767578125, 13.076171875, 13.840576171875, 14.60498046875, 15.369384765625, 16.1337890625, 16.898193359375, 17.66259765625, 18.427001953125, 19.19140625, 19.955810546875, 20.72021484375, 21.484619140625, 22.2490234375, 23.013427734375, 23.77783203125, 24.542236328125, 25.306640625, 26.071044921875, 26.83544921875, 27.599853515625, 28.3642578125, 29.128662109375, 29.89306640625, 30.657470703125, 31.421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 6.0, 11.0, 22.0, 14.0, 26.0, 19.0, 27.0, 22.0, 32.0, 39.0, 37.0, 41.0, 59.0, 51.0, 49.0, 49.0, 45.0, 49.0, 47.0, 52.0, 58.0, 46.0, 34.0, 29.0, 26.0, 24.0, 11.0, 17.0, 13.0, 7.0, 6.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-5.37890625, -5.230712890625, -5.08251953125, -4.934326171875, -4.7861328125, -4.637939453125, -4.48974609375, -4.341552734375, -4.193359375, -4.045166015625, -3.89697265625, -3.748779296875, -3.6005859375, -3.452392578125, -3.30419921875, -3.156005859375, -3.0078125, -2.859619140625, -2.71142578125, -2.563232421875, -2.4150390625, -2.266845703125, -2.11865234375, -1.970458984375, -1.822265625, -1.674072265625, -1.52587890625, -1.377685546875, -1.2294921875, -1.081298828125, -0.93310546875, -0.784912109375, -0.63671875, -0.488525390625, -0.34033203125, -0.192138671875, -0.0439453125, 0.104248046875, 0.25244140625, 0.400634765625, 0.548828125, 0.697021484375, 0.84521484375, 0.993408203125, 1.1416015625, 1.289794921875, 1.43798828125, 1.586181640625, 1.734375, 1.882568359375, 2.03076171875, 2.178955078125, 2.3271484375, 2.475341796875, 2.62353515625, 2.771728515625, 2.919921875, 3.068115234375, 3.21630859375, 3.364501953125, 3.5126953125, 3.660888671875, 3.80908203125, 3.957275390625, 4.10546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 5.0, 8.0, 15.0, 19.0, 24.0, 61.0, 96.0, 213.0, 501.0, 1199.0, 4702.0, 31956.0, 772040.0, 3303798.0, 68517.0, 8172.0, 1854.0, 615.0, 254.0, 122.0, 48.0, 27.0, 17.0, 9.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1171875, -14.4915771484375, -13.865966796875, -13.2403564453125, -12.61474609375, -11.9891357421875, -11.363525390625, -10.7379150390625, -10.1123046875, -9.4866943359375, -8.861083984375, -8.2354736328125, -7.60986328125, -6.9842529296875, -6.358642578125, -5.7330322265625, -5.107421875, -4.4818115234375, -3.856201171875, -3.2305908203125, -2.60498046875, -1.9793701171875, -1.353759765625, -0.7281494140625, -0.1025390625, 0.5230712890625, 1.148681640625, 1.7742919921875, 2.39990234375, 3.0255126953125, 3.651123046875, 4.2767333984375, 4.90234375, 5.5279541015625, 6.153564453125, 6.7791748046875, 7.40478515625, 8.0303955078125, 8.656005859375, 9.2816162109375, 9.9072265625, 10.5328369140625, 11.158447265625, 11.7840576171875, 12.40966796875, 13.0352783203125, 13.660888671875, 14.2864990234375, 14.912109375, 15.5377197265625, 16.163330078125, 16.7889404296875, 17.41455078125, 18.0401611328125, 18.665771484375, 19.2913818359375, 19.9169921875, 20.5426025390625, 21.168212890625, 21.7938232421875, 22.41943359375, 23.0450439453125, 23.670654296875, 24.2962646484375, 24.921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 14.0, 27.0, 31.0, 43.0, 67.0, 109.0, 232.0, 490.0, 921.0, 1026.0, 522.0, 242.0, 124.0, 67.0, 39.0, 28.0, 16.0, 17.0, 12.0, 15.0, 10.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.9586181640625, -19.448486328125, -18.9383544921875, -18.42822265625, -17.9180908203125, -17.407958984375, -16.8978271484375, -16.3876953125, -15.8775634765625, -15.367431640625, -14.8572998046875, -14.34716796875, -13.8370361328125, -13.326904296875, -12.8167724609375, -12.306640625, -11.7965087890625, -11.286376953125, -10.7762451171875, -10.26611328125, -9.7559814453125, -9.245849609375, -8.7357177734375, -8.2255859375, -7.7154541015625, -7.205322265625, -6.6951904296875, -6.18505859375, -5.6749267578125, -5.164794921875, -4.6546630859375, -4.14453125, -3.6343994140625, -3.124267578125, -2.6141357421875, -2.10400390625, -1.5938720703125, -1.083740234375, -0.5736083984375, -0.0634765625, 0.4466552734375, 0.956787109375, 1.4669189453125, 1.97705078125, 2.4871826171875, 2.997314453125, 3.5074462890625, 4.017578125, 4.5277099609375, 5.037841796875, 5.5479736328125, 6.05810546875, 6.5682373046875, 7.078369140625, 7.5885009765625, 8.0986328125, 8.6087646484375, 9.118896484375, 9.6290283203125, 10.13916015625, 10.6492919921875, 11.159423828125, 11.6695556640625, 12.1796875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 8.0, 15.0, 73.0, 330.0, 401.0, 138.0, 27.0, 6.0, 1.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-307.48004150390625, -298.24835205078125, -289.01666259765625, -279.78497314453125, -270.55328369140625, -261.32159423828125, -252.08990478515625, -242.85821533203125, -233.62652587890625, -224.39483642578125, -215.16314697265625, -205.93145751953125, -196.69976806640625, -187.46807861328125, -178.23638916015625, -169.00469970703125, -159.77301025390625, -150.54132080078125, -141.30963134765625, -132.07794189453125, -122.84625244140625, -113.61456298828125, -104.38287353515625, -95.15118408203125, -85.91949462890625, -76.68780517578125, -67.45611572265625, -58.22442626953125, -48.99273681640625, -39.76104736328125, -30.52935791015625, -21.29766845703125, -12.06597900390625, -2.83428955078125, 6.39739990234375, 15.62908935546875, 24.86077880859375, 34.09246826171875, 43.32415771484375, 52.55584716796875, 61.78753662109375, 71.01922607421875, 80.25091552734375, 89.48260498046875, 98.71429443359375, 107.94598388671875, 117.17767333984375, 126.40936279296875, 135.64105224609375, 144.87274169921875, 154.10443115234375, 163.33612060546875, 172.56781005859375, 181.79949951171875, 191.03118896484375, 200.26287841796875, 209.49456787109375, 218.72625732421875, 227.95794677734375, 237.18963623046875, 246.42132568359375, 255.65301513671875, 264.88470458984375, 274.11639404296875, 283.34808349609375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 13.0, 14.0, 13.0, 26.0, 37.0, 40.0, 39.0, 62.0, 55.0, 58.0, 70.0, 68.0, 80.0, 77.0, 64.0, 56.0, 50.0, 49.0, 39.0, 22.0, 28.0, 9.0, 10.0, 12.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-105.33206176757812, -102.91027069091797, -100.48847961425781, -98.06668090820312, -95.64488983154297, -93.22309875488281, -90.80130767822266, -88.3795166015625, -85.95771789550781, -83.53592681884766, -81.1141357421875, -78.69233703613281, -76.27054595947266, -73.8487548828125, -71.42696380615234, -69.00517272949219, -66.5833740234375, -64.16158294677734, -61.73978805541992, -59.317996978759766, -56.896202087402344, -54.47441101074219, -52.05261993408203, -49.63082504272461, -47.20903778076172, -44.78724670410156, -42.36545181274414, -39.943660736083984, -37.52186584472656, -35.100074768066406, -32.67828369140625, -30.256488800048828, -27.834693908691406, -25.412900924682617, -22.991107940673828, -20.569316864013672, -18.14752197265625, -15.725729942321777, -13.303937911987305, -10.882144927978516, -8.460351943969727, -6.0385589599609375, -3.6167664527893066, -1.1949739456176758, 1.2268190383911133, 3.6486120223999023, 6.070404052734375, 8.492197036743164, 10.913990020751953, 13.335783004760742, 15.757575988769531, 18.179367065429688, 20.60116195678711, 23.022953033447266, 25.444746017456055, 27.866539001464844, 30.288331985473633, 32.71012496948242, 35.13191604614258, 37.5537109375, 39.975502014160156, 42.39729690551758, 44.819087982177734, 47.240882873535156, 49.66267395019531]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 2.0, 4.0, 8.0, 7.0, 10.0, 21.0, 24.0, 36.0, 57.0, 106.0, 162.0, 328.0, 771.0, 1683.0, 4439.0, 14097.0, 53101.0, 254758.0, 550649.0, 125396.0, 29212.0, 8419.0, 2976.0, 1170.0, 521.0, 235.0, 120.0, 71.0, 46.0, 36.0, 26.0, 13.0, 13.0, 7.0, 6.0, 3.0, 6.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.4188232421875, -14.892333984375, -14.3658447265625, -13.83935546875, -13.3128662109375, -12.786376953125, -12.2598876953125, -11.7333984375, -11.2069091796875, -10.680419921875, -10.1539306640625, -9.62744140625, -9.1009521484375, -8.574462890625, -8.0479736328125, -7.521484375, -6.9949951171875, -6.468505859375, -5.9420166015625, -5.41552734375, -4.8890380859375, -4.362548828125, -3.8360595703125, -3.3095703125, -2.7830810546875, -2.256591796875, -1.7301025390625, -1.20361328125, -0.6771240234375, -0.150634765625, 0.3758544921875, 0.90234375, 1.4288330078125, 1.955322265625, 2.4818115234375, 3.00830078125, 3.5347900390625, 4.061279296875, 4.5877685546875, 5.1142578125, 5.6407470703125, 6.167236328125, 6.6937255859375, 7.22021484375, 7.7467041015625, 8.273193359375, 8.7996826171875, 9.326171875, 9.8526611328125, 10.379150390625, 10.9056396484375, 11.43212890625, 11.9586181640625, 12.485107421875, 13.0115966796875, 13.5380859375, 14.0645751953125, 14.591064453125, 15.1175537109375, 15.64404296875, 16.1705322265625, 16.697021484375, 17.2235107421875, 17.75]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 5.0, 5.0, 14.0, 13.0, 21.0, 10.0, 23.0, 25.0, 31.0, 34.0, 29.0, 36.0, 37.0, 41.0, 45.0, 50.0, 42.0, 57.0, 57.0, 55.0, 36.0, 40.0, 43.0, 53.0, 32.0, 37.0, 23.0, 20.0, 10.0, 15.0, 8.0, 14.0, 8.0, 4.0, 7.0, 0.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-5.2890625, -5.1422119140625, -4.995361328125, -4.8485107421875, -4.70166015625, -4.5548095703125, -4.407958984375, -4.2611083984375, -4.1142578125, -3.9674072265625, -3.820556640625, -3.6737060546875, -3.52685546875, -3.3800048828125, -3.233154296875, -3.0863037109375, -2.939453125, -2.7926025390625, -2.645751953125, -2.4989013671875, -2.35205078125, -2.2052001953125, -2.058349609375, -1.9114990234375, -1.7646484375, -1.6177978515625, -1.470947265625, -1.3240966796875, -1.17724609375, -1.0303955078125, -0.883544921875, -0.7366943359375, -0.58984375, -0.4429931640625, -0.296142578125, -0.1492919921875, -0.00244140625, 0.1444091796875, 0.291259765625, 0.4381103515625, 0.5849609375, 0.7318115234375, 0.878662109375, 1.0255126953125, 1.17236328125, 1.3192138671875, 1.466064453125, 1.6129150390625, 1.759765625, 1.9066162109375, 2.053466796875, 2.2003173828125, 2.34716796875, 2.4940185546875, 2.640869140625, 2.7877197265625, 2.9345703125, 3.0814208984375, 3.228271484375, 3.3751220703125, 3.52197265625, 3.6688232421875, 3.815673828125, 3.9625244140625, 4.109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 13.0, 13.0, 11.0, 27.0, 24.0, 56.0, 68.0, 141.0, 251.0, 456.0, 1013.0, 2874.0, 16097.0, 639129.0, 370442.0, 13393.0, 2568.0, 942.0, 422.0, 229.0, 120.0, 73.0, 48.0, 28.0, 20.0, 22.0, 17.0, 14.0, 7.0, 6.0, 1.0, 4.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.03125, -38.77880859375, -37.5263671875, -36.27392578125, -35.021484375, -33.76904296875, -32.5166015625, -31.26416015625, -30.01171875, -28.75927734375, -27.5068359375, -26.25439453125, -25.001953125, -23.74951171875, -22.4970703125, -21.24462890625, -19.9921875, -18.73974609375, -17.4873046875, -16.23486328125, -14.982421875, -13.72998046875, -12.4775390625, -11.22509765625, -9.97265625, -8.72021484375, -7.4677734375, -6.21533203125, -4.962890625, -3.71044921875, -2.4580078125, -1.20556640625, 0.046875, 1.29931640625, 2.5517578125, 3.80419921875, 5.056640625, 6.30908203125, 7.5615234375, 8.81396484375, 10.06640625, 11.31884765625, 12.5712890625, 13.82373046875, 15.076171875, 16.32861328125, 17.5810546875, 18.83349609375, 20.0859375, 21.33837890625, 22.5908203125, 23.84326171875, 25.095703125, 26.34814453125, 27.6005859375, 28.85302734375, 30.10546875, 31.35791015625, 32.6103515625, 33.86279296875, 35.115234375, 36.36767578125, 37.6201171875, 38.87255859375, 40.125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 4.0, 1.0, 9.0, 11.0, 16.0, 19.0, 22.0, 16.0, 22.0, 18.0, 30.0, 27.0, 39.0, 40.0, 39.0, 42.0, 55.0, 46.0, 52.0, 46.0, 47.0, 49.0, 36.0, 51.0, 33.0, 29.0, 26.0, 27.0, 16.0, 21.0, 19.0, 14.0, 12.0, 12.0, 11.0, 8.0, 4.0, 4.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.1875, -16.658203125, -16.12890625, -15.599609375, -15.0703125, -14.541015625, -14.01171875, -13.482421875, -12.953125, -12.423828125, -11.89453125, -11.365234375, -10.8359375, -10.306640625, -9.77734375, -9.248046875, -8.71875, -8.189453125, -7.66015625, -7.130859375, -6.6015625, -6.072265625, -5.54296875, -5.013671875, -4.484375, -3.955078125, -3.42578125, -2.896484375, -2.3671875, -1.837890625, -1.30859375, -0.779296875, -0.25, 0.279296875, 0.80859375, 1.337890625, 1.8671875, 2.396484375, 2.92578125, 3.455078125, 3.984375, 4.513671875, 5.04296875, 5.572265625, 6.1015625, 6.630859375, 7.16015625, 7.689453125, 8.21875, 8.748046875, 9.27734375, 9.806640625, 10.3359375, 10.865234375, 11.39453125, 11.923828125, 12.453125, 12.982421875, 13.51171875, 14.041015625, 14.5703125, 15.099609375, 15.62890625, 16.158203125, 16.6875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 22.0, 10.0, 11.0, 24.0, 29.0, 48.0, 67.0, 80.0, 140.0, 176.0, 286.0, 523.0, 1155.0, 3074.0, 11471.0, 79161.0, 812112.0, 118939.0, 14749.0, 3660.0, 1298.0, 586.0, 294.0, 188.0, 123.0, 81.0, 56.0, 31.0, 43.0, 23.0, 13.0, 11.0, 14.0, 13.0, 6.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-8.2109375, -7.98016357421875, -7.7493896484375, -7.51861572265625, -7.287841796875, -7.05706787109375, -6.8262939453125, -6.59552001953125, -6.36474609375, -6.13397216796875, -5.9031982421875, -5.67242431640625, -5.441650390625, -5.21087646484375, -4.9801025390625, -4.74932861328125, -4.5185546875, -4.28778076171875, -4.0570068359375, -3.82623291015625, -3.595458984375, -3.36468505859375, -3.1339111328125, -2.90313720703125, -2.67236328125, -2.44158935546875, -2.2108154296875, -1.98004150390625, -1.749267578125, -1.51849365234375, -1.2877197265625, -1.05694580078125, -0.826171875, -0.59539794921875, -0.3646240234375, -0.13385009765625, 0.096923828125, 0.32769775390625, 0.5584716796875, 0.78924560546875, 1.02001953125, 1.25079345703125, 1.4815673828125, 1.71234130859375, 1.943115234375, 2.17388916015625, 2.4046630859375, 2.63543701171875, 2.8662109375, 3.09698486328125, 3.3277587890625, 3.55853271484375, 3.789306640625, 4.02008056640625, 4.2508544921875, 4.48162841796875, 4.71240234375, 4.94317626953125, 5.1739501953125, 5.40472412109375, 5.635498046875, 5.86627197265625, 6.0970458984375, 6.32781982421875, 6.55859375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 7.0, 3.0, 8.0, 8.0, 15.0, 15.0, 14.0, 19.0, 31.0, 31.0, 56.0, 76.0, 104.0, 140.0, 140.0, 96.0, 70.0, 40.0, 15.0, 25.0, 18.0, 13.0, 10.0, 10.0, 5.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012922286987304688, -0.0012472718954086304, -0.001202315092086792, -0.0011573582887649536, -0.0011124014854431152, -0.0010674446821212769, -0.0010224878787994385, -0.0009775310754776, -0.0009325742721557617, -0.0008876174688339233, -0.000842660665512085, -0.0007977038621902466, -0.0007527470588684082, -0.0007077902555465698, -0.0006628334522247314, -0.0006178766489028931, -0.0005729198455810547, -0.0005279630422592163, -0.00048300623893737793, -0.00043804943561553955, -0.00039309263229370117, -0.0003481358289718628, -0.0003031790256500244, -0.00025822222232818604, -0.00021326541900634766, -0.00016830861568450928, -0.0001233518123626709, -7.839500904083252e-05, -3.343820571899414e-05, 1.1518597602844238e-05, 5.647540092468262e-05, 0.000101432204246521, 0.00014638900756835938, 0.00019134581089019775, 0.00023630261421203613, 0.0002812594175338745, 0.0003262162208557129, 0.00037117302417755127, 0.00041612982749938965, 0.00046108663082122803, 0.0005060434341430664, 0.0005510002374649048, 0.0005959570407867432, 0.0006409138441085815, 0.0006858706474304199, 0.0007308274507522583, 0.0007757842540740967, 0.0008207410573959351, 0.0008656978607177734, 0.0009106546640396118, 0.0009556114673614502, 0.0010005682706832886, 0.001045525074005127, 0.0010904818773269653, 0.0011354386806488037, 0.001180395483970642, 0.0012253522872924805, 0.0012703090906143188, 0.0013152658939361572, 0.0013602226972579956, 0.001405179500579834, 0.0014501363039016724, 0.0014950931072235107, 0.0015400499105453491, 0.0015850067138671875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 6.0, 4.0, 4.0, 8.0, 3.0, 2.0, 7.0, 17.0, 21.0, 27.0, 35.0, 48.0, 67.0, 106.0, 183.0, 272.0, 440.0, 863.0, 1754.0, 4283.0, 13872.0, 88268.0, 768827.0, 141379.0, 18408.0, 5227.0, 2069.0, 985.0, 500.0, 315.0, 183.0, 110.0, 77.0, 64.0, 40.0, 22.0, 17.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.17950439453125, -4.9918212890625, -4.80413818359375, -4.616455078125, -4.42877197265625, -4.2410888671875, -4.05340576171875, -3.86572265625, -3.67803955078125, -3.4903564453125, -3.30267333984375, -3.114990234375, -2.92730712890625, -2.7396240234375, -2.55194091796875, -2.3642578125, -2.17657470703125, -1.9888916015625, -1.80120849609375, -1.613525390625, -1.42584228515625, -1.2381591796875, -1.05047607421875, -0.86279296875, -0.67510986328125, -0.4874267578125, -0.29974365234375, -0.112060546875, 0.07562255859375, 0.2633056640625, 0.45098876953125, 0.638671875, 0.82635498046875, 1.0140380859375, 1.20172119140625, 1.389404296875, 1.57708740234375, 1.7647705078125, 1.95245361328125, 2.14013671875, 2.32781982421875, 2.5155029296875, 2.70318603515625, 2.890869140625, 3.07855224609375, 3.2662353515625, 3.45391845703125, 3.6416015625, 3.82928466796875, 4.0169677734375, 4.20465087890625, 4.392333984375, 4.58001708984375, 4.7677001953125, 4.95538330078125, 5.14306640625, 5.33074951171875, 5.5184326171875, 5.70611572265625, 5.893798828125, 6.08148193359375, 6.2691650390625, 6.45684814453125, 6.64453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 14.0, 5.0, 27.0, 28.0, 25.0, 33.0, 50.0, 79.0, 108.0, 112.0, 94.0, 102.0, 75.0, 62.0, 34.0, 35.0, 24.0, 19.0, 12.0, 11.0, 8.0, 8.0, 5.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4296875, -6.25689697265625, -6.0841064453125, -5.91131591796875, -5.738525390625, -5.56573486328125, -5.3929443359375, -5.22015380859375, -5.04736328125, -4.87457275390625, -4.7017822265625, -4.52899169921875, -4.356201171875, -4.18341064453125, -4.0106201171875, -3.83782958984375, -3.6650390625, -3.49224853515625, -3.3194580078125, -3.14666748046875, -2.973876953125, -2.80108642578125, -2.6282958984375, -2.45550537109375, -2.28271484375, -2.10992431640625, -1.9371337890625, -1.76434326171875, -1.591552734375, -1.41876220703125, -1.2459716796875, -1.07318115234375, -0.900390625, -0.72760009765625, -0.5548095703125, -0.38201904296875, -0.209228515625, -0.03643798828125, 0.1363525390625, 0.30914306640625, 0.48193359375, 0.65472412109375, 0.8275146484375, 1.00030517578125, 1.173095703125, 1.34588623046875, 1.5186767578125, 1.69146728515625, 1.8642578125, 2.03704833984375, 2.2098388671875, 2.38262939453125, 2.555419921875, 2.72821044921875, 2.9010009765625, 3.07379150390625, 3.24658203125, 3.41937255859375, 3.5921630859375, 3.76495361328125, 3.937744140625, 4.11053466796875, 4.2833251953125, 4.45611572265625, 4.62890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 12.0, 45.0, 129.0, 360.0, 287.0, 101.0, 38.0, 10.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-319.18878173828125, -311.5707702636719, -303.9527587890625, -296.3347473144531, -288.71673583984375, -281.0987243652344, -273.480712890625, -265.86273193359375, -258.2447204589844, -250.626708984375, -243.00869750976562, -235.39068603515625, -227.77268981933594, -220.15467834472656, -212.5366668701172, -204.9186553955078, -197.30062866210938, -189.6826171875, -182.06460571289062, -174.44659423828125, -166.82859802246094, -159.21058654785156, -151.5925750732422, -143.9745635986328, -136.3565673828125, -128.73855590820312, -121.12055206298828, -113.5025405883789, -105.88452911376953, -98.26652526855469, -90.64851379394531, -83.03050231933594, -75.41249084472656, -67.79447937011719, -60.17647171020508, -52.55846405029297, -44.940452575683594, -37.322444915771484, -29.704437255859375, -22.08642578125, -14.46841812133789, -6.850409030914307, 0.7676000595092773, 8.385608673095703, 16.003618240356445, 23.621627807617188, 31.239635467529297, 38.85764694213867, 46.47565460205078, 54.09366226196289, 61.711673736572266, 69.32968139648438, 76.94769287109375, 84.56570434570312, 92.18370819091797, 99.80171966552734, 107.41972351074219, 115.03773498535156, 122.6557388305664, 130.27374267578125, 137.89175415039062, 145.509765625, 153.12777709960938, 160.74578857421875, 168.36380004882812]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 2.0, 10.0, 12.0, 19.0, 18.0, 21.0, 30.0, 26.0, 37.0, 29.0, 36.0, 40.0, 50.0, 49.0, 56.0, 89.0, 73.0, 58.0, 44.0, 50.0, 30.0, 25.0, 27.0, 27.0, 21.0, 14.0, 16.0, 19.0, 9.0, 11.0, 7.0, 11.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.75736999511719, -58.3917350769043, -56.026100158691406, -53.66046905517578, -51.29483413696289, -48.92919921875, -46.563568115234375, -44.197933197021484, -41.832298278808594, -39.4666633605957, -37.10102844238281, -34.73539733886719, -32.3697624206543, -30.004127502441406, -27.63849449157715, -25.27286148071289, -22.9072265625, -20.54159164428711, -18.17595863342285, -15.810324668884277, -13.444690704345703, -11.079056739807129, -8.713422775268555, -6.347789764404297, -3.9821548461914062, -1.616520881652832, 0.7491130828857422, 3.1147470474243164, 5.480381011962891, 7.846014976501465, 10.211648941040039, 12.577281951904297, 14.942916870117188, 17.308551788330078, 19.674184799194336, 22.039817810058594, 24.405452728271484, 26.771087646484375, 29.136720657348633, 31.50235366821289, 33.86798858642578, 36.23362350463867, 38.59925842285156, 40.96488952636719, 43.33052444458008, 45.69615936279297, 48.061790466308594, 50.427425384521484, 52.793060302734375, 55.158695220947266, 57.524330139160156, 59.88996124267578, 62.25559616088867, 64.62123107910156, 66.98686218261719, 69.35249328613281, 71.71813201904297, 74.0837631225586, 76.44940185546875, 78.81503295898438, 81.1806640625, 83.54630279541016, 85.91193389892578, 88.27757263183594, 90.64320373535156]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 15.0, 15.0, 26.0, 50.0, 99.0, 229.0, 624.0, 2703.0, 21372.0, 2990472.0, 1161992.0, 13782.0, 1984.0, 523.0, 182.0, 93.0, 48.0, 35.0, 9.0, 14.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.29248046875, -16.5380859375, -15.78369140625, -15.029296875, -14.27490234375, -13.5205078125, -12.76611328125, -12.01171875, -11.25732421875, -10.5029296875, -9.74853515625, -8.994140625, -8.23974609375, -7.4853515625, -6.73095703125, -5.9765625, -5.22216796875, -4.4677734375, -3.71337890625, -2.958984375, -2.20458984375, -1.4501953125, -0.69580078125, 0.05859375, 0.81298828125, 1.5673828125, 2.32177734375, 3.076171875, 3.83056640625, 4.5849609375, 5.33935546875, 6.09375, 6.84814453125, 7.6025390625, 8.35693359375, 9.111328125, 9.86572265625, 10.6201171875, 11.37451171875, 12.12890625, 12.88330078125, 13.6376953125, 14.39208984375, 15.146484375, 15.90087890625, 16.6552734375, 17.40966796875, 18.1640625, 18.91845703125, 19.6728515625, 20.42724609375, 21.181640625, 21.93603515625, 22.6904296875, 23.44482421875, 24.19921875, 24.95361328125, 25.7080078125, 26.46240234375, 27.216796875, 27.97119140625, 28.7255859375, 29.47998046875, 30.234375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 10.0, 8.0, 8.0, 15.0, 18.0, 29.0, 27.0, 25.0, 27.0, 39.0, 35.0, 41.0, 44.0, 53.0, 55.0, 68.0, 70.0, 62.0, 48.0, 50.0, 40.0, 41.0, 42.0, 25.0, 31.0, 20.0, 14.0, 13.0, 8.0, 9.0, 7.0, 9.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.38067626953125, -4.2222900390625, -4.06390380859375, -3.905517578125, -3.74713134765625, -3.5887451171875, -3.43035888671875, -3.27197265625, -3.11358642578125, -2.9552001953125, -2.79681396484375, -2.638427734375, -2.48004150390625, -2.3216552734375, -2.16326904296875, -2.0048828125, -1.84649658203125, -1.6881103515625, -1.52972412109375, -1.371337890625, -1.21295166015625, -1.0545654296875, -0.89617919921875, -0.73779296875, -0.57940673828125, -0.4210205078125, -0.26263427734375, -0.104248046875, 0.05413818359375, 0.2125244140625, 0.37091064453125, 0.529296875, 0.68768310546875, 0.8460693359375, 1.00445556640625, 1.162841796875, 1.32122802734375, 1.4796142578125, 1.63800048828125, 1.79638671875, 1.95477294921875, 2.1131591796875, 2.27154541015625, 2.429931640625, 2.58831787109375, 2.7467041015625, 2.90509033203125, 3.0634765625, 3.22186279296875, 3.3802490234375, 3.53863525390625, 3.697021484375, 3.85540771484375, 4.0137939453125, 4.17218017578125, 4.33056640625, 4.48895263671875, 4.6473388671875, 4.80572509765625, 4.964111328125, 5.12249755859375, 5.2808837890625, 5.43927001953125, 5.59765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 5.0, 5.0, 10.0, 31.0, 38.0, 76.0, 129.0, 351.0, 880.0, 2810.0, 12946.0, 201809.0, 3885976.0, 75863.0, 9307.0, 2516.0, 816.0, 364.0, 162.0, 82.0, 44.0, 22.0, 6.0, 12.0, 2.0, 7.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.753173828125, -17.05322265625, -16.353271484375, -15.6533203125, -14.953369140625, -14.25341796875, -13.553466796875, -12.853515625, -12.153564453125, -11.45361328125, -10.753662109375, -10.0537109375, -9.353759765625, -8.65380859375, -7.953857421875, -7.25390625, -6.553955078125, -5.85400390625, -5.154052734375, -4.4541015625, -3.754150390625, -3.05419921875, -2.354248046875, -1.654296875, -0.954345703125, -0.25439453125, 0.445556640625, 1.1455078125, 1.845458984375, 2.54541015625, 3.245361328125, 3.9453125, 4.645263671875, 5.34521484375, 6.045166015625, 6.7451171875, 7.445068359375, 8.14501953125, 8.844970703125, 9.544921875, 10.244873046875, 10.94482421875, 11.644775390625, 12.3447265625, 13.044677734375, 13.74462890625, 14.444580078125, 15.14453125, 15.844482421875, 16.54443359375, 17.244384765625, 17.9443359375, 18.644287109375, 19.34423828125, 20.044189453125, 20.744140625, 21.444091796875, 22.14404296875, 22.843994140625, 23.5439453125, 24.243896484375, 24.94384765625, 25.643798828125, 26.34375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 9.0, 27.0, 39.0, 64.0, 112.0, 243.0, 634.0, 1455.0, 846.0, 309.0, 132.0, 55.0, 49.0, 19.0, 13.0, 10.0, 10.0, 9.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.96875, -18.36865234375, -17.7685546875, -17.16845703125, -16.568359375, -15.96826171875, -15.3681640625, -14.76806640625, -14.16796875, -13.56787109375, -12.9677734375, -12.36767578125, -11.767578125, -11.16748046875, -10.5673828125, -9.96728515625, -9.3671875, -8.76708984375, -8.1669921875, -7.56689453125, -6.966796875, -6.36669921875, -5.7666015625, -5.16650390625, -4.56640625, -3.96630859375, -3.3662109375, -2.76611328125, -2.166015625, -1.56591796875, -0.9658203125, -0.36572265625, 0.234375, 0.83447265625, 1.4345703125, 2.03466796875, 2.634765625, 3.23486328125, 3.8349609375, 4.43505859375, 5.03515625, 5.63525390625, 6.2353515625, 6.83544921875, 7.435546875, 8.03564453125, 8.6357421875, 9.23583984375, 9.8359375, 10.43603515625, 11.0361328125, 11.63623046875, 12.236328125, 12.83642578125, 13.4365234375, 14.03662109375, 14.63671875, 15.23681640625, 15.8369140625, 16.43701171875, 17.037109375, 17.63720703125, 18.2373046875, 18.83740234375, 19.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 12.0, 70.0, 411.0, 397.0, 54.0, 30.0, 9.0, 3.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-325.65704345703125, -315.499267578125, -305.34149169921875, -295.1836853027344, -285.0259094238281, -274.8681335449219, -264.7103271484375, -254.55255126953125, -244.394775390625, -234.23699951171875, -224.07920837402344, -213.92141723632812, -203.76364135742188, -193.60586547851562, -183.4480743408203, -173.290283203125, -163.13250732421875, -152.9747314453125, -142.8169403076172, -132.65914916992188, -122.50137329101562, -112.34358978271484, -102.18580627441406, -92.02802276611328, -81.8702392578125, -71.71245574951172, -61.55467224121094, -51.396888732910156, -41.239105224609375, -31.081321716308594, -20.923538208007812, -10.765754699707031, -0.608001708984375, 9.549781799316406, 19.707565307617188, 29.86534881591797, 40.02313232421875, 50.18091583251953, 60.33869934082031, 70.4964828491211, 80.65426635742188, 90.81204986572266, 100.96983337402344, 111.12761688232422, 121.285400390625, 131.44317626953125, 141.60096740722656, 151.75875854492188, 161.91653442382812, 172.07431030273438, 182.2321014404297, 192.389892578125, 202.54766845703125, 212.7054443359375, 222.8632354736328, 233.02102661132812, 243.17880249023438, 253.33657836914062, 263.494384765625, 273.65216064453125, 283.8099365234375, 293.96771240234375, 304.12548828125, 314.2832946777344, 324.4410705566406]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 9.0, 15.0, 20.0, 20.0, 32.0, 59.0, 62.0, 78.0, 86.0, 111.0, 113.0, 108.0, 97.0, 55.0, 46.0, 32.0, 23.0, 19.0, 10.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-160.99249267578125, -157.40968322753906, -153.82688903808594, -150.24407958984375, -146.66127014160156, -143.07847595214844, -139.49566650390625, -135.91287231445312, -132.33006286621094, -128.74725341796875, -125.1644515991211, -121.58164978027344, -117.99884796142578, -114.41604614257812, -110.83323669433594, -107.25043487548828, -103.66763305664062, -100.08483123779297, -96.50202178955078, -92.91921997070312, -89.33641815185547, -85.75361633300781, -82.17080688476562, -78.58800506591797, -75.00519561767578, -71.42239379882812, -67.83958435058594, -64.25678253173828, -60.673980712890625, -57.0911750793457, -53.50836944580078, -49.925567626953125, -46.34276580810547, -42.75996017456055, -39.17715835571289, -35.59435272216797, -32.01155090332031, -28.42874526977539, -24.8459415435791, -21.263137817382812, -17.680334091186523, -14.097530364990234, -10.514726638793945, -6.93192195892334, -3.349118232727051, 0.2336864471435547, 3.8164901733398438, 7.399293899536133, 10.982097625732422, 14.564901351928711, 18.147705078125, 21.730510711669922, 25.313312530517578, 28.8961181640625, 32.478919982910156, 36.06172561645508, 39.64453125, 43.22733688354492, 46.81013870239258, 50.3929443359375, 53.975746154785156, 57.55855178833008, 61.141357421875, 64.72415924072266, 68.30696105957031]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 12.0, 6.0, 12.0, 26.0, 32.0, 40.0, 53.0, 101.0, 222.0, 363.0, 682.0, 1467.0, 3389.0, 8772.0, 25536.0, 84058.0, 297797.0, 420862.0, 142378.0, 40413.0, 13283.0, 5017.0, 2025.0, 899.0, 464.0, 228.0, 155.0, 85.0, 46.0, 29.0, 27.0, 15.0, 14.0, 10.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.3046875, -10.011962890625, -9.71923828125, -9.426513671875, -9.1337890625, -8.841064453125, -8.54833984375, -8.255615234375, -7.962890625, -7.670166015625, -7.37744140625, -7.084716796875, -6.7919921875, -6.499267578125, -6.20654296875, -5.913818359375, -5.62109375, -5.328369140625, -5.03564453125, -4.742919921875, -4.4501953125, -4.157470703125, -3.86474609375, -3.572021484375, -3.279296875, -2.986572265625, -2.69384765625, -2.401123046875, -2.1083984375, -1.815673828125, -1.52294921875, -1.230224609375, -0.9375, -0.644775390625, -0.35205078125, -0.059326171875, 0.2333984375, 0.526123046875, 0.81884765625, 1.111572265625, 1.404296875, 1.697021484375, 1.98974609375, 2.282470703125, 2.5751953125, 2.867919921875, 3.16064453125, 3.453369140625, 3.74609375, 4.038818359375, 4.33154296875, 4.624267578125, 4.9169921875, 5.209716796875, 5.50244140625, 5.795166015625, 6.087890625, 6.380615234375, 6.67333984375, 6.966064453125, 7.2587890625, 7.551513671875, 7.84423828125, 8.136962890625, 8.4296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 10.0, 21.0, 18.0, 28.0, 31.0, 48.0, 44.0, 43.0, 79.0, 75.0, 86.0, 82.0, 68.0, 74.0, 65.0, 56.0, 43.0, 32.0, 26.0, 20.0, 13.0, 10.0, 10.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.1102294921875, -8.876708984375, -8.6431884765625, -8.40966796875, -8.1761474609375, -7.942626953125, -7.7091064453125, -7.4755859375, -7.2420654296875, -7.008544921875, -6.7750244140625, -6.54150390625, -6.3079833984375, -6.074462890625, -5.8409423828125, -5.607421875, -5.3739013671875, -5.140380859375, -4.9068603515625, -4.67333984375, -4.4398193359375, -4.206298828125, -3.9727783203125, -3.7392578125, -3.5057373046875, -3.272216796875, -3.0386962890625, -2.80517578125, -2.5716552734375, -2.338134765625, -2.1046142578125, -1.87109375, -1.6375732421875, -1.404052734375, -1.1705322265625, -0.93701171875, -0.7034912109375, -0.469970703125, -0.2364501953125, -0.0029296875, 0.2305908203125, 0.464111328125, 0.6976318359375, 0.93115234375, 1.1646728515625, 1.398193359375, 1.6317138671875, 1.865234375, 2.0987548828125, 2.332275390625, 2.5657958984375, 2.79931640625, 3.0328369140625, 3.266357421875, 3.4998779296875, 3.7333984375, 3.9669189453125, 4.200439453125, 4.4339599609375, 4.66748046875, 4.9010009765625, 5.134521484375, 5.3680419921875, 5.6015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 4.0, 5.0, 1.0, 6.0, 12.0, 10.0, 14.0, 21.0, 31.0, 43.0, 62.0, 107.0, 159.0, 247.0, 495.0, 1034.0, 2591.0, 7056.0, 23833.0, 107951.0, 626063.0, 218672.0, 41906.0, 11233.0, 3902.0, 1478.0, 641.0, 384.0, 207.0, 142.0, 77.0, 51.0, 32.0, 13.0, 15.0, 11.0, 15.0, 10.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.75, -12.3717041015625, -11.993408203125, -11.6151123046875, -11.23681640625, -10.8585205078125, -10.480224609375, -10.1019287109375, -9.7236328125, -9.3453369140625, -8.967041015625, -8.5887451171875, -8.21044921875, -7.8321533203125, -7.453857421875, -7.0755615234375, -6.697265625, -6.3189697265625, -5.940673828125, -5.5623779296875, -5.18408203125, -4.8057861328125, -4.427490234375, -4.0491943359375, -3.6708984375, -3.2926025390625, -2.914306640625, -2.5360107421875, -2.15771484375, -1.7794189453125, -1.401123046875, -1.0228271484375, -0.64453125, -0.2662353515625, 0.112060546875, 0.4903564453125, 0.86865234375, 1.2469482421875, 1.625244140625, 2.0035400390625, 2.3818359375, 2.7601318359375, 3.138427734375, 3.5167236328125, 3.89501953125, 4.2733154296875, 4.651611328125, 5.0299072265625, 5.408203125, 5.7864990234375, 6.164794921875, 6.5430908203125, 6.92138671875, 7.2996826171875, 7.677978515625, 8.0562744140625, 8.4345703125, 8.8128662109375, 9.191162109375, 9.5694580078125, 9.94775390625, 10.3260498046875, 10.704345703125, 11.0826416015625, 11.4609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 8.0, 2.0, 5.0, 7.0, 9.0, 7.0, 12.0, 16.0, 14.0, 22.0, 41.0, 38.0, 58.0, 49.0, 59.0, 69.0, 66.0, 55.0, 61.0, 65.0, 48.0, 59.0, 46.0, 29.0, 36.0, 23.0, 19.0, 21.0, 22.0, 10.0, 5.0, 7.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-25.734375, -25.0634765625, -24.392578125, -23.7216796875, -23.05078125, -22.3798828125, -21.708984375, -21.0380859375, -20.3671875, -19.6962890625, -19.025390625, -18.3544921875, -17.68359375, -17.0126953125, -16.341796875, -15.6708984375, -15.0, -14.3291015625, -13.658203125, -12.9873046875, -12.31640625, -11.6455078125, -10.974609375, -10.3037109375, -9.6328125, -8.9619140625, -8.291015625, -7.6201171875, -6.94921875, -6.2783203125, -5.607421875, -4.9365234375, -4.265625, -3.5947265625, -2.923828125, -2.2529296875, -1.58203125, -0.9111328125, -0.240234375, 0.4306640625, 1.1015625, 1.7724609375, 2.443359375, 3.1142578125, 3.78515625, 4.4560546875, 5.126953125, 5.7978515625, 6.46875, 7.1396484375, 7.810546875, 8.4814453125, 9.15234375, 9.8232421875, 10.494140625, 11.1650390625, 11.8359375, 12.5068359375, 13.177734375, 13.8486328125, 14.51953125, 15.1904296875, 15.861328125, 16.5322265625, 17.203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 5.0, 10.0, 16.0, 21.0, 36.0, 36.0, 65.0, 122.0, 251.0, 555.0, 1319.0, 4339.0, 20084.0, 146091.0, 737438.0, 115207.0, 16885.0, 3825.0, 1190.0, 501.0, 236.0, 112.0, 64.0, 45.0, 25.0, 22.0, 20.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.643890380859375, -3.52801513671875, -3.412139892578125, -3.2962646484375, -3.180389404296875, -3.06451416015625, -2.948638916015625, -2.832763671875, -2.716888427734375, -2.60101318359375, -2.485137939453125, -2.3692626953125, -2.253387451171875, -2.13751220703125, -2.021636962890625, -1.90576171875, -1.789886474609375, -1.67401123046875, -1.558135986328125, -1.4422607421875, -1.326385498046875, -1.21051025390625, -1.094635009765625, -0.978759765625, -0.862884521484375, -0.74700927734375, -0.631134033203125, -0.5152587890625, -0.399383544921875, -0.28350830078125, -0.167633056640625, -0.0517578125, 0.064117431640625, 0.17999267578125, 0.295867919921875, 0.4117431640625, 0.527618408203125, 0.64349365234375, 0.759368896484375, 0.875244140625, 0.991119384765625, 1.10699462890625, 1.222869873046875, 1.3387451171875, 1.454620361328125, 1.57049560546875, 1.686370849609375, 1.80224609375, 1.918121337890625, 2.03399658203125, 2.149871826171875, 2.2657470703125, 2.381622314453125, 2.49749755859375, 2.613372802734375, 2.729248046875, 2.845123291015625, 2.96099853515625, 3.076873779296875, 3.1927490234375, 3.308624267578125, 3.42449951171875, 3.540374755859375, 3.65625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 7.0, 15.0, 7.0, 10.0, 29.0, 44.0, 76.0, 125.0, 120.0, 155.0, 129.0, 90.0, 57.0, 48.0, 28.0, 21.0, 13.0, 8.0, 2.0, 7.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000820159912109375, -0.0007879436016082764, -0.0007557272911071777, -0.0007235109806060791, -0.0006912946701049805, -0.0006590783596038818, -0.0006268620491027832, -0.0005946457386016846, -0.0005624294281005859, -0.0005302131175994873, -0.0004979968070983887, -0.00046578049659729004, -0.0004335641860961914, -0.0004013478755950928, -0.00036913156509399414, -0.0003369152545928955, -0.0003046989440917969, -0.00027248263359069824, -0.0002402663230895996, -0.00020805001258850098, -0.00017583370208740234, -0.0001436173915863037, -0.00011140108108520508, -7.918477058410645e-05, -4.696846008300781e-05, -1.475214958190918e-05, 1.7464160919189453e-05, 4.9680471420288086e-05, 8.189678192138672e-05, 0.00011411309242248535, 0.00014632940292358398, 0.00017854571342468262, 0.00021076202392578125, 0.00024297833442687988, 0.0002751946449279785, 0.00030741095542907715, 0.0003396272659301758, 0.0003718435764312744, 0.00040405988693237305, 0.0004362761974334717, 0.0004684925079345703, 0.0005007088184356689, 0.0005329251289367676, 0.0005651414394378662, 0.0005973577499389648, 0.0006295740604400635, 0.0006617903709411621, 0.0006940066814422607, 0.0007262229919433594, 0.000758439302444458, 0.0007906556129455566, 0.0008228719234466553, 0.0008550882339477539, 0.0008873045444488525, 0.0009195208549499512, 0.0009517371654510498, 0.0009839534759521484, 0.001016169786453247, 0.0010483860969543457, 0.0010806024074554443, 0.001112818717956543, 0.0011450350284576416, 0.0011772513389587402, 0.0012094676494598389, 0.0012416839599609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 9.0, 15.0, 18.0, 38.0, 49.0, 92.0, 140.0, 293.0, 850.0, 2711.0, 11483.0, 84445.0, 754784.0, 168783.0, 18984.0, 3900.0, 1159.0, 394.0, 175.0, 74.0, 66.0, 26.0, 22.0, 16.0, 11.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.11712646484375, -1.9725341796875, -1.82794189453125, -1.683349609375, -1.53875732421875, -1.3941650390625, -1.24957275390625, -1.10498046875, -0.96038818359375, -0.8157958984375, -0.67120361328125, -0.526611328125, -0.38201904296875, -0.2374267578125, -0.09283447265625, 0.0517578125, 0.19635009765625, 0.3409423828125, 0.48553466796875, 0.630126953125, 0.77471923828125, 0.9193115234375, 1.06390380859375, 1.20849609375, 1.35308837890625, 1.4976806640625, 1.64227294921875, 1.786865234375, 1.93145751953125, 2.0760498046875, 2.22064208984375, 2.365234375, 2.50982666015625, 2.6544189453125, 2.79901123046875, 2.943603515625, 3.08819580078125, 3.2327880859375, 3.37738037109375, 3.52197265625, 3.66656494140625, 3.8111572265625, 3.95574951171875, 4.100341796875, 4.24493408203125, 4.3895263671875, 4.53411865234375, 4.6787109375, 4.82330322265625, 4.9678955078125, 5.11248779296875, 5.257080078125, 5.40167236328125, 5.5462646484375, 5.69085693359375, 5.83544921875, 5.98004150390625, 6.1246337890625, 6.26922607421875, 6.413818359375, 6.55841064453125, 6.7030029296875, 6.84759521484375, 6.9921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 5.0, 8.0, 13.0, 25.0, 25.0, 34.0, 32.0, 48.0, 51.0, 62.0, 81.0, 71.0, 92.0, 87.0, 70.0, 68.0, 38.0, 30.0, 34.0, 30.0, 11.0, 26.0, 16.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.193359375, -3.09478759765625, -2.9962158203125, -2.89764404296875, -2.799072265625, -2.70050048828125, -2.6019287109375, -2.50335693359375, -2.40478515625, -2.30621337890625, -2.2076416015625, -2.10906982421875, -2.010498046875, -1.91192626953125, -1.8133544921875, -1.71478271484375, -1.6162109375, -1.51763916015625, -1.4190673828125, -1.32049560546875, -1.221923828125, -1.12335205078125, -1.0247802734375, -0.92620849609375, -0.82763671875, -0.72906494140625, -0.6304931640625, -0.53192138671875, -0.433349609375, -0.33477783203125, -0.2362060546875, -0.13763427734375, -0.0390625, 0.05950927734375, 0.1580810546875, 0.25665283203125, 0.355224609375, 0.45379638671875, 0.5523681640625, 0.65093994140625, 0.74951171875, 0.84808349609375, 0.9466552734375, 1.04522705078125, 1.143798828125, 1.24237060546875, 1.3409423828125, 1.43951416015625, 1.5380859375, 1.63665771484375, 1.7352294921875, 1.83380126953125, 1.932373046875, 2.03094482421875, 2.1295166015625, 2.22808837890625, 2.32666015625, 2.42523193359375, 2.5238037109375, 2.62237548828125, 2.720947265625, 2.81951904296875, 2.9180908203125, 3.01666259765625, 3.115234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 5.0, 8.0, 12.0, 21.0, 36.0, 69.0, 98.0, 185.0, 215.0, 130.0, 99.0, 40.0, 28.0, 18.0, 15.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.0500259399414, -80.3927993774414, -77.73558044433594, -75.07835388183594, -72.42112731933594, -69.76390075683594, -67.10667419433594, -64.44945526123047, -61.79222869873047, -59.13500213623047, -56.477779388427734, -53.820556640625, -51.163330078125, -48.506103515625, -45.848880767822266, -43.19165802001953, -40.53443145751953, -37.87720489501953, -35.2199821472168, -32.56275939941406, -29.905532836914062, -27.248308181762695, -24.591083526611328, -21.93385887145996, -19.276634216308594, -16.619409561157227, -13.96218490600586, -11.304960250854492, -8.647735595703125, -5.990510940551758, -3.3332862854003906, -0.6760616302490234, 1.981170654296875, 4.638395309448242, 7.295619964599609, 9.952844619750977, 12.610069274902344, 15.267293930053711, 17.924518585205078, 20.581743240356445, 23.238967895507812, 25.89619255065918, 28.553417205810547, 31.210641860961914, 33.86786651611328, 36.52509307861328, 39.182315826416016, 41.83953857421875, 44.49676513671875, 47.15399169921875, 49.811214447021484, 52.46843719482422, 55.12566375732422, 57.78289031982422, 60.44011306762695, 63.09733581542969, 65.75456237792969, 68.41178894042969, 71.06901550292969, 73.72623443603516, 76.38346099853516, 79.04068756103516, 81.69790649414062, 84.35513305664062, 87.01235961914062]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 9.0, 11.0, 10.0, 6.0, 14.0, 16.0, 23.0, 19.0, 22.0, 18.0, 30.0, 33.0, 30.0, 29.0, 45.0, 59.0, 66.0, 93.0, 74.0, 66.0, 33.0, 28.0, 23.0, 38.0, 41.0, 20.0, 18.0, 24.0, 19.0, 21.0, 8.0, 9.0, 5.0, 9.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-74.3485336303711, -72.12584686279297, -69.90316009521484, -67.68047332763672, -65.45779418945312, -63.235103607177734, -61.012420654296875, -58.78973388671875, -56.567047119140625, -54.3443603515625, -52.121673583984375, -49.898990631103516, -47.67630386352539, -45.453617095947266, -43.230934143066406, -41.00824737548828, -38.785560607910156, -36.56287384033203, -34.340187072753906, -32.11750411987305, -29.894817352294922, -27.672130584716797, -25.449445724487305, -23.226760864257812, -21.004074096679688, -18.781387329101562, -16.55870246887207, -14.336016654968262, -12.113330841064453, -9.890645027160645, -7.667959213256836, -5.445273399353027, -3.2225875854492188, -0.9999017715454102, 1.2227840423583984, 3.445469856262207, 5.668155670166016, 7.890841484069824, 10.113527297973633, 12.336213111877441, 14.55889892578125, 16.781585693359375, 19.004270553588867, 21.22695541381836, 23.449642181396484, 25.67232894897461, 27.8950138092041, 30.117698669433594, 32.34038543701172, 34.563072204589844, 36.78575897216797, 39.00844192504883, 41.23112869262695, 43.45381546020508, 45.67649841308594, 47.89918518066406, 50.12187194824219, 52.34455871582031, 54.56724548339844, 56.7899284362793, 59.01261520385742, 61.23530197143555, 63.457984924316406, 65.68067169189453, 67.90335845947266]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 10.0, 3.0, 11.0, 19.0, 14.0, 26.0, 57.0, 84.0, 105.0, 189.0, 289.0, 565.0, 1071.0, 2236.0, 5206.0, 15274.0, 63189.0, 478343.0, 2664506.0, 830484.0, 99318.0, 20962.0, 6883.0, 2721.0, 1283.0, 620.0, 322.0, 168.0, 126.0, 57.0, 49.0, 32.0, 13.0, 18.0, 8.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8359375, -4.6395263671875, -4.443115234375, -4.2467041015625, -4.05029296875, -3.8538818359375, -3.657470703125, -3.4610595703125, -3.2646484375, -3.0682373046875, -2.871826171875, -2.6754150390625, -2.47900390625, -2.2825927734375, -2.086181640625, -1.8897705078125, -1.693359375, -1.4969482421875, -1.300537109375, -1.1041259765625, -0.90771484375, -0.7113037109375, -0.514892578125, -0.3184814453125, -0.1220703125, 0.0743408203125, 0.270751953125, 0.4671630859375, 0.66357421875, 0.8599853515625, 1.056396484375, 1.2528076171875, 1.44921875, 1.6456298828125, 1.842041015625, 2.0384521484375, 2.23486328125, 2.4312744140625, 2.627685546875, 2.8240966796875, 3.0205078125, 3.2169189453125, 3.413330078125, 3.6097412109375, 3.80615234375, 4.0025634765625, 4.198974609375, 4.3953857421875, 4.591796875, 4.7882080078125, 4.984619140625, 5.1810302734375, 5.37744140625, 5.5738525390625, 5.770263671875, 5.9666748046875, 6.1630859375, 6.3594970703125, 6.555908203125, 6.7523193359375, 6.94873046875, 7.1451416015625, 7.341552734375, 7.5379638671875, 7.734375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 5.0, 9.0, 13.0, 10.0, 21.0, 21.0, 30.0, 33.0, 28.0, 33.0, 39.0, 34.0, 46.0, 55.0, 66.0, 46.0, 52.0, 66.0, 49.0, 44.0, 43.0, 41.0, 36.0, 25.0, 36.0, 19.0, 30.0, 14.0, 16.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.79296875, -5.6356201171875, -5.478271484375, -5.3209228515625, -5.16357421875, -5.0062255859375, -4.848876953125, -4.6915283203125, -4.5341796875, -4.3768310546875, -4.219482421875, -4.0621337890625, -3.90478515625, -3.7474365234375, -3.590087890625, -3.4327392578125, -3.275390625, -3.1180419921875, -2.960693359375, -2.8033447265625, -2.64599609375, -2.4886474609375, -2.331298828125, -2.1739501953125, -2.0166015625, -1.8592529296875, -1.701904296875, -1.5445556640625, -1.38720703125, -1.2298583984375, -1.072509765625, -0.9151611328125, -0.7578125, -0.6004638671875, -0.443115234375, -0.2857666015625, -0.12841796875, 0.0289306640625, 0.186279296875, 0.3436279296875, 0.5009765625, 0.6583251953125, 0.815673828125, 0.9730224609375, 1.13037109375, 1.2877197265625, 1.445068359375, 1.6024169921875, 1.759765625, 1.9171142578125, 2.074462890625, 2.2318115234375, 2.38916015625, 2.5465087890625, 2.703857421875, 2.8612060546875, 3.0185546875, 3.1759033203125, 3.333251953125, 3.4906005859375, 3.64794921875, 3.8052978515625, 3.962646484375, 4.1199951171875, 4.27734375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 11.0, 10.0, 23.0, 28.0, 41.0, 111.0, 227.0, 588.0, 1756.0, 8276.0, 141726.0, 3934873.0, 97183.0, 6912.0, 1597.0, 512.0, 199.0, 84.0, 40.0, 26.0, 15.0, 11.0, 5.0, 8.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.078125, -15.5322265625, -14.986328125, -14.4404296875, -13.89453125, -13.3486328125, -12.802734375, -12.2568359375, -11.7109375, -11.1650390625, -10.619140625, -10.0732421875, -9.52734375, -8.9814453125, -8.435546875, -7.8896484375, -7.34375, -6.7978515625, -6.251953125, -5.7060546875, -5.16015625, -4.6142578125, -4.068359375, -3.5224609375, -2.9765625, -2.4306640625, -1.884765625, -1.3388671875, -0.79296875, -0.2470703125, 0.298828125, 0.8447265625, 1.390625, 1.9365234375, 2.482421875, 3.0283203125, 3.57421875, 4.1201171875, 4.666015625, 5.2119140625, 5.7578125, 6.3037109375, 6.849609375, 7.3955078125, 7.94140625, 8.4873046875, 9.033203125, 9.5791015625, 10.125, 10.6708984375, 11.216796875, 11.7626953125, 12.30859375, 12.8544921875, 13.400390625, 13.9462890625, 14.4921875, 15.0380859375, 15.583984375, 16.1298828125, 16.67578125, 17.2216796875, 17.767578125, 18.3134765625, 18.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 14.0, 17.0, 25.0, 29.0, 33.0, 69.0, 111.0, 174.0, 335.0, 564.0, 779.0, 726.0, 472.0, 276.0, 147.0, 94.0, 65.0, 30.0, 31.0, 22.0, 15.0, 4.0, 3.0, 4.0, 7.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-11.1484375, -10.8463134765625, -10.544189453125, -10.2420654296875, -9.93994140625, -9.6378173828125, -9.335693359375, -9.0335693359375, -8.7314453125, -8.4293212890625, -8.127197265625, -7.8250732421875, -7.52294921875, -7.2208251953125, -6.918701171875, -6.6165771484375, -6.314453125, -6.0123291015625, -5.710205078125, -5.4080810546875, -5.10595703125, -4.8038330078125, -4.501708984375, -4.1995849609375, -3.8974609375, -3.5953369140625, -3.293212890625, -2.9910888671875, -2.68896484375, -2.3868408203125, -2.084716796875, -1.7825927734375, -1.48046875, -1.1783447265625, -0.876220703125, -0.5740966796875, -0.27197265625, 0.0301513671875, 0.332275390625, 0.6343994140625, 0.9365234375, 1.2386474609375, 1.540771484375, 1.8428955078125, 2.14501953125, 2.4471435546875, 2.749267578125, 3.0513916015625, 3.353515625, 3.6556396484375, 3.957763671875, 4.2598876953125, 4.56201171875, 4.8641357421875, 5.166259765625, 5.4683837890625, 5.7705078125, 6.0726318359375, 6.374755859375, 6.6768798828125, 6.97900390625, 7.2811279296875, 7.583251953125, 7.8853759765625, 8.1875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 19.0, 32.0, 45.0, 103.0, 179.0, 184.0, 181.0, 119.0, 58.0, 25.0, 21.0, 12.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-113.70182800292969, -110.84175872802734, -107.98169708251953, -105.12162780761719, -102.26155853271484, -99.40149688720703, -96.54142761230469, -93.68136596679688, -90.82129669189453, -87.96122741699219, -85.10116577148438, -82.24109649658203, -79.38102722167969, -76.52096557617188, -73.66089630126953, -70.80082702636719, -67.94076538085938, -65.08069610595703, -62.22063064575195, -59.360565185546875, -56.5004997253418, -53.64043426513672, -50.780364990234375, -47.9202995300293, -45.06022644042969, -42.20016098022461, -39.340091705322266, -36.48002624511719, -33.61996078491211, -30.7598934173584, -27.899826049804688, -25.03976058959961, -22.17969512939453, -19.31962776184082, -16.459562301635742, -13.599494934082031, -10.739428520202637, -7.879362106323242, -5.019294738769531, -2.159229278564453, 0.7008380889892578, 3.5609047412872314, 6.420971393585205, 9.281038284301758, 12.141104698181152, 15.001171112060547, 17.861238479614258, 20.721303939819336, 23.581371307373047, 26.441438674926758, 29.301504135131836, 32.16157150268555, 35.021636962890625, 37.88170623779297, 40.74177169799805, 43.601837158203125, 46.46190643310547, 49.32197189331055, 52.18204116821289, 55.04210662841797, 57.90217208862305, 60.762237548828125, 63.62230682373047, 66.48237609863281, 69.34243774414062]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 6.0, 8.0, 7.0, 11.0, 11.0, 12.0, 16.0, 27.0, 23.0, 29.0, 32.0, 32.0, 36.0, 45.0, 35.0, 31.0, 36.0, 49.0, 41.0, 38.0, 42.0, 41.0, 32.0, 43.0, 31.0, 33.0, 46.0, 29.0, 23.0, 29.0, 16.0, 17.0, 17.0, 9.0, 17.0, 6.0, 8.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.21644592285156, -34.16857147216797, -33.120697021484375, -32.07282257080078, -31.024946212768555, -29.97707176208496, -28.929195404052734, -27.88132095336914, -26.833446502685547, -25.785572052001953, -24.73769760131836, -23.689821243286133, -22.64194679260254, -21.594072341918945, -20.54619598388672, -19.498321533203125, -18.45044708251953, -17.402572631835938, -16.354698181152344, -15.306821823120117, -14.258947372436523, -13.21107292175293, -12.16319751739502, -11.11532211303711, -10.067447662353516, -9.019573211669922, -7.971697807312012, -6.92382287979126, -5.875947952270508, -4.828073024749756, -3.780198097229004, -2.732323169708252, -1.6844444274902344, -0.6365694999694824, 0.41130542755126953, 1.4591803550720215, 2.5070552825927734, 3.5549302101135254, 4.602805137634277, 5.650680065155029, 6.698554992675781, 7.746429920196533, 8.794304847717285, 9.842180252075195, 10.890054702758789, 11.937929153442383, 12.985804557800293, 14.033679962158203, 15.081554412841797, 16.12942886352539, 17.177303314208984, 18.22517967224121, 19.273054122924805, 20.3209285736084, 21.368804931640625, 22.41667938232422, 23.464553833007812, 24.512428283691406, 25.560302734375, 26.608179092407227, 27.65605354309082, 28.703927993774414, 29.75180435180664, 30.799678802490234, 31.847553253173828]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 13.0, 6.0, 14.0, 30.0, 31.0, 56.0, 73.0, 167.0, 302.0, 601.0, 1255.0, 2663.0, 6619.0, 17715.0, 55840.0, 208773.0, 486259.0, 188785.0, 51532.0, 16513.0, 6302.0, 2591.0, 1160.0, 591.0, 283.0, 145.0, 81.0, 47.0, 40.0, 22.0, 21.0, 7.0, 7.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.5125732421875, -9.251708984375, -8.9908447265625, -8.72998046875, -8.4691162109375, -8.208251953125, -7.9473876953125, -7.6865234375, -7.4256591796875, -7.164794921875, -6.9039306640625, -6.64306640625, -6.3822021484375, -6.121337890625, -5.8604736328125, -5.599609375, -5.3387451171875, -5.077880859375, -4.8170166015625, -4.55615234375, -4.2952880859375, -4.034423828125, -3.7735595703125, -3.5126953125, -3.2518310546875, -2.990966796875, -2.7301025390625, -2.46923828125, -2.2083740234375, -1.947509765625, -1.6866455078125, -1.42578125, -1.1649169921875, -0.904052734375, -0.6431884765625, -0.38232421875, -0.1214599609375, 0.139404296875, 0.4002685546875, 0.6611328125, 0.9219970703125, 1.182861328125, 1.4437255859375, 1.70458984375, 1.9654541015625, 2.226318359375, 2.4871826171875, 2.748046875, 3.0089111328125, 3.269775390625, 3.5306396484375, 3.79150390625, 4.0523681640625, 4.313232421875, 4.5740966796875, 4.8349609375, 5.0958251953125, 5.356689453125, 5.6175537109375, 5.87841796875, 6.1392822265625, 6.400146484375, 6.6610107421875, 6.921875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 4.0, 4.0, 6.0, 1.0, 7.0, 10.0, 15.0, 17.0, 18.0, 27.0, 29.0, 29.0, 24.0, 39.0, 65.0, 46.0, 46.0, 63.0, 58.0, 69.0, 56.0, 52.0, 46.0, 41.0, 43.0, 35.0, 30.0, 15.0, 25.0, 21.0, 15.0, 19.0, 10.0, 6.0, 2.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.90234375, -5.737548828125, -5.57275390625, -5.407958984375, -5.2431640625, -5.078369140625, -4.91357421875, -4.748779296875, -4.583984375, -4.419189453125, -4.25439453125, -4.089599609375, -3.9248046875, -3.760009765625, -3.59521484375, -3.430419921875, -3.265625, -3.100830078125, -2.93603515625, -2.771240234375, -2.6064453125, -2.441650390625, -2.27685546875, -2.112060546875, -1.947265625, -1.782470703125, -1.61767578125, -1.452880859375, -1.2880859375, -1.123291015625, -0.95849609375, -0.793701171875, -0.62890625, -0.464111328125, -0.29931640625, -0.134521484375, 0.0302734375, 0.195068359375, 0.35986328125, 0.524658203125, 0.689453125, 0.854248046875, 1.01904296875, 1.183837890625, 1.3486328125, 1.513427734375, 1.67822265625, 1.843017578125, 2.0078125, 2.172607421875, 2.33740234375, 2.502197265625, 2.6669921875, 2.831787109375, 2.99658203125, 3.161376953125, 3.326171875, 3.490966796875, 3.65576171875, 3.820556640625, 3.9853515625, 4.150146484375, 4.31494140625, 4.479736328125, 4.64453125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 9.0, 8.0, 10.0, 7.0, 13.0, 16.0, 27.0, 21.0, 45.0, 49.0, 53.0, 84.0, 129.0, 174.0, 308.0, 464.0, 892.0, 1719.0, 4755.0, 19405.0, 142751.0, 763619.0, 92334.0, 14306.0, 3825.0, 1453.0, 770.0, 426.0, 290.0, 180.0, 129.0, 78.0, 56.0, 40.0, 29.0, 29.0, 11.0, 12.0, 9.0, 6.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0], "bins": [-16.546875, -16.126953125, -15.70703125, -15.287109375, -14.8671875, -14.447265625, -14.02734375, -13.607421875, -13.1875, -12.767578125, -12.34765625, -11.927734375, -11.5078125, -11.087890625, -10.66796875, -10.248046875, -9.828125, -9.408203125, -8.98828125, -8.568359375, -8.1484375, -7.728515625, -7.30859375, -6.888671875, -6.46875, -6.048828125, -5.62890625, -5.208984375, -4.7890625, -4.369140625, -3.94921875, -3.529296875, -3.109375, -2.689453125, -2.26953125, -1.849609375, -1.4296875, -1.009765625, -0.58984375, -0.169921875, 0.25, 0.669921875, 1.08984375, 1.509765625, 1.9296875, 2.349609375, 2.76953125, 3.189453125, 3.609375, 4.029296875, 4.44921875, 4.869140625, 5.2890625, 5.708984375, 6.12890625, 6.548828125, 6.96875, 7.388671875, 7.80859375, 8.228515625, 8.6484375, 9.068359375, 9.48828125, 9.908203125, 10.328125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 7.0, 12.0, 12.0, 19.0, 18.0, 34.0, 41.0, 39.0, 56.0, 56.0, 54.0, 64.0, 55.0, 59.0, 61.0, 59.0, 59.0, 63.0, 38.0, 32.0, 22.0, 29.0, 21.0, 15.0, 9.0, 11.0, 10.0, 8.0, 6.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.484375, -20.9072265625, -20.330078125, -19.7529296875, -19.17578125, -18.5986328125, -18.021484375, -17.4443359375, -16.8671875, -16.2900390625, -15.712890625, -15.1357421875, -14.55859375, -13.9814453125, -13.404296875, -12.8271484375, -12.25, -11.6728515625, -11.095703125, -10.5185546875, -9.94140625, -9.3642578125, -8.787109375, -8.2099609375, -7.6328125, -7.0556640625, -6.478515625, -5.9013671875, -5.32421875, -4.7470703125, -4.169921875, -3.5927734375, -3.015625, -2.4384765625, -1.861328125, -1.2841796875, -0.70703125, -0.1298828125, 0.447265625, 1.0244140625, 1.6015625, 2.1787109375, 2.755859375, 3.3330078125, 3.91015625, 4.4873046875, 5.064453125, 5.6416015625, 6.21875, 6.7958984375, 7.373046875, 7.9501953125, 8.52734375, 9.1044921875, 9.681640625, 10.2587890625, 10.8359375, 11.4130859375, 11.990234375, 12.5673828125, 13.14453125, 13.7216796875, 14.298828125, 14.8759765625, 15.453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 11.0, 6.0, 4.0, 10.0, 16.0, 15.0, 29.0, 49.0, 69.0, 96.0, 155.0, 265.0, 516.0, 1020.0, 2470.0, 6352.0, 19964.0, 93900.0, 750917.0, 134075.0, 25604.0, 7541.0, 2830.0, 1240.0, 546.0, 301.0, 183.0, 119.0, 68.0, 52.0, 35.0, 14.0, 18.0, 13.0, 11.0, 3.0, 4.0, 10.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4453125, -3.342742919921875, -3.24017333984375, -3.137603759765625, -3.0350341796875, -2.932464599609375, -2.82989501953125, -2.727325439453125, -2.624755859375, -2.522186279296875, -2.41961669921875, -2.317047119140625, -2.2144775390625, -2.111907958984375, -2.00933837890625, -1.906768798828125, -1.80419921875, -1.701629638671875, -1.59906005859375, -1.496490478515625, -1.3939208984375, -1.291351318359375, -1.18878173828125, -1.086212158203125, -0.983642578125, -0.881072998046875, -0.77850341796875, -0.675933837890625, -0.5733642578125, -0.470794677734375, -0.36822509765625, -0.265655517578125, -0.1630859375, -0.060516357421875, 0.04205322265625, 0.144622802734375, 0.2471923828125, 0.349761962890625, 0.45233154296875, 0.554901123046875, 0.657470703125, 0.760040283203125, 0.86260986328125, 0.965179443359375, 1.0677490234375, 1.170318603515625, 1.27288818359375, 1.375457763671875, 1.47802734375, 1.580596923828125, 1.68316650390625, 1.785736083984375, 1.8883056640625, 1.990875244140625, 2.09344482421875, 2.196014404296875, 2.298583984375, 2.401153564453125, 2.50372314453125, 2.606292724609375, 2.7088623046875, 2.811431884765625, 2.91400146484375, 3.016571044921875, 3.119140625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 2.0, 5.0, 11.0, 7.0, 9.0, 14.0, 14.0, 26.0, 36.0, 42.0, 63.0, 93.0, 114.0, 159.0, 100.0, 95.0, 53.0, 43.0, 28.0, 20.0, 13.0, 7.0, 5.0, 6.0, 5.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006971359252929688, -0.0006725043058395386, -0.0006478726863861084, -0.0006232410669326782, -0.000598609447479248, -0.0005739778280258179, -0.0005493462085723877, -0.0005247145891189575, -0.0005000829696655273, -0.00047545135021209717, -0.000450819730758667, -0.0004261881113052368, -0.00040155649185180664, -0.00037692487239837646, -0.0003522932529449463, -0.0003276616334915161, -0.00030303001403808594, -0.00027839839458465576, -0.0002537667751312256, -0.0002291351556777954, -0.00020450353622436523, -0.00017987191677093506, -0.00015524029731750488, -0.0001306086778640747, -0.00010597705841064453, -8.134543895721436e-05, -5.671381950378418e-05, -3.2082200050354004e-05, -7.450580596923828e-06, 1.7181038856506348e-05, 4.1812658309936523e-05, 6.64442777633667e-05, 9.107589721679688e-05, 0.00011570751667022705, 0.00014033913612365723, 0.0001649707555770874, 0.00018960237503051758, 0.00021423399448394775, 0.00023886561393737793, 0.0002634972333908081, 0.0002881288528442383, 0.00031276047229766846, 0.00033739209175109863, 0.0003620237112045288, 0.000386655330657959, 0.00041128695011138916, 0.00043591856956481934, 0.0004605501890182495, 0.0004851818084716797, 0.0005098134279251099, 0.00053444504737854, 0.0005590766668319702, 0.0005837082862854004, 0.0006083399057388306, 0.0006329715251922607, 0.0006576031446456909, 0.0006822347640991211, 0.0007068663835525513, 0.0007314980030059814, 0.0007561296224594116, 0.0007807612419128418, 0.000805392861366272, 0.0008300244808197021, 0.0008546561002731323, 0.0008792877197265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 11.0, 16.0, 12.0, 23.0, 37.0, 45.0, 66.0, 104.0, 169.0, 291.0, 494.0, 982.0, 2256.0, 6351.0, 22782.0, 126814.0, 756813.0, 101585.0, 19813.0, 5569.0, 2121.0, 962.0, 483.0, 248.0, 152.0, 95.0, 72.0, 45.0, 30.0, 24.0, 17.0, 10.0, 10.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.552734375, -3.4432373046875, -3.333740234375, -3.2242431640625, -3.11474609375, -3.0052490234375, -2.895751953125, -2.7862548828125, -2.6767578125, -2.5672607421875, -2.457763671875, -2.3482666015625, -2.23876953125, -2.1292724609375, -2.019775390625, -1.9102783203125, -1.80078125, -1.6912841796875, -1.581787109375, -1.4722900390625, -1.36279296875, -1.2532958984375, -1.143798828125, -1.0343017578125, -0.9248046875, -0.8153076171875, -0.705810546875, -0.5963134765625, -0.48681640625, -0.3773193359375, -0.267822265625, -0.1583251953125, -0.048828125, 0.0606689453125, 0.170166015625, 0.2796630859375, 0.38916015625, 0.4986572265625, 0.608154296875, 0.7176513671875, 0.8271484375, 0.9366455078125, 1.046142578125, 1.1556396484375, 1.26513671875, 1.3746337890625, 1.484130859375, 1.5936279296875, 1.703125, 1.8126220703125, 1.922119140625, 2.0316162109375, 2.14111328125, 2.2506103515625, 2.360107421875, 2.4696044921875, 2.5791015625, 2.6885986328125, 2.798095703125, 2.9075927734375, 3.01708984375, 3.1265869140625, 3.236083984375, 3.3455810546875, 3.455078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 3.0, 4.0, 6.0, 11.0, 18.0, 18.0, 15.0, 34.0, 56.0, 58.0, 78.0, 116.0, 118.0, 105.0, 104.0, 64.0, 45.0, 28.0, 31.0, 21.0, 9.0, 11.0, 6.0, 5.0, 5.0, 1.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.6328125, -3.52740478515625, -3.4219970703125, -3.31658935546875, -3.211181640625, -3.10577392578125, -3.0003662109375, -2.89495849609375, -2.78955078125, -2.68414306640625, -2.5787353515625, -2.47332763671875, -2.367919921875, -2.26251220703125, -2.1571044921875, -2.05169677734375, -1.9462890625, -1.84088134765625, -1.7354736328125, -1.63006591796875, -1.524658203125, -1.41925048828125, -1.3138427734375, -1.20843505859375, -1.10302734375, -0.99761962890625, -0.8922119140625, -0.78680419921875, -0.681396484375, -0.57598876953125, -0.4705810546875, -0.36517333984375, -0.259765625, -0.15435791015625, -0.0489501953125, 0.05645751953125, 0.161865234375, 0.26727294921875, 0.3726806640625, 0.47808837890625, 0.58349609375, 0.68890380859375, 0.7943115234375, 0.89971923828125, 1.005126953125, 1.11053466796875, 1.2159423828125, 1.32135009765625, 1.4267578125, 1.53216552734375, 1.6375732421875, 1.74298095703125, 1.848388671875, 1.95379638671875, 2.0592041015625, 2.16461181640625, 2.27001953125, 2.37542724609375, 2.4808349609375, 2.58624267578125, 2.691650390625, 2.79705810546875, 2.9024658203125, 3.00787353515625, 3.11328125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 2.0, 7.0, 13.0, 21.0, 59.0, 137.0, 294.0, 241.0, 115.0, 51.0, 27.0, 7.0, 3.0, 4.0, 6.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.01658630371094, -49.671199798583984, -46.32581329345703, -42.98042678833008, -39.635040283203125, -36.28965377807617, -32.94426727294922, -29.598880767822266, -26.253494262695312, -22.90810775756836, -19.562721252441406, -16.217334747314453, -12.8719482421875, -9.526561737060547, -6.181175231933594, -2.8357887268066406, 0.5095977783203125, 3.8549842834472656, 7.200370788574219, 10.545757293701172, 13.891143798828125, 17.236530303955078, 20.58191680908203, 23.927303314208984, 27.272689819335938, 30.61807632446289, 33.963462829589844, 37.3088493347168, 40.65423583984375, 43.9996223449707, 47.345008850097656, 50.69039535522461, 54.03578186035156, 57.381168365478516, 60.72655487060547, 64.07194519042969, 67.41732788085938, 70.76271057128906, 74.10810089111328, 77.4534912109375, 80.79887390136719, 84.14425659179688, 87.4896469116211, 90.83503723144531, 94.180419921875, 97.52580261230469, 100.8711929321289, 104.21658325195312, 107.56196594238281, 110.9073486328125, 114.25273895263672, 117.59812927246094, 120.94351196289062, 124.28889465332031, 127.63428497314453, 130.97967529296875, 134.32505798339844, 137.67044067382812, 141.01583862304688, 144.36122131347656, 147.70660400390625, 151.05198669433594, 154.39736938476562, 157.74276733398438, 161.08815002441406]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 12.0, 9.0, 9.0, 8.0, 10.0, 11.0, 8.0, 16.0, 14.0, 25.0, 27.0, 24.0, 32.0, 16.0, 47.0, 29.0, 47.0, 64.0, 102.0, 95.0, 62.0, 45.0, 30.0, 31.0, 27.0, 26.0, 32.0, 26.0, 20.0, 7.0, 17.0, 11.0, 8.0, 8.0, 9.0, 8.0, 4.0, 6.0, 4.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-48.36821365356445, -46.6351318359375, -44.90205001831055, -43.168968200683594, -41.43588638305664, -39.70280456542969, -37.969722747802734, -36.23664093017578, -34.50355911254883, -32.770477294921875, -31.037395477294922, -29.30431365966797, -27.571231842041016, -25.838150024414062, -24.10506820678711, -22.371986389160156, -20.638904571533203, -18.90582275390625, -17.172740936279297, -15.439659118652344, -13.70657730102539, -11.973495483398438, -10.240413665771484, -8.507331848144531, -6.774250030517578, -5.041168212890625, -3.308086395263672, -1.5750045776367188, 0.15807723999023438, 1.8911590576171875, 3.6242408752441406, 5.357322692871094, 7.090400695800781, 8.823482513427734, 10.556564331054688, 12.28964614868164, 14.022727966308594, 15.755809783935547, 17.4888916015625, 19.221973419189453, 20.955055236816406, 22.68813705444336, 24.421218872070312, 26.154300689697266, 27.88738250732422, 29.620464324951172, 31.353546142578125, 33.08662796020508, 34.81970977783203, 36.552791595458984, 38.28587341308594, 40.01895523071289, 41.752037048339844, 43.4851188659668, 45.21820068359375, 46.9512825012207, 48.684364318847656, 50.41744613647461, 52.15052795410156, 53.883609771728516, 55.61669158935547, 57.34977340698242, 59.082855224609375, 60.81593704223633, 62.54901885986328]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 13.0, 18.0, 32.0, 54.0, 108.0, 241.0, 627.0, 1807.0, 7019.0, 44251.0, 717607.0, 3096175.0, 294392.0, 24929.0, 4741.0, 1352.0, 494.0, 218.0, 73.0, 41.0, 28.0, 16.0, 13.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.034423828125, -7.74072265625, -7.447021484375, -7.1533203125, -6.859619140625, -6.56591796875, -6.272216796875, -5.978515625, -5.684814453125, -5.39111328125, -5.097412109375, -4.8037109375, -4.510009765625, -4.21630859375, -3.922607421875, -3.62890625, -3.335205078125, -3.04150390625, -2.747802734375, -2.4541015625, -2.160400390625, -1.86669921875, -1.572998046875, -1.279296875, -0.985595703125, -0.69189453125, -0.398193359375, -0.1044921875, 0.189208984375, 0.48291015625, 0.776611328125, 1.0703125, 1.364013671875, 1.65771484375, 1.951416015625, 2.2451171875, 2.538818359375, 2.83251953125, 3.126220703125, 3.419921875, 3.713623046875, 4.00732421875, 4.301025390625, 4.5947265625, 4.888427734375, 5.18212890625, 5.475830078125, 5.76953125, 6.063232421875, 6.35693359375, 6.650634765625, 6.9443359375, 7.238037109375, 7.53173828125, 7.825439453125, 8.119140625, 8.412841796875, 8.70654296875, 9.000244140625, 9.2939453125, 9.587646484375, 9.88134765625, 10.175048828125, 10.46875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 4.0, 2.0, 8.0, 14.0, 12.0, 10.0, 26.0, 19.0, 26.0, 22.0, 28.0, 26.0, 37.0, 39.0, 41.0, 62.0, 63.0, 35.0, 46.0, 46.0, 56.0, 58.0, 34.0, 32.0, 33.0, 32.0, 26.0, 30.0, 26.0, 15.0, 16.0, 14.0, 16.0, 16.0, 15.0, 2.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.0859375, -4.946746826171875, -4.80755615234375, -4.668365478515625, -4.5291748046875, -4.389984130859375, -4.25079345703125, -4.111602783203125, -3.972412109375, -3.833221435546875, -3.69403076171875, -3.554840087890625, -3.4156494140625, -3.276458740234375, -3.13726806640625, -2.998077392578125, -2.85888671875, -2.719696044921875, -2.58050537109375, -2.441314697265625, -2.3021240234375, -2.162933349609375, -2.02374267578125, -1.884552001953125, -1.745361328125, -1.606170654296875, -1.46697998046875, -1.327789306640625, -1.1885986328125, -1.049407958984375, -0.91021728515625, -0.771026611328125, -0.6318359375, -0.492645263671875, -0.35345458984375, -0.214263916015625, -0.0750732421875, 0.064117431640625, 0.20330810546875, 0.342498779296875, 0.481689453125, 0.620880126953125, 0.76007080078125, 0.899261474609375, 1.0384521484375, 1.177642822265625, 1.31683349609375, 1.456024169921875, 1.59521484375, 1.734405517578125, 1.87359619140625, 2.012786865234375, 2.1519775390625, 2.291168212890625, 2.43035888671875, 2.569549560546875, 2.708740234375, 2.847930908203125, 2.98712158203125, 3.126312255859375, 3.2655029296875, 3.404693603515625, 3.54388427734375, 3.683074951171875, 3.822265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 11.0, 22.0, 27.0, 47.0, 76.0, 156.0, 337.0, 862.0, 4744.0, 88151.0, 3985438.0, 107423.0, 5325.0, 926.0, 360.0, 168.0, 100.0, 43.0, 26.0, 8.0, 7.0, 7.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8671875, -15.2906494140625, -14.714111328125, -14.1375732421875, -13.56103515625, -12.9844970703125, -12.407958984375, -11.8314208984375, -11.2548828125, -10.6783447265625, -10.101806640625, -9.5252685546875, -8.94873046875, -8.3721923828125, -7.795654296875, -7.2191162109375, -6.642578125, -6.0660400390625, -5.489501953125, -4.9129638671875, -4.33642578125, -3.7598876953125, -3.183349609375, -2.6068115234375, -2.0302734375, -1.4537353515625, -0.877197265625, -0.3006591796875, 0.27587890625, 0.8524169921875, 1.428955078125, 2.0054931640625, 2.58203125, 3.1585693359375, 3.735107421875, 4.3116455078125, 4.88818359375, 5.4647216796875, 6.041259765625, 6.6177978515625, 7.1943359375, 7.7708740234375, 8.347412109375, 8.9239501953125, 9.50048828125, 10.0770263671875, 10.653564453125, 11.2301025390625, 11.806640625, 12.3831787109375, 12.959716796875, 13.5362548828125, 14.11279296875, 14.6893310546875, 15.265869140625, 15.8424072265625, 16.4189453125, 16.9954833984375, 17.572021484375, 18.1485595703125, 18.72509765625, 19.3016357421875, 19.878173828125, 20.4547119140625, 21.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 12.0, 19.0, 18.0, 58.0, 107.0, 189.0, 447.0, 826.0, 1045.0, 660.0, 326.0, 131.0, 99.0, 53.0, 32.0, 11.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.73828125, -7.29193115234375, -6.8455810546875, -6.39923095703125, -5.952880859375, -5.50653076171875, -5.0601806640625, -4.61383056640625, -4.16748046875, -3.72113037109375, -3.2747802734375, -2.82843017578125, -2.382080078125, -1.93572998046875, -1.4893798828125, -1.04302978515625, -0.5966796875, -0.15032958984375, 0.2960205078125, 0.74237060546875, 1.188720703125, 1.63507080078125, 2.0814208984375, 2.52777099609375, 2.97412109375, 3.42047119140625, 3.8668212890625, 4.31317138671875, 4.759521484375, 5.20587158203125, 5.6522216796875, 6.09857177734375, 6.544921875, 6.99127197265625, 7.4376220703125, 7.88397216796875, 8.330322265625, 8.77667236328125, 9.2230224609375, 9.66937255859375, 10.11572265625, 10.56207275390625, 11.0084228515625, 11.45477294921875, 11.901123046875, 12.34747314453125, 12.7938232421875, 13.24017333984375, 13.6865234375, 14.13287353515625, 14.5792236328125, 15.02557373046875, 15.471923828125, 15.91827392578125, 16.3646240234375, 16.81097412109375, 17.25732421875, 17.70367431640625, 18.1500244140625, 18.59637451171875, 19.042724609375, 19.48907470703125, 19.9354248046875, 20.38177490234375, 20.828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 11.0, 6.0, 18.0, 30.0, 46.0, 109.0, 215.0, 216.0, 171.0, 76.0, 45.0, 23.0, 13.0, 5.0, 1.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.12738037109375, -125.0787353515625, -122.03008270263672, -118.98143005371094, -115.93278503417969, -112.88414001464844, -109.83548736572266, -106.78683471679688, -103.73818969726562, -100.68954467773438, -97.6408920288086, -94.59223937988281, -91.54359436035156, -88.49494934082031, -85.44629669189453, -82.39764404296875, -79.3489990234375, -76.30035400390625, -73.25170135498047, -70.20304870605469, -67.15440368652344, -64.10575866699219, -61.057106018066406, -58.00845718383789, -54.959808349609375, -51.91115951538086, -48.862510681152344, -45.81386184692383, -42.76521301269531, -39.7165641784668, -36.66791534423828, -33.619266510009766, -30.57061767578125, -27.521968841552734, -24.47332000732422, -21.424671173095703, -18.376022338867188, -15.327373504638672, -12.278724670410156, -9.23007583618164, -6.181427001953125, -3.1327781677246094, -0.08412933349609375, 2.964519500732422, 6.0131683349609375, 9.061817169189453, 12.110466003417969, 15.159114837646484, 18.207763671875, 21.256412506103516, 24.30506134033203, 27.353710174560547, 30.402359008789062, 33.45100784301758, 36.499656677246094, 39.54830551147461, 42.596954345703125, 45.64560317993164, 48.694252014160156, 51.74290084838867, 54.79154968261719, 57.8401985168457, 60.88884735107422, 63.937496185302734, 66.98614501953125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 8.0, 9.0, 8.0, 10.0, 19.0, 15.0, 20.0, 19.0, 31.0, 28.0, 35.0, 37.0, 32.0, 42.0, 44.0, 48.0, 64.0, 69.0, 57.0, 52.0, 49.0, 41.0, 42.0, 37.0, 26.0, 21.0, 28.0, 18.0, 20.0, 12.0, 14.0, 9.0, 7.0, 4.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.152992248535156, -33.865177154541016, -32.577362060546875, -31.289546966552734, -30.001731872558594, -28.713916778564453, -27.42609977722168, -26.13828468322754, -24.8504695892334, -23.562654495239258, -22.274839401245117, -20.987024307250977, -19.699207305908203, -18.411392211914062, -17.123577117919922, -15.835762023925781, -14.54794692993164, -13.2601318359375, -11.97231674194336, -10.684500694274902, -9.396685600280762, -8.108870506286621, -6.821054935455322, -5.533239364624023, -4.245424270629883, -2.957608938217163, -1.6697936058044434, -0.38197827339172363, 0.9058370590209961, 2.1936521530151367, 3.4814677238464355, 4.769283294677734, 6.057098388671875, 7.344913482666016, 8.632728576660156, 9.920544624328613, 11.208359718322754, 12.496174812316895, 13.783990859985352, 15.071805953979492, 16.359621047973633, 17.647436141967773, 18.935251235961914, 20.223066329956055, 21.510883331298828, 22.79869842529297, 24.08651351928711, 25.37432861328125, 26.66214370727539, 27.94995880126953, 29.237773895263672, 30.525588989257812, 31.813404083251953, 33.101219177246094, 34.389034271240234, 35.676849365234375, 36.96466827392578, 38.25248336791992, 39.54029846191406, 40.8281135559082, 42.115928649902344, 43.403743743896484, 44.691558837890625, 45.97937774658203, 47.267189025878906]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 9.0, 9.0, 22.0, 30.0, 26.0, 37.0, 59.0, 116.0, 165.0, 237.0, 385.0, 692.0, 1121.0, 2125.0, 4206.0, 9012.0, 20932.0, 53353.0, 158713.0, 416834.0, 247278.0, 79607.0, 29255.0, 12242.0, 5587.0, 2738.0, 1502.0, 846.0, 495.0, 352.0, 188.0, 121.0, 83.0, 45.0, 43.0, 15.0, 12.0, 14.0, 9.0, 4.0, 8.0, 7.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4296875, -6.213134765625, -5.99658203125, -5.780029296875, -5.5634765625, -5.346923828125, -5.13037109375, -4.913818359375, -4.697265625, -4.480712890625, -4.26416015625, -4.047607421875, -3.8310546875, -3.614501953125, -3.39794921875, -3.181396484375, -2.96484375, -2.748291015625, -2.53173828125, -2.315185546875, -2.0986328125, -1.882080078125, -1.66552734375, -1.448974609375, -1.232421875, -1.015869140625, -0.79931640625, -0.582763671875, -0.3662109375, -0.149658203125, 0.06689453125, 0.283447265625, 0.5, 0.716552734375, 0.93310546875, 1.149658203125, 1.3662109375, 1.582763671875, 1.79931640625, 2.015869140625, 2.232421875, 2.448974609375, 2.66552734375, 2.882080078125, 3.0986328125, 3.315185546875, 3.53173828125, 3.748291015625, 3.96484375, 4.181396484375, 4.39794921875, 4.614501953125, 4.8310546875, 5.047607421875, 5.26416015625, 5.480712890625, 5.697265625, 5.913818359375, 6.13037109375, 6.346923828125, 6.5634765625, 6.780029296875, 6.99658203125, 7.213134765625, 7.4296875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 6.0, 8.0, 8.0, 7.0, 21.0, 12.0, 29.0, 26.0, 31.0, 34.0, 45.0, 46.0, 38.0, 48.0, 61.0, 42.0, 53.0, 45.0, 55.0, 55.0, 39.0, 36.0, 38.0, 28.0, 24.0, 32.0, 24.0, 17.0, 18.0, 14.0, 10.0, 7.0, 5.0, 12.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.06640625, -4.9156494140625, -4.764892578125, -4.6141357421875, -4.46337890625, -4.3126220703125, -4.161865234375, -4.0111083984375, -3.8603515625, -3.7095947265625, -3.558837890625, -3.4080810546875, -3.25732421875, -3.1065673828125, -2.955810546875, -2.8050537109375, -2.654296875, -2.5035400390625, -2.352783203125, -2.2020263671875, -2.05126953125, -1.9005126953125, -1.749755859375, -1.5989990234375, -1.4482421875, -1.2974853515625, -1.146728515625, -0.9959716796875, -0.84521484375, -0.6944580078125, -0.543701171875, -0.3929443359375, -0.2421875, -0.0914306640625, 0.059326171875, 0.2100830078125, 0.36083984375, 0.5115966796875, 0.662353515625, 0.8131103515625, 0.9638671875, 1.1146240234375, 1.265380859375, 1.4161376953125, 1.56689453125, 1.7176513671875, 1.868408203125, 2.0191650390625, 2.169921875, 2.3206787109375, 2.471435546875, 2.6221923828125, 2.77294921875, 2.9237060546875, 3.074462890625, 3.2252197265625, 3.3759765625, 3.5267333984375, 3.677490234375, 3.8282470703125, 3.97900390625, 4.1297607421875, 4.280517578125, 4.4312744140625, 4.58203125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 6.0, 5.0, 9.0, 6.0, 7.0, 13.0, 16.0, 21.0, 30.0, 34.0, 47.0, 68.0, 116.0, 148.0, 211.0, 317.0, 516.0, 954.0, 1755.0, 5239.0, 27264.0, 706987.0, 276532.0, 19899.0, 4419.0, 1691.0, 790.0, 497.0, 301.0, 199.0, 128.0, 81.0, 67.0, 47.0, 33.0, 22.0, 23.0, 18.0, 17.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.9921875, -15.4749755859375, -14.957763671875, -14.4405517578125, -13.92333984375, -13.4061279296875, -12.888916015625, -12.3717041015625, -11.8544921875, -11.3372802734375, -10.820068359375, -10.3028564453125, -9.78564453125, -9.2684326171875, -8.751220703125, -8.2340087890625, -7.716796875, -7.1995849609375, -6.682373046875, -6.1651611328125, -5.64794921875, -5.1307373046875, -4.613525390625, -4.0963134765625, -3.5791015625, -3.0618896484375, -2.544677734375, -2.0274658203125, -1.51025390625, -0.9930419921875, -0.475830078125, 0.0413818359375, 0.55859375, 1.0758056640625, 1.593017578125, 2.1102294921875, 2.62744140625, 3.1446533203125, 3.661865234375, 4.1790771484375, 4.6962890625, 5.2135009765625, 5.730712890625, 6.2479248046875, 6.76513671875, 7.2823486328125, 7.799560546875, 8.3167724609375, 8.833984375, 9.3511962890625, 9.868408203125, 10.3856201171875, 10.90283203125, 11.4200439453125, 11.937255859375, 12.4544677734375, 12.9716796875, 13.4888916015625, 14.006103515625, 14.5233154296875, 15.04052734375, 15.5577392578125, 16.074951171875, 16.5921630859375, 17.109375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 12.0, 12.0, 13.0, 14.0, 19.0, 15.0, 16.0, 32.0, 40.0, 47.0, 48.0, 50.0, 52.0, 71.0, 63.0, 51.0, 70.0, 64.0, 57.0, 45.0, 29.0, 34.0, 25.0, 22.0, 19.0, 9.0, 4.0, 13.0, 6.0, 7.0, 4.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.734375, -19.169677734375, -18.60498046875, -18.040283203125, -17.4755859375, -16.910888671875, -16.34619140625, -15.781494140625, -15.216796875, -14.652099609375, -14.08740234375, -13.522705078125, -12.9580078125, -12.393310546875, -11.82861328125, -11.263916015625, -10.69921875, -10.134521484375, -9.56982421875, -9.005126953125, -8.4404296875, -7.875732421875, -7.31103515625, -6.746337890625, -6.181640625, -5.616943359375, -5.05224609375, -4.487548828125, -3.9228515625, -3.358154296875, -2.79345703125, -2.228759765625, -1.6640625, -1.099365234375, -0.53466796875, 0.030029296875, 0.5947265625, 1.159423828125, 1.72412109375, 2.288818359375, 2.853515625, 3.418212890625, 3.98291015625, 4.547607421875, 5.1123046875, 5.677001953125, 6.24169921875, 6.806396484375, 7.37109375, 7.935791015625, 8.50048828125, 9.065185546875, 9.6298828125, 10.194580078125, 10.75927734375, 11.323974609375, 11.888671875, 12.453369140625, 13.01806640625, 13.582763671875, 14.1474609375, 14.712158203125, 15.27685546875, 15.841552734375, 16.40625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 11.0, 10.0, 10.0, 10.0, 19.0, 25.0, 33.0, 35.0, 47.0, 66.0, 98.0, 137.0, 293.0, 584.0, 1482.0, 4899.0, 36125.0, 956583.0, 39679.0, 5371.0, 1537.0, 645.0, 305.0, 166.0, 105.0, 67.0, 43.0, 44.0, 35.0, 13.0, 12.0, 14.0, 9.0, 9.0, 7.0, 3.0, 8.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6171875, -5.43310546875, -5.2490234375, -5.06494140625, -4.880859375, -4.69677734375, -4.5126953125, -4.32861328125, -4.14453125, -3.96044921875, -3.7763671875, -3.59228515625, -3.408203125, -3.22412109375, -3.0400390625, -2.85595703125, -2.671875, -2.48779296875, -2.3037109375, -2.11962890625, -1.935546875, -1.75146484375, -1.5673828125, -1.38330078125, -1.19921875, -1.01513671875, -0.8310546875, -0.64697265625, -0.462890625, -0.27880859375, -0.0947265625, 0.08935546875, 0.2734375, 0.45751953125, 0.6416015625, 0.82568359375, 1.009765625, 1.19384765625, 1.3779296875, 1.56201171875, 1.74609375, 1.93017578125, 2.1142578125, 2.29833984375, 2.482421875, 2.66650390625, 2.8505859375, 3.03466796875, 3.21875, 3.40283203125, 3.5869140625, 3.77099609375, 3.955078125, 4.13916015625, 4.3232421875, 4.50732421875, 4.69140625, 4.87548828125, 5.0595703125, 5.24365234375, 5.427734375, 5.61181640625, 5.7958984375, 5.97998046875, 6.1640625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 16.0, 28.0, 48.0, 113.0, 242.0, 273.0, 126.0, 41.0, 26.0, 14.0, 10.0, 7.0, 4.0, 4.0, 2.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001537322998046875, -0.0014957785606384277, -0.0014542341232299805, -0.0014126896858215332, -0.001371145248413086, -0.0013296008110046387, -0.0012880563735961914, -0.0012465119361877441, -0.0012049674987792969, -0.0011634230613708496, -0.0011218786239624023, -0.001080334186553955, -0.0010387897491455078, -0.0009972453117370605, -0.0009557008743286133, -0.000914156436920166, -0.0008726119995117188, -0.0008310675621032715, -0.0007895231246948242, -0.000747978687286377, -0.0007064342498779297, -0.0006648898124694824, -0.0006233453750610352, -0.0005818009376525879, -0.0005402565002441406, -0.0004987120628356934, -0.0004571676254272461, -0.00041562318801879883, -0.00037407875061035156, -0.0003325343132019043, -0.00029098987579345703, -0.00024944543838500977, -0.0002079010009765625, -0.00016635656356811523, -0.00012481212615966797, -8.32676887512207e-05, -4.172325134277344e-05, -1.7881393432617188e-07, 4.1365623474121094e-05, 8.291006088256836e-05, 0.00012445449829101562, 0.0001659989356994629, 0.00020754337310791016, 0.0002490878105163574, 0.0002906322479248047, 0.00033217668533325195, 0.0003737211227416992, 0.0004152655601501465, 0.00045680999755859375, 0.000498354434967041, 0.0005398988723754883, 0.0005814433097839355, 0.0006229877471923828, 0.0006645321846008301, 0.0007060766220092773, 0.0007476210594177246, 0.0007891654968261719, 0.0008307099342346191, 0.0008722543716430664, 0.0009137988090515137, 0.0009553432464599609, 0.0009968876838684082, 0.0010384321212768555, 0.0010799765586853027, 0.00112152099609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 11.0, 8.0, 12.0, 21.0, 24.0, 37.0, 40.0, 84.0, 110.0, 154.0, 282.0, 584.0, 1372.0, 3978.0, 15555.0, 212289.0, 777803.0, 27010.0, 5671.0, 1882.0, 728.0, 335.0, 187.0, 122.0, 80.0, 56.0, 41.0, 29.0, 24.0, 3.0, 7.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.818359375, -3.691680908203125, -3.56500244140625, -3.438323974609375, -3.3116455078125, -3.184967041015625, -3.05828857421875, -2.931610107421875, -2.804931640625, -2.678253173828125, -2.55157470703125, -2.424896240234375, -2.2982177734375, -2.171539306640625, -2.04486083984375, -1.918182373046875, -1.79150390625, -1.664825439453125, -1.53814697265625, -1.411468505859375, -1.2847900390625, -1.158111572265625, -1.03143310546875, -0.904754638671875, -0.778076171875, -0.651397705078125, -0.52471923828125, -0.398040771484375, -0.2713623046875, -0.144683837890625, -0.01800537109375, 0.108673095703125, 0.2353515625, 0.362030029296875, 0.48870849609375, 0.615386962890625, 0.7420654296875, 0.868743896484375, 0.99542236328125, 1.122100830078125, 1.248779296875, 1.375457763671875, 1.50213623046875, 1.628814697265625, 1.7554931640625, 1.882171630859375, 2.00885009765625, 2.135528564453125, 2.26220703125, 2.388885498046875, 2.51556396484375, 2.642242431640625, 2.7689208984375, 2.895599365234375, 3.02227783203125, 3.148956298828125, 3.275634765625, 3.402313232421875, 3.52899169921875, 3.655670166015625, 3.7823486328125, 3.909027099609375, 4.03570556640625, 4.162384033203125, 4.2890625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 9.0, 21.0, 17.0, 38.0, 37.0, 51.0, 86.0, 126.0, 143.0, 129.0, 88.0, 70.0, 45.0, 30.0, 27.0, 15.0, 9.0, 10.0, 5.0, 12.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.7421875, -4.62554931640625, -4.5089111328125, -4.39227294921875, -4.275634765625, -4.15899658203125, -4.0423583984375, -3.92572021484375, -3.80908203125, -3.69244384765625, -3.5758056640625, -3.45916748046875, -3.342529296875, -3.22589111328125, -3.1092529296875, -2.99261474609375, -2.8759765625, -2.75933837890625, -2.6427001953125, -2.52606201171875, -2.409423828125, -2.29278564453125, -2.1761474609375, -2.05950927734375, -1.94287109375, -1.82623291015625, -1.7095947265625, -1.59295654296875, -1.476318359375, -1.35968017578125, -1.2430419921875, -1.12640380859375, -1.009765625, -0.89312744140625, -0.7764892578125, -0.65985107421875, -0.543212890625, -0.42657470703125, -0.3099365234375, -0.19329833984375, -0.07666015625, 0.03997802734375, 0.1566162109375, 0.27325439453125, 0.389892578125, 0.50653076171875, 0.6231689453125, 0.73980712890625, 0.8564453125, 0.97308349609375, 1.0897216796875, 1.20635986328125, 1.322998046875, 1.43963623046875, 1.5562744140625, 1.67291259765625, 1.78955078125, 1.90618896484375, 2.0228271484375, 2.13946533203125, 2.256103515625, 2.37274169921875, 2.4893798828125, 2.60601806640625, 2.72265625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 14.0, 32.0, 131.0, 550.0, 187.0, 56.0, 11.0, 12.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-253.48745727539062, -247.91746520996094, -242.34747314453125, -236.77748107910156, -231.20748901367188, -225.63751220703125, -220.06752014160156, -214.49752807617188, -208.9275360107422, -203.3575439453125, -197.7875518798828, -192.21755981445312, -186.6475830078125, -181.0775909423828, -175.50759887695312, -169.93760681152344, -164.36761474609375, -158.79762268066406, -153.22763061523438, -147.6576385498047, -142.087646484375, -136.51766967773438, -130.9476776123047, -125.377685546875, -119.80769348144531, -114.23770141601562, -108.66770935058594, -103.09772491455078, -97.5277328491211, -91.9577407836914, -86.38775634765625, -80.81776428222656, -75.24778747558594, -69.67779541015625, -64.10780334472656, -58.537818908691406, -52.96782684326172, -47.39783477783203, -41.82784652709961, -36.25785827636719, -30.6878662109375, -25.117876052856445, -19.54788589477539, -13.977895736694336, -8.407905578613281, -2.8379154205322266, 2.732074737548828, 8.30206298828125, 13.872055053710938, 19.442045211791992, 25.012035369873047, 30.5820255279541, 36.152015686035156, 41.722007751464844, 47.291996002197266, 52.86198425292969, 58.431976318359375, 64.00196838378906, 69.57196044921875, 75.1419448852539, 80.7119369506836, 86.28192901611328, 91.85191345214844, 97.42190551757812, 102.99189758300781]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 6.0, 5.0, 8.0, 15.0, 8.0, 11.0, 15.0, 18.0, 22.0, 31.0, 36.0, 37.0, 47.0, 56.0, 95.0, 181.0, 98.0, 49.0, 48.0, 34.0, 27.0, 20.0, 15.0, 20.0, 23.0, 18.0, 10.0, 6.0, 8.0, 7.0, 2.0, 8.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-90.15495300292969, -87.87124633789062, -85.5875473022461, -83.30384063720703, -81.0201416015625, -78.73643493652344, -76.45272827148438, -74.16902923583984, -71.88532257080078, -69.60161590576172, -67.31791687011719, -65.03421020507812, -62.75050735473633, -60.46680450439453, -58.183101654052734, -55.89939880371094, -53.61569595336914, -51.331993103027344, -49.04829025268555, -46.76458740234375, -44.48088073730469, -42.19717788696289, -39.913475036621094, -37.6297721862793, -35.3460693359375, -33.0623664855957, -30.778661727905273, -28.494958877563477, -26.211254119873047, -23.92755126953125, -21.643848419189453, -19.360145568847656, -17.076438903808594, -14.79273509979248, -12.509031295776367, -10.22532844543457, -7.941624641418457, -5.657920837402344, -3.374217987060547, -1.0905141830444336, 1.1931896209716797, 3.476893186569214, 5.760596752166748, 8.044300079345703, 10.328003883361816, 12.61170768737793, 14.895410537719727, 17.179115295410156, 19.462818145751953, 21.74652099609375, 24.03022575378418, 26.313928604125977, 28.597633361816406, 30.881336212158203, 33.1650390625, 35.4487419128418, 37.732444763183594, 40.01614761352539, 42.29985046386719, 44.58355712890625, 46.86725997924805, 49.150962829589844, 51.43466567993164, 53.71836853027344, 56.0020751953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 9.0, 22.0, 27.0, 52.0, 101.0, 252.0, 640.0, 1952.0, 10601.0, 290738.0, 3636886.0, 239648.0, 10336.0, 1997.0, 573.0, 226.0, 107.0, 44.0, 26.0, 10.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.5697021484375, -9.022216796875, -8.4747314453125, -7.92724609375, -7.3797607421875, -6.832275390625, -6.2847900390625, -5.7373046875, -5.1898193359375, -4.642333984375, -4.0948486328125, -3.54736328125, -2.9998779296875, -2.452392578125, -1.9049072265625, -1.357421875, -0.8099365234375, -0.262451171875, 0.2850341796875, 0.83251953125, 1.3800048828125, 1.927490234375, 2.4749755859375, 3.0224609375, 3.5699462890625, 4.117431640625, 4.6649169921875, 5.21240234375, 5.7598876953125, 6.307373046875, 6.8548583984375, 7.40234375, 7.9498291015625, 8.497314453125, 9.0447998046875, 9.59228515625, 10.1397705078125, 10.687255859375, 11.2347412109375, 11.7822265625, 12.3297119140625, 12.877197265625, 13.4246826171875, 13.97216796875, 14.5196533203125, 15.067138671875, 15.6146240234375, 16.162109375, 16.7095947265625, 17.257080078125, 17.8045654296875, 18.35205078125, 18.8995361328125, 19.447021484375, 19.9945068359375, 20.5419921875, 21.0894775390625, 21.636962890625, 22.1844482421875, 22.73193359375, 23.2794189453125, 23.826904296875, 24.3743896484375, 24.921875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 0.0, 3.0, 7.0, 9.0, 5.0, 11.0, 9.0, 23.0, 16.0, 17.0, 27.0, 27.0, 28.0, 44.0, 40.0, 39.0, 54.0, 36.0, 45.0, 57.0, 48.0, 43.0, 41.0, 55.0, 33.0, 44.0, 35.0, 36.0, 23.0, 22.0, 25.0, 20.0, 18.0, 11.0, 8.0, 9.0, 7.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.56640625, -4.4364013671875, -4.306396484375, -4.1763916015625, -4.04638671875, -3.9163818359375, -3.786376953125, -3.6563720703125, -3.5263671875, -3.3963623046875, -3.266357421875, -3.1363525390625, -3.00634765625, -2.8763427734375, -2.746337890625, -2.6163330078125, -2.486328125, -2.3563232421875, -2.226318359375, -2.0963134765625, -1.96630859375, -1.8363037109375, -1.706298828125, -1.5762939453125, -1.4462890625, -1.3162841796875, -1.186279296875, -1.0562744140625, -0.92626953125, -0.7962646484375, -0.666259765625, -0.5362548828125, -0.40625, -0.2762451171875, -0.146240234375, -0.0162353515625, 0.11376953125, 0.2437744140625, 0.373779296875, 0.5037841796875, 0.6337890625, 0.7637939453125, 0.893798828125, 1.0238037109375, 1.15380859375, 1.2838134765625, 1.413818359375, 1.5438232421875, 1.673828125, 1.8038330078125, 1.933837890625, 2.0638427734375, 2.19384765625, 2.3238525390625, 2.453857421875, 2.5838623046875, 2.7138671875, 2.8438720703125, 2.973876953125, 3.1038818359375, 3.23388671875, 3.3638916015625, 3.493896484375, 3.6239013671875, 3.75390625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 12.0, 11.0, 25.0, 46.0, 86.0, 155.0, 290.0, 625.0, 1755.0, 8118.0, 363294.0, 3797494.0, 17859.0, 2802.0, 904.0, 388.0, 171.0, 97.0, 46.0, 44.0, 18.0, 9.0, 9.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.765625, -20.826416015625, -19.88720703125, -18.947998046875, -18.0087890625, -17.069580078125, -16.13037109375, -15.191162109375, -14.251953125, -13.312744140625, -12.37353515625, -11.434326171875, -10.4951171875, -9.555908203125, -8.61669921875, -7.677490234375, -6.73828125, -5.799072265625, -4.85986328125, -3.920654296875, -2.9814453125, -2.042236328125, -1.10302734375, -0.163818359375, 0.775390625, 1.714599609375, 2.65380859375, 3.593017578125, 4.5322265625, 5.471435546875, 6.41064453125, 7.349853515625, 8.2890625, 9.228271484375, 10.16748046875, 11.106689453125, 12.0458984375, 12.985107421875, 13.92431640625, 14.863525390625, 15.802734375, 16.741943359375, 17.68115234375, 18.620361328125, 19.5595703125, 20.498779296875, 21.43798828125, 22.377197265625, 23.31640625, 24.255615234375, 25.19482421875, 26.134033203125, 27.0732421875, 28.012451171875, 28.95166015625, 29.890869140625, 30.830078125, 31.769287109375, 32.70849609375, 33.647705078125, 34.5869140625, 35.526123046875, 36.46533203125, 37.404541015625, 38.34375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 12.0, 12.0, 18.0, 17.0, 27.0, 27.0, 56.0, 68.0, 107.0, 149.0, 221.0, 360.0, 474.0, 600.0, 593.0, 426.0, 271.0, 183.0, 124.0, 97.0, 60.0, 44.0, 34.0, 27.0, 19.0, 11.0, 7.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.15625, -12.7275390625, -12.298828125, -11.8701171875, -11.44140625, -11.0126953125, -10.583984375, -10.1552734375, -9.7265625, -9.2978515625, -8.869140625, -8.4404296875, -8.01171875, -7.5830078125, -7.154296875, -6.7255859375, -6.296875, -5.8681640625, -5.439453125, -5.0107421875, -4.58203125, -4.1533203125, -3.724609375, -3.2958984375, -2.8671875, -2.4384765625, -2.009765625, -1.5810546875, -1.15234375, -0.7236328125, -0.294921875, 0.1337890625, 0.5625, 0.9912109375, 1.419921875, 1.8486328125, 2.27734375, 2.7060546875, 3.134765625, 3.5634765625, 3.9921875, 4.4208984375, 4.849609375, 5.2783203125, 5.70703125, 6.1357421875, 6.564453125, 6.9931640625, 7.421875, 7.8505859375, 8.279296875, 8.7080078125, 9.13671875, 9.5654296875, 9.994140625, 10.4228515625, 10.8515625, 11.2802734375, 11.708984375, 12.1376953125, 12.56640625, 12.9951171875, 13.423828125, 13.8525390625, 14.28125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 1.0, 11.0, 27.0, 42.0, 89.0, 209.0, 297.0, 189.0, 68.0, 26.0, 12.0, 3.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.8411865234375, -165.30868530273438, -158.7761688232422, -152.24366760253906, -145.71116638183594, -139.17864990234375, -132.64614868164062, -126.1136474609375, -119.58113861083984, -113.04862976074219, -106.51612854003906, -99.9836196899414, -93.45111083984375, -86.91860961914062, -80.38610076904297, -73.85359191894531, -67.32109069824219, -60.7885856628418, -54.256080627441406, -47.72357177734375, -41.19106674194336, -34.65856170654297, -28.126052856445312, -21.593547821044922, -15.061042785644531, -8.528536796569824, -1.9960308074951172, 4.536476135253906, 11.068981170654297, 17.601486206054688, 24.133995056152344, 30.666500091552734, 37.199005126953125, 43.731510162353516, 50.264015197753906, 56.79652404785156, 63.32902908325195, 69.86153411865234, 76.39404296875, 82.92654418945312, 89.45905303955078, 95.99156188964844, 102.52406311035156, 109.05657196044922, 115.58908081054688, 122.12158203125, 128.65408325195312, 135.1865997314453, 141.71910095214844, 148.25160217285156, 154.78411865234375, 161.31661987304688, 167.84912109375, 174.38162231445312, 180.9141387939453, 187.44664001464844, 193.97915649414062, 200.51165771484375, 207.04417419433594, 213.57667541503906, 220.1091766357422, 226.64169311523438, 233.1741943359375, 239.70669555664062, 246.23919677734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 12.0, 11.0, 14.0, 21.0, 26.0, 24.0, 33.0, 45.0, 31.0, 39.0, 42.0, 51.0, 61.0, 73.0, 60.0, 66.0, 60.0, 48.0, 43.0, 36.0, 34.0, 37.0, 18.0, 22.0, 22.0, 16.0, 17.0, 9.0, 6.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.58037567138672, -88.0301284790039, -85.47987365722656, -82.92962646484375, -80.37937927246094, -77.8291244506836, -75.27887725830078, -72.72862243652344, -70.17837524414062, -67.62812805175781, -65.07787322998047, -62.527626037597656, -59.97737503051758, -57.4271240234375, -54.87687683105469, -52.32662582397461, -49.77637481689453, -47.22612380981445, -44.675872802734375, -42.12562561035156, -39.575374603271484, -37.025123596191406, -34.474876403808594, -31.924625396728516, -29.374374389648438, -26.82412338256836, -24.273874282836914, -21.72362518310547, -19.17337417602539, -16.623123168945312, -14.072874069213867, -11.522624969482422, -8.972381591796875, -6.422131538391113, -3.8718814849853516, -1.3216314315795898, 1.2286186218261719, 3.7788686752319336, 6.329118728637695, 8.87936782836914, 11.429618835449219, 13.97986888885498, 16.530118942260742, 19.080368041992188, 21.630619049072266, 24.180870056152344, 26.73111915588379, 29.281368255615234, 31.831619262695312, 34.38187026977539, 36.93212127685547, 39.48236846923828, 42.03261947631836, 44.58287048339844, 47.13311767578125, 49.68336868286133, 52.233619689941406, 54.783870697021484, 57.33412170410156, 59.884368896484375, 62.43461990356445, 64.98487091064453, 67.53511810302734, 70.08537292480469, 72.6356201171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 9.0, 9.0, 18.0, 27.0, 34.0, 52.0, 90.0, 119.0, 172.0, 287.0, 486.0, 887.0, 1620.0, 3289.0, 7025.0, 17477.0, 52082.0, 234092.0, 562176.0, 114951.0, 31506.0, 11708.0, 5039.0, 2346.0, 1253.0, 668.0, 410.0, 248.0, 166.0, 85.0, 54.0, 41.0, 32.0, 18.0, 13.0, 10.0, 11.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.734375, -7.5087890625, -7.283203125, -7.0576171875, -6.83203125, -6.6064453125, -6.380859375, -6.1552734375, -5.9296875, -5.7041015625, -5.478515625, -5.2529296875, -5.02734375, -4.8017578125, -4.576171875, -4.3505859375, -4.125, -3.8994140625, -3.673828125, -3.4482421875, -3.22265625, -2.9970703125, -2.771484375, -2.5458984375, -2.3203125, -2.0947265625, -1.869140625, -1.6435546875, -1.41796875, -1.1923828125, -0.966796875, -0.7412109375, -0.515625, -0.2900390625, -0.064453125, 0.1611328125, 0.38671875, 0.6123046875, 0.837890625, 1.0634765625, 1.2890625, 1.5146484375, 1.740234375, 1.9658203125, 2.19140625, 2.4169921875, 2.642578125, 2.8681640625, 3.09375, 3.3193359375, 3.544921875, 3.7705078125, 3.99609375, 4.2216796875, 4.447265625, 4.6728515625, 4.8984375, 5.1240234375, 5.349609375, 5.5751953125, 5.80078125, 6.0263671875, 6.251953125, 6.4775390625, 6.703125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 9.0, 3.0, 7.0, 10.0, 5.0, 11.0, 13.0, 12.0, 28.0, 20.0, 13.0, 25.0, 34.0, 36.0, 27.0, 35.0, 30.0, 41.0, 48.0, 48.0, 52.0, 40.0, 46.0, 46.0, 39.0, 43.0, 43.0, 29.0, 27.0, 26.0, 21.0, 28.0, 28.0, 10.0, 11.0, 12.0, 6.0, 8.0, 4.0, 4.0, 8.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.6796875, -4.543701171875, -4.40771484375, -4.271728515625, -4.1357421875, -3.999755859375, -3.86376953125, -3.727783203125, -3.591796875, -3.455810546875, -3.31982421875, -3.183837890625, -3.0478515625, -2.911865234375, -2.77587890625, -2.639892578125, -2.50390625, -2.367919921875, -2.23193359375, -2.095947265625, -1.9599609375, -1.823974609375, -1.68798828125, -1.552001953125, -1.416015625, -1.280029296875, -1.14404296875, -1.008056640625, -0.8720703125, -0.736083984375, -0.60009765625, -0.464111328125, -0.328125, -0.192138671875, -0.05615234375, 0.079833984375, 0.2158203125, 0.351806640625, 0.48779296875, 0.623779296875, 0.759765625, 0.895751953125, 1.03173828125, 1.167724609375, 1.3037109375, 1.439697265625, 1.57568359375, 1.711669921875, 1.84765625, 1.983642578125, 2.11962890625, 2.255615234375, 2.3916015625, 2.527587890625, 2.66357421875, 2.799560546875, 2.935546875, 3.071533203125, 3.20751953125, 3.343505859375, 3.4794921875, 3.615478515625, 3.75146484375, 3.887451171875, 4.0234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 11.0, 18.0, 17.0, 33.0, 53.0, 52.0, 76.0, 96.0, 127.0, 224.0, 362.0, 625.0, 1361.0, 4221.0, 20947.0, 549607.0, 444054.0, 19743.0, 3852.0, 1372.0, 645.0, 353.0, 197.0, 144.0, 88.0, 72.0, 45.0, 41.0, 25.0, 26.0, 13.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5546875, -9.246337890625, -8.93798828125, -8.629638671875, -8.3212890625, -8.012939453125, -7.70458984375, -7.396240234375, -7.087890625, -6.779541015625, -6.47119140625, -6.162841796875, -5.8544921875, -5.546142578125, -5.23779296875, -4.929443359375, -4.62109375, -4.312744140625, -4.00439453125, -3.696044921875, -3.3876953125, -3.079345703125, -2.77099609375, -2.462646484375, -2.154296875, -1.845947265625, -1.53759765625, -1.229248046875, -0.9208984375, -0.612548828125, -0.30419921875, 0.004150390625, 0.3125, 0.620849609375, 0.92919921875, 1.237548828125, 1.5458984375, 1.854248046875, 2.16259765625, 2.470947265625, 2.779296875, 3.087646484375, 3.39599609375, 3.704345703125, 4.0126953125, 4.321044921875, 4.62939453125, 4.937744140625, 5.24609375, 5.554443359375, 5.86279296875, 6.171142578125, 6.4794921875, 6.787841796875, 7.09619140625, 7.404541015625, 7.712890625, 8.021240234375, 8.32958984375, 8.637939453125, 8.9462890625, 9.254638671875, 9.56298828125, 9.871337890625, 10.1796875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 9.0, 6.0, 7.0, 10.0, 10.0, 18.0, 19.0, 26.0, 23.0, 23.0, 26.0, 52.0, 54.0, 54.0, 85.0, 90.0, 99.0, 79.0, 43.0, 58.0, 47.0, 45.0, 28.0, 19.0, 14.0, 15.0, 6.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.870361328125, -20.19384765625, -19.517333984375, -18.8408203125, -18.164306640625, -17.48779296875, -16.811279296875, -16.134765625, -15.458251953125, -14.78173828125, -14.105224609375, -13.4287109375, -12.752197265625, -12.07568359375, -11.399169921875, -10.72265625, -10.046142578125, -9.36962890625, -8.693115234375, -8.0166015625, -7.340087890625, -6.66357421875, -5.987060546875, -5.310546875, -4.634033203125, -3.95751953125, -3.281005859375, -2.6044921875, -1.927978515625, -1.25146484375, -0.574951171875, 0.1015625, 0.778076171875, 1.45458984375, 2.131103515625, 2.8076171875, 3.484130859375, 4.16064453125, 4.837158203125, 5.513671875, 6.190185546875, 6.86669921875, 7.543212890625, 8.2197265625, 8.896240234375, 9.57275390625, 10.249267578125, 10.92578125, 11.602294921875, 12.27880859375, 12.955322265625, 13.6318359375, 14.308349609375, 14.98486328125, 15.661376953125, 16.337890625, 17.014404296875, 17.69091796875, 18.367431640625, 19.0439453125, 19.720458984375, 20.39697265625, 21.073486328125, 21.75]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 9.0, 9.0, 9.0, 9.0, 17.0, 21.0, 30.0, 39.0, 66.0, 117.0, 170.0, 282.0, 620.0, 1581.0, 4933.0, 25544.0, 876339.0, 121413.0, 12117.0, 3020.0, 1091.0, 458.0, 229.0, 115.0, 82.0, 46.0, 46.0, 26.0, 15.0, 17.0, 17.0, 24.0, 7.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.37109375, -2.3066558837890625, -2.242218017578125, -2.1777801513671875, -2.11334228515625, -2.0489044189453125, -1.984466552734375, -1.9200286865234375, -1.8555908203125, -1.7911529541015625, -1.726715087890625, -1.6622772216796875, -1.59783935546875, -1.5334014892578125, -1.468963623046875, -1.4045257568359375, -1.340087890625, -1.2756500244140625, -1.211212158203125, -1.1467742919921875, -1.08233642578125, -1.0178985595703125, -0.953460693359375, -0.8890228271484375, -0.8245849609375, -0.7601470947265625, -0.695709228515625, -0.6312713623046875, -0.56683349609375, -0.5023956298828125, -0.437957763671875, -0.3735198974609375, -0.30908203125, -0.2446441650390625, -0.180206298828125, -0.1157684326171875, -0.05133056640625, 0.0131072998046875, 0.077545166015625, 0.1419830322265625, 0.2064208984375, 0.2708587646484375, 0.335296630859375, 0.3997344970703125, 0.46417236328125, 0.5286102294921875, 0.593048095703125, 0.6574859619140625, 0.721923828125, 0.7863616943359375, 0.850799560546875, 0.9152374267578125, 0.97967529296875, 1.0441131591796875, 1.108551025390625, 1.1729888916015625, 1.2374267578125, 1.3018646240234375, 1.366302490234375, 1.4307403564453125, 1.49517822265625, 1.5596160888671875, 1.624053955078125, 1.6884918212890625, 1.7529296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 3.0, 5.0, 11.0, 7.0, 15.0, 9.0, 13.0, 28.0, 34.0, 63.0, 74.0, 122.0, 141.0, 140.0, 107.0, 70.0, 34.0, 31.0, 20.0, 20.0, 12.0, 9.0, 8.0, 8.0, 2.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004165172576904297, -0.0004042200744152069, -0.00039192289113998413, -0.00037962570786476135, -0.0003673285245895386, -0.0003550313413143158, -0.000342734158039093, -0.00033043697476387024, -0.00031813979148864746, -0.0003058426082134247, -0.0002935454249382019, -0.0002812482416629791, -0.00026895105838775635, -0.00025665387511253357, -0.0002443566918373108, -0.000232059508562088, -0.00021976232528686523, -0.00020746514201164246, -0.00019516795873641968, -0.0001828707754611969, -0.00017057359218597412, -0.00015827640891075134, -0.00014597922563552856, -0.00013368204236030579, -0.00012138485908508301, -0.00010908767580986023, -9.679049253463745e-05, -8.449330925941467e-05, -7.21961259841919e-05, -5.9898942708969116e-05, -4.760175943374634e-05, -3.530457615852356e-05, -2.300739288330078e-05, -1.0710209608078003e-05, 1.5869736671447754e-06, 1.3884156942367554e-05, 2.6181340217590332e-05, 3.847852349281311e-05, 5.077570676803589e-05, 6.307289004325867e-05, 7.537007331848145e-05, 8.766725659370422e-05, 9.9964439868927e-05, 0.00011226162314414978, 0.00012455880641937256, 0.00013685598969459534, 0.00014915317296981812, 0.0001614503562450409, 0.00017374753952026367, 0.00018604472279548645, 0.00019834190607070923, 0.000210639089345932, 0.00022293627262115479, 0.00023523345589637756, 0.00024753063917160034, 0.0002598278224468231, 0.0002721250057220459, 0.0002844221889972687, 0.00029671937227249146, 0.00030901655554771423, 0.000321313738822937, 0.0003336109220981598, 0.00034590810537338257, 0.00035820528864860535, 0.0003705024719238281]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 25.0, 23.0, 35.0, 67.0, 88.0, 186.0, 305.0, 591.0, 1262.0, 3050.0, 9690.0, 49680.0, 859488.0, 101108.0, 15364.0, 4207.0, 1688.0, 729.0, 385.0, 186.0, 123.0, 92.0, 47.0, 36.0, 22.0, 14.0, 10.0, 8.0, 5.0, 5.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.41278076171875, -1.3616943359375, -1.31060791015625, -1.259521484375, -1.20843505859375, -1.1573486328125, -1.10626220703125, -1.05517578125, -1.00408935546875, -0.9530029296875, -0.90191650390625, -0.850830078125, -0.79974365234375, -0.7486572265625, -0.69757080078125, -0.646484375, -0.59539794921875, -0.5443115234375, -0.49322509765625, -0.442138671875, -0.39105224609375, -0.3399658203125, -0.28887939453125, -0.23779296875, -0.18670654296875, -0.1356201171875, -0.08453369140625, -0.033447265625, 0.01763916015625, 0.0687255859375, 0.11981201171875, 0.1708984375, 0.22198486328125, 0.2730712890625, 0.32415771484375, 0.375244140625, 0.42633056640625, 0.4774169921875, 0.52850341796875, 0.57958984375, 0.63067626953125, 0.6817626953125, 0.73284912109375, 0.783935546875, 0.83502197265625, 0.8861083984375, 0.93719482421875, 0.98828125, 1.03936767578125, 1.0904541015625, 1.14154052734375, 1.192626953125, 1.24371337890625, 1.2947998046875, 1.34588623046875, 1.39697265625, 1.44805908203125, 1.4991455078125, 1.55023193359375, 1.601318359375, 1.65240478515625, 1.7034912109375, 1.75457763671875, 1.8056640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 13.0, 7.0, 22.0, 15.0, 43.0, 91.0, 210.0, 259.0, 154.0, 92.0, 26.0, 17.0, 15.0, 9.0, 12.0, 7.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.779449462890625, -3.65069580078125, -3.521942138671875, -3.3931884765625, -3.264434814453125, -3.13568115234375, -3.006927490234375, -2.878173828125, -2.749420166015625, -2.62066650390625, -2.491912841796875, -2.3631591796875, -2.234405517578125, -2.10565185546875, -1.976898193359375, -1.84814453125, -1.719390869140625, -1.59063720703125, -1.461883544921875, -1.3331298828125, -1.204376220703125, -1.07562255859375, -0.946868896484375, -0.818115234375, -0.689361572265625, -0.56060791015625, -0.431854248046875, -0.3031005859375, -0.174346923828125, -0.04559326171875, 0.083160400390625, 0.2119140625, 0.340667724609375, 0.46942138671875, 0.598175048828125, 0.7269287109375, 0.855682373046875, 0.98443603515625, 1.113189697265625, 1.241943359375, 1.370697021484375, 1.49945068359375, 1.628204345703125, 1.7569580078125, 1.885711669921875, 2.01446533203125, 2.143218994140625, 2.27197265625, 2.400726318359375, 2.52947998046875, 2.658233642578125, 2.7869873046875, 2.915740966796875, 3.04449462890625, 3.173248291015625, 3.302001953125, 3.430755615234375, 3.55950927734375, 3.688262939453125, 3.8170166015625, 3.945770263671875, 4.07452392578125, 4.203277587890625, 4.33203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 10.0, 15.0, 41.0, 68.0, 490.0, 210.0, 75.0, 42.0, 15.0, 10.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.13438415527344, -81.0976333618164, -78.06088256835938, -75.02412414550781, -71.98737335205078, -68.95062255859375, -65.91387176513672, -62.87711715698242, -59.840362548828125, -56.803611755371094, -53.7668571472168, -50.730106353759766, -47.69335174560547, -44.65660095214844, -41.619850158691406, -38.58309555053711, -35.54634475708008, -32.50959396362305, -29.47283935546875, -26.43608856201172, -23.399333953857422, -20.36258316040039, -17.325830459594727, -14.289077758789062, -11.252325057983398, -8.215572357177734, -5.1788201332092285, -2.1420679092407227, 0.8946847915649414, 3.9314374923706055, 6.968189239501953, 10.004941940307617, 13.041694641113281, 16.078447341918945, 19.11520004272461, 22.15195083618164, 25.188705444335938, 28.22545623779297, 31.262208938598633, 34.2989616394043, 37.335716247558594, 40.372467041015625, 43.40922164916992, 46.44597244262695, 49.48272705078125, 52.51947784423828, 55.55622863769531, 58.59298324584961, 61.62973403930664, 64.66648864746094, 67.70323944091797, 70.739990234375, 73.77674102783203, 76.8134994506836, 79.85025024414062, 82.88700103759766, 85.92375183105469, 88.96050262451172, 91.99725341796875, 95.03401184082031, 98.07076263427734, 101.10751342773438, 104.1442642211914, 107.18101501464844, 110.2177734375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 4.0, 9.0, 8.0, 7.0, 4.0, 10.0, 11.0, 16.0, 8.0, 22.0, 24.0, 23.0, 24.0, 24.0, 24.0, 84.0, 128.0, 153.0, 146.0, 60.0, 28.0, 21.0, 22.0, 19.0, 18.0, 15.0, 13.0, 5.0, 8.0, 10.0, 4.0, 8.0, 9.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.177345275878906, -53.66476821899414, -52.152191162109375, -50.63961410522461, -49.127037048339844, -47.61445999145508, -46.10188293457031, -44.58930969238281, -43.07672882080078, -41.564151763916016, -40.05157470703125, -38.538997650146484, -37.02642059326172, -35.51384353637695, -34.00126647949219, -32.48869323730469, -30.976116180419922, -29.463539123535156, -27.95096206665039, -26.438385009765625, -24.92580795288086, -23.413230895996094, -21.90065574645996, -20.388078689575195, -18.87550163269043, -17.362924575805664, -15.850347518920898, -14.33777141571045, -12.825194358825684, -11.312617301940918, -9.800041198730469, -8.287464141845703, -6.7748870849609375, -5.262310028076172, -3.7497334480285645, -2.237156867980957, -0.7245798110961914, 0.7879972457885742, 2.3005733489990234, 3.813150405883789, 5.325727462768555, 6.83830451965332, 8.350881576538086, 9.863457679748535, 11.3760347366333, 12.888611793518066, 14.401187896728516, 15.913764953613281, 17.426342010498047, 18.938919067382812, 20.451496124267578, 21.964073181152344, 23.47665023803711, 24.989227294921875, 26.501802444458008, 28.014379501342773, 29.52695655822754, 31.039533615112305, 32.55210876464844, 34.0646858215332, 35.57726287841797, 37.089839935302734, 38.6024169921875, 40.114994049072266, 41.62757110595703]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 16.0, 13.0, 19.0, 31.0, 31.0, 31.0, 36.0, 53.0, 135.0, 294.0, 69.0, 51.0, 34.0, 34.0, 33.0, 22.0, 31.0, 15.0, 7.0, 8.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.7686767578125, -5.564697265625, -5.3607177734375, -5.15673828125, -4.9527587890625, -4.748779296875, -4.5447998046875, -4.3408203125, -4.1368408203125, -3.932861328125, -3.7288818359375, -3.52490234375, -3.3209228515625, -3.116943359375, -2.9129638671875, -2.708984375, -2.5050048828125, -2.301025390625, -2.0970458984375, -1.89306640625, -1.6890869140625, -1.485107421875, -1.2811279296875, -1.0771484375, -0.8731689453125, -0.669189453125, -0.4652099609375, -0.26123046875, -0.0572509765625, 0.146728515625, 0.3507080078125, 0.5546875, 0.7586669921875, 0.962646484375, 1.1666259765625, 1.37060546875, 1.5745849609375, 1.778564453125, 1.9825439453125, 2.1865234375, 2.3905029296875, 2.594482421875, 2.7984619140625, 3.00244140625, 3.2064208984375, 3.410400390625, 3.6143798828125, 3.818359375, 4.0223388671875, 4.226318359375, 4.4302978515625, 4.63427734375, 4.8382568359375, 5.042236328125, 5.2462158203125, 5.4501953125, 5.6541748046875, 5.858154296875, 6.0621337890625, 6.26611328125, 6.4700927734375, 6.674072265625, 6.8780517578125, 7.08203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 5.0, 5.0, 7.0, 12.0, 25.0, 22.0, 28.0, 32.0, 57.0, 145.0, 279.0, 687.0, 2706.0, 23437.0, 8349392.0, 9078.0, 1635.0, 463.0, 225.0, 100.0, 56.0, 43.0, 30.0, 24.0, 20.0, 16.0, 7.0, 4.0, 0.0, 2.0, 1.0, 7.0, 6.0, 4.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0], "bins": [-59.76436996459961, -57.79380416870117, -55.8232421875, -53.85267639160156, -51.882110595703125, -49.91154479980469, -47.940982818603516, -45.97041702270508, -43.999855041503906, -42.02928924560547, -40.0587272644043, -38.08816146850586, -36.11759567260742, -34.14703369140625, -32.17646789550781, -30.205902099609375, -28.235336303710938, -26.264772415161133, -24.294206619262695, -22.32364273071289, -20.353076934814453, -18.38251304626465, -16.411949157714844, -14.441384315490723, -12.470819473266602, -10.50025463104248, -8.52968978881836, -6.559125900268555, -4.588561058044434, -2.6179962158203125, -0.6474323272705078, 1.3231325149536133, 3.293701171875, 5.264266014099121, 7.234830379486084, 9.205394744873047, 11.175959587097168, 13.146524429321289, 15.117088317871094, 17.08765411376953, 19.058218002319336, 21.02878189086914, 22.999347686767578, 24.969911575317383, 26.940475463867188, 28.911041259765625, 30.88160514831543, 32.852169036865234, 34.82273483276367, 36.79330062866211, 38.76386260986328, 40.73442840576172, 42.704994201660156, 44.675559997558594, 46.646121978759766, 48.6166877746582, 50.587249755859375, 52.55781555175781, 54.528377532958984, 56.49894332885742, 58.46950912475586, 60.44007110595703, 62.41063690185547, 64.3812026977539, 66.35176849365234]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 1.0, 6.0, 4.0, 8.0, 3.0, 7.0, 2.0, 3.0, 10.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-79.71174621582031, -75.95531463623047, -72.19888305664062, -68.44245910644531, -64.68602752685547, -60.929595947265625, -57.17316818237305, -53.41674041748047, -49.660308837890625, -45.90387725830078, -42.1474494934082, -38.391021728515625, -34.63459014892578, -30.87816047668457, -27.12173080444336, -23.36530113220215, -19.608871459960938, -15.852441787719727, -12.096012115478516, -8.339582443237305, -4.583152770996094, -0.8267230987548828, 2.929706573486328, 6.686136245727539, 10.44256591796875, 14.198995590209961, 17.955425262451172, 21.711854934692383, 25.468284606933594, 29.224714279174805, 32.981143951416016, 36.737571716308594, 40.49400329589844, 44.25043487548828, 48.00686264038086, 51.76329040527344, 55.51972198486328, 59.276153564453125, 63.0325813293457, 66.78900909423828, 70.54544067382812, 74.30187225341797, 78.05830383300781, 81.81472778320312, 85.57115936279297, 89.32759094238281, 93.08401489257812, 96.84044647216797, 100.59687805175781, 104.35330963134766, 108.1097412109375, 111.86616516113281, 115.62259674072266, 119.3790283203125, 123.13545227050781, 126.89188385009766, 130.6483154296875, 134.4047393798828, 138.1611785888672, 141.9176025390625, 145.67404174804688, 149.4304656982422, 153.1868896484375, 156.94332885742188, 160.6997528076172]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 4.0, 14.0, 23.0, 18.0, 29.0, 32.0, 51.0, 70.0, 100.0, 174.0, 253.0, 524.0, 1097.0, 2521.0, 6317.0, 17124.0, 46398.0, 126789.0, 187832.0, 85072.0, 30599.0, 11294.0, 4369.0, 1688.0, 781.0, 392.0, 244.0, 130.0, 98.0, 69.0, 47.0, 25.0, 25.0, 11.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.171875, -27.058349609375, -25.94482421875, -24.831298828125, -23.7177734375, -22.604248046875, -21.49072265625, -20.377197265625, -19.263671875, -18.150146484375, -17.03662109375, -15.923095703125, -14.8095703125, -13.696044921875, -12.58251953125, -11.468994140625, -10.35546875, -9.241943359375, -8.12841796875, -7.014892578125, -5.9013671875, -4.787841796875, -3.67431640625, -2.560791015625, -1.447265625, -0.333740234375, 0.77978515625, 1.893310546875, 3.0068359375, 4.120361328125, 5.23388671875, 6.347412109375, 7.4609375, 8.574462890625, 9.68798828125, 10.801513671875, 11.9150390625, 13.028564453125, 14.14208984375, 15.255615234375, 16.369140625, 17.482666015625, 18.59619140625, 19.709716796875, 20.8232421875, 21.936767578125, 23.05029296875, 24.163818359375, 25.27734375, 26.390869140625, 27.50439453125, 28.617919921875, 29.7314453125, 30.844970703125, 31.95849609375, 33.072021484375, 34.185546875, 35.299072265625, 36.41259765625, 37.526123046875, 38.6396484375, 39.753173828125, 40.86669921875, 41.980224609375, 43.09375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 7.0, 4.0, 7.0, 9.0, 10.0, 15.0, 9.0, 11.0, 12.0, 19.0, 26.0, 34.0, 45.0, 42.0, 49.0, 53.0, 59.0, 46.0, 51.0, 58.0, 63.0, 44.0, 42.0, 46.0, 39.0, 40.0, 37.0, 26.0, 19.0, 10.0, 18.0, 10.0, 7.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.3709716796875, -4.218505859375, -4.0660400390625, -3.91357421875, -3.7611083984375, -3.608642578125, -3.4561767578125, -3.3037109375, -3.1512451171875, -2.998779296875, -2.8463134765625, -2.69384765625, -2.5413818359375, -2.388916015625, -2.2364501953125, -2.083984375, -1.9315185546875, -1.779052734375, -1.6265869140625, -1.47412109375, -1.3216552734375, -1.169189453125, -1.0167236328125, -0.8642578125, -0.7117919921875, -0.559326171875, -0.4068603515625, -0.25439453125, -0.1019287109375, 0.050537109375, 0.2030029296875, 0.35546875, 0.5079345703125, 0.660400390625, 0.8128662109375, 0.96533203125, 1.1177978515625, 1.270263671875, 1.4227294921875, 1.5751953125, 1.7276611328125, 1.880126953125, 2.0325927734375, 2.18505859375, 2.3375244140625, 2.489990234375, 2.6424560546875, 2.794921875, 2.9473876953125, 3.099853515625, 3.2523193359375, 3.40478515625, 3.5572509765625, 3.709716796875, 3.8621826171875, 4.0146484375, 4.1671142578125, 4.319580078125, 4.4720458984375, 4.62451171875, 4.7769775390625, 4.929443359375, 5.0819091796875, 5.234375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 7.0, 18.0, 27.0, 40.0, 77.0, 65.0, 83.0, 57.0, 33.0, 16.0, 15.0, 9.0, 8.0, 9.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.49615478515625, -42.117000579833984, -40.73784637451172, -39.35869216918945, -37.97953796386719, -36.60038375854492, -35.221229553222656, -33.842071533203125, -32.462921142578125, -31.08376693725586, -29.704612731933594, -28.325458526611328, -26.946304321289062, -25.567150115966797, -24.1879940032959, -22.808839797973633, -21.429683685302734, -20.05052947998047, -18.671375274658203, -17.292221069335938, -15.913065910339355, -14.53391170501709, -13.154756546020508, -11.775602340698242, -10.396448135375977, -9.017293930053711, -7.638139247894287, -6.258984565734863, -4.879830360412598, -3.500676155090332, -2.12152099609375, -0.7423667907714844, 0.6367874145507812, 2.015941858291626, 3.3950963020324707, 4.7742509841918945, 6.15340518951416, 7.532559394836426, 8.911714553833008, 10.290868759155273, 11.670022964477539, 13.049177169799805, 14.42833137512207, 15.807486534118652, 17.186641693115234, 18.5657958984375, 19.944950103759766, 21.32410430908203, 22.703258514404297, 24.082412719726562, 25.461566925048828, 26.840721130371094, 28.21987533569336, 29.599029541015625, 30.978185653686523, 32.357337951660156, 33.73649597167969, 35.11565017700195, 36.49480438232422, 37.873958587646484, 39.25311279296875, 40.632266998291016, 42.01142120361328, 43.39057922363281, 44.76972961425781]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 9.0, 6.0, 10.0, 12.0, 40.0, 57.0, 61.0, 63.0, 59.0, 47.0, 18.0, 23.0, 15.0, 10.0, 6.0, 5.0, 6.0, 2.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.523101806640625, -16.629711151123047, -15.736321449279785, -14.842931747436523, -13.949541091918945, -13.056151390075684, -12.162761688232422, -11.269371032714844, -10.375980377197266, -9.482590675354004, -8.589200019836426, -7.695810317993164, -6.802419662475586, -5.909029960632324, -5.015639781951904, -4.122249603271484, -3.2288599014282227, -2.3354697227478027, -1.4420796632766724, -0.548689603805542, 0.34470057487487793, 1.2380905151367188, 2.1314806938171387, 3.0248708724975586, 3.9182610511779785, 4.811651229858398, 5.705041408538818, 6.598431587219238, 7.4918212890625, 8.385211944580078, 9.27860164642334, 10.171991348266602, 11.06538200378418, 11.958771705627441, 12.85216236114502, 13.745552062988281, 14.63894271850586, 15.532332420349121, 16.425722122192383, 17.31911277770996, 18.21250343322754, 19.105894088745117, 19.999282836914062, 20.89267349243164, 21.78606414794922, 22.679454803466797, 23.572843551635742, 24.46623420715332, 25.359622955322266, 26.253013610839844, 27.14640235900879, 28.039793014526367, 28.933183670043945, 29.82657241821289, 30.71996307373047, 31.613353729248047, 32.506744384765625, 33.4001350402832, 34.29352569580078, 35.18691635131836, 36.08030319213867, 36.97369384765625, 37.86708450317383, 38.760475158691406, 39.653865814208984]}, "eval/loss": 3.785594940185547, "eval/wer": 0.6683334325455881, "eval/runtime": 893.3132, "eval/samples_per_second": 2.958, "eval/steps_per_second": 0.371} \ No newline at end of file