diff --git "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" --- "a/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" +++ "b/wandb/run-20220307_135359-2ct09q1k/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.6666, "train/learning_rate": 7.740498812351543e-06, "train/epoch": 15.13, "train/global_step": 13500, "_runtime": 88234, "_timestamp": 1646749473, "_step": 13508, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 25.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 9.0, 31.0, 30112.0, 244.0, 23.0, 11.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.3125, -87.57666015625, -85.8408203125, -84.10498046875, -82.369140625, -80.63330078125, -78.8974609375, -77.16162109375, -75.42578125, -73.68994140625, -71.9541015625, -70.21826171875, -68.482421875, -66.74658203125, -65.0107421875, -63.27490234375, -61.5390625, -59.80322265625, -58.0673828125, -56.33154296875, -54.595703125, -52.85986328125, -51.1240234375, -49.38818359375, -47.65234375, -45.91650390625, -44.1806640625, -42.44482421875, -40.708984375, -38.97314453125, -37.2373046875, -35.50146484375, -33.765625, -32.02978515625, -30.2939453125, -28.55810546875, -26.822265625, -25.08642578125, -23.3505859375, -21.61474609375, -19.87890625, -18.14306640625, -16.4072265625, -14.67138671875, -12.935546875, -11.19970703125, -9.4638671875, -7.72802734375, -5.9921875, -4.25634765625, -2.5205078125, -0.78466796875, 0.951171875, 2.68701171875, 4.4228515625, 6.15869140625, 7.89453125, 9.63037109375, 11.3662109375, 13.10205078125, 14.837890625, 16.57373046875, 18.3095703125, 20.04541015625, 21.78125]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 10.0, 3.0, 7.0, 8.0, 9.0, 16.0, 17.0, 19.0, 24.0, 24.0, 27.0, 30.0, 37.0, 36.0, 36.0, 51.0, 60.0, 47.0, 49.0, 35.0, 56.0, 41.0, 46.0, 42.0, 44.0, 41.0, 33.0, 43.0, 25.0, 14.0, 15.0, 12.0, 10.0, 10.0, 4.0, 4.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-40.340782165527344, -39.48328399658203, -38.625789642333984, -37.76829147338867, -36.910797119140625, -36.05329895019531, -35.195804595947266, -34.33830642700195, -33.480812072753906, -32.623313903808594, -31.765819549560547, -30.908323287963867, -30.050827026367188, -29.193328857421875, -28.335832595825195, -27.478336334228516, -26.620838165283203, -25.763341903686523, -24.905845642089844, -24.048349380493164, -23.190853118896484, -22.333354949951172, -21.475858688354492, -20.618362426757812, -19.760866165161133, -18.903369903564453, -18.045873641967773, -17.188377380371094, -16.33087921142578, -15.473383903503418, -14.615886688232422, -13.758390426635742, -12.900894165039062, -12.043397903442383, -11.185901641845703, -10.328404426574707, -9.470908164978027, -8.613411903381348, -7.75591516494751, -6.898418426513672, -6.040922164916992, -5.1834259033203125, -4.325929164886475, -3.468432664871216, -2.610936164855957, -1.7534399032592773, -0.8959431648254395, -0.03844642639160156, 0.8190498352050781, 1.676546335220337, 2.5340428352355957, 3.3915393352508545, 4.249035835266113, 5.106532096862793, 5.964028835296631, 6.821525573730469, 7.679021835327148, 8.536518096923828, 9.394014358520508, 10.251511573791504, 11.109007835388184, 11.966504096984863, 12.82400131225586, 13.681497573852539, 14.538993835449219]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 11.0, 7.0, 15.0, 11.0, 14.0, 21.0, 15.0, 16.0, 19.0, 22.0, 24.0, 26.0, 30.0, 28.0, 39.0, 44.0, 41.0, 57.0, 40.0, 36.0, 38.0, 41.0, 35.0, 21.0, 32.0, 35.0, 38.0, 32.0, 27.0, 19.0, 23.0, 21.0, 19.0, 11.0, 13.0, 15.0, 13.0, 11.0, 4.0, 14.0, 4.0, 7.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-22.986465454101562, -22.310056686401367, -21.633649826049805, -20.95724105834961, -20.280834197998047, -19.60442543029785, -18.92801856994629, -18.251609802246094, -17.57520294189453, -16.898794174194336, -16.222387313842773, -15.545979499816895, -14.869571685791016, -14.193163871765137, -13.516756057739258, -12.840347290039062, -12.163939476013184, -11.487531661987305, -10.811123847961426, -10.134716033935547, -9.458308219909668, -8.781900405883789, -8.105491638183594, -7.429084300994873, -6.752676486968994, -6.076268672943115, -5.399860858917236, -4.723452568054199, -4.04704475402832, -3.3706371784210205, -2.6942291259765625, -2.0178213119506836, -1.3414134979248047, -0.665005624294281, 0.011402249336242676, 0.6878101825714111, 1.36421799659729, 2.040625810623169, 2.717033863067627, 3.393441677093506, 4.069849491119385, 4.746257305145264, 5.422665119171143, 6.09907341003418, 6.775481224060059, 7.4518890380859375, 8.128296852111816, 8.804704666137695, 9.481112480163574, 10.157520294189453, 10.833928108215332, 11.510335922241211, 12.18674373626709, 12.863151550292969, 13.539560317993164, 14.215967178344727, 14.892375946044922, 15.5687837600708, 16.24519157409668, 16.921600341796875, 17.598007202148438, 18.274415969848633, 18.950822830200195, 19.62723159790039, 20.303638458251953]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 5.0, 11.0, 17.0, 31.0, 59.0, 79.0, 109.0, 217.0, 355.0, 546.0, 908.0, 1452.0, 2193.0, 3479.0, 5202.0, 7571.0, 11176.0, 15538.0, 21785.0, 29032.0, 38585.0, 48980.0, 59649.0, 71146.0, 80790.0, 91353.0, 112462.0, 85404.0, 76523.0, 66410.0, 54696.0, 43593.0, 34014.0, 25628.0, 18598.0, 13336.0, 9194.0, 6420.0, 4223.0, 2786.0, 1838.0, 1169.0, 749.0, 468.0, 298.0, 200.0, 117.0, 55.0, 46.0, 27.0, 16.0, 10.0, 9.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.5625, -59.458984375, -57.35546875, -55.251953125, -53.1484375, -51.044921875, -48.94140625, -46.837890625, -44.734375, -42.630859375, -40.52734375, -38.423828125, -36.3203125, -34.216796875, -32.11328125, -30.009765625, -27.90625, -25.802734375, -23.69921875, -21.595703125, -19.4921875, -17.388671875, -15.28515625, -13.181640625, -11.078125, -8.974609375, -6.87109375, -4.767578125, -2.6640625, -0.560546875, 1.54296875, 3.646484375, 5.75, 7.853515625, 9.95703125, 12.060546875, 14.1640625, 16.267578125, 18.37109375, 20.474609375, 22.578125, 24.681640625, 26.78515625, 28.888671875, 30.9921875, 33.095703125, 35.19921875, 37.302734375, 39.40625, 41.509765625, 43.61328125, 45.716796875, 47.8203125, 49.923828125, 52.02734375, 54.130859375, 56.234375, 58.337890625, 60.44140625, 62.544921875, 64.6484375, 66.751953125, 68.85546875, 70.958984375, 73.0625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 6.0, 3.0, 9.0, 7.0, 10.0, 14.0, 10.0, 15.0, 19.0, 18.0, 29.0, 23.0, 27.0, 21.0, 33.0, 35.0, 44.0, 34.0, 38.0, 38.0, 50.0, 56.0, 36.0, 43.0, 33.0, 40.0, 34.0, 31.0, 29.0, 37.0, 26.0, 20.0, 21.0, 18.0, 11.0, 8.0, 14.0, 12.0, 10.0, 9.0, 6.0, 5.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-29.546875, -28.529052734375, -27.51123046875, -26.493408203125, -25.4755859375, -24.457763671875, -23.43994140625, -22.422119140625, -21.404296875, -20.386474609375, -19.36865234375, -18.350830078125, -17.3330078125, -16.315185546875, -15.29736328125, -14.279541015625, -13.26171875, -12.243896484375, -11.22607421875, -10.208251953125, -9.1904296875, -8.172607421875, -7.15478515625, -6.136962890625, -5.119140625, -4.101318359375, -3.08349609375, -2.065673828125, -1.0478515625, -0.030029296875, 0.98779296875, 2.005615234375, 3.0234375, 4.041259765625, 5.05908203125, 6.076904296875, 7.0947265625, 8.112548828125, 9.13037109375, 10.148193359375, 11.166015625, 12.183837890625, 13.20166015625, 14.219482421875, 15.2373046875, 16.255126953125, 17.27294921875, 18.290771484375, 19.30859375, 20.326416015625, 21.34423828125, 22.362060546875, 23.3798828125, 24.397705078125, 25.41552734375, 26.433349609375, 27.451171875, 28.468994140625, 29.48681640625, 30.504638671875, 31.5224609375, 32.540283203125, 33.55810546875, 34.575927734375, 35.59375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 3.0, 4.0, 11.0, 8.0, 11.0, 18.0, 16.0, 25.0, 24.0, 29.0, 19.0, 27.0, 31.0, 40.0, 30.0, 32.0, 43.0, 27.0, 39.0, 33.0, 34.0, 40.0, 36.0, 40.0, 45.0, 36.0, 29.0, 33.0, 30.0, 31.0, 20.0, 26.0, 22.0, 23.0, 10.0, 9.0, 13.0, 9.0, 7.0, 14.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.236202239990234, -18.583940505981445, -17.931676864624023, -17.279415130615234, -16.627151489257812, -15.974889755249023, -15.322627067565918, -14.670364379882812, -14.018101692199707, -13.365839004516602, -12.713576316833496, -12.06131362915039, -11.409051895141602, -10.75678825378418, -10.10452651977539, -9.452263832092285, -8.80000114440918, -8.147738456726074, -7.495475769042969, -6.8432135581970215, -6.190950870513916, -5.5386881828308105, -4.886425971984863, -4.234163284301758, -3.5819005966186523, -2.929637908935547, -2.2773754596710205, -1.6251128911972046, -0.9728503227233887, -0.3205876350402832, 0.33167481422424316, 0.9839372634887695, 1.6361980438232422, 2.2884607315063477, 2.940723180770874, 3.5929856300354004, 4.245248317718506, 4.897511005401611, 5.549773216247559, 6.202035903930664, 6.8542985916137695, 7.506561279296875, 8.15882396697998, 8.811086654663086, 9.463348388671875, 10.115612030029297, 10.767873764038086, 11.420136451721191, 12.072399139404297, 12.724661827087402, 13.376924514770508, 14.029187202453613, 14.681449890136719, 15.333711624145508, 15.985974311828613, 16.63823699951172, 17.29050064086914, 17.94276237487793, 18.59502601623535, 19.24728775024414, 19.899551391601562, 20.55181312561035, 21.204076766967773, 21.856338500976562, 22.50860023498535]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 6.0, 5.0, 2.0, 8.0, 7.0, 7.0, 19.0, 15.0, 14.0, 22.0, 32.0, 24.0, 23.0, 34.0, 34.0, 44.0, 42.0, 49.0, 35.0, 52.0, 46.0, 44.0, 39.0, 56.0, 35.0, 27.0, 49.0, 30.0, 25.0, 36.0, 24.0, 20.0, 15.0, 16.0, 13.0, 12.0, 13.0, 8.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.614103317260742, -24.833560943603516, -24.05301856994629, -23.272476196289062, -22.49193572998047, -21.711393356323242, -20.930850982666016, -20.15030860900879, -19.369766235351562, -18.589223861694336, -17.80868148803711, -17.028141021728516, -16.24759864807129, -15.467056274414062, -14.686513900756836, -13.90597152709961, -13.125431060791016, -12.344888687133789, -11.564347267150879, -10.783804893493652, -10.003263473510742, -9.222721099853516, -8.442178726196289, -7.661636829376221, -6.881094932556152, -6.100553035736084, -5.320011138916016, -4.539468765258789, -3.7589268684387207, -2.9783849716186523, -2.197842597961426, -1.4173007011413574, -0.6367568969726562, 0.14378511905670166, 0.9243271350860596, 1.704869270324707, 2.4854111671447754, 3.2659530639648438, 4.04649543762207, 4.827037334442139, 5.607579231262207, 6.388121128082275, 7.168663024902344, 7.94920539855957, 8.729747772216797, 9.510289192199707, 10.290831565856934, 11.071372985839844, 11.85191535949707, 12.632457733154297, 13.412999153137207, 14.193541526794434, 14.974082946777344, 15.75462532043457, 16.535167694091797, 17.315710067749023, 18.09625244140625, 18.876794815063477, 19.657337188720703, 20.437877655029297, 21.218420028686523, 21.99896240234375, 22.779504776000977, 23.560047149658203, 24.340587615966797]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 12.0, 6.0, 11.0, 27.0, 24.0, 55.0, 85.0, 105.0, 170.0, 249.0, 397.0, 635.0, 937.0, 1454.0, 2346.0, 3580.0, 5745.0, 8977.0, 14116.0, 22833.0, 36215.0, 58176.0, 93253.0, 147768.0, 228916.0, 344426.0, 493168.0, 623966.0, 629130.0, 498378.0, 350824.0, 230822.0, 148752.0, 93287.0, 58496.0, 36271.0, 22739.0, 14223.0, 8908.0, 5490.0, 3404.0, 2124.0, 1416.0, 872.0, 579.0, 340.0, 208.0, 136.0, 99.0, 57.0, 29.0, 15.0, 18.0, 7.0, 6.0, 6.0, 4.0, 1.0], "bins": [-35.0, -33.970947265625, -32.94189453125, -31.912841796875, -30.8837890625, -29.854736328125, -28.82568359375, -27.796630859375, -26.767578125, -25.738525390625, -24.70947265625, -23.680419921875, -22.6513671875, -21.622314453125, -20.59326171875, -19.564208984375, -18.53515625, -17.506103515625, -16.47705078125, -15.447998046875, -14.4189453125, -13.389892578125, -12.36083984375, -11.331787109375, -10.302734375, -9.273681640625, -8.24462890625, -7.215576171875, -6.1865234375, -5.157470703125, -4.12841796875, -3.099365234375, -2.0703125, -1.041259765625, -0.01220703125, 1.016845703125, 2.0458984375, 3.074951171875, 4.10400390625, 5.133056640625, 6.162109375, 7.191162109375, 8.22021484375, 9.249267578125, 10.2783203125, 11.307373046875, 12.33642578125, 13.365478515625, 14.39453125, 15.423583984375, 16.45263671875, 17.481689453125, 18.5107421875, 19.539794921875, 20.56884765625, 21.597900390625, 22.626953125, 23.656005859375, 24.68505859375, 25.714111328125, 26.7431640625, 27.772216796875, 28.80126953125, 29.830322265625, 30.859375]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 4.0, 14.0, 8.0, 14.0, 8.0, 23.0, 20.0, 15.0, 35.0, 31.0, 29.0, 36.0, 37.0, 44.0, 48.0, 39.0, 48.0, 44.0, 43.0, 47.0, 46.0, 42.0, 29.0, 43.0, 31.0, 28.0, 32.0, 27.0, 15.0, 21.0, 17.0, 14.0, 10.0, 8.0, 11.0, 6.0, 9.0, 9.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.452392578125, -18.77978515625, -18.107177734375, -17.4345703125, -16.761962890625, -16.08935546875, -15.416748046875, -14.744140625, -14.071533203125, -13.39892578125, -12.726318359375, -12.0537109375, -11.381103515625, -10.70849609375, -10.035888671875, -9.36328125, -8.690673828125, -8.01806640625, -7.345458984375, -6.6728515625, -6.000244140625, -5.32763671875, -4.655029296875, -3.982421875, -3.309814453125, -2.63720703125, -1.964599609375, -1.2919921875, -0.619384765625, 0.05322265625, 0.725830078125, 1.3984375, 2.071044921875, 2.74365234375, 3.416259765625, 4.0888671875, 4.761474609375, 5.43408203125, 6.106689453125, 6.779296875, 7.451904296875, 8.12451171875, 8.797119140625, 9.4697265625, 10.142333984375, 10.81494140625, 11.487548828125, 12.16015625, 12.832763671875, 13.50537109375, 14.177978515625, 14.8505859375, 15.523193359375, 16.19580078125, 16.868408203125, 17.541015625, 18.213623046875, 18.88623046875, 19.558837890625, 20.2314453125, 20.904052734375, 21.57666015625, 22.249267578125, 22.921875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 16.0, 17.0, 30.0, 38.0, 71.0, 124.0, 190.0, 337.0, 518.0, 815.0, 1326.0, 2165.0, 3585.0, 5636.0, 9307.0, 14825.0, 23664.0, 37560.0, 59964.0, 93749.0, 142417.0, 211604.0, 303166.0, 409168.0, 507813.0, 552642.0, 505408.0, 406297.0, 301106.0, 208772.0, 141128.0, 92424.0, 59133.0, 37251.0, 23535.0, 14875.0, 9112.0, 5559.0, 3333.0, 2117.0, 1323.0, 823.0, 519.0, 327.0, 188.0, 122.0, 80.0, 40.0, 25.0, 18.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-21.078125, -20.40869140625, -19.7392578125, -19.06982421875, -18.400390625, -17.73095703125, -17.0615234375, -16.39208984375, -15.72265625, -15.05322265625, -14.3837890625, -13.71435546875, -13.044921875, -12.37548828125, -11.7060546875, -11.03662109375, -10.3671875, -9.69775390625, -9.0283203125, -8.35888671875, -7.689453125, -7.02001953125, -6.3505859375, -5.68115234375, -5.01171875, -4.34228515625, -3.6728515625, -3.00341796875, -2.333984375, -1.66455078125, -0.9951171875, -0.32568359375, 0.34375, 1.01318359375, 1.6826171875, 2.35205078125, 3.021484375, 3.69091796875, 4.3603515625, 5.02978515625, 5.69921875, 6.36865234375, 7.0380859375, 7.70751953125, 8.376953125, 9.04638671875, 9.7158203125, 10.38525390625, 11.0546875, 11.72412109375, 12.3935546875, 13.06298828125, 13.732421875, 14.40185546875, 15.0712890625, 15.74072265625, 16.41015625, 17.07958984375, 17.7490234375, 18.41845703125, 19.087890625, 19.75732421875, 20.4267578125, 21.09619140625, 21.765625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 5.0, 15.0, 20.0, 16.0, 29.0, 31.0, 52.0, 50.0, 78.0, 90.0, 107.0, 114.0, 133.0, 150.0, 195.0, 220.0, 241.0, 248.0, 272.0, 242.0, 234.0, 230.0, 237.0, 180.0, 176.0, 126.0, 117.0, 92.0, 84.0, 64.0, 54.0, 42.0, 27.0, 23.0, 22.0, 10.0, 11.0, 6.0, 8.0, 5.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.5595703125, -10.205078125, -9.8505859375, -9.49609375, -9.1416015625, -8.787109375, -8.4326171875, -8.078125, -7.7236328125, -7.369140625, -7.0146484375, -6.66015625, -6.3056640625, -5.951171875, -5.5966796875, -5.2421875, -4.8876953125, -4.533203125, -4.1787109375, -3.82421875, -3.4697265625, -3.115234375, -2.7607421875, -2.40625, -2.0517578125, -1.697265625, -1.3427734375, -0.98828125, -0.6337890625, -0.279296875, 0.0751953125, 0.4296875, 0.7841796875, 1.138671875, 1.4931640625, 1.84765625, 2.2021484375, 2.556640625, 2.9111328125, 3.265625, 3.6201171875, 3.974609375, 4.3291015625, 4.68359375, 5.0380859375, 5.392578125, 5.7470703125, 6.1015625, 6.4560546875, 6.810546875, 7.1650390625, 7.51953125, 7.8740234375, 8.228515625, 8.5830078125, 8.9375, 9.2919921875, 9.646484375, 10.0009765625, 10.35546875, 10.7099609375, 11.064453125, 11.4189453125, 11.7734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 15.0, 5.0, 14.0, 14.0, 15.0, 18.0, 23.0, 23.0, 20.0, 29.0, 20.0, 25.0, 45.0, 41.0, 36.0, 34.0, 56.0, 42.0, 51.0, 43.0, 30.0, 39.0, 38.0, 36.0, 34.0, 28.0, 25.0, 26.0, 30.0, 21.0, 21.0, 13.0, 13.0, 15.0, 9.0, 8.0, 7.0, 5.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-21.884994506835938, -21.225168228149414, -20.565340042114258, -19.905513763427734, -19.245685577392578, -18.585859298706055, -17.9260311126709, -17.266204833984375, -16.60637664794922, -15.946549415588379, -15.286722183227539, -14.6268949508667, -13.96706771850586, -13.307241439819336, -12.647414207458496, -11.987586975097656, -11.327760696411133, -10.667933464050293, -10.008106231689453, -9.348278999328613, -8.688451766967773, -8.02862548828125, -7.36879825592041, -6.70897102355957, -6.0491437911987305, -5.389316558837891, -4.729489326477051, -4.069662570953369, -3.4098353385925293, -2.7500081062316895, -2.0901811122894287, -1.430354118347168, -0.7705287933349609, -0.11070168018341064, 0.5491254329681396, 1.20895254611969, 1.8687796592712402, 2.52860689163208, 3.188433885574341, 3.8482608795166016, 4.508088111877441, 5.167915344238281, 5.827742576599121, 6.487569332122803, 7.147396564483643, 7.807223796844482, 8.467050552368164, 9.126877784729004, 9.786705017089844, 10.446532249450684, 11.106359481811523, 11.766186714172363, 12.426013946533203, 13.085840225219727, 13.745667457580566, 14.405494689941406, 15.065321922302246, 15.725149154663086, 16.38497543334961, 17.044803619384766, 17.70462989807129, 18.364458084106445, 19.02428436279297, 19.684112548828125, 20.34393882751465]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 1.0, 6.0, 7.0, 6.0, 9.0, 14.0, 18.0, 23.0, 15.0, 15.0, 33.0, 31.0, 26.0, 40.0, 34.0, 42.0, 38.0, 47.0, 32.0, 43.0, 35.0, 44.0, 41.0, 47.0, 21.0, 36.0, 29.0, 27.0, 26.0, 26.0, 28.0, 29.0, 24.0, 11.0, 6.0, 19.0, 14.0, 7.0, 6.0, 6.0, 5.0, 5.0, 7.0, 4.0, 1.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-22.203296661376953, -21.519153594970703, -20.835010528564453, -20.150867462158203, -19.466724395751953, -18.782581329345703, -18.098438262939453, -17.414295196533203, -16.730152130126953, -16.046009063720703, -15.361865997314453, -14.677722930908203, -13.993579864501953, -13.309436798095703, -12.625292778015137, -11.941149711608887, -11.25700569152832, -10.57286262512207, -9.88871955871582, -9.20457649230957, -8.52043342590332, -7.836289882659912, -7.152146339416504, -6.468003273010254, -5.783860206604004, -5.099717140197754, -4.415574073791504, -3.7314305305480957, -3.0472874641418457, -2.3631443977355957, -1.6790008544921875, -0.9948577880859375, -0.3107166290283203, 0.37342655658721924, 1.0575697422027588, 1.741713047027588, 2.425856113433838, 3.109999179840088, 3.794142723083496, 4.478285789489746, 5.162428855895996, 5.846571922302246, 6.530714988708496, 7.214858531951904, 7.899001598358154, 8.583145141601562, 9.267288208007812, 9.951431274414062, 10.635574340820312, 11.319717407226562, 12.003860473632812, 12.688003540039062, 13.372146606445312, 14.056289672851562, 14.740433692932129, 15.424576759338379, 16.108718872070312, 16.792861938476562, 17.477005004882812, 18.161148071289062, 18.845291137695312, 19.529434204101562, 20.213577270507812, 20.897720336914062, 21.581865310668945]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 12.0, 2.0, 22.0, 32.0, 34.0, 50.0, 79.0, 96.0, 167.0, 259.0, 406.0, 610.0, 933.0, 1383.0, 2163.0, 3331.0, 5098.0, 7994.0, 12461.0, 19181.0, 30479.0, 48710.0, 78657.0, 122304.0, 164260.0, 171719.0, 135512.0, 89926.0, 56008.0, 34734.0, 21943.0, 14334.0, 9040.0, 5821.0, 3814.0, 2390.0, 1575.0, 1016.0, 671.0, 415.0, 288.0, 224.0, 130.0, 89.0, 62.0, 46.0, 28.0, 18.0, 13.0, 9.0, 7.0, 1.0, 5.0, 1.0, 0.0, 2.0], "bins": [-34.84375, -33.79248046875, -32.7412109375, -31.68994140625, -30.638671875, -29.58740234375, -28.5361328125, -27.48486328125, -26.43359375, -25.38232421875, -24.3310546875, -23.27978515625, -22.228515625, -21.17724609375, -20.1259765625, -19.07470703125, -18.0234375, -16.97216796875, -15.9208984375, -14.86962890625, -13.818359375, -12.76708984375, -11.7158203125, -10.66455078125, -9.61328125, -8.56201171875, -7.5107421875, -6.45947265625, -5.408203125, -4.35693359375, -3.3056640625, -2.25439453125, -1.203125, -0.15185546875, 0.8994140625, 1.95068359375, 3.001953125, 4.05322265625, 5.1044921875, 6.15576171875, 7.20703125, 8.25830078125, 9.3095703125, 10.36083984375, 11.412109375, 12.46337890625, 13.5146484375, 14.56591796875, 15.6171875, 16.66845703125, 17.7197265625, 18.77099609375, 19.822265625, 20.87353515625, 21.9248046875, 22.97607421875, 24.02734375, 25.07861328125, 26.1298828125, 27.18115234375, 28.232421875, 29.28369140625, 30.3349609375, 31.38623046875, 32.4375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 8.0, 5.0, 15.0, 14.0, 9.0, 15.0, 20.0, 18.0, 37.0, 27.0, 26.0, 35.0, 38.0, 34.0, 40.0, 56.0, 43.0, 42.0, 39.0, 38.0, 42.0, 38.0, 33.0, 35.0, 39.0, 25.0, 21.0, 31.0, 21.0, 22.0, 21.0, 18.0, 11.0, 13.0, 16.0, 14.0, 6.0, 5.0, 3.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0], "bins": [-20.828125, -20.22509765625, -19.6220703125, -19.01904296875, -18.416015625, -17.81298828125, -17.2099609375, -16.60693359375, -16.00390625, -15.40087890625, -14.7978515625, -14.19482421875, -13.591796875, -12.98876953125, -12.3857421875, -11.78271484375, -11.1796875, -10.57666015625, -9.9736328125, -9.37060546875, -8.767578125, -8.16455078125, -7.5615234375, -6.95849609375, -6.35546875, -5.75244140625, -5.1494140625, -4.54638671875, -3.943359375, -3.34033203125, -2.7373046875, -2.13427734375, -1.53125, -0.92822265625, -0.3251953125, 0.27783203125, 0.880859375, 1.48388671875, 2.0869140625, 2.68994140625, 3.29296875, 3.89599609375, 4.4990234375, 5.10205078125, 5.705078125, 6.30810546875, 6.9111328125, 7.51416015625, 8.1171875, 8.72021484375, 9.3232421875, 9.92626953125, 10.529296875, 11.13232421875, 11.7353515625, 12.33837890625, 12.94140625, 13.54443359375, 14.1474609375, 14.75048828125, 15.353515625, 15.95654296875, 16.5595703125, 17.16259765625, 17.765625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 12.0, 13.0, 19.0, 26.0, 32.0, 47.0, 81.0, 103.0, 144.0, 214.0, 324.0, 514.0, 654.0, 1149.0, 1792.0, 2939.0, 4666.0, 7946.0, 13700.0, 24290.0, 45850.0, 94388.0, 206176.0, 298816.0, 173837.0, 79421.0, 39571.0, 21251.0, 11943.0, 6993.0, 4296.0, 2631.0, 1633.0, 1000.0, 659.0, 470.0, 317.0, 190.0, 143.0, 78.0, 65.0, 42.0, 32.0, 33.0, 12.0, 13.0, 11.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.90625, -54.125, -52.34375, -50.5625, -48.78125, -47.0, -45.21875, -43.4375, -41.65625, -39.875, -38.09375, -36.3125, -34.53125, -32.75, -30.96875, -29.1875, -27.40625, -25.625, -23.84375, -22.0625, -20.28125, -18.5, -16.71875, -14.9375, -13.15625, -11.375, -9.59375, -7.8125, -6.03125, -4.25, -2.46875, -0.6875, 1.09375, 2.875, 4.65625, 6.4375, 8.21875, 10.0, 11.78125, 13.5625, 15.34375, 17.125, 18.90625, 20.6875, 22.46875, 24.25, 26.03125, 27.8125, 29.59375, 31.375, 33.15625, 34.9375, 36.71875, 38.5, 40.28125, 42.0625, 43.84375, 45.625, 47.40625, 49.1875, 50.96875, 52.75, 54.53125, 56.3125, 58.09375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 9.0, 10.0, 13.0, 7.0, 10.0, 11.0, 16.0, 22.0, 24.0, 25.0, 28.0, 32.0, 24.0, 33.0, 47.0, 36.0, 49.0, 46.0, 45.0, 39.0, 53.0, 38.0, 38.0, 28.0, 38.0, 38.0, 28.0, 33.0, 28.0, 19.0, 22.0, 14.0, 17.0, 12.0, 13.0, 13.0, 7.0, 4.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -14.076904296875, -13.63037109375, -13.183837890625, -12.7373046875, -12.290771484375, -11.84423828125, -11.397705078125, -10.951171875, -10.504638671875, -10.05810546875, -9.611572265625, -9.1650390625, -8.718505859375, -8.27197265625, -7.825439453125, -7.37890625, -6.932373046875, -6.48583984375, -6.039306640625, -5.5927734375, -5.146240234375, -4.69970703125, -4.253173828125, -3.806640625, -3.360107421875, -2.91357421875, -2.467041015625, -2.0205078125, -1.573974609375, -1.12744140625, -0.680908203125, -0.234375, 0.212158203125, 0.65869140625, 1.105224609375, 1.5517578125, 1.998291015625, 2.44482421875, 2.891357421875, 3.337890625, 3.784423828125, 4.23095703125, 4.677490234375, 5.1240234375, 5.570556640625, 6.01708984375, 6.463623046875, 6.91015625, 7.356689453125, 7.80322265625, 8.249755859375, 8.6962890625, 9.142822265625, 9.58935546875, 10.035888671875, 10.482421875, 10.928955078125, 11.37548828125, 11.822021484375, 12.2685546875, 12.715087890625, 13.16162109375, 13.608154296875, 14.0546875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 11.0, 11.0, 15.0, 24.0, 25.0, 54.0, 49.0, 64.0, 95.0, 142.0, 212.0, 337.0, 488.0, 761.0, 1275.0, 2252.0, 4365.0, 9632.0, 25431.0, 79067.0, 261465.0, 410465.0, 168848.0, 50656.0, 17638.0, 6991.0, 3391.0, 1787.0, 1028.0, 644.0, 427.0, 265.0, 181.0, 121.0, 101.0, 58.0, 42.0, 32.0, 27.0, 23.0, 15.0, 9.0, 14.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 3.0], "bins": [-34.40625, -33.431884765625, -32.45751953125, -31.483154296875, -30.5087890625, -29.534423828125, -28.56005859375, -27.585693359375, -26.611328125, -25.636962890625, -24.66259765625, -23.688232421875, -22.7138671875, -21.739501953125, -20.76513671875, -19.790771484375, -18.81640625, -17.842041015625, -16.86767578125, -15.893310546875, -14.9189453125, -13.944580078125, -12.97021484375, -11.995849609375, -11.021484375, -10.047119140625, -9.07275390625, -8.098388671875, -7.1240234375, -6.149658203125, -5.17529296875, -4.200927734375, -3.2265625, -2.252197265625, -1.27783203125, -0.303466796875, 0.6708984375, 1.645263671875, 2.61962890625, 3.593994140625, 4.568359375, 5.542724609375, 6.51708984375, 7.491455078125, 8.4658203125, 9.440185546875, 10.41455078125, 11.388916015625, 12.36328125, 13.337646484375, 14.31201171875, 15.286376953125, 16.2607421875, 17.235107421875, 18.20947265625, 19.183837890625, 20.158203125, 21.132568359375, 22.10693359375, 23.081298828125, 24.0556640625, 25.030029296875, 26.00439453125, 26.978759765625, 27.953125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 6.0, 13.0, 9.0, 12.0, 14.0, 16.0, 35.0, 67.0, 106.0, 173.0, 161.0, 127.0, 89.0, 46.0, 29.0, 14.0, 18.0, 17.0, 13.0, 7.0, 1.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023822784423828125, -0.0023037195205688477, -0.002225160598754883, -0.002146601676940918, -0.002068042755126953, -0.0019894838333129883, -0.0019109249114990234, -0.0018323659896850586, -0.0017538070678710938, -0.001675248146057129, -0.001596689224243164, -0.0015181303024291992, -0.0014395713806152344, -0.0013610124588012695, -0.0012824535369873047, -0.0012038946151733398, -0.001125335693359375, -0.0010467767715454102, -0.0009682178497314453, -0.0008896589279174805, -0.0008111000061035156, -0.0007325410842895508, -0.0006539821624755859, -0.0005754232406616211, -0.0004968643188476562, -0.0004183053970336914, -0.00033974647521972656, -0.0002611875534057617, -0.00018262863159179688, -0.00010406970977783203, -2.5510787963867188e-05, 5.3048133850097656e-05, 0.0001316070556640625, 0.00021016597747802734, 0.0002887248992919922, 0.00036728382110595703, 0.0004458427429199219, 0.0005244016647338867, 0.0006029605865478516, 0.0006815195083618164, 0.0007600784301757812, 0.0008386373519897461, 0.0009171962738037109, 0.0009957551956176758, 0.0010743141174316406, 0.0011528730392456055, 0.0012314319610595703, 0.0013099908828735352, 0.0013885498046875, 0.0014671087265014648, 0.0015456676483154297, 0.0016242265701293945, 0.0017027854919433594, 0.0017813444137573242, 0.001859903335571289, 0.001938462257385254, 0.0020170211791992188, 0.0020955801010131836, 0.0021741390228271484, 0.0022526979446411133, 0.002331256866455078, 0.002409815788269043, 0.002488374710083008, 0.0025669336318969727, 0.0026454925537109375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 6.0, 5.0, 16.0, 14.0, 24.0, 21.0, 48.0, 76.0, 96.0, 126.0, 196.0, 269.0, 384.0, 528.0, 810.0, 1441.0, 2479.0, 4676.0, 9028.0, 18956.0, 40818.0, 90551.0, 178841.0, 256017.0, 216253.0, 120482.0, 55589.0, 25117.0, 11924.0, 5873.0, 3046.0, 1761.0, 1030.0, 639.0, 441.0, 301.0, 192.0, 154.0, 90.0, 72.0, 39.0, 35.0, 30.0, 20.0, 17.0, 8.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-26.90625, -26.130615234375, -25.35498046875, -24.579345703125, -23.8037109375, -23.028076171875, -22.25244140625, -21.476806640625, -20.701171875, -19.925537109375, -19.14990234375, -18.374267578125, -17.5986328125, -16.822998046875, -16.04736328125, -15.271728515625, -14.49609375, -13.720458984375, -12.94482421875, -12.169189453125, -11.3935546875, -10.617919921875, -9.84228515625, -9.066650390625, -8.291015625, -7.515380859375, -6.73974609375, -5.964111328125, -5.1884765625, -4.412841796875, -3.63720703125, -2.861572265625, -2.0859375, -1.310302734375, -0.53466796875, 0.240966796875, 1.0166015625, 1.792236328125, 2.56787109375, 3.343505859375, 4.119140625, 4.894775390625, 5.67041015625, 6.446044921875, 7.2216796875, 7.997314453125, 8.77294921875, 9.548583984375, 10.32421875, 11.099853515625, 11.87548828125, 12.651123046875, 13.4267578125, 14.202392578125, 14.97802734375, 15.753662109375, 16.529296875, 17.304931640625, 18.08056640625, 18.856201171875, 19.6318359375, 20.407470703125, 21.18310546875, 21.958740234375, 22.734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 9.0, 5.0, 9.0, 14.0, 23.0, 28.0, 27.0, 32.0, 50.0, 57.0, 72.0, 61.0, 93.0, 70.0, 57.0, 70.0, 56.0, 44.0, 39.0, 25.0, 30.0, 21.0, 17.0, 16.0, 13.0, 8.0, 12.0, 7.0, 3.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.34375, -9.0885009765625, -8.833251953125, -8.5780029296875, -8.32275390625, -8.0675048828125, -7.812255859375, -7.5570068359375, -7.3017578125, -7.0465087890625, -6.791259765625, -6.5360107421875, -6.28076171875, -6.0255126953125, -5.770263671875, -5.5150146484375, -5.259765625, -5.0045166015625, -4.749267578125, -4.4940185546875, -4.23876953125, -3.9835205078125, -3.728271484375, -3.4730224609375, -3.2177734375, -2.9625244140625, -2.707275390625, -2.4520263671875, -2.19677734375, -1.9415283203125, -1.686279296875, -1.4310302734375, -1.17578125, -0.9205322265625, -0.665283203125, -0.4100341796875, -0.15478515625, 0.1004638671875, 0.355712890625, 0.6109619140625, 0.8662109375, 1.1214599609375, 1.376708984375, 1.6319580078125, 1.88720703125, 2.1424560546875, 2.397705078125, 2.6529541015625, 2.908203125, 3.1634521484375, 3.418701171875, 3.6739501953125, 3.92919921875, 4.1844482421875, 4.439697265625, 4.6949462890625, 4.9501953125, 5.2054443359375, 5.460693359375, 5.7159423828125, 5.97119140625, 6.2264404296875, 6.481689453125, 6.7369384765625, 6.9921875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 8.0, 7.0, 10.0, 18.0, 12.0, 21.0, 16.0, 25.0, 24.0, 39.0, 29.0, 32.0, 28.0, 41.0, 34.0, 40.0, 37.0, 44.0, 51.0, 43.0, 39.0, 38.0, 52.0, 36.0, 33.0, 36.0, 23.0, 33.0, 16.0, 25.0, 20.0, 18.0, 18.0, 12.0, 8.0, 9.0, 6.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.797592163085938, -18.215620040893555, -17.633647918701172, -17.05167579650879, -16.469703674316406, -15.887730598449707, -15.305757522583008, -14.723785400390625, -14.141813278198242, -13.55984115600586, -12.977869033813477, -12.395895957946777, -11.813923835754395, -11.231951713562012, -10.649978637695312, -10.06800651550293, -9.486034393310547, -8.904062271118164, -8.322090148925781, -7.740117073059082, -7.158144950866699, -6.576172828674316, -5.994200229644775, -5.412227630615234, -4.830255508422852, -4.248283386230469, -3.6663107872009277, -3.084338426589966, -2.502366065979004, -1.920393705368042, -1.33842134475708, -0.7564487457275391, -0.17447471618652344, 0.4074976444244385, 0.9894700050354004, 1.5714423656463623, 2.153414726257324, 2.735387086868286, 3.317359447479248, 3.899332046508789, 4.481304168701172, 5.063276290893555, 5.645248889923096, 6.227221488952637, 6.8091936111450195, 7.391165733337402, 7.973138332366943, 8.555110931396484, 9.137083053588867, 9.71905517578125, 10.301027297973633, 10.883000373840332, 11.464972496032715, 12.046944618225098, 12.628917694091797, 13.21088981628418, 13.792861938476562, 14.374834060668945, 14.956806182861328, 15.538779258728027, 16.120750427246094, 16.70272445678711, 17.284696578979492, 17.866668701171875, 18.448640823364258]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 0.0, 5.0, 8.0, 9.0, 13.0, 7.0, 10.0, 17.0, 22.0, 13.0, 24.0, 17.0, 29.0, 34.0, 45.0, 41.0, 33.0, 43.0, 42.0, 34.0, 36.0, 38.0, 39.0, 48.0, 44.0, 34.0, 38.0, 26.0, 31.0, 18.0, 19.0, 30.0, 20.0, 14.0, 24.0, 17.0, 10.0, 13.0, 11.0, 6.0, 4.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-19.259403228759766, -18.68049430847168, -18.10158348083496, -17.522674560546875, -16.94376564025879, -16.364856719970703, -15.785945892333984, -15.207036972045898, -14.628127098083496, -14.049217224121094, -13.470308303833008, -12.891398429870605, -12.312488555908203, -11.733579635620117, -11.154669761657715, -10.575759887695312, -9.996850967407227, -9.417941093444824, -8.839032173156738, -8.260122299194336, -7.681212902069092, -7.102303504943848, -6.523393630981445, -5.944484233856201, -5.365574836730957, -4.786665439605713, -4.207756042480469, -3.6288461685180664, -3.0499367713928223, -2.471027374267578, -1.8921177387237549, -1.3132081031799316, -0.7343006134033203, -0.15539109706878662, 0.42351841926574707, 1.0024279356002808, 1.5813374519348145, 2.1602468490600586, 2.739156484603882, 3.318066120147705, 3.896975517272949, 4.475884914398193, 5.0547943115234375, 5.63370418548584, 6.212613582611084, 6.791522979736328, 7.3704328536987305, 7.949342250823975, 8.528251647949219, 9.107161521911621, 9.686070442199707, 10.26498031616211, 10.843889236450195, 11.422799110412598, 12.001708984375, 12.580617904663086, 13.159527778625488, 13.73843765258789, 14.317346572875977, 14.896256446838379, 15.475166320800781, 16.054075241088867, 16.632984161376953, 17.211894989013672, 17.790803909301758]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 9.0, 4.0, 14.0, 15.0, 34.0, 41.0, 70.0, 90.0, 151.0, 232.0, 399.0, 588.0, 922.0, 1397.0, 2287.0, 3545.0, 5119.0, 7907.0, 11975.0, 17607.0, 25552.0, 35484.0, 48009.0, 63166.0, 80541.0, 94776.0, 104581.0, 106070.0, 98789.0, 85718.0, 69844.0, 54102.0, 39790.0, 28818.0, 19897.0, 13826.0, 9452.0, 6155.0, 4081.0, 2573.0, 1757.0, 1098.0, 778.0, 485.0, 284.0, 196.0, 132.0, 78.0, 44.0, 37.0, 14.0, 10.0, 7.0, 10.0, 4.0, 1.0, 0.0, 0.0, 4.0], "bins": [-20.171875, -19.545166015625, -18.91845703125, -18.291748046875, -17.6650390625, -17.038330078125, -16.41162109375, -15.784912109375, -15.158203125, -14.531494140625, -13.90478515625, -13.278076171875, -12.6513671875, -12.024658203125, -11.39794921875, -10.771240234375, -10.14453125, -9.517822265625, -8.89111328125, -8.264404296875, -7.6376953125, -7.010986328125, -6.38427734375, -5.757568359375, -5.130859375, -4.504150390625, -3.87744140625, -3.250732421875, -2.6240234375, -1.997314453125, -1.37060546875, -0.743896484375, -0.1171875, 0.509521484375, 1.13623046875, 1.762939453125, 2.3896484375, 3.016357421875, 3.64306640625, 4.269775390625, 4.896484375, 5.523193359375, 6.14990234375, 6.776611328125, 7.4033203125, 8.030029296875, 8.65673828125, 9.283447265625, 9.91015625, 10.536865234375, 11.16357421875, 11.790283203125, 12.4169921875, 13.043701171875, 13.67041015625, 14.297119140625, 14.923828125, 15.550537109375, 16.17724609375, 16.803955078125, 17.4306640625, 18.057373046875, 18.68408203125, 19.310791015625, 19.9375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 13.0, 15.0, 8.0, 12.0, 19.0, 14.0, 20.0, 29.0, 30.0, 40.0, 42.0, 46.0, 45.0, 36.0, 42.0, 41.0, 43.0, 46.0, 43.0, 42.0, 34.0, 37.0, 32.0, 31.0, 26.0, 27.0, 21.0, 28.0, 25.0, 16.0, 18.0, 7.0, 8.0, 6.0, 8.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.703125, -19.115966796875, -18.52880859375, -17.941650390625, -17.3544921875, -16.767333984375, -16.18017578125, -15.593017578125, -15.005859375, -14.418701171875, -13.83154296875, -13.244384765625, -12.6572265625, -12.070068359375, -11.48291015625, -10.895751953125, -10.30859375, -9.721435546875, -9.13427734375, -8.547119140625, -7.9599609375, -7.372802734375, -6.78564453125, -6.198486328125, -5.611328125, -5.024169921875, -4.43701171875, -3.849853515625, -3.2626953125, -2.675537109375, -2.08837890625, -1.501220703125, -0.9140625, -0.326904296875, 0.26025390625, 0.847412109375, 1.4345703125, 2.021728515625, 2.60888671875, 3.196044921875, 3.783203125, 4.370361328125, 4.95751953125, 5.544677734375, 6.1318359375, 6.718994140625, 7.30615234375, 7.893310546875, 8.48046875, 9.067626953125, 9.65478515625, 10.241943359375, 10.8291015625, 11.416259765625, 12.00341796875, 12.590576171875, 13.177734375, 13.764892578125, 14.35205078125, 14.939208984375, 15.5263671875, 16.113525390625, 16.70068359375, 17.287841796875, 17.875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 8.0, 13.0, 32.0, 42.0, 74.0, 101.0, 167.0, 241.0, 419.0, 605.0, 1035.0, 1697.0, 2514.0, 4081.0, 6239.0, 9323.0, 14216.0, 20466.0, 29906.0, 41612.0, 55268.0, 72210.0, 87756.0, 99176.0, 106133.0, 103286.0, 93629.0, 79213.0, 62652.0, 47800.0, 34769.0, 24679.0, 16885.0, 11258.0, 7590.0, 4888.0, 3115.0, 2000.0, 1367.0, 765.0, 491.0, 310.0, 205.0, 108.0, 89.0, 48.0, 30.0, 21.0, 9.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0], "bins": [-19.671875, -19.088623046875, -18.50537109375, -17.922119140625, -17.3388671875, -16.755615234375, -16.17236328125, -15.589111328125, -15.005859375, -14.422607421875, -13.83935546875, -13.256103515625, -12.6728515625, -12.089599609375, -11.50634765625, -10.923095703125, -10.33984375, -9.756591796875, -9.17333984375, -8.590087890625, -8.0068359375, -7.423583984375, -6.84033203125, -6.257080078125, -5.673828125, -5.090576171875, -4.50732421875, -3.924072265625, -3.3408203125, -2.757568359375, -2.17431640625, -1.591064453125, -1.0078125, -0.424560546875, 0.15869140625, 0.741943359375, 1.3251953125, 1.908447265625, 2.49169921875, 3.074951171875, 3.658203125, 4.241455078125, 4.82470703125, 5.407958984375, 5.9912109375, 6.574462890625, 7.15771484375, 7.740966796875, 8.32421875, 8.907470703125, 9.49072265625, 10.073974609375, 10.6572265625, 11.240478515625, 11.82373046875, 12.406982421875, 12.990234375, 13.573486328125, 14.15673828125, 14.739990234375, 15.3232421875, 15.906494140625, 16.48974609375, 17.072998046875, 17.65625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 10.0, 9.0, 15.0, 19.0, 17.0, 21.0, 21.0, 30.0, 24.0, 41.0, 30.0, 45.0, 43.0, 48.0, 53.0, 47.0, 37.0, 54.0, 43.0, 45.0, 45.0, 46.0, 34.0, 37.0, 25.0, 30.0, 19.0, 19.0, 11.0, 20.0, 12.0, 11.0, 6.0, 4.0, 3.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.1015625, -13.6748046875, -13.248046875, -12.8212890625, -12.39453125, -11.9677734375, -11.541015625, -11.1142578125, -10.6875, -10.2607421875, -9.833984375, -9.4072265625, -8.98046875, -8.5537109375, -8.126953125, -7.7001953125, -7.2734375, -6.8466796875, -6.419921875, -5.9931640625, -5.56640625, -5.1396484375, -4.712890625, -4.2861328125, -3.859375, -3.4326171875, -3.005859375, -2.5791015625, -2.15234375, -1.7255859375, -1.298828125, -0.8720703125, -0.4453125, -0.0185546875, 0.408203125, 0.8349609375, 1.26171875, 1.6884765625, 2.115234375, 2.5419921875, 2.96875, 3.3955078125, 3.822265625, 4.2490234375, 4.67578125, 5.1025390625, 5.529296875, 5.9560546875, 6.3828125, 6.8095703125, 7.236328125, 7.6630859375, 8.08984375, 8.5166015625, 8.943359375, 9.3701171875, 9.796875, 10.2236328125, 10.650390625, 11.0771484375, 11.50390625, 11.9306640625, 12.357421875, 12.7841796875, 13.2109375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 11.0, 12.0, 23.0, 26.0, 42.0, 55.0, 79.0, 106.0, 157.0, 233.0, 338.0, 507.0, 713.0, 1056.0, 1629.0, 2568.0, 4438.0, 7894.0, 15272.0, 30847.0, 64649.0, 129508.0, 213250.0, 234077.0, 165298.0, 88064.0, 42368.0, 20329.0, 10315.0, 5436.0, 3246.0, 2029.0, 1319.0, 867.0, 519.0, 370.0, 281.0, 188.0, 136.0, 72.0, 69.0, 45.0, 39.0, 23.0, 14.0, 14.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.1328125, -14.64794921875, -14.1630859375, -13.67822265625, -13.193359375, -12.70849609375, -12.2236328125, -11.73876953125, -11.25390625, -10.76904296875, -10.2841796875, -9.79931640625, -9.314453125, -8.82958984375, -8.3447265625, -7.85986328125, -7.375, -6.89013671875, -6.4052734375, -5.92041015625, -5.435546875, -4.95068359375, -4.4658203125, -3.98095703125, -3.49609375, -3.01123046875, -2.5263671875, -2.04150390625, -1.556640625, -1.07177734375, -0.5869140625, -0.10205078125, 0.3828125, 0.86767578125, 1.3525390625, 1.83740234375, 2.322265625, 2.80712890625, 3.2919921875, 3.77685546875, 4.26171875, 4.74658203125, 5.2314453125, 5.71630859375, 6.201171875, 6.68603515625, 7.1708984375, 7.65576171875, 8.140625, 8.62548828125, 9.1103515625, 9.59521484375, 10.080078125, 10.56494140625, 11.0498046875, 11.53466796875, 12.01953125, 12.50439453125, 12.9892578125, 13.47412109375, 13.958984375, 14.44384765625, 14.9287109375, 15.41357421875, 15.8984375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 6.0, 2.0, 6.0, 6.0, 11.0, 13.0, 13.0, 22.0, 30.0, 30.0, 53.0, 67.0, 83.0, 79.0, 109.0, 94.0, 82.0, 75.0, 48.0, 33.0, 42.0, 28.0, 15.0, 21.0, 6.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002346038818359375, -0.0022850781679153442, -0.0022241175174713135, -0.0021631568670272827, -0.002102196216583252, -0.002041235566139221, -0.0019802749156951904, -0.0019193142652511597, -0.001858353614807129, -0.0017973929643630981, -0.0017364323139190674, -0.0016754716634750366, -0.0016145110130310059, -0.001553550362586975, -0.0014925897121429443, -0.0014316290616989136, -0.0013706684112548828, -0.001309707760810852, -0.0012487471103668213, -0.0011877864599227905, -0.0011268258094787598, -0.001065865159034729, -0.0010049045085906982, -0.0009439438581466675, -0.0008829832077026367, -0.000822022557258606, -0.0007610619068145752, -0.0007001012563705444, -0.0006391406059265137, -0.0005781799554824829, -0.0005172193050384521, -0.0004562586545944214, -0.0003952980041503906, -0.00033433735370635986, -0.0002733767032623291, -0.00021241605281829834, -0.00015145540237426758, -9.049475193023682e-05, -2.9534101486206055e-05, 3.142654895782471e-05, 9.238719940185547e-05, 0.00015334784984588623, 0.000214308500289917, 0.00027526915073394775, 0.0003362298011779785, 0.0003971904516220093, 0.00045815110206604004, 0.0005191117525100708, 0.0005800724029541016, 0.0006410330533981323, 0.0007019937038421631, 0.0007629543542861938, 0.0008239150047302246, 0.0008848756551742554, 0.0009458363056182861, 0.001006796956062317, 0.0010677576065063477, 0.0011287182569503784, 0.0011896789073944092, 0.00125063955783844, 0.0013116002082824707, 0.0013725608587265015, 0.0014335215091705322, 0.001494482159614563, 0.0015554428100585938]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 6.0, 13.0, 12.0, 15.0, 21.0, 40.0, 36.0, 54.0, 103.0, 130.0, 194.0, 261.0, 403.0, 587.0, 843.0, 1297.0, 2196.0, 3318.0, 5516.0, 8930.0, 14909.0, 25283.0, 41744.0, 67013.0, 102787.0, 141062.0, 162048.0, 151544.0, 115421.0, 78109.0, 48861.0, 30069.0, 17733.0, 10661.0, 6376.0, 3882.0, 2431.0, 1598.0, 959.0, 638.0, 452.0, 306.0, 220.0, 132.0, 109.0, 65.0, 48.0, 35.0, 23.0, 22.0, 20.0, 9.0, 9.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.5078125, -9.19775390625, -8.8876953125, -8.57763671875, -8.267578125, -7.95751953125, -7.6474609375, -7.33740234375, -7.02734375, -6.71728515625, -6.4072265625, -6.09716796875, -5.787109375, -5.47705078125, -5.1669921875, -4.85693359375, -4.546875, -4.23681640625, -3.9267578125, -3.61669921875, -3.306640625, -2.99658203125, -2.6865234375, -2.37646484375, -2.06640625, -1.75634765625, -1.4462890625, -1.13623046875, -0.826171875, -0.51611328125, -0.2060546875, 0.10400390625, 0.4140625, 0.72412109375, 1.0341796875, 1.34423828125, 1.654296875, 1.96435546875, 2.2744140625, 2.58447265625, 2.89453125, 3.20458984375, 3.5146484375, 3.82470703125, 4.134765625, 4.44482421875, 4.7548828125, 5.06494140625, 5.375, 5.68505859375, 5.9951171875, 6.30517578125, 6.615234375, 6.92529296875, 7.2353515625, 7.54541015625, 7.85546875, 8.16552734375, 8.4755859375, 8.78564453125, 9.095703125, 9.40576171875, 9.7158203125, 10.02587890625, 10.3359375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 0.0, 4.0, 2.0, 6.0, 2.0, 9.0, 13.0, 15.0, 17.0, 19.0, 26.0, 31.0, 37.0, 42.0, 32.0, 50.0, 49.0, 49.0, 52.0, 52.0, 59.0, 42.0, 51.0, 48.0, 56.0, 40.0, 33.0, 36.0, 26.0, 20.0, 16.0, 20.0, 17.0, 11.0, 5.0, 3.0, 3.0, 0.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.96136474609375, -3.8367919921875, -3.71221923828125, -3.587646484375, -3.46307373046875, -3.3385009765625, -3.21392822265625, -3.08935546875, -2.96478271484375, -2.8402099609375, -2.71563720703125, -2.591064453125, -2.46649169921875, -2.3419189453125, -2.21734619140625, -2.0927734375, -1.96820068359375, -1.8436279296875, -1.71905517578125, -1.594482421875, -1.46990966796875, -1.3453369140625, -1.22076416015625, -1.09619140625, -0.97161865234375, -0.8470458984375, -0.72247314453125, -0.597900390625, -0.47332763671875, -0.3487548828125, -0.22418212890625, -0.099609375, 0.02496337890625, 0.1495361328125, 0.27410888671875, 0.398681640625, 0.52325439453125, 0.6478271484375, 0.77239990234375, 0.89697265625, 1.02154541015625, 1.1461181640625, 1.27069091796875, 1.395263671875, 1.51983642578125, 1.6444091796875, 1.76898193359375, 1.8935546875, 2.01812744140625, 2.1427001953125, 2.26727294921875, 2.391845703125, 2.51641845703125, 2.6409912109375, 2.76556396484375, 2.89013671875, 3.01470947265625, 3.1392822265625, 3.26385498046875, 3.388427734375, 3.51300048828125, 3.6375732421875, 3.76214599609375, 3.88671875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 10.0, 16.0, 18.0, 25.0, 20.0, 34.0, 29.0, 23.0, 34.0, 33.0, 41.0, 56.0, 46.0, 40.0, 51.0, 40.0, 45.0, 48.0, 51.0, 48.0, 42.0, 37.0, 30.0, 14.0, 26.0, 21.0, 18.0, 22.0, 13.0, 11.0, 8.0, 13.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.25560188293457, -17.62774658203125, -16.99989128112793, -16.37203598022461, -15.744180679321289, -15.116325378417969, -14.488469123840332, -13.860613822937012, -13.232758522033691, -12.604903221130371, -11.97704792022705, -11.34919261932373, -10.721336364746094, -10.093481063842773, -9.465625762939453, -8.837770462036133, -8.209915161132812, -7.582059860229492, -6.954204559326172, -6.326348781585693, -5.698493480682373, -5.070638179779053, -4.442782402038574, -3.814927101135254, -3.1870718002319336, -2.5592164993286133, -1.9313609600067139, -1.303505539894104, -0.6756501197814941, -0.04779481887817383, 0.5800607204437256, 1.207916259765625, 1.8357734680175781, 2.4636287689208984, 3.091484308242798, 3.7193398475646973, 4.347195148468018, 4.975050449371338, 5.602906227111816, 6.230761528015137, 6.858616828918457, 7.486472129821777, 8.114327430725098, 8.742182731628418, 9.370038986206055, 9.997894287109375, 10.625749588012695, 11.253604888916016, 11.881460189819336, 12.509315490722656, 13.137170791625977, 13.765026092529297, 14.392881393432617, 15.020736694335938, 15.648592948913574, 16.276447296142578, 16.90430450439453, 17.53215980529785, 18.160015106201172, 18.787870407104492, 19.415725708007812, 20.043581008911133, 20.671436309814453, 21.299293518066406, 21.927146911621094]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 3.0, 4.0, 1.0, 4.0, 6.0, 4.0, 5.0, 12.0, 9.0, 13.0, 6.0, 17.0, 21.0, 22.0, 26.0, 33.0, 21.0, 35.0, 34.0, 49.0, 50.0, 38.0, 39.0, 36.0, 40.0, 40.0, 33.0, 42.0, 39.0, 40.0, 36.0, 24.0, 28.0, 24.0, 27.0, 15.0, 15.0, 17.0, 10.0, 6.0, 14.0, 12.0, 13.0, 8.0, 8.0, 5.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-18.44998550415039, -17.86862564086914, -17.28726577758789, -16.70590591430664, -16.124544143676758, -15.543184280395508, -14.961824417114258, -14.380464553833008, -13.799104690551758, -13.217744827270508, -12.636384010314941, -12.055024147033691, -11.473664283752441, -10.892303466796875, -10.310943603515625, -9.729583740234375, -9.148222923278809, -8.566863059997559, -7.98550271987915, -7.404142379760742, -6.822782516479492, -6.241422176361084, -5.660061836242676, -5.078701972961426, -4.497341632843018, -3.9159815311431885, -3.3346214294433594, -2.753261089324951, -2.171900987625122, -1.590540885925293, -1.0091805458068848, -0.42782068252563477, 0.15353965759277344, 0.7348998188972473, 1.3162599802017212, 1.8976202011108398, 2.478980302810669, 3.060340404510498, 3.6417007446289062, 4.223060607910156, 4.8044209480285645, 5.385781288146973, 5.967141151428223, 6.548501491546631, 7.129861831665039, 7.711221694946289, 8.292581558227539, 8.873941421508789, 9.455302238464355, 10.036662101745605, 10.618022918701172, 11.199382781982422, 11.780742645263672, 12.362102508544922, 12.943463325500488, 13.524823188781738, 14.106184005737305, 14.687543869018555, 15.268904685974121, 15.850264549255371, 16.431625366210938, 17.012985229492188, 17.594345092773438, 18.175704956054688, 18.757064819335938]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [6.0, 8.0, 7.0, 9.0, 13.0, 27.0, 33.0, 65.0, 95.0, 172.0, 245.0, 357.0, 615.0, 999.0, 1641.0, 2590.0, 4245.0, 6749.0, 11210.0, 17769.0, 29177.0, 46679.0, 75836.0, 122406.0, 196658.0, 308575.0, 460503.0, 617052.0, 666345.0, 555846.0, 391303.0, 254943.0, 161401.0, 99805.0, 62076.0, 37873.0, 23356.0, 14392.0, 8776.0, 5398.0, 3356.0, 2092.0, 1374.0, 826.0, 489.0, 334.0, 203.0, 116.0, 107.0, 58.0, 37.0, 20.0, 11.0, 7.0, 5.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.3125, -17.665283203125, -17.01806640625, -16.370849609375, -15.7236328125, -15.076416015625, -14.42919921875, -13.781982421875, -13.134765625, -12.487548828125, -11.84033203125, -11.193115234375, -10.5458984375, -9.898681640625, -9.25146484375, -8.604248046875, -7.95703125, -7.309814453125, -6.66259765625, -6.015380859375, -5.3681640625, -4.720947265625, -4.07373046875, -3.426513671875, -2.779296875, -2.132080078125, -1.48486328125, -0.837646484375, -0.1904296875, 0.456787109375, 1.10400390625, 1.751220703125, 2.3984375, 3.045654296875, 3.69287109375, 4.340087890625, 4.9873046875, 5.634521484375, 6.28173828125, 6.928955078125, 7.576171875, 8.223388671875, 8.87060546875, 9.517822265625, 10.1650390625, 10.812255859375, 11.45947265625, 12.106689453125, 12.75390625, 13.401123046875, 14.04833984375, 14.695556640625, 15.3427734375, 15.989990234375, 16.63720703125, 17.284423828125, 17.931640625, 18.578857421875, 19.22607421875, 19.873291015625, 20.5205078125, 21.167724609375, 21.81494140625, 22.462158203125, 23.109375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 11.0, 8.0, 6.0, 11.0, 6.0, 17.0, 20.0, 18.0, 24.0, 26.0, 35.0, 43.0, 43.0, 35.0, 34.0, 46.0, 39.0, 49.0, 39.0, 46.0, 36.0, 35.0, 45.0, 39.0, 26.0, 39.0, 26.0, 21.0, 12.0, 22.0, 16.0, 13.0, 15.0, 17.0, 7.0, 16.0, 6.0, 8.0, 8.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.140625, -12.7105712890625, -12.280517578125, -11.8504638671875, -11.42041015625, -10.9903564453125, -10.560302734375, -10.1302490234375, -9.7001953125, -9.2701416015625, -8.840087890625, -8.4100341796875, -7.97998046875, -7.5499267578125, -7.119873046875, -6.6898193359375, -6.259765625, -5.8297119140625, -5.399658203125, -4.9696044921875, -4.53955078125, -4.1094970703125, -3.679443359375, -3.2493896484375, -2.8193359375, -2.3892822265625, -1.959228515625, -1.5291748046875, -1.09912109375, -0.6690673828125, -0.239013671875, 0.1910400390625, 0.62109375, 1.0511474609375, 1.481201171875, 1.9112548828125, 2.34130859375, 2.7713623046875, 3.201416015625, 3.6314697265625, 4.0615234375, 4.4915771484375, 4.921630859375, 5.3516845703125, 5.78173828125, 6.2117919921875, 6.641845703125, 7.0718994140625, 7.501953125, 7.9320068359375, 8.362060546875, 8.7921142578125, 9.22216796875, 9.6522216796875, 10.082275390625, 10.5123291015625, 10.9423828125, 11.3724365234375, 11.802490234375, 12.2325439453125, 12.66259765625, 13.0926513671875, 13.522705078125, 13.9527587890625, 14.3828125]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 5.0, 13.0, 12.0, 16.0, 38.0, 61.0, 96.0, 165.0, 257.0, 453.0, 727.0, 1234.0, 1864.0, 3082.0, 5021.0, 8647.0, 13765.0, 22655.0, 36806.0, 59477.0, 95596.0, 148615.0, 224357.0, 326499.0, 440888.0, 536882.0, 561824.0, 502254.0, 395711.0, 282723.0, 192301.0, 124621.0, 79752.0, 49480.0, 30659.0, 18569.0, 11441.0, 6986.0, 4149.0, 2560.0, 1572.0, 945.0, 543.0, 340.0, 236.0, 153.0, 86.0, 64.0, 34.0, 28.0, 13.0, 10.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.8046875, -13.34912109375, -12.8935546875, -12.43798828125, -11.982421875, -11.52685546875, -11.0712890625, -10.61572265625, -10.16015625, -9.70458984375, -9.2490234375, -8.79345703125, -8.337890625, -7.88232421875, -7.4267578125, -6.97119140625, -6.515625, -6.06005859375, -5.6044921875, -5.14892578125, -4.693359375, -4.23779296875, -3.7822265625, -3.32666015625, -2.87109375, -2.41552734375, -1.9599609375, -1.50439453125, -1.048828125, -0.59326171875, -0.1376953125, 0.31787109375, 0.7734375, 1.22900390625, 1.6845703125, 2.14013671875, 2.595703125, 3.05126953125, 3.5068359375, 3.96240234375, 4.41796875, 4.87353515625, 5.3291015625, 5.78466796875, 6.240234375, 6.69580078125, 7.1513671875, 7.60693359375, 8.0625, 8.51806640625, 8.9736328125, 9.42919921875, 9.884765625, 10.34033203125, 10.7958984375, 11.25146484375, 11.70703125, 12.16259765625, 12.6181640625, 13.07373046875, 13.529296875, 13.98486328125, 14.4404296875, 14.89599609375, 15.3515625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 11.0, 8.0, 17.0, 8.0, 15.0, 17.0, 31.0, 35.0, 43.0, 56.0, 62.0, 88.0, 98.0, 94.0, 111.0, 168.0, 171.0, 167.0, 191.0, 206.0, 232.0, 249.0, 249.0, 208.0, 200.0, 177.0, 188.0, 163.0, 154.0, 118.0, 115.0, 102.0, 64.0, 58.0, 47.0, 39.0, 40.0, 15.0, 15.0, 12.0, 6.0, 8.0, 4.0, 7.0, 5.0, 6.0, 3.0, 0.0, 1.0], "bins": [-7.88671875, -7.6708984375, -7.455078125, -7.2392578125, -7.0234375, -6.8076171875, -6.591796875, -6.3759765625, -6.16015625, -5.9443359375, -5.728515625, -5.5126953125, -5.296875, -5.0810546875, -4.865234375, -4.6494140625, -4.43359375, -4.2177734375, -4.001953125, -3.7861328125, -3.5703125, -3.3544921875, -3.138671875, -2.9228515625, -2.70703125, -2.4912109375, -2.275390625, -2.0595703125, -1.84375, -1.6279296875, -1.412109375, -1.1962890625, -0.98046875, -0.7646484375, -0.548828125, -0.3330078125, -0.1171875, 0.0986328125, 0.314453125, 0.5302734375, 0.74609375, 0.9619140625, 1.177734375, 1.3935546875, 1.609375, 1.8251953125, 2.041015625, 2.2568359375, 2.47265625, 2.6884765625, 2.904296875, 3.1201171875, 3.3359375, 3.5517578125, 3.767578125, 3.9833984375, 4.19921875, 4.4150390625, 4.630859375, 4.8466796875, 5.0625, 5.2783203125, 5.494140625, 5.7099609375, 5.92578125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 1.0, 6.0, 9.0, 13.0, 6.0, 10.0, 14.0, 18.0, 18.0, 25.0, 30.0, 40.0, 40.0, 51.0, 48.0, 45.0, 55.0, 56.0, 59.0, 51.0, 41.0, 44.0, 38.0, 25.0, 48.0, 37.0, 31.0, 25.0, 13.0, 13.0, 20.0, 12.0, 17.0, 7.0, 10.0, 7.0, 10.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.521527290344238, -14.977306365966797, -14.433084487915039, -13.888863563537598, -13.344642639160156, -12.800420761108398, -12.256199836730957, -11.711978912353516, -11.167757034301758, -10.623536109924316, -10.079314231872559, -9.535093307495117, -8.99087142944336, -8.446650505065918, -7.902429580688477, -7.358208179473877, -6.813986778259277, -6.269765377044678, -5.725543975830078, -5.181323051452637, -4.637101650238037, -4.0928802490234375, -3.548659086227417, -3.0044379234313965, -2.460216522216797, -1.9159952402114868, -1.3717739582061768, -0.8275526762008667, -0.28333139419555664, 0.26089000701904297, 0.8051111698150635, 1.349332332611084, 1.8935527801513672, 2.437774181365967, 2.9819953441619873, 3.526216506958008, 4.070437908172607, 4.614659309387207, 5.158880233764648, 5.703101634979248, 6.247323036193848, 6.791544437408447, 7.335765838623047, 7.879986763000488, 8.42420768737793, 8.968429565429688, 9.512650489807129, 10.05687141418457, 10.601093292236328, 11.14531421661377, 11.689536094665527, 12.233757019042969, 12.777978897094727, 13.322199821472168, 13.86642074584961, 14.410642623901367, 14.954863548278809, 15.49908447265625, 16.043306350708008, 16.587528228759766, 17.13174819946289, 17.67597007751465, 18.220191955566406, 18.76441192626953, 19.30863380432129]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 2.0, 10.0, 11.0, 12.0, 9.0, 12.0, 21.0, 17.0, 22.0, 18.0, 21.0, 39.0, 30.0, 30.0, 60.0, 52.0, 45.0, 44.0, 38.0, 42.0, 51.0, 38.0, 32.0, 35.0, 31.0, 33.0, 24.0, 30.0, 30.0, 20.0, 18.0, 14.0, 22.0, 17.0, 21.0, 6.0, 10.0, 8.0, 4.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.370956420898438, -15.827173233032227, -15.283390045166016, -14.739606857299805, -14.195823669433594, -13.652040481567383, -13.108257293701172, -12.564474105834961, -12.02069091796875, -11.476907730102539, -10.933124542236328, -10.389341354370117, -9.845558166503906, -9.301774978637695, -8.757991790771484, -8.214208602905273, -7.6704254150390625, -7.126642227172852, -6.582859039306641, -6.03907585144043, -5.495292663574219, -4.951509475708008, -4.407726287841797, -3.863943099975586, -3.320159912109375, -2.776376724243164, -2.232593536376953, -1.6888103485107422, -1.1450271606445312, -0.6012439727783203, -0.057460784912109375, 0.48632240295410156, 1.0301055908203125, 1.5738887786865234, 2.1176719665527344, 2.6614551544189453, 3.2052383422851562, 3.749021530151367, 4.292804718017578, 4.836587905883789, 5.38037109375, 5.924154281616211, 6.467937469482422, 7.011720657348633, 7.555503845214844, 8.099287033081055, 8.643070220947266, 9.186853408813477, 9.730636596679688, 10.274419784545898, 10.81820297241211, 11.36198616027832, 11.905769348144531, 12.449552536010742, 12.993335723876953, 13.537118911743164, 14.080902099609375, 14.624685287475586, 15.168468475341797, 15.712251663208008, 16.25603485107422, 16.79981803894043, 17.34360122680664, 17.88738441467285, 18.431167602539062]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 2.0, 11.0, 10.0, 19.0, 28.0, 53.0, 69.0, 107.0, 161.0, 267.0, 384.0, 609.0, 930.0, 1397.0, 2148.0, 3422.0, 5382.0, 8086.0, 12368.0, 19188.0, 28466.0, 41242.0, 58652.0, 76734.0, 95828.0, 109905.0, 115365.0, 110576.0, 95977.0, 77174.0, 58410.0, 41956.0, 28718.0, 19146.0, 12590.0, 8171.0, 5305.0, 3520.0, 2217.0, 1400.0, 926.0, 538.0, 411.0, 255.0, 157.0, 97.0, 76.0, 47.0, 21.0, 17.0, 11.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-24.25, -23.455078125, -22.66015625, -21.865234375, -21.0703125, -20.275390625, -19.48046875, -18.685546875, -17.890625, -17.095703125, -16.30078125, -15.505859375, -14.7109375, -13.916015625, -13.12109375, -12.326171875, -11.53125, -10.736328125, -9.94140625, -9.146484375, -8.3515625, -7.556640625, -6.76171875, -5.966796875, -5.171875, -4.376953125, -3.58203125, -2.787109375, -1.9921875, -1.197265625, -0.40234375, 0.392578125, 1.1875, 1.982421875, 2.77734375, 3.572265625, 4.3671875, 5.162109375, 5.95703125, 6.751953125, 7.546875, 8.341796875, 9.13671875, 9.931640625, 10.7265625, 11.521484375, 12.31640625, 13.111328125, 13.90625, 14.701171875, 15.49609375, 16.291015625, 17.0859375, 17.880859375, 18.67578125, 19.470703125, 20.265625, 21.060546875, 21.85546875, 22.650390625, 23.4453125, 24.240234375, 25.03515625, 25.830078125, 26.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 5.0, 10.0, 13.0, 7.0, 9.0, 27.0, 14.0, 28.0, 22.0, 15.0, 29.0, 34.0, 35.0, 37.0, 45.0, 32.0, 44.0, 48.0, 44.0, 47.0, 31.0, 37.0, 34.0, 37.0, 35.0, 30.0, 25.0, 36.0, 35.0, 19.0, 25.0, 20.0, 15.0, 16.0, 15.0, 11.0, 12.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.1015625, -10.7225341796875, -10.343505859375, -9.9644775390625, -9.58544921875, -9.2064208984375, -8.827392578125, -8.4483642578125, -8.0693359375, -7.6903076171875, -7.311279296875, -6.9322509765625, -6.55322265625, -6.1741943359375, -5.795166015625, -5.4161376953125, -5.037109375, -4.6580810546875, -4.279052734375, -3.9000244140625, -3.52099609375, -3.1419677734375, -2.762939453125, -2.3839111328125, -2.0048828125, -1.6258544921875, -1.246826171875, -0.8677978515625, -0.48876953125, -0.1097412109375, 0.269287109375, 0.6483154296875, 1.02734375, 1.4063720703125, 1.785400390625, 2.1644287109375, 2.54345703125, 2.9224853515625, 3.301513671875, 3.6805419921875, 4.0595703125, 4.4385986328125, 4.817626953125, 5.1966552734375, 5.57568359375, 5.9547119140625, 6.333740234375, 6.7127685546875, 7.091796875, 7.4708251953125, 7.849853515625, 8.2288818359375, 8.60791015625, 8.9869384765625, 9.365966796875, 9.7449951171875, 10.1240234375, 10.5030517578125, 10.882080078125, 11.2611083984375, 11.64013671875, 12.0191650390625, 12.398193359375, 12.7772216796875, 13.15625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 6.0, 10.0, 9.0, 11.0, 20.0, 35.0, 51.0, 75.0, 99.0, 120.0, 188.0, 292.0, 423.0, 666.0, 1042.0, 1555.0, 2376.0, 3824.0, 6185.0, 10232.0, 17539.0, 30905.0, 54083.0, 94393.0, 153283.0, 204784.0, 181364.0, 118262.0, 70118.0, 39568.0, 22945.0, 13290.0, 7794.0, 4781.0, 2829.0, 1823.0, 1174.0, 775.0, 509.0, 329.0, 247.0, 171.0, 120.0, 78.0, 53.0, 33.0, 25.0, 26.0, 17.0, 12.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.65625, -36.4306640625, -35.205078125, -33.9794921875, -32.75390625, -31.5283203125, -30.302734375, -29.0771484375, -27.8515625, -26.6259765625, -25.400390625, -24.1748046875, -22.94921875, -21.7236328125, -20.498046875, -19.2724609375, -18.046875, -16.8212890625, -15.595703125, -14.3701171875, -13.14453125, -11.9189453125, -10.693359375, -9.4677734375, -8.2421875, -7.0166015625, -5.791015625, -4.5654296875, -3.33984375, -2.1142578125, -0.888671875, 0.3369140625, 1.5625, 2.7880859375, 4.013671875, 5.2392578125, 6.46484375, 7.6904296875, 8.916015625, 10.1416015625, 11.3671875, 12.5927734375, 13.818359375, 15.0439453125, 16.26953125, 17.4951171875, 18.720703125, 19.9462890625, 21.171875, 22.3974609375, 23.623046875, 24.8486328125, 26.07421875, 27.2998046875, 28.525390625, 29.7509765625, 30.9765625, 32.2021484375, 33.427734375, 34.6533203125, 35.87890625, 37.1044921875, 38.330078125, 39.5556640625, 40.78125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 13.0, 8.0, 11.0, 22.0, 18.0, 17.0, 23.0, 34.0, 23.0, 40.0, 32.0, 31.0, 34.0, 41.0, 67.0, 41.0, 52.0, 46.0, 55.0, 56.0, 45.0, 39.0, 28.0, 33.0, 27.0, 34.0, 18.0, 21.0, 13.0, 18.0, 14.0, 11.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-13.0859375, -12.6903076171875, -12.294677734375, -11.8990478515625, -11.50341796875, -11.1077880859375, -10.712158203125, -10.3165283203125, -9.9208984375, -9.5252685546875, -9.129638671875, -8.7340087890625, -8.33837890625, -7.9427490234375, -7.547119140625, -7.1514892578125, -6.755859375, -6.3602294921875, -5.964599609375, -5.5689697265625, -5.17333984375, -4.7777099609375, -4.382080078125, -3.9864501953125, -3.5908203125, -3.1951904296875, -2.799560546875, -2.4039306640625, -2.00830078125, -1.6126708984375, -1.217041015625, -0.8214111328125, -0.42578125, -0.0301513671875, 0.365478515625, 0.7611083984375, 1.15673828125, 1.5523681640625, 1.947998046875, 2.3436279296875, 2.7392578125, 3.1348876953125, 3.530517578125, 3.9261474609375, 4.32177734375, 4.7174072265625, 5.113037109375, 5.5086669921875, 5.904296875, 6.2999267578125, 6.695556640625, 7.0911865234375, 7.48681640625, 7.8824462890625, 8.278076171875, 8.6737060546875, 9.0693359375, 9.4649658203125, 9.860595703125, 10.2562255859375, 10.65185546875, 11.0474853515625, 11.443115234375, 11.8387451171875, 12.234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 14.0, 16.0, 28.0, 45.0, 57.0, 77.0, 126.0, 202.0, 326.0, 483.0, 771.0, 1340.0, 2615.0, 5999.0, 17105.0, 62733.0, 308997.0, 493966.0, 110595.0, 26665.0, 8478.0, 3581.0, 1753.0, 926.0, 578.0, 348.0, 243.0, 146.0, 107.0, 69.0, 47.0, 29.0, 27.0, 5.0, 19.0, 7.0, 4.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.5, -43.8857421875, -42.271484375, -40.6572265625, -39.04296875, -37.4287109375, -35.814453125, -34.2001953125, -32.5859375, -30.9716796875, -29.357421875, -27.7431640625, -26.12890625, -24.5146484375, -22.900390625, -21.2861328125, -19.671875, -18.0576171875, -16.443359375, -14.8291015625, -13.21484375, -11.6005859375, -9.986328125, -8.3720703125, -6.7578125, -5.1435546875, -3.529296875, -1.9150390625, -0.30078125, 1.3134765625, 2.927734375, 4.5419921875, 6.15625, 7.7705078125, 9.384765625, 10.9990234375, 12.61328125, 14.2275390625, 15.841796875, 17.4560546875, 19.0703125, 20.6845703125, 22.298828125, 23.9130859375, 25.52734375, 27.1416015625, 28.755859375, 30.3701171875, 31.984375, 33.5986328125, 35.212890625, 36.8271484375, 38.44140625, 40.0556640625, 41.669921875, 43.2841796875, 44.8984375, 46.5126953125, 48.126953125, 49.7412109375, 51.35546875, 52.9697265625, 54.583984375, 56.1982421875, 57.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 17.0, 21.0, 31.0, 38.0, 66.0, 128.0, 181.0, 177.0, 133.0, 71.0, 46.0, 31.0, 19.0, 13.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004962921142578125, -0.004797220230102539, -0.004631519317626953, -0.004465818405151367, -0.004300117492675781, -0.004134416580200195, -0.003968715667724609, -0.0038030147552490234, -0.0036373138427734375, -0.0034716129302978516, -0.0033059120178222656, -0.0031402111053466797, -0.0029745101928710938, -0.002808809280395508, -0.002643108367919922, -0.002477407455444336, -0.00231170654296875, -0.002146005630493164, -0.001980304718017578, -0.0018146038055419922, -0.0016489028930664062, -0.0014832019805908203, -0.0013175010681152344, -0.0011518001556396484, -0.0009860992431640625, -0.0008203983306884766, -0.0006546974182128906, -0.0004889965057373047, -0.00032329559326171875, -0.0001575946807861328, 8.106231689453125e-06, 0.00017380714416503906, 0.000339508056640625, 0.0005052089691162109, 0.0006709098815917969, 0.0008366107940673828, 0.0010023117065429688, 0.0011680126190185547, 0.0013337135314941406, 0.0014994144439697266, 0.0016651153564453125, 0.0018308162689208984, 0.0019965171813964844, 0.0021622180938720703, 0.0023279190063476562, 0.002493619918823242, 0.002659320831298828, 0.002825021743774414, 0.00299072265625, 0.003156423568725586, 0.003322124481201172, 0.003487825393676758, 0.0036535263061523438, 0.0038192272186279297, 0.003984928131103516, 0.0041506290435791016, 0.0043163299560546875, 0.0044820308685302734, 0.004647731781005859, 0.004813432693481445, 0.004979133605957031, 0.005144834518432617, 0.005310535430908203, 0.005476236343383789, 0.005641937255859375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 8.0, 10.0, 8.0, 16.0, 14.0, 26.0, 20.0, 46.0, 51.0, 60.0, 80.0, 123.0, 146.0, 222.0, 305.0, 441.0, 679.0, 1107.0, 1709.0, 2887.0, 5464.0, 11130.0, 24021.0, 56876.0, 139080.0, 274306.0, 278466.0, 142732.0, 58379.0, 25100.0, 11370.0, 5548.0, 3040.0, 1727.0, 1039.0, 695.0, 489.0, 308.0, 204.0, 166.0, 118.0, 104.0, 58.0, 44.0, 34.0, 28.0, 17.0, 12.0, 11.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-19.96875, -19.324951171875, -18.68115234375, -18.037353515625, -17.3935546875, -16.749755859375, -16.10595703125, -15.462158203125, -14.818359375, -14.174560546875, -13.53076171875, -12.886962890625, -12.2431640625, -11.599365234375, -10.95556640625, -10.311767578125, -9.66796875, -9.024169921875, -8.38037109375, -7.736572265625, -7.0927734375, -6.448974609375, -5.80517578125, -5.161376953125, -4.517578125, -3.873779296875, -3.22998046875, -2.586181640625, -1.9423828125, -1.298583984375, -0.65478515625, -0.010986328125, 0.6328125, 1.276611328125, 1.92041015625, 2.564208984375, 3.2080078125, 3.851806640625, 4.49560546875, 5.139404296875, 5.783203125, 6.427001953125, 7.07080078125, 7.714599609375, 8.3583984375, 9.002197265625, 9.64599609375, 10.289794921875, 10.93359375, 11.577392578125, 12.22119140625, 12.864990234375, 13.5087890625, 14.152587890625, 14.79638671875, 15.440185546875, 16.083984375, 16.727783203125, 17.37158203125, 18.015380859375, 18.6591796875, 19.302978515625, 19.94677734375, 20.590576171875, 21.234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 16.0, 11.0, 14.0, 24.0, 33.0, 46.0, 55.0, 63.0, 75.0, 68.0, 68.0, 70.0, 68.0, 72.0, 62.0, 44.0, 46.0, 34.0, 22.0, 15.0, 24.0, 16.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.15234375, -6.95751953125, -6.7626953125, -6.56787109375, -6.373046875, -6.17822265625, -5.9833984375, -5.78857421875, -5.59375, -5.39892578125, -5.2041015625, -5.00927734375, -4.814453125, -4.61962890625, -4.4248046875, -4.22998046875, -4.03515625, -3.84033203125, -3.6455078125, -3.45068359375, -3.255859375, -3.06103515625, -2.8662109375, -2.67138671875, -2.4765625, -2.28173828125, -2.0869140625, -1.89208984375, -1.697265625, -1.50244140625, -1.3076171875, -1.11279296875, -0.91796875, -0.72314453125, -0.5283203125, -0.33349609375, -0.138671875, 0.05615234375, 0.2509765625, 0.44580078125, 0.640625, 0.83544921875, 1.0302734375, 1.22509765625, 1.419921875, 1.61474609375, 1.8095703125, 2.00439453125, 2.19921875, 2.39404296875, 2.5888671875, 2.78369140625, 2.978515625, 3.17333984375, 3.3681640625, 3.56298828125, 3.7578125, 3.95263671875, 4.1474609375, 4.34228515625, 4.537109375, 4.73193359375, 4.9267578125, 5.12158203125, 5.31640625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 10.0, 11.0, 12.0, 15.0, 13.0, 24.0, 27.0, 36.0, 30.0, 26.0, 41.0, 59.0, 49.0, 71.0, 55.0, 63.0, 59.0, 50.0, 55.0, 53.0, 39.0, 34.0, 26.0, 29.0, 20.0, 16.0, 14.0, 8.0, 16.0, 5.0, 6.0, 7.0, 4.0, 5.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.133628845214844, -13.695039749145508, -13.256451606750488, -12.817862510681152, -12.379273414611816, -11.940685272216797, -11.502096176147461, -11.063507080078125, -10.624917984008789, -10.186328887939453, -9.747740745544434, -9.309151649475098, -8.870562553405762, -8.431974411010742, -7.993385314941406, -7.55479621887207, -7.116208076477051, -6.677619457244873, -6.239030361175537, -5.800441741943359, -5.361852645874023, -4.923264026641846, -4.484675407409668, -4.046086311340332, -3.6074976921081543, -3.1689088344573975, -2.7303199768066406, -2.291731357574463, -1.853142499923706, -1.4145536422729492, -0.9759650230407715, -0.5373761653900146, -0.09878730773925781, 0.33980149030685425, 0.7783902883529663, 1.2169790267944336, 1.6555678844451904, 2.0941567420959473, 2.532745361328125, 2.971334218978882, 3.4099230766296387, 3.8485119342803955, 4.287100791931152, 4.72568941116333, 5.164278030395508, 5.602867126464844, 6.0414557456970215, 6.480044364929199, 6.918633460998535, 7.357222080230713, 7.795811176300049, 8.234399795532227, 8.672988891601562, 9.111577987670898, 9.550166130065918, 9.988755226135254, 10.427343368530273, 10.86593246459961, 11.304520606994629, 11.743109703063965, 12.1816987991333, 12.62028694152832, 13.058876037597656, 13.497465133666992, 13.936054229736328]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 10.0, 1.0, 4.0, 7.0, 5.0, 7.0, 8.0, 14.0, 18.0, 28.0, 14.0, 23.0, 22.0, 33.0, 36.0, 42.0, 48.0, 48.0, 41.0, 47.0, 35.0, 49.0, 32.0, 42.0, 36.0, 33.0, 36.0, 33.0, 32.0, 24.0, 27.0, 24.0, 19.0, 24.0, 24.0, 19.0, 13.0, 9.0, 10.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.565991401672363, -12.1818265914917, -11.797660827636719, -11.413496017456055, -11.02933120727539, -10.645166397094727, -10.261001586914062, -9.876835823059082, -9.492671012878418, -9.108506202697754, -8.724340438842773, -8.34017562866211, -7.956010818481445, -7.571846008300781, -7.187680721282959, -6.803515434265137, -6.419350624084473, -6.035185813903809, -5.651020526885986, -5.266855239868164, -4.8826904296875, -4.498525619506836, -4.114360332489014, -3.7301952838897705, -3.3460302352905273, -2.961865186691284, -2.577700138092041, -2.193535089492798, -1.8093700408935547, -1.4252049922943115, -1.0410399436950684, -0.6568748950958252, -0.27270984649658203, 0.11145520210266113, 0.4956202507019043, 0.8797852993011475, 1.2639503479003906, 1.6481153964996338, 2.032280445098877, 2.41644549369812, 2.8006105422973633, 3.1847755908966064, 3.5689406394958496, 3.9531056880950928, 4.337270736694336, 4.721435546875, 5.105600833892822, 5.4897661209106445, 5.873930931091309, 6.258095741271973, 6.642261028289795, 7.026426315307617, 7.410591125488281, 7.794755935668945, 8.17892074584961, 8.56308650970459, 8.947251319885254, 9.331416130065918, 9.715581893920898, 10.099746704101562, 10.483911514282227, 10.86807632446289, 11.252241134643555, 11.636406898498535, 12.0205717086792]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 43.0, 37.0, 93.0, 124.0, 172.0, 332.0, 452.0, 802.0, 1310.0, 2135.0, 3509.0, 5621.0, 9270.0, 14825.0, 23437.0, 36883.0, 55660.0, 81079.0, 108927.0, 132452.0, 139545.0, 126236.0, 99953.0, 71632.0, 48728.0, 32045.0, 19970.0, 12756.0, 7935.0, 4867.0, 3042.0, 1747.0, 1120.0, 671.0, 417.0, 271.0, 153.0, 108.0, 70.0, 31.0, 32.0, 16.0, 7.0, 8.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6796875, -9.3255615234375, -8.971435546875, -8.6173095703125, -8.26318359375, -7.9090576171875, -7.554931640625, -7.2008056640625, -6.8466796875, -6.4925537109375, -6.138427734375, -5.7843017578125, -5.43017578125, -5.0760498046875, -4.721923828125, -4.3677978515625, -4.013671875, -3.6595458984375, -3.305419921875, -2.9512939453125, -2.59716796875, -2.2430419921875, -1.888916015625, -1.5347900390625, -1.1806640625, -0.8265380859375, -0.472412109375, -0.1182861328125, 0.23583984375, 0.5899658203125, 0.944091796875, 1.2982177734375, 1.65234375, 2.0064697265625, 2.360595703125, 2.7147216796875, 3.06884765625, 3.4229736328125, 3.777099609375, 4.1312255859375, 4.4853515625, 4.8394775390625, 5.193603515625, 5.5477294921875, 5.90185546875, 6.2559814453125, 6.610107421875, 6.9642333984375, 7.318359375, 7.6724853515625, 8.026611328125, 8.3807373046875, 8.73486328125, 9.0889892578125, 9.443115234375, 9.7972412109375, 10.1513671875, 10.5054931640625, 10.859619140625, 11.2137451171875, 11.56787109375, 11.9219970703125, 12.276123046875, 12.6302490234375, 12.984375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 9.0, 12.0, 9.0, 15.0, 14.0, 19.0, 21.0, 24.0, 32.0, 34.0, 38.0, 37.0, 46.0, 45.0, 39.0, 48.0, 48.0, 44.0, 32.0, 36.0, 35.0, 33.0, 29.0, 27.0, 35.0, 34.0, 24.0, 32.0, 26.0, 22.0, 17.0, 9.0, 7.0, 12.0, 8.0, 8.0, 0.0, 7.0, 3.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-12.0859375, -11.7318115234375, -11.377685546875, -11.0235595703125, -10.66943359375, -10.3153076171875, -9.961181640625, -9.6070556640625, -9.2529296875, -8.8988037109375, -8.544677734375, -8.1905517578125, -7.83642578125, -7.4822998046875, -7.128173828125, -6.7740478515625, -6.419921875, -6.0657958984375, -5.711669921875, -5.3575439453125, -5.00341796875, -4.6492919921875, -4.295166015625, -3.9410400390625, -3.5869140625, -3.2327880859375, -2.878662109375, -2.5245361328125, -2.17041015625, -1.8162841796875, -1.462158203125, -1.1080322265625, -0.75390625, -0.3997802734375, -0.045654296875, 0.3084716796875, 0.66259765625, 1.0167236328125, 1.370849609375, 1.7249755859375, 2.0791015625, 2.4332275390625, 2.787353515625, 3.1414794921875, 3.49560546875, 3.8497314453125, 4.203857421875, 4.5579833984375, 4.912109375, 5.2662353515625, 5.620361328125, 5.9744873046875, 6.32861328125, 6.6827392578125, 7.036865234375, 7.3909912109375, 7.7451171875, 8.0992431640625, 8.453369140625, 8.8074951171875, 9.16162109375, 9.5157470703125, 9.869873046875, 10.2239990234375, 10.578125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 15.0, 16.0, 32.0, 40.0, 60.0, 82.0, 132.0, 222.0, 320.0, 494.0, 826.0, 1306.0, 1963.0, 3279.0, 5395.0, 8789.0, 14997.0, 25334.0, 42665.0, 70569.0, 109284.0, 149523.0, 168058.0, 152211.0, 111627.0, 71904.0, 44132.0, 26000.0, 15492.0, 9188.0, 5622.0, 3358.0, 2065.0, 1313.0, 787.0, 479.0, 322.0, 220.0, 156.0, 81.0, 62.0, 46.0, 35.0, 16.0, 14.0, 11.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.71875, -12.3021240234375, -11.885498046875, -11.4688720703125, -11.05224609375, -10.6356201171875, -10.218994140625, -9.8023681640625, -9.3857421875, -8.9691162109375, -8.552490234375, -8.1358642578125, -7.71923828125, -7.3026123046875, -6.885986328125, -6.4693603515625, -6.052734375, -5.6361083984375, -5.219482421875, -4.8028564453125, -4.38623046875, -3.9696044921875, -3.552978515625, -3.1363525390625, -2.7197265625, -2.3031005859375, -1.886474609375, -1.4698486328125, -1.05322265625, -0.6365966796875, -0.219970703125, 0.1966552734375, 0.61328125, 1.0299072265625, 1.446533203125, 1.8631591796875, 2.27978515625, 2.6964111328125, 3.113037109375, 3.5296630859375, 3.9462890625, 4.3629150390625, 4.779541015625, 5.1961669921875, 5.61279296875, 6.0294189453125, 6.446044921875, 6.8626708984375, 7.279296875, 7.6959228515625, 8.112548828125, 8.5291748046875, 8.94580078125, 9.3624267578125, 9.779052734375, 10.1956787109375, 10.6123046875, 11.0289306640625, 11.445556640625, 11.8621826171875, 12.27880859375, 12.6954345703125, 13.112060546875, 13.5286865234375, 13.9453125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 4.0, 11.0, 9.0, 13.0, 17.0, 20.0, 19.0, 26.0, 28.0, 37.0, 37.0, 26.0, 39.0, 36.0, 45.0, 48.0, 33.0, 37.0, 47.0, 46.0, 47.0, 44.0, 48.0, 39.0, 31.0, 29.0, 21.0, 21.0, 19.0, 21.0, 20.0, 14.0, 11.0, 11.0, 11.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.6875, -8.43011474609375, -8.1727294921875, -7.91534423828125, -7.657958984375, -7.40057373046875, -7.1431884765625, -6.88580322265625, -6.62841796875, -6.37103271484375, -6.1136474609375, -5.85626220703125, -5.598876953125, -5.34149169921875, -5.0841064453125, -4.82672119140625, -4.5693359375, -4.31195068359375, -4.0545654296875, -3.79718017578125, -3.539794921875, -3.28240966796875, -3.0250244140625, -2.76763916015625, -2.51025390625, -2.25286865234375, -1.9954833984375, -1.73809814453125, -1.480712890625, -1.22332763671875, -0.9659423828125, -0.70855712890625, -0.451171875, -0.19378662109375, 0.0635986328125, 0.32098388671875, 0.578369140625, 0.83575439453125, 1.0931396484375, 1.35052490234375, 1.60791015625, 1.86529541015625, 2.1226806640625, 2.38006591796875, 2.637451171875, 2.89483642578125, 3.1522216796875, 3.40960693359375, 3.6669921875, 3.92437744140625, 4.1817626953125, 4.43914794921875, 4.696533203125, 4.95391845703125, 5.2113037109375, 5.46868896484375, 5.72607421875, 5.98345947265625, 6.2408447265625, 6.49822998046875, 6.755615234375, 7.01300048828125, 7.2703857421875, 7.52777099609375, 7.78515625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 2.0, 5.0, 11.0, 21.0, 18.0, 50.0, 44.0, 89.0, 115.0, 162.0, 262.0, 366.0, 562.0, 798.0, 1287.0, 1927.0, 2869.0, 4714.0, 7736.0, 13118.0, 22996.0, 41426.0, 75270.0, 132017.0, 193384.0, 203130.0, 147612.0, 86393.0, 47552.0, 26174.0, 14866.0, 8844.0, 5365.0, 3177.0, 2060.0, 1385.0, 865.0, 606.0, 393.0, 282.0, 198.0, 133.0, 75.0, 59.0, 33.0, 37.0, 20.0, 20.0, 10.0, 6.0, 5.0, 4.0, 2.0, 0.0, 4.0], "bins": [-8.9453125, -8.68310546875, -8.4208984375, -8.15869140625, -7.896484375, -7.63427734375, -7.3720703125, -7.10986328125, -6.84765625, -6.58544921875, -6.3232421875, -6.06103515625, -5.798828125, -5.53662109375, -5.2744140625, -5.01220703125, -4.75, -4.48779296875, -4.2255859375, -3.96337890625, -3.701171875, -3.43896484375, -3.1767578125, -2.91455078125, -2.65234375, -2.39013671875, -2.1279296875, -1.86572265625, -1.603515625, -1.34130859375, -1.0791015625, -0.81689453125, -0.5546875, -0.29248046875, -0.0302734375, 0.23193359375, 0.494140625, 0.75634765625, 1.0185546875, 1.28076171875, 1.54296875, 1.80517578125, 2.0673828125, 2.32958984375, 2.591796875, 2.85400390625, 3.1162109375, 3.37841796875, 3.640625, 3.90283203125, 4.1650390625, 4.42724609375, 4.689453125, 4.95166015625, 5.2138671875, 5.47607421875, 5.73828125, 6.00048828125, 6.2626953125, 6.52490234375, 6.787109375, 7.04931640625, 7.3115234375, 7.57373046875, 7.8359375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 11.0, 9.0, 12.0, 16.0, 28.0, 25.0, 36.0, 47.0, 57.0, 96.0, 97.0, 117.0, 119.0, 80.0, 46.0, 45.0, 42.0, 21.0, 17.0, 15.0, 10.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.001598358154296875, -0.0015589147806167603, -0.0015194714069366455, -0.0014800280332565308, -0.001440584659576416, -0.0014011412858963013, -0.0013616979122161865, -0.0013222545385360718, -0.001282811164855957, -0.0012433677911758423, -0.0012039244174957275, -0.0011644810438156128, -0.001125037670135498, -0.0010855942964553833, -0.0010461509227752686, -0.0010067075490951538, -0.0009672641754150391, -0.0009278208017349243, -0.0008883774280548096, -0.0008489340543746948, -0.0008094906806945801, -0.0007700473070144653, -0.0007306039333343506, -0.0006911605596542358, -0.0006517171859741211, -0.0006122738122940063, -0.0005728304386138916, -0.0005333870649337769, -0.0004939436912536621, -0.00045450031757354736, -0.0004150569438934326, -0.00037561357021331787, -0.0003361701965332031, -0.0002967268228530884, -0.00025728344917297363, -0.0002178400754928589, -0.00017839670181274414, -0.0001389533281326294, -9.950995445251465e-05, -6.00665807723999e-05, -2.0623207092285156e-05, 1.882016658782959e-05, 5.8263540267944336e-05, 9.770691394805908e-05, 0.00013715028762817383, 0.00017659366130828857, 0.00021603703498840332, 0.00025548040866851807, 0.0002949237823486328, 0.00033436715602874756, 0.0003738105297088623, 0.00041325390338897705, 0.0004526972770690918, 0.0004921406507492065, 0.0005315840244293213, 0.000571027398109436, 0.0006104707717895508, 0.0006499141454696655, 0.0006893575191497803, 0.000728800892829895, 0.0007682442665100098, 0.0008076876401901245, 0.0008471310138702393, 0.000886574387550354, 0.0009260177612304688]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 10.0, 13.0, 14.0, 24.0, 32.0, 42.0, 68.0, 105.0, 141.0, 203.0, 311.0, 487.0, 632.0, 982.0, 1506.0, 2208.0, 3441.0, 5243.0, 8294.0, 13323.0, 21347.0, 34087.0, 53922.0, 82433.0, 118188.0, 148865.0, 154371.0, 131191.0, 95111.0, 63113.0, 40239.0, 25220.0, 15496.0, 9832.0, 6156.0, 3945.0, 2622.0, 1700.0, 1108.0, 791.0, 518.0, 337.0, 288.0, 188.0, 125.0, 80.0, 69.0, 38.0, 32.0, 21.0, 9.0, 10.0, 6.0, 11.0, 3.0, 2.0], "bins": [-6.15625, -5.97613525390625, -5.7960205078125, -5.61590576171875, -5.435791015625, -5.25567626953125, -5.0755615234375, -4.89544677734375, -4.71533203125, -4.53521728515625, -4.3551025390625, -4.17498779296875, -3.994873046875, -3.81475830078125, -3.6346435546875, -3.45452880859375, -3.2744140625, -3.09429931640625, -2.9141845703125, -2.73406982421875, -2.553955078125, -2.37384033203125, -2.1937255859375, -2.01361083984375, -1.83349609375, -1.65338134765625, -1.4732666015625, -1.29315185546875, -1.113037109375, -0.93292236328125, -0.7528076171875, -0.57269287109375, -0.392578125, -0.21246337890625, -0.0323486328125, 0.14776611328125, 0.327880859375, 0.50799560546875, 0.6881103515625, 0.86822509765625, 1.04833984375, 1.22845458984375, 1.4085693359375, 1.58868408203125, 1.768798828125, 1.94891357421875, 2.1290283203125, 2.30914306640625, 2.4892578125, 2.66937255859375, 2.8494873046875, 3.02960205078125, 3.209716796875, 3.38983154296875, 3.5699462890625, 3.75006103515625, 3.93017578125, 4.11029052734375, 4.2904052734375, 4.47052001953125, 4.650634765625, 4.83074951171875, 5.0108642578125, 5.19097900390625, 5.37109375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 10.0, 8.0, 15.0, 12.0, 16.0, 23.0, 27.0, 38.0, 39.0, 43.0, 33.0, 51.0, 69.0, 58.0, 62.0, 48.0, 49.0, 58.0, 40.0, 31.0, 32.0, 31.0, 32.0, 21.0, 18.0, 10.0, 16.0, 14.0, 14.0, 7.0, 12.0, 6.0, 6.0, 9.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9609375, -1.892303466796875, -1.82366943359375, -1.755035400390625, -1.6864013671875, -1.617767333984375, -1.54913330078125, -1.480499267578125, -1.411865234375, -1.343231201171875, -1.27459716796875, -1.205963134765625, -1.1373291015625, -1.068695068359375, -1.00006103515625, -0.931427001953125, -0.86279296875, -0.794158935546875, -0.72552490234375, -0.656890869140625, -0.5882568359375, -0.519622802734375, -0.45098876953125, -0.382354736328125, -0.313720703125, -0.245086669921875, -0.17645263671875, -0.107818603515625, -0.0391845703125, 0.029449462890625, 0.09808349609375, 0.166717529296875, 0.2353515625, 0.303985595703125, 0.37261962890625, 0.441253662109375, 0.5098876953125, 0.578521728515625, 0.64715576171875, 0.715789794921875, 0.784423828125, 0.853057861328125, 0.92169189453125, 0.990325927734375, 1.0589599609375, 1.127593994140625, 1.19622802734375, 1.264862060546875, 1.33349609375, 1.402130126953125, 1.47076416015625, 1.539398193359375, 1.6080322265625, 1.676666259765625, 1.74530029296875, 1.813934326171875, 1.882568359375, 1.951202392578125, 2.01983642578125, 2.088470458984375, 2.1571044921875, 2.225738525390625, 2.29437255859375, 2.363006591796875, 2.431640625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 2.0, 3.0, 7.0, 13.0, 13.0, 19.0, 16.0, 24.0, 25.0, 33.0, 43.0, 57.0, 60.0, 39.0, 53.0, 64.0, 72.0, 47.0, 61.0, 58.0, 55.0, 25.0, 44.0, 28.0, 24.0, 32.0, 11.0, 8.0, 13.0, 10.0, 9.0, 10.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.314119338989258, -14.902887344360352, -14.491654396057129, -14.080422401428223, -13.669189453125, -13.257957458496094, -12.846725463867188, -12.435492515563965, -12.024259567260742, -11.613027572631836, -11.201794624328613, -10.790562629699707, -10.379329681396484, -9.968097686767578, -9.556865692138672, -9.14563274383545, -8.734400749206543, -8.323168754577637, -7.911935806274414, -7.500703811645508, -7.089470863342285, -6.678238868713379, -6.2670063972473145, -5.85577392578125, -5.4445414543151855, -5.033308982849121, -4.622076511383057, -4.210844039916992, -3.799611806869507, -3.3883793354034424, -2.977147102355957, -2.5659146308898926, -2.154682159423828, -1.7434496879577637, -1.3322173357009888, -0.9209849834442139, -0.5097525119781494, -0.09852004051208496, 0.3127121925354004, 0.7239446640014648, 1.1351771354675293, 1.5464096069335938, 1.9576419591903687, 2.3688743114471436, 2.780106782913208, 3.1913392543792725, 3.602571487426758, 4.013803958892822, 4.425036430358887, 4.836268901824951, 5.247501373291016, 5.658733367919922, 6.0699663162231445, 6.481198310852051, 6.892430782318115, 7.30366325378418, 7.714895725250244, 8.126128196716309, 8.537360191345215, 8.948593139648438, 9.359825134277344, 9.771058082580566, 10.182290077209473, 10.593523025512695, 11.004755020141602]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 6.0, 15.0, 11.0, 20.0, 24.0, 19.0, 20.0, 38.0, 31.0, 32.0, 34.0, 47.0, 45.0, 44.0, 32.0, 48.0, 50.0, 49.0, 37.0, 35.0, 29.0, 33.0, 32.0, 28.0, 32.0, 37.0, 20.0, 18.0, 24.0, 11.0, 13.0, 14.0, 15.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.064876556396484, -11.6774320602417, -11.289986610412598, -10.902542114257812, -10.515096664428711, -10.127652168273926, -9.74020767211914, -9.352762222290039, -8.965317726135254, -8.577873229980469, -8.190427780151367, -7.802983283996582, -7.415538311004639, -7.028093338012695, -6.640648365020752, -6.253203392028809, -5.865758419036865, -5.478313446044922, -5.0908684730529785, -4.703423500061035, -4.31597900390625, -3.9285340309143066, -3.5410890579223633, -3.153644323348999, -2.7661993503570557, -2.3787543773651123, -1.991309642791748, -1.6038646697998047, -1.2164198160171509, -0.8289749622344971, -0.4415299892425537, -0.05408525466918945, 0.3333597183227539, 0.7208045721054077, 1.1082494258880615, 1.4956943988800049, 1.8831392526626587, 2.2705841064453125, 2.658029079437256, 3.04547381401062, 3.4329187870025635, 3.820363759994507, 4.207808494567871, 4.5952534675598145, 4.982698440551758, 5.370142936706543, 5.7575883865356445, 6.14503288269043, 6.532477855682373, 6.919922828674316, 7.30736780166626, 7.694812774658203, 8.082257270812988, 8.469701766967773, 8.857147216796875, 9.24459171295166, 9.632037162780762, 10.019481658935547, 10.406927108764648, 10.794371604919434, 11.181817054748535, 11.56926155090332, 11.956707000732422, 12.344151496887207, 12.731595993041992]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 12.0, 17.0, 28.0, 45.0, 69.0, 108.0, 127.0, 259.0, 381.0, 625.0, 952.0, 1670.0, 2690.0, 4562.0, 8169.0, 14817.0, 27940.0, 54923.0, 112579.0, 238544.0, 501315.0, 876729.0, 991632.0, 681542.0, 346030.0, 164951.0, 79098.0, 39080.0, 20204.0, 10760.0, 5808.0, 3417.0, 1959.0, 1154.0, 763.0, 472.0, 285.0, 178.0, 129.0, 80.0, 52.0, 34.0, 23.0, 22.0, 13.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.88037109375, -10.4951171875, -10.10986328125, -9.724609375, -9.33935546875, -8.9541015625, -8.56884765625, -8.18359375, -7.79833984375, -7.4130859375, -7.02783203125, -6.642578125, -6.25732421875, -5.8720703125, -5.48681640625, -5.1015625, -4.71630859375, -4.3310546875, -3.94580078125, -3.560546875, -3.17529296875, -2.7900390625, -2.40478515625, -2.01953125, -1.63427734375, -1.2490234375, -0.86376953125, -0.478515625, -0.09326171875, 0.2919921875, 0.67724609375, 1.0625, 1.44775390625, 1.8330078125, 2.21826171875, 2.603515625, 2.98876953125, 3.3740234375, 3.75927734375, 4.14453125, 4.52978515625, 4.9150390625, 5.30029296875, 5.685546875, 6.07080078125, 6.4560546875, 6.84130859375, 7.2265625, 7.61181640625, 7.9970703125, 8.38232421875, 8.767578125, 9.15283203125, 9.5380859375, 9.92333984375, 10.30859375, 10.69384765625, 11.0791015625, 11.46435546875, 11.849609375, 12.23486328125, 12.6201171875, 13.00537109375, 13.390625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 8.0, 5.0, 8.0, 7.0, 8.0, 11.0, 16.0, 17.0, 18.0, 27.0, 28.0, 30.0, 25.0, 29.0, 35.0, 39.0, 44.0, 38.0, 37.0, 53.0, 47.0, 44.0, 47.0, 46.0, 34.0, 40.0, 34.0, 31.0, 26.0, 16.0, 28.0, 16.0, 23.0, 10.0, 18.0, 11.0, 7.0, 13.0, 11.0, 11.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.59375, -9.3203125, -9.046875, -8.7734375, -8.5, -8.2265625, -7.953125, -7.6796875, -7.40625, -7.1328125, -6.859375, -6.5859375, -6.3125, -6.0390625, -5.765625, -5.4921875, -5.21875, -4.9453125, -4.671875, -4.3984375, -4.125, -3.8515625, -3.578125, -3.3046875, -3.03125, -2.7578125, -2.484375, -2.2109375, -1.9375, -1.6640625, -1.390625, -1.1171875, -0.84375, -0.5703125, -0.296875, -0.0234375, 0.25, 0.5234375, 0.796875, 1.0703125, 1.34375, 1.6171875, 1.890625, 2.1640625, 2.4375, 2.7109375, 2.984375, 3.2578125, 3.53125, 3.8046875, 4.078125, 4.3515625, 4.625, 4.8984375, 5.171875, 5.4453125, 5.71875, 5.9921875, 6.265625, 6.5390625, 6.8125, 7.0859375, 7.359375, 7.6328125, 7.90625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 4.0, 15.0, 18.0, 47.0, 47.0, 74.0, 106.0, 156.0, 231.0, 366.0, 558.0, 901.0, 1505.0, 2499.0, 4373.0, 7613.0, 13700.0, 25658.0, 48956.0, 95540.0, 187829.0, 357697.0, 621346.0, 864799.0, 811148.0, 534582.0, 296087.0, 152381.0, 77686.0, 40280.0, 21113.0, 11378.0, 6300.0, 3582.0, 2172.0, 1254.0, 882.0, 485.0, 310.0, 201.0, 143.0, 87.0, 61.0, 35.0, 31.0, 16.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.40625, -11.048095703125, -10.68994140625, -10.331787109375, -9.9736328125, -9.615478515625, -9.25732421875, -8.899169921875, -8.541015625, -8.182861328125, -7.82470703125, -7.466552734375, -7.1083984375, -6.750244140625, -6.39208984375, -6.033935546875, -5.67578125, -5.317626953125, -4.95947265625, -4.601318359375, -4.2431640625, -3.885009765625, -3.52685546875, -3.168701171875, -2.810546875, -2.452392578125, -2.09423828125, -1.736083984375, -1.3779296875, -1.019775390625, -0.66162109375, -0.303466796875, 0.0546875, 0.412841796875, 0.77099609375, 1.129150390625, 1.4873046875, 1.845458984375, 2.20361328125, 2.561767578125, 2.919921875, 3.278076171875, 3.63623046875, 3.994384765625, 4.3525390625, 4.710693359375, 5.06884765625, 5.427001953125, 5.78515625, 6.143310546875, 6.50146484375, 6.859619140625, 7.2177734375, 7.575927734375, 7.93408203125, 8.292236328125, 8.650390625, 9.008544921875, 9.36669921875, 9.724853515625, 10.0830078125, 10.441162109375, 10.79931640625, 11.157470703125, 11.515625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 12.0, 10.0, 12.0, 19.0, 20.0, 42.0, 30.0, 46.0, 55.0, 69.0, 85.0, 89.0, 115.0, 140.0, 163.0, 189.0, 215.0, 236.0, 278.0, 266.0, 266.0, 218.0, 263.0, 207.0, 207.0, 152.0, 140.0, 104.0, 73.0, 76.0, 52.0, 59.0, 35.0, 33.0, 24.0, 22.0, 11.0, 7.0, 2.0, 5.0, 2.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32421875, -4.197418212890625, -4.07061767578125, -3.943817138671875, -3.8170166015625, -3.690216064453125, -3.56341552734375, -3.436614990234375, -3.309814453125, -3.183013916015625, -3.05621337890625, -2.929412841796875, -2.8026123046875, -2.675811767578125, -2.54901123046875, -2.422210693359375, -2.29541015625, -2.168609619140625, -2.04180908203125, -1.915008544921875, -1.7882080078125, -1.661407470703125, -1.53460693359375, -1.407806396484375, -1.281005859375, -1.154205322265625, -1.02740478515625, -0.900604248046875, -0.7738037109375, -0.647003173828125, -0.52020263671875, -0.393402099609375, -0.2666015625, -0.139801025390625, -0.01300048828125, 0.113800048828125, 0.2406005859375, 0.367401123046875, 0.49420166015625, 0.621002197265625, 0.747802734375, 0.874603271484375, 1.00140380859375, 1.128204345703125, 1.2550048828125, 1.381805419921875, 1.50860595703125, 1.635406494140625, 1.76220703125, 1.889007568359375, 2.01580810546875, 2.142608642578125, 2.2694091796875, 2.396209716796875, 2.52301025390625, 2.649810791015625, 2.776611328125, 2.903411865234375, 3.03021240234375, 3.157012939453125, 3.2838134765625, 3.410614013671875, 3.53741455078125, 3.664215087890625, 3.791015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 0.0, 3.0, 5.0, 8.0, 15.0, 11.0, 8.0, 17.0, 25.0, 25.0, 27.0, 24.0, 41.0, 53.0, 56.0, 59.0, 54.0, 55.0, 51.0, 63.0, 46.0, 68.0, 50.0, 37.0, 47.0, 26.0, 25.0, 17.0, 17.0, 16.0, 13.0, 9.0, 7.0, 8.0, 1.0, 8.0, 6.0, 2.0, 3.0, 2.0], "bins": [-15.151134490966797, -14.793688774108887, -14.436243057250977, -14.078797340393066, -13.721351623535156, -13.363906860351562, -13.006461143493652, -12.649015426635742, -12.291569709777832, -11.934123992919922, -11.576678276062012, -11.219232559204102, -10.861787796020508, -10.504342079162598, -10.146896362304688, -9.789450645446777, -9.432004928588867, -9.074559211730957, -8.717113494873047, -8.359667778015137, -8.002222061157227, -7.644776821136475, -7.287331581115723, -6.9298858642578125, -6.572440147399902, -6.214994430541992, -5.857548713684082, -5.50010347366333, -5.14265775680542, -4.78521203994751, -4.427766799926758, -4.070321083068848, -3.712876319885254, -3.3554306030273438, -2.9979851245880127, -2.6405396461486816, -2.2830939292907715, -1.9256483316421509, -1.5682027339935303, -1.2107572555541992, -0.8533115386962891, -0.49586594104766846, -0.13842034339904785, 0.21902525424957275, 0.5764708518981934, 0.933916449546814, 1.2913620471954346, 1.6488075256347656, 2.006253242492676, 2.363698959350586, 2.721144437789917, 3.078589916229248, 3.436035633087158, 3.7934813499450684, 4.15092658996582, 4.5083723068237305, 4.865818023681641, 5.223263740539551, 5.580709457397461, 5.938154697418213, 6.295600414276123, 6.653046131134033, 7.010491371154785, 7.367937088012695, 7.7253828048706055]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 10.0, 6.0, 13.0, 11.0, 11.0, 10.0, 22.0, 11.0, 25.0, 23.0, 32.0, 22.0, 27.0, 30.0, 33.0, 51.0, 31.0, 29.0, 38.0, 45.0, 39.0, 39.0, 28.0, 34.0, 38.0, 44.0, 33.0, 30.0, 25.0, 31.0, 22.0, 22.0, 21.0, 17.0, 16.0, 14.0, 8.0, 6.0, 7.0, 9.0, 10.0, 7.0, 7.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-9.199252128601074, -8.91621208190918, -8.633171081542969, -8.350131034851074, -8.06709098815918, -7.784050941467285, -7.501010417938232, -7.21796989440918, -6.934929847717285, -6.651889801025391, -6.368849277496338, -6.085808753967285, -5.802768707275391, -5.519728660583496, -5.236688137054443, -4.953647613525391, -4.670607566833496, -4.387567520141602, -4.104526996612549, -3.821486711502075, -3.5384464263916016, -3.255406141281128, -2.9723658561706543, -2.6893255710601807, -2.406285285949707, -2.1232450008392334, -1.8402047157287598, -1.5571644306182861, -1.2741241455078125, -0.9910838603973389, -0.7080435752868652, -0.4250032901763916, -0.14196300506591797, 0.14107728004455566, 0.4241175651550293, 0.7071578502655029, 0.9901981353759766, 1.2732384204864502, 1.5562787055969238, 1.8393189907073975, 2.122359275817871, 2.4053995609283447, 2.6884398460388184, 2.971480131149292, 3.2545204162597656, 3.5375607013702393, 3.820600986480713, 4.103641510009766, 4.38668155670166, 4.669721603393555, 4.952762126922607, 5.23580265045166, 5.518842697143555, 5.801882743835449, 6.084923267364502, 6.367963790893555, 6.651003837585449, 6.934043884277344, 7.2170844078063965, 7.500124931335449, 7.783164978027344, 8.066205024719238, 8.349245071411133, 8.632286071777344, 8.915326118469238]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 14.0, 15.0, 26.0, 34.0, 44.0, 79.0, 128.0, 169.0, 249.0, 352.0, 554.0, 745.0, 1168.0, 1719.0, 2709.0, 4134.0, 6447.0, 10448.0, 16377.0, 26649.0, 43142.0, 69763.0, 107656.0, 153237.0, 176388.0, 147948.0, 102624.0, 66285.0, 41186.0, 25466.0, 15578.0, 9543.0, 6119.0, 4011.0, 2540.0, 1671.0, 1114.0, 724.0, 453.0, 324.0, 201.0, 172.0, 109.0, 80.0, 51.0, 34.0, 29.0, 16.0, 9.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.5, -22.775634765625, -22.05126953125, -21.326904296875, -20.6025390625, -19.878173828125, -19.15380859375, -18.429443359375, -17.705078125, -16.980712890625, -16.25634765625, -15.531982421875, -14.8076171875, -14.083251953125, -13.35888671875, -12.634521484375, -11.91015625, -11.185791015625, -10.46142578125, -9.737060546875, -9.0126953125, -8.288330078125, -7.56396484375, -6.839599609375, -6.115234375, -5.390869140625, -4.66650390625, -3.942138671875, -3.2177734375, -2.493408203125, -1.76904296875, -1.044677734375, -0.3203125, 0.404052734375, 1.12841796875, 1.852783203125, 2.5771484375, 3.301513671875, 4.02587890625, 4.750244140625, 5.474609375, 6.198974609375, 6.92333984375, 7.647705078125, 8.3720703125, 9.096435546875, 9.82080078125, 10.545166015625, 11.26953125, 11.993896484375, 12.71826171875, 13.442626953125, 14.1669921875, 14.891357421875, 15.61572265625, 16.340087890625, 17.064453125, 17.788818359375, 18.51318359375, 19.237548828125, 19.9619140625, 20.686279296875, 21.41064453125, 22.135009765625, 22.859375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 6.0, 11.0, 8.0, 8.0, 8.0, 12.0, 8.0, 19.0, 20.0, 21.0, 29.0, 25.0, 23.0, 26.0, 20.0, 41.0, 33.0, 29.0, 41.0, 35.0, 31.0, 41.0, 34.0, 35.0, 42.0, 37.0, 29.0, 38.0, 29.0, 33.0, 25.0, 27.0, 14.0, 24.0, 20.0, 20.0, 21.0, 14.0, 9.0, 9.0, 10.0, 8.0, 10.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-7.41796875, -7.179931640625, -6.94189453125, -6.703857421875, -6.4658203125, -6.227783203125, -5.98974609375, -5.751708984375, -5.513671875, -5.275634765625, -5.03759765625, -4.799560546875, -4.5615234375, -4.323486328125, -4.08544921875, -3.847412109375, -3.609375, -3.371337890625, -3.13330078125, -2.895263671875, -2.6572265625, -2.419189453125, -2.18115234375, -1.943115234375, -1.705078125, -1.467041015625, -1.22900390625, -0.990966796875, -0.7529296875, -0.514892578125, -0.27685546875, -0.038818359375, 0.19921875, 0.437255859375, 0.67529296875, 0.913330078125, 1.1513671875, 1.389404296875, 1.62744140625, 1.865478515625, 2.103515625, 2.341552734375, 2.57958984375, 2.817626953125, 3.0556640625, 3.293701171875, 3.53173828125, 3.769775390625, 4.0078125, 4.245849609375, 4.48388671875, 4.721923828125, 4.9599609375, 5.197998046875, 5.43603515625, 5.674072265625, 5.912109375, 6.150146484375, 6.38818359375, 6.626220703125, 6.8642578125, 7.102294921875, 7.34033203125, 7.578369140625, 7.81640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 9.0, 13.0, 14.0, 24.0, 32.0, 47.0, 49.0, 104.0, 128.0, 213.0, 284.0, 396.0, 583.0, 779.0, 1104.0, 1668.0, 2615.0, 3959.0, 6174.0, 9884.0, 15874.0, 27435.0, 47617.0, 84589.0, 147490.0, 218609.0, 195216.0, 119574.0, 67424.0, 37941.0, 21758.0, 13332.0, 8221.0, 5143.0, 3287.0, 2144.0, 1485.0, 1055.0, 726.0, 471.0, 321.0, 226.0, 156.0, 105.0, 74.0, 74.0, 48.0, 27.0, 20.0, 14.0, 13.0, 6.0, 1.0, 5.0, 3.0, 1.0], "bins": [-23.71875, -23.01708984375, -22.3154296875, -21.61376953125, -20.912109375, -20.21044921875, -19.5087890625, -18.80712890625, -18.10546875, -17.40380859375, -16.7021484375, -16.00048828125, -15.298828125, -14.59716796875, -13.8955078125, -13.19384765625, -12.4921875, -11.79052734375, -11.0888671875, -10.38720703125, -9.685546875, -8.98388671875, -8.2822265625, -7.58056640625, -6.87890625, -6.17724609375, -5.4755859375, -4.77392578125, -4.072265625, -3.37060546875, -2.6689453125, -1.96728515625, -1.265625, -0.56396484375, 0.1376953125, 0.83935546875, 1.541015625, 2.24267578125, 2.9443359375, 3.64599609375, 4.34765625, 5.04931640625, 5.7509765625, 6.45263671875, 7.154296875, 7.85595703125, 8.5576171875, 9.25927734375, 9.9609375, 10.66259765625, 11.3642578125, 12.06591796875, 12.767578125, 13.46923828125, 14.1708984375, 14.87255859375, 15.57421875, 16.27587890625, 16.9775390625, 17.67919921875, 18.380859375, 19.08251953125, 19.7841796875, 20.48583984375, 21.1875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 14.0, 8.0, 12.0, 16.0, 12.0, 15.0, 21.0, 20.0, 23.0, 40.0, 34.0, 40.0, 34.0, 39.0, 41.0, 47.0, 38.0, 47.0, 37.0, 44.0, 55.0, 38.0, 45.0, 41.0, 35.0, 29.0, 33.0, 19.0, 23.0, 11.0, 13.0, 14.0, 17.0, 9.0, 7.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.69921875, -7.4820556640625, -7.264892578125, -7.0477294921875, -6.83056640625, -6.6134033203125, -6.396240234375, -6.1790771484375, -5.9619140625, -5.7447509765625, -5.527587890625, -5.3104248046875, -5.09326171875, -4.8760986328125, -4.658935546875, -4.4417724609375, -4.224609375, -4.0074462890625, -3.790283203125, -3.5731201171875, -3.35595703125, -3.1387939453125, -2.921630859375, -2.7044677734375, -2.4873046875, -2.2701416015625, -2.052978515625, -1.8358154296875, -1.61865234375, -1.4014892578125, -1.184326171875, -0.9671630859375, -0.75, -0.5328369140625, -0.315673828125, -0.0985107421875, 0.11865234375, 0.3358154296875, 0.552978515625, 0.7701416015625, 0.9873046875, 1.2044677734375, 1.421630859375, 1.6387939453125, 1.85595703125, 2.0731201171875, 2.290283203125, 2.5074462890625, 2.724609375, 2.9417724609375, 3.158935546875, 3.3760986328125, 3.59326171875, 3.8104248046875, 4.027587890625, 4.2447509765625, 4.4619140625, 4.6790771484375, 4.896240234375, 5.1134033203125, 5.33056640625, 5.5477294921875, 5.764892578125, 5.9820556640625, 6.19921875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 13.0, 13.0, 23.0, 15.0, 29.0, 35.0, 43.0, 92.0, 112.0, 174.0, 253.0, 350.0, 569.0, 844.0, 1382.0, 2298.0, 4186.0, 8040.0, 17549.0, 45425.0, 146879.0, 447499.0, 252374.0, 71268.0, 25365.0, 10850.0, 5357.0, 2851.0, 1683.0, 1038.0, 634.0, 411.0, 281.0, 202.0, 110.0, 79.0, 86.0, 47.0, 28.0, 21.0, 18.0, 13.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-25.671875, -24.886962890625, -24.10205078125, -23.317138671875, -22.5322265625, -21.747314453125, -20.96240234375, -20.177490234375, -19.392578125, -18.607666015625, -17.82275390625, -17.037841796875, -16.2529296875, -15.468017578125, -14.68310546875, -13.898193359375, -13.11328125, -12.328369140625, -11.54345703125, -10.758544921875, -9.9736328125, -9.188720703125, -8.40380859375, -7.618896484375, -6.833984375, -6.049072265625, -5.26416015625, -4.479248046875, -3.6943359375, -2.909423828125, -2.12451171875, -1.339599609375, -0.5546875, 0.230224609375, 1.01513671875, 1.800048828125, 2.5849609375, 3.369873046875, 4.15478515625, 4.939697265625, 5.724609375, 6.509521484375, 7.29443359375, 8.079345703125, 8.8642578125, 9.649169921875, 10.43408203125, 11.218994140625, 12.00390625, 12.788818359375, 13.57373046875, 14.358642578125, 15.1435546875, 15.928466796875, 16.71337890625, 17.498291015625, 18.283203125, 19.068115234375, 19.85302734375, 20.637939453125, 21.4228515625, 22.207763671875, 22.99267578125, 23.777587890625, 24.5625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 4.0, 9.0, 2.0, 13.0, 13.0, 19.0, 29.0, 38.0, 33.0, 48.0, 69.0, 96.0, 103.0, 111.0, 104.0, 70.0, 69.0, 33.0, 36.0, 23.0, 18.0, 16.0, 5.0, 5.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001468658447265625, -0.0014197379350662231, -0.0013708174228668213, -0.0013218969106674194, -0.0012729763984680176, -0.0012240558862686157, -0.0011751353740692139, -0.001126214861869812, -0.0010772943496704102, -0.0010283738374710083, -0.0009794533252716064, -0.0009305328130722046, -0.0008816123008728027, -0.0008326917886734009, -0.000783771276473999, -0.0007348507642745972, -0.0006859302520751953, -0.0006370097398757935, -0.0005880892276763916, -0.0005391687154769897, -0.0004902482032775879, -0.00044132769107818604, -0.0003924071788787842, -0.0003434866666793823, -0.00029456615447998047, -0.0002456456422805786, -0.00019672513008117676, -0.0001478046178817749, -9.888410568237305e-05, -4.996359348297119e-05, -1.043081283569336e-06, 4.787743091583252e-05, 9.679794311523438e-05, 0.00014571845531463623, 0.00019463896751403809, 0.00024355947971343994, 0.0002924799919128418, 0.00034140050411224365, 0.0003903210163116455, 0.00043924152851104736, 0.0004881620407104492, 0.0005370825529098511, 0.0005860030651092529, 0.0006349235773086548, 0.0006838440895080566, 0.0007327646017074585, 0.0007816851139068604, 0.0008306056261062622, 0.0008795261383056641, 0.0009284466505050659, 0.0009773671627044678, 0.0010262876749038696, 0.0010752081871032715, 0.0011241286993026733, 0.0011730492115020752, 0.001221969723701477, 0.001270890235900879, 0.0013198107481002808, 0.0013687312602996826, 0.0014176517724990845, 0.0014665722846984863, 0.0015154927968978882, 0.00156441330909729, 0.001613333821296692, 0.0016622543334960938]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 18.0, 17.0, 16.0, 39.0, 33.0, 48.0, 77.0, 112.0, 136.0, 224.0, 288.0, 408.0, 640.0, 845.0, 1316.0, 1905.0, 3076.0, 5012.0, 8621.0, 15402.0, 29651.0, 59682.0, 121966.0, 214645.0, 244697.0, 164645.0, 84096.0, 40977.0, 20895.0, 11095.0, 6510.0, 3971.0, 2513.0, 1576.0, 1007.0, 710.0, 486.0, 348.0, 223.0, 170.0, 124.0, 93.0, 80.0, 43.0, 36.0, 25.0, 6.0, 16.0, 10.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-11.34375, -10.9805908203125, -10.617431640625, -10.2542724609375, -9.89111328125, -9.5279541015625, -9.164794921875, -8.8016357421875, -8.4384765625, -8.0753173828125, -7.712158203125, -7.3489990234375, -6.98583984375, -6.6226806640625, -6.259521484375, -5.8963623046875, -5.533203125, -5.1700439453125, -4.806884765625, -4.4437255859375, -4.08056640625, -3.7174072265625, -3.354248046875, -2.9910888671875, -2.6279296875, -2.2647705078125, -1.901611328125, -1.5384521484375, -1.17529296875, -0.8121337890625, -0.448974609375, -0.0858154296875, 0.27734375, 0.6405029296875, 1.003662109375, 1.3668212890625, 1.72998046875, 2.0931396484375, 2.456298828125, 2.8194580078125, 3.1826171875, 3.5457763671875, 3.908935546875, 4.2720947265625, 4.63525390625, 4.9984130859375, 5.361572265625, 5.7247314453125, 6.087890625, 6.4510498046875, 6.814208984375, 7.1773681640625, 7.54052734375, 7.9036865234375, 8.266845703125, 8.6300048828125, 8.9931640625, 9.3563232421875, 9.719482421875, 10.0826416015625, 10.44580078125, 10.8089599609375, 11.172119140625, 11.5352783203125, 11.8984375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 1.0, 7.0, 6.0, 7.0, 17.0, 21.0, 21.0, 27.0, 42.0, 59.0, 71.0, 66.0, 72.0, 92.0, 84.0, 76.0, 70.0, 57.0, 47.0, 32.0, 26.0, 28.0, 22.0, 5.0, 7.0, 4.0, 5.0, 6.0, 1.0, 7.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.4342041015625, -4.294189453125, -4.1541748046875, -4.01416015625, -3.8741455078125, -3.734130859375, -3.5941162109375, -3.4541015625, -3.3140869140625, -3.174072265625, -3.0340576171875, -2.89404296875, -2.7540283203125, -2.614013671875, -2.4739990234375, -2.333984375, -2.1939697265625, -2.053955078125, -1.9139404296875, -1.77392578125, -1.6339111328125, -1.493896484375, -1.3538818359375, -1.2138671875, -1.0738525390625, -0.933837890625, -0.7938232421875, -0.65380859375, -0.5137939453125, -0.373779296875, -0.2337646484375, -0.09375, 0.0462646484375, 0.186279296875, 0.3262939453125, 0.46630859375, 0.6063232421875, 0.746337890625, 0.8863525390625, 1.0263671875, 1.1663818359375, 1.306396484375, 1.4464111328125, 1.58642578125, 1.7264404296875, 1.866455078125, 2.0064697265625, 2.146484375, 2.2864990234375, 2.426513671875, 2.5665283203125, 2.70654296875, 2.8465576171875, 2.986572265625, 3.1265869140625, 3.2666015625, 3.4066162109375, 3.546630859375, 3.6866455078125, 3.82666015625, 3.9666748046875, 4.106689453125, 4.2467041015625, 4.38671875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 9.0, 5.0, 5.0, 5.0, 10.0, 6.0, 6.0, 14.0, 17.0, 21.0, 22.0, 30.0, 21.0, 42.0, 45.0, 47.0, 52.0, 44.0, 55.0, 72.0, 60.0, 60.0, 32.0, 54.0, 39.0, 39.0, 39.0, 27.0, 20.0, 20.0, 19.0, 16.0, 9.0, 13.0, 6.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.158653259277344, -10.865707397460938, -10.572760581970215, -10.279813766479492, -9.986867904663086, -9.69392204284668, -9.400975227355957, -9.108028411865234, -8.815082550048828, -8.522136688232422, -8.2291898727417, -7.936243534088135, -7.64329719543457, -7.350350856781006, -7.057404518127441, -6.764458179473877, -6.4715118408203125, -6.178565502166748, -5.885619163513184, -5.592672824859619, -5.299726486206055, -5.00678014755249, -4.713833808898926, -4.420887470245361, -4.127941131591797, -3.8349947929382324, -3.542048454284668, -3.2491021156311035, -2.956155776977539, -2.6632094383239746, -2.37026309967041, -2.0773167610168457, -1.784369945526123, -1.4914236068725586, -1.1984772682189941, -0.9055309295654297, -0.6125845909118652, -0.3196382522583008, -0.026691913604736328, 0.2662544250488281, 0.5592007637023926, 0.852147102355957, 1.1450934410095215, 1.438039779663086, 1.7309861183166504, 2.023932456970215, 2.3168787956237793, 2.6098251342773438, 2.902771472930908, 3.1957178115844727, 3.488664150238037, 3.7816104888916016, 4.074556827545166, 4.3675031661987305, 4.660449504852295, 4.953395843505859, 5.246342182159424, 5.539288520812988, 5.832234859466553, 6.125181198120117, 6.418127536773682, 6.711073875427246, 7.0040202140808105, 7.296966552734375, 7.5899128913879395]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 13.0, 14.0, 13.0, 16.0, 16.0, 21.0, 25.0, 20.0, 32.0, 32.0, 33.0, 31.0, 33.0, 37.0, 46.0, 43.0, 47.0, 34.0, 44.0, 31.0, 33.0, 30.0, 37.0, 37.0, 30.0, 41.0, 32.0, 24.0, 18.0, 16.0, 17.0, 15.0, 14.0, 12.0, 11.0, 4.0, 11.0, 5.0, 8.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.721414566040039, -7.469111919403076, -7.216809272766113, -6.96450662612915, -6.7122039794921875, -6.459901332855225, -6.207598686218262, -5.955296039581299, -5.702993392944336, -5.450690746307373, -5.19838809967041, -4.946085453033447, -4.693782806396484, -4.4414801597595215, -4.189177513122559, -3.9368748664855957, -3.684572219848633, -3.43226957321167, -3.179966926574707, -2.927664279937744, -2.6753616333007812, -2.4230589866638184, -2.1707563400268555, -1.9184536933898926, -1.6661510467529297, -1.4138484001159668, -1.161545753479004, -0.909243106842041, -0.6569404602050781, -0.40463781356811523, -0.15233516693115234, 0.09996747970581055, 0.35226917266845703, 0.6045718193054199, 0.8568744659423828, 1.1091771125793457, 1.3614797592163086, 1.6137824058532715, 1.8660850524902344, 2.1183876991271973, 2.37069034576416, 2.622992992401123, 2.875295639038086, 3.127598285675049, 3.3799009323120117, 3.6322035789489746, 3.8845062255859375, 4.1368088722229, 4.389111518859863, 4.641414165496826, 4.893716812133789, 5.146019458770752, 5.398322105407715, 5.650624752044678, 5.902927398681641, 6.1552300453186035, 6.407532691955566, 6.659835338592529, 6.912137985229492, 7.164440631866455, 7.416743278503418, 7.669045925140381, 7.921348571777344, 8.173650741577148, 8.42595386505127]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 7.0, 6.0, 23.0, 21.0, 42.0, 39.0, 82.0, 115.0, 193.0, 306.0, 481.0, 694.0, 1163.0, 1872.0, 3061.0, 5038.0, 8303.0, 13504.0, 23139.0, 36898.0, 58274.0, 86636.0, 118892.0, 144291.0, 147472.0, 128202.0, 96139.0, 65182.0, 41947.0, 25895.0, 16001.0, 9614.0, 5723.0, 3522.0, 2144.0, 1277.0, 812.0, 554.0, 338.0, 195.0, 145.0, 102.0, 63.0, 50.0, 27.0, 22.0, 15.0, 6.0, 10.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.109375, -7.871826171875, -7.63427734375, -7.396728515625, -7.1591796875, -6.921630859375, -6.68408203125, -6.446533203125, -6.208984375, -5.971435546875, -5.73388671875, -5.496337890625, -5.2587890625, -5.021240234375, -4.78369140625, -4.546142578125, -4.30859375, -4.071044921875, -3.83349609375, -3.595947265625, -3.3583984375, -3.120849609375, -2.88330078125, -2.645751953125, -2.408203125, -2.170654296875, -1.93310546875, -1.695556640625, -1.4580078125, -1.220458984375, -0.98291015625, -0.745361328125, -0.5078125, -0.270263671875, -0.03271484375, 0.204833984375, 0.4423828125, 0.679931640625, 0.91748046875, 1.155029296875, 1.392578125, 1.630126953125, 1.86767578125, 2.105224609375, 2.3427734375, 2.580322265625, 2.81787109375, 3.055419921875, 3.29296875, 3.530517578125, 3.76806640625, 4.005615234375, 4.2431640625, 4.480712890625, 4.71826171875, 4.955810546875, 5.193359375, 5.430908203125, 5.66845703125, 5.906005859375, 6.1435546875, 6.381103515625, 6.61865234375, 6.856201171875, 7.09375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 7.0, 5.0, 6.0, 8.0, 14.0, 13.0, 12.0, 20.0, 19.0, 21.0, 27.0, 25.0, 25.0, 46.0, 40.0, 32.0, 41.0, 34.0, 39.0, 40.0, 51.0, 45.0, 32.0, 29.0, 39.0, 35.0, 48.0, 28.0, 32.0, 28.0, 22.0, 19.0, 12.0, 17.0, 16.0, 14.0, 16.0, 9.0, 7.0, 5.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.640625, -7.3980712890625, -7.155517578125, -6.9129638671875, -6.67041015625, -6.4278564453125, -6.185302734375, -5.9427490234375, -5.7001953125, -5.4576416015625, -5.215087890625, -4.9725341796875, -4.72998046875, -4.4874267578125, -4.244873046875, -4.0023193359375, -3.759765625, -3.5172119140625, -3.274658203125, -3.0321044921875, -2.78955078125, -2.5469970703125, -2.304443359375, -2.0618896484375, -1.8193359375, -1.5767822265625, -1.334228515625, -1.0916748046875, -0.84912109375, -0.6065673828125, -0.364013671875, -0.1214599609375, 0.12109375, 0.3636474609375, 0.606201171875, 0.8487548828125, 1.09130859375, 1.3338623046875, 1.576416015625, 1.8189697265625, 2.0615234375, 2.3040771484375, 2.546630859375, 2.7891845703125, 3.03173828125, 3.2742919921875, 3.516845703125, 3.7593994140625, 4.001953125, 4.2445068359375, 4.487060546875, 4.7296142578125, 4.97216796875, 5.2147216796875, 5.457275390625, 5.6998291015625, 5.9423828125, 6.1849365234375, 6.427490234375, 6.6700439453125, 6.91259765625, 7.1551513671875, 7.397705078125, 7.6402587890625, 7.8828125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 8.0, 21.0, 14.0, 28.0, 56.0, 52.0, 92.0, 125.0, 194.0, 310.0, 452.0, 633.0, 984.0, 1519.0, 2449.0, 3767.0, 6018.0, 9470.0, 15067.0, 24067.0, 38160.0, 58056.0, 85816.0, 116681.0, 139963.0, 143786.0, 124561.0, 93603.0, 65326.0, 43041.0, 27130.0, 17146.0, 11043.0, 6845.0, 4243.0, 2683.0, 1739.0, 1127.0, 720.0, 518.0, 339.0, 222.0, 163.0, 100.0, 59.0, 59.0, 23.0, 20.0, 18.0, 17.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0], "bins": [-6.93359375, -6.724365234375, -6.51513671875, -6.305908203125, -6.0966796875, -5.887451171875, -5.67822265625, -5.468994140625, -5.259765625, -5.050537109375, -4.84130859375, -4.632080078125, -4.4228515625, -4.213623046875, -4.00439453125, -3.795166015625, -3.5859375, -3.376708984375, -3.16748046875, -2.958251953125, -2.7490234375, -2.539794921875, -2.33056640625, -2.121337890625, -1.912109375, -1.702880859375, -1.49365234375, -1.284423828125, -1.0751953125, -0.865966796875, -0.65673828125, -0.447509765625, -0.23828125, -0.029052734375, 0.18017578125, 0.389404296875, 0.5986328125, 0.807861328125, 1.01708984375, 1.226318359375, 1.435546875, 1.644775390625, 1.85400390625, 2.063232421875, 2.2724609375, 2.481689453125, 2.69091796875, 2.900146484375, 3.109375, 3.318603515625, 3.52783203125, 3.737060546875, 3.9462890625, 4.155517578125, 4.36474609375, 4.573974609375, 4.783203125, 4.992431640625, 5.20166015625, 5.410888671875, 5.6201171875, 5.829345703125, 6.03857421875, 6.247802734375, 6.45703125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 8.0, 7.0, 5.0, 12.0, 5.0, 10.0, 14.0, 11.0, 15.0, 22.0, 21.0, 20.0, 23.0, 40.0, 35.0, 38.0, 29.0, 36.0, 36.0, 40.0, 42.0, 51.0, 46.0, 37.0, 40.0, 35.0, 32.0, 35.0, 31.0, 36.0, 22.0, 25.0, 24.0, 16.0, 24.0, 17.0, 11.0, 10.0, 9.0, 7.0, 7.0, 10.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.54510498046875, -4.3870849609375, -4.22906494140625, -4.071044921875, -3.91302490234375, -3.7550048828125, -3.59698486328125, -3.43896484375, -3.28094482421875, -3.1229248046875, -2.96490478515625, -2.806884765625, -2.64886474609375, -2.4908447265625, -2.33282470703125, -2.1748046875, -2.01678466796875, -1.8587646484375, -1.70074462890625, -1.542724609375, -1.38470458984375, -1.2266845703125, -1.06866455078125, -0.91064453125, -0.75262451171875, -0.5946044921875, -0.43658447265625, -0.278564453125, -0.12054443359375, 0.0374755859375, 0.19549560546875, 0.353515625, 0.51153564453125, 0.6695556640625, 0.82757568359375, 0.985595703125, 1.14361572265625, 1.3016357421875, 1.45965576171875, 1.61767578125, 1.77569580078125, 1.9337158203125, 2.09173583984375, 2.249755859375, 2.40777587890625, 2.5657958984375, 2.72381591796875, 2.8818359375, 3.03985595703125, 3.1978759765625, 3.35589599609375, 3.513916015625, 3.67193603515625, 3.8299560546875, 3.98797607421875, 4.14599609375, 4.30401611328125, 4.4620361328125, 4.62005615234375, 4.778076171875, 4.93609619140625, 5.0941162109375, 5.25213623046875, 5.41015625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 6.0, 13.0, 16.0, 9.0, 31.0, 33.0, 35.0, 80.0, 103.0, 156.0, 273.0, 439.0, 762.0, 1374.0, 2727.0, 5934.0, 13728.0, 35749.0, 101377.0, 258992.0, 341919.0, 179180.0, 64120.0, 23197.0, 9451.0, 4138.0, 2052.0, 1036.0, 620.0, 332.0, 223.0, 117.0, 110.0, 57.0, 45.0, 34.0, 20.0, 21.0, 9.0, 9.0, 2.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.05859375, -8.7265625, -8.39453125, -8.0625, -7.73046875, -7.3984375, -7.06640625, -6.734375, -6.40234375, -6.0703125, -5.73828125, -5.40625, -5.07421875, -4.7421875, -4.41015625, -4.078125, -3.74609375, -3.4140625, -3.08203125, -2.75, -2.41796875, -2.0859375, -1.75390625, -1.421875, -1.08984375, -0.7578125, -0.42578125, -0.09375, 0.23828125, 0.5703125, 0.90234375, 1.234375, 1.56640625, 1.8984375, 2.23046875, 2.5625, 2.89453125, 3.2265625, 3.55859375, 3.890625, 4.22265625, 4.5546875, 4.88671875, 5.21875, 5.55078125, 5.8828125, 6.21484375, 6.546875, 6.87890625, 7.2109375, 7.54296875, 7.875, 8.20703125, 8.5390625, 8.87109375, 9.203125, 9.53515625, 9.8671875, 10.19921875, 10.53125, 10.86328125, 11.1953125, 11.52734375, 11.859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 9.0, 15.0, 13.0, 12.0, 10.0, 28.0, 27.0, 39.0, 41.0, 40.0, 58.0, 62.0, 72.0, 76.0, 67.0, 71.0, 54.0, 51.0, 40.0, 42.0, 44.0, 26.0, 28.0, 19.0, 17.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006656646728515625, -0.0006448626518249512, -0.0006240606307983398, -0.0006032586097717285, -0.0005824565887451172, -0.0005616545677185059, -0.0005408525466918945, -0.0005200505256652832, -0.0004992485046386719, -0.00047844648361206055, -0.0004576444625854492, -0.0004368424415588379, -0.00041604042053222656, -0.00039523839950561523, -0.0003744363784790039, -0.0003536343574523926, -0.00033283233642578125, -0.0003120303153991699, -0.0002912282943725586, -0.00027042627334594727, -0.00024962425231933594, -0.0002288222312927246, -0.00020802021026611328, -0.00018721818923950195, -0.00016641616821289062, -0.0001456141471862793, -0.00012481212615966797, -0.00010401010513305664, -8.320808410644531e-05, -6.240606307983398e-05, -4.1604042053222656e-05, -2.0802021026611328e-05, 0.0, 2.0802021026611328e-05, 4.1604042053222656e-05, 6.240606307983398e-05, 8.320808410644531e-05, 0.00010401010513305664, 0.00012481212615966797, 0.0001456141471862793, 0.00016641616821289062, 0.00018721818923950195, 0.00020802021026611328, 0.0002288222312927246, 0.00024962425231933594, 0.00027042627334594727, 0.0002912282943725586, 0.0003120303153991699, 0.00033283233642578125, 0.0003536343574523926, 0.0003744363784790039, 0.00039523839950561523, 0.00041604042053222656, 0.0004368424415588379, 0.0004576444625854492, 0.00047844648361206055, 0.0004992485046386719, 0.0005200505256652832, 0.0005408525466918945, 0.0005616545677185059, 0.0005824565887451172, 0.0006032586097717285, 0.0006240606307983398, 0.0006448626518249512, 0.0006656646728515625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 8.0, 4.0, 9.0, 8.0, 18.0, 21.0, 46.0, 44.0, 79.0, 109.0, 178.0, 259.0, 478.0, 818.0, 1429.0, 2486.0, 4603.0, 8717.0, 16789.0, 33095.0, 65904.0, 124679.0, 200568.0, 225892.0, 167169.0, 94781.0, 48507.0, 24503.0, 12565.0, 6575.0, 3526.0, 1916.0, 1023.0, 690.0, 378.0, 240.0, 157.0, 98.0, 73.0, 35.0, 24.0, 18.0, 11.0, 5.0, 7.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.96875, -6.75933837890625, -6.5499267578125, -6.34051513671875, -6.131103515625, -5.92169189453125, -5.7122802734375, -5.50286865234375, -5.29345703125, -5.08404541015625, -4.8746337890625, -4.66522216796875, -4.455810546875, -4.24639892578125, -4.0369873046875, -3.82757568359375, -3.6181640625, -3.40875244140625, -3.1993408203125, -2.98992919921875, -2.780517578125, -2.57110595703125, -2.3616943359375, -2.15228271484375, -1.94287109375, -1.73345947265625, -1.5240478515625, -1.31463623046875, -1.105224609375, -0.89581298828125, -0.6864013671875, -0.47698974609375, -0.267578125, -0.05816650390625, 0.1512451171875, 0.36065673828125, 0.570068359375, 0.77947998046875, 0.9888916015625, 1.19830322265625, 1.40771484375, 1.61712646484375, 1.8265380859375, 2.03594970703125, 2.245361328125, 2.45477294921875, 2.6641845703125, 2.87359619140625, 3.0830078125, 3.29241943359375, 3.5018310546875, 3.71124267578125, 3.920654296875, 4.13006591796875, 4.3394775390625, 4.54888916015625, 4.75830078125, 4.96771240234375, 5.1771240234375, 5.38653564453125, 5.595947265625, 5.80535888671875, 6.0147705078125, 6.22418212890625, 6.43359375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 10.0, 9.0, 13.0, 24.0, 20.0, 32.0, 38.0, 31.0, 38.0, 36.0, 54.0, 60.0, 64.0, 70.0, 72.0, 61.0, 68.0, 54.0, 45.0, 33.0, 36.0, 21.0, 29.0, 14.0, 11.0, 9.0, 16.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5, -1.438812255859375, -1.37762451171875, -1.316436767578125, -1.2552490234375, -1.194061279296875, -1.13287353515625, -1.071685791015625, -1.010498046875, -0.949310302734375, -0.88812255859375, -0.826934814453125, -0.7657470703125, -0.704559326171875, -0.64337158203125, -0.582183837890625, -0.52099609375, -0.459808349609375, -0.39862060546875, -0.337432861328125, -0.2762451171875, -0.215057373046875, -0.15386962890625, -0.092681884765625, -0.031494140625, 0.029693603515625, 0.09088134765625, 0.152069091796875, 0.2132568359375, 0.274444580078125, 0.33563232421875, 0.396820068359375, 0.4580078125, 0.519195556640625, 0.58038330078125, 0.641571044921875, 0.7027587890625, 0.763946533203125, 0.82513427734375, 0.886322021484375, 0.947509765625, 1.008697509765625, 1.06988525390625, 1.131072998046875, 1.1922607421875, 1.253448486328125, 1.31463623046875, 1.375823974609375, 1.43701171875, 1.498199462890625, 1.55938720703125, 1.620574951171875, 1.6817626953125, 1.742950439453125, 1.80413818359375, 1.865325927734375, 1.926513671875, 1.987701416015625, 2.04888916015625, 2.110076904296875, 2.1712646484375, 2.232452392578125, 2.29364013671875, 2.354827880859375, 2.416015625]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 6.0, 10.0, 10.0, 14.0, 9.0, 8.0, 13.0, 18.0, 25.0, 35.0, 34.0, 34.0, 46.0, 51.0, 59.0, 62.0, 64.0, 53.0, 69.0, 51.0, 44.0, 50.0, 47.0, 34.0, 33.0, 19.0, 21.0, 18.0, 10.0, 17.0, 10.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.958701133728027, -10.670417785644531, -10.382135391235352, -10.093852043151855, -9.80556869506836, -9.51728630065918, -9.229002952575684, -8.940719604492188, -8.652437210083008, -8.364153861999512, -8.075871467590332, -7.787588119506836, -7.499305248260498, -7.21102237701416, -6.922739028930664, -6.634456157684326, -6.346173286437988, -6.05789041519165, -5.7696075439453125, -5.481324195861816, -5.1930413246154785, -4.904758453369141, -4.6164751052856445, -4.328192234039307, -4.039909362792969, -3.751626491546631, -3.463343381881714, -3.175060272216797, -2.886777400970459, -2.598494529724121, -2.310211420059204, -2.021928310394287, -1.7336454391479492, -1.4453624486923218, -1.1570794582366943, -0.8687964677810669, -0.5805134773254395, -0.292230486869812, -0.00394749641418457, 0.2843356132507324, 0.5726184844970703, 0.8609014749526978, 1.1491844654083252, 1.4374674558639526, 1.72575044631958, 2.014033317565918, 2.302316427230835, 2.590599536895752, 2.87888240814209, 3.1671652793884277, 3.4554483890533447, 3.7437314987182617, 4.0320143699646, 4.3202972412109375, 4.608580589294434, 4.8968634605407715, 5.185146331787109, 5.473429203033447, 5.761712074279785, 6.049995422363281, 6.338278293609619, 6.626561164855957, 6.914844512939453, 7.203127384185791, 7.491410255432129]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 10.0, 11.0, 1.0, 2.0, 6.0, 10.0, 15.0, 21.0, 13.0, 10.0, 13.0, 25.0, 13.0, 16.0, 28.0, 27.0, 28.0, 34.0, 39.0, 24.0, 38.0, 36.0, 43.0, 36.0, 35.0, 39.0, 29.0, 38.0, 41.0, 33.0, 22.0, 26.0, 28.0, 27.0, 22.0, 23.0, 20.0, 17.0, 12.0, 18.0, 20.0, 7.0, 7.0, 8.0, 8.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.7469258308410645, -6.521121978759766, -6.295317649841309, -6.06951379776001, -5.843709945678711, -5.617905616760254, -5.392101764678955, -5.166297912597656, -4.940493583679199, -4.7146897315979, -4.488885402679443, -4.2630815505981445, -4.037277698516846, -3.8114736080169678, -3.58566951751709, -3.359865665435791, -3.134061813354492, -2.9082577228546143, -2.6824538707733154, -2.4566497802734375, -2.2308459281921387, -2.0050418376922607, -1.7792377471923828, -1.5534337759017944, -1.327629804611206, -1.1018258333206177, -0.8760218024253845, -0.6502177715301514, -0.424413800239563, -0.1986098289489746, 0.02719426155090332, 0.2529982328414917, 0.4788026809692383, 0.7046066522598267, 0.9304106831550598, 1.156214714050293, 1.3820186853408813, 1.6078226566314697, 1.8336267471313477, 2.0594305992126465, 2.2852346897125244, 2.5110387802124023, 2.736842632293701, 2.962646722793579, 3.188450813293457, 3.414254665374756, 3.640058755874634, 3.8658628463745117, 4.0916666984558105, 4.317470550537109, 4.543274879455566, 4.769078731536865, 4.994882583618164, 5.220686912536621, 5.44649076461792, 5.672294616699219, 5.898098945617676, 6.123902797698975, 6.349707126617432, 6.5755109786987305, 6.801314830780029, 7.027118682861328, 7.252923011779785, 7.478726863861084, 7.704530715942383]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 9.0, 12.0, 15.0, 20.0, 23.0, 54.0, 87.0, 99.0, 204.0, 298.0, 476.0, 812.0, 1261.0, 2252.0, 3779.0, 6662.0, 12100.0, 22973.0, 46221.0, 101098.0, 241169.0, 569316.0, 1023374.0, 1057998.0, 621325.0, 266334.0, 110864.0, 50429.0, 24476.0, 12875.0, 7311.0, 4104.0, 2367.0, 1427.0, 904.0, 569.0, 330.0, 238.0, 137.0, 85.0, 63.0, 43.0, 26.0, 20.0, 15.0, 4.0, 6.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.5703125, -8.302978515625, -8.03564453125, -7.768310546875, -7.5009765625, -7.233642578125, -6.96630859375, -6.698974609375, -6.431640625, -6.164306640625, -5.89697265625, -5.629638671875, -5.3623046875, -5.094970703125, -4.82763671875, -4.560302734375, -4.29296875, -4.025634765625, -3.75830078125, -3.490966796875, -3.2236328125, -2.956298828125, -2.68896484375, -2.421630859375, -2.154296875, -1.886962890625, -1.61962890625, -1.352294921875, -1.0849609375, -0.817626953125, -0.55029296875, -0.282958984375, -0.015625, 0.251708984375, 0.51904296875, 0.786376953125, 1.0537109375, 1.321044921875, 1.58837890625, 1.855712890625, 2.123046875, 2.390380859375, 2.65771484375, 2.925048828125, 3.1923828125, 3.459716796875, 3.72705078125, 3.994384765625, 4.26171875, 4.529052734375, 4.79638671875, 5.063720703125, 5.3310546875, 5.598388671875, 5.86572265625, 6.133056640625, 6.400390625, 6.667724609375, 6.93505859375, 7.202392578125, 7.4697265625, 7.737060546875, 8.00439453125, 8.271728515625, 8.5390625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 14.0, 6.0, 5.0, 14.0, 23.0, 15.0, 17.0, 17.0, 20.0, 23.0, 19.0, 24.0, 32.0, 36.0, 31.0, 45.0, 37.0, 38.0, 45.0, 46.0, 38.0, 36.0, 38.0, 42.0, 28.0, 30.0, 30.0, 28.0, 35.0, 31.0, 20.0, 19.0, 19.0, 14.0, 15.0, 13.0, 9.0, 8.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.15234375, -4.978759765625, -4.80517578125, -4.631591796875, -4.4580078125, -4.284423828125, -4.11083984375, -3.937255859375, -3.763671875, -3.590087890625, -3.41650390625, -3.242919921875, -3.0693359375, -2.895751953125, -2.72216796875, -2.548583984375, -2.375, -2.201416015625, -2.02783203125, -1.854248046875, -1.6806640625, -1.507080078125, -1.33349609375, -1.159912109375, -0.986328125, -0.812744140625, -0.63916015625, -0.465576171875, -0.2919921875, -0.118408203125, 0.05517578125, 0.228759765625, 0.40234375, 0.575927734375, 0.74951171875, 0.923095703125, 1.0966796875, 1.270263671875, 1.44384765625, 1.617431640625, 1.791015625, 1.964599609375, 2.13818359375, 2.311767578125, 2.4853515625, 2.658935546875, 2.83251953125, 3.006103515625, 3.1796875, 3.353271484375, 3.52685546875, 3.700439453125, 3.8740234375, 4.047607421875, 4.22119140625, 4.394775390625, 4.568359375, 4.741943359375, 4.91552734375, 5.089111328125, 5.2626953125, 5.436279296875, 5.60986328125, 5.783447265625, 5.95703125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 3.0, 8.0, 15.0, 13.0, 26.0, 30.0, 34.0, 68.0, 93.0, 123.0, 205.0, 284.0, 426.0, 600.0, 959.0, 1613.0, 2399.0, 3872.0, 6445.0, 10805.0, 18749.0, 34382.0, 63515.0, 124335.0, 249059.0, 483471.0, 814585.0, 943242.0, 674950.0, 369288.0, 185735.0, 92761.0, 48426.0, 26402.0, 14689.0, 8579.0, 5266.0, 3135.0, 2036.0, 1231.0, 778.0, 546.0, 355.0, 222.0, 156.0, 113.0, 86.0, 58.0, 29.0, 29.0, 22.0, 14.0, 14.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2578125, -7.0181884765625, -6.778564453125, -6.5389404296875, -6.29931640625, -6.0596923828125, -5.820068359375, -5.5804443359375, -5.3408203125, -5.1011962890625, -4.861572265625, -4.6219482421875, -4.38232421875, -4.1427001953125, -3.903076171875, -3.6634521484375, -3.423828125, -3.1842041015625, -2.944580078125, -2.7049560546875, -2.46533203125, -2.2257080078125, -1.986083984375, -1.7464599609375, -1.5068359375, -1.2672119140625, -1.027587890625, -0.7879638671875, -0.54833984375, -0.3087158203125, -0.069091796875, 0.1705322265625, 0.41015625, 0.6497802734375, 0.889404296875, 1.1290283203125, 1.36865234375, 1.6082763671875, 1.847900390625, 2.0875244140625, 2.3271484375, 2.5667724609375, 2.806396484375, 3.0460205078125, 3.28564453125, 3.5252685546875, 3.764892578125, 4.0045166015625, 4.244140625, 4.4837646484375, 4.723388671875, 4.9630126953125, 5.20263671875, 5.4422607421875, 5.681884765625, 5.9215087890625, 6.1611328125, 6.4007568359375, 6.640380859375, 6.8800048828125, 7.11962890625, 7.3592529296875, 7.598876953125, 7.8385009765625, 8.078125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 4.0, 10.0, 10.0, 18.0, 7.0, 25.0, 27.0, 39.0, 40.0, 48.0, 57.0, 80.0, 96.0, 112.0, 149.0, 160.0, 212.0, 233.0, 283.0, 239.0, 286.0, 280.0, 225.0, 236.0, 182.0, 208.0, 163.0, 120.0, 101.0, 100.0, 77.0, 53.0, 42.0, 35.0, 24.0, 25.0, 9.0, 12.0, 9.0, 10.0, 9.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.984375, -2.9019775390625, -2.819580078125, -2.7371826171875, -2.65478515625, -2.5723876953125, -2.489990234375, -2.4075927734375, -2.3251953125, -2.2427978515625, -2.160400390625, -2.0780029296875, -1.99560546875, -1.9132080078125, -1.830810546875, -1.7484130859375, -1.666015625, -1.5836181640625, -1.501220703125, -1.4188232421875, -1.33642578125, -1.2540283203125, -1.171630859375, -1.0892333984375, -1.0068359375, -0.9244384765625, -0.842041015625, -0.7596435546875, -0.67724609375, -0.5948486328125, -0.512451171875, -0.4300537109375, -0.34765625, -0.2652587890625, -0.182861328125, -0.1004638671875, -0.01806640625, 0.0643310546875, 0.146728515625, 0.2291259765625, 0.3115234375, 0.3939208984375, 0.476318359375, 0.5587158203125, 0.64111328125, 0.7235107421875, 0.805908203125, 0.8883056640625, 0.970703125, 1.0531005859375, 1.135498046875, 1.2178955078125, 1.30029296875, 1.3826904296875, 1.465087890625, 1.5474853515625, 1.6298828125, 1.7122802734375, 1.794677734375, 1.8770751953125, 1.95947265625, 2.0418701171875, 2.124267578125, 2.2066650390625, 2.2890625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 2.0, 6.0, 6.0, 9.0, 6.0, 3.0, 14.0, 14.0, 15.0, 25.0, 23.0, 30.0, 40.0, 49.0, 50.0, 52.0, 63.0, 62.0, 68.0, 72.0, 46.0, 51.0, 52.0, 53.0, 38.0, 29.0, 20.0, 20.0, 19.0, 15.0, 10.0, 17.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-10.62624454498291, -10.362457275390625, -10.098669052124023, -9.834881782531738, -9.571094512939453, -9.307306289672852, -9.043519020080566, -8.779731750488281, -8.51594352722168, -8.252156257629395, -7.988368511199951, -7.724580764770508, -7.460793495178223, -7.197005748748779, -6.933218002319336, -6.669430732727051, -6.405643463134766, -6.141855716705322, -5.878068447113037, -5.614280700683594, -5.350493431091309, -5.086705684661865, -4.822917938232422, -4.559130668640137, -4.295342922210693, -4.03155517578125, -3.767767906188965, -3.5039801597595215, -3.2401926517486572, -2.976405143737793, -2.7126173973083496, -2.4488298892974854, -2.185041904449463, -1.9212543964385986, -1.6574667692184448, -1.393679141998291, -1.1298916339874268, -0.8661041259765625, -0.6023164987564087, -0.3385288715362549, -0.07474136352539062, 0.1890462040901184, 0.45283377170562744, 0.7166213393211365, 0.9804089069366455, 1.2441964149475098, 1.5079840421676636, 1.7717716693878174, 2.0355591773986816, 2.299346685409546, 2.56313419342041, 2.8269219398498535, 3.0907094478607178, 3.354496955871582, 3.6182847023010254, 3.8820722103118896, 4.145859718322754, 4.409647464752197, 4.673434734344482, 4.937222480773926, 5.201009750366211, 5.464797496795654, 5.728585243225098, 5.992372512817383, 6.256160259246826]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 12.0, 4.0, 14.0, 14.0, 15.0, 18.0, 21.0, 16.0, 26.0, 23.0, 19.0, 43.0, 36.0, 33.0, 36.0, 37.0, 34.0, 38.0, 39.0, 31.0, 55.0, 34.0, 28.0, 43.0, 25.0, 28.0, 35.0, 31.0, 29.0, 23.0, 27.0, 11.0, 17.0, 13.0, 11.0, 9.0, 8.0, 14.0, 6.0, 7.0, 2.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-6.255807876586914, -6.064458847045898, -5.873109817504883, -5.681760311126709, -5.490411281585693, -5.299062252044678, -5.107712745666504, -4.916363716125488, -4.725014686584473, -4.533665657043457, -4.342316627502441, -4.150967121124268, -3.959618091583252, -3.7682690620422363, -3.5769197940826416, -3.385570526123047, -3.1942214965820312, -3.0028724670410156, -2.811523199081421, -2.620173931121826, -2.4288249015808105, -2.237475872039795, -2.0461266040802, -1.854777455329895, -1.6634283065795898, -1.4720791578292847, -1.2807300090789795, -1.0893808603286743, -0.8980317115783691, -0.706682562828064, -0.5153334140777588, -0.3239842653274536, -0.13263463973999023, 0.05871450901031494, 0.2500636577606201, 0.4414128065109253, 0.6327619552612305, 0.8241111040115356, 1.0154602527618408, 1.206809401512146, 1.3981585502624512, 1.5895076990127563, 1.7808568477630615, 1.9722059965133667, 2.163555145263672, 2.3549041748046875, 2.5462534427642822, 2.737602710723877, 2.9289517402648926, 3.120300769805908, 3.311650037765503, 3.5029993057250977, 3.6943483352661133, 3.885697364807129, 4.0770463943481445, 4.268395900726318, 4.459744930267334, 4.65109395980835, 4.842443466186523, 5.033792495727539, 5.225141525268555, 5.41649055480957, 5.607839584350586, 5.79918909072876, 5.990538120269775]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 7.0, 4.0, 21.0, 17.0, 22.0, 55.0, 64.0, 80.0, 111.0, 154.0, 250.0, 355.0, 532.0, 783.0, 1155.0, 1764.0, 2841.0, 4737.0, 8313.0, 15869.0, 32841.0, 74114.0, 176949.0, 311741.0, 228185.0, 99736.0, 42797.0, 19729.0, 10174.0, 5772.0, 3343.0, 1982.0, 1309.0, 909.0, 549.0, 425.0, 258.0, 171.0, 124.0, 91.0, 78.0, 39.0, 33.0, 27.0, 25.0, 9.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.421875, -17.85791015625, -17.2939453125, -16.72998046875, -16.166015625, -15.60205078125, -15.0380859375, -14.47412109375, -13.91015625, -13.34619140625, -12.7822265625, -12.21826171875, -11.654296875, -11.09033203125, -10.5263671875, -9.96240234375, -9.3984375, -8.83447265625, -8.2705078125, -7.70654296875, -7.142578125, -6.57861328125, -6.0146484375, -5.45068359375, -4.88671875, -4.32275390625, -3.7587890625, -3.19482421875, -2.630859375, -2.06689453125, -1.5029296875, -0.93896484375, -0.375, 0.18896484375, 0.7529296875, 1.31689453125, 1.880859375, 2.44482421875, 3.0087890625, 3.57275390625, 4.13671875, 4.70068359375, 5.2646484375, 5.82861328125, 6.392578125, 6.95654296875, 7.5205078125, 8.08447265625, 8.6484375, 9.21240234375, 9.7763671875, 10.34033203125, 10.904296875, 11.46826171875, 12.0322265625, 12.59619140625, 13.16015625, 13.72412109375, 14.2880859375, 14.85205078125, 15.416015625, 15.97998046875, 16.5439453125, 17.10791015625, 17.671875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 9.0, 11.0, 5.0, 11.0, 10.0, 9.0, 17.0, 12.0, 26.0, 27.0, 23.0, 26.0, 27.0, 36.0, 36.0, 30.0, 37.0, 36.0, 40.0, 39.0, 29.0, 45.0, 38.0, 41.0, 30.0, 30.0, 30.0, 39.0, 35.0, 31.0, 26.0, 22.0, 30.0, 21.0, 18.0, 9.0, 8.0, 6.0, 10.0, 6.0, 10.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.2421875, -6.0567626953125, -5.871337890625, -5.6859130859375, -5.50048828125, -5.3150634765625, -5.129638671875, -4.9442138671875, -4.7587890625, -4.5733642578125, -4.387939453125, -4.2025146484375, -4.01708984375, -3.8316650390625, -3.646240234375, -3.4608154296875, -3.275390625, -3.0899658203125, -2.904541015625, -2.7191162109375, -2.53369140625, -2.3482666015625, -2.162841796875, -1.9774169921875, -1.7919921875, -1.6065673828125, -1.421142578125, -1.2357177734375, -1.05029296875, -0.8648681640625, -0.679443359375, -0.4940185546875, -0.30859375, -0.1231689453125, 0.062255859375, 0.2476806640625, 0.43310546875, 0.6185302734375, 0.803955078125, 0.9893798828125, 1.1748046875, 1.3602294921875, 1.545654296875, 1.7310791015625, 1.91650390625, 2.1019287109375, 2.287353515625, 2.4727783203125, 2.658203125, 2.8436279296875, 3.029052734375, 3.2144775390625, 3.39990234375, 3.5853271484375, 3.770751953125, 3.9561767578125, 4.1416015625, 4.3270263671875, 4.512451171875, 4.6978759765625, 4.88330078125, 5.0687255859375, 5.254150390625, 5.4395751953125, 5.625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 16.0, 26.0, 24.0, 45.0, 49.0, 94.0, 133.0, 194.0, 299.0, 462.0, 750.0, 1109.0, 1812.0, 3120.0, 5384.0, 10289.0, 20974.0, 47833.0, 124349.0, 319649.0, 306118.0, 116733.0, 45621.0, 20109.0, 9922.0, 5371.0, 2968.0, 1818.0, 1131.0, 724.0, 491.0, 276.0, 211.0, 137.0, 102.0, 62.0, 40.0, 23.0, 17.0, 13.0, 9.0, 7.0, 10.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-18.75, -18.14453125, -17.5390625, -16.93359375, -16.328125, -15.72265625, -15.1171875, -14.51171875, -13.90625, -13.30078125, -12.6953125, -12.08984375, -11.484375, -10.87890625, -10.2734375, -9.66796875, -9.0625, -8.45703125, -7.8515625, -7.24609375, -6.640625, -6.03515625, -5.4296875, -4.82421875, -4.21875, -3.61328125, -3.0078125, -2.40234375, -1.796875, -1.19140625, -0.5859375, 0.01953125, 0.625, 1.23046875, 1.8359375, 2.44140625, 3.046875, 3.65234375, 4.2578125, 4.86328125, 5.46875, 6.07421875, 6.6796875, 7.28515625, 7.890625, 8.49609375, 9.1015625, 9.70703125, 10.3125, 10.91796875, 11.5234375, 12.12890625, 12.734375, 13.33984375, 13.9453125, 14.55078125, 15.15625, 15.76171875, 16.3671875, 16.97265625, 17.578125, 18.18359375, 18.7890625, 19.39453125, 20.0]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 10.0, 9.0, 3.0, 8.0, 15.0, 11.0, 6.0, 22.0, 19.0, 32.0, 23.0, 28.0, 19.0, 27.0, 43.0, 23.0, 44.0, 33.0, 40.0, 34.0, 49.0, 45.0, 43.0, 37.0, 38.0, 42.0, 30.0, 43.0, 20.0, 28.0, 27.0, 23.0, 25.0, 17.0, 16.0, 15.0, 12.0, 9.0, 7.0, 3.0, 5.0, 10.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.12109375, -3.992919921875, -3.86474609375, -3.736572265625, -3.6083984375, -3.480224609375, -3.35205078125, -3.223876953125, -3.095703125, -2.967529296875, -2.83935546875, -2.711181640625, -2.5830078125, -2.454833984375, -2.32666015625, -2.198486328125, -2.0703125, -1.942138671875, -1.81396484375, -1.685791015625, -1.5576171875, -1.429443359375, -1.30126953125, -1.173095703125, -1.044921875, -0.916748046875, -0.78857421875, -0.660400390625, -0.5322265625, -0.404052734375, -0.27587890625, -0.147705078125, -0.01953125, 0.108642578125, 0.23681640625, 0.364990234375, 0.4931640625, 0.621337890625, 0.74951171875, 0.877685546875, 1.005859375, 1.134033203125, 1.26220703125, 1.390380859375, 1.5185546875, 1.646728515625, 1.77490234375, 1.903076171875, 2.03125, 2.159423828125, 2.28759765625, 2.415771484375, 2.5439453125, 2.672119140625, 2.80029296875, 2.928466796875, 3.056640625, 3.184814453125, 3.31298828125, 3.441162109375, 3.5693359375, 3.697509765625, 3.82568359375, 3.953857421875, 4.08203125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 1.0, 10.0, 9.0, 12.0, 23.0, 20.0, 43.0, 37.0, 54.0, 76.0, 104.0, 149.0, 205.0, 253.0, 416.0, 511.0, 686.0, 885.0, 1296.0, 1997.0, 3533.0, 8482.0, 28859.0, 175373.0, 628156.0, 153196.0, 26236.0, 7643.0, 3374.0, 2026.0, 1379.0, 950.0, 607.0, 487.0, 383.0, 288.0, 184.0, 148.0, 130.0, 76.0, 72.0, 51.0, 26.0, 33.0, 23.0, 21.0, 11.0, 9.0, 2.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.109375, -15.597412109375, -15.08544921875, -14.573486328125, -14.0615234375, -13.549560546875, -13.03759765625, -12.525634765625, -12.013671875, -11.501708984375, -10.98974609375, -10.477783203125, -9.9658203125, -9.453857421875, -8.94189453125, -8.429931640625, -7.91796875, -7.406005859375, -6.89404296875, -6.382080078125, -5.8701171875, -5.358154296875, -4.84619140625, -4.334228515625, -3.822265625, -3.310302734375, -2.79833984375, -2.286376953125, -1.7744140625, -1.262451171875, -0.75048828125, -0.238525390625, 0.2734375, 0.785400390625, 1.29736328125, 1.809326171875, 2.3212890625, 2.833251953125, 3.34521484375, 3.857177734375, 4.369140625, 4.881103515625, 5.39306640625, 5.905029296875, 6.4169921875, 6.928955078125, 7.44091796875, 7.952880859375, 8.46484375, 8.976806640625, 9.48876953125, 10.000732421875, 10.5126953125, 11.024658203125, 11.53662109375, 12.048583984375, 12.560546875, 13.072509765625, 13.58447265625, 14.096435546875, 14.6083984375, 15.120361328125, 15.63232421875, 16.144287109375, 16.65625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 12.0, 33.0, 79.0, 262.0, 365.0, 130.0, 52.0, 28.0, 10.0, 10.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014810562133789062, -0.001428559422492981, -0.0013760626316070557, -0.0013235658407211304, -0.001271069049835205, -0.0012185722589492798, -0.0011660754680633545, -0.0011135786771774292, -0.001061081886291504, -0.0010085850954055786, -0.0009560883045196533, -0.000903591513633728, -0.0008510947227478027, -0.0007985979318618774, -0.0007461011409759521, -0.0006936043500900269, -0.0006411075592041016, -0.0005886107683181763, -0.000536113977432251, -0.0004836171865463257, -0.0004311203956604004, -0.0003786236047744751, -0.0003261268138885498, -0.0002736300230026245, -0.00022113323211669922, -0.00016863644123077393, -0.00011613965034484863, -6.364285945892334e-05, -1.1146068572998047e-05, 4.1350722312927246e-05, 9.384751319885254e-05, 0.00014634430408477783, 0.00019884109497070312, 0.0002513378858566284, 0.0003038346767425537, 0.000356331467628479, 0.0004088282585144043, 0.0004613250494003296, 0.0005138218402862549, 0.0005663186311721802, 0.0006188154220581055, 0.0006713122129440308, 0.0007238090038299561, 0.0007763057947158813, 0.0008288025856018066, 0.0008812993764877319, 0.0009337961673736572, 0.0009862929582595825, 0.0010387897491455078, 0.001091286540031433, 0.0011437833309173584, 0.0011962801218032837, 0.001248776912689209, 0.0013012737035751343, 0.0013537704944610596, 0.0014062672853469849, 0.0014587640762329102, 0.0015112608671188354, 0.0015637576580047607, 0.001616254448890686, 0.0016687512397766113, 0.0017212480306625366, 0.001773744821548462, 0.0018262416124343872, 0.0018787384033203125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 7.0, 5.0, 6.0, 6.0, 17.0, 18.0, 20.0, 34.0, 51.0, 52.0, 76.0, 113.0, 135.0, 154.0, 229.0, 307.0, 359.0, 482.0, 621.0, 825.0, 1042.0, 1536.0, 2149.0, 3461.0, 6288.0, 14645.0, 45936.0, 167264.0, 401873.0, 274858.0, 80216.0, 23154.0, 8686.0, 4346.0, 2655.0, 1739.0, 1262.0, 912.0, 735.0, 537.0, 408.0, 313.0, 231.0, 200.0, 155.0, 117.0, 90.0, 68.0, 41.0, 33.0, 28.0, 21.0, 13.0, 12.0, 7.0, 9.0, 6.0, 6.0, 1.0, 0.0, 1.0], "bins": [-10.4921875, -10.161376953125, -9.83056640625, -9.499755859375, -9.1689453125, -8.838134765625, -8.50732421875, -8.176513671875, -7.845703125, -7.514892578125, -7.18408203125, -6.853271484375, -6.5224609375, -6.191650390625, -5.86083984375, -5.530029296875, -5.19921875, -4.868408203125, -4.53759765625, -4.206787109375, -3.8759765625, -3.545166015625, -3.21435546875, -2.883544921875, -2.552734375, -2.221923828125, -1.89111328125, -1.560302734375, -1.2294921875, -0.898681640625, -0.56787109375, -0.237060546875, 0.09375, 0.424560546875, 0.75537109375, 1.086181640625, 1.4169921875, 1.747802734375, 2.07861328125, 2.409423828125, 2.740234375, 3.071044921875, 3.40185546875, 3.732666015625, 4.0634765625, 4.394287109375, 4.72509765625, 5.055908203125, 5.38671875, 5.717529296875, 6.04833984375, 6.379150390625, 6.7099609375, 7.040771484375, 7.37158203125, 7.702392578125, 8.033203125, 8.364013671875, 8.69482421875, 9.025634765625, 9.3564453125, 9.687255859375, 10.01806640625, 10.348876953125, 10.6796875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 5.0, 19.0, 17.0, 25.0, 45.0, 64.0, 84.0, 104.0, 117.0, 119.0, 100.0, 92.0, 59.0, 42.0, 24.0, 16.0, 18.0, 9.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.330078125, -3.21923828125, -3.1083984375, -2.99755859375, -2.88671875, -2.77587890625, -2.6650390625, -2.55419921875, -2.443359375, -2.33251953125, -2.2216796875, -2.11083984375, -2.0, -1.88916015625, -1.7783203125, -1.66748046875, -1.556640625, -1.44580078125, -1.3349609375, -1.22412109375, -1.11328125, -1.00244140625, -0.8916015625, -0.78076171875, -0.669921875, -0.55908203125, -0.4482421875, -0.33740234375, -0.2265625, -0.11572265625, -0.0048828125, 0.10595703125, 0.216796875, 0.32763671875, 0.4384765625, 0.54931640625, 0.66015625, 0.77099609375, 0.8818359375, 0.99267578125, 1.103515625, 1.21435546875, 1.3251953125, 1.43603515625, 1.546875, 1.65771484375, 1.7685546875, 1.87939453125, 1.990234375, 2.10107421875, 2.2119140625, 2.32275390625, 2.43359375, 2.54443359375, 2.6552734375, 2.76611328125, 2.876953125, 2.98779296875, 3.0986328125, 3.20947265625, 3.3203125, 3.43115234375, 3.5419921875, 3.65283203125, 3.763671875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 3.0, 5.0, 2.0, 5.0, 10.0, 17.0, 11.0, 30.0, 29.0, 34.0, 39.0, 37.0, 43.0, 61.0, 45.0, 55.0, 58.0, 57.0, 66.0, 64.0, 40.0, 35.0, 50.0, 33.0, 35.0, 26.0, 20.0, 15.0, 9.0, 14.0, 14.0, 9.0, 5.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-8.80270767211914, -8.575565338134766, -8.348422050476074, -8.1212797164917, -7.894136428833008, -7.666993618011475, -7.439850807189941, -7.212707996368408, -6.985565185546875, -6.758422374725342, -6.531279563903809, -6.304136753082275, -6.076993942260742, -5.849851131439209, -5.622708320617676, -5.395565509796143, -5.168422698974609, -4.941279888153076, -4.714137077331543, -4.48699426651001, -4.259851455688477, -4.032708644866943, -3.80556583404541, -3.578423023223877, -3.351280689239502, -3.1241378784179688, -2.8969950675964355, -2.6698522567749023, -2.442709445953369, -2.215566635131836, -1.9884239435195923, -1.761281132698059, -1.5341382026672363, -1.3069953918457031, -1.07985258102417, -0.8527098298072815, -0.6255670189857483, -0.39842426776885986, -0.17128145694732666, 0.05586135387420654, 0.28300416469573975, 0.510146975517273, 0.7372897863388062, 0.9644325375556946, 1.191575288772583, 1.4187180995941162, 1.6458609104156494, 1.8730037212371826, 2.100146532058716, 2.327289342880249, 2.5544321537017822, 2.7815749645233154, 3.0087177753448486, 3.2358603477478027, 3.463003158569336, 3.690145969390869, 3.9172887802124023, 4.1444315910339355, 4.371574401855469, 4.598717212677002, 4.825860023498535, 5.053002834320068, 5.280145645141602, 5.507288455963135, 5.734431266784668]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 8.0, 7.0, 9.0, 7.0, 11.0, 23.0, 14.0, 21.0, 17.0, 19.0, 25.0, 30.0, 25.0, 31.0, 38.0, 29.0, 30.0, 48.0, 34.0, 41.0, 38.0, 36.0, 31.0, 37.0, 39.0, 46.0, 33.0, 25.0, 26.0, 34.0, 26.0, 20.0, 20.0, 22.0, 20.0, 16.0, 13.0, 3.0, 5.0, 14.0, 6.0, 2.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0], "bins": [-6.523237705230713, -6.344842433929443, -6.166447162628174, -5.988051891326904, -5.809656620025635, -5.631261348724365, -5.4528656005859375, -5.274470329284668, -5.096075057983398, -4.917679786682129, -4.739284515380859, -4.56088924407959, -4.38249397277832, -4.204098701477051, -4.025703430175781, -3.8473079204559326, -3.668912887573242, -3.4905176162719727, -3.312122344970703, -3.1337270736694336, -2.955331802368164, -2.7769365310668945, -2.598541021347046, -2.4201457500457764, -2.241750478744507, -2.0633552074432373, -1.8849599361419678, -1.7065645456314087, -1.5281692743301392, -1.3497740030288696, -1.1713786125183105, -0.992983341217041, -0.8145875930786133, -0.6361923217773438, -0.45779699087142944, -0.27940165996551514, -0.1010063886642456, 0.07738888263702393, 0.255784273147583, 0.43417954444885254, 0.6125748157501221, 0.7909700870513916, 0.9693654179573059, 1.1477607488632202, 1.3261560201644897, 1.5045512914657593, 1.6829466819763184, 1.861341953277588, 2.0397372245788574, 2.218132495880127, 2.3965277671813965, 2.574923038482666, 2.7533183097839355, 2.931713581085205, 3.1101090908050537, 3.2885043621063232, 3.4668996334075928, 3.6452949047088623, 3.823690176010132, 4.0020856857299805, 4.18048095703125, 4.3588762283325195, 4.537271499633789, 4.715666770935059, 4.894062042236328]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 11.0, 15.0, 22.0, 37.0, 48.0, 69.0, 116.0, 191.0, 273.0, 445.0, 636.0, 1036.0, 1727.0, 2776.0, 4618.0, 8141.0, 14014.0, 24995.0, 42953.0, 72816.0, 113896.0, 156719.0, 174770.0, 152930.0, 109350.0, 68894.0, 41093.0, 23588.0, 13417.0, 7486.0, 4385.0, 2600.0, 1614.0, 1010.0, 653.0, 387.0, 317.0, 167.0, 102.0, 80.0, 39.0, 34.0, 29.0, 15.0, 16.0, 5.0, 4.0, 9.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.8671875, -6.6678466796875, -6.468505859375, -6.2691650390625, -6.06982421875, -5.8704833984375, -5.671142578125, -5.4718017578125, -5.2724609375, -5.0731201171875, -4.873779296875, -4.6744384765625, -4.47509765625, -4.2757568359375, -4.076416015625, -3.8770751953125, -3.677734375, -3.4783935546875, -3.279052734375, -3.0797119140625, -2.88037109375, -2.6810302734375, -2.481689453125, -2.2823486328125, -2.0830078125, -1.8836669921875, -1.684326171875, -1.4849853515625, -1.28564453125, -1.0863037109375, -0.886962890625, -0.6876220703125, -0.48828125, -0.2889404296875, -0.089599609375, 0.1097412109375, 0.30908203125, 0.5084228515625, 0.707763671875, 0.9071044921875, 1.1064453125, 1.3057861328125, 1.505126953125, 1.7044677734375, 1.90380859375, 2.1031494140625, 2.302490234375, 2.5018310546875, 2.701171875, 2.9005126953125, 3.099853515625, 3.2991943359375, 3.49853515625, 3.6978759765625, 3.897216796875, 4.0965576171875, 4.2958984375, 4.4952392578125, 4.694580078125, 4.8939208984375, 5.09326171875, 5.2926025390625, 5.491943359375, 5.6912841796875, 5.890625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 5.0, 7.0, 12.0, 11.0, 8.0, 14.0, 16.0, 18.0, 21.0, 22.0, 17.0, 29.0, 35.0, 24.0, 41.0, 34.0, 23.0, 28.0, 38.0, 40.0, 41.0, 40.0, 33.0, 41.0, 35.0, 33.0, 41.0, 23.0, 28.0, 30.0, 22.0, 22.0, 23.0, 16.0, 18.0, 15.0, 16.0, 18.0, 9.0, 10.0, 6.0, 4.0, 4.0, 7.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.7109375, -5.54229736328125, -5.3736572265625, -5.20501708984375, -5.036376953125, -4.86773681640625, -4.6990966796875, -4.53045654296875, -4.36181640625, -4.19317626953125, -4.0245361328125, -3.85589599609375, -3.687255859375, -3.51861572265625, -3.3499755859375, -3.18133544921875, -3.0126953125, -2.84405517578125, -2.6754150390625, -2.50677490234375, -2.338134765625, -2.16949462890625, -2.0008544921875, -1.83221435546875, -1.66357421875, -1.49493408203125, -1.3262939453125, -1.15765380859375, -0.989013671875, -0.82037353515625, -0.6517333984375, -0.48309326171875, -0.314453125, -0.14581298828125, 0.0228271484375, 0.19146728515625, 0.360107421875, 0.52874755859375, 0.6973876953125, 0.86602783203125, 1.03466796875, 1.20330810546875, 1.3719482421875, 1.54058837890625, 1.709228515625, 1.87786865234375, 2.0465087890625, 2.21514892578125, 2.3837890625, 2.55242919921875, 2.7210693359375, 2.88970947265625, 3.058349609375, 3.22698974609375, 3.3956298828125, 3.56427001953125, 3.73291015625, 3.90155029296875, 4.0701904296875, 4.23883056640625, 4.407470703125, 4.57611083984375, 4.7447509765625, 4.91339111328125, 5.08203125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 6.0, 7.0, 6.0, 16.0, 16.0, 17.0, 45.0, 69.0, 120.0, 178.0, 262.0, 386.0, 641.0, 1036.0, 1580.0, 2624.0, 4269.0, 7301.0, 12123.0, 21270.0, 36645.0, 61890.0, 101442.0, 147380.0, 176156.0, 163917.0, 120676.0, 77240.0, 46076.0, 26916.0, 15512.0, 8867.0, 5390.0, 3172.0, 1960.0, 1224.0, 799.0, 455.0, 301.0, 190.0, 131.0, 83.0, 60.0, 35.0, 27.0, 18.0, 9.0, 6.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.202880859375, -5.01513671875, -4.827392578125, -4.6396484375, -4.451904296875, -4.26416015625, -4.076416015625, -3.888671875, -3.700927734375, -3.51318359375, -3.325439453125, -3.1376953125, -2.949951171875, -2.76220703125, -2.574462890625, -2.38671875, -2.198974609375, -2.01123046875, -1.823486328125, -1.6357421875, -1.447998046875, -1.26025390625, -1.072509765625, -0.884765625, -0.697021484375, -0.50927734375, -0.321533203125, -0.1337890625, 0.053955078125, 0.24169921875, 0.429443359375, 0.6171875, 0.804931640625, 0.99267578125, 1.180419921875, 1.3681640625, 1.555908203125, 1.74365234375, 1.931396484375, 2.119140625, 2.306884765625, 2.49462890625, 2.682373046875, 2.8701171875, 3.057861328125, 3.24560546875, 3.433349609375, 3.62109375, 3.808837890625, 3.99658203125, 4.184326171875, 4.3720703125, 4.559814453125, 4.74755859375, 4.935302734375, 5.123046875, 5.310791015625, 5.49853515625, 5.686279296875, 5.8740234375, 6.061767578125, 6.24951171875, 6.437255859375, 6.625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 7.0, 14.0, 13.0, 9.0, 13.0, 17.0, 27.0, 28.0, 33.0, 33.0, 27.0, 35.0, 33.0, 28.0, 37.0, 36.0, 49.0, 34.0, 40.0, 41.0, 39.0, 40.0, 26.0, 33.0, 36.0, 36.0, 31.0, 20.0, 33.0, 14.0, 11.0, 20.0, 17.0, 13.0, 17.0, 13.0, 11.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.83203125, -3.7100830078125, -3.588134765625, -3.4661865234375, -3.34423828125, -3.2222900390625, -3.100341796875, -2.9783935546875, -2.8564453125, -2.7344970703125, -2.612548828125, -2.4906005859375, -2.36865234375, -2.2467041015625, -2.124755859375, -2.0028076171875, -1.880859375, -1.7589111328125, -1.636962890625, -1.5150146484375, -1.39306640625, -1.2711181640625, -1.149169921875, -1.0272216796875, -0.9052734375, -0.7833251953125, -0.661376953125, -0.5394287109375, -0.41748046875, -0.2955322265625, -0.173583984375, -0.0516357421875, 0.0703125, 0.1922607421875, 0.314208984375, 0.4361572265625, 0.55810546875, 0.6800537109375, 0.802001953125, 0.9239501953125, 1.0458984375, 1.1678466796875, 1.289794921875, 1.4117431640625, 1.53369140625, 1.6556396484375, 1.777587890625, 1.8995361328125, 2.021484375, 2.1434326171875, 2.265380859375, 2.3873291015625, 2.50927734375, 2.6312255859375, 2.753173828125, 2.8751220703125, 2.9970703125, 3.1190185546875, 3.240966796875, 3.3629150390625, 3.48486328125, 3.6068115234375, 3.728759765625, 3.8507080078125, 3.97265625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 4.0, 6.0, 1.0, 13.0, 22.0, 16.0, 24.0, 42.0, 62.0, 75.0, 111.0, 166.0, 241.0, 287.0, 431.0, 539.0, 852.0, 1180.0, 1663.0, 2639.0, 3923.0, 6260.0, 10200.0, 17848.0, 32712.0, 63578.0, 121776.0, 201223.0, 226573.0, 161639.0, 88277.0, 45460.0, 24114.0, 13349.0, 7934.0, 5046.0, 3169.0, 2162.0, 1395.0, 1029.0, 743.0, 517.0, 348.0, 253.0, 186.0, 148.0, 105.0, 67.0, 50.0, 29.0, 29.0, 12.0, 17.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.2421875, -4.1064453125, -3.970703125, -3.8349609375, -3.69921875, -3.5634765625, -3.427734375, -3.2919921875, -3.15625, -3.0205078125, -2.884765625, -2.7490234375, -2.61328125, -2.4775390625, -2.341796875, -2.2060546875, -2.0703125, -1.9345703125, -1.798828125, -1.6630859375, -1.52734375, -1.3916015625, -1.255859375, -1.1201171875, -0.984375, -0.8486328125, -0.712890625, -0.5771484375, -0.44140625, -0.3056640625, -0.169921875, -0.0341796875, 0.1015625, 0.2373046875, 0.373046875, 0.5087890625, 0.64453125, 0.7802734375, 0.916015625, 1.0517578125, 1.1875, 1.3232421875, 1.458984375, 1.5947265625, 1.73046875, 1.8662109375, 2.001953125, 2.1376953125, 2.2734375, 2.4091796875, 2.544921875, 2.6806640625, 2.81640625, 2.9521484375, 3.087890625, 3.2236328125, 3.359375, 3.4951171875, 3.630859375, 3.7666015625, 3.90234375, 4.0380859375, 4.173828125, 4.3095703125, 4.4453125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 9.0, 9.0, 9.0, 17.0, 38.0, 39.0, 49.0, 64.0, 103.0, 113.0, 119.0, 110.0, 80.0, 74.0, 39.0, 39.0, 11.0, 18.0, 6.0, 8.0, 7.0, 3.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007581710815429688, -0.0007371976971626282, -0.0007162243127822876, -0.000695250928401947, -0.0006742775440216064, -0.0006533041596412659, -0.0006323307752609253, -0.0006113573908805847, -0.0005903840065002441, -0.0005694106221199036, -0.000548437237739563, -0.0005274638533592224, -0.0005064904689788818, -0.00048551708459854126, -0.0004645437002182007, -0.0004435703158378601, -0.00042259693145751953, -0.00040162354707717896, -0.0003806501626968384, -0.0003596767783164978, -0.0003387033939361572, -0.00031773000955581665, -0.0002967566251754761, -0.0002757832407951355, -0.0002548098564147949, -0.00023383647203445435, -0.00021286308765411377, -0.0001918897032737732, -0.00017091631889343262, -0.00014994293451309204, -0.00012896955013275146, -0.00010799616575241089, -8.702278137207031e-05, -6.604939699172974e-05, -4.507601261138916e-05, -2.4102628231048584e-05, -3.129243850708008e-06, 1.784414052963257e-05, 3.8817524909973145e-05, 5.979090929031372e-05, 8.07642936706543e-05, 0.00010173767805099487, 0.00012271106243133545, 0.00014368444681167603, 0.0001646578311920166, 0.00018563121557235718, 0.00020660459995269775, 0.00022757798433303833, 0.0002485513687133789, 0.0002695247530937195, 0.00029049813747406006, 0.00031147152185440063, 0.0003324449062347412, 0.0003534182906150818, 0.00037439167499542236, 0.00039536505937576294, 0.0004163384437561035, 0.0004373118281364441, 0.00045828521251678467, 0.00047925859689712524, 0.0005002319812774658, 0.0005212053656578064, 0.000542178750038147, 0.0005631521344184875, 0.0005841255187988281]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 13.0, 16.0, 23.0, 59.0, 78.0, 99.0, 140.0, 225.0, 309.0, 440.0, 646.0, 1037.0, 1654.0, 2589.0, 4047.0, 6727.0, 11575.0, 20449.0, 36184.0, 63441.0, 109414.0, 168028.0, 197433.0, 167233.0, 108648.0, 63218.0, 35404.0, 20047.0, 11498.0, 6765.0, 3990.0, 2470.0, 1590.0, 1023.0, 653.0, 411.0, 275.0, 225.0, 152.0, 104.0, 66.0, 62.0, 33.0, 14.0, 14.0, 13.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.8203125, -3.70623779296875, -3.5921630859375, -3.47808837890625, -3.364013671875, -3.24993896484375, -3.1358642578125, -3.02178955078125, -2.90771484375, -2.79364013671875, -2.6795654296875, -2.56549072265625, -2.451416015625, -2.33734130859375, -2.2232666015625, -2.10919189453125, -1.9951171875, -1.88104248046875, -1.7669677734375, -1.65289306640625, -1.538818359375, -1.42474365234375, -1.3106689453125, -1.19659423828125, -1.08251953125, -0.96844482421875, -0.8543701171875, -0.74029541015625, -0.626220703125, -0.51214599609375, -0.3980712890625, -0.28399658203125, -0.169921875, -0.05584716796875, 0.0582275390625, 0.17230224609375, 0.286376953125, 0.40045166015625, 0.5145263671875, 0.62860107421875, 0.74267578125, 0.85675048828125, 0.9708251953125, 1.08489990234375, 1.198974609375, 1.31304931640625, 1.4271240234375, 1.54119873046875, 1.6552734375, 1.76934814453125, 1.8834228515625, 1.99749755859375, 2.111572265625, 2.22564697265625, 2.3397216796875, 2.45379638671875, 2.56787109375, 2.68194580078125, 2.7960205078125, 2.91009521484375, 3.024169921875, 3.13824462890625, 3.2523193359375, 3.36639404296875, 3.48046875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 2.0, 11.0, 5.0, 12.0, 8.0, 14.0, 18.0, 26.0, 33.0, 38.0, 44.0, 41.0, 59.0, 64.0, 81.0, 70.0, 65.0, 56.0, 58.0, 52.0, 54.0, 27.0, 36.0, 34.0, 14.0, 20.0, 14.0, 6.0, 2.0, 7.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5556640625, -1.5105743408203125, -1.465484619140625, -1.4203948974609375, -1.37530517578125, -1.3302154541015625, -1.285125732421875, -1.2400360107421875, -1.1949462890625, -1.1498565673828125, -1.104766845703125, -1.0596771240234375, -1.01458740234375, -0.9694976806640625, -0.924407958984375, -0.8793182373046875, -0.834228515625, -0.7891387939453125, -0.744049072265625, -0.6989593505859375, -0.65386962890625, -0.6087799072265625, -0.563690185546875, -0.5186004638671875, -0.4735107421875, -0.4284210205078125, -0.383331298828125, -0.3382415771484375, -0.29315185546875, -0.2480621337890625, -0.202972412109375, -0.1578826904296875, -0.11279296875, -0.0677032470703125, -0.022613525390625, 0.0224761962890625, 0.06756591796875, 0.1126556396484375, 0.157745361328125, 0.2028350830078125, 0.2479248046875, 0.2930145263671875, 0.338104248046875, 0.3831939697265625, 0.42828369140625, 0.4733734130859375, 0.518463134765625, 0.5635528564453125, 0.608642578125, 0.6537322998046875, 0.698822021484375, 0.7439117431640625, 0.78900146484375, 0.8340911865234375, 0.879180908203125, 0.9242706298828125, 0.9693603515625, 1.0144500732421875, 1.059539794921875, 1.1046295166015625, 1.14971923828125, 1.1948089599609375, 1.239898681640625, 1.2849884033203125, 1.330078125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 1.0, 3.0, 9.0, 11.0, 10.0, 11.0, 10.0, 14.0, 10.0, 20.0, 31.0, 20.0, 33.0, 42.0, 48.0, 48.0, 57.0, 50.0, 58.0, 51.0, 56.0, 46.0, 45.0, 46.0, 37.0, 41.0, 30.0, 25.0, 29.0, 20.0, 17.0, 14.0, 11.0, 15.0, 9.0, 6.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.092888832092285, -7.885030746459961, -7.677173137664795, -7.469315052032471, -7.261457443237305, -7.0535993576049805, -6.8457417488098145, -6.63788366317749, -6.430026054382324, -6.22216796875, -6.014310359954834, -5.80645227432251, -5.598594665527344, -5.3907365798950195, -5.1828789710998535, -4.975020885467529, -4.767163276672363, -4.559305191040039, -4.351447582244873, -4.143589496612549, -3.935731887817383, -3.7278738021850586, -3.5200161933898926, -3.3121581077575684, -3.104300022125244, -2.896442174911499, -2.688584327697754, -2.480726480484009, -2.2728686332702637, -2.0650105476379395, -1.8571528196334839, -1.6492949724197388, -1.4414372444152832, -1.233579397201538, -1.025721549987793, -0.8178636431694031, -0.610005795955658, -0.40214788913726807, -0.19429004192352295, 0.013567805290222168, 0.22142565250396729, 0.4292834997177124, 0.6371413469314575, 0.8449992537498474, 1.0528571605682373, 1.2607150077819824, 1.4685728549957275, 1.6764307022094727, 1.8842885494232178, 2.092146396636963, 2.300004243850708, 2.507862091064453, 2.7157199382781982, 2.9235777854919434, 3.1314358711242676, 3.3392934799194336, 3.547151565551758, 3.755009412765503, 3.962867259979248, 4.170725345611572, 4.378582954406738, 4.5864410400390625, 4.7942986488342285, 5.002156734466553, 5.210014343261719]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 8.0, 12.0, 6.0, 8.0, 15.0, 18.0, 15.0, 12.0, 22.0, 27.0, 25.0, 32.0, 27.0, 42.0, 31.0, 30.0, 36.0, 24.0, 36.0, 40.0, 47.0, 28.0, 44.0, 40.0, 33.0, 31.0, 26.0, 28.0, 30.0, 27.0, 24.0, 20.0, 18.0, 21.0, 21.0, 14.0, 9.0, 12.0, 11.0, 5.0, 10.0, 7.0, 7.0, 0.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.523662567138672, -5.341506481170654, -5.1593499183654785, -4.977193832397461, -4.795037269592285, -4.612881183624268, -4.43072509765625, -4.248568534851074, -4.066412448883057, -3.88425612449646, -3.7020998001098633, -3.5199437141418457, -3.337787389755249, -3.1556310653686523, -2.9734747409820557, -2.791318416595459, -2.6091620922088623, -2.4270057678222656, -2.244849443435669, -2.0626931190490723, -1.8805370330810547, -1.698380708694458, -1.5162243843078613, -1.3340681791305542, -1.1519118547439575, -0.9697555899620056, -0.7875993251800537, -0.605443000793457, -0.4232867360115051, -0.24113047122955322, -0.05897414684295654, 0.12318205833435059, 0.30533838272094727, 0.48749464750289917, 0.6696509122848511, 0.8518072366714478, 1.0339634418487549, 1.2161197662353516, 1.3982760906219482, 1.5804322957992554, 1.762588620185852, 1.9447449445724487, 2.126901149749756, 2.3090574741363525, 2.491213798522949, 2.673369884490967, 2.8555264472961426, 3.03768253326416, 3.219838857650757, 3.4019951820373535, 3.58415150642395, 3.766307830810547, 3.9484639167785645, 4.130620002746582, 4.312776565551758, 4.494932651519775, 4.677089214324951, 4.859245300292969, 5.0414018630981445, 5.223557949066162, 5.405714511871338, 5.5878705978393555, 5.770027160644531, 5.952183246612549, 6.134339332580566]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 8.0, 7.0, 11.0, 16.0, 20.0, 35.0, 50.0, 85.0, 133.0, 159.0, 269.0, 356.0, 519.0, 745.0, 1119.0, 1608.0, 2559.0, 4043.0, 6241.0, 10188.0, 17239.0, 31099.0, 60579.0, 133079.0, 317843.0, 717057.0, 1102891.0, 926504.0, 476616.0, 200150.0, 86262.0, 41645.0, 21979.0, 12650.0, 7330.0, 4663.0, 2919.0, 1929.0, 1202.0, 871.0, 545.0, 399.0, 234.0, 154.0, 103.0, 64.0, 45.0, 24.0, 23.0, 12.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.14453125, -6.944580078125, -6.74462890625, -6.544677734375, -6.3447265625, -6.144775390625, -5.94482421875, -5.744873046875, -5.544921875, -5.344970703125, -5.14501953125, -4.945068359375, -4.7451171875, -4.545166015625, -4.34521484375, -4.145263671875, -3.9453125, -3.745361328125, -3.54541015625, -3.345458984375, -3.1455078125, -2.945556640625, -2.74560546875, -2.545654296875, -2.345703125, -2.145751953125, -1.94580078125, -1.745849609375, -1.5458984375, -1.345947265625, -1.14599609375, -0.946044921875, -0.74609375, -0.546142578125, -0.34619140625, -0.146240234375, 0.0537109375, 0.253662109375, 0.45361328125, 0.653564453125, 0.853515625, 1.053466796875, 1.25341796875, 1.453369140625, 1.6533203125, 1.853271484375, 2.05322265625, 2.253173828125, 2.453125, 2.653076171875, 2.85302734375, 3.052978515625, 3.2529296875, 3.452880859375, 3.65283203125, 3.852783203125, 4.052734375, 4.252685546875, 4.45263671875, 4.652587890625, 4.8525390625, 5.052490234375, 5.25244140625, 5.452392578125, 5.65234375]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 5.0, 9.0, 11.0, 7.0, 18.0, 17.0, 11.0, 21.0, 27.0, 27.0, 24.0, 43.0, 32.0, 39.0, 32.0, 45.0, 45.0, 35.0, 38.0, 35.0, 39.0, 41.0, 45.0, 50.0, 39.0, 19.0, 24.0, 30.0, 34.0, 21.0, 18.0, 18.0, 20.0, 11.0, 10.0, 15.0, 7.0, 7.0, 3.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.984375, -3.8470458984375, -3.709716796875, -3.5723876953125, -3.43505859375, -3.2977294921875, -3.160400390625, -3.0230712890625, -2.8857421875, -2.7484130859375, -2.611083984375, -2.4737548828125, -2.33642578125, -2.1990966796875, -2.061767578125, -1.9244384765625, -1.787109375, -1.6497802734375, -1.512451171875, -1.3751220703125, -1.23779296875, -1.1004638671875, -0.963134765625, -0.8258056640625, -0.6884765625, -0.5511474609375, -0.413818359375, -0.2764892578125, -0.13916015625, -0.0018310546875, 0.135498046875, 0.2728271484375, 0.41015625, 0.5474853515625, 0.684814453125, 0.8221435546875, 0.95947265625, 1.0968017578125, 1.234130859375, 1.3714599609375, 1.5087890625, 1.6461181640625, 1.783447265625, 1.9207763671875, 2.05810546875, 2.1954345703125, 2.332763671875, 2.4700927734375, 2.607421875, 2.7447509765625, 2.882080078125, 3.0194091796875, 3.15673828125, 3.2940673828125, 3.431396484375, 3.5687255859375, 3.7060546875, 3.8433837890625, 3.980712890625, 4.1180419921875, 4.25537109375, 4.3927001953125, 4.530029296875, 4.6673583984375, 4.8046875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 7.0, 4.0, 4.0, 6.0, 11.0, 20.0, 34.0, 52.0, 68.0, 104.0, 145.0, 205.0, 274.0, 415.0, 663.0, 981.0, 1436.0, 2319.0, 3539.0, 5462.0, 8948.0, 14893.0, 25796.0, 47584.0, 92921.0, 195810.0, 412425.0, 808298.0, 1066446.0, 755369.0, 378601.0, 178607.0, 86644.0, 44680.0, 24190.0, 13891.0, 8437.0, 5332.0, 3369.0, 2160.0, 1322.0, 930.0, 642.0, 382.0, 279.0, 187.0, 135.0, 89.0, 54.0, 39.0, 36.0, 16.0, 11.0, 10.0, 7.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16796875, -5.9718017578125, -5.775634765625, -5.5794677734375, -5.38330078125, -5.1871337890625, -4.990966796875, -4.7947998046875, -4.5986328125, -4.4024658203125, -4.206298828125, -4.0101318359375, -3.81396484375, -3.6177978515625, -3.421630859375, -3.2254638671875, -3.029296875, -2.8331298828125, -2.636962890625, -2.4407958984375, -2.24462890625, -2.0484619140625, -1.852294921875, -1.6561279296875, -1.4599609375, -1.2637939453125, -1.067626953125, -0.8714599609375, -0.67529296875, -0.4791259765625, -0.282958984375, -0.0867919921875, 0.109375, 0.3055419921875, 0.501708984375, 0.6978759765625, 0.89404296875, 1.0902099609375, 1.286376953125, 1.4825439453125, 1.6787109375, 1.8748779296875, 2.071044921875, 2.2672119140625, 2.46337890625, 2.6595458984375, 2.855712890625, 3.0518798828125, 3.248046875, 3.4442138671875, 3.640380859375, 3.8365478515625, 4.03271484375, 4.2288818359375, 4.425048828125, 4.6212158203125, 4.8173828125, 5.0135498046875, 5.209716796875, 5.4058837890625, 5.60205078125, 5.7982177734375, 5.994384765625, 6.1905517578125, 6.38671875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 6.0, 9.0, 13.0, 11.0, 10.0, 10.0, 20.0, 25.0, 39.0, 38.0, 48.0, 68.0, 99.0, 97.0, 140.0, 192.0, 244.0, 312.0, 329.0, 353.0, 366.0, 351.0, 290.0, 244.0, 186.0, 154.0, 110.0, 71.0, 63.0, 53.0, 36.0, 30.0, 20.0, 12.0, 8.0, 6.0, 7.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.677734375, -2.59619140625, -2.5146484375, -2.43310546875, -2.3515625, -2.27001953125, -2.1884765625, -2.10693359375, -2.025390625, -1.94384765625, -1.8623046875, -1.78076171875, -1.69921875, -1.61767578125, -1.5361328125, -1.45458984375, -1.373046875, -1.29150390625, -1.2099609375, -1.12841796875, -1.046875, -0.96533203125, -0.8837890625, -0.80224609375, -0.720703125, -0.63916015625, -0.5576171875, -0.47607421875, -0.39453125, -0.31298828125, -0.2314453125, -0.14990234375, -0.068359375, 0.01318359375, 0.0947265625, 0.17626953125, 0.2578125, 0.33935546875, 0.4208984375, 0.50244140625, 0.583984375, 0.66552734375, 0.7470703125, 0.82861328125, 0.91015625, 0.99169921875, 1.0732421875, 1.15478515625, 1.236328125, 1.31787109375, 1.3994140625, 1.48095703125, 1.5625, 1.64404296875, 1.7255859375, 1.80712890625, 1.888671875, 1.97021484375, 2.0517578125, 2.13330078125, 2.21484375, 2.29638671875, 2.3779296875, 2.45947265625, 2.541015625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 7.0, 12.0, 6.0, 13.0, 17.0, 11.0, 31.0, 22.0, 25.0, 41.0, 51.0, 66.0, 54.0, 60.0, 74.0, 56.0, 68.0, 56.0, 57.0, 35.0, 33.0, 34.0, 38.0, 21.0, 21.0, 17.0, 12.0, 14.0, 14.0, 8.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.805457592010498, -7.606225490570068, -7.406993865966797, -7.207761764526367, -7.008530139923096, -6.809298038482666, -6.6100664138793945, -6.410834312438965, -6.211602210998535, -6.0123701095581055, -5.813138484954834, -5.613906383514404, -5.414674758911133, -5.215442657470703, -5.016210556030273, -4.816978931427002, -4.6177473068237305, -4.418515205383301, -4.219283580780029, -4.0200514793396, -3.820819854736328, -3.6215877532958984, -3.422355890274048, -3.2231240272521973, -3.0238921642303467, -2.824660301208496, -2.6254284381866455, -2.426196575164795, -2.2269644737243652, -2.0277328491210938, -1.828500747680664, -1.6292688846588135, -1.4300365447998047, -1.230804681777954, -1.0315728187561035, -0.8323408365249634, -0.6331089735031128, -0.4338771104812622, -0.23464512825012207, -0.035413265228271484, 0.1638185977935791, 0.3630504906177521, 0.562282383441925, 0.7615143060684204, 0.960746169090271, 1.1599780321121216, 1.3592100143432617, 1.5584418773651123, 1.757673740386963, 1.9569056034088135, 2.156137466430664, 2.3553695678710938, 2.5546011924743652, 2.753833293914795, 2.9530651569366455, 3.152297019958496, 3.3515288829803467, 3.5507607460021973, 3.749992609024048, 3.9492244720458984, 4.148456573486328, 4.3476881980896, 4.546920299530029, 4.746151924133301, 4.9453840255737305]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 8.0, 5.0, 4.0, 8.0, 16.0, 12.0, 11.0, 22.0, 17.0, 19.0, 31.0, 28.0, 29.0, 27.0, 30.0, 39.0, 40.0, 34.0, 41.0, 50.0, 26.0, 38.0, 33.0, 41.0, 36.0, 35.0, 28.0, 40.0, 28.0, 28.0, 26.0, 28.0, 21.0, 16.0, 20.0, 18.0, 11.0, 10.0, 6.0, 13.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.991107940673828, -4.833901405334473, -4.676694869995117, -4.519488334655762, -4.362281799316406, -4.205075263977051, -4.047868728637695, -3.89066219329834, -3.7334556579589844, -3.576249122619629, -3.4190425872802734, -3.261836051940918, -3.1046295166015625, -2.947422981262207, -2.7902164459228516, -2.633009910583496, -2.4758033752441406, -2.318596839904785, -2.1613903045654297, -2.004183769226074, -1.8469772338867188, -1.6897706985473633, -1.5325641632080078, -1.3753576278686523, -1.2181510925292969, -1.0609445571899414, -0.9037380218505859, -0.7465314865112305, -0.589324951171875, -0.43211841583251953, -0.27491188049316406, -0.1177053451538086, 0.03950071334838867, 0.19670724868774414, 0.3539137840270996, 0.5111203193664551, 0.6683268547058105, 0.825533390045166, 0.9827399253845215, 1.139946460723877, 1.2971529960632324, 1.454359531402588, 1.6115660667419434, 1.7687726020812988, 1.9259791374206543, 2.0831856727600098, 2.2403922080993652, 2.3975987434387207, 2.554805278778076, 2.7120118141174316, 2.869218349456787, 3.0264248847961426, 3.183631420135498, 3.3408379554748535, 3.498044490814209, 3.6552510261535645, 3.81245756149292, 3.9696640968322754, 4.126870632171631, 4.284077167510986, 4.441283702850342, 4.598490238189697, 4.755696773529053, 4.912903308868408, 5.070109844207764]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 16.0, 19.0, 18.0, 41.0, 69.0, 89.0, 118.0, 171.0, 231.0, 361.0, 502.0, 788.0, 1132.0, 1682.0, 2498.0, 3996.0, 6519.0, 10342.0, 17160.0, 28767.0, 48032.0, 80466.0, 128738.0, 177109.0, 183041.0, 136973.0, 86904.0, 52302.0, 31062.0, 18715.0, 11132.0, 6866.0, 4384.0, 2787.0, 1802.0, 1211.0, 797.0, 539.0, 390.0, 220.0, 176.0, 102.0, 69.0, 75.0, 37.0, 33.0, 14.0, 15.0, 13.0, 6.0, 8.0, 6.0, 2.0, 0.0, 0.0, 3.0], "bins": [-5.640625, -5.46478271484375, -5.2889404296875, -5.11309814453125, -4.937255859375, -4.76141357421875, -4.5855712890625, -4.40972900390625, -4.23388671875, -4.05804443359375, -3.8822021484375, -3.70635986328125, -3.530517578125, -3.35467529296875, -3.1788330078125, -3.00299072265625, -2.8271484375, -2.65130615234375, -2.4754638671875, -2.29962158203125, -2.123779296875, -1.94793701171875, -1.7720947265625, -1.59625244140625, -1.42041015625, -1.24456787109375, -1.0687255859375, -0.89288330078125, -0.717041015625, -0.54119873046875, -0.3653564453125, -0.18951416015625, -0.013671875, 0.16217041015625, 0.3380126953125, 0.51385498046875, 0.689697265625, 0.86553955078125, 1.0413818359375, 1.21722412109375, 1.39306640625, 1.56890869140625, 1.7447509765625, 1.92059326171875, 2.096435546875, 2.27227783203125, 2.4481201171875, 2.62396240234375, 2.7998046875, 2.97564697265625, 3.1514892578125, 3.32733154296875, 3.503173828125, 3.67901611328125, 3.8548583984375, 4.03070068359375, 4.20654296875, 4.38238525390625, 4.5582275390625, 4.73406982421875, 4.909912109375, 5.08575439453125, 5.2615966796875, 5.43743896484375, 5.61328125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 9.0, 14.0, 16.0, 11.0, 27.0, 26.0, 12.0, 28.0, 26.0, 27.0, 29.0, 32.0, 35.0, 41.0, 41.0, 35.0, 37.0, 37.0, 40.0, 34.0, 43.0, 34.0, 38.0, 32.0, 27.0, 22.0, 36.0, 29.0, 21.0, 26.0, 16.0, 16.0, 18.0, 9.0, 14.0, 4.0, 7.0, 8.0, 6.0, 2.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.754638671875, -4.59912109375, -4.443603515625, -4.2880859375, -4.132568359375, -3.97705078125, -3.821533203125, -3.666015625, -3.510498046875, -3.35498046875, -3.199462890625, -3.0439453125, -2.888427734375, -2.73291015625, -2.577392578125, -2.421875, -2.266357421875, -2.11083984375, -1.955322265625, -1.7998046875, -1.644287109375, -1.48876953125, -1.333251953125, -1.177734375, -1.022216796875, -0.86669921875, -0.711181640625, -0.5556640625, -0.400146484375, -0.24462890625, -0.089111328125, 0.06640625, 0.221923828125, 0.37744140625, 0.532958984375, 0.6884765625, 0.843994140625, 0.99951171875, 1.155029296875, 1.310546875, 1.466064453125, 1.62158203125, 1.777099609375, 1.9326171875, 2.088134765625, 2.24365234375, 2.399169921875, 2.5546875, 2.710205078125, 2.86572265625, 3.021240234375, 3.1767578125, 3.332275390625, 3.48779296875, 3.643310546875, 3.798828125, 3.954345703125, 4.10986328125, 4.265380859375, 4.4208984375, 4.576416015625, 4.73193359375, 4.887451171875, 5.04296875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 9.0, 9.0, 15.0, 19.0, 23.0, 22.0, 30.0, 44.0, 78.0, 70.0, 146.0, 254.0, 387.0, 704.0, 1453.0, 3067.0, 7116.0, 19484.0, 69092.0, 317183.0, 469532.0, 113146.0, 28907.0, 9662.0, 3965.0, 1865.0, 945.0, 513.0, 267.0, 164.0, 96.0, 79.0, 54.0, 27.0, 14.0, 24.0, 16.0, 11.0, 16.0, 12.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.893798828125, -18.28759765625, -17.681396484375, -17.0751953125, -16.468994140625, -15.86279296875, -15.256591796875, -14.650390625, -14.044189453125, -13.43798828125, -12.831787109375, -12.2255859375, -11.619384765625, -11.01318359375, -10.406982421875, -9.80078125, -9.194580078125, -8.58837890625, -7.982177734375, -7.3759765625, -6.769775390625, -6.16357421875, -5.557373046875, -4.951171875, -4.344970703125, -3.73876953125, -3.132568359375, -2.5263671875, -1.920166015625, -1.31396484375, -0.707763671875, -0.1015625, 0.504638671875, 1.11083984375, 1.717041015625, 2.3232421875, 2.929443359375, 3.53564453125, 4.141845703125, 4.748046875, 5.354248046875, 5.96044921875, 6.566650390625, 7.1728515625, 7.779052734375, 8.38525390625, 8.991455078125, 9.59765625, 10.203857421875, 10.81005859375, 11.416259765625, 12.0224609375, 12.628662109375, 13.23486328125, 13.841064453125, 14.447265625, 15.053466796875, 15.65966796875, 16.265869140625, 16.8720703125, 17.478271484375, 18.08447265625, 18.690673828125, 19.296875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 6.0, 11.0, 12.0, 9.0, 16.0, 18.0, 18.0, 22.0, 24.0, 21.0, 26.0, 27.0, 24.0, 37.0, 35.0, 44.0, 35.0, 30.0, 39.0, 44.0, 41.0, 43.0, 35.0, 50.0, 39.0, 37.0, 35.0, 20.0, 20.0, 21.0, 25.0, 17.0, 17.0, 20.0, 13.0, 5.0, 11.0, 10.0, 6.0, 5.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.65234375, -3.55047607421875, -3.4486083984375, -3.34674072265625, -3.244873046875, -3.14300537109375, -3.0411376953125, -2.93927001953125, -2.83740234375, -2.73553466796875, -2.6336669921875, -2.53179931640625, -2.429931640625, -2.32806396484375, -2.2261962890625, -2.12432861328125, -2.0224609375, -1.92059326171875, -1.8187255859375, -1.71685791015625, -1.614990234375, -1.51312255859375, -1.4112548828125, -1.30938720703125, -1.20751953125, -1.10565185546875, -1.0037841796875, -0.90191650390625, -0.800048828125, -0.69818115234375, -0.5963134765625, -0.49444580078125, -0.392578125, -0.29071044921875, -0.1888427734375, -0.08697509765625, 0.014892578125, 0.11676025390625, 0.2186279296875, 0.32049560546875, 0.42236328125, 0.52423095703125, 0.6260986328125, 0.72796630859375, 0.829833984375, 0.93170166015625, 1.0335693359375, 1.13543701171875, 1.2373046875, 1.33917236328125, 1.4410400390625, 1.54290771484375, 1.644775390625, 1.74664306640625, 1.8485107421875, 1.95037841796875, 2.05224609375, 2.15411376953125, 2.2559814453125, 2.35784912109375, 2.459716796875, 2.56158447265625, 2.6634521484375, 2.76531982421875, 2.8671875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 15.0, 10.0, 12.0, 14.0, 39.0, 42.0, 65.0, 72.0, 115.0, 200.0, 290.0, 462.0, 712.0, 1234.0, 2170.0, 4415.0, 9319.0, 22976.0, 68441.0, 246123.0, 448685.0, 163283.0, 47565.0, 16999.0, 7211.0, 3466.0, 1840.0, 1038.0, 613.0, 398.0, 217.0, 152.0, 111.0, 70.0, 60.0, 40.0, 18.0, 14.0, 11.0, 11.0, 8.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.42578125, -6.206787109375, -5.98779296875, -5.768798828125, -5.5498046875, -5.330810546875, -5.11181640625, -4.892822265625, -4.673828125, -4.454833984375, -4.23583984375, -4.016845703125, -3.7978515625, -3.578857421875, -3.35986328125, -3.140869140625, -2.921875, -2.702880859375, -2.48388671875, -2.264892578125, -2.0458984375, -1.826904296875, -1.60791015625, -1.388916015625, -1.169921875, -0.950927734375, -0.73193359375, -0.512939453125, -0.2939453125, -0.074951171875, 0.14404296875, 0.363037109375, 0.58203125, 0.801025390625, 1.02001953125, 1.239013671875, 1.4580078125, 1.677001953125, 1.89599609375, 2.114990234375, 2.333984375, 2.552978515625, 2.77197265625, 2.990966796875, 3.2099609375, 3.428955078125, 3.64794921875, 3.866943359375, 4.0859375, 4.304931640625, 4.52392578125, 4.742919921875, 4.9619140625, 5.180908203125, 5.39990234375, 5.618896484375, 5.837890625, 6.056884765625, 6.27587890625, 6.494873046875, 6.7138671875, 6.932861328125, 7.15185546875, 7.370849609375, 7.58984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 8.0, 12.0, 30.0, 36.0, 66.0, 84.0, 133.0, 143.0, 144.0, 115.0, 81.0, 45.0, 33.0, 18.0, 8.0, 8.0, 4.0, 8.0, 5.0, 3.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00038242340087890625, -0.0003714337944984436, -0.00036044418811798096, -0.0003494545817375183, -0.00033846497535705566, -0.000327475368976593, -0.00031648576259613037, -0.0003054961562156677, -0.0002945065498352051, -0.00028351694345474243, -0.0002725273370742798, -0.00026153773069381714, -0.0002505481243133545, -0.00023955851793289185, -0.0002285689115524292, -0.00021757930517196655, -0.0002065896987915039, -0.00019560009241104126, -0.0001846104860305786, -0.00017362087965011597, -0.00016263127326965332, -0.00015164166688919067, -0.00014065206050872803, -0.00012966245412826538, -0.00011867284774780273, -0.00010768324136734009, -9.669363498687744e-05, -8.57040286064148e-05, -7.471442222595215e-05, -6.37248158454895e-05, -5.2735209465026855e-05, -4.174560308456421e-05, -3.075599670410156e-05, -1.9766390323638916e-05, -8.77678394317627e-06, 2.212822437286377e-06, 1.3202428817749023e-05, 2.419203519821167e-05, 3.5181641578674316e-05, 4.617124795913696e-05, 5.716085433959961e-05, 6.815046072006226e-05, 7.91400671005249e-05, 9.012967348098755e-05, 0.0001011192798614502, 0.00011210888624191284, 0.0001230984926223755, 0.00013408809900283813, 0.00014507770538330078, 0.00015606731176376343, 0.00016705691814422607, 0.00017804652452468872, 0.00018903613090515137, 0.00020002573728561401, 0.00021101534366607666, 0.0002220049500465393, 0.00023299455642700195, 0.0002439841628074646, 0.00025497376918792725, 0.0002659633755683899, 0.00027695298194885254, 0.0002879425883293152, 0.00029893219470977783, 0.0003099218010902405, 0.0003209114074707031]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 7.0, 11.0, 12.0, 17.0, 25.0, 27.0, 57.0, 62.0, 71.0, 91.0, 125.0, 172.0, 254.0, 296.0, 455.0, 578.0, 823.0, 1220.0, 1777.0, 2920.0, 5120.0, 10005.0, 22778.0, 60303.0, 173628.0, 357006.0, 254039.0, 92204.0, 33169.0, 13951.0, 6552.0, 3624.0, 2149.0, 1463.0, 1001.0, 663.0, 508.0, 354.0, 263.0, 200.0, 148.0, 123.0, 81.0, 42.0, 40.0, 36.0, 29.0, 14.0, 12.0, 16.0, 8.0, 11.0, 9.0, 6.0, 3.0, 5.0], "bins": [-6.41796875, -6.2275390625, -6.037109375, -5.8466796875, -5.65625, -5.4658203125, -5.275390625, -5.0849609375, -4.89453125, -4.7041015625, -4.513671875, -4.3232421875, -4.1328125, -3.9423828125, -3.751953125, -3.5615234375, -3.37109375, -3.1806640625, -2.990234375, -2.7998046875, -2.609375, -2.4189453125, -2.228515625, -2.0380859375, -1.84765625, -1.6572265625, -1.466796875, -1.2763671875, -1.0859375, -0.8955078125, -0.705078125, -0.5146484375, -0.32421875, -0.1337890625, 0.056640625, 0.2470703125, 0.4375, 0.6279296875, 0.818359375, 1.0087890625, 1.19921875, 1.3896484375, 1.580078125, 1.7705078125, 1.9609375, 2.1513671875, 2.341796875, 2.5322265625, 2.72265625, 2.9130859375, 3.103515625, 3.2939453125, 3.484375, 3.6748046875, 3.865234375, 4.0556640625, 4.24609375, 4.4365234375, 4.626953125, 4.8173828125, 5.0078125, 5.1982421875, 5.388671875, 5.5791015625, 5.76953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 10.0, 6.0, 6.0, 14.0, 18.0, 20.0, 29.0, 35.0, 48.0, 67.0, 106.0, 101.0, 84.0, 99.0, 88.0, 62.0, 49.0, 31.0, 32.0, 23.0, 13.0, 19.0, 10.0, 8.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.09375, -2.02972412109375, -1.9656982421875, -1.90167236328125, -1.837646484375, -1.77362060546875, -1.7095947265625, -1.64556884765625, -1.58154296875, -1.51751708984375, -1.4534912109375, -1.38946533203125, -1.325439453125, -1.26141357421875, -1.1973876953125, -1.13336181640625, -1.0693359375, -1.00531005859375, -0.9412841796875, -0.87725830078125, -0.813232421875, -0.74920654296875, -0.6851806640625, -0.62115478515625, -0.55712890625, -0.49310302734375, -0.4290771484375, -0.36505126953125, -0.301025390625, -0.23699951171875, -0.1729736328125, -0.10894775390625, -0.044921875, 0.01910400390625, 0.0831298828125, 0.14715576171875, 0.211181640625, 0.27520751953125, 0.3392333984375, 0.40325927734375, 0.46728515625, 0.53131103515625, 0.5953369140625, 0.65936279296875, 0.723388671875, 0.78741455078125, 0.8514404296875, 0.91546630859375, 0.9794921875, 1.04351806640625, 1.1075439453125, 1.17156982421875, 1.235595703125, 1.29962158203125, 1.3636474609375, 1.42767333984375, 1.49169921875, 1.55572509765625, 1.6197509765625, 1.68377685546875, 1.747802734375, 1.81182861328125, 1.8758544921875, 1.93988037109375, 2.00390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 7.0, 4.0, 10.0, 7.0, 10.0, 7.0, 13.0, 16.0, 22.0, 24.0, 35.0, 46.0, 47.0, 67.0, 55.0, 60.0, 43.0, 74.0, 66.0, 59.0, 41.0, 45.0, 41.0, 33.0, 37.0, 31.0, 9.0, 19.0, 11.0, 15.0, 11.0, 12.0, 6.0, 8.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.309675693511963, -7.117921352386475, -6.9261674880981445, -6.734413146972656, -6.542658805847168, -6.350904941558838, -6.15915060043335, -5.9673967361450195, -5.775642395019531, -5.583888053894043, -5.392134189605713, -5.200379848480225, -5.008625507354736, -4.816871643066406, -4.625117301940918, -4.43336296081543, -4.241608619689941, -4.049854278564453, -3.858100175857544, -3.6663460731506348, -3.4745919704437256, -3.2828378677368164, -3.091083526611328, -2.899329423904419, -2.7075753211975098, -2.5158212184906006, -2.3240668773651123, -2.132312774658203, -1.940558671951294, -1.7488044500350952, -1.5570502281188965, -1.3652961254119873, -1.1735420227050781, -0.9817878603935242, -0.7900336980819702, -0.5982794761657715, -0.40652531385421753, -0.21477115154266357, -0.023016929626464844, 0.16873717308044434, 0.36049139499664307, 0.552245557308197, 0.743999719619751, 0.9357539415359497, 1.1275081634521484, 1.3192622661590576, 1.5110164880752563, 1.7027705907821655, 1.8945248126983643, 2.0862789154052734, 2.2780332565307617, 2.469787359237671, 2.66154146194458, 2.8532958030700684, 3.0450499057769775, 3.2368040084838867, 3.428558349609375, 3.620312452316284, 3.8120667934417725, 4.003820896148682, 4.19557523727417, 4.3873291015625, 4.579083442687988, 4.770837783813477, 4.962591648101807]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 4.0, 12.0, 8.0, 11.0, 6.0, 13.0, 16.0, 19.0, 14.0, 29.0, 26.0, 18.0, 36.0, 31.0, 39.0, 32.0, 32.0, 41.0, 39.0, 37.0, 42.0, 47.0, 39.0, 30.0, 33.0, 33.0, 38.0, 38.0, 28.0, 34.0, 16.0, 20.0, 29.0, 16.0, 14.0, 12.0, 15.0, 18.0, 10.0, 6.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.907649993896484, -4.7516303062438965, -4.59561014175415, -4.4395904541015625, -4.283570766448975, -4.127551078796387, -3.9715309143066406, -3.8155112266540527, -3.6594913005828857, -3.5034713745117188, -3.347451686859131, -3.191431760787964, -3.035411834716797, -2.879392147064209, -2.723372220993042, -2.567352294921875, -2.411332607269287, -2.25531268119812, -2.0992929935455322, -1.9432730674743652, -1.7872532606124878, -1.6312334537506104, -1.4752135276794434, -1.319193720817566, -1.1631739139556885, -1.007154107093811, -0.8511342406272888, -0.6951143741607666, -0.5390945672988892, -0.3830747604370117, -0.2270548939704895, -0.07103502750396729, 0.08498430252075195, 0.24100413918495178, 0.3970239758491516, 0.5530438423156738, 0.7090636491775513, 0.8650834560394287, 1.0211033821105957, 1.1771231889724731, 1.3331429958343506, 1.489162802696228, 1.6451826095581055, 1.8012025356292725, 1.95722234249115, 2.1132421493530273, 2.2692620754241943, 2.4252820014953613, 2.581301689147949, 2.737321615219116, 2.893341302871704, 3.049361228942871, 3.205380916595459, 3.361400842666626, 3.517420768737793, 3.673440456390381, 3.829460382461548, 3.985480308532715, 4.141499996185303, 4.297519683837891, 4.453539848327637, 4.609559535980225, 4.7655792236328125, 4.921599388122559, 5.0776190757751465]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 13.0, 11.0, 23.0, 23.0, 32.0, 43.0, 90.0, 111.0, 186.0, 283.0, 425.0, 638.0, 1078.0, 1703.0, 2788.0, 4415.0, 7541.0, 13002.0, 21900.0, 37066.0, 60427.0, 94279.0, 132968.0, 161204.0, 158184.0, 125989.0, 86595.0, 55176.0, 33499.0, 19691.0, 11662.0, 6830.0, 4031.0, 2451.0, 1495.0, 913.0, 621.0, 395.0, 259.0, 177.0, 116.0, 82.0, 48.0, 27.0, 19.0, 10.0, 14.0, 8.0, 6.0, 6.0, 4.0, 1.0, 4.0], "bins": [-5.75390625, -5.58905029296875, -5.4241943359375, -5.25933837890625, -5.094482421875, -4.92962646484375, -4.7647705078125, -4.59991455078125, -4.43505859375, -4.27020263671875, -4.1053466796875, -3.94049072265625, -3.775634765625, -3.61077880859375, -3.4459228515625, -3.28106689453125, -3.1162109375, -2.95135498046875, -2.7864990234375, -2.62164306640625, -2.456787109375, -2.29193115234375, -2.1270751953125, -1.96221923828125, -1.79736328125, -1.63250732421875, -1.4676513671875, -1.30279541015625, -1.137939453125, -0.97308349609375, -0.8082275390625, -0.64337158203125, -0.478515625, -0.31365966796875, -0.1488037109375, 0.01605224609375, 0.180908203125, 0.34576416015625, 0.5106201171875, 0.67547607421875, 0.84033203125, 1.00518798828125, 1.1700439453125, 1.33489990234375, 1.499755859375, 1.66461181640625, 1.8294677734375, 1.99432373046875, 2.1591796875, 2.32403564453125, 2.4888916015625, 2.65374755859375, 2.818603515625, 2.98345947265625, 3.1483154296875, 3.31317138671875, 3.47802734375, 3.64288330078125, 3.8077392578125, 3.97259521484375, 4.137451171875, 4.30230712890625, 4.4671630859375, 4.63201904296875, 4.796875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 3.0, 6.0, 7.0, 7.0, 9.0, 9.0, 18.0, 20.0, 16.0, 23.0, 21.0, 25.0, 36.0, 32.0, 33.0, 48.0, 44.0, 43.0, 37.0, 50.0, 31.0, 39.0, 54.0, 41.0, 32.0, 32.0, 43.0, 31.0, 25.0, 21.0, 24.0, 27.0, 18.0, 20.0, 17.0, 9.0, 11.0, 12.0, 11.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.35546875, -5.1947021484375, -5.033935546875, -4.8731689453125, -4.71240234375, -4.5516357421875, -4.390869140625, -4.2301025390625, -4.0693359375, -3.9085693359375, -3.747802734375, -3.5870361328125, -3.42626953125, -3.2655029296875, -3.104736328125, -2.9439697265625, -2.783203125, -2.6224365234375, -2.461669921875, -2.3009033203125, -2.14013671875, -1.9793701171875, -1.818603515625, -1.6578369140625, -1.4970703125, -1.3363037109375, -1.175537109375, -1.0147705078125, -0.85400390625, -0.6932373046875, -0.532470703125, -0.3717041015625, -0.2109375, -0.0501708984375, 0.110595703125, 0.2713623046875, 0.43212890625, 0.5928955078125, 0.753662109375, 0.9144287109375, 1.0751953125, 1.2359619140625, 1.396728515625, 1.5574951171875, 1.71826171875, 1.8790283203125, 2.039794921875, 2.2005615234375, 2.361328125, 2.5220947265625, 2.682861328125, 2.8436279296875, 3.00439453125, 3.1651611328125, 3.325927734375, 3.4866943359375, 3.6474609375, 3.8082275390625, 3.968994140625, 4.1297607421875, 4.29052734375, 4.4512939453125, 4.612060546875, 4.7728271484375, 4.93359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 6.0, 9.0, 14.0, 23.0, 37.0, 55.0, 65.0, 82.0, 153.0, 178.0, 270.0, 388.0, 555.0, 836.0, 1218.0, 1782.0, 2573.0, 3837.0, 5782.0, 8400.0, 12512.0, 18961.0, 27869.0, 40816.0, 58442.0, 80642.0, 103916.0, 120689.0, 125755.0, 114868.0, 92730.0, 70166.0, 49984.0, 33955.0, 23495.0, 15594.0, 10419.0, 6861.0, 4730.0, 3096.0, 2064.0, 1459.0, 992.0, 722.0, 512.0, 354.0, 199.0, 141.0, 129.0, 68.0, 51.0, 46.0, 16.0, 19.0, 14.0, 6.0, 7.0, 4.0, 1.0, 1.0], "bins": [-3.693359375, -3.578887939453125, -3.46441650390625, -3.349945068359375, -3.2354736328125, -3.121002197265625, -3.00653076171875, -2.892059326171875, -2.777587890625, -2.663116455078125, -2.54864501953125, -2.434173583984375, -2.3197021484375, -2.205230712890625, -2.09075927734375, -1.976287841796875, -1.86181640625, -1.747344970703125, -1.63287353515625, -1.518402099609375, -1.4039306640625, -1.289459228515625, -1.17498779296875, -1.060516357421875, -0.946044921875, -0.831573486328125, -0.71710205078125, -0.602630615234375, -0.4881591796875, -0.373687744140625, -0.25921630859375, -0.144744873046875, -0.0302734375, 0.084197998046875, 0.19866943359375, 0.313140869140625, 0.4276123046875, 0.542083740234375, 0.65655517578125, 0.771026611328125, 0.885498046875, 0.999969482421875, 1.11444091796875, 1.228912353515625, 1.3433837890625, 1.457855224609375, 1.57232666015625, 1.686798095703125, 1.80126953125, 1.915740966796875, 2.03021240234375, 2.144683837890625, 2.2591552734375, 2.373626708984375, 2.48809814453125, 2.602569580078125, 2.717041015625, 2.831512451171875, 2.94598388671875, 3.060455322265625, 3.1749267578125, 3.289398193359375, 3.40386962890625, 3.518341064453125, 3.6328125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 10.0, 5.0, 6.0, 7.0, 7.0, 8.0, 11.0, 12.0, 13.0, 15.0, 16.0, 29.0, 27.0, 34.0, 25.0, 40.0, 38.0, 39.0, 37.0, 42.0, 49.0, 33.0, 38.0, 43.0, 52.0, 42.0, 34.0, 37.0, 37.0, 35.0, 28.0, 15.0, 19.0, 21.0, 18.0, 18.0, 14.0, 11.0, 13.0, 5.0, 7.0, 5.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.697265625, -3.59332275390625, -3.4893798828125, -3.38543701171875, -3.281494140625, -3.17755126953125, -3.0736083984375, -2.96966552734375, -2.86572265625, -2.76177978515625, -2.6578369140625, -2.55389404296875, -2.449951171875, -2.34600830078125, -2.2420654296875, -2.13812255859375, -2.0341796875, -1.93023681640625, -1.8262939453125, -1.72235107421875, -1.618408203125, -1.51446533203125, -1.4105224609375, -1.30657958984375, -1.20263671875, -1.09869384765625, -0.9947509765625, -0.89080810546875, -0.786865234375, -0.68292236328125, -0.5789794921875, -0.47503662109375, -0.37109375, -0.26715087890625, -0.1632080078125, -0.05926513671875, 0.044677734375, 0.14862060546875, 0.2525634765625, 0.35650634765625, 0.46044921875, 0.56439208984375, 0.6683349609375, 0.77227783203125, 0.876220703125, 0.98016357421875, 1.0841064453125, 1.18804931640625, 1.2919921875, 1.39593505859375, 1.4998779296875, 1.60382080078125, 1.707763671875, 1.81170654296875, 1.9156494140625, 2.01959228515625, 2.12353515625, 2.22747802734375, 2.3314208984375, 2.43536376953125, 2.539306640625, 2.64324951171875, 2.7471923828125, 2.85113525390625, 2.955078125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 8.0, 12.0, 37.0, 50.0, 71.0, 123.0, 151.0, 234.0, 320.0, 486.0, 697.0, 1163.0, 1821.0, 2751.0, 4489.0, 7241.0, 11849.0, 20184.0, 34572.0, 61900.0, 109759.0, 179463.0, 213810.0, 165439.0, 99018.0, 55345.0, 30980.0, 17984.0, 10769.0, 6430.0, 4005.0, 2515.0, 1652.0, 1092.0, 690.0, 456.0, 330.0, 210.0, 157.0, 90.0, 66.0, 44.0, 24.0, 17.0, 9.0, 11.0, 7.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.97119140625, -3.8447265625, -3.71826171875, -3.591796875, -3.46533203125, -3.3388671875, -3.21240234375, -3.0859375, -2.95947265625, -2.8330078125, -2.70654296875, -2.580078125, -2.45361328125, -2.3271484375, -2.20068359375, -2.07421875, -1.94775390625, -1.8212890625, -1.69482421875, -1.568359375, -1.44189453125, -1.3154296875, -1.18896484375, -1.0625, -0.93603515625, -0.8095703125, -0.68310546875, -0.556640625, -0.43017578125, -0.3037109375, -0.17724609375, -0.05078125, 0.07568359375, 0.2021484375, 0.32861328125, 0.455078125, 0.58154296875, 0.7080078125, 0.83447265625, 0.9609375, 1.08740234375, 1.2138671875, 1.34033203125, 1.466796875, 1.59326171875, 1.7197265625, 1.84619140625, 1.97265625, 2.09912109375, 2.2255859375, 2.35205078125, 2.478515625, 2.60498046875, 2.7314453125, 2.85791015625, 2.984375, 3.11083984375, 3.2373046875, 3.36376953125, 3.490234375, 3.61669921875, 3.7431640625, 3.86962890625, 3.99609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 6.0, 4.0, 4.0, 11.0, 11.0, 11.0, 28.0, 17.0, 34.0, 35.0, 55.0, 73.0, 80.0, 105.0, 75.0, 89.0, 67.0, 62.0, 46.0, 40.0, 27.0, 26.0, 23.0, 13.0, 19.0, 4.0, 4.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00039005279541015625, -0.00037520378828048706, -0.00036035478115081787, -0.0003455057740211487, -0.0003306567668914795, -0.0003158077597618103, -0.0003009587526321411, -0.0002861097455024719, -0.00027126073837280273, -0.00025641173124313354, -0.00024156272411346436, -0.00022671371698379517, -0.00021186470985412598, -0.0001970157027244568, -0.0001821666955947876, -0.0001673176884651184, -0.00015246868133544922, -0.00013761967420578003, -0.00012277066707611084, -0.00010792165994644165, -9.307265281677246e-05, -7.822364568710327e-05, -6.337463855743408e-05, -4.852563142776489e-05, -3.36766242980957e-05, -1.8827617168426514e-05, -3.978610038757324e-06, 1.0870397090911865e-05, 2.5719404220581055e-05, 4.0568411350250244e-05, 5.5417418479919434e-05, 7.026642560958862e-05, 8.511543273925781e-05, 9.9964439868927e-05, 0.00011481344699859619, 0.00012966245412826538, 0.00014451146125793457, 0.00015936046838760376, 0.00017420947551727295, 0.00018905848264694214, 0.00020390748977661133, 0.00021875649690628052, 0.0002336055040359497, 0.0002484545111656189, 0.0002633035182952881, 0.0002781525254249573, 0.00029300153255462646, 0.00030785053968429565, 0.00032269954681396484, 0.00033754855394363403, 0.0003523975610733032, 0.0003672465682029724, 0.0003820955753326416, 0.0003969445824623108, 0.00041179358959198, 0.00042664259672164917, 0.00044149160385131836, 0.00045634061098098755, 0.00047118961811065674, 0.00048603862524032593, 0.0005008876323699951, 0.0005157366394996643, 0.0005305856466293335, 0.0005454346537590027, 0.0005602836608886719]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 19.0, 23.0, 42.0, 52.0, 82.0, 117.0, 167.0, 263.0, 352.0, 594.0, 911.0, 1426.0, 2273.0, 3635.0, 5787.0, 8955.0, 14684.0, 24146.0, 39582.0, 65700.0, 107961.0, 159829.0, 186678.0, 156314.0, 104656.0, 64195.0, 38633.0, 23205.0, 14286.0, 8865.0, 5523.0, 3395.0, 2182.0, 1340.0, 881.0, 595.0, 391.0, 261.0, 164.0, 119.0, 75.0, 55.0, 43.0, 22.0, 24.0, 17.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-3.244140625, -3.14422607421875, -3.0443115234375, -2.94439697265625, -2.844482421875, -2.74456787109375, -2.6446533203125, -2.54473876953125, -2.44482421875, -2.34490966796875, -2.2449951171875, -2.14508056640625, -2.045166015625, -1.94525146484375, -1.8453369140625, -1.74542236328125, -1.6455078125, -1.54559326171875, -1.4456787109375, -1.34576416015625, -1.245849609375, -1.14593505859375, -1.0460205078125, -0.94610595703125, -0.84619140625, -0.74627685546875, -0.6463623046875, -0.54644775390625, -0.446533203125, -0.34661865234375, -0.2467041015625, -0.14678955078125, -0.046875, 0.05303955078125, 0.1529541015625, 0.25286865234375, 0.352783203125, 0.45269775390625, 0.5526123046875, 0.65252685546875, 0.75244140625, 0.85235595703125, 0.9522705078125, 1.05218505859375, 1.152099609375, 1.25201416015625, 1.3519287109375, 1.45184326171875, 1.5517578125, 1.65167236328125, 1.7515869140625, 1.85150146484375, 1.951416015625, 2.05133056640625, 2.1512451171875, 2.25115966796875, 2.35107421875, 2.45098876953125, 2.5509033203125, 2.65081787109375, 2.750732421875, 2.85064697265625, 2.9505615234375, 3.05047607421875, 3.150390625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 7.0, 10.0, 11.0, 9.0, 10.0, 13.0, 24.0, 25.0, 25.0, 20.0, 46.0, 42.0, 53.0, 52.0, 71.0, 63.0, 64.0, 53.0, 80.0, 57.0, 47.0, 41.0, 37.0, 34.0, 21.0, 18.0, 18.0, 14.0, 7.0, 9.0, 6.0, 1.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.462890625, -1.42022705078125, -1.3775634765625, -1.33489990234375, -1.292236328125, -1.24957275390625, -1.2069091796875, -1.16424560546875, -1.12158203125, -1.07891845703125, -1.0362548828125, -0.99359130859375, -0.950927734375, -0.90826416015625, -0.8656005859375, -0.82293701171875, -0.7802734375, -0.73760986328125, -0.6949462890625, -0.65228271484375, -0.609619140625, -0.56695556640625, -0.5242919921875, -0.48162841796875, -0.43896484375, -0.39630126953125, -0.3536376953125, -0.31097412109375, -0.268310546875, -0.22564697265625, -0.1829833984375, -0.14031982421875, -0.09765625, -0.05499267578125, -0.0123291015625, 0.03033447265625, 0.072998046875, 0.11566162109375, 0.1583251953125, 0.20098876953125, 0.24365234375, 0.28631591796875, 0.3289794921875, 0.37164306640625, 0.414306640625, 0.45697021484375, 0.4996337890625, 0.54229736328125, 0.5849609375, 0.62762451171875, 0.6702880859375, 0.71295166015625, 0.755615234375, 0.79827880859375, 0.8409423828125, 0.88360595703125, 0.92626953125, 0.96893310546875, 1.0115966796875, 1.05426025390625, 1.096923828125, 1.13958740234375, 1.1822509765625, 1.22491455078125, 1.267578125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 5.0, 3.0, 6.0, 15.0, 9.0, 16.0, 16.0, 26.0, 24.0, 34.0, 37.0, 51.0, 50.0, 58.0, 50.0, 52.0, 46.0, 35.0, 43.0, 46.0, 44.0, 50.0, 45.0, 46.0, 31.0, 28.0, 20.0, 21.0, 10.0, 17.0, 12.0, 8.0, 7.0, 13.0, 7.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.845086097717285, -5.682246685028076, -5.519407749176025, -5.356568336486816, -5.193729400634766, -5.030889987945557, -4.868050575256348, -4.705211639404297, -4.542372226715088, -4.379532814025879, -4.216693878173828, -4.053854465484619, -3.8910152912139893, -3.7281761169433594, -3.5653367042541504, -3.4024975299835205, -3.2396583557128906, -3.0768191814422607, -2.913980007171631, -2.751140594482422, -2.588301420211792, -2.425462245941162, -2.262622833251953, -2.0997836589813232, -1.9369444847106934, -1.7741053104400635, -1.611266016960144, -1.4484267234802246, -1.2855875492095947, -1.1227483749389648, -0.9599090814590454, -0.797069787979126, -0.6342306137084961, -0.47139137983322144, -0.3085521459579468, -0.14571291208267212, 0.01712632179260254, 0.1799655556678772, 0.34280478954315186, 0.5056440830230713, 0.6684832572937012, 0.8313224911689758, 0.9941617250442505, 1.15700101852417, 1.3198401927947998, 1.4826793670654297, 1.6455186605453491, 1.8083579540252686, 1.9711971282958984, 2.1340363025665283, 2.296875476837158, 2.459714889526367, 2.622554063796997, 2.785393238067627, 2.948232650756836, 3.111071825027466, 3.2739109992980957, 3.4367501735687256, 3.5995893478393555, 3.7624287605285645, 3.9252679347991943, 4.088107109069824, 4.250946521759033, 4.413785934448242, 4.576624870300293]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 13.0, 6.0, 8.0, 9.0, 13.0, 13.0, 22.0, 12.0, 30.0, 28.0, 24.0, 24.0, 25.0, 40.0, 40.0, 32.0, 37.0, 46.0, 32.0, 34.0, 43.0, 28.0, 33.0, 34.0, 43.0, 42.0, 38.0, 35.0, 30.0, 30.0, 16.0, 11.0, 19.0, 15.0, 10.0, 8.0, 13.0, 14.0, 6.0, 12.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-5.317191123962402, -5.1636576652526855, -5.010124683380127, -4.85659122467041, -4.703058242797852, -4.549524784088135, -4.395991325378418, -4.242458343505859, -4.088924884796143, -3.935391664505005, -3.781858444213867, -3.6283249855041504, -3.4747917652130127, -3.321258544921875, -3.167725086212158, -3.0141918659210205, -2.860658645629883, -2.707125425338745, -2.5535922050476074, -2.4000587463378906, -2.246525526046753, -2.0929923057556152, -1.939458966255188, -1.7859256267547607, -1.632392406463623, -1.4788591861724854, -1.325325846672058, -1.1717925071716309, -1.0182592868804932, -0.8647260069847107, -0.7111927270889282, -0.557659387588501, -0.4041266441345215, -0.250593364238739, -0.09706008434295654, 0.05647319555282593, 0.2100064754486084, 0.36353975534439087, 0.5170730352401733, 0.6706063747406006, 0.8241395950317383, 0.9776728749275208, 1.1312061548233032, 1.2847394943237305, 1.4382727146148682, 1.5918059349060059, 1.745339274406433, 1.8988726139068604, 2.052405834197998, 2.2059390544891357, 2.3594722747802734, 2.5130057334899902, 2.666538953781128, 2.8200721740722656, 2.9736056327819824, 3.12713885307312, 3.280672073364258, 3.4342052936553955, 3.587738513946533, 3.74127197265625, 3.8948051929473877, 4.048338413238525, 4.201871871948242, 4.355404853820801, 4.508938312530518]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 10.0, 21.0, 32.0, 46.0, 61.0, 102.0, 130.0, 190.0, 292.0, 362.0, 549.0, 839.0, 1193.0, 1938.0, 2849.0, 4697.0, 7508.0, 12850.0, 22810.0, 44607.0, 98314.0, 248779.0, 661319.0, 1224296.0, 1060044.0, 475717.0, 174715.0, 71420.0, 33937.0, 17832.0, 10075.0, 5932.0, 3681.0, 2322.0, 1553.0, 978.0, 709.0, 516.0, 336.0, 187.0, 148.0, 109.0, 69.0, 59.0, 41.0, 34.0, 21.0, 21.0, 6.0, 8.0, 5.0, 3.0, 1.0, 4.0, 1.0], "bins": [-6.1015625, -5.9156494140625, -5.729736328125, -5.5438232421875, -5.35791015625, -5.1719970703125, -4.986083984375, -4.8001708984375, -4.6142578125, -4.4283447265625, -4.242431640625, -4.0565185546875, -3.87060546875, -3.6846923828125, -3.498779296875, -3.3128662109375, -3.126953125, -2.9410400390625, -2.755126953125, -2.5692138671875, -2.38330078125, -2.1973876953125, -2.011474609375, -1.8255615234375, -1.6396484375, -1.4537353515625, -1.267822265625, -1.0819091796875, -0.89599609375, -0.7100830078125, -0.524169921875, -0.3382568359375, -0.15234375, 0.0335693359375, 0.219482421875, 0.4053955078125, 0.59130859375, 0.7772216796875, 0.963134765625, 1.1490478515625, 1.3349609375, 1.5208740234375, 1.706787109375, 1.8927001953125, 2.07861328125, 2.2645263671875, 2.450439453125, 2.6363525390625, 2.822265625, 3.0081787109375, 3.194091796875, 3.3800048828125, 3.56591796875, 3.7518310546875, 3.937744140625, 4.1236572265625, 4.3095703125, 4.4954833984375, 4.681396484375, 4.8673095703125, 5.05322265625, 5.2391357421875, 5.425048828125, 5.6109619140625, 5.796875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 8.0, 6.0, 5.0, 8.0, 5.0, 9.0, 14.0, 15.0, 14.0, 22.0, 19.0, 17.0, 21.0, 20.0, 30.0, 26.0, 21.0, 25.0, 31.0, 39.0, 36.0, 42.0, 31.0, 38.0, 44.0, 30.0, 40.0, 33.0, 32.0, 42.0, 26.0, 30.0, 35.0, 24.0, 18.0, 25.0, 15.0, 15.0, 10.0, 14.0, 11.0, 11.0, 13.0, 5.0, 5.0, 3.0, 11.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.3828125, -3.28515625, -3.1875, -3.08984375, -2.9921875, -2.89453125, -2.796875, -2.69921875, -2.6015625, -2.50390625, -2.40625, -2.30859375, -2.2109375, -2.11328125, -2.015625, -1.91796875, -1.8203125, -1.72265625, -1.625, -1.52734375, -1.4296875, -1.33203125, -1.234375, -1.13671875, -1.0390625, -0.94140625, -0.84375, -0.74609375, -0.6484375, -0.55078125, -0.453125, -0.35546875, -0.2578125, -0.16015625, -0.0625, 0.03515625, 0.1328125, 0.23046875, 0.328125, 0.42578125, 0.5234375, 0.62109375, 0.71875, 0.81640625, 0.9140625, 1.01171875, 1.109375, 1.20703125, 1.3046875, 1.40234375, 1.5, 1.59765625, 1.6953125, 1.79296875, 1.890625, 1.98828125, 2.0859375, 2.18359375, 2.28125, 2.37890625, 2.4765625, 2.57421875, 2.671875, 2.76953125, 2.8671875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 13.0, 8.0, 11.0, 17.0, 37.0, 52.0, 91.0, 128.0, 152.0, 280.0, 452.0, 670.0, 996.0, 1579.0, 2375.0, 3878.0, 5916.0, 9999.0, 16920.0, 29802.0, 54793.0, 106323.0, 223903.0, 484979.0, 939667.0, 1073796.0, 639561.0, 298271.0, 140123.0, 69613.0, 37281.0, 20764.0, 12131.0, 7260.0, 4489.0, 2856.0, 1751.0, 1151.0, 715.0, 494.0, 338.0, 243.0, 141.0, 88.0, 66.0, 29.0, 36.0, 13.0, 17.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.23828125, -5.0703125, -4.90234375, -4.734375, -4.56640625, -4.3984375, -4.23046875, -4.0625, -3.89453125, -3.7265625, -3.55859375, -3.390625, -3.22265625, -3.0546875, -2.88671875, -2.71875, -2.55078125, -2.3828125, -2.21484375, -2.046875, -1.87890625, -1.7109375, -1.54296875, -1.375, -1.20703125, -1.0390625, -0.87109375, -0.703125, -0.53515625, -0.3671875, -0.19921875, -0.03125, 0.13671875, 0.3046875, 0.47265625, 0.640625, 0.80859375, 0.9765625, 1.14453125, 1.3125, 1.48046875, 1.6484375, 1.81640625, 1.984375, 2.15234375, 2.3203125, 2.48828125, 2.65625, 2.82421875, 2.9921875, 3.16015625, 3.328125, 3.49609375, 3.6640625, 3.83203125, 4.0, 4.16796875, 4.3359375, 4.50390625, 4.671875, 4.83984375, 5.0078125, 5.17578125, 5.34375, 5.51171875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 7.0, 5.0, 4.0, 6.0, 9.0, 12.0, 4.0, 21.0, 13.0, 21.0, 27.0, 42.0, 41.0, 59.0, 44.0, 90.0, 109.0, 105.0, 188.0, 189.0, 224.0, 254.0, 269.0, 281.0, 293.0, 268.0, 254.0, 216.0, 209.0, 153.0, 127.0, 124.0, 79.0, 68.0, 54.0, 43.0, 41.0, 33.0, 11.0, 19.0, 8.0, 10.0, 7.0, 7.0, 6.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0], "bins": [-2.0078125, -1.953155517578125, -1.89849853515625, -1.843841552734375, -1.7891845703125, -1.734527587890625, -1.67987060546875, -1.625213623046875, -1.570556640625, -1.515899658203125, -1.46124267578125, -1.406585693359375, -1.3519287109375, -1.297271728515625, -1.24261474609375, -1.187957763671875, -1.13330078125, -1.078643798828125, -1.02398681640625, -0.969329833984375, -0.9146728515625, -0.860015869140625, -0.80535888671875, -0.750701904296875, -0.696044921875, -0.641387939453125, -0.58673095703125, -0.532073974609375, -0.4774169921875, -0.422760009765625, -0.36810302734375, -0.313446044921875, -0.2587890625, -0.204132080078125, -0.14947509765625, -0.094818115234375, -0.0401611328125, 0.014495849609375, 0.06915283203125, 0.123809814453125, 0.178466796875, 0.233123779296875, 0.28778076171875, 0.342437744140625, 0.3970947265625, 0.451751708984375, 0.50640869140625, 0.561065673828125, 0.61572265625, 0.670379638671875, 0.72503662109375, 0.779693603515625, 0.8343505859375, 0.889007568359375, 0.94366455078125, 0.998321533203125, 1.052978515625, 1.107635498046875, 1.16229248046875, 1.216949462890625, 1.2716064453125, 1.326263427734375, 1.38092041015625, 1.435577392578125, 1.490234375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 10.0, 10.0, 13.0, 15.0, 18.0, 24.0, 41.0, 38.0, 45.0, 46.0, 54.0, 56.0, 55.0, 66.0, 59.0, 62.0, 57.0, 59.0, 51.0, 43.0, 26.0, 27.0, 18.0, 23.0, 13.0, 15.0, 9.0, 2.0, 10.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.952475547790527, -5.785172939300537, -5.617870330810547, -5.450567722320557, -5.283265113830566, -5.115962505340576, -4.948659896850586, -4.7813568115234375, -4.6140546798706055, -4.446752071380615, -4.279449462890625, -4.112146854400635, -3.9448442459106445, -3.7775416374206543, -3.610238790512085, -3.4429361820220947, -3.2756333351135254, -3.108330726623535, -2.941028118133545, -2.7737255096435547, -2.6064229011535645, -2.439120292663574, -2.271817445755005, -2.1045148372650146, -1.9372122287750244, -1.7699096202850342, -1.602607011795044, -1.4353042840957642, -1.268001675605774, -1.1006990671157837, -0.9333963394165039, -0.7660937309265137, -0.5987906455993652, -0.4314880073070526, -0.26418536901474, -0.09688270092010498, 0.07041990756988525, 0.2377225160598755, 0.4050252437591553, 0.5723278522491455, 0.7396304607391357, 0.906933069229126, 1.0742356777191162, 1.241538405418396, 1.4088410139083862, 1.5761436223983765, 1.7434463500976562, 1.9107489585876465, 2.0780515670776367, 2.245354175567627, 2.412656784057617, 2.5799593925476074, 2.7472620010375977, 2.914564609527588, 3.0818674564361572, 3.2491700649261475, 3.4164726734161377, 3.583775281906128, 3.751077890396118, 3.9183807373046875, 4.085683345794678, 4.252985954284668, 4.420288562774658, 4.587591171264648, 4.754893779754639]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 4.0, 3.0, 7.0, 8.0, 13.0, 5.0, 15.0, 11.0, 10.0, 19.0, 17.0, 18.0, 30.0, 29.0, 31.0, 28.0, 27.0, 36.0, 28.0, 30.0, 39.0, 32.0, 46.0, 51.0, 40.0, 42.0, 30.0, 42.0, 31.0, 27.0, 30.0, 28.0, 28.0, 26.0, 22.0, 22.0, 14.0, 17.0, 16.0, 12.0, 10.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.948421001434326, -3.8211495876312256, -3.693877935409546, -3.5666065216064453, -3.4393348693847656, -3.312063455581665, -3.1847920417785645, -3.0575203895568848, -2.930248975753784, -2.8029775619506836, -2.675705909729004, -2.5484344959259033, -2.4211630821228027, -2.293891429901123, -2.1666200160980225, -2.039348602294922, -1.9120769500732422, -1.784805417060852, -1.657533884048462, -1.5302624702453613, -1.4029909372329712, -1.275719404220581, -1.1484479904174805, -1.0211764574050903, -0.8939049243927002, -0.7666333913803101, -0.6393619179725647, -0.5120904445648193, -0.3848189115524292, -0.25754737854003906, -0.1302759051322937, -0.00300443172454834, 0.1242666244506836, 0.25153812766075134, 0.3788096308708191, 0.5060811042785645, 0.6333526372909546, 0.7606241703033447, 0.8878956437110901, 1.0151671171188354, 1.1424386501312256, 1.2697101831436157, 1.3969817161560059, 1.5242531299591064, 1.6515246629714966, 1.7787961959838867, 1.9060676097869873, 2.033339023590088, 2.1606106758117676, 2.287882089614868, 2.415153741836548, 2.5424251556396484, 2.669696807861328, 2.7969682216644287, 2.9242396354675293, 3.051511287689209, 3.1787827014923096, 3.30605411529541, 3.43332576751709, 3.5605971813201904, 3.687868595123291, 3.8151402473449707, 3.9424116611480713, 4.069683074951172, 4.196954727172852]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 10.0, 12.0, 15.0, 32.0, 27.0, 63.0, 90.0, 118.0, 166.0, 286.0, 365.0, 589.0, 868.0, 1452.0, 2372.0, 3821.0, 6537.0, 12089.0, 24174.0, 50486.0, 108656.0, 209432.0, 265815.0, 183471.0, 90107.0, 41939.0, 20288.0, 10340.0, 5825.0, 3344.0, 1987.0, 1325.0, 799.0, 561.0, 331.0, 240.0, 177.0, 105.0, 82.0, 46.0, 36.0, 28.0, 10.0, 9.0, 11.0, 1.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-6.15625, -5.9771728515625, -5.798095703125, -5.6190185546875, -5.43994140625, -5.2608642578125, -5.081787109375, -4.9027099609375, -4.7236328125, -4.5445556640625, -4.365478515625, -4.1864013671875, -4.00732421875, -3.8282470703125, -3.649169921875, -3.4700927734375, -3.291015625, -3.1119384765625, -2.932861328125, -2.7537841796875, -2.57470703125, -2.3956298828125, -2.216552734375, -2.0374755859375, -1.8583984375, -1.6793212890625, -1.500244140625, -1.3211669921875, -1.14208984375, -0.9630126953125, -0.783935546875, -0.6048583984375, -0.42578125, -0.2467041015625, -0.067626953125, 0.1114501953125, 0.29052734375, 0.4696044921875, 0.648681640625, 0.8277587890625, 1.0068359375, 1.1859130859375, 1.364990234375, 1.5440673828125, 1.72314453125, 1.9022216796875, 2.081298828125, 2.2603759765625, 2.439453125, 2.6185302734375, 2.797607421875, 2.9766845703125, 3.15576171875, 3.3348388671875, 3.513916015625, 3.6929931640625, 3.8720703125, 4.0511474609375, 4.230224609375, 4.4093017578125, 4.58837890625, 4.7674560546875, 4.946533203125, 5.1256103515625, 5.3046875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 3.0, 8.0, 11.0, 10.0, 6.0, 20.0, 12.0, 17.0, 15.0, 29.0, 32.0, 26.0, 36.0, 25.0, 29.0, 42.0, 28.0, 40.0, 44.0, 41.0, 53.0, 46.0, 32.0, 34.0, 41.0, 41.0, 27.0, 34.0, 31.0, 21.0, 31.0, 20.0, 22.0, 17.0, 15.0, 15.0, 13.0, 11.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.966796875, -3.831207275390625, -3.69561767578125, -3.560028076171875, -3.4244384765625, -3.288848876953125, -3.15325927734375, -3.017669677734375, -2.882080078125, -2.746490478515625, -2.61090087890625, -2.475311279296875, -2.3397216796875, -2.204132080078125, -2.06854248046875, -1.932952880859375, -1.79736328125, -1.661773681640625, -1.52618408203125, -1.390594482421875, -1.2550048828125, -1.119415283203125, -0.98382568359375, -0.848236083984375, -0.712646484375, -0.577056884765625, -0.44146728515625, -0.305877685546875, -0.1702880859375, -0.034698486328125, 0.10089111328125, 0.236480712890625, 0.3720703125, 0.507659912109375, 0.64324951171875, 0.778839111328125, 0.9144287109375, 1.050018310546875, 1.18560791015625, 1.321197509765625, 1.456787109375, 1.592376708984375, 1.72796630859375, 1.863555908203125, 1.9991455078125, 2.134735107421875, 2.27032470703125, 2.405914306640625, 2.54150390625, 2.677093505859375, 2.81268310546875, 2.948272705078125, 3.0838623046875, 3.219451904296875, 3.35504150390625, 3.490631103515625, 3.626220703125, 3.761810302734375, 3.89739990234375, 4.032989501953125, 4.1685791015625, 4.304168701171875, 4.43975830078125, 4.575347900390625, 4.7109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 4.0, 8.0, 12.0, 25.0, 26.0, 34.0, 44.0, 70.0, 96.0, 118.0, 179.0, 252.0, 371.0, 540.0, 776.0, 1207.0, 2053.0, 3224.0, 5742.0, 10360.0, 21078.0, 46316.0, 110154.0, 255129.0, 313334.0, 153961.0, 63849.0, 28137.0, 13560.0, 7219.0, 3934.0, 2266.0, 1504.0, 948.0, 566.0, 433.0, 299.0, 197.0, 147.0, 104.0, 71.0, 61.0, 34.0, 25.0, 24.0, 14.0, 20.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-7.37109375, -7.14208984375, -6.9130859375, -6.68408203125, -6.455078125, -6.22607421875, -5.9970703125, -5.76806640625, -5.5390625, -5.31005859375, -5.0810546875, -4.85205078125, -4.623046875, -4.39404296875, -4.1650390625, -3.93603515625, -3.70703125, -3.47802734375, -3.2490234375, -3.02001953125, -2.791015625, -2.56201171875, -2.3330078125, -2.10400390625, -1.875, -1.64599609375, -1.4169921875, -1.18798828125, -0.958984375, -0.72998046875, -0.5009765625, -0.27197265625, -0.04296875, 0.18603515625, 0.4150390625, 0.64404296875, 0.873046875, 1.10205078125, 1.3310546875, 1.56005859375, 1.7890625, 2.01806640625, 2.2470703125, 2.47607421875, 2.705078125, 2.93408203125, 3.1630859375, 3.39208984375, 3.62109375, 3.85009765625, 4.0791015625, 4.30810546875, 4.537109375, 4.76611328125, 4.9951171875, 5.22412109375, 5.453125, 5.68212890625, 5.9111328125, 6.14013671875, 6.369140625, 6.59814453125, 6.8271484375, 7.05615234375, 7.28515625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 8.0, 5.0, 2.0, 7.0, 11.0, 8.0, 9.0, 14.0, 30.0, 17.0, 37.0, 22.0, 35.0, 23.0, 27.0, 31.0, 39.0, 55.0, 41.0, 38.0, 41.0, 33.0, 39.0, 50.0, 38.0, 28.0, 24.0, 29.0, 30.0, 28.0, 32.0, 30.0, 18.0, 19.0, 18.0, 15.0, 8.0, 8.0, 13.0, 8.0, 4.0, 10.0, 0.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.46484375, -2.3814697265625, -2.298095703125, -2.2147216796875, -2.13134765625, -2.0479736328125, -1.964599609375, -1.8812255859375, -1.7978515625, -1.7144775390625, -1.631103515625, -1.5477294921875, -1.46435546875, -1.3809814453125, -1.297607421875, -1.2142333984375, -1.130859375, -1.0474853515625, -0.964111328125, -0.8807373046875, -0.79736328125, -0.7139892578125, -0.630615234375, -0.5472412109375, -0.4638671875, -0.3804931640625, -0.297119140625, -0.2137451171875, -0.13037109375, -0.0469970703125, 0.036376953125, 0.1197509765625, 0.203125, 0.2864990234375, 0.369873046875, 0.4532470703125, 0.53662109375, 0.6199951171875, 0.703369140625, 0.7867431640625, 0.8701171875, 0.9534912109375, 1.036865234375, 1.1202392578125, 1.20361328125, 1.2869873046875, 1.370361328125, 1.4537353515625, 1.537109375, 1.6204833984375, 1.703857421875, 1.7872314453125, 1.87060546875, 1.9539794921875, 2.037353515625, 2.1207275390625, 2.2041015625, 2.2874755859375, 2.370849609375, 2.4542236328125, 2.53759765625, 2.6209716796875, 2.704345703125, 2.7877197265625, 2.87109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 13.0, 17.0, 31.0, 35.0, 61.0, 91.0, 132.0, 164.0, 249.0, 402.0, 628.0, 1006.0, 1589.0, 2682.0, 5151.0, 11132.0, 28039.0, 85471.0, 296643.0, 407409.0, 135441.0, 41170.0, 15580.0, 6714.0, 3483.0, 1889.0, 1128.0, 696.0, 483.0, 321.0, 226.0, 156.0, 107.0, 64.0, 44.0, 29.0, 22.0, 14.0, 11.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.69921875, -4.54852294921875, -4.3978271484375, -4.24713134765625, -4.096435546875, -3.94573974609375, -3.7950439453125, -3.64434814453125, -3.49365234375, -3.34295654296875, -3.1922607421875, -3.04156494140625, -2.890869140625, -2.74017333984375, -2.5894775390625, -2.43878173828125, -2.2880859375, -2.13739013671875, -1.9866943359375, -1.83599853515625, -1.685302734375, -1.53460693359375, -1.3839111328125, -1.23321533203125, -1.08251953125, -0.93182373046875, -0.7811279296875, -0.63043212890625, -0.479736328125, -0.32904052734375, -0.1783447265625, -0.02764892578125, 0.123046875, 0.27374267578125, 0.4244384765625, 0.57513427734375, 0.725830078125, 0.87652587890625, 1.0272216796875, 1.17791748046875, 1.32861328125, 1.47930908203125, 1.6300048828125, 1.78070068359375, 1.931396484375, 2.08209228515625, 2.2327880859375, 2.38348388671875, 2.5341796875, 2.68487548828125, 2.8355712890625, 2.98626708984375, 3.136962890625, 3.28765869140625, 3.4383544921875, 3.58905029296875, 3.73974609375, 3.89044189453125, 4.0411376953125, 4.19183349609375, 4.342529296875, 4.49322509765625, 4.6439208984375, 4.79461669921875, 4.9453125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 33.0, 77.0, 166.0, 261.0, 239.0, 110.0, 53.0, 13.0, 7.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00038886070251464844, -0.000376235693693161, -0.0003636106848716736, -0.00035098567605018616, -0.00033836066722869873, -0.0003257356584072113, -0.0003131106495857239, -0.00030048564076423645, -0.000287860631942749, -0.0002752356231212616, -0.00026261061429977417, -0.00024998560547828674, -0.00023736059665679932, -0.0002247355878353119, -0.00021211057901382446, -0.00019948557019233704, -0.0001868605613708496, -0.00017423555254936218, -0.00016161054372787476, -0.00014898553490638733, -0.0001363605260848999, -0.00012373551726341248, -0.00011111050844192505, -9.848549962043762e-05, -8.58604907989502e-05, -7.323548197746277e-05, -6.061047315597534e-05, -4.7985464334487915e-05, -3.536045551300049e-05, -2.273544669151306e-05, -1.0110437870025635e-05, 2.514570951461792e-06, 1.5139579772949219e-05, 2.7764588594436646e-05, 4.038959741592407e-05, 5.30146062374115e-05, 6.563961505889893e-05, 7.826462388038635e-05, 9.088963270187378e-05, 0.0001035146415233612, 0.00011613965034484863, 0.00012876465916633606, 0.00014138966798782349, 0.0001540146768093109, 0.00016663968563079834, 0.00017926469445228577, 0.0001918897032737732, 0.00020451471209526062, 0.00021713972091674805, 0.00022976472973823547, 0.0002423897385597229, 0.00025501474738121033, 0.00026763975620269775, 0.0002802647650241852, 0.0002928897738456726, 0.00030551478266716003, 0.00031813979148864746, 0.0003307648003101349, 0.0003433898091316223, 0.00035601481795310974, 0.00036863982677459717, 0.0003812648355960846, 0.000393889844417572, 0.00040651485323905945, 0.0004191398620605469]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 13.0, 20.0, 19.0, 45.0, 65.0, 74.0, 111.0, 179.0, 278.0, 418.0, 624.0, 916.0, 1605.0, 2673.0, 4522.0, 9463.0, 23965.0, 69176.0, 200037.0, 363178.0, 234782.0, 84082.0, 28613.0, 10988.0, 5235.0, 2774.0, 1705.0, 1059.0, 614.0, 417.0, 277.0, 188.0, 136.0, 81.0, 69.0, 38.0, 35.0, 23.0, 20.0, 10.0, 6.0, 7.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.591796875, -3.466156005859375, -3.34051513671875, -3.214874267578125, -3.0892333984375, -2.963592529296875, -2.83795166015625, -2.712310791015625, -2.586669921875, -2.461029052734375, -2.33538818359375, -2.209747314453125, -2.0841064453125, -1.958465576171875, -1.83282470703125, -1.707183837890625, -1.58154296875, -1.455902099609375, -1.33026123046875, -1.204620361328125, -1.0789794921875, -0.953338623046875, -0.82769775390625, -0.702056884765625, -0.576416015625, -0.450775146484375, -0.32513427734375, -0.199493408203125, -0.0738525390625, 0.051788330078125, 0.17742919921875, 0.303070068359375, 0.4287109375, 0.554351806640625, 0.67999267578125, 0.805633544921875, 0.9312744140625, 1.056915283203125, 1.18255615234375, 1.308197021484375, 1.433837890625, 1.559478759765625, 1.68511962890625, 1.810760498046875, 1.9364013671875, 2.062042236328125, 2.18768310546875, 2.313323974609375, 2.43896484375, 2.564605712890625, 2.69024658203125, 2.815887451171875, 2.9415283203125, 3.067169189453125, 3.19281005859375, 3.318450927734375, 3.444091796875, 3.569732666015625, 3.69537353515625, 3.821014404296875, 3.9466552734375, 4.072296142578125, 4.19793701171875, 4.323577880859375, 4.44921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 2.0, 4.0, 8.0, 7.0, 10.0, 20.0, 35.0, 23.0, 40.0, 52.0, 57.0, 67.0, 74.0, 80.0, 87.0, 75.0, 72.0, 79.0, 46.0, 55.0, 25.0, 18.0, 19.0, 14.0, 8.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.017578125, -0.981292724609375, -0.94500732421875, -0.908721923828125, -0.8724365234375, -0.836151123046875, -0.79986572265625, -0.763580322265625, -0.727294921875, -0.691009521484375, -0.65472412109375, -0.618438720703125, -0.5821533203125, -0.545867919921875, -0.50958251953125, -0.473297119140625, -0.43701171875, -0.400726318359375, -0.36444091796875, -0.328155517578125, -0.2918701171875, -0.255584716796875, -0.21929931640625, -0.183013916015625, -0.146728515625, -0.110443115234375, -0.07415771484375, -0.037872314453125, -0.0015869140625, 0.034698486328125, 0.07098388671875, 0.107269287109375, 0.1435546875, 0.179840087890625, 0.21612548828125, 0.252410888671875, 0.2886962890625, 0.324981689453125, 0.36126708984375, 0.397552490234375, 0.433837890625, 0.470123291015625, 0.50640869140625, 0.542694091796875, 0.5789794921875, 0.615264892578125, 0.65155029296875, 0.687835693359375, 0.72412109375, 0.760406494140625, 0.79669189453125, 0.832977294921875, 0.8692626953125, 0.905548095703125, 0.94183349609375, 0.978118896484375, 1.014404296875, 1.050689697265625, 1.08697509765625, 1.123260498046875, 1.1595458984375, 1.195831298828125, 1.23211669921875, 1.268402099609375, 1.3046875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 5.0, 7.0, 6.0, 12.0, 17.0, 22.0, 26.0, 29.0, 42.0, 39.0, 50.0, 42.0, 61.0, 51.0, 64.0, 64.0, 61.0, 69.0, 45.0, 49.0, 34.0, 34.0, 28.0, 29.0, 23.0, 16.0, 6.0, 8.0, 6.0, 13.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.248778820037842, -5.094093322753906, -4.9394073486328125, -4.784721851348877, -4.630036354064941, -4.475350379943848, -4.320664882659912, -4.165979385375977, -4.011293411254883, -3.856607675552368, -3.7019219398498535, -3.547236442565918, -3.3925507068634033, -3.2378649711608887, -3.083179473876953, -2.9284937381744385, -2.773808002471924, -2.619122266769409, -2.4644365310668945, -2.309751033782959, -2.1550652980804443, -2.0003795623779297, -1.8456939458847046, -1.6910083293914795, -1.5363225936889648, -1.3816368579864502, -1.226951241493225, -1.072265625, -0.9175798892974854, -0.7628942131996155, -0.6082085371017456, -0.4535229206085205, -0.29883718490600586, -0.144151508808136, 0.010534167289733887, 0.16521984338760376, 0.31990551948547363, 0.4745911955833435, 0.6292768716812134, 0.7839624881744385, 0.9386482238769531, 1.0933339595794678, 1.2480195760726929, 1.402705192565918, 1.5573909282684326, 1.7120766639709473, 1.8667622804641724, 2.0214478969573975, 2.176133632659912, 2.3308193683624268, 2.4855051040649414, 2.640190601348877, 2.7948763370513916, 2.9495620727539062, 3.104247570037842, 3.2589333057403564, 3.413619041442871, 3.5683047771453857, 3.7229905128479004, 3.877676010131836, 4.03236198425293, 4.187047481536865, 4.341732978820801, 4.4964189529418945, 4.65110445022583]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 3.0, 5.0, 3.0, 13.0, 10.0, 8.0, 15.0, 15.0, 12.0, 15.0, 26.0, 26.0, 23.0, 26.0, 41.0, 28.0, 24.0, 27.0, 37.0, 35.0, 30.0, 47.0, 47.0, 33.0, 34.0, 40.0, 46.0, 31.0, 30.0, 32.0, 30.0, 29.0, 21.0, 21.0, 24.0, 19.0, 9.0, 14.0, 14.0, 16.0, 6.0, 11.0, 2.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6688833236694336, -3.5475361347198486, -3.4261887073516846, -3.3048415184020996, -3.1834940910339355, -3.0621469020843506, -2.9407997131347656, -2.8194522857666016, -2.6981050968170166, -2.5767579078674316, -2.4554104804992676, -2.3340632915496826, -2.2127161026000977, -2.0913686752319336, -1.9700214862823486, -1.8486741781234741, -1.7273268699645996, -1.605979561805725, -1.4846322536468506, -1.3632850646972656, -1.2419377565383911, -1.1205904483795166, -0.9992431998252869, -0.8778959512710571, -0.7565486431121826, -0.6352013349533081, -0.5138540863990784, -0.39250680804252625, -0.2711595296859741, -0.1498122215270996, -0.028464972972869873, 0.09288227558135986, 0.21422958374023438, 0.3355768620967865, 0.4569241404533386, 0.5782713890075684, 0.6996186971664429, 0.8209660053253174, 0.9423132538795471, 1.0636605024337769, 1.1850078105926514, 1.3063551187515259, 1.4277024269104004, 1.5490496158599854, 1.6703969240188599, 1.7917442321777344, 1.9130914211273193, 2.0344386100769043, 2.1557860374450684, 2.2771332263946533, 2.3984806537628174, 2.5198278427124023, 2.6411752700805664, 2.7625224590301514, 2.8838696479797363, 3.0052170753479004, 3.1265642642974854, 3.2479114532470703, 3.3692588806152344, 3.4906060695648193, 3.6119532585144043, 3.7333006858825684, 3.8546478748321533, 3.9759950637817383, 4.097342491149902]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 15.0, 19.0, 42.0, 60.0, 86.0, 114.0, 172.0, 261.0, 461.0, 670.0, 969.0, 1543.0, 2427.0, 3770.0, 6132.0, 10033.0, 16463.0, 28260.0, 46722.0, 75838.0, 113410.0, 150095.0, 163913.0, 143880.0, 106339.0, 69224.0, 42809.0, 25270.0, 15089.0, 9107.0, 5601.0, 3398.0, 2200.0, 1378.0, 942.0, 601.0, 404.0, 285.0, 175.0, 133.0, 77.0, 55.0, 42.0, 19.0, 15.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.07421875, -3.9356689453125, -3.797119140625, -3.6585693359375, -3.52001953125, -3.3814697265625, -3.242919921875, -3.1043701171875, -2.9658203125, -2.8272705078125, -2.688720703125, -2.5501708984375, -2.41162109375, -2.2730712890625, -2.134521484375, -1.9959716796875, -1.857421875, -1.7188720703125, -1.580322265625, -1.4417724609375, -1.30322265625, -1.1646728515625, -1.026123046875, -0.8875732421875, -0.7490234375, -0.6104736328125, -0.471923828125, -0.3333740234375, -0.19482421875, -0.0562744140625, 0.082275390625, 0.2208251953125, 0.359375, 0.4979248046875, 0.636474609375, 0.7750244140625, 0.91357421875, 1.0521240234375, 1.190673828125, 1.3292236328125, 1.4677734375, 1.6063232421875, 1.744873046875, 1.8834228515625, 2.02197265625, 2.1605224609375, 2.299072265625, 2.4376220703125, 2.576171875, 2.7147216796875, 2.853271484375, 2.9918212890625, 3.13037109375, 3.2689208984375, 3.407470703125, 3.5460205078125, 3.6845703125, 3.8231201171875, 3.961669921875, 4.1002197265625, 4.23876953125, 4.3773193359375, 4.515869140625, 4.6544189453125, 4.79296875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 10.0, 10.0, 7.0, 7.0, 8.0, 16.0, 13.0, 17.0, 16.0, 26.0, 25.0, 30.0, 27.0, 31.0, 36.0, 37.0, 30.0, 39.0, 40.0, 41.0, 43.0, 29.0, 44.0, 39.0, 35.0, 40.0, 30.0, 39.0, 23.0, 25.0, 30.0, 21.0, 29.0, 16.0, 12.0, 9.0, 16.0, 16.0, 7.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.916015625, -3.788177490234375, -3.66033935546875, -3.532501220703125, -3.4046630859375, -3.276824951171875, -3.14898681640625, -3.021148681640625, -2.893310546875, -2.765472412109375, -2.63763427734375, -2.509796142578125, -2.3819580078125, -2.254119873046875, -2.12628173828125, -1.998443603515625, -1.87060546875, -1.742767333984375, -1.61492919921875, -1.487091064453125, -1.3592529296875, -1.231414794921875, -1.10357666015625, -0.975738525390625, -0.847900390625, -0.720062255859375, -0.59222412109375, -0.464385986328125, -0.3365478515625, -0.208709716796875, -0.08087158203125, 0.046966552734375, 0.1748046875, 0.302642822265625, 0.43048095703125, 0.558319091796875, 0.6861572265625, 0.813995361328125, 0.94183349609375, 1.069671630859375, 1.197509765625, 1.325347900390625, 1.45318603515625, 1.581024169921875, 1.7088623046875, 1.836700439453125, 1.96453857421875, 2.092376708984375, 2.22021484375, 2.348052978515625, 2.47589111328125, 2.603729248046875, 2.7315673828125, 2.859405517578125, 2.98724365234375, 3.115081787109375, 3.242919921875, 3.370758056640625, 3.49859619140625, 3.626434326171875, 3.7542724609375, 3.882110595703125, 4.00994873046875, 4.137786865234375, 4.265625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 9.0, 20.0, 29.0, 35.0, 46.0, 75.0, 119.0, 188.0, 283.0, 382.0, 563.0, 966.0, 1473.0, 2231.0, 3708.0, 5812.0, 9175.0, 14953.0, 24222.0, 39165.0, 61904.0, 94644.0, 129995.0, 154574.0, 149933.0, 121256.0, 85403.0, 55732.0, 34524.0, 21407.0, 13240.0, 8163.0, 5246.0, 3292.0, 2057.0, 1340.0, 828.0, 556.0, 341.0, 245.0, 155.0, 91.0, 56.0, 56.0, 17.0, 24.0, 12.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.90625, -3.77972412109375, -3.6531982421875, -3.52667236328125, -3.400146484375, -3.27362060546875, -3.1470947265625, -3.02056884765625, -2.89404296875, -2.76751708984375, -2.6409912109375, -2.51446533203125, -2.387939453125, -2.26141357421875, -2.1348876953125, -2.00836181640625, -1.8818359375, -1.75531005859375, -1.6287841796875, -1.50225830078125, -1.375732421875, -1.24920654296875, -1.1226806640625, -0.99615478515625, -0.86962890625, -0.74310302734375, -0.6165771484375, -0.49005126953125, -0.363525390625, -0.23699951171875, -0.1104736328125, 0.01605224609375, 0.142578125, 0.26910400390625, 0.3956298828125, 0.52215576171875, 0.648681640625, 0.77520751953125, 0.9017333984375, 1.02825927734375, 1.15478515625, 1.28131103515625, 1.4078369140625, 1.53436279296875, 1.660888671875, 1.78741455078125, 1.9139404296875, 2.04046630859375, 2.1669921875, 2.29351806640625, 2.4200439453125, 2.54656982421875, 2.673095703125, 2.79962158203125, 2.9261474609375, 3.05267333984375, 3.17919921875, 3.30572509765625, 3.4322509765625, 3.55877685546875, 3.685302734375, 3.81182861328125, 3.9383544921875, 4.06488037109375, 4.19140625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 5.0, 5.0, 12.0, 10.0, 11.0, 9.0, 13.0, 21.0, 20.0, 23.0, 17.0, 22.0, 33.0, 26.0, 21.0, 28.0, 27.0, 29.0, 43.0, 38.0, 36.0, 44.0, 39.0, 39.0, 34.0, 32.0, 42.0, 34.0, 28.0, 24.0, 22.0, 31.0, 25.0, 29.0, 19.0, 11.0, 14.0, 11.0, 10.0, 14.0, 12.0, 4.0, 6.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.536865234375, -2.45654296875, -2.376220703125, -2.2958984375, -2.215576171875, -2.13525390625, -2.054931640625, -1.974609375, -1.894287109375, -1.81396484375, -1.733642578125, -1.6533203125, -1.572998046875, -1.49267578125, -1.412353515625, -1.33203125, -1.251708984375, -1.17138671875, -1.091064453125, -1.0107421875, -0.930419921875, -0.85009765625, -0.769775390625, -0.689453125, -0.609130859375, -0.52880859375, -0.448486328125, -0.3681640625, -0.287841796875, -0.20751953125, -0.127197265625, -0.046875, 0.033447265625, 0.11376953125, 0.194091796875, 0.2744140625, 0.354736328125, 0.43505859375, 0.515380859375, 0.595703125, 0.676025390625, 0.75634765625, 0.836669921875, 0.9169921875, 0.997314453125, 1.07763671875, 1.157958984375, 1.23828125, 1.318603515625, 1.39892578125, 1.479248046875, 1.5595703125, 1.639892578125, 1.72021484375, 1.800537109375, 1.880859375, 1.961181640625, 2.04150390625, 2.121826171875, 2.2021484375, 2.282470703125, 2.36279296875, 2.443115234375, 2.5234375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 11.0, 20.0, 20.0, 36.0, 39.0, 69.0, 113.0, 146.0, 264.0, 444.0, 612.0, 1033.0, 1693.0, 3159.0, 5798.0, 11166.0, 22853.0, 50959.0, 122232.0, 272134.0, 298335.0, 144031.0, 59820.0, 26313.0, 12380.0, 6339.0, 3429.0, 1976.0, 1196.0, 684.0, 442.0, 274.0, 174.0, 111.0, 96.0, 50.0, 35.0, 18.0, 17.0, 12.0, 9.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.05078125, -6.83770751953125, -6.6246337890625, -6.41156005859375, -6.198486328125, -5.98541259765625, -5.7723388671875, -5.55926513671875, -5.34619140625, -5.13311767578125, -4.9200439453125, -4.70697021484375, -4.493896484375, -4.28082275390625, -4.0677490234375, -3.85467529296875, -3.6416015625, -3.42852783203125, -3.2154541015625, -3.00238037109375, -2.789306640625, -2.57623291015625, -2.3631591796875, -2.15008544921875, -1.93701171875, -1.72393798828125, -1.5108642578125, -1.29779052734375, -1.084716796875, -0.87164306640625, -0.6585693359375, -0.44549560546875, -0.232421875, -0.01934814453125, 0.1937255859375, 0.40679931640625, 0.619873046875, 0.83294677734375, 1.0460205078125, 1.25909423828125, 1.47216796875, 1.68524169921875, 1.8983154296875, 2.11138916015625, 2.324462890625, 2.53753662109375, 2.7506103515625, 2.96368408203125, 3.1767578125, 3.38983154296875, 3.6029052734375, 3.81597900390625, 4.029052734375, 4.24212646484375, 4.4552001953125, 4.66827392578125, 4.88134765625, 5.09442138671875, 5.3074951171875, 5.52056884765625, 5.733642578125, 5.94671630859375, 6.1597900390625, 6.37286376953125, 6.5859375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 2.0, 11.0, 6.0, 13.0, 11.0, 19.0, 18.0, 19.0, 29.0, 39.0, 49.0, 57.0, 54.0, 82.0, 111.0, 94.0, 86.0, 61.0, 49.0, 43.0, 25.0, 18.0, 24.0, 12.0, 9.0, 13.0, 13.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005750656127929688, -0.0005580708384513855, -0.0005410760641098022, -0.000524081289768219, -0.0005070865154266357, -0.0004900917410850525, -0.00047309696674346924, -0.000456102192401886, -0.00043910741806030273, -0.0004221126437187195, -0.00040511786937713623, -0.000388123095035553, -0.0003711283206939697, -0.0003541335463523865, -0.0003371387720108032, -0.00032014399766921997, -0.0003031492233276367, -0.00028615444898605347, -0.0002691596746444702, -0.00025216490030288696, -0.0002351701259613037, -0.00021817535161972046, -0.0002011805772781372, -0.00018418580293655396, -0.0001671910285949707, -0.00015019625425338745, -0.0001332014799118042, -0.00011620670557022095, -9.92119312286377e-05, -8.221715688705444e-05, -6.522238254547119e-05, -4.822760820388794e-05, -3.123283386230469e-05, -1.4238059520721436e-05, 2.7567148208618164e-06, 1.975148916244507e-05, 3.674626350402832e-05, 5.374103784561157e-05, 7.073581218719482e-05, 8.773058652877808e-05, 0.00010472536087036133, 0.00012172013521194458, 0.00013871490955352783, 0.00015570968389511108, 0.00017270445823669434, 0.0001896992325782776, 0.00020669400691986084, 0.0002236887812614441, 0.00024068355560302734, 0.0002576783299446106, 0.00027467310428619385, 0.0002916678786277771, 0.00030866265296936035, 0.0003256574273109436, 0.00034265220165252686, 0.0003596469759941101, 0.00037664175033569336, 0.0003936365246772766, 0.00041063129901885986, 0.0004276260733604431, 0.00044462084770202637, 0.0004616156220436096, 0.00047861039638519287, 0.0004956051707267761, 0.0005125999450683594]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 27.0, 27.0, 36.0, 52.0, 94.0, 173.0, 211.0, 342.0, 511.0, 749.0, 1259.0, 1916.0, 3060.0, 4866.0, 8086.0, 13827.0, 23877.0, 41623.0, 72641.0, 125028.0, 188714.0, 202824.0, 147789.0, 89140.0, 50597.0, 28601.0, 16628.0, 9920.0, 5999.0, 3579.0, 2286.0, 1405.0, 952.0, 629.0, 372.0, 229.0, 181.0, 109.0, 60.0, 35.0, 23.0, 22.0, 12.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.73046875, -3.614532470703125, -3.49859619140625, -3.382659912109375, -3.2667236328125, -3.150787353515625, -3.03485107421875, -2.918914794921875, -2.802978515625, -2.687042236328125, -2.57110595703125, -2.455169677734375, -2.3392333984375, -2.223297119140625, -2.10736083984375, -1.991424560546875, -1.87548828125, -1.759552001953125, -1.64361572265625, -1.527679443359375, -1.4117431640625, -1.295806884765625, -1.17987060546875, -1.063934326171875, -0.947998046875, -0.832061767578125, -0.71612548828125, -0.600189208984375, -0.4842529296875, -0.368316650390625, -0.25238037109375, -0.136444091796875, -0.0205078125, 0.095428466796875, 0.21136474609375, 0.327301025390625, 0.4432373046875, 0.559173583984375, 0.67510986328125, 0.791046142578125, 0.906982421875, 1.022918701171875, 1.13885498046875, 1.254791259765625, 1.3707275390625, 1.486663818359375, 1.60260009765625, 1.718536376953125, 1.83447265625, 1.950408935546875, 2.06634521484375, 2.182281494140625, 2.2982177734375, 2.414154052734375, 2.53009033203125, 2.646026611328125, 2.761962890625, 2.877899169921875, 2.99383544921875, 3.109771728515625, 3.2257080078125, 3.341644287109375, 3.45758056640625, 3.573516845703125, 3.689453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 7.0, 9.0, 7.0, 15.0, 12.0, 16.0, 22.0, 30.0, 29.0, 52.0, 51.0, 60.0, 63.0, 75.0, 77.0, 72.0, 56.0, 61.0, 60.0, 44.0, 34.0, 31.0, 27.0, 24.0, 10.0, 17.0, 10.0, 5.0, 7.0, 6.0, 2.0, 1.0, 0.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.9580078125, -1.9060516357421875, -1.854095458984375, -1.8021392822265625, -1.75018310546875, -1.6982269287109375, -1.646270751953125, -1.5943145751953125, -1.5423583984375, -1.4904022216796875, -1.438446044921875, -1.3864898681640625, -1.33453369140625, -1.2825775146484375, -1.230621337890625, -1.1786651611328125, -1.126708984375, -1.0747528076171875, -1.022796630859375, -0.9708404541015625, -0.91888427734375, -0.8669281005859375, -0.814971923828125, -0.7630157470703125, -0.7110595703125, -0.6591033935546875, -0.607147216796875, -0.5551910400390625, -0.50323486328125, -0.4512786865234375, -0.399322509765625, -0.3473663330078125, -0.29541015625, -0.2434539794921875, -0.191497802734375, -0.1395416259765625, -0.08758544921875, -0.0356292724609375, 0.016326904296875, 0.0682830810546875, 0.1202392578125, 0.1721954345703125, 0.224151611328125, 0.2761077880859375, 0.32806396484375, 0.3800201416015625, 0.431976318359375, 0.4839324951171875, 0.535888671875, 0.5878448486328125, 0.639801025390625, 0.6917572021484375, 0.74371337890625, 0.7956695556640625, 0.847625732421875, 0.8995819091796875, 0.9515380859375, 1.0034942626953125, 1.055450439453125, 1.1074066162109375, 1.15936279296875, 1.2113189697265625, 1.263275146484375, 1.3152313232421875, 1.3671875]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 8.0, 6.0, 9.0, 15.0, 10.0, 26.0, 24.0, 27.0, 24.0, 46.0, 36.0, 50.0, 49.0, 68.0, 64.0, 62.0, 53.0, 61.0, 61.0, 39.0, 45.0, 37.0, 34.0, 29.0, 19.0, 15.0, 11.0, 12.0, 10.0, 9.0, 1.0, 5.0, 3.0, 7.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.270042419433594, -5.113237380981445, -4.956432819366455, -4.799627780914307, -4.642823219299316, -4.486018180847168, -4.3292131423950195, -4.172408103942871, -4.015603542327881, -3.8587987422943115, -3.701993942260742, -3.5451889038085938, -3.3883841037750244, -3.231579303741455, -3.0747742652893066, -2.9179694652557373, -2.761164665222168, -2.6043598651885986, -2.4475550651550293, -2.290750026702881, -2.1339452266693115, -1.9771404266357422, -1.8203355073928833, -1.6635305881500244, -1.506725788116455, -1.3499209880828857, -1.1931160688400269, -1.036311149597168, -0.8795063495635986, -0.7227014899253845, -0.5658966302871704, -0.4090917110443115, -0.252286434173584, -0.09548157453536987, 0.06132328510284424, 0.21812814474105835, 0.37493300437927246, 0.5317378640174866, 0.6885427236557007, 0.8453476428985596, 1.002152442932129, 1.1589572429656982, 1.3157621622085571, 1.472567081451416, 1.6293718814849854, 1.7861766815185547, 1.9429816007614136, 2.0997865200042725, 2.256591320037842, 2.413396120071411, 2.5702009201049805, 2.727005958557129, 2.8838107585906982, 3.0406155586242676, 3.197420597076416, 3.3542253971099854, 3.5110301971435547, 3.667834997177124, 3.8246397972106934, 3.981444835662842, 4.138249397277832, 4.2950544357299805, 4.451859474182129, 4.608664512634277, 4.765469074249268]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 6.0, 5.0, 4.0, 6.0, 6.0, 7.0, 17.0, 9.0, 17.0, 14.0, 11.0, 27.0, 22.0, 22.0, 21.0, 31.0, 27.0, 30.0, 32.0, 29.0, 40.0, 31.0, 43.0, 45.0, 39.0, 29.0, 44.0, 44.0, 37.0, 30.0, 33.0, 22.0, 35.0, 27.0, 23.0, 22.0, 11.0, 12.0, 14.0, 13.0, 6.0, 12.0, 11.0, 7.0, 8.0, 4.0, 6.0, 0.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-3.937185287475586, -3.8166260719299316, -3.6960666179656982, -3.575507402420044, -3.4549481868743896, -3.3343887329101562, -3.213829517364502, -3.0932703018188477, -2.9727110862731934, -2.852151870727539, -2.7315924167633057, -2.6110332012176514, -2.490473985671997, -2.3699145317077637, -2.2493553161621094, -2.128796100616455, -2.0082366466522217, -1.8876773118972778, -1.7671180963516235, -1.6465587615966797, -1.5259995460510254, -1.4054402112960815, -1.2848808765411377, -1.1643216609954834, -1.0437623262405396, -0.9232030510902405, -0.8026437759399414, -0.6820844411849976, -0.5615251660346985, -0.4409658908843994, -0.32040655612945557, -0.1998472809791565, -0.07928824424743652, 0.04127104580402374, 0.161830335855484, 0.28238964080810547, 0.40294891595840454, 0.5235081911087036, 0.6440675258636475, 0.7646268010139465, 0.8851860761642456, 1.0057454109191895, 1.1263046264648438, 1.2468639612197876, 1.3674232959747314, 1.4879825115203857, 1.6085418462753296, 1.7291011810302734, 1.8496603965759277, 1.9702197313308716, 2.0907790660858154, 2.2113382816314697, 2.331897497177124, 2.4524569511413574, 2.5730161666870117, 2.693575382232666, 2.8141345977783203, 2.9346938133239746, 3.055253267288208, 3.1758124828338623, 3.2963716983795166, 3.41693115234375, 3.5374903678894043, 3.6580495834350586, 3.778609037399292]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 7.0, 10.0, 24.0, 32.0, 48.0, 64.0, 102.0, 124.0, 164.0, 286.0, 402.0, 595.0, 832.0, 1275.0, 1888.0, 2905.0, 4708.0, 7541.0, 12784.0, 23668.0, 47976.0, 113712.0, 315505.0, 835844.0, 1330635.0, 901575.0, 353648.0, 126479.0, 52955.0, 25091.0, 13404.0, 7651.0, 4674.0, 2794.0, 1793.0, 1104.0, 704.0, 491.0, 278.0, 167.0, 113.0, 94.0, 45.0, 31.0, 23.0, 18.0, 5.0, 6.0, 3.0, 1.0, 1.0], "bins": [-6.34375, -6.1748046875, -6.005859375, -5.8369140625, -5.66796875, -5.4990234375, -5.330078125, -5.1611328125, -4.9921875, -4.8232421875, -4.654296875, -4.4853515625, -4.31640625, -4.1474609375, -3.978515625, -3.8095703125, -3.640625, -3.4716796875, -3.302734375, -3.1337890625, -2.96484375, -2.7958984375, -2.626953125, -2.4580078125, -2.2890625, -2.1201171875, -1.951171875, -1.7822265625, -1.61328125, -1.4443359375, -1.275390625, -1.1064453125, -0.9375, -0.7685546875, -0.599609375, -0.4306640625, -0.26171875, -0.0927734375, 0.076171875, 0.2451171875, 0.4140625, 0.5830078125, 0.751953125, 0.9208984375, 1.08984375, 1.2587890625, 1.427734375, 1.5966796875, 1.765625, 1.9345703125, 2.103515625, 2.2724609375, 2.44140625, 2.6103515625, 2.779296875, 2.9482421875, 3.1171875, 3.2861328125, 3.455078125, 3.6240234375, 3.79296875, 3.9619140625, 4.130859375, 4.2998046875, 4.46875]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 4.0, 11.0, 12.0, 13.0, 13.0, 13.0, 20.0, 22.0, 22.0, 20.0, 26.0, 27.0, 36.0, 35.0, 38.0, 26.0, 32.0, 51.0, 49.0, 35.0, 44.0, 36.0, 45.0, 52.0, 38.0, 29.0, 33.0, 25.0, 31.0, 21.0, 16.0, 16.0, 11.0, 9.0, 17.0, 10.0, 12.0, 8.0, 3.0, 6.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.919921875, -2.829345703125, -2.73876953125, -2.648193359375, -2.5576171875, -2.467041015625, -2.37646484375, -2.285888671875, -2.1953125, -2.104736328125, -2.01416015625, -1.923583984375, -1.8330078125, -1.742431640625, -1.65185546875, -1.561279296875, -1.470703125, -1.380126953125, -1.28955078125, -1.198974609375, -1.1083984375, -1.017822265625, -0.92724609375, -0.836669921875, -0.74609375, -0.655517578125, -0.56494140625, -0.474365234375, -0.3837890625, -0.293212890625, -0.20263671875, -0.112060546875, -0.021484375, 0.069091796875, 0.15966796875, 0.250244140625, 0.3408203125, 0.431396484375, 0.52197265625, 0.612548828125, 0.703125, 0.793701171875, 0.88427734375, 0.974853515625, 1.0654296875, 1.156005859375, 1.24658203125, 1.337158203125, 1.427734375, 1.518310546875, 1.60888671875, 1.699462890625, 1.7900390625, 1.880615234375, 1.97119140625, 2.061767578125, 2.15234375, 2.242919921875, 2.33349609375, 2.424072265625, 2.5146484375, 2.605224609375, 2.69580078125, 2.786376953125, 2.876953125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 4.0, 7.0, 6.0, 14.0, 16.0, 16.0, 16.0, 35.0, 43.0, 76.0, 137.0, 181.0, 240.0, 399.0, 549.0, 957.0, 1528.0, 2393.0, 3784.0, 6243.0, 11205.0, 19826.0, 36311.0, 71232.0, 151715.0, 351356.0, 817128.0, 1247686.0, 813879.0, 351394.0, 151271.0, 71243.0, 36192.0, 19351.0, 11073.0, 6422.0, 3820.0, 2394.0, 1479.0, 930.0, 607.0, 388.0, 252.0, 145.0, 110.0, 70.0, 58.0, 30.0, 27.0, 14.0, 8.0, 12.0, 6.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.99609375, -4.832275390625, -4.66845703125, -4.504638671875, -4.3408203125, -4.177001953125, -4.01318359375, -3.849365234375, -3.685546875, -3.521728515625, -3.35791015625, -3.194091796875, -3.0302734375, -2.866455078125, -2.70263671875, -2.538818359375, -2.375, -2.211181640625, -2.04736328125, -1.883544921875, -1.7197265625, -1.555908203125, -1.39208984375, -1.228271484375, -1.064453125, -0.900634765625, -0.73681640625, -0.572998046875, -0.4091796875, -0.245361328125, -0.08154296875, 0.082275390625, 0.24609375, 0.409912109375, 0.57373046875, 0.737548828125, 0.9013671875, 1.065185546875, 1.22900390625, 1.392822265625, 1.556640625, 1.720458984375, 1.88427734375, 2.048095703125, 2.2119140625, 2.375732421875, 2.53955078125, 2.703369140625, 2.8671875, 3.031005859375, 3.19482421875, 3.358642578125, 3.5224609375, 3.686279296875, 3.85009765625, 4.013916015625, 4.177734375, 4.341552734375, 4.50537109375, 4.669189453125, 4.8330078125, 4.996826171875, 5.16064453125, 5.324462890625, 5.48828125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 8.0, 4.0, 10.0, 5.0, 16.0, 15.0, 24.0, 28.0, 22.0, 51.0, 40.0, 63.0, 89.0, 103.0, 142.0, 167.0, 215.0, 262.0, 303.0, 354.0, 288.0, 343.0, 282.0, 239.0, 207.0, 187.0, 145.0, 94.0, 90.0, 68.0, 54.0, 36.0, 34.0, 22.0, 16.0, 13.0, 7.0, 9.0, 5.0, 5.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.912109375, -1.8591156005859375, -1.806121826171875, -1.7531280517578125, -1.70013427734375, -1.6471405029296875, -1.594146728515625, -1.5411529541015625, -1.4881591796875, -1.4351654052734375, -1.382171630859375, -1.3291778564453125, -1.27618408203125, -1.2231903076171875, -1.170196533203125, -1.1172027587890625, -1.064208984375, -1.0112152099609375, -0.958221435546875, -0.9052276611328125, -0.85223388671875, -0.7992401123046875, -0.746246337890625, -0.6932525634765625, -0.6402587890625, -0.5872650146484375, -0.534271240234375, -0.4812774658203125, -0.42828369140625, -0.3752899169921875, -0.322296142578125, -0.2693023681640625, -0.21630859375, -0.1633148193359375, -0.110321044921875, -0.0573272705078125, -0.00433349609375, 0.0486602783203125, 0.101654052734375, 0.1546478271484375, 0.2076416015625, 0.2606353759765625, 0.313629150390625, 0.3666229248046875, 0.41961669921875, 0.4726104736328125, 0.525604248046875, 0.5785980224609375, 0.631591796875, 0.6845855712890625, 0.737579345703125, 0.7905731201171875, 0.84356689453125, 0.8965606689453125, 0.949554443359375, 1.0025482177734375, 1.0555419921875, 1.1085357666015625, 1.161529541015625, 1.2145233154296875, 1.26751708984375, 1.3205108642578125, 1.373504638671875, 1.4264984130859375, 1.4794921875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 1.0, 7.0, 12.0, 12.0, 18.0, 7.0, 12.0, 25.0, 25.0, 31.0, 45.0, 52.0, 61.0, 49.0, 70.0, 62.0, 80.0, 68.0, 65.0, 46.0, 48.0, 40.0, 38.0, 27.0, 21.0, 20.0, 10.0, 11.0, 7.0, 8.0, 5.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9467973709106445, -4.784440994262695, -4.622085094451904, -4.459728717803955, -4.297372817993164, -4.135016441345215, -3.972660541534424, -3.8103041648864746, -3.6479482650756836, -3.4855921268463135, -3.3232359886169434, -3.1608798503875732, -2.998523712158203, -2.836167573928833, -2.673811435699463, -2.5114550590515137, -2.3490989208221436, -2.1867427825927734, -2.0243866443634033, -1.8620305061340332, -1.699674367904663, -1.537318229675293, -1.3749619722366333, -1.2126058340072632, -1.050249695777893, -0.887893557548523, -0.7255374193191528, -0.5631812214851379, -0.4008250832557678, -0.2384689450263977, -0.07611274719238281, 0.0862433910369873, 0.24859952926635742, 0.41095566749572754, 0.5733118057250977, 0.7356680035591125, 0.8980241417884827, 1.060380220413208, 1.2227364778518677, 1.3850926160812378, 1.547448754310608, 1.709804892539978, 1.8721610307693481, 2.034517288208008, 2.196873426437378, 2.359229564666748, 2.521585702896118, 2.6839418411254883, 2.8462979793548584, 3.0086541175842285, 3.1710102558135986, 3.3333663940429688, 3.495722532272339, 3.658078670501709, 3.820435047149658, 3.982790946960449, 4.145147323608398, 4.307503700256348, 4.469859600067139, 4.632215976715088, 4.794571876525879, 4.956928253173828, 5.119284152984619, 5.281640529632568, 5.443996429443359]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 1.0, 4.0, 3.0, 4.0, 7.0, 7.0, 8.0, 15.0, 12.0, 13.0, 18.0, 13.0, 26.0, 19.0, 25.0, 21.0, 32.0, 33.0, 41.0, 43.0, 41.0, 43.0, 42.0, 39.0, 48.0, 35.0, 36.0, 37.0, 37.0, 31.0, 35.0, 27.0, 28.0, 27.0, 18.0, 18.0, 19.0, 19.0, 20.0, 11.0, 10.0, 8.0, 6.0, 9.0, 5.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4119503498077393, -3.3018441200256348, -3.1917378902435303, -3.081631660461426, -2.9715256690979004, -2.861419439315796, -2.7513132095336914, -2.641206979751587, -2.5311007499694824, -2.420994520187378, -2.3108882904052734, -2.200782299041748, -2.0906760692596436, -1.980569839477539, -1.8704636096954346, -1.76035737991333, -1.6502513885498047, -1.5401451587677002, -1.4300390481948853, -1.3199328184127808, -1.2098267078399658, -1.0997204780578613, -0.9896142482757568, -0.8795080780982971, -0.7694019079208374, -0.6592957377433777, -0.549189567565918, -0.4390833377838135, -0.32897716760635376, -0.21887099742889404, -0.10876476764678955, 0.001341402530670166, 0.11144781112670898, 0.2215539962053299, 0.3316601812839508, 0.4417663812637329, 0.5518725514411926, 0.6619787216186523, 0.7720849514007568, 0.8821911215782166, 0.9922972917556763, 1.1024035215377808, 1.2125096321105957, 1.3226158618927002, 1.4327220916748047, 1.5428282022476196, 1.6529344320297241, 1.763040542602539, 1.8731467723846436, 1.983253002166748, 2.0933592319488525, 2.203465461730957, 2.3135714530944824, 2.423677682876587, 2.5337839126586914, 2.643890142440796, 2.7539963722229004, 2.864102602005005, 2.9742088317871094, 3.0843148231506348, 3.1944210529327393, 3.3045272827148438, 3.4146335124969482, 3.5247397422790527, 3.634845733642578]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 8.0, 18.0, 27.0, 31.0, 51.0, 63.0, 116.0, 167.0, 234.0, 368.0, 627.0, 925.0, 1549.0, 2552.0, 4185.0, 6983.0, 12421.0, 22427.0, 41079.0, 76594.0, 136114.0, 204427.0, 210455.0, 144820.0, 82187.0, 43889.0, 23732.0, 13463.0, 7647.0, 4361.0, 2623.0, 1599.0, 997.0, 656.0, 393.0, 270.0, 170.0, 122.0, 87.0, 50.0, 22.0, 20.0, 8.0, 11.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.880859375, -3.763458251953125, -3.64605712890625, -3.528656005859375, -3.4112548828125, -3.293853759765625, -3.17645263671875, -3.059051513671875, -2.941650390625, -2.824249267578125, -2.70684814453125, -2.589447021484375, -2.4720458984375, -2.354644775390625, -2.23724365234375, -2.119842529296875, -2.00244140625, -1.885040283203125, -1.76763916015625, -1.650238037109375, -1.5328369140625, -1.415435791015625, -1.29803466796875, -1.180633544921875, -1.063232421875, -0.945831298828125, -0.82843017578125, -0.711029052734375, -0.5936279296875, -0.476226806640625, -0.35882568359375, -0.241424560546875, -0.1240234375, -0.006622314453125, 0.11077880859375, 0.228179931640625, 0.3455810546875, 0.462982177734375, 0.58038330078125, 0.697784423828125, 0.815185546875, 0.932586669921875, 1.04998779296875, 1.167388916015625, 1.2847900390625, 1.402191162109375, 1.51959228515625, 1.636993408203125, 1.75439453125, 1.871795654296875, 1.98919677734375, 2.106597900390625, 2.2239990234375, 2.341400146484375, 2.45880126953125, 2.576202392578125, 2.693603515625, 2.811004638671875, 2.92840576171875, 3.045806884765625, 3.1632080078125, 3.280609130859375, 3.39801025390625, 3.515411376953125, 3.6328125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 14.0, 8.0, 11.0, 5.0, 15.0, 22.0, 15.0, 20.0, 28.0, 22.0, 32.0, 30.0, 22.0, 39.0, 44.0, 41.0, 35.0, 37.0, 39.0, 40.0, 46.0, 36.0, 26.0, 38.0, 38.0, 29.0, 24.0, 26.0, 27.0, 22.0, 17.0, 22.0, 17.0, 16.0, 21.0, 10.0, 7.0, 10.0, 5.0, 3.0, 7.0, 4.0, 9.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-3.580078125, -3.47216796875, -3.3642578125, -3.25634765625, -3.1484375, -3.04052734375, -2.9326171875, -2.82470703125, -2.716796875, -2.60888671875, -2.5009765625, -2.39306640625, -2.28515625, -2.17724609375, -2.0693359375, -1.96142578125, -1.853515625, -1.74560546875, -1.6376953125, -1.52978515625, -1.421875, -1.31396484375, -1.2060546875, -1.09814453125, -0.990234375, -0.88232421875, -0.7744140625, -0.66650390625, -0.55859375, -0.45068359375, -0.3427734375, -0.23486328125, -0.126953125, -0.01904296875, 0.0888671875, 0.19677734375, 0.3046875, 0.41259765625, 0.5205078125, 0.62841796875, 0.736328125, 0.84423828125, 0.9521484375, 1.06005859375, 1.16796875, 1.27587890625, 1.3837890625, 1.49169921875, 1.599609375, 1.70751953125, 1.8154296875, 1.92333984375, 2.03125, 2.13916015625, 2.2470703125, 2.35498046875, 2.462890625, 2.57080078125, 2.6787109375, 2.78662109375, 2.89453125, 3.00244140625, 3.1103515625, 3.21826171875, 3.326171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 10.0, 5.0, 16.0, 15.0, 18.0, 34.0, 43.0, 59.0, 81.0, 125.0, 149.0, 225.0, 352.0, 533.0, 886.0, 1453.0, 2242.0, 3942.0, 7036.0, 13754.0, 28591.0, 64006.0, 151885.0, 315082.0, 254948.0, 110071.0, 46360.0, 21733.0, 10669.0, 5722.0, 3267.0, 1852.0, 1151.0, 717.0, 481.0, 302.0, 224.0, 164.0, 105.0, 70.0, 57.0, 39.0, 23.0, 17.0, 11.0, 5.0, 6.0, 2.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-5.9296875, -5.73724365234375, -5.5447998046875, -5.35235595703125, -5.159912109375, -4.96746826171875, -4.7750244140625, -4.58258056640625, -4.39013671875, -4.19769287109375, -4.0052490234375, -3.81280517578125, -3.620361328125, -3.42791748046875, -3.2354736328125, -3.04302978515625, -2.8505859375, -2.65814208984375, -2.4656982421875, -2.27325439453125, -2.080810546875, -1.88836669921875, -1.6959228515625, -1.50347900390625, -1.31103515625, -1.11859130859375, -0.9261474609375, -0.73370361328125, -0.541259765625, -0.34881591796875, -0.1563720703125, 0.03607177734375, 0.228515625, 0.42095947265625, 0.6134033203125, 0.80584716796875, 0.998291015625, 1.19073486328125, 1.3831787109375, 1.57562255859375, 1.76806640625, 1.96051025390625, 2.1529541015625, 2.34539794921875, 2.537841796875, 2.73028564453125, 2.9227294921875, 3.11517333984375, 3.3076171875, 3.50006103515625, 3.6925048828125, 3.88494873046875, 4.077392578125, 4.26983642578125, 4.4622802734375, 4.65472412109375, 4.84716796875, 5.03961181640625, 5.2320556640625, 5.42449951171875, 5.616943359375, 5.80938720703125, 6.0018310546875, 6.19427490234375, 6.38671875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 9.0, 7.0, 10.0, 15.0, 16.0, 15.0, 24.0, 35.0, 18.0, 24.0, 35.0, 43.0, 46.0, 46.0, 43.0, 54.0, 58.0, 43.0, 33.0, 41.0, 37.0, 47.0, 38.0, 30.0, 40.0, 31.0, 29.0, 27.0, 21.0, 17.0, 10.0, 13.0, 7.0, 11.0, 5.0, 1.0, 3.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.490234375, -2.409881591796875, -2.32952880859375, -2.249176025390625, -2.1688232421875, -2.088470458984375, -2.00811767578125, -1.927764892578125, -1.847412109375, -1.767059326171875, -1.68670654296875, -1.606353759765625, -1.5260009765625, -1.445648193359375, -1.36529541015625, -1.284942626953125, -1.20458984375, -1.124237060546875, -1.04388427734375, -0.963531494140625, -0.8831787109375, -0.802825927734375, -0.72247314453125, -0.642120361328125, -0.561767578125, -0.481414794921875, -0.40106201171875, -0.320709228515625, -0.2403564453125, -0.160003662109375, -0.07965087890625, 0.000701904296875, 0.0810546875, 0.161407470703125, 0.24176025390625, 0.322113037109375, 0.4024658203125, 0.482818603515625, 0.56317138671875, 0.643524169921875, 0.723876953125, 0.804229736328125, 0.88458251953125, 0.964935302734375, 1.0452880859375, 1.125640869140625, 1.20599365234375, 1.286346435546875, 1.36669921875, 1.447052001953125, 1.52740478515625, 1.607757568359375, 1.6881103515625, 1.768463134765625, 1.84881591796875, 1.929168701171875, 2.009521484375, 2.089874267578125, 2.17022705078125, 2.250579833984375, 2.3309326171875, 2.411285400390625, 2.49163818359375, 2.571990966796875, 2.65234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 7.0, 17.0, 23.0, 26.0, 43.0, 53.0, 71.0, 112.0, 168.0, 218.0, 333.0, 476.0, 807.0, 1488.0, 2634.0, 5098.0, 10869.0, 26354.0, 73915.0, 243846.0, 426458.0, 166129.0, 51985.0, 19314.0, 8521.0, 4115.0, 2105.0, 1234.0, 708.0, 450.0, 325.0, 179.0, 137.0, 89.0, 75.0, 45.0, 28.0, 30.0, 15.0, 19.0, 15.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.27734375, -4.15631103515625, -4.0352783203125, -3.91424560546875, -3.793212890625, -3.67218017578125, -3.5511474609375, -3.43011474609375, -3.30908203125, -3.18804931640625, -3.0670166015625, -2.94598388671875, -2.824951171875, -2.70391845703125, -2.5828857421875, -2.46185302734375, -2.3408203125, -2.21978759765625, -2.0987548828125, -1.97772216796875, -1.856689453125, -1.73565673828125, -1.6146240234375, -1.49359130859375, -1.37255859375, -1.25152587890625, -1.1304931640625, -1.00946044921875, -0.888427734375, -0.76739501953125, -0.6463623046875, -0.52532958984375, -0.404296875, -0.28326416015625, -0.1622314453125, -0.04119873046875, 0.079833984375, 0.20086669921875, 0.3218994140625, 0.44293212890625, 0.56396484375, 0.68499755859375, 0.8060302734375, 0.92706298828125, 1.048095703125, 1.16912841796875, 1.2901611328125, 1.41119384765625, 1.5322265625, 1.65325927734375, 1.7742919921875, 1.89532470703125, 2.016357421875, 2.13739013671875, 2.2584228515625, 2.37945556640625, 2.50048828125, 2.62152099609375, 2.7425537109375, 2.86358642578125, 2.984619140625, 3.10565185546875, 3.2266845703125, 3.34771728515625, 3.46875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 8.0, 6.0, 16.0, 20.0, 26.0, 36.0, 63.0, 73.0, 110.0, 133.0, 135.0, 108.0, 78.0, 58.0, 30.0, 19.0, 17.0, 20.0, 14.0, 6.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.799003601074219e-05, -9.223446249961853e-05, -8.647888898849487e-05, -8.072331547737122e-05, -7.496774196624756e-05, -6.92121684551239e-05, -6.345659494400024e-05, -5.770102143287659e-05, -5.194544792175293e-05, -4.618987441062927e-05, -4.0434300899505615e-05, -3.467872738838196e-05, -2.89231538772583e-05, -2.3167580366134644e-05, -1.7412006855010986e-05, -1.1656433343887329e-05, -5.900859832763672e-06, -1.4528632164001465e-07, 5.610287189483643e-06, 1.13658607006073e-05, 1.7121434211730957e-05, 2.2877007722854614e-05, 2.863258123397827e-05, 3.438815474510193e-05, 4.0143728256225586e-05, 4.589930176734924e-05, 5.16548752784729e-05, 5.741044878959656e-05, 6.316602230072021e-05, 6.892159581184387e-05, 7.467716932296753e-05, 8.043274283409119e-05, 8.618831634521484e-05, 9.19438898563385e-05, 9.769946336746216e-05, 0.00010345503687858582, 0.00010921061038970947, 0.00011496618390083313, 0.00012072175741195679, 0.00012647733092308044, 0.0001322329044342041, 0.00013798847794532776, 0.00014374405145645142, 0.00014949962496757507, 0.00015525519847869873, 0.0001610107719898224, 0.00016676634550094604, 0.0001725219190120697, 0.00017827749252319336, 0.00018403306603431702, 0.00018978863954544067, 0.00019554421305656433, 0.000201299786567688, 0.00020705536007881165, 0.0002128109335899353, 0.00021856650710105896, 0.00022432208061218262, 0.00023007765412330627, 0.00023583322763442993, 0.0002415888011455536, 0.00024734437465667725, 0.0002530999481678009, 0.00025885552167892456, 0.0002646110951900482, 0.0002703666687011719]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 9.0, 6.0, 19.0, 22.0, 23.0, 37.0, 33.0, 49.0, 85.0, 108.0, 160.0, 239.0, 324.0, 494.0, 778.0, 1248.0, 2041.0, 3713.0, 6991.0, 14975.0, 36039.0, 97378.0, 256951.0, 347385.0, 170869.0, 61480.0, 23859.0, 10609.0, 5182.0, 2847.0, 1664.0, 960.0, 639.0, 442.0, 247.0, 172.0, 111.0, 99.0, 64.0, 49.0, 36.0, 31.0, 19.0, 13.0, 13.0, 19.0, 4.0, 6.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.09375, -2.997894287109375, -2.90203857421875, -2.806182861328125, -2.7103271484375, -2.614471435546875, -2.51861572265625, -2.422760009765625, -2.326904296875, -2.231048583984375, -2.13519287109375, -2.039337158203125, -1.9434814453125, -1.847625732421875, -1.75177001953125, -1.655914306640625, -1.56005859375, -1.464202880859375, -1.36834716796875, -1.272491455078125, -1.1766357421875, -1.080780029296875, -0.98492431640625, -0.889068603515625, -0.793212890625, -0.697357177734375, -0.60150146484375, -0.505645751953125, -0.4097900390625, -0.313934326171875, -0.21807861328125, -0.122222900390625, -0.0263671875, 0.069488525390625, 0.16534423828125, 0.261199951171875, 0.3570556640625, 0.452911376953125, 0.54876708984375, 0.644622802734375, 0.740478515625, 0.836334228515625, 0.93218994140625, 1.028045654296875, 1.1239013671875, 1.219757080078125, 1.31561279296875, 1.411468505859375, 1.50732421875, 1.603179931640625, 1.69903564453125, 1.794891357421875, 1.8907470703125, 1.986602783203125, 2.08245849609375, 2.178314208984375, 2.274169921875, 2.370025634765625, 2.46588134765625, 2.561737060546875, 2.6575927734375, 2.753448486328125, 2.84930419921875, 2.945159912109375, 3.041015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 6.0, 10.0, 6.0, 5.0, 8.0, 16.0, 23.0, 20.0, 30.0, 48.0, 39.0, 56.0, 69.0, 88.0, 92.0, 72.0, 78.0, 65.0, 50.0, 49.0, 34.0, 31.0, 21.0, 20.0, 11.0, 10.0, 13.0, 2.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.82470703125, -0.8004913330078125, -0.776275634765625, -0.7520599365234375, -0.72784423828125, -0.7036285400390625, -0.679412841796875, -0.6551971435546875, -0.6309814453125, -0.6067657470703125, -0.582550048828125, -0.5583343505859375, -0.53411865234375, -0.5099029541015625, -0.485687255859375, -0.4614715576171875, -0.437255859375, -0.4130401611328125, -0.388824462890625, -0.3646087646484375, -0.34039306640625, -0.3161773681640625, -0.291961669921875, -0.2677459716796875, -0.2435302734375, -0.2193145751953125, -0.195098876953125, -0.1708831787109375, -0.14666748046875, -0.1224517822265625, -0.098236083984375, -0.0740203857421875, -0.0498046875, -0.0255889892578125, -0.001373291015625, 0.0228424072265625, 0.04705810546875, 0.0712738037109375, 0.095489501953125, 0.1197052001953125, 0.1439208984375, 0.1681365966796875, 0.192352294921875, 0.2165679931640625, 0.24078369140625, 0.2649993896484375, 0.289215087890625, 0.3134307861328125, 0.337646484375, 0.3618621826171875, 0.386077880859375, 0.4102935791015625, 0.43450927734375, 0.4587249755859375, 0.482940673828125, 0.5071563720703125, 0.5313720703125, 0.5555877685546875, 0.579803466796875, 0.6040191650390625, 0.62823486328125, 0.6524505615234375, 0.676666259765625, 0.7008819580078125, 0.72509765625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 7.0, 4.0, 10.0, 8.0, 17.0, 12.0, 12.0, 10.0, 26.0, 31.0, 43.0, 38.0, 59.0, 55.0, 52.0, 67.0, 62.0, 64.0, 62.0, 73.0, 43.0, 46.0, 49.0, 23.0, 27.0, 14.0, 17.0, 17.0, 8.0, 8.0, 5.0, 8.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.794615745544434, -4.641088008880615, -4.487559795379639, -4.33403205871582, -4.180503845214844, -4.026976108551025, -3.873448371887207, -3.7199203968048096, -3.566392421722412, -3.4128644466400146, -3.259336471557617, -3.105808734893799, -2.9522807598114014, -2.798752784729004, -2.6452250480651855, -2.491697072982788, -2.3381690979003906, -2.184641122817993, -2.0311131477355957, -1.8775854110717773, -1.7240574359893799, -1.5705294609069824, -1.4170016050338745, -1.2634737491607666, -1.1099457740783691, -0.9564178586006165, -0.8028899431228638, -0.6493620276451111, -0.4958341121673584, -0.3423061966896057, -0.18877828121185303, -0.03525042533874512, 0.11827707290649414, 0.2718049883842468, 0.4253329038619995, 0.5788608193397522, 0.7323887348175049, 0.8859166502952576, 1.0394445657730103, 1.1929724216461182, 1.3465003967285156, 1.500028371810913, 1.653556227684021, 1.807084083557129, 1.9606120586395264, 2.114140033721924, 2.267667770385742, 2.4211957454681396, 2.574723720550537, 2.7282516956329346, 2.881779670715332, 3.0353074073791504, 3.188835382461548, 3.3423633575439453, 3.4958910942077637, 3.649419069290161, 3.8029470443725586, 3.956475019454956, 4.1100029945373535, 4.263530731201172, 4.417058944702148, 4.570586681365967, 4.724114418029785, 4.877642631530762, 5.03117036819458]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 1.0, 3.0, 11.0, 6.0, 9.0, 13.0, 8.0, 18.0, 20.0, 20.0, 15.0, 21.0, 25.0, 30.0, 34.0, 28.0, 37.0, 45.0, 42.0, 31.0, 51.0, 43.0, 44.0, 35.0, 39.0, 37.0, 31.0, 34.0, 33.0, 32.0, 32.0, 19.0, 17.0, 23.0, 9.0, 24.0, 15.0, 16.0, 10.0, 8.0, 7.0, 6.0, 4.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.220881462097168, -3.1128604412078857, -3.0048394203186035, -2.8968183994293213, -2.788797378540039, -2.680776357650757, -2.5727553367614746, -2.4647345542907715, -2.35671329498291, -2.248692274093628, -2.1406712532043457, -2.0326502323150635, -1.9246292114257812, -1.816608190536499, -1.7085872888565063, -1.6005662679672241, -1.4925453662872314, -1.3845243453979492, -1.276503324508667, -1.1684823036193848, -1.0604612827301025, -0.9524403214454651, -0.8444193601608276, -0.7363983392715454, -0.6283773183822632, -0.520356297492981, -0.4123353064060211, -0.3043143153190613, -0.19629329442977905, -0.08827227354049683, 0.019748687744140625, 0.12776970863342285, 0.23579049110412598, 0.3438115119934082, 0.45183250308036804, 0.5598534941673279, 0.6678745150566101, 0.7758955359458923, 0.8839164972305298, 0.991937518119812, 1.0999585390090942, 1.2079795598983765, 1.3160005807876587, 1.4240214824676514, 1.5320425033569336, 1.6400635242462158, 1.748084545135498, 1.8561055660247803, 1.9641265869140625, 2.0721476078033447, 2.180168628692627, 2.288189649581909, 2.3962106704711914, 2.5042316913604736, 2.612252712249756, 2.720273494720459, 2.8282947540283203, 2.9363157749176025, 3.0443367958068848, 3.152357816696167, 3.260378837585449, 3.3683998584747314, 3.4764208793640137, 3.584441661834717, 3.692462682723999]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 10.0, 14.0, 21.0, 31.0, 49.0, 65.0, 80.0, 134.0, 198.0, 286.0, 460.0, 659.0, 1047.0, 1763.0, 2975.0, 5431.0, 10173.0, 20251.0, 41415.0, 86450.0, 162322.0, 231706.0, 214770.0, 133357.0, 67724.0, 32332.0, 15814.0, 8107.0, 4298.0, 2532.0, 1483.0, 909.0, 532.0, 357.0, 259.0, 156.0, 114.0, 77.0, 49.0, 49.0, 31.0, 16.0, 10.0, 8.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.81524658203125, -4.6422119140625, -4.46917724609375, -4.296142578125, -4.12310791015625, -3.9500732421875, -3.77703857421875, -3.60400390625, -3.43096923828125, -3.2579345703125, -3.08489990234375, -2.911865234375, -2.73883056640625, -2.5657958984375, -2.39276123046875, -2.2197265625, -2.04669189453125, -1.8736572265625, -1.70062255859375, -1.527587890625, -1.35455322265625, -1.1815185546875, -1.00848388671875, -0.83544921875, -0.66241455078125, -0.4893798828125, -0.31634521484375, -0.143310546875, 0.02972412109375, 0.2027587890625, 0.37579345703125, 0.548828125, 0.72186279296875, 0.8948974609375, 1.06793212890625, 1.240966796875, 1.41400146484375, 1.5870361328125, 1.76007080078125, 1.93310546875, 2.10614013671875, 2.2791748046875, 2.45220947265625, 2.625244140625, 2.79827880859375, 2.9713134765625, 3.14434814453125, 3.3173828125, 3.49041748046875, 3.6634521484375, 3.83648681640625, 4.009521484375, 4.18255615234375, 4.3555908203125, 4.52862548828125, 4.70166015625, 4.87469482421875, 5.0477294921875, 5.22076416015625, 5.393798828125, 5.56683349609375, 5.7398681640625, 5.91290283203125, 6.0859375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 3.0, 9.0, 7.0, 9.0, 10.0, 13.0, 13.0, 23.0, 13.0, 22.0, 31.0, 33.0, 38.0, 29.0, 38.0, 41.0, 60.0, 38.0, 40.0, 43.0, 36.0, 42.0, 38.0, 35.0, 35.0, 36.0, 28.0, 34.0, 28.0, 18.0, 22.0, 15.0, 24.0, 15.0, 11.0, 7.0, 9.0, 11.0, 10.0, 4.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.587890625, -3.47760009765625, -3.3673095703125, -3.25701904296875, -3.146728515625, -3.03643798828125, -2.9261474609375, -2.81585693359375, -2.70556640625, -2.59527587890625, -2.4849853515625, -2.37469482421875, -2.264404296875, -2.15411376953125, -2.0438232421875, -1.93353271484375, -1.8232421875, -1.71295166015625, -1.6026611328125, -1.49237060546875, -1.382080078125, -1.27178955078125, -1.1614990234375, -1.05120849609375, -0.94091796875, -0.83062744140625, -0.7203369140625, -0.61004638671875, -0.499755859375, -0.38946533203125, -0.2791748046875, -0.16888427734375, -0.05859375, 0.05169677734375, 0.1619873046875, 0.27227783203125, 0.382568359375, 0.49285888671875, 0.6031494140625, 0.71343994140625, 0.82373046875, 0.93402099609375, 1.0443115234375, 1.15460205078125, 1.264892578125, 1.37518310546875, 1.4854736328125, 1.59576416015625, 1.7060546875, 1.81634521484375, 1.9266357421875, 2.03692626953125, 2.147216796875, 2.25750732421875, 2.3677978515625, 2.47808837890625, 2.58837890625, 2.69866943359375, 2.8089599609375, 2.91925048828125, 3.029541015625, 3.13983154296875, 3.2501220703125, 3.36041259765625, 3.470703125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 15.0, 10.0, 19.0, 19.0, 47.0, 90.0, 132.0, 202.0, 343.0, 623.0, 1029.0, 1859.0, 3499.0, 6950.0, 13189.0, 26145.0, 51995.0, 99263.0, 168813.0, 220589.0, 194317.0, 123019.0, 66445.0, 33999.0, 17189.0, 8864.0, 4372.0, 2387.0, 1315.0, 706.0, 424.0, 259.0, 143.0, 110.0, 56.0, 42.0, 27.0, 18.0, 5.0, 10.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2890625, -4.1492919921875, -4.009521484375, -3.8697509765625, -3.72998046875, -3.5902099609375, -3.450439453125, -3.3106689453125, -3.1708984375, -3.0311279296875, -2.891357421875, -2.7515869140625, -2.61181640625, -2.4720458984375, -2.332275390625, -2.1925048828125, -2.052734375, -1.9129638671875, -1.773193359375, -1.6334228515625, -1.49365234375, -1.3538818359375, -1.214111328125, -1.0743408203125, -0.9345703125, -0.7947998046875, -0.655029296875, -0.5152587890625, -0.37548828125, -0.2357177734375, -0.095947265625, 0.0438232421875, 0.18359375, 0.3233642578125, 0.463134765625, 0.6029052734375, 0.74267578125, 0.8824462890625, 1.022216796875, 1.1619873046875, 1.3017578125, 1.4415283203125, 1.581298828125, 1.7210693359375, 1.86083984375, 2.0006103515625, 2.140380859375, 2.2801513671875, 2.419921875, 2.5596923828125, 2.699462890625, 2.8392333984375, 2.97900390625, 3.1187744140625, 3.258544921875, 3.3983154296875, 3.5380859375, 3.6778564453125, 3.817626953125, 3.9573974609375, 4.09716796875, 4.2369384765625, 4.376708984375, 4.5164794921875, 4.65625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 4.0, 2.0, 10.0, 10.0, 9.0, 11.0, 9.0, 14.0, 13.0, 22.0, 25.0, 23.0, 26.0, 34.0, 35.0, 36.0, 26.0, 37.0, 33.0, 34.0, 30.0, 32.0, 36.0, 35.0, 43.0, 34.0, 44.0, 26.0, 36.0, 30.0, 23.0, 30.0, 25.0, 21.0, 22.0, 17.0, 16.0, 11.0, 11.0, 7.0, 8.0, 12.0, 11.0, 6.0, 7.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9296875, -1.868804931640625, -1.80792236328125, -1.747039794921875, -1.6861572265625, -1.625274658203125, -1.56439208984375, -1.503509521484375, -1.442626953125, -1.381744384765625, -1.32086181640625, -1.259979248046875, -1.1990966796875, -1.138214111328125, -1.07733154296875, -1.016448974609375, -0.95556640625, -0.894683837890625, -0.83380126953125, -0.772918701171875, -0.7120361328125, -0.651153564453125, -0.59027099609375, -0.529388427734375, -0.468505859375, -0.407623291015625, -0.34674072265625, -0.285858154296875, -0.2249755859375, -0.164093017578125, -0.10321044921875, -0.042327880859375, 0.0185546875, 0.079437255859375, 0.14031982421875, 0.201202392578125, 0.2620849609375, 0.322967529296875, 0.38385009765625, 0.444732666015625, 0.505615234375, 0.566497802734375, 0.62738037109375, 0.688262939453125, 0.7491455078125, 0.810028076171875, 0.87091064453125, 0.931793212890625, 0.99267578125, 1.053558349609375, 1.11444091796875, 1.175323486328125, 1.2362060546875, 1.297088623046875, 1.35797119140625, 1.418853759765625, 1.479736328125, 1.540618896484375, 1.60150146484375, 1.662384033203125, 1.7232666015625, 1.784149169921875, 1.84503173828125, 1.905914306640625, 1.966796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 10.0, 11.0, 15.0, 13.0, 24.0, 49.0, 77.0, 114.0, 165.0, 249.0, 336.0, 535.0, 799.0, 1286.0, 1868.0, 3075.0, 5027.0, 8399.0, 14674.0, 26228.0, 48538.0, 91271.0, 163478.0, 227029.0, 196283.0, 117360.0, 62763.0, 33218.0, 18469.0, 10562.0, 6143.0, 3829.0, 2251.0, 1566.0, 932.0, 649.0, 412.0, 266.0, 193.0, 117.0, 81.0, 69.0, 53.0, 21.0, 15.0, 18.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-3.861328125, -3.75006103515625, -3.6387939453125, -3.52752685546875, -3.416259765625, -3.30499267578125, -3.1937255859375, -3.08245849609375, -2.97119140625, -2.85992431640625, -2.7486572265625, -2.63739013671875, -2.526123046875, -2.41485595703125, -2.3035888671875, -2.19232177734375, -2.0810546875, -1.96978759765625, -1.8585205078125, -1.74725341796875, -1.635986328125, -1.52471923828125, -1.4134521484375, -1.30218505859375, -1.19091796875, -1.07965087890625, -0.9683837890625, -0.85711669921875, -0.745849609375, -0.63458251953125, -0.5233154296875, -0.41204833984375, -0.30078125, -0.18951416015625, -0.0782470703125, 0.03302001953125, 0.144287109375, 0.25555419921875, 0.3668212890625, 0.47808837890625, 0.58935546875, 0.70062255859375, 0.8118896484375, 0.92315673828125, 1.034423828125, 1.14569091796875, 1.2569580078125, 1.36822509765625, 1.4794921875, 1.59075927734375, 1.7020263671875, 1.81329345703125, 1.924560546875, 2.03582763671875, 2.1470947265625, 2.25836181640625, 2.36962890625, 2.48089599609375, 2.5921630859375, 2.70343017578125, 2.814697265625, 2.92596435546875, 3.0372314453125, 3.14849853515625, 3.259765625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 14.0, 14.0, 17.0, 18.0, 24.0, 35.0, 44.0, 33.0, 54.0, 80.0, 98.0, 99.0, 90.0, 74.0, 68.0, 57.0, 38.0, 35.0, 21.0, 19.0, 12.0, 13.0, 13.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005345344543457031, -0.000519976019859314, -0.0005054175853729248, -0.0004908591508865356, -0.0004763007164001465, -0.0004617422819137573, -0.00044718384742736816, -0.000432625412940979, -0.00041806697845458984, -0.0004035085439682007, -0.0003889501094818115, -0.00037439167499542236, -0.0003598332405090332, -0.00034527480602264404, -0.0003307163715362549, -0.0003161579370498657, -0.00030159950256347656, -0.0002870410680770874, -0.00027248263359069824, -0.0002579241991043091, -0.00024336576461791992, -0.00022880733013153076, -0.0002142488956451416, -0.00019969046115875244, -0.00018513202667236328, -0.00017057359218597412, -0.00015601515769958496, -0.0001414567232131958, -0.00012689828872680664, -0.00011233985424041748, -9.778141975402832e-05, -8.322298526763916e-05, -6.866455078125e-05, -5.410611629486084e-05, -3.954768180847168e-05, -2.498924732208252e-05, -1.043081283569336e-05, 4.127621650695801e-06, 1.868605613708496e-05, 3.324449062347412e-05, 4.780292510986328e-05, 6.236135959625244e-05, 7.69197940826416e-05, 9.147822856903076e-05, 0.00010603666305541992, 0.00012059509754180908, 0.00013515353202819824, 0.0001497119665145874, 0.00016427040100097656, 0.00017882883548736572, 0.00019338726997375488, 0.00020794570446014404, 0.0002225041389465332, 0.00023706257343292236, 0.0002516210079193115, 0.0002661794424057007, 0.00028073787689208984, 0.000295296311378479, 0.00030985474586486816, 0.0003244131803512573, 0.0003389716148376465, 0.00035353004932403564, 0.0003680884838104248, 0.00038264691829681396, 0.0003972053527832031]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 12.0, 15.0, 17.0, 21.0, 50.0, 66.0, 119.0, 195.0, 350.0, 632.0, 1081.0, 1997.0, 3825.0, 7287.0, 14828.0, 29686.0, 63681.0, 133223.0, 232924.0, 251424.0, 157896.0, 76993.0, 36277.0, 17471.0, 8588.0, 4542.0, 2387.0, 1228.0, 740.0, 397.0, 263.0, 127.0, 75.0, 40.0, 28.0, 24.0, 9.0, 10.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.07421875, -3.954833984375, -3.83544921875, -3.716064453125, -3.5966796875, -3.477294921875, -3.35791015625, -3.238525390625, -3.119140625, -2.999755859375, -2.88037109375, -2.760986328125, -2.6416015625, -2.522216796875, -2.40283203125, -2.283447265625, -2.1640625, -2.044677734375, -1.92529296875, -1.805908203125, -1.6865234375, -1.567138671875, -1.44775390625, -1.328369140625, -1.208984375, -1.089599609375, -0.97021484375, -0.850830078125, -0.7314453125, -0.612060546875, -0.49267578125, -0.373291015625, -0.25390625, -0.134521484375, -0.01513671875, 0.104248046875, 0.2236328125, 0.343017578125, 0.46240234375, 0.581787109375, 0.701171875, 0.820556640625, 0.93994140625, 1.059326171875, 1.1787109375, 1.298095703125, 1.41748046875, 1.536865234375, 1.65625, 1.775634765625, 1.89501953125, 2.014404296875, 2.1337890625, 2.253173828125, 2.37255859375, 2.491943359375, 2.611328125, 2.730712890625, 2.85009765625, 2.969482421875, 3.0888671875, 3.208251953125, 3.32763671875, 3.447021484375, 3.56640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 6.0, 6.0, 14.0, 6.0, 16.0, 15.0, 17.0, 24.0, 28.0, 30.0, 47.0, 43.0, 62.0, 46.0, 73.0, 60.0, 58.0, 62.0, 54.0, 47.0, 41.0, 46.0, 36.0, 31.0, 25.0, 20.0, 19.0, 19.0, 15.0, 4.0, 4.0, 8.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.986328125, -0.9546661376953125, -0.923004150390625, -0.8913421630859375, -0.85968017578125, -0.8280181884765625, -0.796356201171875, -0.7646942138671875, -0.7330322265625, -0.7013702392578125, -0.669708251953125, -0.6380462646484375, -0.60638427734375, -0.5747222900390625, -0.543060302734375, -0.5113983154296875, -0.479736328125, -0.4480743408203125, -0.416412353515625, -0.3847503662109375, -0.35308837890625, -0.3214263916015625, -0.289764404296875, -0.2581024169921875, -0.2264404296875, -0.1947784423828125, -0.163116455078125, -0.1314544677734375, -0.09979248046875, -0.0681304931640625, -0.036468505859375, -0.0048065185546875, 0.02685546875, 0.0585174560546875, 0.090179443359375, 0.1218414306640625, 0.15350341796875, 0.1851654052734375, 0.216827392578125, 0.2484893798828125, 0.2801513671875, 0.3118133544921875, 0.343475341796875, 0.3751373291015625, 0.40679931640625, 0.4384613037109375, 0.470123291015625, 0.5017852783203125, 0.533447265625, 0.5651092529296875, 0.596771240234375, 0.6284332275390625, 0.66009521484375, 0.6917572021484375, 0.723419189453125, 0.7550811767578125, 0.7867431640625, 0.8184051513671875, 0.850067138671875, 0.8817291259765625, 0.91339111328125, 0.9450531005859375, 0.976715087890625, 1.0083770751953125, 1.0400390625]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 3.0, 6.0, 10.0, 12.0, 15.0, 21.0, 11.0, 20.0, 28.0, 35.0, 45.0, 47.0, 59.0, 67.0, 77.0, 64.0, 70.0, 63.0, 63.0, 57.0, 56.0, 44.0, 25.0, 26.0, 17.0, 7.0, 10.0, 12.0, 8.0, 3.0, 2.0, 4.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.062572479248047, -5.896477699279785, -5.730382919311523, -5.564288139343262, -5.398193359375, -5.232098579406738, -5.066003799438477, -4.899909019470215, -4.733814239501953, -4.567719459533691, -4.40162467956543, -4.235529899597168, -4.069435119628906, -3.9033403396606445, -3.7372453212738037, -3.571150541305542, -3.405055522918701, -3.2389607429504395, -3.0728659629821777, -2.906771183013916, -2.7406764030456543, -2.5745816230773926, -2.4084866046905518, -2.24239182472229, -2.0762970447540283, -1.9102022647857666, -1.7441074848175049, -1.5780125856399536, -1.411917805671692, -1.2458230257034302, -1.079728126525879, -0.9136333465576172, -0.7475390434265137, -0.581444263458252, -0.41534942388534546, -0.24925461411476135, -0.08315980434417725, 0.08293497562408447, 0.24902981519699097, 0.41512465476989746, 0.5812194347381592, 0.7473142147064209, 0.9134090542793274, 1.0795038938522339, 1.2455986738204956, 1.4116934537887573, 1.5777883529663086, 1.7438831329345703, 1.909977912902832, 2.0760726928710938, 2.2421674728393555, 2.408262252807617, 2.574357032775879, 2.7404518127441406, 2.9065468311309814, 3.072641611099243, 3.238736391067505, 3.4048311710357666, 3.5709259510040283, 3.73702073097229, 3.903115749359131, 4.069210529327393, 4.235305309295654, 4.401400089263916, 4.567494869232178]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 10.0, 9.0, 9.0, 15.0, 12.0, 18.0, 18.0, 25.0, 33.0, 30.0, 27.0, 38.0, 49.0, 42.0, 38.0, 42.0, 45.0, 39.0, 43.0, 49.0, 47.0, 40.0, 28.0, 33.0, 34.0, 37.0, 25.0, 22.0, 17.0, 23.0, 17.0, 13.0, 12.0, 19.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.6480607986450195, -3.532437324523926, -3.416813611984253, -3.30118989944458, -3.1855664253234863, -3.0699429512023926, -2.9543192386627197, -2.838695526123047, -2.723072052001953, -2.6074485778808594, -2.4918248653411865, -2.3762011528015137, -2.26057767868042, -2.144954204559326, -2.0293304920196533, -1.91370689868927, -1.7980833053588867, -1.6824597120285034, -1.5668361186981201, -1.4512125253677368, -1.3355889320373535, -1.2199653387069702, -1.104341745376587, -0.9887181520462036, -0.8730945587158203, -0.757470965385437, -0.6418473720550537, -0.5262237787246704, -0.4106001853942871, -0.2949765920639038, -0.1793529987335205, -0.06372940540313721, 0.05189394950866699, 0.1675175428390503, 0.2831411361694336, 0.3987647294998169, 0.5143883228302002, 0.6300119161605835, 0.7456355094909668, 0.8612591028213501, 0.9768826961517334, 1.0925062894821167, 1.2081298828125, 1.3237534761428833, 1.4393770694732666, 1.55500066280365, 1.6706242561340332, 1.7862478494644165, 1.9018714427947998, 2.0174951553344727, 2.1331186294555664, 2.24874210357666, 2.364365816116333, 2.479989528656006, 2.5956130027770996, 2.7112364768981934, 2.826860189437866, 2.942483901977539, 3.058107376098633, 3.1737308502197266, 3.2893545627593994, 3.4049782752990723, 3.520601749420166, 3.6362252235412598, 3.7518489360809326]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 7.0, 6.0, 5.0, 12.0, 12.0, 17.0, 36.0, 40.0, 61.0, 101.0, 119.0, 219.0, 300.0, 442.0, 691.0, 1069.0, 1692.0, 2859.0, 4726.0, 8430.0, 15661.0, 31599.0, 73165.0, 206444.0, 662730.0, 1445081.0, 1118256.0, 391130.0, 127287.0, 49833.0, 23559.0, 12152.0, 6728.0, 3852.0, 2367.0, 1318.0, 823.0, 500.0, 321.0, 222.0, 112.0, 112.0, 57.0, 34.0, 32.0, 22.0, 14.0, 12.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.62109375, -5.4495849609375, -5.278076171875, -5.1065673828125, -4.93505859375, -4.7635498046875, -4.592041015625, -4.4205322265625, -4.2490234375, -4.0775146484375, -3.906005859375, -3.7344970703125, -3.56298828125, -3.3914794921875, -3.219970703125, -3.0484619140625, -2.876953125, -2.7054443359375, -2.533935546875, -2.3624267578125, -2.19091796875, -2.0194091796875, -1.847900390625, -1.6763916015625, -1.5048828125, -1.3333740234375, -1.161865234375, -0.9903564453125, -0.81884765625, -0.6473388671875, -0.475830078125, -0.3043212890625, -0.1328125, 0.0386962890625, 0.210205078125, 0.3817138671875, 0.55322265625, 0.7247314453125, 0.896240234375, 1.0677490234375, 1.2392578125, 1.4107666015625, 1.582275390625, 1.7537841796875, 1.92529296875, 2.0968017578125, 2.268310546875, 2.4398193359375, 2.611328125, 2.7828369140625, 2.954345703125, 3.1258544921875, 3.29736328125, 3.4688720703125, 3.640380859375, 3.8118896484375, 3.9833984375, 4.1549072265625, 4.326416015625, 4.4979248046875, 4.66943359375, 4.8409423828125, 5.012451171875, 5.1839599609375, 5.35546875]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 5.0, 12.0, 11.0, 12.0, 19.0, 23.0, 19.0, 30.0, 32.0, 47.0, 43.0, 32.0, 47.0, 54.0, 59.0, 53.0, 47.0, 50.0, 49.0, 48.0, 46.0, 42.0, 46.0, 30.0, 19.0, 20.0, 19.0, 21.0, 17.0, 12.0, 13.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.814422607421875, -2.72064208984375, -2.626861572265625, -2.5330810546875, -2.439300537109375, -2.34552001953125, -2.251739501953125, -2.157958984375, -2.064178466796875, -1.97039794921875, -1.876617431640625, -1.7828369140625, -1.689056396484375, -1.59527587890625, -1.501495361328125, -1.40771484375, -1.313934326171875, -1.22015380859375, -1.126373291015625, -1.0325927734375, -0.938812255859375, -0.84503173828125, -0.751251220703125, -0.657470703125, -0.563690185546875, -0.46990966796875, -0.376129150390625, -0.2823486328125, -0.188568115234375, -0.09478759765625, -0.001007080078125, 0.0927734375, 0.186553955078125, 0.28033447265625, 0.374114990234375, 0.4678955078125, 0.561676025390625, 0.65545654296875, 0.749237060546875, 0.843017578125, 0.936798095703125, 1.03057861328125, 1.124359130859375, 1.2181396484375, 1.311920166015625, 1.40570068359375, 1.499481201171875, 1.59326171875, 1.687042236328125, 1.78082275390625, 1.874603271484375, 1.9683837890625, 2.062164306640625, 2.15594482421875, 2.249725341796875, 2.343505859375, 2.437286376953125, 2.53106689453125, 2.624847412109375, 2.7186279296875, 2.812408447265625, 2.90618896484375, 2.999969482421875, 3.09375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 8.0, 7.0, 3.0, 11.0, 13.0, 16.0, 27.0, 52.0, 88.0, 147.0, 225.0, 387.0, 569.0, 976.0, 1610.0, 2516.0, 4249.0, 7453.0, 13138.0, 24380.0, 46885.0, 96595.0, 217251.0, 524571.0, 1115773.0, 1147667.0, 554049.0, 227201.0, 101554.0, 48815.0, 25135.0, 13589.0, 7844.0, 4516.0, 2667.0, 1683.0, 938.0, 646.0, 382.0, 233.0, 137.0, 104.0, 49.0, 38.0, 31.0, 20.0, 17.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-5.01171875, -4.8599853515625, -4.708251953125, -4.5565185546875, -4.40478515625, -4.2530517578125, -4.101318359375, -3.9495849609375, -3.7978515625, -3.6461181640625, -3.494384765625, -3.3426513671875, -3.19091796875, -3.0391845703125, -2.887451171875, -2.7357177734375, -2.583984375, -2.4322509765625, -2.280517578125, -2.1287841796875, -1.97705078125, -1.8253173828125, -1.673583984375, -1.5218505859375, -1.3701171875, -1.2183837890625, -1.066650390625, -0.9149169921875, -0.76318359375, -0.6114501953125, -0.459716796875, -0.3079833984375, -0.15625, -0.0045166015625, 0.147216796875, 0.2989501953125, 0.45068359375, 0.6024169921875, 0.754150390625, 0.9058837890625, 1.0576171875, 1.2093505859375, 1.361083984375, 1.5128173828125, 1.66455078125, 1.8162841796875, 1.968017578125, 2.1197509765625, 2.271484375, 2.4232177734375, 2.574951171875, 2.7266845703125, 2.87841796875, 3.0301513671875, 3.181884765625, 3.3336181640625, 3.4853515625, 3.6370849609375, 3.788818359375, 3.9405517578125, 4.09228515625, 4.2440185546875, 4.395751953125, 4.5474853515625, 4.69921875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 6.0, 8.0, 3.0, 4.0, 7.0, 13.0, 13.0, 18.0, 13.0, 16.0, 18.0, 24.0, 45.0, 50.0, 60.0, 83.0, 118.0, 129.0, 153.0, 210.0, 271.0, 284.0, 328.0, 328.0, 307.0, 265.0, 261.0, 220.0, 165.0, 135.0, 103.0, 92.0, 73.0, 57.0, 53.0, 37.0, 28.0, 22.0, 18.0, 14.0, 8.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2138671875, -1.1692657470703125, -1.124664306640625, -1.0800628662109375, -1.03546142578125, -0.9908599853515625, -0.946258544921875, -0.9016571044921875, -0.8570556640625, -0.8124542236328125, -0.767852783203125, -0.7232513427734375, -0.67864990234375, -0.6340484619140625, -0.589447021484375, -0.5448455810546875, -0.500244140625, -0.4556427001953125, -0.411041259765625, -0.3664398193359375, -0.32183837890625, -0.2772369384765625, -0.232635498046875, -0.1880340576171875, -0.1434326171875, -0.0988311767578125, -0.054229736328125, -0.0096282958984375, 0.03497314453125, 0.0795745849609375, 0.124176025390625, 0.1687774658203125, 0.21337890625, 0.2579803466796875, 0.302581787109375, 0.3471832275390625, 0.39178466796875, 0.4363861083984375, 0.480987548828125, 0.5255889892578125, 0.5701904296875, 0.6147918701171875, 0.659393310546875, 0.7039947509765625, 0.74859619140625, 0.7931976318359375, 0.837799072265625, 0.8824005126953125, 0.927001953125, 0.9716033935546875, 1.016204833984375, 1.0608062744140625, 1.10540771484375, 1.1500091552734375, 1.194610595703125, 1.2392120361328125, 1.2838134765625, 1.3284149169921875, 1.373016357421875, 1.4176177978515625, 1.46221923828125, 1.5068206787109375, 1.551422119140625, 1.5960235595703125, 1.640625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 12.0, 18.0, 20.0, 24.0, 30.0, 32.0, 55.0, 71.0, 65.0, 86.0, 88.0, 77.0, 91.0, 62.0, 45.0, 56.0, 44.0, 17.0, 19.0, 11.0, 12.0, 13.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5699920654296875, -5.396307468414307, -5.222622394561768, -5.048937797546387, -4.875252723693848, -4.701568126678467, -4.527883529663086, -4.354198455810547, -4.180513381958008, -4.006828784942627, -3.833143711090088, -3.659459114074707, -3.485774040222168, -3.312089443206787, -3.138404607772827, -2.964719772338867, -2.7910351753234863, -2.6173503398895264, -2.4436655044555664, -2.2699809074401855, -2.0962958335876465, -1.922611117362976, -1.7489264011383057, -1.5752415657043457, -1.4015567302703857, -1.2278718948364258, -1.0541870594024658, -0.8805023431777954, -0.7068175077438354, -0.5331326723098755, -0.3594479560852051, -0.18576312065124512, -0.01207876205444336, 0.1616060435771942, 0.3352908492088318, 0.508975625038147, 0.6826604604721069, 0.8563452959060669, 1.0300300121307373, 1.2037148475646973, 1.3773996829986572, 1.5510845184326172, 1.7247693538665771, 1.8984540700912476, 2.072138786315918, 2.245823860168457, 2.419508457183838, 2.593193292617798, 2.766878128051758, 2.9405629634857178, 3.1142477989196777, 3.2879323959350586, 3.4616174697875977, 3.6353020668029785, 3.8089869022369385, 3.9826717376708984, 4.1563568115234375, 4.330041408538818, 4.503726482391357, 4.677411079406738, 4.851096153259277, 5.024780750274658, 5.198465347290039, 5.372150421142578, 5.545835018157959]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 4.0, 9.0, 15.0, 19.0, 12.0, 18.0, 16.0, 23.0, 25.0, 29.0, 26.0, 23.0, 38.0, 39.0, 31.0, 44.0, 38.0, 44.0, 45.0, 40.0, 40.0, 38.0, 47.0, 35.0, 29.0, 27.0, 32.0, 30.0, 18.0, 22.0, 27.0, 18.0, 16.0, 13.0, 12.0, 12.0, 8.0, 9.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.9784116744995117, -2.8841192722320557, -2.7898266315460205, -2.6955342292785645, -2.6012418270111084, -2.5069494247436523, -2.412656784057617, -2.318364381790161, -2.224071979522705, -2.129779577255249, -2.035486936569214, -1.9411945343017578, -1.8469021320343018, -1.7526096105575562, -1.6583170890808105, -1.5640246868133545, -1.4697320461273193, -1.3754395246505737, -1.2811471223831177, -1.186854600906372, -1.092562198638916, -0.9982696771621704, -0.9039771556854248, -0.809684693813324, -0.7153922319412231, -0.6210997700691223, -0.5268073081970215, -0.4325147867202759, -0.33822232484817505, -0.24392986297607422, -0.1496373414993286, -0.05534487962722778, 0.038947343826293945, 0.13323982059955597, 0.227532297372818, 0.3218247890472412, 0.41611725091934204, 0.5104097127914429, 0.6047022342681885, 0.6989946961402893, 0.7932871580123901, 0.887579619884491, 0.9818720817565918, 1.0761646032333374, 1.170457124710083, 1.264749526977539, 1.3590420484542847, 1.4533345699310303, 1.5476269721984863, 1.641919493675232, 1.736211895942688, 1.8305044174194336, 1.9247968196868896, 2.0190892219543457, 2.113381862640381, 2.207674264907837, 2.301966667175293, 2.396259069442749, 2.490551710128784, 2.5848441123962402, 2.6791365146636963, 2.7734289169311523, 2.8677215576171875, 2.9620139598846436, 3.0563066005706787]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 12.0, 9.0, 16.0, 22.0, 37.0, 64.0, 76.0, 130.0, 179.0, 299.0, 456.0, 827.0, 1397.0, 2574.0, 4862.0, 9628.0, 19404.0, 39683.0, 80200.0, 149561.0, 223384.0, 220635.0, 143407.0, 76361.0, 37352.0, 18359.0, 9014.0, 4729.0, 2371.0, 1409.0, 807.0, 483.0, 293.0, 168.0, 105.0, 83.0, 49.0, 34.0, 27.0, 13.0, 10.0, 9.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.978515625, -2.888153076171875, -2.79779052734375, -2.707427978515625, -2.6170654296875, -2.526702880859375, -2.43634033203125, -2.345977783203125, -2.255615234375, -2.165252685546875, -2.07489013671875, -1.984527587890625, -1.8941650390625, -1.803802490234375, -1.71343994140625, -1.623077392578125, -1.53271484375, -1.442352294921875, -1.35198974609375, -1.261627197265625, -1.1712646484375, -1.080902099609375, -0.99053955078125, -0.900177001953125, -0.809814453125, -0.719451904296875, -0.62908935546875, -0.538726806640625, -0.4483642578125, -0.358001708984375, -0.26763916015625, -0.177276611328125, -0.0869140625, 0.003448486328125, 0.09381103515625, 0.184173583984375, 0.2745361328125, 0.364898681640625, 0.45526123046875, 0.545623779296875, 0.635986328125, 0.726348876953125, 0.81671142578125, 0.907073974609375, 0.9974365234375, 1.087799072265625, 1.17816162109375, 1.268524169921875, 1.35888671875, 1.449249267578125, 1.53961181640625, 1.629974365234375, 1.7203369140625, 1.810699462890625, 1.90106201171875, 1.991424560546875, 2.081787109375, 2.172149658203125, 2.26251220703125, 2.352874755859375, 2.4432373046875, 2.533599853515625, 2.62396240234375, 2.714324951171875, 2.8046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 7.0, 8.0, 14.0, 15.0, 16.0, 12.0, 19.0, 20.0, 17.0, 29.0, 33.0, 28.0, 30.0, 41.0, 39.0, 48.0, 52.0, 49.0, 35.0, 38.0, 38.0, 43.0, 41.0, 33.0, 38.0, 38.0, 31.0, 35.0, 28.0, 14.0, 21.0, 25.0, 17.0, 6.0, 8.0, 6.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.681640625, -3.574981689453125, -3.46832275390625, -3.361663818359375, -3.2550048828125, -3.148345947265625, -3.04168701171875, -2.935028076171875, -2.828369140625, -2.721710205078125, -2.61505126953125, -2.508392333984375, -2.4017333984375, -2.295074462890625, -2.18841552734375, -2.081756591796875, -1.97509765625, -1.868438720703125, -1.76177978515625, -1.655120849609375, -1.5484619140625, -1.441802978515625, -1.33514404296875, -1.228485107421875, -1.121826171875, -1.015167236328125, -0.90850830078125, -0.801849365234375, -0.6951904296875, -0.588531494140625, -0.48187255859375, -0.375213623046875, -0.2685546875, -0.161895751953125, -0.05523681640625, 0.051422119140625, 0.1580810546875, 0.264739990234375, 0.37139892578125, 0.478057861328125, 0.584716796875, 0.691375732421875, 0.79803466796875, 0.904693603515625, 1.0113525390625, 1.118011474609375, 1.22467041015625, 1.331329345703125, 1.43798828125, 1.544647216796875, 1.65130615234375, 1.757965087890625, 1.8646240234375, 1.971282958984375, 2.07794189453125, 2.184600830078125, 2.291259765625, 2.397918701171875, 2.50457763671875, 2.611236572265625, 2.7178955078125, 2.824554443359375, 2.93121337890625, 3.037872314453125, 3.14453125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 9.0, 17.0, 15.0, 22.0, 33.0, 48.0, 74.0, 108.0, 180.0, 299.0, 465.0, 787.0, 1458.0, 2707.0, 4975.0, 9918.0, 20932.0, 46293.0, 107914.0, 239648.0, 307116.0, 169787.0, 73175.0, 32227.0, 14798.0, 7209.0, 3669.0, 1925.0, 1074.0, 616.0, 365.0, 217.0, 137.0, 83.0, 81.0, 59.0, 34.0, 25.0, 16.0, 14.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0], "bins": [-4.49609375, -4.364898681640625, -4.23370361328125, -4.102508544921875, -3.9713134765625, -3.840118408203125, -3.70892333984375, -3.577728271484375, -3.446533203125, -3.315338134765625, -3.18414306640625, -3.052947998046875, -2.9217529296875, -2.790557861328125, -2.65936279296875, -2.528167724609375, -2.39697265625, -2.265777587890625, -2.13458251953125, -2.003387451171875, -1.8721923828125, -1.740997314453125, -1.60980224609375, -1.478607177734375, -1.347412109375, -1.216217041015625, -1.08502197265625, -0.953826904296875, -0.8226318359375, -0.691436767578125, -0.56024169921875, -0.429046630859375, -0.2978515625, -0.166656494140625, -0.03546142578125, 0.095733642578125, 0.2269287109375, 0.358123779296875, 0.48931884765625, 0.620513916015625, 0.751708984375, 0.882904052734375, 1.01409912109375, 1.145294189453125, 1.2764892578125, 1.407684326171875, 1.53887939453125, 1.670074462890625, 1.80126953125, 1.932464599609375, 2.06365966796875, 2.194854736328125, 2.3260498046875, 2.457244873046875, 2.58843994140625, 2.719635009765625, 2.850830078125, 2.982025146484375, 3.11322021484375, 3.244415283203125, 3.3756103515625, 3.506805419921875, 3.63800048828125, 3.769195556640625, 3.900390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 4.0, 8.0, 8.0, 7.0, 10.0, 9.0, 13.0, 16.0, 10.0, 23.0, 21.0, 20.0, 27.0, 36.0, 31.0, 30.0, 39.0, 37.0, 37.0, 50.0, 41.0, 37.0, 42.0, 29.0, 35.0, 47.0, 39.0, 28.0, 35.0, 28.0, 22.0, 21.0, 25.0, 22.0, 18.0, 10.0, 13.0, 20.0, 6.0, 7.0, 7.0, 6.0, 5.0, 5.0, 1.0, 4.0, 1.0, 5.0], "bins": [-2.076171875, -2.0203704833984375, -1.964569091796875, -1.9087677001953125, -1.85296630859375, -1.7971649169921875, -1.741363525390625, -1.6855621337890625, -1.6297607421875, -1.5739593505859375, -1.518157958984375, -1.4623565673828125, -1.40655517578125, -1.3507537841796875, -1.294952392578125, -1.2391510009765625, -1.183349609375, -1.1275482177734375, -1.071746826171875, -1.0159454345703125, -0.96014404296875, -0.9043426513671875, -0.848541259765625, -0.7927398681640625, -0.7369384765625, -0.6811370849609375, -0.625335693359375, -0.5695343017578125, -0.51373291015625, -0.4579315185546875, -0.402130126953125, -0.3463287353515625, -0.29052734375, -0.2347259521484375, -0.178924560546875, -0.1231231689453125, -0.06732177734375, -0.0115203857421875, 0.044281005859375, 0.1000823974609375, 0.1558837890625, 0.2116851806640625, 0.267486572265625, 0.3232879638671875, 0.37908935546875, 0.4348907470703125, 0.490692138671875, 0.5464935302734375, 0.602294921875, 0.6580963134765625, 0.713897705078125, 0.7696990966796875, 0.82550048828125, 0.8813018798828125, 0.937103271484375, 0.9929046630859375, 1.0487060546875, 1.1045074462890625, 1.160308837890625, 1.2161102294921875, 1.27191162109375, 1.3277130126953125, 1.383514404296875, 1.4393157958984375, 1.4951171875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 6.0, 14.0, 17.0, 23.0, 27.0, 52.0, 75.0, 83.0, 139.0, 188.0, 258.0, 355.0, 550.0, 800.0, 1189.0, 1710.0, 2632.0, 4181.0, 6648.0, 10990.0, 18934.0, 33919.0, 64012.0, 123171.0, 219087.0, 240648.0, 145531.0, 76811.0, 40338.0, 22162.0, 12554.0, 7664.0, 4757.0, 2995.0, 1960.0, 1280.0, 875.0, 613.0, 384.0, 279.0, 186.0, 127.0, 90.0, 75.0, 51.0, 30.0, 26.0, 13.0, 15.0, 8.0, 8.0, 8.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.54296875, -1.4949493408203125, -1.446929931640625, -1.3989105224609375, -1.35089111328125, -1.3028717041015625, -1.254852294921875, -1.2068328857421875, -1.1588134765625, -1.1107940673828125, -1.062774658203125, -1.0147552490234375, -0.96673583984375, -0.9187164306640625, -0.870697021484375, -0.8226776123046875, -0.774658203125, -0.7266387939453125, -0.678619384765625, -0.6305999755859375, -0.58258056640625, -0.5345611572265625, -0.486541748046875, -0.4385223388671875, -0.3905029296875, -0.3424835205078125, -0.294464111328125, -0.2464447021484375, -0.19842529296875, -0.1504058837890625, -0.102386474609375, -0.0543670654296875, -0.00634765625, 0.0416717529296875, 0.089691162109375, 0.1377105712890625, 0.18572998046875, 0.2337493896484375, 0.281768798828125, 0.3297882080078125, 0.3778076171875, 0.4258270263671875, 0.473846435546875, 0.5218658447265625, 0.56988525390625, 0.6179046630859375, 0.665924072265625, 0.7139434814453125, 0.761962890625, 0.8099822998046875, 0.858001708984375, 0.9060211181640625, 0.95404052734375, 1.0020599365234375, 1.050079345703125, 1.0980987548828125, 1.1461181640625, 1.1941375732421875, 1.242156982421875, 1.2901763916015625, 1.33819580078125, 1.3862152099609375, 1.434234619140625, 1.4822540283203125, 1.5302734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 13.0, 9.0, 5.0, 8.0, 16.0, 14.0, 16.0, 22.0, 23.0, 42.0, 38.0, 39.0, 62.0, 59.0, 74.0, 83.0, 64.0, 61.0, 66.0, 55.0, 47.0, 36.0, 30.0, 26.0, 18.0, 11.0, 15.0, 12.0, 2.0, 7.0, 3.0, 2.0, 6.0, 2.0, 5.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.121397018432617e-05, -5.9149228036403656e-05, -5.708448588848114e-05, -5.5019743740558624e-05, -5.295500159263611e-05, -5.089025944471359e-05, -4.882551729679108e-05, -4.676077514886856e-05, -4.4696033000946045e-05, -4.263129085302353e-05, -4.056654870510101e-05, -3.85018065571785e-05, -3.643706440925598e-05, -3.4372322261333466e-05, -3.230758011341095e-05, -3.0242837965488434e-05, -2.8178095817565918e-05, -2.6113353669643402e-05, -2.4048611521720886e-05, -2.198386937379837e-05, -1.9919127225875854e-05, -1.785438507795334e-05, -1.5789642930030823e-05, -1.3724900782108307e-05, -1.1660158634185791e-05, -9.595416486263275e-06, -7.530674338340759e-06, -5.465932190418243e-06, -3.4011900424957275e-06, -1.3364478945732117e-06, 7.282942533493042e-07, 2.79303640127182e-06, 4.857778549194336e-06, 6.922520697116852e-06, 8.987262845039368e-06, 1.1052004992961884e-05, 1.31167471408844e-05, 1.5181489288806915e-05, 1.724623143672943e-05, 1.9310973584651947e-05, 2.1375715732574463e-05, 2.344045788049698e-05, 2.5505200028419495e-05, 2.756994217634201e-05, 2.9634684324264526e-05, 3.169942647218704e-05, 3.376416862010956e-05, 3.5828910768032074e-05, 3.789365291595459e-05, 3.9958395063877106e-05, 4.202313721179962e-05, 4.408787935972214e-05, 4.615262150764465e-05, 4.821736365556717e-05, 5.0282105803489685e-05, 5.23468479514122e-05, 5.441159009933472e-05, 5.647633224725723e-05, 5.854107439517975e-05, 6.0605816543102264e-05, 6.267055869102478e-05, 6.47353008389473e-05, 6.680004298686981e-05, 6.886478513479233e-05, 7.092952728271484e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 5.0, 11.0, 13.0, 24.0, 43.0, 65.0, 99.0, 168.0, 254.0, 377.0, 602.0, 1016.0, 1705.0, 2953.0, 4901.0, 8924.0, 16650.0, 31739.0, 61812.0, 115918.0, 191250.0, 226071.0, 172791.0, 99192.0, 52275.0, 26955.0, 14066.0, 7793.0, 4410.0, 2564.0, 1489.0, 903.0, 551.0, 347.0, 238.0, 133.0, 87.0, 51.0, 31.0, 31.0, 19.0, 10.0, 5.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1884765625, -1.1465911865234375, -1.104705810546875, -1.0628204345703125, -1.02093505859375, -0.9790496826171875, -0.937164306640625, -0.8952789306640625, -0.8533935546875, -0.8115081787109375, -0.769622802734375, -0.7277374267578125, -0.68585205078125, -0.6439666748046875, -0.602081298828125, -0.5601959228515625, -0.518310546875, -0.4764251708984375, -0.434539794921875, -0.3926544189453125, -0.35076904296875, -0.3088836669921875, -0.266998291015625, -0.2251129150390625, -0.1832275390625, -0.1413421630859375, -0.099456787109375, -0.0575714111328125, -0.01568603515625, 0.0261993408203125, 0.068084716796875, 0.1099700927734375, 0.15185546875, 0.1937408447265625, 0.235626220703125, 0.2775115966796875, 0.31939697265625, 0.3612823486328125, 0.403167724609375, 0.4450531005859375, 0.4869384765625, 0.5288238525390625, 0.570709228515625, 0.6125946044921875, 0.65447998046875, 0.6963653564453125, 0.738250732421875, 0.7801361083984375, 0.822021484375, 0.8639068603515625, 0.905792236328125, 0.9476776123046875, 0.98956298828125, 1.0314483642578125, 1.073333740234375, 1.1152191162109375, 1.1571044921875, 1.1989898681640625, 1.240875244140625, 1.2827606201171875, 1.32464599609375, 1.3665313720703125, 1.408416748046875, 1.4503021240234375, 1.4921875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 6.0, 10.0, 6.0, 6.0, 4.0, 6.0, 10.0, 12.0, 17.0, 21.0, 21.0, 31.0, 34.0, 44.0, 61.0, 56.0, 59.0, 59.0, 55.0, 62.0, 65.0, 64.0, 58.0, 51.0, 38.0, 26.0, 21.0, 22.0, 20.0, 15.0, 8.0, 8.0, 8.0, 6.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.46826171875, -0.4537620544433594, -0.43926239013671875, -0.4247627258300781, -0.4102630615234375, -0.3957633972167969, -0.38126373291015625, -0.3667640686035156, -0.352264404296875, -0.3377647399902344, -0.32326507568359375, -0.3087654113769531, -0.2942657470703125, -0.2797660827636719, -0.26526641845703125, -0.2507667541503906, -0.23626708984375, -0.22176742553710938, -0.20726776123046875, -0.19276809692382812, -0.1782684326171875, -0.16376876831054688, -0.14926910400390625, -0.13476943969726562, -0.120269775390625, -0.10577011108398438, -0.09127044677734375, -0.07677078247070312, -0.0622711181640625, -0.047771453857421875, -0.03327178955078125, -0.018772125244140625, -0.0042724609375, 0.010227203369140625, 0.02472686767578125, 0.039226531982421875, 0.0537261962890625, 0.06822586059570312, 0.08272552490234375, 0.09722518920898438, 0.111724853515625, 0.12622451782226562, 0.14072418212890625, 0.15522384643554688, 0.1697235107421875, 0.18422317504882812, 0.19872283935546875, 0.21322250366210938, 0.22772216796875, 0.24222183227539062, 0.25672149658203125, 0.2712211608886719, 0.2857208251953125, 0.3002204895019531, 0.31472015380859375, 0.3292198181152344, 0.343719482421875, 0.3582191467285156, 0.37271881103515625, 0.3872184753417969, 0.4017181396484375, 0.4162178039550781, 0.43071746826171875, 0.4452171325683594, 0.459716796875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 6.0, 8.0, 11.0, 11.0, 11.0, 28.0, 21.0, 17.0, 34.0, 43.0, 74.0, 63.0, 89.0, 75.0, 87.0, 75.0, 74.0, 65.0, 51.0, 44.0, 23.0, 23.0, 15.0, 11.0, 10.0, 11.0, 4.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53507137298584, -5.364937782287598, -5.1948041915893555, -5.024670600891113, -4.854537010192871, -4.684403419494629, -4.514269828796387, -4.3441362380981445, -4.174002647399902, -4.00386905670166, -3.833735466003418, -3.663601875305176, -3.4934682846069336, -3.3233346939086914, -3.1532013416290283, -2.983067750930786, -2.812934398651123, -2.642800807952881, -2.4726672172546387, -2.3025336265563965, -2.1324000358581543, -1.9622665643692017, -1.792133092880249, -1.6219995021820068, -1.4518659114837646, -1.2817323207855225, -1.1115987300872803, -0.9414652585983276, -0.7713316679000854, -0.6011980772018433, -0.4310646057128906, -0.26093101501464844, -0.09079790115356445, 0.07933565974235535, 0.24946922063827515, 0.41960275173187256, 0.5897363424301147, 0.7598699331283569, 0.9300034046173096, 1.1001369953155518, 1.270270586013794, 1.4404041767120361, 1.6105377674102783, 1.780671238899231, 1.9508048295974731, 2.120938301086426, 2.291071891784668, 2.46120548248291, 2.6313390731811523, 2.8014726638793945, 2.9716062545776367, 3.141739845275879, 3.311873435974121, 3.4820070266723633, 3.6521403789520264, 3.8222739696502686, 3.9924075603485107, 4.162540912628174, 4.332674503326416, 4.502808094024658, 4.6729416847229, 4.843075275421143, 5.013208866119385, 5.183342456817627, 5.353476047515869]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 6.0, 6.0, 17.0, 14.0, 21.0, 19.0, 13.0, 16.0, 27.0, 32.0, 29.0, 28.0, 27.0, 33.0, 42.0, 43.0, 47.0, 39.0, 44.0, 45.0, 31.0, 43.0, 49.0, 33.0, 31.0, 29.0, 32.0, 21.0, 29.0, 23.0, 21.0, 13.0, 16.0, 18.0, 15.0, 8.0, 9.0, 4.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.994032859802246, -2.899569511413574, -2.8051059246063232, -2.7106425762176514, -2.6161792278289795, -2.5217156410217285, -2.4272522926330566, -2.3327889442443848, -2.238325357437134, -2.143862009048462, -2.049398422241211, -1.954935073852539, -1.8604716062545776, -1.7660081386566162, -1.6715447902679443, -1.577081322669983, -1.482617974281311, -1.3881545066833496, -1.2936911582946777, -1.1992276906967163, -1.1047642230987549, -1.010300874710083, -0.9158374071121216, -0.8213739395141602, -0.7269105315208435, -0.6324471235275269, -0.5379836559295654, -0.4435202479362488, -0.34905681014060974, -0.2545933723449707, -0.16012996435165405, -0.06566649675369263, 0.028796911239624023, 0.12326034158468246, 0.2177237719297409, 0.31218719482421875, 0.4066506326198578, 0.5011140704154968, 0.5955774784088135, 0.6900409460067749, 0.7845043540000916, 0.8789677619934082, 0.9734312295913696, 1.067894697189331, 1.162358045578003, 1.2568215131759644, 1.3512849807739258, 1.4457483291625977, 1.540211796760559, 1.6346752643585205, 1.7291386127471924, 1.8236020803451538, 1.9180655479431152, 2.012528896331787, 2.106992244720459, 2.20145583152771, 2.295919179916382, 2.3903825283050537, 2.4848461151123047, 2.5793094635009766, 2.6737728118896484, 2.7682363986968994, 2.8626997470855713, 2.9571633338928223, 3.051626682281494]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 8.0, 7.0, 16.0, 18.0, 42.0, 55.0, 88.0, 154.0, 269.0, 408.0, 780.0, 1473.0, 2686.0, 5212.0, 10706.0, 22894.0, 48022.0, 99128.0, 174852.0, 233315.0, 202876.0, 124814.0, 62663.0, 30023.0, 13996.0, 6687.0, 3355.0, 1750.0, 916.0, 558.0, 300.0, 156.0, 125.0, 73.0, 40.0, 31.0, 23.0, 6.0, 14.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.32421875, -4.19952392578125, -4.0748291015625, -3.95013427734375, -3.825439453125, -3.70074462890625, -3.5760498046875, -3.45135498046875, -3.32666015625, -3.20196533203125, -3.0772705078125, -2.95257568359375, -2.827880859375, -2.70318603515625, -2.5784912109375, -2.45379638671875, -2.3291015625, -2.20440673828125, -2.0797119140625, -1.95501708984375, -1.830322265625, -1.70562744140625, -1.5809326171875, -1.45623779296875, -1.33154296875, -1.20684814453125, -1.0821533203125, -0.95745849609375, -0.832763671875, -0.70806884765625, -0.5833740234375, -0.45867919921875, -0.333984375, -0.20928955078125, -0.0845947265625, 0.04010009765625, 0.164794921875, 0.28948974609375, 0.4141845703125, 0.53887939453125, 0.66357421875, 0.78826904296875, 0.9129638671875, 1.03765869140625, 1.162353515625, 1.28704833984375, 1.4117431640625, 1.53643798828125, 1.6611328125, 1.78582763671875, 1.9105224609375, 2.03521728515625, 2.159912109375, 2.28460693359375, 2.4093017578125, 2.53399658203125, 2.65869140625, 2.78338623046875, 2.9080810546875, 3.03277587890625, 3.157470703125, 3.28216552734375, 3.4068603515625, 3.53155517578125, 3.65625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 7.0, 2.0, 8.0, 9.0, 6.0, 10.0, 13.0, 18.0, 16.0, 17.0, 29.0, 29.0, 29.0, 29.0, 30.0, 38.0, 30.0, 46.0, 46.0, 41.0, 40.0, 42.0, 52.0, 38.0, 35.0, 40.0, 33.0, 40.0, 22.0, 31.0, 21.0, 25.0, 18.0, 23.0, 19.0, 11.0, 16.0, 13.0, 4.0, 7.0, 8.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.21240234375, -3.1123046875, -3.01220703125, -2.912109375, -2.81201171875, -2.7119140625, -2.61181640625, -2.51171875, -2.41162109375, -2.3115234375, -2.21142578125, -2.111328125, -2.01123046875, -1.9111328125, -1.81103515625, -1.7109375, -1.61083984375, -1.5107421875, -1.41064453125, -1.310546875, -1.21044921875, -1.1103515625, -1.01025390625, -0.91015625, -0.81005859375, -0.7099609375, -0.60986328125, -0.509765625, -0.40966796875, -0.3095703125, -0.20947265625, -0.109375, -0.00927734375, 0.0908203125, 0.19091796875, 0.291015625, 0.39111328125, 0.4912109375, 0.59130859375, 0.69140625, 0.79150390625, 0.8916015625, 0.99169921875, 1.091796875, 1.19189453125, 1.2919921875, 1.39208984375, 1.4921875, 1.59228515625, 1.6923828125, 1.79248046875, 1.892578125, 1.99267578125, 2.0927734375, 2.19287109375, 2.29296875, 2.39306640625, 2.4931640625, 2.59326171875, 2.693359375, 2.79345703125, 2.8935546875, 2.99365234375, 3.09375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 7.0, 4.0, 6.0, 12.0, 24.0, 32.0, 49.0, 65.0, 107.0, 165.0, 252.0, 439.0, 713.0, 1055.0, 1751.0, 2927.0, 4752.0, 7761.0, 12864.0, 21770.0, 36068.0, 59163.0, 93153.0, 132736.0, 162221.0, 159330.0, 126192.0, 87013.0, 54601.0, 33069.0, 19872.0, 11935.0, 7245.0, 4284.0, 2567.0, 1591.0, 1024.0, 621.0, 409.0, 229.0, 179.0, 107.0, 73.0, 37.0, 35.0, 15.0, 9.0, 13.0, 10.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-2.626953125, -2.544647216796875, -2.46234130859375, -2.380035400390625, -2.2977294921875, -2.215423583984375, -2.13311767578125, -2.050811767578125, -1.968505859375, -1.886199951171875, -1.80389404296875, -1.721588134765625, -1.6392822265625, -1.556976318359375, -1.47467041015625, -1.392364501953125, -1.31005859375, -1.227752685546875, -1.14544677734375, -1.063140869140625, -0.9808349609375, -0.898529052734375, -0.81622314453125, -0.733917236328125, -0.651611328125, -0.569305419921875, -0.48699951171875, -0.404693603515625, -0.3223876953125, -0.240081787109375, -0.15777587890625, -0.075469970703125, 0.0068359375, 0.089141845703125, 0.17144775390625, 0.253753662109375, 0.3360595703125, 0.418365478515625, 0.50067138671875, 0.582977294921875, 0.665283203125, 0.747589111328125, 0.82989501953125, 0.912200927734375, 0.9945068359375, 1.076812744140625, 1.15911865234375, 1.241424560546875, 1.32373046875, 1.406036376953125, 1.48834228515625, 1.570648193359375, 1.6529541015625, 1.735260009765625, 1.81756591796875, 1.899871826171875, 1.982177734375, 2.064483642578125, 2.14678955078125, 2.229095458984375, 2.3114013671875, 2.393707275390625, 2.47601318359375, 2.558319091796875, 2.640625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 9.0, 9.0, 6.0, 12.0, 18.0, 11.0, 16.0, 19.0, 15.0, 25.0, 14.0, 29.0, 25.0, 29.0, 38.0, 28.0, 49.0, 40.0, 54.0, 39.0, 40.0, 52.0, 42.0, 38.0, 45.0, 37.0, 27.0, 27.0, 31.0, 26.0, 23.0, 20.0, 16.0, 20.0, 12.0, 14.0, 10.0, 5.0, 10.0, 5.0, 2.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.927734375, -1.8666229248046875, -1.805511474609375, -1.7444000244140625, -1.68328857421875, -1.6221771240234375, -1.561065673828125, -1.4999542236328125, -1.4388427734375, -1.3777313232421875, -1.316619873046875, -1.2555084228515625, -1.19439697265625, -1.1332855224609375, -1.072174072265625, -1.0110626220703125, -0.949951171875, -0.8888397216796875, -0.827728271484375, -0.7666168212890625, -0.70550537109375, -0.6443939208984375, -0.583282470703125, -0.5221710205078125, -0.4610595703125, -0.3999481201171875, -0.338836669921875, -0.2777252197265625, -0.21661376953125, -0.1555023193359375, -0.094390869140625, -0.0332794189453125, 0.02783203125, 0.0889434814453125, 0.150054931640625, 0.2111663818359375, 0.27227783203125, 0.3333892822265625, 0.394500732421875, 0.4556121826171875, 0.5167236328125, 0.5778350830078125, 0.638946533203125, 0.7000579833984375, 0.76116943359375, 0.8222808837890625, 0.883392333984375, 0.9445037841796875, 1.005615234375, 1.0667266845703125, 1.127838134765625, 1.1889495849609375, 1.25006103515625, 1.3111724853515625, 1.372283935546875, 1.4333953857421875, 1.4945068359375, 1.5556182861328125, 1.616729736328125, 1.6778411865234375, 1.73895263671875, 1.8000640869140625, 1.861175537109375, 1.9222869873046875, 1.9833984375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 2.0, 7.0, 19.0, 15.0, 19.0, 39.0, 28.0, 49.0, 72.0, 91.0, 142.0, 179.0, 274.0, 470.0, 831.0, 1762.0, 4354.0, 12979.0, 45681.0, 184696.0, 465485.0, 243669.0, 60944.0, 16490.0, 5495.0, 2177.0, 1023.0, 531.0, 319.0, 241.0, 127.0, 95.0, 64.0, 49.0, 37.0, 24.0, 26.0, 11.0, 11.0, 4.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.62890625, -5.4508056640625, -5.272705078125, -5.0946044921875, -4.91650390625, -4.7384033203125, -4.560302734375, -4.3822021484375, -4.2041015625, -4.0260009765625, -3.847900390625, -3.6697998046875, -3.49169921875, -3.3135986328125, -3.135498046875, -2.9573974609375, -2.779296875, -2.6011962890625, -2.423095703125, -2.2449951171875, -2.06689453125, -1.8887939453125, -1.710693359375, -1.5325927734375, -1.3544921875, -1.1763916015625, -0.998291015625, -0.8201904296875, -0.64208984375, -0.4639892578125, -0.285888671875, -0.1077880859375, 0.0703125, 0.2484130859375, 0.426513671875, 0.6046142578125, 0.78271484375, 0.9608154296875, 1.138916015625, 1.3170166015625, 1.4951171875, 1.6732177734375, 1.851318359375, 2.0294189453125, 2.20751953125, 2.3856201171875, 2.563720703125, 2.7418212890625, 2.919921875, 3.0980224609375, 3.276123046875, 3.4542236328125, 3.63232421875, 3.8104248046875, 3.988525390625, 4.1666259765625, 4.3447265625, 4.5228271484375, 4.700927734375, 4.8790283203125, 5.05712890625, 5.2352294921875, 5.413330078125, 5.5914306640625, 5.76953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 1.0, 5.0, 7.0, 9.0, 13.0, 20.0, 48.0, 54.0, 86.0, 128.0, 138.0, 135.0, 123.0, 75.0, 56.0, 29.0, 22.0, 12.0, 15.0, 9.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004968643188476562, -0.00048177316784858704, -0.0004666820168495178, -0.0004515908658504486, -0.0004364997148513794, -0.0004214085638523102, -0.00040631741285324097, -0.00039122626185417175, -0.00037613511085510254, -0.0003610439598560333, -0.0003459528088569641, -0.0003308616578578949, -0.0003157705068588257, -0.00030067935585975647, -0.00028558820486068726, -0.00027049705386161804, -0.00025540590286254883, -0.00024031475186347961, -0.0002252236008644104, -0.0002101324498653412, -0.00019504129886627197, -0.00017995014786720276, -0.00016485899686813354, -0.00014976784586906433, -0.00013467669486999512, -0.0001195855438709259, -0.00010449439287185669, -8.940324187278748e-05, -7.431209087371826e-05, -5.922093987464905e-05, -4.4129788875579834e-05, -2.903863787651062e-05, -1.3947486877441406e-05, 1.1436641216278076e-06, 1.623481512069702e-05, 3.1325966119766235e-05, 4.641711711883545e-05, 6.150826811790466e-05, 7.659941911697388e-05, 9.169057011604309e-05, 0.0001067817211151123, 0.00012187287211418152, 0.00013696402311325073, 0.00015205517411231995, 0.00016714632511138916, 0.00018223747611045837, 0.0001973286271095276, 0.0002124197781085968, 0.00022751092910766602, 0.00024260208010673523, 0.00025769323110580444, 0.00027278438210487366, 0.00028787553310394287, 0.0003029666841030121, 0.0003180578351020813, 0.0003331489861011505, 0.0003482401371002197, 0.00036333128809928894, 0.00037842243909835815, 0.00039351359009742737, 0.0004086047410964966, 0.0004236958920955658, 0.000438787043094635, 0.0004538781940937042, 0.00046896934509277344]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 14.0, 22.0, 23.0, 46.0, 43.0, 57.0, 85.0, 105.0, 135.0, 205.0, 267.0, 370.0, 522.0, 885.0, 1500.0, 3064.0, 6797.0, 17970.0, 51333.0, 155027.0, 346058.0, 291474.0, 110928.0, 37031.0, 13185.0, 5221.0, 2420.0, 1281.0, 722.0, 501.0, 334.0, 243.0, 187.0, 124.0, 103.0, 73.0, 43.0, 48.0, 34.0, 15.0, 19.0, 10.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.81640625, -3.68853759765625, -3.5606689453125, -3.43280029296875, -3.304931640625, -3.17706298828125, -3.0491943359375, -2.92132568359375, -2.79345703125, -2.66558837890625, -2.5377197265625, -2.40985107421875, -2.281982421875, -2.15411376953125, -2.0262451171875, -1.89837646484375, -1.7705078125, -1.64263916015625, -1.5147705078125, -1.38690185546875, -1.259033203125, -1.13116455078125, -1.0032958984375, -0.87542724609375, -0.74755859375, -0.61968994140625, -0.4918212890625, -0.36395263671875, -0.236083984375, -0.10821533203125, 0.0196533203125, 0.14752197265625, 0.275390625, 0.40325927734375, 0.5311279296875, 0.65899658203125, 0.786865234375, 0.91473388671875, 1.0426025390625, 1.17047119140625, 1.29833984375, 1.42620849609375, 1.5540771484375, 1.68194580078125, 1.809814453125, 1.93768310546875, 2.0655517578125, 2.19342041015625, 2.3212890625, 2.44915771484375, 2.5770263671875, 2.70489501953125, 2.832763671875, 2.96063232421875, 3.0885009765625, 3.21636962890625, 3.34423828125, 3.47210693359375, 3.5999755859375, 3.72784423828125, 3.855712890625, 3.98358154296875, 4.1114501953125, 4.23931884765625, 4.3671875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 15.0, 14.0, 30.0, 40.0, 60.0, 89.0, 104.0, 140.0, 136.0, 110.0, 81.0, 65.0, 45.0, 20.0, 16.0, 6.0, 9.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5283203125, -1.4804534912109375, -1.432586669921875, -1.3847198486328125, -1.33685302734375, -1.2889862060546875, -1.241119384765625, -1.1932525634765625, -1.1453857421875, -1.0975189208984375, -1.049652099609375, -1.0017852783203125, -0.95391845703125, -0.9060516357421875, -0.858184814453125, -0.8103179931640625, -0.762451171875, -0.7145843505859375, -0.666717529296875, -0.6188507080078125, -0.57098388671875, -0.5231170654296875, -0.475250244140625, -0.4273834228515625, -0.3795166015625, -0.3316497802734375, -0.283782958984375, -0.2359161376953125, -0.18804931640625, -0.1401824951171875, -0.092315673828125, -0.0444488525390625, 0.00341796875, 0.0512847900390625, 0.099151611328125, 0.1470184326171875, 0.19488525390625, 0.2427520751953125, 0.290618896484375, 0.3384857177734375, 0.3863525390625, 0.4342193603515625, 0.482086181640625, 0.5299530029296875, 0.57781982421875, 0.6256866455078125, 0.673553466796875, 0.7214202880859375, 0.769287109375, 0.8171539306640625, 0.865020751953125, 0.9128875732421875, 0.96075439453125, 1.0086212158203125, 1.056488037109375, 1.1043548583984375, 1.1522216796875, 1.2000885009765625, 1.247955322265625, 1.2958221435546875, 1.34368896484375, 1.3915557861328125, 1.439422607421875, 1.4872894287109375, 1.53515625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 12.0, 13.0, 9.0, 24.0, 29.0, 36.0, 39.0, 42.0, 46.0, 74.0, 76.0, 96.0, 80.0, 77.0, 79.0, 62.0, 39.0, 41.0, 26.0, 27.0, 17.0, 16.0, 7.0, 5.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.667759418487549, -5.493546962738037, -5.319334506988525, -5.145122051239014, -4.970909595489502, -4.79669713973999, -4.6224846839904785, -4.448272228240967, -4.274059772491455, -4.099847316741943, -3.9256348609924316, -3.75142240524292, -3.577209949493408, -3.4029974937438965, -3.2287850379943848, -3.054572582244873, -2.8803601264953613, -2.7061476707458496, -2.531935214996338, -2.357722759246826, -2.1835103034973145, -2.0092978477478027, -1.835085391998291, -1.6608729362487793, -1.4866604804992676, -1.3124480247497559, -1.1382355690002441, -0.9640231132507324, -0.7898106575012207, -0.615598201751709, -0.44138574600219727, -0.26717329025268555, -0.09296035766601562, 0.0812520980834961, 0.2554645538330078, 0.42967700958251953, 0.6038894653320312, 0.778101921081543, 0.9523143768310547, 1.1265268325805664, 1.3007392883300781, 1.4749517440795898, 1.6491641998291016, 1.8233766555786133, 1.997589111328125, 2.1718015670776367, 2.3460140228271484, 2.52022647857666, 2.694438934326172, 2.8686513900756836, 3.0428638458251953, 3.217076301574707, 3.3912887573242188, 3.5655012130737305, 3.739713668823242, 3.913926124572754, 4.088138580322266, 4.262351036071777, 4.436563491821289, 4.610775947570801, 4.7849884033203125, 4.959200859069824, 5.133413314819336, 5.307625770568848, 5.481838226318359]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 5.0, 7.0, 8.0, 12.0, 18.0, 21.0, 22.0, 20.0, 17.0, 25.0, 23.0, 24.0, 34.0, 36.0, 36.0, 33.0, 39.0, 46.0, 35.0, 29.0, 49.0, 42.0, 46.0, 39.0, 39.0, 32.0, 36.0, 29.0, 27.0, 23.0, 27.0, 20.0, 17.0, 15.0, 22.0, 9.0, 9.0, 9.0, 4.0, 6.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.061811923980713, -2.9657697677612305, -2.869727373123169, -2.7736852169036865, -2.677642822265625, -2.5816006660461426, -2.48555850982666, -2.3895163536071777, -2.293473958969116, -2.197431802749634, -2.1013894081115723, -2.00534725189209, -1.9093049764633179, -1.813262701034546, -1.7172205448150635, -1.6211782693862915, -1.5251359939575195, -1.4290937185287476, -1.3330514430999756, -1.2370092868804932, -1.1409670114517212, -1.0449247360229492, -0.948882520198822, -0.8528403043746948, -0.7567980289459229, -0.6607557535171509, -0.5647135376930237, -0.4686712920665741, -0.3726290464401245, -0.2765868008136749, -0.18054455518722534, -0.08450233936309814, 0.011539697647094727, 0.10758194327354431, 0.2036241888999939, 0.2996664345264435, 0.39570868015289307, 0.49175092577934265, 0.5877931714057922, 0.6838353872299194, 0.7798776626586914, 0.8759199380874634, 0.9719621539115906, 1.0680043697357178, 1.1640466451644897, 1.2600889205932617, 1.3561310768127441, 1.4521733522415161, 1.548215627670288, 1.64425790309906, 1.740300178527832, 1.8363423347473145, 1.9323846101760864, 2.0284268856048584, 2.124469041824341, 2.2205114364624023, 2.3165535926818848, 2.412595748901367, 2.5086381435394287, 2.604680299758911, 2.7007226943969727, 2.796764850616455, 2.8928070068359375, 2.98884916305542, 3.0848915576934814]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 8.0, 6.0, 12.0, 20.0, 28.0, 36.0, 51.0, 85.0, 128.0, 173.0, 277.0, 416.0, 651.0, 924.0, 1593.0, 2676.0, 4587.0, 8219.0, 15883.0, 34806.0, 91781.0, 309021.0, 1074645.0, 1628821.0, 702787.0, 194962.0, 64417.0, 27055.0, 13215.0, 7182.0, 3909.0, 2300.0, 1350.0, 904.0, 506.0, 309.0, 181.0, 125.0, 75.0, 50.0, 44.0, 23.0, 16.0, 11.0, 10.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.609375, -5.435791015625, -5.26220703125, -5.088623046875, -4.9150390625, -4.741455078125, -4.56787109375, -4.394287109375, -4.220703125, -4.047119140625, -3.87353515625, -3.699951171875, -3.5263671875, -3.352783203125, -3.17919921875, -3.005615234375, -2.83203125, -2.658447265625, -2.48486328125, -2.311279296875, -2.1376953125, -1.964111328125, -1.79052734375, -1.616943359375, -1.443359375, -1.269775390625, -1.09619140625, -0.922607421875, -0.7490234375, -0.575439453125, -0.40185546875, -0.228271484375, -0.0546875, 0.118896484375, 0.29248046875, 0.466064453125, 0.6396484375, 0.813232421875, 0.98681640625, 1.160400390625, 1.333984375, 1.507568359375, 1.68115234375, 1.854736328125, 2.0283203125, 2.201904296875, 2.37548828125, 2.549072265625, 2.72265625, 2.896240234375, 3.06982421875, 3.243408203125, 3.4169921875, 3.590576171875, 3.76416015625, 3.937744140625, 4.111328125, 4.284912109375, 4.45849609375, 4.632080078125, 4.8056640625, 4.979248046875, 5.15283203125, 5.326416015625, 5.5]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 6.0, 7.0, 10.0, 18.0, 15.0, 19.0, 13.0, 24.0, 27.0, 29.0, 29.0, 23.0, 38.0, 34.0, 49.0, 51.0, 42.0, 34.0, 48.0, 41.0, 48.0, 65.0, 33.0, 34.0, 38.0, 25.0, 39.0, 20.0, 23.0, 17.0, 18.0, 15.0, 16.0, 13.0, 7.0, 10.0, 6.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.070831298828125, -1.99713134765625, -1.923431396484375, -1.8497314453125, -1.776031494140625, -1.70233154296875, -1.628631591796875, -1.554931640625, -1.481231689453125, -1.40753173828125, -1.333831787109375, -1.2601318359375, -1.186431884765625, -1.11273193359375, -1.039031982421875, -0.96533203125, -0.891632080078125, -0.81793212890625, -0.744232177734375, -0.6705322265625, -0.596832275390625, -0.52313232421875, -0.449432373046875, -0.375732421875, -0.302032470703125, -0.22833251953125, -0.154632568359375, -0.0809326171875, -0.007232666015625, 0.06646728515625, 0.140167236328125, 0.2138671875, 0.287567138671875, 0.36126708984375, 0.434967041015625, 0.5086669921875, 0.582366943359375, 0.65606689453125, 0.729766845703125, 0.803466796875, 0.877166748046875, 0.95086669921875, 1.024566650390625, 1.0982666015625, 1.171966552734375, 1.24566650390625, 1.319366455078125, 1.39306640625, 1.466766357421875, 1.54046630859375, 1.614166259765625, 1.6878662109375, 1.761566162109375, 1.83526611328125, 1.908966064453125, 1.982666015625, 2.056365966796875, 2.13006591796875, 2.203765869140625, 2.2774658203125, 2.351165771484375, 2.42486572265625, 2.498565673828125, 2.572265625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 8.0, 7.0, 13.0, 15.0, 14.0, 20.0, 30.0, 49.0, 65.0, 105.0, 174.0, 227.0, 375.0, 636.0, 962.0, 1577.0, 2526.0, 4485.0, 7886.0, 14924.0, 28938.0, 62344.0, 148463.0, 401194.0, 1098154.0, 1418646.0, 615253.0, 217701.0, 86658.0, 39033.0, 19383.0, 10162.0, 5702.0, 3270.0, 1929.0, 1173.0, 788.0, 509.0, 294.0, 201.0, 134.0, 91.0, 53.0, 34.0, 25.0, 17.0, 15.0, 8.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.4609375, -5.30126953125, -5.1416015625, -4.98193359375, -4.822265625, -4.66259765625, -4.5029296875, -4.34326171875, -4.18359375, -4.02392578125, -3.8642578125, -3.70458984375, -3.544921875, -3.38525390625, -3.2255859375, -3.06591796875, -2.90625, -2.74658203125, -2.5869140625, -2.42724609375, -2.267578125, -2.10791015625, -1.9482421875, -1.78857421875, -1.62890625, -1.46923828125, -1.3095703125, -1.14990234375, -0.990234375, -0.83056640625, -0.6708984375, -0.51123046875, -0.3515625, -0.19189453125, -0.0322265625, 0.12744140625, 0.287109375, 0.44677734375, 0.6064453125, 0.76611328125, 0.92578125, 1.08544921875, 1.2451171875, 1.40478515625, 1.564453125, 1.72412109375, 1.8837890625, 2.04345703125, 2.203125, 2.36279296875, 2.5224609375, 2.68212890625, 2.841796875, 3.00146484375, 3.1611328125, 3.32080078125, 3.48046875, 3.64013671875, 3.7998046875, 3.95947265625, 4.119140625, 4.27880859375, 4.4384765625, 4.59814453125, 4.7578125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 5.0, 5.0, 11.0, 2.0, 10.0, 13.0, 13.0, 20.0, 22.0, 29.0, 31.0, 46.0, 82.0, 104.0, 159.0, 189.0, 214.0, 269.0, 357.0, 382.0, 380.0, 370.0, 333.0, 234.0, 212.0, 146.0, 111.0, 90.0, 65.0, 46.0, 38.0, 35.0, 17.0, 12.0, 11.0, 7.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6083984375, -1.559722900390625, -1.51104736328125, -1.462371826171875, -1.4136962890625, -1.365020751953125, -1.31634521484375, -1.267669677734375, -1.218994140625, -1.170318603515625, -1.12164306640625, -1.072967529296875, -1.0242919921875, -0.975616455078125, -0.92694091796875, -0.878265380859375, -0.82958984375, -0.780914306640625, -0.73223876953125, -0.683563232421875, -0.6348876953125, -0.586212158203125, -0.53753662109375, -0.488861083984375, -0.440185546875, -0.391510009765625, -0.34283447265625, -0.294158935546875, -0.2454833984375, -0.196807861328125, -0.14813232421875, -0.099456787109375, -0.05078125, -0.002105712890625, 0.04656982421875, 0.095245361328125, 0.1439208984375, 0.192596435546875, 0.24127197265625, 0.289947509765625, 0.338623046875, 0.387298583984375, 0.43597412109375, 0.484649658203125, 0.5333251953125, 0.582000732421875, 0.63067626953125, 0.679351806640625, 0.72802734375, 0.776702880859375, 0.82537841796875, 0.874053955078125, 0.9227294921875, 0.971405029296875, 1.02008056640625, 1.068756103515625, 1.117431640625, 1.166107177734375, 1.21478271484375, 1.263458251953125, 1.3121337890625, 1.360809326171875, 1.40948486328125, 1.458160400390625, 1.5068359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 3.0, 2.0, 5.0, 6.0, 3.0, 7.0, 12.0, 7.0, 12.0, 18.0, 21.0, 31.0, 36.0, 39.0, 50.0, 55.0, 63.0, 81.0, 94.0, 93.0, 72.0, 83.0, 46.0, 44.0, 33.0, 24.0, 20.0, 17.0, 9.0, 4.0, 8.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.728549480438232, -4.56507682800293, -4.401604175567627, -4.238131999969482, -4.07465934753418, -3.911186695098877, -3.747714042663574, -3.5842413902282715, -3.420768976211548, -3.257296323776245, -3.0938239097595215, -2.9303512573242188, -2.766878604888916, -2.6034061908721924, -2.4399335384368896, -2.276461124420166, -2.1129884719848633, -1.94951593875885, -1.786043405532837, -1.6225707530975342, -1.459098219871521, -1.2956256866455078, -1.132153034210205, -0.9686805009841919, -0.8052079677581787, -0.6417354345321655, -0.47826284170150757, -0.314790278673172, -0.15131771564483643, 0.012154817581176758, 0.17562741041183472, 0.3391000032424927, 0.5025725364685059, 0.666045069694519, 0.829517662525177, 0.992990255355835, 1.1564627885818481, 1.3199353218078613, 1.483407974243164, 1.6468805074691772, 1.8103530406951904, 1.9738255739212036, 2.137298107147217, 2.3007707595825195, 2.4642434120178223, 2.627715826034546, 2.7911884784698486, 2.9546608924865723, 3.118133544921875, 3.2816061973571777, 3.4450786113739014, 3.608551263809204, 3.7720236778259277, 3.9354963302612305, 4.098968982696533, 4.262441635131836, 4.4259138107299805, 4.589386463165283, 4.752859115600586, 4.9163312911987305, 5.079803943634033, 5.243276596069336, 5.406749248504639, 5.570221900939941, 5.733694553375244]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 2.0, 7.0, 5.0, 13.0, 12.0, 11.0, 19.0, 17.0, 19.0, 30.0, 23.0, 37.0, 34.0, 34.0, 34.0, 47.0, 33.0, 41.0, 48.0, 45.0, 53.0, 40.0, 31.0, 38.0, 34.0, 24.0, 33.0, 30.0, 36.0, 34.0, 28.0, 20.0, 13.0, 14.0, 12.0, 7.0, 6.0, 9.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5626726150512695, -2.4737019538879395, -2.3847312927246094, -2.2957606315612793, -2.206789970397949, -2.117819309234619, -2.028848648071289, -1.939877986907959, -1.850907325744629, -1.7619366645812988, -1.6729660034179688, -1.5839953422546387, -1.4950246810913086, -1.4060540199279785, -1.3170833587646484, -1.2281126976013184, -1.1391420364379883, -1.0501713752746582, -0.9612007141113281, -0.872230052947998, -0.783259391784668, -0.6942887306213379, -0.6053180694580078, -0.5163474082946777, -0.42737674713134766, -0.3384060859680176, -0.2494354248046875, -0.16046476364135742, -0.07149410247802734, 0.017476558685302734, 0.10644721984863281, 0.1954178810119629, 0.28438830375671387, 0.37335896492004395, 0.462329626083374, 0.5513002872467041, 0.6402709484100342, 0.7292416095733643, 0.8182122707366943, 0.9071829319000244, 0.9961535930633545, 1.0851242542266846, 1.1740949153900146, 1.2630655765533447, 1.3520362377166748, 1.4410068988800049, 1.529977560043335, 1.618948221206665, 1.7079188823699951, 1.7968895435333252, 1.8858602046966553, 1.9748308658599854, 2.0638015270233154, 2.1527721881866455, 2.2417428493499756, 2.3307135105133057, 2.4196841716766357, 2.508654832839966, 2.597625494003296, 2.686596155166626, 2.775566816329956, 2.864537477493286, 2.953508138656616, 3.0424787998199463, 3.1314494609832764]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 6.0, 8.0, 10.0, 9.0, 20.0, 30.0, 41.0, 38.0, 89.0, 137.0, 205.0, 357.0, 630.0, 998.0, 1812.0, 3359.0, 6606.0, 12776.0, 26864.0, 56591.0, 115948.0, 202554.0, 245309.0, 181870.0, 98825.0, 47564.0, 22709.0, 10807.0, 5611.0, 2857.0, 1579.0, 933.0, 512.0, 331.0, 218.0, 120.0, 99.0, 47.0, 24.0, 21.0, 12.0, 6.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.791015625, -2.7098388671875, -2.628662109375, -2.5474853515625, -2.46630859375, -2.3851318359375, -2.303955078125, -2.2227783203125, -2.1416015625, -2.0604248046875, -1.979248046875, -1.8980712890625, -1.81689453125, -1.7357177734375, -1.654541015625, -1.5733642578125, -1.4921875, -1.4110107421875, -1.329833984375, -1.2486572265625, -1.16748046875, -1.0863037109375, -1.005126953125, -0.9239501953125, -0.8427734375, -0.7615966796875, -0.680419921875, -0.5992431640625, -0.51806640625, -0.4368896484375, -0.355712890625, -0.2745361328125, -0.193359375, -0.1121826171875, -0.031005859375, 0.0501708984375, 0.13134765625, 0.2125244140625, 0.293701171875, 0.3748779296875, 0.4560546875, 0.5372314453125, 0.618408203125, 0.6995849609375, 0.78076171875, 0.8619384765625, 0.943115234375, 1.0242919921875, 1.10546875, 1.1866455078125, 1.267822265625, 1.3489990234375, 1.43017578125, 1.5113525390625, 1.592529296875, 1.6737060546875, 1.7548828125, 1.8360595703125, 1.917236328125, 1.9984130859375, 2.07958984375, 2.1607666015625, 2.241943359375, 2.3231201171875, 2.404296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 3.0, 11.0, 13.0, 12.0, 15.0, 25.0, 16.0, 17.0, 20.0, 23.0, 24.0, 29.0, 29.0, 34.0, 43.0, 49.0, 44.0, 55.0, 38.0, 40.0, 42.0, 43.0, 41.0, 34.0, 39.0, 35.0, 31.0, 28.0, 20.0, 24.0, 20.0, 23.0, 22.0, 8.0, 8.0, 8.0, 9.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.6107177734375, -2.516357421875, -2.4219970703125, -2.32763671875, -2.2332763671875, -2.138916015625, -2.0445556640625, -1.9501953125, -1.8558349609375, -1.761474609375, -1.6671142578125, -1.57275390625, -1.4783935546875, -1.384033203125, -1.2896728515625, -1.1953125, -1.1009521484375, -1.006591796875, -0.9122314453125, -0.81787109375, -0.7235107421875, -0.629150390625, -0.5347900390625, -0.4404296875, -0.3460693359375, -0.251708984375, -0.1573486328125, -0.06298828125, 0.0313720703125, 0.125732421875, 0.2200927734375, 0.314453125, 0.4088134765625, 0.503173828125, 0.5975341796875, 0.69189453125, 0.7862548828125, 0.880615234375, 0.9749755859375, 1.0693359375, 1.1636962890625, 1.258056640625, 1.3524169921875, 1.44677734375, 1.5411376953125, 1.635498046875, 1.7298583984375, 1.82421875, 1.9185791015625, 2.012939453125, 2.1072998046875, 2.20166015625, 2.2960205078125, 2.390380859375, 2.4847412109375, 2.5791015625, 2.6734619140625, 2.767822265625, 2.8621826171875, 2.95654296875, 3.0509033203125, 3.145263671875, 3.2396240234375, 3.333984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 5.0, 7.0, 14.0, 11.0, 14.0, 27.0, 33.0, 51.0, 91.0, 133.0, 197.0, 302.0, 537.0, 998.0, 1830.0, 3495.0, 7033.0, 14607.0, 31813.0, 74064.0, 174772.0, 318778.0, 234337.0, 102811.0, 43964.0, 19346.0, 9385.0, 4564.0, 2325.0, 1293.0, 684.0, 397.0, 231.0, 133.0, 77.0, 70.0, 34.0, 28.0, 19.0, 9.0, 13.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.09375, -3.975738525390625, -3.85772705078125, -3.739715576171875, -3.6217041015625, -3.503692626953125, -3.38568115234375, -3.267669677734375, -3.149658203125, -3.031646728515625, -2.91363525390625, -2.795623779296875, -2.6776123046875, -2.559600830078125, -2.44158935546875, -2.323577880859375, -2.20556640625, -2.087554931640625, -1.96954345703125, -1.851531982421875, -1.7335205078125, -1.615509033203125, -1.49749755859375, -1.379486083984375, -1.261474609375, -1.143463134765625, -1.02545166015625, -0.907440185546875, -0.7894287109375, -0.671417236328125, -0.55340576171875, -0.435394287109375, -0.3173828125, -0.199371337890625, -0.08135986328125, 0.036651611328125, 0.1546630859375, 0.272674560546875, 0.39068603515625, 0.508697509765625, 0.626708984375, 0.744720458984375, 0.86273193359375, 0.980743408203125, 1.0987548828125, 1.216766357421875, 1.33477783203125, 1.452789306640625, 1.57080078125, 1.688812255859375, 1.80682373046875, 1.924835205078125, 2.0428466796875, 2.160858154296875, 2.27886962890625, 2.396881103515625, 2.514892578125, 2.632904052734375, 2.75091552734375, 2.868927001953125, 2.9869384765625, 3.104949951171875, 3.22296142578125, 3.340972900390625, 3.458984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 9.0, 7.0, 8.0, 14.0, 16.0, 23.0, 12.0, 24.0, 27.0, 22.0, 24.0, 22.0, 41.0, 40.0, 36.0, 36.0, 40.0, 44.0, 31.0, 39.0, 50.0, 32.0, 30.0, 39.0, 27.0, 28.0, 27.0, 21.0, 27.0, 20.0, 23.0, 22.0, 18.0, 12.0, 18.0, 14.0, 9.0, 6.0, 8.0, 10.0, 3.0, 5.0, 3.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5263671875, -1.4771728515625, -1.427978515625, -1.3787841796875, -1.32958984375, -1.2803955078125, -1.231201171875, -1.1820068359375, -1.1328125, -1.0836181640625, -1.034423828125, -0.9852294921875, -0.93603515625, -0.8868408203125, -0.837646484375, -0.7884521484375, -0.7392578125, -0.6900634765625, -0.640869140625, -0.5916748046875, -0.54248046875, -0.4932861328125, -0.444091796875, -0.3948974609375, -0.345703125, -0.2965087890625, -0.247314453125, -0.1981201171875, -0.14892578125, -0.0997314453125, -0.050537109375, -0.0013427734375, 0.0478515625, 0.0970458984375, 0.146240234375, 0.1954345703125, 0.24462890625, 0.2938232421875, 0.343017578125, 0.3922119140625, 0.44140625, 0.4906005859375, 0.539794921875, 0.5889892578125, 0.63818359375, 0.6873779296875, 0.736572265625, 0.7857666015625, 0.8349609375, 0.8841552734375, 0.933349609375, 0.9825439453125, 1.03173828125, 1.0809326171875, 1.130126953125, 1.1793212890625, 1.228515625, 1.2777099609375, 1.326904296875, 1.3760986328125, 1.42529296875, 1.4744873046875, 1.523681640625, 1.5728759765625, 1.6220703125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 7.0, 3.0, 5.0, 10.0, 6.0, 10.0, 22.0, 35.0, 50.0, 58.0, 87.0, 138.0, 195.0, 274.0, 453.0, 733.0, 1081.0, 1750.0, 2800.0, 4876.0, 8455.0, 15033.0, 27985.0, 52996.0, 102927.0, 189150.0, 251611.0, 180218.0, 96554.0, 50239.0, 26301.0, 14294.0, 8073.0, 4666.0, 2723.0, 1666.0, 1007.0, 706.0, 448.0, 288.0, 204.0, 133.0, 77.0, 64.0, 35.0, 38.0, 18.0, 13.0, 19.0, 12.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.1311492919921875, -1.091400146484375, -1.0516510009765625, -1.01190185546875, -0.9721527099609375, -0.932403564453125, -0.8926544189453125, -0.8529052734375, -0.8131561279296875, -0.773406982421875, -0.7336578369140625, -0.69390869140625, -0.6541595458984375, -0.614410400390625, -0.5746612548828125, -0.534912109375, -0.4951629638671875, -0.455413818359375, -0.4156646728515625, -0.37591552734375, -0.3361663818359375, -0.296417236328125, -0.2566680908203125, -0.2169189453125, -0.1771697998046875, -0.137420654296875, -0.0976715087890625, -0.05792236328125, -0.0181732177734375, 0.021575927734375, 0.0613250732421875, 0.10107421875, 0.1408233642578125, 0.180572509765625, 0.2203216552734375, 0.26007080078125, 0.2998199462890625, 0.339569091796875, 0.3793182373046875, 0.4190673828125, 0.4588165283203125, 0.498565673828125, 0.5383148193359375, 0.57806396484375, 0.6178131103515625, 0.657562255859375, 0.6973114013671875, 0.737060546875, 0.7768096923828125, 0.816558837890625, 0.8563079833984375, 0.89605712890625, 0.9358062744140625, 0.975555419921875, 1.0153045654296875, 1.0550537109375, 1.0948028564453125, 1.134552001953125, 1.1743011474609375, 1.21405029296875, 1.2537994384765625, 1.293548583984375, 1.3332977294921875, 1.373046875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 5.0, 4.0, 5.0, 8.0, 11.0, 11.0, 16.0, 19.0, 26.0, 33.0, 47.0, 38.0, 62.0, 51.0, 55.0, 70.0, 66.0, 65.0, 64.0, 50.0, 61.0, 38.0, 42.0, 30.0, 23.0, 22.0, 12.0, 18.0, 11.0, 10.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-6.175041198730469e-05, -6.000883877277374e-05, -5.82672655582428e-05, -5.652569234371185e-05, -5.478411912918091e-05, -5.304254591464996e-05, -5.130097270011902e-05, -4.9559399485588074e-05, -4.781782627105713e-05, -4.6076253056526184e-05, -4.433467984199524e-05, -4.2593106627464294e-05, -4.085153341293335e-05, -3.9109960198402405e-05, -3.736838698387146e-05, -3.5626813769340515e-05, -3.388524055480957e-05, -3.2143667340278625e-05, -3.040209412574768e-05, -2.8660520911216736e-05, -2.691894769668579e-05, -2.5177374482154846e-05, -2.34358012676239e-05, -2.1694228053092957e-05, -1.9952654838562012e-05, -1.8211081624031067e-05, -1.6469508409500122e-05, -1.4727935194969177e-05, -1.2986361980438232e-05, -1.1244788765907288e-05, -9.503215551376343e-06, -7.761642336845398e-06, -6.020069122314453e-06, -4.278495907783508e-06, -2.5369226932525635e-06, -7.953494787216187e-07, 9.462237358093262e-07, 2.687796950340271e-06, 4.429370164871216e-06, 6.170943379402161e-06, 7.912516593933105e-06, 9.65408980846405e-06, 1.1395663022994995e-05, 1.313723623752594e-05, 1.4878809452056885e-05, 1.662038266658783e-05, 1.8361955881118774e-05, 2.010352909564972e-05, 2.1845102310180664e-05, 2.358667552471161e-05, 2.5328248739242554e-05, 2.70698219537735e-05, 2.8811395168304443e-05, 3.055296838283539e-05, 3.229454159736633e-05, 3.403611481189728e-05, 3.577768802642822e-05, 3.751926124095917e-05, 3.926083445549011e-05, 4.100240767002106e-05, 4.2743980884552e-05, 4.448555409908295e-05, 4.622712731361389e-05, 4.7968700528144836e-05, 4.971027374267578e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 7.0, 16.0, 15.0, 31.0, 36.0, 40.0, 83.0, 87.0, 178.0, 216.0, 352.0, 592.0, 899.0, 1574.0, 2646.0, 4492.0, 7947.0, 13937.0, 25314.0, 45292.0, 77816.0, 125526.0, 174377.0, 186411.0, 149380.0, 98263.0, 57636.0, 32537.0, 18292.0, 10212.0, 5879.0, 3376.0, 1921.0, 1110.0, 750.0, 476.0, 279.0, 206.0, 112.0, 102.0, 38.0, 36.0, 24.0, 13.0, 8.0, 7.0, 9.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.94921875, -0.9197616577148438, -0.8903045654296875, -0.8608474731445312, -0.831390380859375, -0.8019332885742188, -0.7724761962890625, -0.7430191040039062, -0.71356201171875, -0.6841049194335938, -0.6546478271484375, -0.6251907348632812, -0.595733642578125, -0.5662765502929688, -0.5368194580078125, -0.5073623657226562, -0.4779052734375, -0.44844818115234375, -0.4189910888671875, -0.38953399658203125, -0.360076904296875, -0.33061981201171875, -0.3011627197265625, -0.27170562744140625, -0.24224853515625, -0.21279144287109375, -0.1833343505859375, -0.15387725830078125, -0.124420166015625, -0.09496307373046875, -0.0655059814453125, -0.03604888916015625, -0.006591796875, 0.02286529541015625, 0.0523223876953125, 0.08177947998046875, 0.111236572265625, 0.14069366455078125, 0.1701507568359375, 0.19960784912109375, 0.22906494140625, 0.25852203369140625, 0.2879791259765625, 0.31743621826171875, 0.346893310546875, 0.37635040283203125, 0.4058074951171875, 0.43526458740234375, 0.4647216796875, 0.49417877197265625, 0.5236358642578125, 0.5530929565429688, 0.582550048828125, 0.6120071411132812, 0.6414642333984375, 0.6709213256835938, 0.70037841796875, 0.7298355102539062, 0.7592926025390625, 0.7887496948242188, 0.818206787109375, 0.8476638793945312, 0.8771209716796875, 0.9065780639648438, 0.93603515625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 7.0, 7.0, 16.0, 6.0, 9.0, 21.0, 8.0, 28.0, 28.0, 42.0, 46.0, 39.0, 59.0, 42.0, 65.0, 58.0, 58.0, 57.0, 58.0, 43.0, 37.0, 43.0, 40.0, 37.0, 25.0, 20.0, 20.0, 15.0, 13.0, 12.0, 13.0, 7.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.402099609375, -0.3919639587402344, -0.38182830810546875, -0.3716926574707031, -0.3615570068359375, -0.3514213562011719, -0.34128570556640625, -0.3311500549316406, -0.321014404296875, -0.3108787536621094, -0.30074310302734375, -0.2906074523925781, -0.2804718017578125, -0.2703361511230469, -0.26020050048828125, -0.2500648498535156, -0.23992919921875, -0.22979354858398438, -0.21965789794921875, -0.20952224731445312, -0.1993865966796875, -0.18925094604492188, -0.17911529541015625, -0.16897964477539062, -0.158843994140625, -0.14870834350585938, -0.13857269287109375, -0.12843704223632812, -0.1183013916015625, -0.10816574096679688, -0.09803009033203125, -0.08789443969726562, -0.0777587890625, -0.06762313842773438, -0.05748748779296875, -0.047351837158203125, -0.0372161865234375, -0.027080535888671875, -0.01694488525390625, -0.006809234619140625, 0.003326416015625, 0.013462066650390625, 0.02359771728515625, 0.033733367919921875, 0.0438690185546875, 0.054004669189453125, 0.06414031982421875, 0.07427597045898438, 0.08441162109375, 0.09454727172851562, 0.10468292236328125, 0.11481857299804688, 0.1249542236328125, 0.13508987426757812, 0.14522552490234375, 0.15536117553710938, 0.165496826171875, 0.17563247680664062, 0.18576812744140625, 0.19590377807617188, 0.2060394287109375, 0.21617507934570312, 0.22631072998046875, 0.23644638061523438, 0.24658203125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 5.0, 6.0, 4.0, 6.0, 6.0, 13.0, 7.0, 22.0, 21.0, 27.0, 35.0, 45.0, 42.0, 50.0, 68.0, 84.0, 87.0, 98.0, 77.0, 71.0, 61.0, 40.0, 35.0, 21.0, 26.0, 17.0, 10.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7426934242248535, -4.5798563957214355, -4.417019367218018, -4.2541823387146, -4.091345310211182, -3.9285082817077637, -3.7656710147857666, -3.6028339862823486, -3.4399969577789307, -3.2771599292755127, -3.1143229007720947, -2.9514858722686768, -2.7886486053466797, -2.6258115768432617, -2.4629745483398438, -2.300137519836426, -2.137300491333008, -1.9744634628295898, -1.8116264343261719, -1.6487892866134644, -1.4859522581100464, -1.3231152296066284, -1.160278081893921, -0.9974410533905029, -0.834604024887085, -0.671766996383667, -0.5089299082756042, -0.3460928499698639, -0.18325579166412354, -0.020418763160705566, 0.14241832494735718, 0.3052554130554199, 0.4680929183959961, 0.6309299468994141, 0.7937670350074768, 0.9566041231155396, 1.1194411516189575, 1.2822781801223755, 1.445115327835083, 1.607952356338501, 1.770789384841919, 1.933626413345337, 2.096463441848755, 2.259300470352173, 2.42213773727417, 2.584974765777588, 2.747811794281006, 2.910648822784424, 3.073485851287842, 3.2363228797912598, 3.3991599082946777, 3.5619969367980957, 3.7248339653015137, 3.8876709938049316, 4.05050802230835, 4.213345527648926, 4.376182556152344, 4.539019584655762, 4.70185661315918, 4.864693641662598, 5.027530670166016, 5.190367698669434, 5.353204727172852, 5.5160417556762695, 5.6788787841796875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 3.0, 8.0, 9.0, 9.0, 11.0, 18.0, 20.0, 13.0, 18.0, 38.0, 21.0, 32.0, 38.0, 31.0, 37.0, 39.0, 43.0, 40.0, 53.0, 47.0, 43.0, 40.0, 33.0, 36.0, 32.0, 25.0, 29.0, 34.0, 31.0, 33.0, 36.0, 17.0, 11.0, 10.0, 12.0, 5.0, 10.0, 7.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.489727258682251, -2.40222430229187, -2.3147213459014893, -2.2272186279296875, -2.1397156715393066, -2.052212715148926, -1.964709758758545, -1.877206802368164, -1.7897039651870728, -1.702201008796692, -1.6146981716156006, -1.5271952152252197, -1.4396922588348389, -1.3521894216537476, -1.2646864652633667, -1.1771836280822754, -1.0896806716918945, -1.0021777153015137, -0.9146748781204224, -0.8271719217300415, -0.7396690249443054, -0.6521661281585693, -0.5646631717681885, -0.4771602749824524, -0.3896573781967163, -0.3021544814109802, -0.21465155482292175, -0.12714862823486328, -0.0396457314491272, 0.04785716533660889, 0.13536012172698975, 0.22286301851272583, 0.3103659152984619, 0.397868812084198, 0.48537173867225647, 0.5728746652603149, 0.660377562046051, 0.7478804588317871, 0.835383415222168, 0.922886312007904, 1.0103892087936401, 1.097892165184021, 1.1853950023651123, 1.2728979587554932, 1.360400915145874, 1.4479037523269653, 1.5354067087173462, 1.6229095458984375, 1.7104125022888184, 1.7979154586791992, 1.8854182958602905, 1.9729212522506714, 2.0604240894317627, 2.1479270458221436, 2.2354300022125244, 2.3229329586029053, 2.410435676574707, 2.497938632965088, 2.5854415893554688, 2.6729445457458496, 2.7604472637176514, 2.8479502201080322, 2.935453176498413, 3.022956132888794, 3.110459089279175]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 15.0, 16.0, 20.0, 32.0, 54.0, 82.0, 111.0, 179.0, 320.0, 527.0, 822.0, 1309.0, 2158.0, 3596.0, 6159.0, 10182.0, 17808.0, 29654.0, 49429.0, 79789.0, 117098.0, 152707.0, 163343.0, 140694.0, 103527.0, 67442.0, 41069.0, 24388.0, 14594.0, 8564.0, 5099.0, 3011.0, 1797.0, 1104.0, 695.0, 411.0, 295.0, 158.0, 88.0, 62.0, 52.0, 31.0, 16.0, 17.0, 9.0, 6.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.515625, -2.44012451171875, -2.3646240234375, -2.28912353515625, -2.213623046875, -2.13812255859375, -2.0626220703125, -1.98712158203125, -1.91162109375, -1.83612060546875, -1.7606201171875, -1.68511962890625, -1.609619140625, -1.53411865234375, -1.4586181640625, -1.38311767578125, -1.3076171875, -1.23211669921875, -1.1566162109375, -1.08111572265625, -1.005615234375, -0.93011474609375, -0.8546142578125, -0.77911376953125, -0.70361328125, -0.62811279296875, -0.5526123046875, -0.47711181640625, -0.401611328125, -0.32611083984375, -0.2506103515625, -0.17510986328125, -0.099609375, -0.02410888671875, 0.0513916015625, 0.12689208984375, 0.202392578125, 0.27789306640625, 0.3533935546875, 0.42889404296875, 0.50439453125, 0.57989501953125, 0.6553955078125, 0.73089599609375, 0.806396484375, 0.88189697265625, 0.9573974609375, 1.03289794921875, 1.1083984375, 1.18389892578125, 1.2593994140625, 1.33489990234375, 1.410400390625, 1.48590087890625, 1.5614013671875, 1.63690185546875, 1.71240234375, 1.78790283203125, 1.8634033203125, 1.93890380859375, 2.014404296875, 2.08990478515625, 2.1654052734375, 2.24090576171875, 2.31640625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 16.0, 16.0, 10.0, 20.0, 13.0, 19.0, 24.0, 36.0, 29.0, 35.0, 27.0, 29.0, 54.0, 41.0, 46.0, 53.0, 42.0, 39.0, 34.0, 51.0, 46.0, 37.0, 26.0, 26.0, 34.0, 33.0, 23.0, 29.0, 20.0, 8.0, 14.0, 9.0, 9.0, 9.0, 6.0, 3.0, 1.0, 7.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.57763671875, -2.4833984375, -2.38916015625, -2.294921875, -2.20068359375, -2.1064453125, -2.01220703125, -1.91796875, -1.82373046875, -1.7294921875, -1.63525390625, -1.541015625, -1.44677734375, -1.3525390625, -1.25830078125, -1.1640625, -1.06982421875, -0.9755859375, -0.88134765625, -0.787109375, -0.69287109375, -0.5986328125, -0.50439453125, -0.41015625, -0.31591796875, -0.2216796875, -0.12744140625, -0.033203125, 0.06103515625, 0.1552734375, 0.24951171875, 0.34375, 0.43798828125, 0.5322265625, 0.62646484375, 0.720703125, 0.81494140625, 0.9091796875, 1.00341796875, 1.09765625, 1.19189453125, 1.2861328125, 1.38037109375, 1.474609375, 1.56884765625, 1.6630859375, 1.75732421875, 1.8515625, 1.94580078125, 2.0400390625, 2.13427734375, 2.228515625, 2.32275390625, 2.4169921875, 2.51123046875, 2.60546875, 2.69970703125, 2.7939453125, 2.88818359375, 2.982421875, 3.07666015625, 3.1708984375, 3.26513671875, 3.359375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 9.0, 13.0, 11.0, 24.0, 38.0, 57.0, 107.0, 163.0, 360.0, 677.0, 1407.0, 2905.0, 6354.0, 14386.0, 33521.0, 76426.0, 156150.0, 243372.0, 237710.0, 147772.0, 71039.0, 31270.0, 13475.0, 5942.0, 2664.0, 1257.0, 657.0, 339.0, 193.0, 81.0, 57.0, 31.0, 23.0, 19.0, 10.0, 15.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.305755615234375, -3.19158935546875, -3.077423095703125, -2.9632568359375, -2.849090576171875, -2.73492431640625, -2.620758056640625, -2.506591796875, -2.392425537109375, -2.27825927734375, -2.164093017578125, -2.0499267578125, -1.935760498046875, -1.82159423828125, -1.707427978515625, -1.59326171875, -1.479095458984375, -1.36492919921875, -1.250762939453125, -1.1365966796875, -1.022430419921875, -0.90826416015625, -0.794097900390625, -0.679931640625, -0.565765380859375, -0.45159912109375, -0.337432861328125, -0.2232666015625, -0.109100341796875, 0.00506591796875, 0.119232177734375, 0.2333984375, 0.347564697265625, 0.46173095703125, 0.575897216796875, 0.6900634765625, 0.804229736328125, 0.91839599609375, 1.032562255859375, 1.146728515625, 1.260894775390625, 1.37506103515625, 1.489227294921875, 1.6033935546875, 1.717559814453125, 1.83172607421875, 1.945892333984375, 2.06005859375, 2.174224853515625, 2.28839111328125, 2.402557373046875, 2.5167236328125, 2.630889892578125, 2.74505615234375, 2.859222412109375, 2.973388671875, 3.087554931640625, 3.20172119140625, 3.315887451171875, 3.4300537109375, 3.544219970703125, 3.65838623046875, 3.772552490234375, 3.88671875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 6.0, 9.0, 13.0, 12.0, 15.0, 20.0, 23.0, 26.0, 27.0, 37.0, 37.0, 48.0, 46.0, 42.0, 48.0, 34.0, 55.0, 39.0, 40.0, 48.0, 38.0, 40.0, 44.0, 36.0, 24.0, 27.0, 29.0, 17.0, 9.0, 21.0, 15.0, 11.0, 7.0, 12.0, 11.0, 5.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8876953125, -1.8268585205078125, -1.766021728515625, -1.7051849365234375, -1.64434814453125, -1.5835113525390625, -1.522674560546875, -1.4618377685546875, -1.4010009765625, -1.3401641845703125, -1.279327392578125, -1.2184906005859375, -1.15765380859375, -1.0968170166015625, -1.035980224609375, -0.9751434326171875, -0.914306640625, -0.8534698486328125, -0.792633056640625, -0.7317962646484375, -0.67095947265625, -0.6101226806640625, -0.549285888671875, -0.4884490966796875, -0.4276123046875, -0.3667755126953125, -0.305938720703125, -0.2451019287109375, -0.18426513671875, -0.1234283447265625, -0.062591552734375, -0.0017547607421875, 0.05908203125, 0.1199188232421875, 0.180755615234375, 0.2415924072265625, 0.30242919921875, 0.3632659912109375, 0.424102783203125, 0.4849395751953125, 0.5457763671875, 0.6066131591796875, 0.667449951171875, 0.7282867431640625, 0.78912353515625, 0.8499603271484375, 0.910797119140625, 0.9716339111328125, 1.032470703125, 1.0933074951171875, 1.154144287109375, 1.2149810791015625, 1.27581787109375, 1.3366546630859375, 1.397491455078125, 1.4583282470703125, 1.5191650390625, 1.5800018310546875, 1.640838623046875, 1.7016754150390625, 1.76251220703125, 1.8233489990234375, 1.884185791015625, 1.9450225830078125, 2.005859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 14.0, 28.0, 39.0, 67.0, 101.0, 157.0, 245.0, 375.0, 560.0, 937.0, 1503.0, 2356.0, 3955.0, 6792.0, 11691.0, 21260.0, 38068.0, 67596.0, 114920.0, 172432.0, 197957.0, 161658.0, 105463.0, 61155.0, 34152.0, 18702.0, 10839.0, 6103.0, 3619.0, 2114.0, 1297.0, 843.0, 529.0, 364.0, 229.0, 153.0, 108.0, 55.0, 46.0, 27.0, 16.0, 7.0, 12.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.529296875, -1.47900390625, -1.4287109375, -1.37841796875, -1.328125, -1.27783203125, -1.2275390625, -1.17724609375, -1.126953125, -1.07666015625, -1.0263671875, -0.97607421875, -0.92578125, -0.87548828125, -0.8251953125, -0.77490234375, -0.724609375, -0.67431640625, -0.6240234375, -0.57373046875, -0.5234375, -0.47314453125, -0.4228515625, -0.37255859375, -0.322265625, -0.27197265625, -0.2216796875, -0.17138671875, -0.12109375, -0.07080078125, -0.0205078125, 0.02978515625, 0.080078125, 0.13037109375, 0.1806640625, 0.23095703125, 0.28125, 0.33154296875, 0.3818359375, 0.43212890625, 0.482421875, 0.53271484375, 0.5830078125, 0.63330078125, 0.68359375, 0.73388671875, 0.7841796875, 0.83447265625, 0.884765625, 0.93505859375, 0.9853515625, 1.03564453125, 1.0859375, 1.13623046875, 1.1865234375, 1.23681640625, 1.287109375, 1.33740234375, 1.3876953125, 1.43798828125, 1.48828125, 1.53857421875, 1.5888671875, 1.63916015625, 1.689453125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 8.0, 11.0, 9.0, 17.0, 26.0, 31.0, 26.0, 59.0, 61.0, 64.0, 75.0, 63.0, 73.0, 81.0, 80.0, 66.0, 43.0, 30.0, 39.0, 29.0, 26.0, 17.0, 11.0, 14.0, 5.0, 7.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013768672943115234, -0.000132070854306221, -0.00012645497918128967, -0.00012083910405635834, -0.000115223228931427, -0.00010960735380649567, -0.00010399147868156433, -9.8375603556633e-05, -9.275972843170166e-05, -8.714385330677032e-05, -8.152797818183899e-05, -7.591210305690765e-05, -7.029622793197632e-05, -6.468035280704498e-05, -5.906447768211365e-05, -5.344860255718231e-05, -4.7832727432250977e-05, -4.221685230731964e-05, -3.6600977182388306e-05, -3.098510205745697e-05, -2.5369226932525635e-05, -1.97533518075943e-05, -1.4137476682662964e-05, -8.521601557731628e-06, -2.905726432800293e-06, 2.7101486921310425e-06, 8.326023817062378e-06, 1.3941898941993713e-05, 1.955777406692505e-05, 2.5173649191856384e-05, 3.078952431678772e-05, 3.6405399441719055e-05, 4.202127456665039e-05, 4.7637149691581726e-05, 5.325302481651306e-05, 5.88688999414444e-05, 6.448477506637573e-05, 7.010065019130707e-05, 7.57165253162384e-05, 8.133240044116974e-05, 8.694827556610107e-05, 9.256415069103241e-05, 9.818002581596375e-05, 0.00010379590094089508, 0.00010941177606582642, 0.00011502765119075775, 0.00012064352631568909, 0.00012625940144062042, 0.00013187527656555176, 0.0001374911516904831, 0.00014310702681541443, 0.00014872290194034576, 0.0001543387770652771, 0.00015995465219020844, 0.00016557052731513977, 0.0001711864024400711, 0.00017680227756500244, 0.00018241815268993378, 0.0001880340278148651, 0.00019364990293979645, 0.00019926577806472778, 0.00020488165318965912, 0.00021049752831459045, 0.0002161134034395218, 0.00022172927856445312]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 13.0, 16.0, 20.0, 38.0, 40.0, 69.0, 98.0, 126.0, 196.0, 260.0, 363.0, 575.0, 807.0, 1143.0, 1726.0, 2600.0, 3905.0, 5784.0, 8871.0, 13186.0, 20481.0, 31520.0, 48199.0, 72658.0, 104517.0, 135506.0, 149140.0, 134668.0, 103075.0, 71732.0, 47445.0, 30853.0, 19761.0, 13075.0, 8672.0, 5701.0, 3746.0, 2571.0, 1666.0, 1176.0, 768.0, 554.0, 393.0, 248.0, 180.0, 137.0, 91.0, 61.0, 37.0, 27.0, 25.0, 5.0, 11.0, 8.0, 12.0, 2.0, 4.0], "bins": [-1.25, -1.2126617431640625, -1.175323486328125, -1.1379852294921875, -1.10064697265625, -1.0633087158203125, -1.025970458984375, -0.9886322021484375, -0.9512939453125, -0.9139556884765625, -0.876617431640625, -0.8392791748046875, -0.80194091796875, -0.7646026611328125, -0.727264404296875, -0.6899261474609375, -0.652587890625, -0.6152496337890625, -0.577911376953125, -0.5405731201171875, -0.50323486328125, -0.4658966064453125, -0.428558349609375, -0.3912200927734375, -0.3538818359375, -0.3165435791015625, -0.279205322265625, -0.2418670654296875, -0.20452880859375, -0.1671905517578125, -0.129852294921875, -0.0925140380859375, -0.05517578125, -0.0178375244140625, 0.019500732421875, 0.0568389892578125, 0.09417724609375, 0.1315155029296875, 0.168853759765625, 0.2061920166015625, 0.2435302734375, 0.2808685302734375, 0.318206787109375, 0.3555450439453125, 0.39288330078125, 0.4302215576171875, 0.467559814453125, 0.5048980712890625, 0.542236328125, 0.5795745849609375, 0.616912841796875, 0.6542510986328125, 0.69158935546875, 0.7289276123046875, 0.766265869140625, 0.8036041259765625, 0.8409423828125, 0.8782806396484375, 0.915618896484375, 0.9529571533203125, 0.99029541015625, 1.0276336669921875, 1.064971923828125, 1.1023101806640625, 1.1396484375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 3.0, 8.0, 6.0, 10.0, 10.0, 15.0, 6.0, 13.0, 13.0, 20.0, 18.0, 22.0, 35.0, 31.0, 37.0, 46.0, 41.0, 38.0, 52.0, 45.0, 41.0, 41.0, 58.0, 43.0, 37.0, 44.0, 45.0, 35.0, 20.0, 28.0, 20.0, 18.0, 19.0, 10.0, 14.0, 10.0, 8.0, 8.0, 7.0, 6.0, 3.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.44189453125, -0.4282951354980469, -0.41469573974609375, -0.4010963439941406, -0.3874969482421875, -0.3738975524902344, -0.36029815673828125, -0.3466987609863281, -0.333099365234375, -0.3194999694824219, -0.30590057373046875, -0.2923011779785156, -0.2787017822265625, -0.2651023864746094, -0.25150299072265625, -0.23790359497070312, -0.22430419921875, -0.21070480346679688, -0.19710540771484375, -0.18350601196289062, -0.1699066162109375, -0.15630722045898438, -0.14270782470703125, -0.12910842895507812, -0.115509033203125, -0.10190963745117188, -0.08831024169921875, -0.07471084594726562, -0.0611114501953125, -0.047512054443359375, -0.03391265869140625, -0.020313262939453125, -0.0067138671875, 0.006885528564453125, 0.02048492431640625, 0.034084320068359375, 0.0476837158203125, 0.061283111572265625, 0.07488250732421875, 0.08848190307617188, 0.102081298828125, 0.11568069458007812, 0.12928009033203125, 0.14287948608398438, 0.1564788818359375, 0.17007827758789062, 0.18367767333984375, 0.19727706909179688, 0.21087646484375, 0.22447586059570312, 0.23807525634765625, 0.2516746520996094, 0.2652740478515625, 0.2788734436035156, 0.29247283935546875, 0.3060722351074219, 0.319671630859375, 0.3332710266113281, 0.34687042236328125, 0.3604698181152344, 0.3740692138671875, 0.3876686096191406, 0.40126800537109375, 0.4148674011230469, 0.428466796875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 8.0, 7.0, 4.0, 4.0, 14.0, 12.0, 18.0, 20.0, 20.0, 29.0, 42.0, 52.0, 61.0, 75.0, 97.0, 86.0, 97.0, 89.0, 71.0, 63.0, 37.0, 32.0, 24.0, 22.0, 9.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.418567180633545, -5.239041328430176, -5.059515953063965, -4.879990100860596, -4.700464725494385, -4.520938873291016, -4.341413497924805, -4.1618876457214355, -3.9823620319366455, -3.8028364181518555, -3.6233108043670654, -3.4437851905822754, -3.2642593383789062, -3.0847339630126953, -2.905208110809326, -2.725682497024536, -2.546156883239746, -2.366631269454956, -2.187105655670166, -2.007579803466797, -1.8280543088912964, -1.6485286951065063, -1.4690029621124268, -1.2894773483276367, -1.1099517345428467, -0.9304261207580566, -0.7509004473686218, -0.571374773979187, -0.391849160194397, -0.21232354640960693, -0.032797813415527344, 0.1467278003692627, 0.32625293731689453, 0.5057785511016846, 0.6853042244911194, 0.8648298978805542, 1.0443555116653442, 1.2238811254501343, 1.4034068584442139, 1.582932472229004, 1.762458086013794, 1.941983699798584, 2.121509313583374, 2.301034927368164, 2.480560779571533, 2.660086154937744, 2.8396120071411133, 3.0191376209259033, 3.1986632347106934, 3.3781888484954834, 3.5577144622802734, 3.7372403144836426, 3.9167656898498535, 4.096291542053223, 4.275816917419434, 4.455342769622803, 4.634868621826172, 4.814394474029541, 4.993919849395752, 5.173445701599121, 5.352971076965332, 5.532496929168701, 5.71202278137207, 5.891548156738281, 6.071073532104492]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 1.0, 6.0, 3.0, 6.0, 4.0, 14.0, 16.0, 12.0, 10.0, 20.0, 12.0, 16.0, 24.0, 33.0, 35.0, 33.0, 29.0, 37.0, 33.0, 35.0, 52.0, 34.0, 42.0, 44.0, 35.0, 39.0, 30.0, 37.0, 29.0, 31.0, 29.0, 25.0, 19.0, 19.0, 27.0, 20.0, 11.0, 11.0, 12.0, 16.0, 10.0, 12.0, 8.0, 7.0, 5.0, 5.0, 5.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.536133050918579, -2.456820011138916, -2.377506971359253, -2.29819393157959, -2.2188808917999268, -2.1395678520202637, -2.0602545738220215, -1.9809415340423584, -1.9016284942626953, -1.8223154544830322, -1.7430024147033691, -1.663689374923706, -1.5843762159347534, -1.5050631761550903, -1.4257501363754272, -1.3464369773864746, -1.267124056816101, -1.187811017036438, -1.108497977256775, -1.0291848182678223, -0.9498717784881592, -0.8705587387084961, -0.791245698928833, -0.7119325995445251, -0.6326195597648621, -0.553306519985199, -0.4739934206008911, -0.394680380821228, -0.31536731123924255, -0.23605424165725708, -0.156741201877594, -0.07742810249328613, 0.0018849372863769531, 0.08119799941778183, 0.1605110615491867, 0.239824116230011, 0.31913718581199646, 0.39845025539398193, 0.477763295173645, 0.5570763945579529, 0.636389434337616, 0.715702474117279, 0.7950155735015869, 0.87432861328125, 0.9536416530609131, 1.0329546928405762, 1.1122677326202393, 1.191580891609192, 1.270893931388855, 1.350206971168518, 1.4295200109481812, 1.5088331699371338, 1.5881462097167969, 1.66745924949646, 1.746772289276123, 1.8260853290557861, 1.9053983688354492, 1.9847114086151123, 2.0640244483947754, 2.1433374881744385, 2.2226505279541016, 2.3019638061523438, 2.3812766075134277, 2.46058988571167, 2.539902925491333]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 11.0, 10.0, 15.0, 21.0, 30.0, 58.0, 70.0, 127.0, 168.0, 243.0, 370.0, 533.0, 827.0, 1354.0, 2065.0, 3411.0, 5632.0, 9722.0, 17371.0, 34325.0, 75012.0, 200289.0, 599981.0, 1344032.0, 1170329.0, 448482.0, 152505.0, 61160.0, 28687.0, 15398.0, 8608.0, 5081.0, 3085.0, 1917.0, 1210.0, 781.0, 489.0, 315.0, 192.0, 142.0, 75.0, 48.0, 35.0, 25.0, 17.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.4375, -4.302490234375, -4.16748046875, -4.032470703125, -3.8974609375, -3.762451171875, -3.62744140625, -3.492431640625, -3.357421875, -3.222412109375, -3.08740234375, -2.952392578125, -2.8173828125, -2.682373046875, -2.54736328125, -2.412353515625, -2.27734375, -2.142333984375, -2.00732421875, -1.872314453125, -1.7373046875, -1.602294921875, -1.46728515625, -1.332275390625, -1.197265625, -1.062255859375, -0.92724609375, -0.792236328125, -0.6572265625, -0.522216796875, -0.38720703125, -0.252197265625, -0.1171875, 0.017822265625, 0.15283203125, 0.287841796875, 0.4228515625, 0.557861328125, 0.69287109375, 0.827880859375, 0.962890625, 1.097900390625, 1.23291015625, 1.367919921875, 1.5029296875, 1.637939453125, 1.77294921875, 1.907958984375, 2.04296875, 2.177978515625, 2.31298828125, 2.447998046875, 2.5830078125, 2.718017578125, 2.85302734375, 2.988037109375, 3.123046875, 3.258056640625, 3.39306640625, 3.528076171875, 3.6630859375, 3.798095703125, 3.93310546875, 4.068115234375, 4.203125]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 2.0, 9.0, 15.0, 13.0, 9.0, 9.0, 11.0, 26.0, 20.0, 19.0, 18.0, 37.0, 31.0, 28.0, 39.0, 38.0, 39.0, 44.0, 54.0, 49.0, 37.0, 35.0, 29.0, 45.0, 43.0, 28.0, 40.0, 19.0, 22.0, 29.0, 21.0, 17.0, 17.0, 14.0, 12.0, 9.0, 8.0, 17.0, 14.0, 3.0, 3.0, 6.0, 4.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73828125, -1.679718017578125, -1.62115478515625, -1.562591552734375, -1.5040283203125, -1.445465087890625, -1.38690185546875, -1.328338623046875, -1.269775390625, -1.211212158203125, -1.15264892578125, -1.094085693359375, -1.0355224609375, -0.976959228515625, -0.91839599609375, -0.859832763671875, -0.80126953125, -0.742706298828125, -0.68414306640625, -0.625579833984375, -0.5670166015625, -0.508453369140625, -0.44989013671875, -0.391326904296875, -0.332763671875, -0.274200439453125, -0.21563720703125, -0.157073974609375, -0.0985107421875, -0.039947509765625, 0.01861572265625, 0.077178955078125, 0.1357421875, 0.194305419921875, 0.25286865234375, 0.311431884765625, 0.3699951171875, 0.428558349609375, 0.48712158203125, 0.545684814453125, 0.604248046875, 0.662811279296875, 0.72137451171875, 0.779937744140625, 0.8385009765625, 0.897064208984375, 0.95562744140625, 1.014190673828125, 1.07275390625, 1.131317138671875, 1.18988037109375, 1.248443603515625, 1.3070068359375, 1.365570068359375, 1.42413330078125, 1.482696533203125, 1.541259765625, 1.599822998046875, 1.65838623046875, 1.716949462890625, 1.7755126953125, 1.834075927734375, 1.89263916015625, 1.951202392578125, 2.009765625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 2.0, 5.0, 4.0, 8.0, 10.0, 18.0, 26.0, 23.0, 50.0, 61.0, 111.0, 148.0, 252.0, 393.0, 620.0, 1041.0, 1798.0, 3256.0, 5702.0, 10856.0, 21448.0, 45701.0, 106992.0, 288729.0, 886074.0, 1607045.0, 780560.0, 253842.0, 95690.0, 41505.0, 19562.0, 9974.0, 5178.0, 2978.0, 1806.0, 1019.0, 645.0, 403.0, 252.0, 171.0, 114.0, 77.0, 39.0, 23.0, 22.0, 17.0, 15.0, 8.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3203125, -5.15631103515625, -4.9923095703125, -4.82830810546875, -4.664306640625, -4.50030517578125, -4.3363037109375, -4.17230224609375, -4.00830078125, -3.84429931640625, -3.6802978515625, -3.51629638671875, -3.352294921875, -3.18829345703125, -3.0242919921875, -2.86029052734375, -2.6962890625, -2.53228759765625, -2.3682861328125, -2.20428466796875, -2.040283203125, -1.87628173828125, -1.7122802734375, -1.54827880859375, -1.38427734375, -1.22027587890625, -1.0562744140625, -0.89227294921875, -0.728271484375, -0.56427001953125, -0.4002685546875, -0.23626708984375, -0.072265625, 0.09173583984375, 0.2557373046875, 0.41973876953125, 0.583740234375, 0.74774169921875, 0.9117431640625, 1.07574462890625, 1.23974609375, 1.40374755859375, 1.5677490234375, 1.73175048828125, 1.895751953125, 2.05975341796875, 2.2237548828125, 2.38775634765625, 2.5517578125, 2.71575927734375, 2.8797607421875, 3.04376220703125, 3.207763671875, 3.37176513671875, 3.5357666015625, 3.69976806640625, 3.86376953125, 4.02777099609375, 4.1917724609375, 4.35577392578125, 4.519775390625, 4.68377685546875, 4.8477783203125, 5.01177978515625, 5.17578125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 7.0, 8.0, 2.0, 5.0, 11.0, 15.0, 17.0, 26.0, 30.0, 39.0, 49.0, 64.0, 101.0, 108.0, 157.0, 208.0, 234.0, 291.0, 393.0, 359.0, 358.0, 308.0, 307.0, 211.0, 142.0, 145.0, 112.0, 96.0, 53.0, 52.0, 27.0, 21.0, 26.0, 33.0, 15.0, 8.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.595703125, -1.55419921875, -1.5126953125, -1.47119140625, -1.4296875, -1.38818359375, -1.3466796875, -1.30517578125, -1.263671875, -1.22216796875, -1.1806640625, -1.13916015625, -1.09765625, -1.05615234375, -1.0146484375, -0.97314453125, -0.931640625, -0.89013671875, -0.8486328125, -0.80712890625, -0.765625, -0.72412109375, -0.6826171875, -0.64111328125, -0.599609375, -0.55810546875, -0.5166015625, -0.47509765625, -0.43359375, -0.39208984375, -0.3505859375, -0.30908203125, -0.267578125, -0.22607421875, -0.1845703125, -0.14306640625, -0.1015625, -0.06005859375, -0.0185546875, 0.02294921875, 0.064453125, 0.10595703125, 0.1474609375, 0.18896484375, 0.23046875, 0.27197265625, 0.3134765625, 0.35498046875, 0.396484375, 0.43798828125, 0.4794921875, 0.52099609375, 0.5625, 0.60400390625, 0.6455078125, 0.68701171875, 0.728515625, 0.77001953125, 0.8115234375, 0.85302734375, 0.89453125, 0.93603515625, 0.9775390625, 1.01904296875, 1.060546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 8.0, 19.0, 17.0, 19.0, 30.0, 31.0, 47.0, 59.0, 83.0, 95.0, 97.0, 102.0, 96.0, 73.0, 60.0, 32.0, 39.0, 16.0, 18.0, 12.0, 14.0, 7.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.538046360015869, -4.360090732574463, -4.182135105133057, -4.00417947769165, -3.826223850250244, -3.648268222808838, -3.4703125953674316, -3.2923569679260254, -3.114401340484619, -2.936445713043213, -2.7584900856018066, -2.5805344581604004, -2.402578830718994, -2.224623203277588, -2.0466675758361816, -1.868712067604065, -1.6907565593719482, -1.512800931930542, -1.3348453044891357, -1.1568896770477295, -0.978934109210968, -0.8009784817695618, -0.6230229139328003, -0.44506728649139404, -0.2671116590499878, -0.08915604650974274, 0.08879956603050232, 0.2667551636695862, 0.44471079111099243, 0.6226664185523987, 0.8006219863891602, 0.9785776138305664, 1.1565332412719727, 1.334488868713379, 1.5124444961547852, 1.6904001235961914, 1.8683557510375977, 2.046311378479004, 2.22426700592041, 2.4022226333618164, 2.5801782608032227, 2.758133888244629, 2.936089515686035, 3.1140451431274414, 3.2920007705688477, 3.469956398010254, 3.64791202545166, 3.8258676528930664, 4.003823280334473, 4.181778907775879, 4.359734535217285, 4.537690162658691, 4.715645790100098, 4.893601417541504, 5.07155704498291, 5.249512672424316, 5.4274678230285645, 5.605423450469971, 5.783379077911377, 5.961334705352783, 6.1392903327941895, 6.317245960235596, 6.495201587677002, 6.673157215118408, 6.8511128425598145]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 11.0, 12.0, 14.0, 16.0, 15.0, 19.0, 17.0, 13.0, 30.0, 27.0, 30.0, 27.0, 42.0, 32.0, 36.0, 30.0, 35.0, 50.0, 44.0, 36.0, 39.0, 41.0, 38.0, 48.0, 25.0, 27.0, 33.0, 32.0, 17.0, 21.0, 17.0, 14.0, 24.0, 16.0, 14.0, 9.0, 6.0, 7.0, 7.0, 5.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.4920685291290283, -2.4166033267974854, -2.3411381244659424, -2.2656726837158203, -2.1902074813842773, -2.1147422790527344, -2.0392770767211914, -1.9638117551803589, -1.8883464336395264, -1.8128812313079834, -1.7374159097671509, -1.661950707435608, -1.5864853858947754, -1.5110201835632324, -1.4355549812316895, -1.360089659690857, -1.284624457359314, -1.209159255027771, -1.1336939334869385, -1.0582287311553955, -0.982763409614563, -0.90729820728302, -0.8318329453468323, -0.7563676834106445, -0.6809024214744568, -0.605437159538269, -0.5299718976020813, -0.45450666546821594, -0.3790414035320282, -0.30357614159584045, -0.2281109094619751, -0.15264564752578735, -0.07718038558959961, -0.0017151311039924622, 0.07375012338161469, 0.14921537041664124, 0.22468063235282898, 0.3001458942890167, 0.3756111264228821, 0.4510763883590698, 0.5265416502952576, 0.6020069122314453, 0.6774721741676331, 0.7529374361038208, 0.8284026384353638, 0.9038679599761963, 0.9793331623077393, 1.0547983646392822, 1.1302636861801147, 1.2057288885116577, 1.2811942100524902, 1.3566594123840332, 1.4321247339248657, 1.5075899362564087, 1.5830552577972412, 1.6585204601287842, 1.7339856624603271, 1.8094508647918701, 1.8849161863327026, 1.9603813886642456, 2.035846710205078, 2.111311912536621, 2.186777114868164, 2.262242317199707, 2.337707757949829]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 6.0, 10.0, 14.0, 22.0, 35.0, 51.0, 77.0, 109.0, 163.0, 234.0, 365.0, 553.0, 938.0, 1391.0, 1930.0, 3142.0, 4907.0, 7639.0, 11886.0, 18425.0, 28706.0, 44392.0, 68391.0, 100776.0, 136286.0, 155055.0, 142501.0, 108305.0, 74614.0, 49144.0, 31759.0, 20359.0, 12812.0, 8308.0, 5435.0, 3357.0, 2143.0, 1497.0, 993.0, 646.0, 367.0, 263.0, 196.0, 126.0, 84.0, 47.0, 41.0, 25.0, 14.0, 15.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.4052734375, -1.360809326171875, -1.31634521484375, -1.271881103515625, -1.2274169921875, -1.182952880859375, -1.13848876953125, -1.094024658203125, -1.049560546875, -1.005096435546875, -0.96063232421875, -0.916168212890625, -0.8717041015625, -0.827239990234375, -0.78277587890625, -0.738311767578125, -0.69384765625, -0.649383544921875, -0.60491943359375, -0.560455322265625, -0.5159912109375, -0.471527099609375, -0.42706298828125, -0.382598876953125, -0.338134765625, -0.293670654296875, -0.24920654296875, -0.204742431640625, -0.1602783203125, -0.115814208984375, -0.07135009765625, -0.026885986328125, 0.017578125, 0.062042236328125, 0.10650634765625, 0.150970458984375, 0.1954345703125, 0.239898681640625, 0.28436279296875, 0.328826904296875, 0.373291015625, 0.417755126953125, 0.46221923828125, 0.506683349609375, 0.5511474609375, 0.595611572265625, 0.64007568359375, 0.684539794921875, 0.72900390625, 0.773468017578125, 0.81793212890625, 0.862396240234375, 0.9068603515625, 0.951324462890625, 0.99578857421875, 1.040252685546875, 1.084716796875, 1.129180908203125, 1.17364501953125, 1.218109130859375, 1.2625732421875, 1.307037353515625, 1.35150146484375, 1.395965576171875, 1.4404296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 7.0, 7.0, 3.0, 10.0, 13.0, 12.0, 18.0, 19.0, 22.0, 18.0, 23.0, 38.0, 34.0, 32.0, 34.0, 29.0, 36.0, 44.0, 52.0, 42.0, 40.0, 47.0, 62.0, 41.0, 33.0, 42.0, 28.0, 33.0, 30.0, 21.0, 24.0, 17.0, 18.0, 15.0, 10.0, 11.0, 8.0, 9.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.81640625, -2.7259521484375, -2.635498046875, -2.5450439453125, -2.45458984375, -2.3641357421875, -2.273681640625, -2.1832275390625, -2.0927734375, -2.0023193359375, -1.911865234375, -1.8214111328125, -1.73095703125, -1.6405029296875, -1.550048828125, -1.4595947265625, -1.369140625, -1.2786865234375, -1.188232421875, -1.0977783203125, -1.00732421875, -0.9168701171875, -0.826416015625, -0.7359619140625, -0.6455078125, -0.5550537109375, -0.464599609375, -0.3741455078125, -0.28369140625, -0.1932373046875, -0.102783203125, -0.0123291015625, 0.078125, 0.1685791015625, 0.259033203125, 0.3494873046875, 0.43994140625, 0.5303955078125, 0.620849609375, 0.7113037109375, 0.8017578125, 0.8922119140625, 0.982666015625, 1.0731201171875, 1.16357421875, 1.2540283203125, 1.344482421875, 1.4349365234375, 1.525390625, 1.6158447265625, 1.706298828125, 1.7967529296875, 1.88720703125, 1.9776611328125, 2.068115234375, 2.1585693359375, 2.2490234375, 2.3394775390625, 2.429931640625, 2.5203857421875, 2.61083984375, 2.7012939453125, 2.791748046875, 2.8822021484375, 2.97265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 14.0, 19.0, 38.0, 48.0, 93.0, 134.0, 200.0, 317.0, 508.0, 869.0, 1290.0, 2347.0, 4091.0, 7482.0, 13961.0, 27878.0, 56421.0, 114256.0, 216795.0, 264857.0, 167221.0, 84003.0, 40641.0, 20635.0, 10840.0, 5801.0, 3128.0, 1826.0, 1064.0, 674.0, 400.0, 233.0, 180.0, 96.0, 69.0, 51.0, 17.0, 13.0, 18.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.630859375, -2.5467529296875, -2.462646484375, -2.3785400390625, -2.29443359375, -2.2103271484375, -2.126220703125, -2.0421142578125, -1.9580078125, -1.8739013671875, -1.789794921875, -1.7056884765625, -1.62158203125, -1.5374755859375, -1.453369140625, -1.3692626953125, -1.28515625, -1.2010498046875, -1.116943359375, -1.0328369140625, -0.94873046875, -0.8646240234375, -0.780517578125, -0.6964111328125, -0.6123046875, -0.5281982421875, -0.444091796875, -0.3599853515625, -0.27587890625, -0.1917724609375, -0.107666015625, -0.0235595703125, 0.060546875, 0.1446533203125, 0.228759765625, 0.3128662109375, 0.39697265625, 0.4810791015625, 0.565185546875, 0.6492919921875, 0.7333984375, 0.8175048828125, 0.901611328125, 0.9857177734375, 1.06982421875, 1.1539306640625, 1.238037109375, 1.3221435546875, 1.40625, 1.4903564453125, 1.574462890625, 1.6585693359375, 1.74267578125, 1.8267822265625, 1.910888671875, 1.9949951171875, 2.0791015625, 2.1632080078125, 2.247314453125, 2.3314208984375, 2.41552734375, 2.4996337890625, 2.583740234375, 2.6678466796875, 2.751953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 9.0, 6.0, 9.0, 6.0, 8.0, 9.0, 12.0, 20.0, 15.0, 18.0, 13.0, 29.0, 20.0, 28.0, 30.0, 32.0, 40.0, 39.0, 42.0, 42.0, 48.0, 40.0, 40.0, 44.0, 43.0, 39.0, 35.0, 21.0, 40.0, 44.0, 21.0, 22.0, 24.0, 17.0, 19.0, 13.0, 20.0, 11.0, 6.0, 10.0, 7.0, 2.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.732421875, -1.68060302734375, -1.6287841796875, -1.57696533203125, -1.525146484375, -1.47332763671875, -1.4215087890625, -1.36968994140625, -1.31787109375, -1.26605224609375, -1.2142333984375, -1.16241455078125, -1.110595703125, -1.05877685546875, -1.0069580078125, -0.95513916015625, -0.9033203125, -0.85150146484375, -0.7996826171875, -0.74786376953125, -0.696044921875, -0.64422607421875, -0.5924072265625, -0.54058837890625, -0.48876953125, -0.43695068359375, -0.3851318359375, -0.33331298828125, -0.281494140625, -0.22967529296875, -0.1778564453125, -0.12603759765625, -0.07421875, -0.02239990234375, 0.0294189453125, 0.08123779296875, 0.133056640625, 0.18487548828125, 0.2366943359375, 0.28851318359375, 0.34033203125, 0.39215087890625, 0.4439697265625, 0.49578857421875, 0.547607421875, 0.59942626953125, 0.6512451171875, 0.70306396484375, 0.7548828125, 0.80670166015625, 0.8585205078125, 0.91033935546875, 0.962158203125, 1.01397705078125, 1.0657958984375, 1.11761474609375, 1.16943359375, 1.22125244140625, 1.2730712890625, 1.32489013671875, 1.376708984375, 1.42852783203125, 1.4803466796875, 1.53216552734375, 1.583984375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 20.0, 23.0, 30.0, 44.0, 61.0, 76.0, 115.0, 177.0, 241.0, 326.0, 524.0, 850.0, 1351.0, 2078.0, 3599.0, 5927.0, 10128.0, 18688.0, 33908.0, 65139.0, 124467.0, 217675.0, 241585.0, 149816.0, 78595.0, 41065.0, 21814.0, 12073.0, 7094.0, 4097.0, 2441.0, 1499.0, 1007.0, 612.0, 444.0, 303.0, 200.0, 140.0, 95.0, 64.0, 54.0, 27.0, 18.0, 14.0, 12.0, 10.0, 8.0, 5.0, 0.0, 2.0, 2.0, 3.0], "bins": [-1.05859375, -1.0275955200195312, -0.9965972900390625, -0.9655990600585938, -0.934600830078125, -0.9036026000976562, -0.8726043701171875, -0.8416061401367188, -0.81060791015625, -0.7796096801757812, -0.7486114501953125, -0.7176132202148438, -0.686614990234375, -0.6556167602539062, -0.6246185302734375, -0.5936203002929688, -0.5626220703125, -0.5316238403320312, -0.5006256103515625, -0.46962738037109375, -0.438629150390625, -0.40763092041015625, -0.3766326904296875, -0.34563446044921875, -0.31463623046875, -0.28363800048828125, -0.2526397705078125, -0.22164154052734375, -0.190643310546875, -0.15964508056640625, -0.1286468505859375, -0.09764862060546875, -0.066650390625, -0.03565216064453125, -0.0046539306640625, 0.02634429931640625, 0.057342529296875, 0.08834075927734375, 0.1193389892578125, 0.15033721923828125, 0.18133544921875, 0.21233367919921875, 0.2433319091796875, 0.27433013916015625, 0.305328369140625, 0.33632659912109375, 0.3673248291015625, 0.39832305908203125, 0.4293212890625, 0.46031951904296875, 0.4913177490234375, 0.5223159790039062, 0.553314208984375, 0.5843124389648438, 0.6153106689453125, 0.6463088989257812, 0.67730712890625, 0.7083053588867188, 0.7393035888671875, 0.7703018188476562, 0.801300048828125, 0.8322982788085938, 0.8632965087890625, 0.8942947387695312, 0.92529296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 3.0, 15.0, 5.0, 7.0, 16.0, 21.0, 24.0, 28.0, 29.0, 47.0, 62.0, 75.0, 72.0, 81.0, 86.0, 80.0, 84.0, 57.0, 36.0, 39.0, 35.0, 14.0, 24.0, 9.0, 8.0, 8.0, 11.0, 9.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.27501106262207e-05, -5.086418241262436e-05, -4.8978254199028015e-05, -4.709232598543167e-05, -4.520639777183533e-05, -4.332046955823898e-05, -4.143454134464264e-05, -3.9548613131046295e-05, -3.766268491744995e-05, -3.577675670385361e-05, -3.389082849025726e-05, -3.200490027666092e-05, -3.0118972063064575e-05, -2.823304384946823e-05, -2.6347115635871887e-05, -2.4461187422275543e-05, -2.25752592086792e-05, -2.0689330995082855e-05, -1.880340278148651e-05, -1.6917474567890167e-05, -1.5031546354293823e-05, -1.314561814069748e-05, -1.1259689927101135e-05, -9.373761713504791e-06, -7.487833499908447e-06, -5.601905286312103e-06, -3.7159770727157593e-06, -1.8300488591194153e-06, 5.587935447692871e-08, 1.9418075680732727e-06, 3.827735781669617e-06, 5.713663995265961e-06, 7.599592208862305e-06, 9.485520422458649e-06, 1.1371448636054993e-05, 1.3257376849651337e-05, 1.514330506324768e-05, 1.7029233276844025e-05, 1.891516149044037e-05, 2.0801089704036713e-05, 2.2687017917633057e-05, 2.45729461312294e-05, 2.6458874344825745e-05, 2.834480255842209e-05, 3.0230730772018433e-05, 3.2116658985614777e-05, 3.400258719921112e-05, 3.5888515412807465e-05, 3.777444362640381e-05, 3.966037184000015e-05, 4.1546300053596497e-05, 4.343222826719284e-05, 4.5318156480789185e-05, 4.720408469438553e-05, 4.909001290798187e-05, 5.0975941121578217e-05, 5.286186933517456e-05, 5.4747797548770905e-05, 5.663372576236725e-05, 5.851965397596359e-05, 6.0405582189559937e-05, 6.229151040315628e-05, 6.417743861675262e-05, 6.606336683034897e-05, 6.794929504394531e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 12.0, 18.0, 26.0, 42.0, 51.0, 71.0, 93.0, 113.0, 184.0, 288.0, 383.0, 679.0, 1029.0, 1832.0, 3356.0, 6321.0, 12298.0, 25476.0, 52893.0, 109810.0, 199898.0, 249791.0, 186695.0, 100681.0, 48361.0, 23254.0, 11397.0, 5666.0, 3117.0, 1711.0, 1102.0, 654.0, 397.0, 271.0, 157.0, 134.0, 78.0, 55.0, 31.0, 38.0, 21.0, 18.0, 13.0, 13.0, 6.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.98046875, -0.94927978515625, -0.9180908203125, -0.88690185546875, -0.855712890625, -0.82452392578125, -0.7933349609375, -0.76214599609375, -0.73095703125, -0.69976806640625, -0.6685791015625, -0.63739013671875, -0.606201171875, -0.57501220703125, -0.5438232421875, -0.51263427734375, -0.4814453125, -0.45025634765625, -0.4190673828125, -0.38787841796875, -0.356689453125, -0.32550048828125, -0.2943115234375, -0.26312255859375, -0.23193359375, -0.20074462890625, -0.1695556640625, -0.13836669921875, -0.107177734375, -0.07598876953125, -0.0447998046875, -0.01361083984375, 0.017578125, 0.04876708984375, 0.0799560546875, 0.11114501953125, 0.142333984375, 0.17352294921875, 0.2047119140625, 0.23590087890625, 0.26708984375, 0.29827880859375, 0.3294677734375, 0.36065673828125, 0.391845703125, 0.42303466796875, 0.4542236328125, 0.48541259765625, 0.5166015625, 0.54779052734375, 0.5789794921875, 0.61016845703125, 0.641357421875, 0.67254638671875, 0.7037353515625, 0.73492431640625, 0.76611328125, 0.79730224609375, 0.8284912109375, 0.85968017578125, 0.890869140625, 0.92205810546875, 0.9532470703125, 0.98443603515625, 1.015625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 5.0, 4.0, 10.0, 12.0, 12.0, 20.0, 15.0, 11.0, 27.0, 38.0, 39.0, 61.0, 50.0, 55.0, 56.0, 59.0, 51.0, 67.0, 57.0, 58.0, 48.0, 44.0, 42.0, 22.0, 28.0, 22.0, 17.0, 16.0, 10.0, 10.0, 6.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.302978515625, -0.2939796447753906, -0.28498077392578125, -0.2759819030761719, -0.2669830322265625, -0.2579841613769531, -0.24898529052734375, -0.23998641967773438, -0.230987548828125, -0.22198867797851562, -0.21298980712890625, -0.20399093627929688, -0.1949920654296875, -0.18599319458007812, -0.17699432373046875, -0.16799545288085938, -0.15899658203125, -0.14999771118164062, -0.14099884033203125, -0.13199996948242188, -0.1230010986328125, -0.11400222778320312, -0.10500335693359375, -0.09600448608398438, -0.087005615234375, -0.07800674438476562, -0.06900787353515625, -0.060009002685546875, -0.0510101318359375, -0.042011260986328125, -0.03301239013671875, -0.024013519287109375, -0.0150146484375, -0.006015777587890625, 0.00298309326171875, 0.011981964111328125, 0.0209808349609375, 0.029979705810546875, 0.03897857666015625, 0.047977447509765625, 0.056976318359375, 0.06597518920898438, 0.07497406005859375, 0.08397293090820312, 0.0929718017578125, 0.10197067260742188, 0.11096954345703125, 0.11996841430664062, 0.12896728515625, 0.13796615600585938, 0.14696502685546875, 0.15596389770507812, 0.1649627685546875, 0.17396163940429688, 0.18296051025390625, 0.19195938110351562, 0.200958251953125, 0.20995712280273438, 0.21895599365234375, 0.22795486450195312, 0.2369537353515625, 0.24595260620117188, 0.25495147705078125, 0.2639503479003906, 0.27294921875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 7.0, 10.0, 12.0, 10.0, 19.0, 22.0, 22.0, 31.0, 51.0, 66.0, 74.0, 77.0, 101.0, 103.0, 92.0, 70.0, 65.0, 51.0, 28.0, 21.0, 8.0, 17.0, 12.0, 9.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.374643802642822, -4.203861713409424, -4.033079624176025, -3.862297534942627, -3.6915156841278076, -3.520733594894409, -3.3499515056610107, -3.1791696548461914, -3.008387565612793, -2.8376054763793945, -2.666823387145996, -2.4960412979125977, -2.3252594470977783, -2.15447735786438, -1.9836952686309814, -1.8129132986068726, -1.6421310901641846, -1.4713490009307861, -1.3005670309066772, -1.1297849416732788, -0.9590029120445251, -0.7882208824157715, -0.617438793182373, -0.44665682315826416, -0.2758747339248657, -0.10509268939495087, 0.06568935513496399, 0.23647141456604004, 0.4072534441947937, 0.5780354738235474, 0.7488175630569458, 0.9195995330810547, 1.0903816223144531, 1.2611637115478516, 1.4319456815719604, 1.6027277708053589, 1.7735097408294678, 1.9442918300628662, 2.1150739192962646, 2.285855770111084, 2.4566378593444824, 2.627419948577881, 2.7982020378112793, 2.9689841270446777, 3.139765977859497, 3.3105480670928955, 3.481330156326294, 3.6521120071411133, 3.822894334793091, 3.9936764240264893, 4.164458274841309, 4.335240364074707, 4.5060224533081055, 4.676804542541504, 4.847586631774902, 5.018368721008301, 5.189150810241699, 5.359932899475098, 5.530714988708496, 5.7014970779418945, 5.872279167175293, 6.043061256408691, 6.21384334564209, 6.38462495803833, 6.5554070472717285]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 12.0, 12.0, 15.0, 19.0, 15.0, 15.0, 18.0, 21.0, 25.0, 31.0, 24.0, 35.0, 39.0, 28.0, 39.0, 32.0, 33.0, 47.0, 43.0, 38.0, 39.0, 47.0, 40.0, 30.0, 29.0, 32.0, 35.0, 26.0, 15.0, 18.0, 22.0, 15.0, 24.0, 15.0, 12.0, 10.0, 6.0, 5.0, 5.0, 8.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.40902042388916, -2.3349692821502686, -2.260918378829956, -2.1868672370910645, -2.112816333770752, -2.0387651920318604, -1.9647140502929688, -1.8906630277633667, -1.8166120052337646, -1.7425609827041626, -1.6685099601745605, -1.594458818435669, -1.520407795906067, -1.4463567733764648, -1.3723056316375732, -1.2982546091079712, -1.2242035865783691, -1.150152564048767, -1.076101541519165, -1.0020503997802734, -0.9279993772506714, -0.8539483547210693, -0.7798972725868225, -0.7058461904525757, -0.6317951679229736, -0.5577441453933716, -0.48369306325912476, -0.4096420109272003, -0.3355909585952759, -0.26153990626335144, -0.187488853931427, -0.11343777179718018, -0.03938651084899902, 0.034664541482925415, 0.10871559381484985, 0.1827666461467743, 0.25681769847869873, 0.33086875081062317, 0.4049198031425476, 0.47897088527679443, 0.5530219078063965, 0.6270729303359985, 0.7011240124702454, 0.7751750946044922, 0.8492261171340942, 0.9232771396636963, 0.9973282217979431, 1.07137930393219, 1.145430326461792, 1.219481348991394, 1.293532371520996, 1.3675835132598877, 1.4416345357894897, 1.5156855583190918, 1.5897367000579834, 1.6637877225875854, 1.7378387451171875, 1.8118897676467896, 1.8859407901763916, 1.9599919319152832, 2.0340428352355957, 2.1080939769744873, 2.182145118713379, 2.2561960220336914, 2.330247163772583]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 0.0, 11.0, 13.0, 19.0, 23.0, 54.0, 82.0, 133.0, 230.0, 364.0, 675.0, 1072.0, 2011.0, 3710.0, 7033.0, 13586.0, 27496.0, 55278.0, 106647.0, 175744.0, 220893.0, 188503.0, 117978.0, 62815.0, 31418.0, 15466.0, 8010.0, 4058.0, 2269.0, 1188.0, 712.0, 437.0, 240.0, 142.0, 84.0, 59.0, 33.0, 26.0, 20.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.90625, -2.811248779296875, -2.71624755859375, -2.621246337890625, -2.5262451171875, -2.431243896484375, -2.33624267578125, -2.241241455078125, -2.146240234375, -2.051239013671875, -1.95623779296875, -1.861236572265625, -1.7662353515625, -1.671234130859375, -1.57623291015625, -1.481231689453125, -1.38623046875, -1.291229248046875, -1.19622802734375, -1.101226806640625, -1.0062255859375, -0.911224365234375, -0.81622314453125, -0.721221923828125, -0.626220703125, -0.531219482421875, -0.43621826171875, -0.341217041015625, -0.2462158203125, -0.151214599609375, -0.05621337890625, 0.038787841796875, 0.1337890625, 0.228790283203125, 0.32379150390625, 0.418792724609375, 0.5137939453125, 0.608795166015625, 0.70379638671875, 0.798797607421875, 0.893798828125, 0.988800048828125, 1.08380126953125, 1.178802490234375, 1.2738037109375, 1.368804931640625, 1.46380615234375, 1.558807373046875, 1.65380859375, 1.748809814453125, 1.84381103515625, 1.938812255859375, 2.0338134765625, 2.128814697265625, 2.22381591796875, 2.318817138671875, 2.413818359375, 2.508819580078125, 2.60382080078125, 2.698822021484375, 2.7938232421875, 2.888824462890625, 2.98382568359375, 3.078826904296875, 3.173828125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 9.0, 4.0, 5.0, 8.0, 11.0, 12.0, 18.0, 16.0, 20.0, 25.0, 22.0, 32.0, 31.0, 30.0, 25.0, 31.0, 33.0, 36.0, 50.0, 45.0, 41.0, 40.0, 50.0, 40.0, 42.0, 36.0, 36.0, 38.0, 26.0, 30.0, 26.0, 15.0, 16.0, 21.0, 24.0, 9.0, 10.0, 14.0, 5.0, 4.0, 1.0, 3.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-2.853515625, -2.76898193359375, -2.6844482421875, -2.59991455078125, -2.515380859375, -2.43084716796875, -2.3463134765625, -2.26177978515625, -2.17724609375, -2.09271240234375, -2.0081787109375, -1.92364501953125, -1.839111328125, -1.75457763671875, -1.6700439453125, -1.58551025390625, -1.5009765625, -1.41644287109375, -1.3319091796875, -1.24737548828125, -1.162841796875, -1.07830810546875, -0.9937744140625, -0.90924072265625, -0.82470703125, -0.74017333984375, -0.6556396484375, -0.57110595703125, -0.486572265625, -0.40203857421875, -0.3175048828125, -0.23297119140625, -0.1484375, -0.06390380859375, 0.0206298828125, 0.10516357421875, 0.189697265625, 0.27423095703125, 0.3587646484375, 0.44329833984375, 0.52783203125, 0.61236572265625, 0.6968994140625, 0.78143310546875, 0.865966796875, 0.95050048828125, 1.0350341796875, 1.11956787109375, 1.2041015625, 1.28863525390625, 1.3731689453125, 1.45770263671875, 1.542236328125, 1.62677001953125, 1.7113037109375, 1.79583740234375, 1.88037109375, 1.96490478515625, 2.0494384765625, 2.13397216796875, 2.218505859375, 2.30303955078125, 2.3875732421875, 2.47210693359375, 2.556640625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 13.0, 6.0, 13.0, 22.0, 39.0, 40.0, 66.0, 90.0, 125.0, 196.0, 294.0, 426.0, 705.0, 1142.0, 1963.0, 3506.0, 6470.0, 12660.0, 25004.0, 49052.0, 94501.0, 159733.0, 210292.0, 196728.0, 132611.0, 74041.0, 37750.0, 19021.0, 9862.0, 5073.0, 2798.0, 1568.0, 1022.0, 595.0, 338.0, 227.0, 182.0, 130.0, 85.0, 55.0, 46.0, 15.0, 17.0, 20.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.1015625, -3.012451171875, -2.92333984375, -2.834228515625, -2.7451171875, -2.656005859375, -2.56689453125, -2.477783203125, -2.388671875, -2.299560546875, -2.21044921875, -2.121337890625, -2.0322265625, -1.943115234375, -1.85400390625, -1.764892578125, -1.67578125, -1.586669921875, -1.49755859375, -1.408447265625, -1.3193359375, -1.230224609375, -1.14111328125, -1.052001953125, -0.962890625, -0.873779296875, -0.78466796875, -0.695556640625, -0.6064453125, -0.517333984375, -0.42822265625, -0.339111328125, -0.25, -0.160888671875, -0.07177734375, 0.017333984375, 0.1064453125, 0.195556640625, 0.28466796875, 0.373779296875, 0.462890625, 0.552001953125, 0.64111328125, 0.730224609375, 0.8193359375, 0.908447265625, 0.99755859375, 1.086669921875, 1.17578125, 1.264892578125, 1.35400390625, 1.443115234375, 1.5322265625, 1.621337890625, 1.71044921875, 1.799560546875, 1.888671875, 1.977783203125, 2.06689453125, 2.156005859375, 2.2451171875, 2.334228515625, 2.42333984375, 2.512451171875, 2.6015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 11.0, 14.0, 10.0, 17.0, 13.0, 18.0, 31.0, 18.0, 31.0, 42.0, 28.0, 23.0, 39.0, 33.0, 36.0, 32.0, 28.0, 38.0, 48.0, 47.0, 37.0, 37.0, 39.0, 32.0, 28.0, 22.0, 31.0, 32.0, 19.0, 22.0, 16.0, 11.0, 11.0, 16.0, 11.0, 8.0, 6.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.419921875, -1.37432861328125, -1.3287353515625, -1.28314208984375, -1.237548828125, -1.19195556640625, -1.1463623046875, -1.10076904296875, -1.05517578125, -1.00958251953125, -0.9639892578125, -0.91839599609375, -0.872802734375, -0.82720947265625, -0.7816162109375, -0.73602294921875, -0.6904296875, -0.64483642578125, -0.5992431640625, -0.55364990234375, -0.508056640625, -0.46246337890625, -0.4168701171875, -0.37127685546875, -0.32568359375, -0.28009033203125, -0.2344970703125, -0.18890380859375, -0.143310546875, -0.09771728515625, -0.0521240234375, -0.00653076171875, 0.0390625, 0.08465576171875, 0.1302490234375, 0.17584228515625, 0.221435546875, 0.26702880859375, 0.3126220703125, 0.35821533203125, 0.40380859375, 0.44940185546875, 0.4949951171875, 0.54058837890625, 0.586181640625, 0.63177490234375, 0.6773681640625, 0.72296142578125, 0.7685546875, 0.81414794921875, 0.8597412109375, 0.90533447265625, 0.950927734375, 0.99652099609375, 1.0421142578125, 1.08770751953125, 1.13330078125, 1.17889404296875, 1.2244873046875, 1.27008056640625, 1.315673828125, 1.36126708984375, 1.4068603515625, 1.45245361328125, 1.498046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 9.0, 5.0, 17.0, 29.0, 50.0, 63.0, 103.0, 168.0, 208.0, 342.0, 605.0, 938.0, 1495.0, 2531.0, 4309.0, 7034.0, 12282.0, 21398.0, 38427.0, 68630.0, 117607.0, 176631.0, 200971.0, 160010.0, 100547.0, 57823.0, 32545.0, 18031.0, 10358.0, 6047.0, 3516.0, 2177.0, 1334.0, 811.0, 496.0, 343.0, 229.0, 154.0, 94.0, 59.0, 40.0, 28.0, 16.0, 20.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.439453125, -1.39495849609375, -1.3504638671875, -1.30596923828125, -1.261474609375, -1.21697998046875, -1.1724853515625, -1.12799072265625, -1.08349609375, -1.03900146484375, -0.9945068359375, -0.95001220703125, -0.905517578125, -0.86102294921875, -0.8165283203125, -0.77203369140625, -0.7275390625, -0.68304443359375, -0.6385498046875, -0.59405517578125, -0.549560546875, -0.50506591796875, -0.4605712890625, -0.41607666015625, -0.37158203125, -0.32708740234375, -0.2825927734375, -0.23809814453125, -0.193603515625, -0.14910888671875, -0.1046142578125, -0.06011962890625, -0.015625, 0.02886962890625, 0.0733642578125, 0.11785888671875, 0.162353515625, 0.20684814453125, 0.2513427734375, 0.29583740234375, 0.34033203125, 0.38482666015625, 0.4293212890625, 0.47381591796875, 0.518310546875, 0.56280517578125, 0.6072998046875, 0.65179443359375, 0.6962890625, 0.74078369140625, 0.7852783203125, 0.82977294921875, 0.874267578125, 0.91876220703125, 0.9632568359375, 1.00775146484375, 1.05224609375, 1.09674072265625, 1.1412353515625, 1.18572998046875, 1.230224609375, 1.27471923828125, 1.3192138671875, 1.36370849609375, 1.408203125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 6.0, 8.0, 7.0, 13.0, 13.0, 18.0, 19.0, 32.0, 32.0, 46.0, 46.0, 50.0, 53.0, 53.0, 49.0, 55.0, 50.0, 63.0, 71.0, 38.0, 43.0, 34.0, 37.0, 23.0, 20.0, 14.0, 17.0, 17.0, 12.0, 11.0, 4.0, 7.0, 1.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012421607971191406, -0.00012047495692968369, -0.00011673383414745331, -0.00011299271136522293, -0.00010925158858299255, -0.00010551046580076218, -0.0001017693430185318, -9.802822023630142e-05, -9.428709745407104e-05, -9.054597467184067e-05, -8.680485188961029e-05, -8.306372910737991e-05, -7.932260632514954e-05, -7.558148354291916e-05, -7.184036076068878e-05, -6.80992379784584e-05, -6.435811519622803e-05, -6.061699241399765e-05, -5.687586963176727e-05, -5.3134746849536896e-05, -4.939362406730652e-05, -4.565250128507614e-05, -4.1911378502845764e-05, -3.817025572061539e-05, -3.442913293838501e-05, -3.068801015615463e-05, -2.6946887373924255e-05, -2.3205764591693878e-05, -1.94646418094635e-05, -1.5723519027233124e-05, -1.1982396245002747e-05, -8.24127346277237e-06, -4.500150680541992e-06, -7.59027898311615e-07, 2.982094883918762e-06, 6.723217666149139e-06, 1.0464340448379517e-05, 1.4205463230609894e-05, 1.794658601284027e-05, 2.1687708795070648e-05, 2.5428831577301025e-05, 2.9169954359531403e-05, 3.291107714176178e-05, 3.665219992399216e-05, 4.0393322706222534e-05, 4.413444548845291e-05, 4.787556827068329e-05, 5.1616691052913666e-05, 5.535781383514404e-05, 5.909893661737442e-05, 6.28400593996048e-05, 6.658118218183517e-05, 7.032230496406555e-05, 7.406342774629593e-05, 7.78045505285263e-05, 8.154567331075668e-05, 8.528679609298706e-05, 8.902791887521744e-05, 9.276904165744781e-05, 9.651016443967819e-05, 0.00010025128722190857, 0.00010399241000413895, 0.00010773353278636932, 0.0001114746555685997, 0.00011521577835083008]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 11.0, 16.0, 14.0, 22.0, 33.0, 49.0, 59.0, 86.0, 137.0, 194.0, 324.0, 444.0, 727.0, 1084.0, 1592.0, 2581.0, 3908.0, 6170.0, 9886.0, 16112.0, 25844.0, 42462.0, 68563.0, 106560.0, 149686.0, 171611.0, 150567.0, 108110.0, 69296.0, 42281.0, 26392.0, 16082.0, 9884.0, 6287.0, 4007.0, 2603.0, 1672.0, 1029.0, 777.0, 460.0, 310.0, 191.0, 139.0, 83.0, 65.0, 48.0, 31.0, 16.0, 15.0, 11.0, 8.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.037109375, -1.000732421875, -0.96435546875, -0.927978515625, -0.8916015625, -0.855224609375, -0.81884765625, -0.782470703125, -0.74609375, -0.709716796875, -0.67333984375, -0.636962890625, -0.6005859375, -0.564208984375, -0.52783203125, -0.491455078125, -0.455078125, -0.418701171875, -0.38232421875, -0.345947265625, -0.3095703125, -0.273193359375, -0.23681640625, -0.200439453125, -0.1640625, -0.127685546875, -0.09130859375, -0.054931640625, -0.0185546875, 0.017822265625, 0.05419921875, 0.090576171875, 0.126953125, 0.163330078125, 0.19970703125, 0.236083984375, 0.2724609375, 0.308837890625, 0.34521484375, 0.381591796875, 0.41796875, 0.454345703125, 0.49072265625, 0.527099609375, 0.5634765625, 0.599853515625, 0.63623046875, 0.672607421875, 0.708984375, 0.745361328125, 0.78173828125, 0.818115234375, 0.8544921875, 0.890869140625, 0.92724609375, 0.963623046875, 1.0, 1.036376953125, 1.07275390625, 1.109130859375, 1.1455078125, 1.181884765625, 1.21826171875, 1.254638671875, 1.291015625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 2.0, 2.0, 6.0, 14.0, 11.0, 12.0, 23.0, 20.0, 31.0, 27.0, 52.0, 49.0, 62.0, 61.0, 60.0, 48.0, 81.0, 70.0, 60.0, 57.0, 43.0, 49.0, 40.0, 28.0, 22.0, 19.0, 12.0, 8.0, 6.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4169921875, -0.4029998779296875, -0.389007568359375, -0.3750152587890625, -0.36102294921875, -0.3470306396484375, -0.333038330078125, -0.3190460205078125, -0.3050537109375, -0.2910614013671875, -0.277069091796875, -0.2630767822265625, -0.24908447265625, -0.2350921630859375, -0.221099853515625, -0.2071075439453125, -0.193115234375, -0.1791229248046875, -0.165130615234375, -0.1511383056640625, -0.13714599609375, -0.1231536865234375, -0.109161376953125, -0.0951690673828125, -0.0811767578125, -0.0671844482421875, -0.053192138671875, -0.0391998291015625, -0.02520751953125, -0.0112152099609375, 0.002777099609375, 0.0167694091796875, 0.03076171875, 0.0447540283203125, 0.058746337890625, 0.0727386474609375, 0.08673095703125, 0.1007232666015625, 0.114715576171875, 0.1287078857421875, 0.1427001953125, 0.1566925048828125, 0.170684814453125, 0.1846771240234375, 0.19866943359375, 0.2126617431640625, 0.226654052734375, 0.2406463623046875, 0.254638671875, 0.2686309814453125, 0.282623291015625, 0.2966156005859375, 0.31060791015625, 0.3246002197265625, 0.338592529296875, 0.3525848388671875, 0.3665771484375, 0.3805694580078125, 0.394561767578125, 0.4085540771484375, 0.42254638671875, 0.4365386962890625, 0.450531005859375, 0.4645233154296875, 0.478515625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 3.0, 5.0, 10.0, 11.0, 14.0, 17.0, 25.0, 20.0, 49.0, 61.0, 58.0, 71.0, 85.0, 96.0, 93.0, 90.0, 74.0, 47.0, 36.0, 35.0, 19.0, 17.0, 10.0, 12.0, 11.0, 11.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.410089015960693, -4.2487945556640625, -4.087499618530273, -3.9262051582336426, -3.7649106979370117, -3.603616237640381, -3.442321538925171, -3.281026840209961, -3.11973237991333, -2.958437919616699, -2.7971432209014893, -2.6358485221862793, -2.4745540618896484, -2.3132596015930176, -2.1519649028778076, -1.9906703233718872, -1.8293757438659668, -1.6680811643600464, -1.506786584854126, -1.3454920053482056, -1.1841974258422852, -1.0229028463363647, -0.8616082668304443, -0.7003136873245239, -0.5390191078186035, -0.3777245283126831, -0.2164299488067627, -0.055135369300842285, 0.10615921020507812, 0.26745378971099854, 0.42874836921691895, 0.5900429487228394, 0.751338005065918, 0.9126325845718384, 1.0739271640777588, 1.2352217435836792, 1.3965163230895996, 1.55781090259552, 1.7191054821014404, 1.8804000616073608, 2.0416946411132812, 2.202989101409912, 2.364283800125122, 2.525578498840332, 2.686872959136963, 2.8481674194335938, 3.0094621181488037, 3.1707568168640137, 3.3320512771606445, 3.4933457374572754, 3.6546404361724854, 3.8159351348876953, 3.977229595184326, 4.138524055480957, 4.299818992614746, 4.461113452911377, 4.622407913208008, 4.783702373504639, 4.9449968338012695, 5.106291770935059, 5.2675862312316895, 5.42888069152832, 5.590175628662109, 5.75147008895874, 5.912764549255371]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 13.0, 13.0, 14.0, 13.0, 15.0, 27.0, 28.0, 29.0, 21.0, 23.0, 25.0, 37.0, 25.0, 39.0, 41.0, 42.0, 36.0, 43.0, 49.0, 32.0, 40.0, 29.0, 23.0, 38.0, 38.0, 29.0, 33.0, 34.0, 23.0, 18.0, 19.0, 15.0, 19.0, 13.0, 11.0, 7.0, 11.0, 6.0, 4.0, 4.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.564207077026367, -2.489161968231201, -2.4141170978546143, -2.3390719890594482, -2.2640268802642822, -2.1889820098876953, -2.1139369010925293, -2.0388917922973633, -1.9638468027114868, -1.8888018131256104, -1.8137567043304443, -1.7387117147445679, -1.6636667251586914, -1.5886216163635254, -1.513576626777649, -1.4385316371917725, -1.3634865283966064, -1.28844153881073, -1.213396430015564, -1.1383514404296875, -1.0633063316345215, -0.988261342048645, -0.9132163524627686, -0.8381713032722473, -0.7631262540817261, -0.6880812048912048, -0.6130361557006836, -0.5379911661148071, -0.4629461169242859, -0.38790106773376465, -0.3128560483455658, -0.23781102895736694, -0.1627657413482666, -0.08772070705890656, -0.012675672769546509, 0.06236936151981354, 0.13741439580917358, 0.21245944499969482, 0.2875044643878937, 0.36254948377609253, 0.43759453296661377, 0.512639582157135, 0.5876846313476562, 0.6627296209335327, 0.737774670124054, 0.8128197193145752, 0.8878647089004517, 0.9629097580909729, 1.0379548072814941, 1.1129997968673706, 1.1880449056625366, 1.263089895248413, 1.338135004043579, 1.4131799936294556, 1.488224983215332, 1.563270092010498, 1.6383150815963745, 1.713360071182251, 1.788405179977417, 1.8634501695632935, 1.93849515914917, 2.013540267944336, 2.088585376739502, 2.163630247116089, 2.238675355911255]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 5.0, 7.0, 13.0, 18.0, 38.0, 40.0, 53.0, 85.0, 116.0, 199.0, 281.0, 441.0, 664.0, 1061.0, 1736.0, 2964.0, 5603.0, 10695.0, 22474.0, 53385.0, 151705.0, 554276.0, 1651552.0, 1240542.0, 331755.0, 95175.0, 35601.0, 15637.0, 7854.0, 4151.0, 2294.0, 1423.0, 842.0, 520.0, 312.0, 256.0, 157.0, 101.0, 76.0, 70.0, 35.0, 24.0, 16.0, 10.0, 8.0, 6.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.26953125, -5.1038818359375, -4.938232421875, -4.7725830078125, -4.60693359375, -4.4412841796875, -4.275634765625, -4.1099853515625, -3.9443359375, -3.7786865234375, -3.613037109375, -3.4473876953125, -3.28173828125, -3.1160888671875, -2.950439453125, -2.7847900390625, -2.619140625, -2.4534912109375, -2.287841796875, -2.1221923828125, -1.95654296875, -1.7908935546875, -1.625244140625, -1.4595947265625, -1.2939453125, -1.1282958984375, -0.962646484375, -0.7969970703125, -0.63134765625, -0.4656982421875, -0.300048828125, -0.1343994140625, 0.03125, 0.1968994140625, 0.362548828125, 0.5281982421875, 0.69384765625, 0.8594970703125, 1.025146484375, 1.1907958984375, 1.3564453125, 1.5220947265625, 1.687744140625, 1.8533935546875, 2.01904296875, 2.1846923828125, 2.350341796875, 2.5159912109375, 2.681640625, 2.8472900390625, 3.012939453125, 3.1785888671875, 3.34423828125, 3.5098876953125, 3.675537109375, 3.8411865234375, 4.0068359375, 4.1724853515625, 4.338134765625, 4.5037841796875, 4.66943359375, 4.8350830078125, 5.000732421875, 5.1663818359375, 5.33203125]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 13.0, 9.0, 8.0, 17.0, 15.0, 18.0, 21.0, 28.0, 26.0, 25.0, 29.0, 16.0, 34.0, 38.0, 42.0, 35.0, 48.0, 52.0, 38.0, 33.0, 46.0, 34.0, 36.0, 27.0, 33.0, 42.0, 35.0, 34.0, 21.0, 34.0, 21.0, 16.0, 11.0, 13.0, 11.0, 10.0, 7.0, 4.0, 7.0, 1.0, 3.0, 7.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.927734375, -1.872467041015625, -1.81719970703125, -1.761932373046875, -1.7066650390625, -1.651397705078125, -1.59613037109375, -1.540863037109375, -1.485595703125, -1.430328369140625, -1.37506103515625, -1.319793701171875, -1.2645263671875, -1.209259033203125, -1.15399169921875, -1.098724365234375, -1.04345703125, -0.988189697265625, -0.93292236328125, -0.877655029296875, -0.8223876953125, -0.767120361328125, -0.71185302734375, -0.656585693359375, -0.601318359375, -0.546051025390625, -0.49078369140625, -0.435516357421875, -0.3802490234375, -0.324981689453125, -0.26971435546875, -0.214447021484375, -0.1591796875, -0.103912353515625, -0.04864501953125, 0.006622314453125, 0.0618896484375, 0.117156982421875, 0.17242431640625, 0.227691650390625, 0.282958984375, 0.338226318359375, 0.39349365234375, 0.448760986328125, 0.5040283203125, 0.559295654296875, 0.61456298828125, 0.669830322265625, 0.72509765625, 0.780364990234375, 0.83563232421875, 0.890899658203125, 0.9461669921875, 1.001434326171875, 1.05670166015625, 1.111968994140625, 1.167236328125, 1.222503662109375, 1.27777099609375, 1.333038330078125, 1.3883056640625, 1.443572998046875, 1.49884033203125, 1.554107666015625, 1.609375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 9.0, 3.0, 9.0, 11.0, 26.0, 19.0, 28.0, 47.0, 82.0, 123.0, 157.0, 307.0, 380.0, 630.0, 951.0, 1395.0, 2285.0, 3639.0, 5757.0, 9458.0, 16079.0, 27983.0, 51445.0, 99963.0, 212406.0, 491724.0, 1064675.0, 1151854.0, 565296.0, 243265.0, 112566.0, 56720.0, 30393.0, 17242.0, 10283.0, 6264.0, 3893.0, 2381.0, 1500.0, 1019.0, 680.0, 435.0, 295.0, 203.0, 132.0, 95.0, 58.0, 38.0, 21.0, 29.0, 11.0, 13.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.904296875, -3.7825927734375, -3.660888671875, -3.5391845703125, -3.41748046875, -3.2957763671875, -3.174072265625, -3.0523681640625, -2.9306640625, -2.8089599609375, -2.687255859375, -2.5655517578125, -2.44384765625, -2.3221435546875, -2.200439453125, -2.0787353515625, -1.95703125, -1.8353271484375, -1.713623046875, -1.5919189453125, -1.47021484375, -1.3485107421875, -1.226806640625, -1.1051025390625, -0.9833984375, -0.8616943359375, -0.739990234375, -0.6182861328125, -0.49658203125, -0.3748779296875, -0.253173828125, -0.1314697265625, -0.009765625, 0.1119384765625, 0.233642578125, 0.3553466796875, 0.47705078125, 0.5987548828125, 0.720458984375, 0.8421630859375, 0.9638671875, 1.0855712890625, 1.207275390625, 1.3289794921875, 1.45068359375, 1.5723876953125, 1.694091796875, 1.8157958984375, 1.9375, 2.0592041015625, 2.180908203125, 2.3026123046875, 2.42431640625, 2.5460205078125, 2.667724609375, 2.7894287109375, 2.9111328125, 3.0328369140625, 3.154541015625, 3.2762451171875, 3.39794921875, 3.5196533203125, 3.641357421875, 3.7630615234375, 3.884765625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 6.0, 14.0, 16.0, 30.0, 23.0, 35.0, 38.0, 46.0, 38.0, 73.0, 102.0, 105.0, 132.0, 169.0, 229.0, 271.0, 307.0, 305.0, 327.0, 326.0, 243.0, 254.0, 222.0, 146.0, 144.0, 86.0, 70.0, 82.0, 48.0, 37.0, 30.0, 25.0, 18.0, 10.0, 6.0, 9.0, 10.0, 7.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2109375, -1.1753692626953125, -1.139801025390625, -1.1042327880859375, -1.06866455078125, -1.0330963134765625, -0.997528076171875, -0.9619598388671875, -0.9263916015625, -0.8908233642578125, -0.855255126953125, -0.8196868896484375, -0.78411865234375, -0.7485504150390625, -0.712982177734375, -0.6774139404296875, -0.641845703125, -0.6062774658203125, -0.570709228515625, -0.5351409912109375, -0.49957275390625, -0.4640045166015625, -0.428436279296875, -0.3928680419921875, -0.3572998046875, -0.3217315673828125, -0.286163330078125, -0.2505950927734375, -0.21502685546875, -0.1794586181640625, -0.143890380859375, -0.1083221435546875, -0.07275390625, -0.0371856689453125, -0.001617431640625, 0.0339508056640625, 0.06951904296875, 0.1050872802734375, 0.140655517578125, 0.1762237548828125, 0.2117919921875, 0.2473602294921875, 0.282928466796875, 0.3184967041015625, 0.35406494140625, 0.3896331787109375, 0.425201416015625, 0.4607696533203125, 0.496337890625, 0.5319061279296875, 0.567474365234375, 0.6030426025390625, 0.63861083984375, 0.6741790771484375, 0.709747314453125, 0.7453155517578125, 0.7808837890625, 0.8164520263671875, 0.852020263671875, 0.8875885009765625, 0.92315673828125, 0.9587249755859375, 0.994293212890625, 1.0298614501953125, 1.0654296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 2.0, 8.0, 11.0, 18.0, 16.0, 21.0, 27.0, 21.0, 30.0, 64.0, 58.0, 59.0, 70.0, 75.0, 85.0, 70.0, 73.0, 56.0, 40.0, 43.0, 30.0, 19.0, 22.0, 11.0, 7.0, 7.0, 12.0, 7.0, 3.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2183146476745605, -4.084728240966797, -3.951141834259033, -3.8175554275512695, -3.683969020843506, -3.550382614135742, -3.4167959690093994, -3.2832095623016357, -3.149623155593872, -3.0160367488861084, -2.8824503421783447, -2.748863935470581, -2.6152772903442383, -2.4816908836364746, -2.348104476928711, -2.2145180702209473, -2.0809316635131836, -1.94734525680542, -1.8137588500976562, -1.680172324180603, -1.5465859174728394, -1.4129995107650757, -1.2794129848480225, -1.1458265781402588, -1.0122401714324951, -0.8786537647247314, -0.745067298412323, -0.6114808320999146, -0.4778944253921509, -0.3443080186843872, -0.21072155237197876, -0.07713508605957031, 0.056450843811035156, 0.19003728032112122, 0.3236237168312073, 0.45721015334129333, 0.5907965898513794, 0.7243829965591431, 0.8579694628715515, 0.99155592918396, 1.1251423358917236, 1.2587287425994873, 1.392315149307251, 1.5259016752243042, 1.6594880819320679, 1.7930744886398315, 1.9266610145568848, 2.0602474212646484, 2.193833827972412, 2.327420234680176, 2.4610066413879395, 2.594593048095703, 2.728179454803467, 2.8617658615112305, 2.9953525066375732, 3.128938913345337, 3.2625253200531006, 3.3961117267608643, 3.529698133468628, 3.6632845401763916, 3.7968711853027344, 3.930457592010498, 4.064043998718262, 4.197630405426025, 4.331216812133789]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 7.0, 8.0, 7.0, 6.0, 8.0, 9.0, 5.0, 10.0, 15.0, 15.0, 22.0, 11.0, 21.0, 23.0, 24.0, 21.0, 23.0, 28.0, 38.0, 33.0, 37.0, 38.0, 40.0, 28.0, 40.0, 41.0, 27.0, 27.0, 35.0, 42.0, 33.0, 29.0, 33.0, 32.0, 20.0, 23.0, 19.0, 21.0, 16.0, 15.0, 11.0, 13.0, 8.0, 4.0, 14.0, 4.0, 9.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.0427536964416504, -1.977946400642395, -1.9131391048431396, -1.8483316898345947, -1.7835243940353394, -1.718717098236084, -1.6539098024368286, -1.5891025066375732, -1.5242950916290283, -1.459487795829773, -1.3946805000305176, -1.3298730850219727, -1.2650657892227173, -1.200258493423462, -1.1354511976242065, -1.0706439018249512, -1.0058366060256958, -0.9410293102264404, -0.8762219548225403, -0.8114146590232849, -0.7466073036193848, -0.6818000078201294, -0.616992712020874, -0.5521854162216187, -0.4873780608177185, -0.42257073521614075, -0.357763409614563, -0.2929561138153076, -0.22814878821372986, -0.1633414626121521, -0.09853416681289673, -0.03372684121131897, 0.03108048439025879, 0.09588780254125595, 0.1606951206922531, 0.22550243139266968, 0.29030975699424744, 0.3551170825958252, 0.41992437839508057, 0.4847317039966583, 0.5495390295982361, 0.6143463253974915, 0.6791536808013916, 0.743960976600647, 0.8087682723999023, 0.8735756278038025, 0.9383829236030579, 1.003190279006958, 1.0679975748062134, 1.1328048706054688, 1.1976121664047241, 1.2624194622039795, 1.3272268772125244, 1.3920341730117798, 1.4568414688110352, 1.5216487646102905, 1.586456060409546, 1.6512633562088013, 1.7160706520080566, 1.7808780670166016, 1.845685362815857, 1.9104926586151123, 1.9752999544143677, 2.040107250213623, 2.104914665222168]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 8.0, 13.0, 7.0, 9.0, 19.0, 45.0, 40.0, 57.0, 92.0, 129.0, 201.0, 267.0, 413.0, 622.0, 901.0, 1616.0, 2628.0, 4796.0, 9223.0, 18939.0, 40077.0, 85650.0, 171273.0, 257030.0, 219911.0, 121640.0, 57768.0, 26698.0, 12726.0, 6512.0, 3532.0, 2155.0, 1246.0, 810.0, 470.0, 341.0, 203.0, 147.0, 93.0, 64.0, 56.0, 36.0, 34.0, 23.0, 11.0, 4.0, 3.0, 7.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.240234375, -2.169647216796875, -2.09906005859375, -2.028472900390625, -1.9578857421875, -1.887298583984375, -1.81671142578125, -1.746124267578125, -1.675537109375, -1.604949951171875, -1.53436279296875, -1.463775634765625, -1.3931884765625, -1.322601318359375, -1.25201416015625, -1.181427001953125, -1.11083984375, -1.040252685546875, -0.96966552734375, -0.899078369140625, -0.8284912109375, -0.757904052734375, -0.68731689453125, -0.616729736328125, -0.546142578125, -0.475555419921875, -0.40496826171875, -0.334381103515625, -0.2637939453125, -0.193206787109375, -0.12261962890625, -0.052032470703125, 0.0185546875, 0.089141845703125, 0.15972900390625, 0.230316162109375, 0.3009033203125, 0.371490478515625, 0.44207763671875, 0.512664794921875, 0.583251953125, 0.653839111328125, 0.72442626953125, 0.795013427734375, 0.8656005859375, 0.936187744140625, 1.00677490234375, 1.077362060546875, 1.14794921875, 1.218536376953125, 1.28912353515625, 1.359710693359375, 1.4302978515625, 1.500885009765625, 1.57147216796875, 1.642059326171875, 1.712646484375, 1.783233642578125, 1.85382080078125, 1.924407958984375, 1.9949951171875, 2.065582275390625, 2.13616943359375, 2.206756591796875, 2.27734375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 9.0, 4.0, 12.0, 11.0, 11.0, 10.0, 10.0, 21.0, 25.0, 24.0, 27.0, 28.0, 27.0, 36.0, 32.0, 44.0, 39.0, 42.0, 36.0, 42.0, 37.0, 39.0, 41.0, 41.0, 42.0, 39.0, 38.0, 42.0, 31.0, 20.0, 21.0, 24.0, 24.0, 16.0, 8.0, 10.0, 8.0, 4.0, 11.0, 5.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.744140625, -2.663787841796875, -2.58343505859375, -2.503082275390625, -2.4227294921875, -2.342376708984375, -2.26202392578125, -2.181671142578125, -2.101318359375, -2.020965576171875, -1.94061279296875, -1.860260009765625, -1.7799072265625, -1.699554443359375, -1.61920166015625, -1.538848876953125, -1.45849609375, -1.378143310546875, -1.29779052734375, -1.217437744140625, -1.1370849609375, -1.056732177734375, -0.97637939453125, -0.896026611328125, -0.815673828125, -0.735321044921875, -0.65496826171875, -0.574615478515625, -0.4942626953125, -0.413909912109375, -0.33355712890625, -0.253204345703125, -0.1728515625, -0.092498779296875, -0.01214599609375, 0.068206787109375, 0.1485595703125, 0.228912353515625, 0.30926513671875, 0.389617919921875, 0.469970703125, 0.550323486328125, 0.63067626953125, 0.711029052734375, 0.7913818359375, 0.871734619140625, 0.95208740234375, 1.032440185546875, 1.11279296875, 1.193145751953125, 1.27349853515625, 1.353851318359375, 1.4342041015625, 1.514556884765625, 1.59490966796875, 1.675262451171875, 1.755615234375, 1.835968017578125, 1.91632080078125, 1.996673583984375, 2.0770263671875, 2.157379150390625, 2.23773193359375, 2.318084716796875, 2.3984375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 4.0, 11.0, 20.0, 28.0, 42.0, 69.0, 87.0, 137.0, 248.0, 350.0, 596.0, 1007.0, 1707.0, 3287.0, 6000.0, 12022.0, 25279.0, 57228.0, 136164.0, 286968.0, 281072.0, 131487.0, 55241.0, 24784.0, 11642.0, 5951.0, 3011.0, 1667.0, 950.0, 570.0, 322.0, 229.0, 108.0, 88.0, 64.0, 40.0, 22.0, 13.0, 8.0, 6.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.138671875, -3.046295166015625, -2.95391845703125, -2.861541748046875, -2.7691650390625, -2.676788330078125, -2.58441162109375, -2.492034912109375, -2.399658203125, -2.307281494140625, -2.21490478515625, -2.122528076171875, -2.0301513671875, -1.937774658203125, -1.84539794921875, -1.753021240234375, -1.66064453125, -1.568267822265625, -1.47589111328125, -1.383514404296875, -1.2911376953125, -1.198760986328125, -1.10638427734375, -1.014007568359375, -0.921630859375, -0.829254150390625, -0.73687744140625, -0.644500732421875, -0.5521240234375, -0.459747314453125, -0.36737060546875, -0.274993896484375, -0.1826171875, -0.090240478515625, 0.00213623046875, 0.094512939453125, 0.1868896484375, 0.279266357421875, 0.37164306640625, 0.464019775390625, 0.556396484375, 0.648773193359375, 0.74114990234375, 0.833526611328125, 0.9259033203125, 1.018280029296875, 1.11065673828125, 1.203033447265625, 1.29541015625, 1.387786865234375, 1.48016357421875, 1.572540283203125, 1.6649169921875, 1.757293701171875, 1.84967041015625, 1.942047119140625, 2.034423828125, 2.126800537109375, 2.21917724609375, 2.311553955078125, 2.4039306640625, 2.496307373046875, 2.58868408203125, 2.681060791015625, 2.7734375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 12.0, 10.0, 15.0, 20.0, 23.0, 21.0, 23.0, 36.0, 33.0, 35.0, 31.0, 34.0, 43.0, 49.0, 55.0, 45.0, 43.0, 40.0, 42.0, 46.0, 39.0, 32.0, 28.0, 34.0, 19.0, 29.0, 16.0, 24.0, 18.0, 18.0, 14.0, 16.0, 12.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.3623046875, -1.317047119140625, -1.27178955078125, -1.226531982421875, -1.1812744140625, -1.136016845703125, -1.09075927734375, -1.045501708984375, -1.000244140625, -0.954986572265625, -0.90972900390625, -0.864471435546875, -0.8192138671875, -0.773956298828125, -0.72869873046875, -0.683441162109375, -0.63818359375, -0.592926025390625, -0.54766845703125, -0.502410888671875, -0.4571533203125, -0.411895751953125, -0.36663818359375, -0.321380615234375, -0.276123046875, -0.230865478515625, -0.18560791015625, -0.140350341796875, -0.0950927734375, -0.049835205078125, -0.00457763671875, 0.040679931640625, 0.0859375, 0.131195068359375, 0.17645263671875, 0.221710205078125, 0.2669677734375, 0.312225341796875, 0.35748291015625, 0.402740478515625, 0.447998046875, 0.493255615234375, 0.53851318359375, 0.583770751953125, 0.6290283203125, 0.674285888671875, 0.71954345703125, 0.764801025390625, 0.81005859375, 0.855316162109375, 0.90057373046875, 0.945831298828125, 0.9910888671875, 1.036346435546875, 1.08160400390625, 1.126861572265625, 1.172119140625, 1.217376708984375, 1.26263427734375, 1.307891845703125, 1.3531494140625, 1.398406982421875, 1.44366455078125, 1.488922119140625, 1.5341796875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 13.0, 14.0, 22.0, 37.0, 45.0, 66.0, 79.0, 119.0, 173.0, 261.0, 360.0, 658.0, 1111.0, 2223.0, 5426.0, 16947.0, 73510.0, 421610.0, 423701.0, 74521.0, 16972.0, 5454.0, 2193.0, 1094.0, 670.0, 402.0, 248.0, 168.0, 133.0, 90.0, 54.0, 44.0, 40.0, 27.0, 13.0, 12.0, 7.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.853515625, -2.76959228515625, -2.6856689453125, -2.60174560546875, -2.517822265625, -2.43389892578125, -2.3499755859375, -2.26605224609375, -2.18212890625, -2.09820556640625, -2.0142822265625, -1.93035888671875, -1.846435546875, -1.76251220703125, -1.6785888671875, -1.59466552734375, -1.5107421875, -1.42681884765625, -1.3428955078125, -1.25897216796875, -1.175048828125, -1.09112548828125, -1.0072021484375, -0.92327880859375, -0.83935546875, -0.75543212890625, -0.6715087890625, -0.58758544921875, -0.503662109375, -0.41973876953125, -0.3358154296875, -0.25189208984375, -0.16796875, -0.08404541015625, -0.0001220703125, 0.08380126953125, 0.167724609375, 0.25164794921875, 0.3355712890625, 0.41949462890625, 0.50341796875, 0.58734130859375, 0.6712646484375, 0.75518798828125, 0.839111328125, 0.92303466796875, 1.0069580078125, 1.09088134765625, 1.1748046875, 1.25872802734375, 1.3426513671875, 1.42657470703125, 1.510498046875, 1.59442138671875, 1.6783447265625, 1.76226806640625, 1.84619140625, 1.93011474609375, 2.0140380859375, 2.09796142578125, 2.181884765625, 2.26580810546875, 2.3497314453125, 2.43365478515625, 2.517578125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 28.0, 80.0, 235.0, 324.0, 212.0, 67.0, 21.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018334388732910156, -0.00017614290118217468, -0.0001689419150352478, -0.00016174092888832092, -0.00015453994274139404, -0.00014733895659446716, -0.00014013797044754028, -0.0001329369843006134, -0.00012573599815368652, -0.00011853501200675964, -0.00011133402585983276, -0.00010413303971290588, -9.6932053565979e-05, -8.973106741905212e-05, -8.253008127212524e-05, -7.532909512519836e-05, -6.812810897827148e-05, -6.0927122831344604e-05, -5.3726136684417725e-05, -4.6525150537490845e-05, -3.9324164390563965e-05, -3.2123178243637085e-05, -2.4922192096710205e-05, -1.7721205949783325e-05, -1.0520219802856445e-05, -3.3192336559295654e-06, 3.8817524909973145e-06, 1.1082738637924194e-05, 1.8283724784851074e-05, 2.5484710931777954e-05, 3.2685697078704834e-05, 3.9886683225631714e-05, 4.7087669372558594e-05, 5.4288655519485474e-05, 6.148964166641235e-05, 6.869062781333923e-05, 7.589161396026611e-05, 8.309260010719299e-05, 9.029358625411987e-05, 9.749457240104675e-05, 0.00010469555854797363, 0.00011189654469490051, 0.00011909753084182739, 0.00012629851698875427, 0.00013349950313568115, 0.00014070048928260803, 0.0001479014754295349, 0.0001551024615764618, 0.00016230344772338867, 0.00016950443387031555, 0.00017670542001724243, 0.0001839064061641693, 0.0001911073923110962, 0.00019830837845802307, 0.00020550936460494995, 0.00021271035075187683, 0.0002199113368988037, 0.0002271123230457306, 0.00023431330919265747, 0.00024151429533958435, 0.00024871528148651123, 0.0002559162676334381, 0.000263117253780365, 0.00027031823992729187, 0.00027751922607421875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 10.0, 13.0, 16.0, 20.0, 37.0, 39.0, 56.0, 68.0, 98.0, 115.0, 178.0, 214.0, 270.0, 401.0, 523.0, 781.0, 1034.0, 1720.0, 3154.0, 6739.0, 18361.0, 60403.0, 215586.0, 423064.0, 219520.0, 61741.0, 18571.0, 6980.0, 3142.0, 1739.0, 1114.0, 739.0, 518.0, 396.0, 321.0, 214.0, 170.0, 126.0, 92.0, 68.0, 51.0, 44.0, 34.0, 19.0, 22.0, 9.0, 8.0, 7.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.779296875, -1.7245635986328125, -1.669830322265625, -1.6150970458984375, -1.56036376953125, -1.5056304931640625, -1.450897216796875, -1.3961639404296875, -1.3414306640625, -1.2866973876953125, -1.231964111328125, -1.1772308349609375, -1.12249755859375, -1.0677642822265625, -1.013031005859375, -0.9582977294921875, -0.903564453125, -0.8488311767578125, -0.794097900390625, -0.7393646240234375, -0.68463134765625, -0.6298980712890625, -0.575164794921875, -0.5204315185546875, -0.4656982421875, -0.4109649658203125, -0.356231689453125, -0.3014984130859375, -0.24676513671875, -0.1920318603515625, -0.137298583984375, -0.0825653076171875, -0.02783203125, 0.0269012451171875, 0.081634521484375, 0.1363677978515625, 0.19110107421875, 0.2458343505859375, 0.300567626953125, 0.3553009033203125, 0.4100341796875, 0.4647674560546875, 0.519500732421875, 0.5742340087890625, 0.62896728515625, 0.6837005615234375, 0.738433837890625, 0.7931671142578125, 0.847900390625, 0.9026336669921875, 0.957366943359375, 1.0121002197265625, 1.06683349609375, 1.1215667724609375, 1.176300048828125, 1.2310333251953125, 1.2857666015625, 1.3404998779296875, 1.395233154296875, 1.4499664306640625, 1.50469970703125, 1.5594329833984375, 1.614166259765625, 1.6688995361328125, 1.7236328125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 23.0, 21.0, 27.0, 43.0, 39.0, 74.0, 81.0, 97.0, 103.0, 92.0, 92.0, 92.0, 56.0, 51.0, 24.0, 24.0, 15.0, 11.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41845703125, -0.4048576354980469, -0.39125823974609375, -0.3776588439941406, -0.3640594482421875, -0.3504600524902344, -0.33686065673828125, -0.3232612609863281, -0.309661865234375, -0.2960624694824219, -0.28246307373046875, -0.2688636779785156, -0.2552642822265625, -0.24166488647460938, -0.22806549072265625, -0.21446609497070312, -0.20086669921875, -0.18726730346679688, -0.17366790771484375, -0.16006851196289062, -0.1464691162109375, -0.13286972045898438, -0.11927032470703125, -0.10567092895507812, -0.092071533203125, -0.07847213745117188, -0.06487274169921875, -0.051273345947265625, -0.0376739501953125, -0.024074554443359375, -0.01047515869140625, 0.003124237060546875, 0.0167236328125, 0.030323028564453125, 0.04392242431640625, 0.057521820068359375, 0.0711212158203125, 0.08472061157226562, 0.09832000732421875, 0.11191940307617188, 0.125518798828125, 0.13911819458007812, 0.15271759033203125, 0.16631698608398438, 0.1799163818359375, 0.19351577758789062, 0.20711517333984375, 0.22071456909179688, 0.23431396484375, 0.24791336059570312, 0.26151275634765625, 0.2751121520996094, 0.2887115478515625, 0.3023109436035156, 0.31591033935546875, 0.3295097351074219, 0.343109130859375, 0.3567085266113281, 0.37030792236328125, 0.3839073181152344, 0.3975067138671875, 0.4111061096191406, 0.42470550537109375, 0.4383049011230469, 0.451904296875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 7.0, 3.0, 2.0, 7.0, 7.0, 15.0, 17.0, 14.0, 18.0, 22.0, 25.0, 36.0, 43.0, 55.0, 77.0, 63.0, 72.0, 79.0, 81.0, 65.0, 56.0, 56.0, 36.0, 24.0, 30.0, 17.0, 11.0, 11.0, 10.0, 8.0, 7.0, 3.0, 7.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.105947494506836, -3.9765522480010986, -3.8471570014953613, -3.717761754989624, -3.5883665084838867, -3.4589712619781494, -3.329576015472412, -3.200180768966675, -3.0707855224609375, -2.9413902759552, -2.811995029449463, -2.6825997829437256, -2.5532045364379883, -2.423809289932251, -2.2944140434265137, -2.1650187969207764, -2.035623550415039, -1.9062283039093018, -1.7768330574035645, -1.6474378108978271, -1.5180425643920898, -1.3886473178863525, -1.2592520713806152, -1.129856824874878, -1.0004615783691406, -0.8710663318634033, -0.741671085357666, -0.6122758388519287, -0.4828805923461914, -0.3534853458404541, -0.2240900993347168, -0.09469485282897949, 0.03470039367675781, 0.16409564018249512, 0.2934908866882324, 0.4228861331939697, 0.552281379699707, 0.6816766262054443, 0.8110718727111816, 0.940467119216919, 1.0698623657226562, 1.1992576122283936, 1.3286528587341309, 1.4580481052398682, 1.5874433517456055, 1.7168385982513428, 1.84623384475708, 1.9756290912628174, 2.1050243377685547, 2.234419584274292, 2.3638148307800293, 2.4932100772857666, 2.622605323791504, 2.752000570297241, 2.8813958168029785, 3.010791063308716, 3.140186309814453, 3.2695815563201904, 3.3989768028259277, 3.528372049331665, 3.6577672958374023, 3.7871625423431396, 3.916557788848877, 4.045952796936035, 4.175348281860352]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 9.0, 3.0, 9.0, 9.0, 8.0, 4.0, 9.0, 12.0, 13.0, 21.0, 10.0, 11.0, 26.0, 20.0, 27.0, 18.0, 30.0, 35.0, 41.0, 20.0, 42.0, 31.0, 46.0, 34.0, 26.0, 38.0, 30.0, 28.0, 42.0, 40.0, 38.0, 27.0, 30.0, 22.0, 29.0, 19.0, 26.0, 18.0, 15.0, 13.0, 12.0, 9.0, 8.0, 11.0, 4.0, 11.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.072899341583252, -2.0089309215545654, -1.944962739944458, -1.880994439125061, -1.817026138305664, -1.7530577182769775, -1.6890894174575806, -1.6251211166381836, -1.5611528158187866, -1.4971845149993896, -1.4332162141799927, -1.3692479133605957, -1.3052794933319092, -1.2413113117218018, -1.1773428916931152, -1.1133745908737183, -1.0494062900543213, -0.9854379892349243, -0.9214696884155273, -0.8575013279914856, -0.7935330271720886, -0.7295647263526917, -0.6655963659286499, -0.6016280651092529, -0.537659764289856, -0.473691463470459, -0.4097231328487396, -0.34575480222702026, -0.2817865014076233, -0.21781820058822632, -0.15384986996650696, -0.0898815393447876, -0.025913476943969727, 0.03805483877658844, 0.1020231544971466, 0.16599147021770477, 0.22995978593826294, 0.2939280867576599, 0.3578964173793793, 0.42186474800109863, 0.4858330488204956, 0.5498013496398926, 0.6137696504592896, 0.6777380108833313, 0.7417063117027283, 0.8056746125221252, 0.869642972946167, 0.933611273765564, 0.9975795745849609, 1.061547875404358, 1.1255161762237549, 1.1894844770431519, 1.2534527778625488, 1.3174211978912354, 1.3813894987106323, 1.4453577995300293, 1.5093261003494263, 1.5732944011688232, 1.6372627019882202, 1.7012310028076172, 1.7651994228363037, 1.8291676044464111, 1.8931360244750977, 1.9571043252944946, 2.0210726261138916]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 10.0, 8.0, 4.0, 12.0, 13.0, 23.0, 41.0, 65.0, 101.0, 136.0, 212.0, 268.0, 459.0, 564.0, 945.0, 1373.0, 2114.0, 3216.0, 5160.0, 7911.0, 12904.0, 20939.0, 33283.0, 52149.0, 79049.0, 110845.0, 139571.0, 148253.0, 132619.0, 101741.0, 70122.0, 46263.0, 28879.0, 18109.0, 11248.0, 6978.0, 4472.0, 2900.0, 1826.0, 1247.0, 784.0, 566.0, 340.0, 252.0, 176.0, 130.0, 86.0, 61.0, 49.0, 34.0, 11.0, 23.0, 3.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.853515625, -1.794403076171875, -1.73529052734375, -1.676177978515625, -1.6170654296875, -1.557952880859375, -1.49884033203125, -1.439727783203125, -1.380615234375, -1.321502685546875, -1.26239013671875, -1.203277587890625, -1.1441650390625, -1.085052490234375, -1.02593994140625, -0.966827392578125, -0.90771484375, -0.848602294921875, -0.78948974609375, -0.730377197265625, -0.6712646484375, -0.612152099609375, -0.55303955078125, -0.493927001953125, -0.434814453125, -0.375701904296875, -0.31658935546875, -0.257476806640625, -0.1983642578125, -0.139251708984375, -0.08013916015625, -0.021026611328125, 0.0380859375, 0.097198486328125, 0.15631103515625, 0.215423583984375, 0.2745361328125, 0.333648681640625, 0.39276123046875, 0.451873779296875, 0.510986328125, 0.570098876953125, 0.62921142578125, 0.688323974609375, 0.7474365234375, 0.806549072265625, 0.86566162109375, 0.924774169921875, 0.98388671875, 1.042999267578125, 1.10211181640625, 1.161224365234375, 1.2203369140625, 1.279449462890625, 1.33856201171875, 1.397674560546875, 1.456787109375, 1.515899658203125, 1.57501220703125, 1.634124755859375, 1.6932373046875, 1.752349853515625, 1.81146240234375, 1.870574951171875, 1.9296875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 5.0, 5.0, 10.0, 19.0, 18.0, 13.0, 23.0, 24.0, 18.0, 25.0, 24.0, 40.0, 26.0, 34.0, 23.0, 39.0, 39.0, 33.0, 43.0, 39.0, 33.0, 30.0, 41.0, 40.0, 25.0, 42.0, 29.0, 30.0, 30.0, 29.0, 25.0, 21.0, 12.0, 16.0, 14.0, 13.0, 8.0, 8.0, 5.0, 6.0, 10.0, 9.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.38671875, -2.31341552734375, -2.2401123046875, -2.16680908203125, -2.093505859375, -2.02020263671875, -1.9468994140625, -1.87359619140625, -1.80029296875, -1.72698974609375, -1.6536865234375, -1.58038330078125, -1.507080078125, -1.43377685546875, -1.3604736328125, -1.28717041015625, -1.2138671875, -1.14056396484375, -1.0672607421875, -0.99395751953125, -0.920654296875, -0.84735107421875, -0.7740478515625, -0.70074462890625, -0.62744140625, -0.55413818359375, -0.4808349609375, -0.40753173828125, -0.334228515625, -0.26092529296875, -0.1876220703125, -0.11431884765625, -0.041015625, 0.03228759765625, 0.1055908203125, 0.17889404296875, 0.252197265625, 0.32550048828125, 0.3988037109375, 0.47210693359375, 0.54541015625, 0.61871337890625, 0.6920166015625, 0.76531982421875, 0.838623046875, 0.91192626953125, 0.9852294921875, 1.05853271484375, 1.1318359375, 1.20513916015625, 1.2784423828125, 1.35174560546875, 1.425048828125, 1.49835205078125, 1.5716552734375, 1.64495849609375, 1.71826171875, 1.79156494140625, 1.8648681640625, 1.93817138671875, 2.011474609375, 2.08477783203125, 2.1580810546875, 2.23138427734375, 2.3046875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 13.0, 10.0, 17.0, 35.0, 46.0, 70.0, 117.0, 188.0, 278.0, 469.0, 720.0, 1242.0, 2220.0, 3684.0, 6278.0, 11218.0, 20174.0, 36806.0, 66451.0, 114120.0, 169794.0, 197147.0, 165606.0, 108285.0, 63291.0, 35171.0, 19464.0, 10937.0, 6103.0, 3459.0, 1999.0, 1245.0, 718.0, 421.0, 282.0, 172.0, 116.0, 61.0, 51.0, 21.0, 19.0, 10.0, 5.0, 7.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5546875, -2.473480224609375, -2.39227294921875, -2.311065673828125, -2.2298583984375, -2.148651123046875, -2.06744384765625, -1.986236572265625, -1.905029296875, -1.823822021484375, -1.74261474609375, -1.661407470703125, -1.5802001953125, -1.498992919921875, -1.41778564453125, -1.336578369140625, -1.25537109375, -1.174163818359375, -1.09295654296875, -1.011749267578125, -0.9305419921875, -0.849334716796875, -0.76812744140625, -0.686920166015625, -0.605712890625, -0.524505615234375, -0.44329833984375, -0.362091064453125, -0.2808837890625, -0.199676513671875, -0.11846923828125, -0.037261962890625, 0.0439453125, 0.125152587890625, 0.20635986328125, 0.287567138671875, 0.3687744140625, 0.449981689453125, 0.53118896484375, 0.612396240234375, 0.693603515625, 0.774810791015625, 0.85601806640625, 0.937225341796875, 1.0184326171875, 1.099639892578125, 1.18084716796875, 1.262054443359375, 1.34326171875, 1.424468994140625, 1.50567626953125, 1.586883544921875, 1.6680908203125, 1.749298095703125, 1.83050537109375, 1.911712646484375, 1.992919921875, 2.074127197265625, 2.15533447265625, 2.236541748046875, 2.3177490234375, 2.398956298828125, 2.48016357421875, 2.561370849609375, 2.642578125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 9.0, 5.0, 9.0, 4.0, 10.0, 7.0, 8.0, 18.0, 21.0, 5.0, 16.0, 23.0, 17.0, 29.0, 28.0, 28.0, 29.0, 29.0, 38.0, 38.0, 36.0, 36.0, 35.0, 31.0, 42.0, 33.0, 27.0, 36.0, 23.0, 31.0, 30.0, 28.0, 30.0, 29.0, 26.0, 18.0, 14.0, 18.0, 14.0, 12.0, 8.0, 17.0, 7.0, 7.0, 10.0, 11.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.330078125, -1.2884979248046875, -1.246917724609375, -1.2053375244140625, -1.16375732421875, -1.1221771240234375, -1.080596923828125, -1.0390167236328125, -0.9974365234375, -0.9558563232421875, -0.914276123046875, -0.8726959228515625, -0.83111572265625, -0.7895355224609375, -0.747955322265625, -0.7063751220703125, -0.664794921875, -0.6232147216796875, -0.581634521484375, -0.5400543212890625, -0.49847412109375, -0.4568939208984375, -0.415313720703125, -0.3737335205078125, -0.3321533203125, -0.2905731201171875, -0.248992919921875, -0.2074127197265625, -0.16583251953125, -0.1242523193359375, -0.082672119140625, -0.0410919189453125, 0.00048828125, 0.0420684814453125, 0.083648681640625, 0.1252288818359375, 0.16680908203125, 0.2083892822265625, 0.249969482421875, 0.2915496826171875, 0.3331298828125, 0.3747100830078125, 0.416290283203125, 0.4578704833984375, 0.49945068359375, 0.5410308837890625, 0.582611083984375, 0.6241912841796875, 0.665771484375, 0.7073516845703125, 0.748931884765625, 0.7905120849609375, 0.83209228515625, 0.8736724853515625, 0.915252685546875, 0.9568328857421875, 0.9984130859375, 1.0399932861328125, 1.081573486328125, 1.1231536865234375, 1.16473388671875, 1.2063140869140625, 1.247894287109375, 1.2894744873046875, 1.3310546875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 11.0, 20.0, 26.0, 30.0, 44.0, 63.0, 82.0, 134.0, 191.0, 325.0, 412.0, 599.0, 876.0, 1553.0, 2397.0, 3997.0, 6607.0, 11744.0, 21367.0, 40468.0, 76684.0, 144638.0, 226565.0, 218787.0, 134974.0, 70775.0, 37184.0, 20312.0, 10968.0, 6317.0, 3827.0, 2363.0, 1437.0, 925.0, 614.0, 390.0, 252.0, 160.0, 134.0, 68.0, 80.0, 45.0, 30.0, 14.0, 15.0, 11.0, 9.0, 7.0, 6.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.6494140625, -1.5977783203125, -1.546142578125, -1.4945068359375, -1.44287109375, -1.3912353515625, -1.339599609375, -1.2879638671875, -1.236328125, -1.1846923828125, -1.133056640625, -1.0814208984375, -1.02978515625, -0.9781494140625, -0.926513671875, -0.8748779296875, -0.8232421875, -0.7716064453125, -0.719970703125, -0.6683349609375, -0.61669921875, -0.5650634765625, -0.513427734375, -0.4617919921875, -0.41015625, -0.3585205078125, -0.306884765625, -0.2552490234375, -0.20361328125, -0.1519775390625, -0.100341796875, -0.0487060546875, 0.0029296875, 0.0545654296875, 0.106201171875, 0.1578369140625, 0.20947265625, 0.2611083984375, 0.312744140625, 0.3643798828125, 0.416015625, 0.4676513671875, 0.519287109375, 0.5709228515625, 0.62255859375, 0.6741943359375, 0.725830078125, 0.7774658203125, 0.8291015625, 0.8807373046875, 0.932373046875, 0.9840087890625, 1.03564453125, 1.0872802734375, 1.138916015625, 1.1905517578125, 1.2421875, 1.2938232421875, 1.345458984375, 1.3970947265625, 1.44873046875, 1.5003662109375, 1.552001953125, 1.6036376953125, 1.6552734375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 7.0, 4.0, 4.0, 6.0, 6.0, 16.0, 16.0, 17.0, 21.0, 25.0, 28.0, 39.0, 52.0, 68.0, 70.0, 78.0, 82.0, 74.0, 84.0, 62.0, 48.0, 40.0, 33.0, 25.0, 21.0, 19.0, 11.0, 8.0, 8.0, 3.0, 11.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0001614093780517578, -0.00015684589743614197, -0.00015228241682052612, -0.00014771893620491028, -0.00014315545558929443, -0.0001385919749736786, -0.00013402849435806274, -0.0001294650137424469, -0.00012490153312683105, -0.00012033805251121521, -0.00011577457189559937, -0.00011121109127998352, -0.00010664761066436768, -0.00010208413004875183, -9.752064943313599e-05, -9.295716881752014e-05, -8.83936882019043e-05, -8.383020758628845e-05, -7.926672697067261e-05, -7.470324635505676e-05, -7.013976573944092e-05, -6.557628512382507e-05, -6.101280450820923e-05, -5.6449323892593384e-05, -5.188584327697754e-05, -4.7322362661361694e-05, -4.275888204574585e-05, -3.8195401430130005e-05, -3.363192081451416e-05, -2.9068440198898315e-05, -2.450495958328247e-05, -1.9941478967666626e-05, -1.537799835205078e-05, -1.0814517736434937e-05, -6.251037120819092e-06, -1.687556505203247e-06, 2.8759241104125977e-06, 7.439404726028442e-06, 1.2002885341644287e-05, 1.6566365957260132e-05, 2.1129846572875977e-05, 2.569332718849182e-05, 3.0256807804107666e-05, 3.482028841972351e-05, 3.9383769035339355e-05, 4.39472496509552e-05, 4.8510730266571045e-05, 5.307421088218689e-05, 5.7637691497802734e-05, 6.220117211341858e-05, 6.676465272903442e-05, 7.132813334465027e-05, 7.589161396026611e-05, 8.045509457588196e-05, 8.50185751914978e-05, 8.958205580711365e-05, 9.414553642272949e-05, 9.870901703834534e-05, 0.00010327249765396118, 0.00010783597826957703, 0.00011239945888519287, 0.00011696293950080872, 0.00012152642011642456, 0.0001260899007320404, 0.00013065338134765625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 5.0, 7.0, 10.0, 12.0, 21.0, 19.0, 26.0, 40.0, 60.0, 77.0, 104.0, 140.0, 215.0, 274.0, 382.0, 589.0, 813.0, 1237.0, 1789.0, 2647.0, 4317.0, 6908.0, 11380.0, 19107.0, 34487.0, 63486.0, 116322.0, 186701.0, 217745.0, 163481.0, 94409.0, 51749.0, 27877.0, 15826.0, 9462.0, 5698.0, 3615.0, 2417.0, 1537.0, 1056.0, 736.0, 479.0, 380.0, 241.0, 203.0, 151.0, 78.0, 60.0, 54.0, 39.0, 27.0, 21.0, 18.0, 15.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0], "bins": [-1.498046875, -1.4517059326171875, -1.405364990234375, -1.3590240478515625, -1.31268310546875, -1.2663421630859375, -1.220001220703125, -1.1736602783203125, -1.1273193359375, -1.0809783935546875, -1.034637451171875, -0.9882965087890625, -0.94195556640625, -0.8956146240234375, -0.849273681640625, -0.8029327392578125, -0.756591796875, -0.7102508544921875, -0.663909912109375, -0.6175689697265625, -0.57122802734375, -0.5248870849609375, -0.478546142578125, -0.4322052001953125, -0.3858642578125, -0.3395233154296875, -0.293182373046875, -0.2468414306640625, -0.20050048828125, -0.1541595458984375, -0.107818603515625, -0.0614776611328125, -0.01513671875, 0.0312042236328125, 0.077545166015625, 0.1238861083984375, 0.17022705078125, 0.2165679931640625, 0.262908935546875, 0.3092498779296875, 0.3555908203125, 0.4019317626953125, 0.448272705078125, 0.4946136474609375, 0.54095458984375, 0.5872955322265625, 0.633636474609375, 0.6799774169921875, 0.726318359375, 0.7726593017578125, 0.819000244140625, 0.8653411865234375, 0.91168212890625, 0.9580230712890625, 1.004364013671875, 1.0507049560546875, 1.0970458984375, 1.1433868408203125, 1.189727783203125, 1.2360687255859375, 1.28240966796875, 1.3287506103515625, 1.375091552734375, 1.4214324951171875, 1.4677734375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 9.0, 8.0, 14.0, 15.0, 14.0, 28.0, 30.0, 43.0, 59.0, 56.0, 65.0, 76.0, 96.0, 74.0, 59.0, 65.0, 57.0, 56.0, 41.0, 24.0, 21.0, 18.0, 17.0, 15.0, 9.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49853515625, -0.482269287109375, -0.46600341796875, -0.449737548828125, -0.4334716796875, -0.417205810546875, -0.40093994140625, -0.384674072265625, -0.368408203125, -0.352142333984375, -0.33587646484375, -0.319610595703125, -0.3033447265625, -0.287078857421875, -0.27081298828125, -0.254547119140625, -0.23828125, -0.222015380859375, -0.20574951171875, -0.189483642578125, -0.1732177734375, -0.156951904296875, -0.14068603515625, -0.124420166015625, -0.108154296875, -0.091888427734375, -0.07562255859375, -0.059356689453125, -0.0430908203125, -0.026824951171875, -0.01055908203125, 0.005706787109375, 0.02197265625, 0.038238525390625, 0.05450439453125, 0.070770263671875, 0.0870361328125, 0.103302001953125, 0.11956787109375, 0.135833740234375, 0.152099609375, 0.168365478515625, 0.18463134765625, 0.200897216796875, 0.2171630859375, 0.233428955078125, 0.24969482421875, 0.265960693359375, 0.2822265625, 0.298492431640625, 0.31475830078125, 0.331024169921875, 0.3472900390625, 0.363555908203125, 0.37982177734375, 0.396087646484375, 0.412353515625, 0.428619384765625, 0.44488525390625, 0.461151123046875, 0.4774169921875, 0.493682861328125, 0.50994873046875, 0.526214599609375, 0.54248046875]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 8.0, 8.0, 10.0, 14.0, 16.0, 22.0, 29.0, 36.0, 28.0, 40.0, 43.0, 52.0, 70.0, 64.0, 70.0, 76.0, 52.0, 62.0, 38.0, 39.0, 32.0, 38.0, 28.0, 21.0, 20.0, 13.0, 6.0, 8.0, 5.0, 3.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.877723455429077, -3.7642858028411865, -3.650848388671875, -3.5374107360839844, -3.4239730834960938, -3.310535430908203, -3.1970980167388916, -3.083660364151001, -2.9702229499816895, -2.856785297393799, -2.7433478832244873, -2.6299102306365967, -2.516472578048706, -2.4030351638793945, -2.289597511291504, -2.1761598587036133, -2.0627222061157227, -1.9492846727371216, -1.835847020149231, -1.7224094867706299, -1.6089718341827393, -1.4955343008041382, -1.382096767425537, -1.2686591148376465, -1.1552215814590454, -1.0417840480804443, -0.9283463954925537, -0.8149088621139526, -0.7014712691307068, -0.5880336761474609, -0.47459614276885986, -0.361158549785614, -0.24772119522094727, -0.1342836171388626, -0.020846039056777954, 0.09259152412414551, 0.20602911710739136, 0.3194667100906372, 0.4329042434692383, 0.5463418364524841, 0.65977942943573, 0.7732170224189758, 0.8866546154022217, 1.0000921487808228, 1.1135296821594238, 1.2269673347473145, 1.3404048681259155, 1.4538424015045166, 1.5672800540924072, 1.6807175874710083, 1.794155240058899, 1.9075927734375, 2.0210304260253906, 2.1344680786132812, 2.2479054927825928, 2.3613431453704834, 2.474780559539795, 2.5882182121276855, 2.701655626296997, 2.8150932788848877, 2.9285309314727783, 3.04196834564209, 3.1554059982299805, 3.268843650817871, 3.3822813034057617]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 5.0, 5.0, 3.0, 5.0, 6.0, 17.0, 8.0, 16.0, 11.0, 15.0, 18.0, 23.0, 16.0, 21.0, 18.0, 28.0, 34.0, 27.0, 38.0, 47.0, 36.0, 40.0, 32.0, 37.0, 41.0, 39.0, 38.0, 42.0, 35.0, 27.0, 33.0, 38.0, 20.0, 20.0, 19.0, 25.0, 21.0, 19.0, 12.0, 14.0, 13.0, 6.0, 11.0, 4.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1356964111328125, -2.069744825363159, -2.003793239593506, -1.9378416538238525, -1.8718900680541992, -1.805938482284546, -1.7399868965148926, -1.6740353107452393, -1.608083724975586, -1.5421321392059326, -1.4761805534362793, -1.410228967666626, -1.3442773818969727, -1.2783257961273193, -1.212374210357666, -1.1464226245880127, -1.0804709196090698, -1.0145193338394165, -0.9485677480697632, -0.8826161623001099, -0.8166645765304565, -0.7507129907608032, -0.6847613453865051, -0.6188097596168518, -0.5528581738471985, -0.48690658807754517, -0.42095500230789185, -0.35500338673591614, -0.2890518009662628, -0.2231002151966095, -0.1571485996246338, -0.09119701385498047, -0.02524542808532715, 0.04070616513490677, 0.10665775835514069, 0.1726093590259552, 0.23856094479560852, 0.30451253056526184, 0.37046414613723755, 0.43641573190689087, 0.5023673176765442, 0.5683189034461975, 0.6342704892158508, 0.7002221345901489, 0.7661737203598022, 0.8321253061294556, 0.8980768918991089, 0.9640284776687622, 1.0299800634384155, 1.0959316492080688, 1.1618832349777222, 1.2278348207473755, 1.2937864065170288, 1.3597379922866821, 1.425689697265625, 1.4916412830352783, 1.5575928688049316, 1.623544454574585, 1.6894960403442383, 1.7554476261138916, 1.821399211883545, 1.8873507976531982, 1.9533023834228516, 2.019253969192505, 2.085205554962158]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 11.0, 12.0, 11.0, 30.0, 40.0, 48.0, 89.0, 134.0, 200.0, 299.0, 457.0, 687.0, 1075.0, 1727.0, 2750.0, 4598.0, 8223.0, 15491.0, 30653.0, 69691.0, 189800.0, 610057.0, 1488332.0, 1169937.0, 375590.0, 121340.0, 48895.0, 23296.0, 12348.0, 6966.0, 4294.0, 2509.0, 1600.0, 1047.0, 701.0, 423.0, 313.0, 187.0, 138.0, 85.0, 63.0, 46.0, 23.0, 21.0, 16.0, 9.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-4.625, -4.4840087890625, -4.343017578125, -4.2020263671875, -4.06103515625, -3.9200439453125, -3.779052734375, -3.6380615234375, -3.4970703125, -3.3560791015625, -3.215087890625, -3.0740966796875, -2.93310546875, -2.7921142578125, -2.651123046875, -2.5101318359375, -2.369140625, -2.2281494140625, -2.087158203125, -1.9461669921875, -1.80517578125, -1.6641845703125, -1.523193359375, -1.3822021484375, -1.2412109375, -1.1002197265625, -0.959228515625, -0.8182373046875, -0.67724609375, -0.5362548828125, -0.395263671875, -0.2542724609375, -0.11328125, 0.0277099609375, 0.168701171875, 0.3096923828125, 0.45068359375, 0.5916748046875, 0.732666015625, 0.8736572265625, 1.0146484375, 1.1556396484375, 1.296630859375, 1.4376220703125, 1.57861328125, 1.7196044921875, 1.860595703125, 2.0015869140625, 2.142578125, 2.2835693359375, 2.424560546875, 2.5655517578125, 2.70654296875, 2.8475341796875, 2.988525390625, 3.1295166015625, 3.2705078125, 3.4114990234375, 3.552490234375, 3.6934814453125, 3.83447265625, 3.9754638671875, 4.116455078125, 4.2574462890625, 4.3984375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 6.0, 1.0, 7.0, 5.0, 8.0, 9.0, 7.0, 11.0, 8.0, 17.0, 17.0, 20.0, 17.0, 17.0, 30.0, 26.0, 36.0, 37.0, 39.0, 38.0, 35.0, 47.0, 37.0, 48.0, 34.0, 42.0, 24.0, 31.0, 49.0, 40.0, 34.0, 31.0, 35.0, 26.0, 20.0, 24.0, 18.0, 11.0, 10.0, 8.0, 12.0, 8.0, 7.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.62109375, -1.5695037841796875, -1.517913818359375, -1.4663238525390625, -1.41473388671875, -1.3631439208984375, -1.311553955078125, -1.2599639892578125, -1.2083740234375, -1.1567840576171875, -1.105194091796875, -1.0536041259765625, -1.00201416015625, -0.9504241943359375, -0.898834228515625, -0.8472442626953125, -0.795654296875, -0.7440643310546875, -0.692474365234375, -0.6408843994140625, -0.58929443359375, -0.5377044677734375, -0.486114501953125, -0.4345245361328125, -0.3829345703125, -0.3313446044921875, -0.279754638671875, -0.2281646728515625, -0.17657470703125, -0.1249847412109375, -0.073394775390625, -0.0218048095703125, 0.02978515625, 0.0813751220703125, 0.132965087890625, 0.1845550537109375, 0.23614501953125, 0.2877349853515625, 0.339324951171875, 0.3909149169921875, 0.4425048828125, 0.4940948486328125, 0.545684814453125, 0.5972747802734375, 0.64886474609375, 0.7004547119140625, 0.752044677734375, 0.8036346435546875, 0.855224609375, 0.9068145751953125, 0.958404541015625, 1.0099945068359375, 1.06158447265625, 1.1131744384765625, 1.164764404296875, 1.2163543701171875, 1.2679443359375, 1.3195343017578125, 1.371124267578125, 1.4227142333984375, 1.47430419921875, 1.5258941650390625, 1.577484130859375, 1.6290740966796875, 1.6806640625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 13.0, 28.0, 25.0, 51.0, 63.0, 92.0, 122.0, 187.0, 257.0, 359.0, 511.0, 746.0, 1123.0, 1671.0, 2397.0, 3620.0, 5532.0, 8927.0, 14110.0, 23500.0, 40214.0, 73569.0, 143731.0, 303259.0, 673455.0, 1168290.0, 897465.0, 417855.0, 191582.0, 94624.0, 50737.0, 28747.0, 16994.0, 10628.0, 6703.0, 4201.0, 2876.0, 1845.0, 1270.0, 934.0, 617.0, 415.0, 297.0, 228.0, 116.0, 107.0, 63.0, 31.0, 35.0, 20.0, 12.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0], "bins": [-3.705078125, -3.591766357421875, -3.47845458984375, -3.365142822265625, -3.2518310546875, -3.138519287109375, -3.02520751953125, -2.911895751953125, -2.798583984375, -2.685272216796875, -2.57196044921875, -2.458648681640625, -2.3453369140625, -2.232025146484375, -2.11871337890625, -2.005401611328125, -1.89208984375, -1.778778076171875, -1.66546630859375, -1.552154541015625, -1.4388427734375, -1.325531005859375, -1.21221923828125, -1.098907470703125, -0.985595703125, -0.872283935546875, -0.75897216796875, -0.645660400390625, -0.5323486328125, -0.419036865234375, -0.30572509765625, -0.192413330078125, -0.0791015625, 0.034210205078125, 0.14752197265625, 0.260833740234375, 0.3741455078125, 0.487457275390625, 0.60076904296875, 0.714080810546875, 0.827392578125, 0.940704345703125, 1.05401611328125, 1.167327880859375, 1.2806396484375, 1.393951416015625, 1.50726318359375, 1.620574951171875, 1.73388671875, 1.847198486328125, 1.96051025390625, 2.073822021484375, 2.1871337890625, 2.300445556640625, 2.41375732421875, 2.527069091796875, 2.640380859375, 2.753692626953125, 2.86700439453125, 2.980316162109375, 3.0936279296875, 3.206939697265625, 3.32025146484375, 3.433563232421875, 3.546875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 6.0, 3.0, 6.0, 7.0, 5.0, 13.0, 13.0, 20.0, 18.0, 15.0, 26.0, 40.0, 51.0, 37.0, 68.0, 80.0, 105.0, 135.0, 162.0, 235.0, 238.0, 306.0, 298.0, 327.0, 333.0, 273.0, 273.0, 185.0, 161.0, 116.0, 108.0, 104.0, 72.0, 52.0, 46.0, 23.0, 24.0, 17.0, 18.0, 16.0, 10.0, 8.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.220703125, -1.186004638671875, -1.15130615234375, -1.116607666015625, -1.0819091796875, -1.047210693359375, -1.01251220703125, -0.977813720703125, -0.943115234375, -0.908416748046875, -0.87371826171875, -0.839019775390625, -0.8043212890625, -0.769622802734375, -0.73492431640625, -0.700225830078125, -0.66552734375, -0.630828857421875, -0.59613037109375, -0.561431884765625, -0.5267333984375, -0.492034912109375, -0.45733642578125, -0.422637939453125, -0.387939453125, -0.353240966796875, -0.31854248046875, -0.283843994140625, -0.2491455078125, -0.214447021484375, -0.17974853515625, -0.145050048828125, -0.1103515625, -0.075653076171875, -0.04095458984375, -0.006256103515625, 0.0284423828125, 0.063140869140625, 0.09783935546875, 0.132537841796875, 0.167236328125, 0.201934814453125, 0.23663330078125, 0.271331787109375, 0.3060302734375, 0.340728759765625, 0.37542724609375, 0.410125732421875, 0.44482421875, 0.479522705078125, 0.51422119140625, 0.548919677734375, 0.5836181640625, 0.618316650390625, 0.65301513671875, 0.687713623046875, 0.722412109375, 0.757110595703125, 0.79180908203125, 0.826507568359375, 0.8612060546875, 0.895904541015625, 0.93060302734375, 0.965301513671875, 1.0]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 10.0, 7.0, 11.0, 14.0, 12.0, 23.0, 33.0, 33.0, 39.0, 61.0, 80.0, 94.0, 84.0, 78.0, 99.0, 74.0, 58.0, 41.0, 31.0, 22.0, 23.0, 17.0, 11.0, 12.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.556830883026123, -5.396080493927002, -5.235330104827881, -5.074579238891602, -4.9138288497924805, -4.753078460693359, -4.592328071594238, -4.431577682495117, -4.270827293395996, -4.110076904296875, -3.949326276779175, -3.7885758876800537, -3.6278252601623535, -3.4670748710632324, -3.3063244819641113, -3.1455740928649902, -2.984823226928711, -2.82407283782959, -2.6633222103118896, -2.5025718212127686, -2.3418211936950684, -2.1810708045959473, -2.020320415496826, -1.8595699071884155, -1.6988193988800049, -1.5380688905715942, -1.3773183822631836, -1.2165679931640625, -1.0558174848556519, -0.8950669765472412, -0.7343165278434753, -0.5735660791397095, -0.4128150939941406, -0.25206461548805237, -0.09131413698196411, 0.06943634152412415, 0.2301868200302124, 0.39093732833862305, 0.5516877770423889, 0.7124382257461548, 0.8731887340545654, 1.033939242362976, 1.1946897506713867, 1.3554401397705078, 1.5161906480789185, 1.676941156387329, 1.8376915454864502, 1.9984420537948608, 2.1591925621032715, 2.3199429512023926, 2.4806935787200928, 2.641443967819214, 2.802194595336914, 2.962944984436035, 3.1236953735351562, 3.2844457626342773, 3.4451963901519775, 3.6059467792510986, 3.766697406768799, 3.92744779586792, 4.088198184967041, 4.24894905090332, 4.409699440002441, 4.5704498291015625, 4.731200218200684]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 0.0, 4.0, 4.0, 5.0, 8.0, 10.0, 10.0, 16.0, 11.0, 14.0, 12.0, 13.0, 22.0, 28.0, 21.0, 25.0, 32.0, 42.0, 37.0, 35.0, 43.0, 50.0, 44.0, 39.0, 46.0, 37.0, 43.0, 35.0, 20.0, 33.0, 35.0, 23.0, 24.0, 28.0, 23.0, 22.0, 23.0, 9.0, 22.0, 8.0, 9.0, 6.0, 4.0, 5.0, 6.0, 5.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0998904705047607, -2.034689426422119, -1.9694881439208984, -1.9042869806289673, -1.8390858173370361, -1.773884654045105, -1.7086834907531738, -1.6434824466705322, -1.5782811641693115, -1.5130800008773804, -1.4478788375854492, -1.382677674293518, -1.317476511001587, -1.2522753477096558, -1.1870741844177246, -1.121873140335083, -1.0566719770431519, -0.9914708137512207, -0.9262696504592896, -0.8610684871673584, -0.7958673238754272, -0.7306661605834961, -0.6654650568962097, -0.6002638936042786, -0.5350627303123474, -0.46986156702041626, -0.4046604037284851, -0.33945927023887634, -0.2742581069469452, -0.20905694365501404, -0.14385581016540527, -0.07865464687347412, -0.013453483581542969, 0.05174767225980759, 0.11694882810115814, 0.1821499764919281, 0.24735113978385925, 0.3125523030757904, 0.37775343656539917, 0.4429545998573303, 0.5081557631492615, 0.5733569264411926, 0.6385580897331238, 0.7037591934204102, 0.7689603567123413, 0.8341615200042725, 0.8993626832962036, 0.9645638465881348, 1.029765009880066, 1.094966173171997, 1.1601673364639282, 1.2253684997558594, 1.2905696630477905, 1.3557708263397217, 1.4209718704223633, 1.486173152923584, 1.5513741970062256, 1.6165753602981567, 1.681776523590088, 1.746977686882019, 1.8121788501739502, 1.8773800134658813, 1.9425811767578125, 2.007782220840454, 2.072983503341675]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 13.0, 22.0, 26.0, 43.0, 59.0, 70.0, 122.0, 165.0, 302.0, 443.0, 684.0, 1138.0, 1952.0, 3296.0, 5603.0, 10346.0, 19197.0, 37606.0, 75495.0, 148129.0, 238740.0, 228533.0, 134726.0, 68012.0, 33728.0, 17539.0, 9588.0, 5202.0, 3014.0, 1727.0, 1091.0, 689.0, 435.0, 276.0, 155.0, 99.0, 88.0, 52.0, 41.0, 21.0, 16.0, 11.0, 11.0, 14.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 4.0], "bins": [-2.35546875, -2.286041259765625, -2.21661376953125, -2.147186279296875, -2.0777587890625, -2.008331298828125, -1.93890380859375, -1.869476318359375, -1.800048828125, -1.730621337890625, -1.66119384765625, -1.591766357421875, -1.5223388671875, -1.452911376953125, -1.38348388671875, -1.314056396484375, -1.24462890625, -1.175201416015625, -1.10577392578125, -1.036346435546875, -0.9669189453125, -0.897491455078125, -0.82806396484375, -0.758636474609375, -0.689208984375, -0.619781494140625, -0.55035400390625, -0.480926513671875, -0.4114990234375, -0.342071533203125, -0.27264404296875, -0.203216552734375, -0.1337890625, -0.064361572265625, 0.00506591796875, 0.074493408203125, 0.1439208984375, 0.213348388671875, 0.28277587890625, 0.352203369140625, 0.421630859375, 0.491058349609375, 0.56048583984375, 0.629913330078125, 0.6993408203125, 0.768768310546875, 0.83819580078125, 0.907623291015625, 0.97705078125, 1.046478271484375, 1.11590576171875, 1.185333251953125, 1.2547607421875, 1.324188232421875, 1.39361572265625, 1.463043212890625, 1.532470703125, 1.601898193359375, 1.67132568359375, 1.740753173828125, 1.8101806640625, 1.879608154296875, 1.94903564453125, 2.018463134765625, 2.087890625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 4.0, 5.0, 2.0, 7.0, 5.0, 8.0, 11.0, 9.0, 13.0, 9.0, 21.0, 11.0, 19.0, 23.0, 26.0, 21.0, 27.0, 35.0, 21.0, 35.0, 33.0, 42.0, 44.0, 40.0, 42.0, 36.0, 23.0, 38.0, 34.0, 44.0, 35.0, 32.0, 31.0, 31.0, 27.0, 21.0, 19.0, 17.0, 19.0, 10.0, 13.0, 7.0, 14.0, 9.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.130859375, -2.063262939453125, -1.99566650390625, -1.928070068359375, -1.8604736328125, -1.792877197265625, -1.72528076171875, -1.657684326171875, -1.590087890625, -1.522491455078125, -1.45489501953125, -1.387298583984375, -1.3197021484375, -1.252105712890625, -1.18450927734375, -1.116912841796875, -1.04931640625, -0.981719970703125, -0.91412353515625, -0.846527099609375, -0.7789306640625, -0.711334228515625, -0.64373779296875, -0.576141357421875, -0.508544921875, -0.440948486328125, -0.37335205078125, -0.305755615234375, -0.2381591796875, -0.170562744140625, -0.10296630859375, -0.035369873046875, 0.0322265625, 0.099822998046875, 0.16741943359375, 0.235015869140625, 0.3026123046875, 0.370208740234375, 0.43780517578125, 0.505401611328125, 0.572998046875, 0.640594482421875, 0.70819091796875, 0.775787353515625, 0.8433837890625, 0.910980224609375, 0.97857666015625, 1.046173095703125, 1.11376953125, 1.181365966796875, 1.24896240234375, 1.316558837890625, 1.3841552734375, 1.451751708984375, 1.51934814453125, 1.586944580078125, 1.654541015625, 1.722137451171875, 1.78973388671875, 1.857330322265625, 1.9249267578125, 1.992523193359375, 2.06011962890625, 2.127716064453125, 2.1953125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 0.0, 7.0, 1.0, 4.0, 5.0, 9.0, 22.0, 29.0, 37.0, 56.0, 68.0, 109.0, 154.0, 204.0, 362.0, 516.0, 893.0, 1717.0, 3772.0, 9270.0, 26451.0, 87285.0, 301345.0, 416661.0, 136378.0, 39735.0, 13257.0, 5032.0, 2262.0, 1123.0, 613.0, 394.0, 247.0, 169.0, 134.0, 70.0, 56.0, 38.0, 17.0, 9.0, 19.0, 11.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.813323974609375, -3.66766357421875, -3.522003173828125, -3.3763427734375, -3.230682373046875, -3.08502197265625, -2.939361572265625, -2.793701171875, -2.648040771484375, -2.50238037109375, -2.356719970703125, -2.2110595703125, -2.065399169921875, -1.91973876953125, -1.774078369140625, -1.62841796875, -1.482757568359375, -1.33709716796875, -1.191436767578125, -1.0457763671875, -0.900115966796875, -0.75445556640625, -0.608795166015625, -0.463134765625, -0.317474365234375, -0.17181396484375, -0.026153564453125, 0.1195068359375, 0.265167236328125, 0.41082763671875, 0.556488037109375, 0.7021484375, 0.847808837890625, 0.99346923828125, 1.139129638671875, 1.2847900390625, 1.430450439453125, 1.57611083984375, 1.721771240234375, 1.867431640625, 2.013092041015625, 2.15875244140625, 2.304412841796875, 2.4500732421875, 2.595733642578125, 2.74139404296875, 2.887054443359375, 3.03271484375, 3.178375244140625, 3.32403564453125, 3.469696044921875, 3.6153564453125, 3.761016845703125, 3.90667724609375, 4.052337646484375, 4.197998046875, 4.343658447265625, 4.48931884765625, 4.634979248046875, 4.7806396484375, 4.926300048828125, 5.07196044921875, 5.217620849609375, 5.36328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 3.0, 13.0, 8.0, 13.0, 12.0, 17.0, 22.0, 18.0, 22.0, 22.0, 19.0, 32.0, 38.0, 41.0, 35.0, 54.0, 46.0, 38.0, 47.0, 36.0, 33.0, 43.0, 34.0, 47.0, 34.0, 41.0, 33.0, 18.0, 39.0, 26.0, 19.0, 21.0, 17.0, 11.0, 5.0, 11.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5517578125, -1.50567626953125, -1.4595947265625, -1.41351318359375, -1.367431640625, -1.32135009765625, -1.2752685546875, -1.22918701171875, -1.18310546875, -1.13702392578125, -1.0909423828125, -1.04486083984375, -0.998779296875, -0.95269775390625, -0.9066162109375, -0.86053466796875, -0.814453125, -0.76837158203125, -0.7222900390625, -0.67620849609375, -0.630126953125, -0.58404541015625, -0.5379638671875, -0.49188232421875, -0.44580078125, -0.39971923828125, -0.3536376953125, -0.30755615234375, -0.261474609375, -0.21539306640625, -0.1693115234375, -0.12322998046875, -0.0771484375, -0.03106689453125, 0.0150146484375, 0.06109619140625, 0.107177734375, 0.15325927734375, 0.1993408203125, 0.24542236328125, 0.29150390625, 0.33758544921875, 0.3836669921875, 0.42974853515625, 0.475830078125, 0.52191162109375, 0.5679931640625, 0.61407470703125, 0.66015625, 0.70623779296875, 0.7523193359375, 0.79840087890625, 0.844482421875, 0.89056396484375, 0.9366455078125, 0.98272705078125, 1.02880859375, 1.07489013671875, 1.1209716796875, 1.16705322265625, 1.213134765625, 1.25921630859375, 1.3052978515625, 1.35137939453125, 1.3974609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 10.0, 22.0, 23.0, 21.0, 50.0, 67.0, 96.0, 142.0, 194.0, 292.0, 391.0, 628.0, 897.0, 1394.0, 2252.0, 3600.0, 5890.0, 10532.0, 19476.0, 38272.0, 83617.0, 190138.0, 315340.0, 198734.0, 87910.0, 40554.0, 20321.0, 11042.0, 6351.0, 3686.0, 2280.0, 1447.0, 989.0, 583.0, 423.0, 253.0, 197.0, 126.0, 88.0, 62.0, 40.0, 41.0, 23.0, 19.0, 14.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.2368316650390625, -1.196319580078125, -1.1558074951171875, -1.11529541015625, -1.0747833251953125, -1.034271240234375, -0.9937591552734375, -0.9532470703125, -0.9127349853515625, -0.872222900390625, -0.8317108154296875, -0.79119873046875, -0.7506866455078125, -0.710174560546875, -0.6696624755859375, -0.629150390625, -0.5886383056640625, -0.548126220703125, -0.5076141357421875, -0.46710205078125, -0.4265899658203125, -0.386077880859375, -0.3455657958984375, -0.3050537109375, -0.2645416259765625, -0.224029541015625, -0.1835174560546875, -0.14300537109375, -0.1024932861328125, -0.061981201171875, -0.0214691162109375, 0.01904296875, 0.0595550537109375, 0.100067138671875, 0.1405792236328125, 0.18109130859375, 0.2216033935546875, 0.262115478515625, 0.3026275634765625, 0.3431396484375, 0.3836517333984375, 0.424163818359375, 0.4646759033203125, 0.50518798828125, 0.5457000732421875, 0.586212158203125, 0.6267242431640625, 0.667236328125, 0.7077484130859375, 0.748260498046875, 0.7887725830078125, 0.82928466796875, 0.8697967529296875, 0.910308837890625, 0.9508209228515625, 0.9913330078125, 1.0318450927734375, 1.072357177734375, 1.1128692626953125, 1.15338134765625, 1.1938934326171875, 1.234405517578125, 1.2749176025390625, 1.3154296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 9.0, 3.0, 13.0, 13.0, 20.0, 35.0, 41.0, 72.0, 132.0, 150.0, 134.0, 114.0, 70.0, 60.0, 52.0, 20.0, 13.0, 9.0, 9.0, 8.0, 7.0, 1.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001093149185180664, -0.00010611582547426224, -0.00010291673243045807, -9.97176393866539e-05, -9.651854634284973e-05, -9.331945329904556e-05, -9.01203602552414e-05, -8.692126721143723e-05, -8.372217416763306e-05, -8.052308112382889e-05, -7.732398808002472e-05, -7.412489503622055e-05, -7.092580199241638e-05, -6.772670894861221e-05, -6.452761590480804e-05, -6.132852286100388e-05, -5.812942981719971e-05, -5.493033677339554e-05, -5.173124372959137e-05, -4.85321506857872e-05, -4.533305764198303e-05, -4.2133964598178864e-05, -3.8934871554374695e-05, -3.5735778510570526e-05, -3.253668546676636e-05, -2.933759242296219e-05, -2.613849937915802e-05, -2.293940633535385e-05, -1.9740313291549683e-05, -1.6541220247745514e-05, -1.3342127203941345e-05, -1.0143034160137177e-05, -6.943941116333008e-06, -3.744848072528839e-06, -5.457550287246704e-07, 2.6533380150794983e-06, 5.852431058883667e-06, 9.051524102687836e-06, 1.2250617146492004e-05, 1.5449710190296173e-05, 1.8648803234100342e-05, 2.184789627790451e-05, 2.504698932170868e-05, 2.8246082365512848e-05, 3.1445175409317017e-05, 3.4644268453121185e-05, 3.7843361496925354e-05, 4.104245454072952e-05, 4.424154758453369e-05, 4.744064062833786e-05, 5.063973367214203e-05, 5.38388267159462e-05, 5.7037919759750366e-05, 6.0237012803554535e-05, 6.34361058473587e-05, 6.663519889116287e-05, 6.983429193496704e-05, 7.303338497877121e-05, 7.623247802257538e-05, 7.943157106637955e-05, 8.263066411018372e-05, 8.582975715398788e-05, 8.902885019779205e-05, 9.222794324159622e-05, 9.542703628540039e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 0.0, 7.0, 4.0, 10.0, 10.0, 19.0, 24.0, 40.0, 63.0, 88.0, 133.0, 222.0, 365.0, 518.0, 812.0, 1401.0, 2547.0, 4670.0, 9570.0, 21715.0, 57286.0, 164441.0, 361943.0, 264422.0, 95130.0, 34291.0, 14088.0, 6464.0, 3509.0, 1862.0, 1134.0, 625.0, 400.0, 246.0, 162.0, 107.0, 69.0, 57.0, 26.0, 28.0, 16.0, 9.0, 11.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.67578125, -1.6275482177734375, -1.579315185546875, -1.5310821533203125, -1.48284912109375, -1.4346160888671875, -1.386383056640625, -1.3381500244140625, -1.2899169921875, -1.2416839599609375, -1.193450927734375, -1.1452178955078125, -1.09698486328125, -1.0487518310546875, -1.000518798828125, -0.9522857666015625, -0.904052734375, -0.8558197021484375, -0.807586669921875, -0.7593536376953125, -0.71112060546875, -0.6628875732421875, -0.614654541015625, -0.5664215087890625, -0.5181884765625, -0.4699554443359375, -0.421722412109375, -0.3734893798828125, -0.32525634765625, -0.2770233154296875, -0.228790283203125, -0.1805572509765625, -0.13232421875, -0.0840911865234375, -0.035858154296875, 0.0123748779296875, 0.06060791015625, 0.1088409423828125, 0.157073974609375, 0.2053070068359375, 0.2535400390625, 0.3017730712890625, 0.350006103515625, 0.3982391357421875, 0.44647216796875, 0.4947052001953125, 0.542938232421875, 0.5911712646484375, 0.639404296875, 0.6876373291015625, 0.735870361328125, 0.7841033935546875, 0.83233642578125, 0.8805694580078125, 0.928802490234375, 0.9770355224609375, 1.0252685546875, 1.0735015869140625, 1.121734619140625, 1.1699676513671875, 1.21820068359375, 1.2664337158203125, 1.314666748046875, 1.3628997802734375, 1.4111328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 10.0, 21.0, 33.0, 40.0, 65.0, 81.0, 99.0, 119.0, 128.0, 110.0, 92.0, 71.0, 42.0, 33.0, 14.0, 7.0, 12.0, 8.0, 2.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.572265625, -0.5564537048339844, -0.5406417846679688, -0.5248298645019531, -0.5090179443359375, -0.4932060241699219, -0.47739410400390625, -0.4615821838378906, -0.445770263671875, -0.4299583435058594, -0.41414642333984375, -0.3983345031738281, -0.3825225830078125, -0.3667106628417969, -0.35089874267578125, -0.3350868225097656, -0.31927490234375, -0.3034629821777344, -0.28765106201171875, -0.2718391418457031, -0.2560272216796875, -0.24021530151367188, -0.22440338134765625, -0.20859146118164062, -0.192779541015625, -0.17696762084960938, -0.16115570068359375, -0.14534378051757812, -0.1295318603515625, -0.11371994018554688, -0.09790802001953125, -0.08209609985351562, -0.0662841796875, -0.050472259521484375, -0.03466033935546875, -0.018848419189453125, -0.0030364990234375, 0.012775421142578125, 0.02858734130859375, 0.044399261474609375, 0.060211181640625, 0.07602310180664062, 0.09183502197265625, 0.10764694213867188, 0.1234588623046875, 0.13927078247070312, 0.15508270263671875, 0.17089462280273438, 0.18670654296875, 0.20251846313476562, 0.21833038330078125, 0.23414230346679688, 0.2499542236328125, 0.2657661437988281, 0.28157806396484375, 0.2973899841308594, 0.313201904296875, 0.3290138244628906, 0.34482574462890625, 0.3606376647949219, 0.3764495849609375, 0.3922615051269531, 0.40807342529296875, 0.4238853454589844, 0.439697265625]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 5.0, 11.0, 16.0, 10.0, 12.0, 20.0, 24.0, 28.0, 30.0, 51.0, 94.0, 82.0, 85.0, 80.0, 82.0, 90.0, 56.0, 53.0, 32.0, 30.0, 19.0, 18.0, 13.0, 19.0, 6.0, 2.0, 4.0, 8.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.250214099884033, -5.0959577560424805, -4.941701412200928, -4.787445068359375, -4.633188247680664, -4.478931903839111, -4.324675559997559, -4.170419216156006, -4.016162872314453, -3.8619065284729004, -3.7076501846313477, -3.553393602371216, -3.399137258529663, -3.2448809146881104, -3.0906243324279785, -2.936367988586426, -2.782111644744873, -2.6278553009033203, -2.4735989570617676, -2.3193423748016357, -2.165086030960083, -2.0108296871185303, -1.856573224067688, -1.7023167610168457, -1.548060417175293, -1.3938040733337402, -1.239547610282898, -1.0852911472320557, -0.9310348033905029, -0.7767783999443054, -0.6225219964981079, -0.4682655334472656, -0.3140096664428711, -0.15975326299667358, -0.005496859550476074, 0.14875954389572144, 0.30301594734191895, 0.45727235078811646, 0.611528754234314, 0.7657852172851562, 0.920041561126709, 1.0742979049682617, 1.228554368019104, 1.3828108310699463, 1.537067174911499, 1.6913235187530518, 1.845579981803894, 1.9998364448547363, 2.154092788696289, 2.308349132537842, 2.4626054763793945, 2.6168620586395264, 2.771118402481079, 2.925374746322632, 3.0796313285827637, 3.2338876724243164, 3.388144016265869, 3.542400360107422, 3.6966567039489746, 3.8509132862091064, 4.005169868469238, 4.159426212310791, 4.313682556152344, 4.4679388999938965, 4.622195243835449]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 4.0, 11.0, 9.0, 12.0, 13.0, 13.0, 16.0, 21.0, 13.0, 32.0, 19.0, 25.0, 33.0, 34.0, 48.0, 39.0, 33.0, 54.0, 42.0, 41.0, 39.0, 36.0, 52.0, 29.0, 30.0, 29.0, 32.0, 34.0, 15.0, 24.0, 24.0, 19.0, 26.0, 15.0, 13.0, 14.0, 6.0, 7.0, 5.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0121726989746094, -1.9477243423461914, -1.8832759857177734, -1.8188276290893555, -1.7543792724609375, -1.6899309158325195, -1.6254825592041016, -1.5610342025756836, -1.4965858459472656, -1.4321374893188477, -1.3676891326904297, -1.3032407760620117, -1.2387924194335938, -1.1743440628051758, -1.1098957061767578, -1.0454473495483398, -0.9809989929199219, -0.9165506362915039, -0.8521022796630859, -0.787653923034668, -0.72320556640625, -0.658757209777832, -0.5943088531494141, -0.5298604965209961, -0.4654121398925781, -0.40096378326416016, -0.3365154266357422, -0.2720670700073242, -0.20761871337890625, -0.14317035675048828, -0.07872200012207031, -0.014273643493652344, 0.050174713134765625, 0.1146230697631836, 0.17907142639160156, 0.24351978302001953, 0.3079681396484375, 0.37241649627685547, 0.43686485290527344, 0.5013132095336914, 0.5657615661621094, 0.6302099227905273, 0.6946582794189453, 0.7591066360473633, 0.8235549926757812, 0.8880033493041992, 0.9524517059326172, 1.0169000625610352, 1.0813484191894531, 1.145796775817871, 1.210245132446289, 1.274693489074707, 1.339141845703125, 1.403590202331543, 1.468038558959961, 1.532486915588379, 1.5969352722167969, 1.6613836288452148, 1.7258319854736328, 1.7902803421020508, 1.8547286987304688, 1.9191770553588867, 1.9836254119873047, 2.0480737686157227, 2.1125221252441406]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 5.0, 4.0, 10.0, 10.0, 17.0, 17.0, 27.0, 38.0, 51.0, 86.0, 110.0, 117.0, 141.0, 238.0, 343.0, 477.0, 679.0, 1066.0, 1730.0, 3035.0, 5162.0, 10190.0, 20268.0, 43262.0, 91155.0, 171527.0, 237870.0, 211380.0, 126654.0, 62033.0, 29181.0, 14162.0, 7325.0, 3807.0, 2297.0, 1312.0, 884.0, 546.0, 365.0, 259.0, 177.0, 148.0, 87.0, 68.0, 60.0, 42.0, 29.0, 27.0, 23.0, 16.0, 10.0, 12.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.021484375, -2.919891357421875, -2.81829833984375, -2.716705322265625, -2.6151123046875, -2.513519287109375, -2.41192626953125, -2.310333251953125, -2.208740234375, -2.107147216796875, -2.00555419921875, -1.903961181640625, -1.8023681640625, -1.700775146484375, -1.59918212890625, -1.497589111328125, -1.39599609375, -1.294403076171875, -1.19281005859375, -1.091217041015625, -0.9896240234375, -0.888031005859375, -0.78643798828125, -0.684844970703125, -0.583251953125, -0.481658935546875, -0.38006591796875, -0.278472900390625, -0.1768798828125, -0.075286865234375, 0.02630615234375, 0.127899169921875, 0.2294921875, 0.331085205078125, 0.43267822265625, 0.534271240234375, 0.6358642578125, 0.737457275390625, 0.83905029296875, 0.940643310546875, 1.042236328125, 1.143829345703125, 1.24542236328125, 1.347015380859375, 1.4486083984375, 1.550201416015625, 1.65179443359375, 1.753387451171875, 1.85498046875, 1.956573486328125, 2.05816650390625, 2.159759521484375, 2.2613525390625, 2.362945556640625, 2.46453857421875, 2.566131591796875, 2.667724609375, 2.769317626953125, 2.87091064453125, 2.972503662109375, 3.0740966796875, 3.175689697265625, 3.27728271484375, 3.378875732421875, 3.48046875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 6.0, 7.0, 8.0, 9.0, 3.0, 15.0, 7.0, 9.0, 18.0, 18.0, 22.0, 23.0, 24.0, 29.0, 27.0, 36.0, 48.0, 37.0, 37.0, 39.0, 41.0, 37.0, 37.0, 45.0, 41.0, 36.0, 33.0, 38.0, 20.0, 27.0, 29.0, 26.0, 23.0, 18.0, 24.0, 25.0, 14.0, 11.0, 8.0, 4.0, 10.0, 5.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.095703125, -2.025115966796875, -1.95452880859375, -1.883941650390625, -1.8133544921875, -1.742767333984375, -1.67218017578125, -1.601593017578125, -1.531005859375, -1.460418701171875, -1.38983154296875, -1.319244384765625, -1.2486572265625, -1.178070068359375, -1.10748291015625, -1.036895751953125, -0.96630859375, -0.895721435546875, -0.82513427734375, -0.754547119140625, -0.6839599609375, -0.613372802734375, -0.54278564453125, -0.472198486328125, -0.401611328125, -0.331024169921875, -0.26043701171875, -0.189849853515625, -0.1192626953125, -0.048675537109375, 0.02191162109375, 0.092498779296875, 0.1630859375, 0.233673095703125, 0.30426025390625, 0.374847412109375, 0.4454345703125, 0.516021728515625, 0.58660888671875, 0.657196044921875, 0.727783203125, 0.798370361328125, 0.86895751953125, 0.939544677734375, 1.0101318359375, 1.080718994140625, 1.15130615234375, 1.221893310546875, 1.29248046875, 1.363067626953125, 1.43365478515625, 1.504241943359375, 1.5748291015625, 1.645416259765625, 1.71600341796875, 1.786590576171875, 1.857177734375, 1.927764892578125, 1.99835205078125, 2.068939208984375, 2.1395263671875, 2.210113525390625, 2.28070068359375, 2.351287841796875, 2.421875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 6.0, 7.0, 8.0, 12.0, 12.0, 14.0, 16.0, 32.0, 26.0, 58.0, 54.0, 79.0, 108.0, 166.0, 226.0, 374.0, 574.0, 1111.0, 2544.0, 7025.0, 22942.0, 83957.0, 268342.0, 392354.0, 190522.0, 53865.0, 14945.0, 4848.0, 1897.0, 895.0, 490.0, 309.0, 196.0, 145.0, 96.0, 82.0, 46.0, 41.0, 28.0, 26.0, 20.0, 16.0, 11.0, 9.0, 9.0, 9.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.73828125, -5.560791015625, -5.38330078125, -5.205810546875, -5.0283203125, -4.850830078125, -4.67333984375, -4.495849609375, -4.318359375, -4.140869140625, -3.96337890625, -3.785888671875, -3.6083984375, -3.430908203125, -3.25341796875, -3.075927734375, -2.8984375, -2.720947265625, -2.54345703125, -2.365966796875, -2.1884765625, -2.010986328125, -1.83349609375, -1.656005859375, -1.478515625, -1.301025390625, -1.12353515625, -0.946044921875, -0.7685546875, -0.591064453125, -0.41357421875, -0.236083984375, -0.05859375, 0.118896484375, 0.29638671875, 0.473876953125, 0.6513671875, 0.828857421875, 1.00634765625, 1.183837890625, 1.361328125, 1.538818359375, 1.71630859375, 1.893798828125, 2.0712890625, 2.248779296875, 2.42626953125, 2.603759765625, 2.78125, 2.958740234375, 3.13623046875, 3.313720703125, 3.4912109375, 3.668701171875, 3.84619140625, 4.023681640625, 4.201171875, 4.378662109375, 4.55615234375, 4.733642578125, 4.9111328125, 5.088623046875, 5.26611328125, 5.443603515625, 5.62109375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 14.0, 5.0, 8.0, 18.0, 19.0, 17.0, 35.0, 25.0, 22.0, 26.0, 30.0, 34.0, 44.0, 37.0, 38.0, 26.0, 40.0, 40.0, 40.0, 32.0, 38.0, 40.0, 44.0, 37.0, 26.0, 31.0, 41.0, 26.0, 19.0, 23.0, 17.0, 14.0, 16.0, 16.0, 7.0, 6.0, 9.0, 3.0, 9.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.373046875, -1.329925537109375, -1.28680419921875, -1.243682861328125, -1.2005615234375, -1.157440185546875, -1.11431884765625, -1.071197509765625, -1.028076171875, -0.984954833984375, -0.94183349609375, -0.898712158203125, -0.8555908203125, -0.812469482421875, -0.76934814453125, -0.726226806640625, -0.68310546875, -0.639984130859375, -0.59686279296875, -0.553741455078125, -0.5106201171875, -0.467498779296875, -0.42437744140625, -0.381256103515625, -0.338134765625, -0.295013427734375, -0.25189208984375, -0.208770751953125, -0.1656494140625, -0.122528076171875, -0.07940673828125, -0.036285400390625, 0.0068359375, 0.049957275390625, 0.09307861328125, 0.136199951171875, 0.1793212890625, 0.222442626953125, 0.26556396484375, 0.308685302734375, 0.351806640625, 0.394927978515625, 0.43804931640625, 0.481170654296875, 0.5242919921875, 0.567413330078125, 0.61053466796875, 0.653656005859375, 0.69677734375, 0.739898681640625, 0.78302001953125, 0.826141357421875, 0.8692626953125, 0.912384033203125, 0.95550537109375, 0.998626708984375, 1.041748046875, 1.084869384765625, 1.12799072265625, 1.171112060546875, 1.2142333984375, 1.257354736328125, 1.30047607421875, 1.343597412109375, 1.38671875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 15.0, 15.0, 18.0, 33.0, 59.0, 70.0, 82.0, 140.0, 153.0, 260.0, 359.0, 508.0, 684.0, 956.0, 1342.0, 1896.0, 2672.0, 5128.0, 29890.0, 646243.0, 330245.0, 15281.0, 4087.0, 2387.0, 1698.0, 1214.0, 876.0, 640.0, 462.0, 339.0, 203.0, 167.0, 124.0, 84.0, 64.0, 41.0, 26.0, 24.0, 19.0, 6.0, 12.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.80126953125, -7.5400390625, -7.27880859375, -7.017578125, -6.75634765625, -6.4951171875, -6.23388671875, -5.97265625, -5.71142578125, -5.4501953125, -5.18896484375, -4.927734375, -4.66650390625, -4.4052734375, -4.14404296875, -3.8828125, -3.62158203125, -3.3603515625, -3.09912109375, -2.837890625, -2.57666015625, -2.3154296875, -2.05419921875, -1.79296875, -1.53173828125, -1.2705078125, -1.00927734375, -0.748046875, -0.48681640625, -0.2255859375, 0.03564453125, 0.296875, 0.55810546875, 0.8193359375, 1.08056640625, 1.341796875, 1.60302734375, 1.8642578125, 2.12548828125, 2.38671875, 2.64794921875, 2.9091796875, 3.17041015625, 3.431640625, 3.69287109375, 3.9541015625, 4.21533203125, 4.4765625, 4.73779296875, 4.9990234375, 5.26025390625, 5.521484375, 5.78271484375, 6.0439453125, 6.30517578125, 6.56640625, 6.82763671875, 7.0888671875, 7.35009765625, 7.611328125, 7.87255859375, 8.1337890625, 8.39501953125, 8.65625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 14.0, 35.0, 125.0, 360.0, 282.0, 119.0, 35.0, 11.0, 7.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004940032958984375, -0.0004703402519226074, -0.00044667720794677734, -0.00042301416397094727, -0.0003993511199951172, -0.0003756880760192871, -0.00035202503204345703, -0.00032836198806762695, -0.0003046989440917969, -0.0002810359001159668, -0.0002573728561401367, -0.00023370981216430664, -0.00021004676818847656, -0.00018638372421264648, -0.0001627206802368164, -0.00013905763626098633, -0.00011539459228515625, -9.173154830932617e-05, -6.80685043334961e-05, -4.4405460357666016e-05, -2.0742416381835938e-05, 2.9206275939941406e-06, 2.658367156982422e-05, 5.02467155456543e-05, 7.390975952148438e-05, 9.757280349731445e-05, 0.00012123584747314453, 0.0001448988914489746, 0.0001685619354248047, 0.00019222497940063477, 0.00021588802337646484, 0.00023955106735229492, 0.000263214111328125, 0.0002868771553039551, 0.00031054019927978516, 0.00033420324325561523, 0.0003578662872314453, 0.0003815293312072754, 0.00040519237518310547, 0.00042885541915893555, 0.0004525184631347656, 0.0004761815071105957, 0.0004998445510864258, 0.0005235075950622559, 0.0005471706390380859, 0.000570833683013916, 0.0005944967269897461, 0.0006181597709655762, 0.0006418228149414062, 0.0006654858589172363, 0.0006891489028930664, 0.0007128119468688965, 0.0007364749908447266, 0.0007601380348205566, 0.0007838010787963867, 0.0008074641227722168, 0.0008311271667480469, 0.000854790210723877, 0.000878453254699707, 0.0009021162986755371, 0.0009257793426513672, 0.0009494423866271973, 0.0009731054306030273, 0.0009967684745788574, 0.0010204315185546875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 12.0, 15.0, 21.0, 37.0, 54.0, 79.0, 88.0, 162.0, 198.0, 286.0, 369.0, 485.0, 657.0, 893.0, 1222.0, 1726.0, 2637.0, 5106.0, 23176.0, 222028.0, 649732.0, 113755.0, 13820.0, 3975.0, 2166.0, 1604.0, 1136.0, 853.0, 637.0, 450.0, 338.0, 232.0, 172.0, 105.0, 107.0, 67.0, 42.0, 46.0, 18.0, 13.0, 11.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.984375, -5.81512451171875, -5.6458740234375, -5.47662353515625, -5.307373046875, -5.13812255859375, -4.9688720703125, -4.79962158203125, -4.63037109375, -4.46112060546875, -4.2918701171875, -4.12261962890625, -3.953369140625, -3.78411865234375, -3.6148681640625, -3.44561767578125, -3.2763671875, -3.10711669921875, -2.9378662109375, -2.76861572265625, -2.599365234375, -2.43011474609375, -2.2608642578125, -2.09161376953125, -1.92236328125, -1.75311279296875, -1.5838623046875, -1.41461181640625, -1.245361328125, -1.07611083984375, -0.9068603515625, -0.73760986328125, -0.568359375, -0.39910888671875, -0.2298583984375, -0.06060791015625, 0.108642578125, 0.27789306640625, 0.4471435546875, 0.61639404296875, 0.78564453125, 0.95489501953125, 1.1241455078125, 1.29339599609375, 1.462646484375, 1.63189697265625, 1.8011474609375, 1.97039794921875, 2.1396484375, 2.30889892578125, 2.4781494140625, 2.64739990234375, 2.816650390625, 2.98590087890625, 3.1551513671875, 3.32440185546875, 3.49365234375, 3.66290283203125, 3.8321533203125, 4.00140380859375, 4.170654296875, 4.33990478515625, 4.5091552734375, 4.67840576171875, 4.84765625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 19.0, 68.0, 148.0, 272.0, 233.0, 137.0, 53.0, 24.0, 6.0, 5.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.486328125, -1.43988037109375, -1.3934326171875, -1.34698486328125, -1.300537109375, -1.25408935546875, -1.2076416015625, -1.16119384765625, -1.11474609375, -1.06829833984375, -1.0218505859375, -0.97540283203125, -0.928955078125, -0.88250732421875, -0.8360595703125, -0.78961181640625, -0.7431640625, -0.69671630859375, -0.6502685546875, -0.60382080078125, -0.557373046875, -0.51092529296875, -0.4644775390625, -0.41802978515625, -0.37158203125, -0.32513427734375, -0.2786865234375, -0.23223876953125, -0.185791015625, -0.13934326171875, -0.0928955078125, -0.04644775390625, 0.0, 0.04644775390625, 0.0928955078125, 0.13934326171875, 0.185791015625, 0.23223876953125, 0.2786865234375, 0.32513427734375, 0.37158203125, 0.41802978515625, 0.4644775390625, 0.51092529296875, 0.557373046875, 0.60382080078125, 0.6502685546875, 0.69671630859375, 0.7431640625, 0.78961181640625, 0.8360595703125, 0.88250732421875, 0.928955078125, 0.97540283203125, 1.0218505859375, 1.06829833984375, 1.11474609375, 1.16119384765625, 1.2076416015625, 1.25408935546875, 1.300537109375, 1.34698486328125, 1.3934326171875, 1.43988037109375, 1.486328125]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 6.0, 8.0, 10.0, 11.0, 12.0, 9.0, 17.0, 18.0, 21.0, 37.0, 40.0, 52.0, 69.0, 87.0, 92.0, 85.0, 83.0, 48.0, 56.0, 55.0, 40.0, 26.0, 23.0, 15.0, 16.0, 13.0, 5.0, 6.0, 2.0, 7.0, 5.0, 7.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5651140213012695, -4.420884609222412, -4.276655673980713, -4.1324262619018555, -3.988196849822998, -3.8439676761627197, -3.6997385025024414, -3.555509090423584, -3.4112799167633057, -3.2670507431030273, -3.12282133102417, -2.9785921573638916, -2.8343629837036133, -2.690133571624756, -2.5459043979644775, -2.401675224304199, -2.257445812225342, -2.1132166385650635, -1.968987226486206, -1.8247580528259277, -1.6805287599563599, -1.536299467086792, -1.3920702934265137, -1.2478410005569458, -1.103611707687378, -0.9593824148178101, -0.815153181552887, -0.6709239482879639, -0.526694655418396, -0.3824653625488281, -0.23823612928390503, -0.09400689601898193, 0.050221920013427734, 0.19445118308067322, 0.3386804461479187, 0.4829097092151642, 0.6271389722824097, 0.7713682651519775, 0.9155974984169006, 1.0598267316818237, 1.2040560245513916, 1.3482853174209595, 1.4925146102905273, 1.6367437839508057, 1.7809730768203735, 1.9252023696899414, 2.0694315433502197, 2.213660717010498, 2.3578901290893555, 2.502119302749634, 2.646348714828491, 2.7905778884887695, 2.934807300567627, 3.0790364742279053, 3.2232656478881836, 3.367495059967041, 3.5117242336273193, 3.6559534072875977, 3.800182819366455, 3.9444119930267334, 4.088641166687012, 4.232870578765869, 4.377099990844727, 4.521328926086426, 4.665558338165283]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 6.0, 7.0, 6.0, 10.0, 13.0, 9.0, 16.0, 24.0, 23.0, 37.0, 36.0, 41.0, 39.0, 40.0, 47.0, 46.0, 40.0, 51.0, 43.0, 52.0, 42.0, 33.0, 30.0, 38.0, 33.0, 43.0, 39.0, 25.0, 21.0, 14.0, 10.0, 15.0, 10.0, 10.0, 5.0, 2.0, 6.0, 9.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3335120677948, -2.2579541206359863, -2.182396173477173, -2.1068382263183594, -2.031280279159546, -1.9557222127914429, -1.8801642656326294, -1.8046061992645264, -1.729048252105713, -1.6534903049468994, -1.577932357788086, -1.5023744106292725, -1.4268163442611694, -1.351258397102356, -1.2757004499435425, -1.2001423835754395, -1.1245845556259155, -1.049026608467102, -0.9734686017036438, -0.8979106545448303, -0.8223526477813721, -0.7467947006225586, -0.6712367534637451, -0.5956787467002869, -0.5201207995414734, -0.4445628225803375, -0.36900484561920166, -0.2934468984603882, -0.21788892149925232, -0.14233094453811646, -0.06677299737930298, 0.008785009384155273, 0.08434295654296875, 0.15990093350410461, 0.23545889556407928, 0.31101685762405396, 0.3865748345851898, 0.4621328115463257, 0.5376907587051392, 0.6132487654685974, 0.6888067126274109, 0.7643646597862244, 0.8399226665496826, 0.9154806137084961, 0.9910385608673096, 1.066596508026123, 1.1421544551849365, 1.2177125215530396, 1.293270468711853, 1.3688284158706665, 1.44438636302948, 1.519944429397583, 1.5955023765563965, 1.67106032371521, 1.7466182708740234, 1.822176218032837, 1.8977341651916504, 1.9732921123504639, 2.0488500595092773, 2.124408006668091, 2.1999659538269043, 2.275524139404297, 2.3510818481445312, 2.426640033721924, 2.5021979808807373]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 10.0, 14.0, 22.0, 27.0, 41.0, 50.0, 79.0, 127.0, 200.0, 236.0, 329.0, 512.0, 799.0, 1172.0, 1687.0, 2741.0, 4271.0, 6970.0, 12204.0, 21805.0, 42820.0, 96989.0, 259892.0, 773099.0, 1490972.0, 936624.0, 321404.0, 113504.0, 48780.0, 23963.0, 13009.0, 7533.0, 4364.0, 2733.0, 1812.0, 1116.0, 744.0, 494.0, 345.0, 235.0, 152.0, 116.0, 86.0, 65.0, 44.0, 26.0, 14.0, 12.0, 12.0, 11.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.421875, -4.28192138671875, -4.1419677734375, -4.00201416015625, -3.862060546875, -3.72210693359375, -3.5821533203125, -3.44219970703125, -3.30224609375, -3.16229248046875, -3.0223388671875, -2.88238525390625, -2.742431640625, -2.60247802734375, -2.4625244140625, -2.32257080078125, -2.1826171875, -2.04266357421875, -1.9027099609375, -1.76275634765625, -1.622802734375, -1.48284912109375, -1.3428955078125, -1.20294189453125, -1.06298828125, -0.92303466796875, -0.7830810546875, -0.64312744140625, -0.503173828125, -0.36322021484375, -0.2232666015625, -0.08331298828125, 0.056640625, 0.19659423828125, 0.3365478515625, 0.47650146484375, 0.616455078125, 0.75640869140625, 0.8963623046875, 1.03631591796875, 1.17626953125, 1.31622314453125, 1.4561767578125, 1.59613037109375, 1.736083984375, 1.87603759765625, 2.0159912109375, 2.15594482421875, 2.2958984375, 2.43585205078125, 2.5758056640625, 2.71575927734375, 2.855712890625, 2.99566650390625, 3.1356201171875, 3.27557373046875, 3.41552734375, 3.55548095703125, 3.6954345703125, 3.83538818359375, 3.975341796875, 4.11529541015625, 4.2552490234375, 4.39520263671875, 4.53515625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 4.0, 8.0, 8.0, 7.0, 1.0, 9.0, 10.0, 13.0, 17.0, 19.0, 26.0, 34.0, 30.0, 27.0, 37.0, 35.0, 38.0, 43.0, 39.0, 50.0, 50.0, 40.0, 49.0, 52.0, 37.0, 25.0, 43.0, 35.0, 39.0, 27.0, 17.0, 22.0, 25.0, 20.0, 12.0, 13.0, 3.0, 5.0, 6.0, 6.0, 3.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.8984375, -1.8424072265625, -1.786376953125, -1.7303466796875, -1.67431640625, -1.6182861328125, -1.562255859375, -1.5062255859375, -1.4501953125, -1.3941650390625, -1.338134765625, -1.2821044921875, -1.22607421875, -1.1700439453125, -1.114013671875, -1.0579833984375, -1.001953125, -0.9459228515625, -0.889892578125, -0.8338623046875, -0.77783203125, -0.7218017578125, -0.665771484375, -0.6097412109375, -0.5537109375, -0.4976806640625, -0.441650390625, -0.3856201171875, -0.32958984375, -0.2735595703125, -0.217529296875, -0.1614990234375, -0.10546875, -0.0494384765625, 0.006591796875, 0.0626220703125, 0.11865234375, 0.1746826171875, 0.230712890625, 0.2867431640625, 0.3427734375, 0.3988037109375, 0.454833984375, 0.5108642578125, 0.56689453125, 0.6229248046875, 0.678955078125, 0.7349853515625, 0.791015625, 0.8470458984375, 0.903076171875, 0.9591064453125, 1.01513671875, 1.0711669921875, 1.127197265625, 1.1832275390625, 1.2392578125, 1.2952880859375, 1.351318359375, 1.4073486328125, 1.46337890625, 1.5194091796875, 1.575439453125, 1.6314697265625, 1.6875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 17.0, 23.0, 34.0, 37.0, 67.0, 93.0, 173.0, 260.0, 346.0, 558.0, 840.0, 1287.0, 1943.0, 3213.0, 4937.0, 7990.0, 13867.0, 24041.0, 44763.0, 89408.0, 194271.0, 473730.0, 1112655.0, 1223215.0, 553470.0, 225318.0, 101636.0, 50751.0, 26775.0, 15051.0, 8864.0, 5411.0, 3296.0, 2120.0, 1354.0, 826.0, 581.0, 351.0, 251.0, 126.0, 106.0, 68.0, 61.0, 25.0, 29.0, 13.0, 9.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.43359375, -4.29541015625, -4.1572265625, -4.01904296875, -3.880859375, -3.74267578125, -3.6044921875, -3.46630859375, -3.328125, -3.18994140625, -3.0517578125, -2.91357421875, -2.775390625, -2.63720703125, -2.4990234375, -2.36083984375, -2.22265625, -2.08447265625, -1.9462890625, -1.80810546875, -1.669921875, -1.53173828125, -1.3935546875, -1.25537109375, -1.1171875, -0.97900390625, -0.8408203125, -0.70263671875, -0.564453125, -0.42626953125, -0.2880859375, -0.14990234375, -0.01171875, 0.12646484375, 0.2646484375, 0.40283203125, 0.541015625, 0.67919921875, 0.8173828125, 0.95556640625, 1.09375, 1.23193359375, 1.3701171875, 1.50830078125, 1.646484375, 1.78466796875, 1.9228515625, 2.06103515625, 2.19921875, 2.33740234375, 2.4755859375, 2.61376953125, 2.751953125, 2.89013671875, 3.0283203125, 3.16650390625, 3.3046875, 3.44287109375, 3.5810546875, 3.71923828125, 3.857421875, 3.99560546875, 4.1337890625, 4.27197265625, 4.41015625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 7.0, 10.0, 9.0, 9.0, 11.0, 15.0, 18.0, 22.0, 23.0, 38.0, 37.0, 43.0, 56.0, 61.0, 116.0, 119.0, 174.0, 229.0, 256.0, 344.0, 305.0, 330.0, 347.0, 291.0, 235.0, 227.0, 169.0, 112.0, 112.0, 89.0, 69.0, 39.0, 39.0, 31.0, 20.0, 18.0, 8.0, 14.0, 5.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.4453125, -1.4065399169921875, -1.367767333984375, -1.3289947509765625, -1.29022216796875, -1.2514495849609375, -1.212677001953125, -1.1739044189453125, -1.1351318359375, -1.0963592529296875, -1.057586669921875, -1.0188140869140625, -0.98004150390625, -0.9412689208984375, -0.902496337890625, -0.8637237548828125, -0.824951171875, -0.7861785888671875, -0.747406005859375, -0.7086334228515625, -0.66986083984375, -0.6310882568359375, -0.592315673828125, -0.5535430908203125, -0.5147705078125, -0.4759979248046875, -0.437225341796875, -0.3984527587890625, -0.35968017578125, -0.3209075927734375, -0.282135009765625, -0.2433624267578125, -0.20458984375, -0.1658172607421875, -0.127044677734375, -0.0882720947265625, -0.04949951171875, -0.0107269287109375, 0.028045654296875, 0.0668182373046875, 0.1055908203125, 0.1443634033203125, 0.183135986328125, 0.2219085693359375, 0.26068115234375, 0.2994537353515625, 0.338226318359375, 0.3769989013671875, 0.415771484375, 0.4545440673828125, 0.493316650390625, 0.5320892333984375, 0.57086181640625, 0.6096343994140625, 0.648406982421875, 0.6871795654296875, 0.7259521484375, 0.7647247314453125, 0.803497314453125, 0.8422698974609375, 0.88104248046875, 0.9198150634765625, 0.958587646484375, 0.9973602294921875, 1.0361328125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 5.0, 6.0, 4.0, 9.0, 15.0, 9.0, 14.0, 20.0, 18.0, 28.0, 53.0, 48.0, 70.0, 87.0, 114.0, 94.0, 80.0, 82.0, 67.0, 49.0, 34.0, 20.0, 15.0, 14.0, 14.0, 10.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.305171012878418, -5.121412754058838, -4.9376540184021, -4.7538957595825195, -4.570137023925781, -4.386378765106201, -4.202620506286621, -4.018861770629883, -3.8351032733917236, -3.6513447761535645, -3.4675862789154053, -3.283827781677246, -3.100069522857666, -2.9163107872009277, -2.7325525283813477, -2.5487940311431885, -2.3650355339050293, -2.18127703666687, -1.997518539428711, -1.8137601613998413, -1.6300016641616821, -1.446243166923523, -1.2624847888946533, -1.0787262916564941, -0.894967794418335, -0.7112092971801758, -0.5274508595466614, -0.343692421913147, -0.1599339246749878, 0.023824572563171387, 0.20758295059204102, 0.3913414478302002, 0.5750999450683594, 0.7588584423065186, 0.942616879940033, 1.1263753175735474, 1.3101338148117065, 1.4938923120498657, 1.6776506900787354, 1.8614091873168945, 2.0451676845550537, 2.228926181793213, 2.412684679031372, 2.5964431762695312, 2.7802014350891113, 2.9639601707458496, 3.1477184295654297, 3.331476926803589, 3.515235424041748, 3.6989939212799072, 3.8827524185180664, 4.0665106773376465, 4.250269412994385, 4.434027671813965, 4.617786407470703, 4.801544666290283, 4.985302925109863, 5.169061183929443, 5.352819919586182, 5.536578178405762, 5.7203369140625, 5.90409517288208, 6.08785343170166, 6.271612167358398, 6.455370903015137]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 2.0, 9.0, 9.0, 12.0, 9.0, 11.0, 5.0, 21.0, 16.0, 11.0, 15.0, 28.0, 15.0, 42.0, 29.0, 40.0, 29.0, 41.0, 41.0, 32.0, 38.0, 46.0, 36.0, 38.0, 38.0, 31.0, 37.0, 34.0, 29.0, 25.0, 25.0, 29.0, 25.0, 21.0, 27.0, 21.0, 7.0, 15.0, 9.0, 7.0, 8.0, 5.0, 6.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.196519613265991, -2.129795551300049, -2.0630717277526855, -1.9963477849960327, -1.9296238422393799, -1.862899899482727, -1.7961759567260742, -1.7294520139694214, -1.6627280712127686, -1.5960041284561157, -1.529280185699463, -1.46255624294281, -1.3958323001861572, -1.3291083574295044, -1.2623844146728516, -1.1956604719161987, -1.128936529159546, -1.062212586402893, -0.9954886436462402, -0.9287647008895874, -0.8620407581329346, -0.7953168153762817, -0.7285928726196289, -0.6618689298629761, -0.5951449871063232, -0.5284210443496704, -0.4616971015930176, -0.39497315883636475, -0.3282492160797119, -0.2615252733230591, -0.19480133056640625, -0.12807738780975342, -0.061353206634521484, 0.005370736122131348, 0.07209467887878418, 0.138818621635437, 0.20554256439208984, 0.2722665071487427, 0.3389904499053955, 0.40571439266204834, 0.47243833541870117, 0.539162278175354, 0.6058862209320068, 0.6726101636886597, 0.7393341064453125, 0.8060580492019653, 0.8727819919586182, 0.939505934715271, 1.0062298774719238, 1.0729538202285767, 1.1396777629852295, 1.2064017057418823, 1.2731256484985352, 1.339849591255188, 1.4065735340118408, 1.4732974767684937, 1.5400214195251465, 1.6067453622817993, 1.6734693050384521, 1.740193247795105, 1.8069171905517578, 1.8736411333084106, 1.9403650760650635, 2.007089138031006, 2.073812961578369]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 6.0, 13.0, 8.0, 14.0, 19.0, 33.0, 39.0, 52.0, 92.0, 152.0, 211.0, 327.0, 485.0, 752.0, 1167.0, 1844.0, 2992.0, 4804.0, 7988.0, 13506.0, 22796.0, 38128.0, 63871.0, 101515.0, 147450.0, 176596.0, 159855.0, 116070.0, 74852.0, 45438.0, 26931.0, 15928.0, 9351.0, 5738.0, 3398.0, 2143.0, 1367.0, 888.0, 565.0, 380.0, 249.0, 186.0, 104.0, 85.0, 52.0, 47.0, 26.0, 18.0, 13.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.275390625, -1.232391357421875, -1.18939208984375, -1.146392822265625, -1.1033935546875, -1.060394287109375, -1.01739501953125, -0.974395751953125, -0.931396484375, -0.888397216796875, -0.84539794921875, -0.802398681640625, -0.7593994140625, -0.716400146484375, -0.67340087890625, -0.630401611328125, -0.58740234375, -0.544403076171875, -0.50140380859375, -0.458404541015625, -0.4154052734375, -0.372406005859375, -0.32940673828125, -0.286407470703125, -0.243408203125, -0.200408935546875, -0.15740966796875, -0.114410400390625, -0.0714111328125, -0.028411865234375, 0.01458740234375, 0.057586669921875, 0.1005859375, 0.143585205078125, 0.18658447265625, 0.229583740234375, 0.2725830078125, 0.315582275390625, 0.35858154296875, 0.401580810546875, 0.444580078125, 0.487579345703125, 0.53057861328125, 0.573577880859375, 0.6165771484375, 0.659576416015625, 0.70257568359375, 0.745574951171875, 0.78857421875, 0.831573486328125, 0.87457275390625, 0.917572021484375, 0.9605712890625, 1.003570556640625, 1.04656982421875, 1.089569091796875, 1.132568359375, 1.175567626953125, 1.21856689453125, 1.261566162109375, 1.3045654296875, 1.347564697265625, 1.39056396484375, 1.433563232421875, 1.4765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 2.0, 2.0, 2.0, 7.0, 10.0, 5.0, 10.0, 11.0, 12.0, 20.0, 9.0, 16.0, 23.0, 29.0, 30.0, 41.0, 33.0, 41.0, 29.0, 40.0, 40.0, 41.0, 41.0, 48.0, 43.0, 25.0, 38.0, 32.0, 43.0, 32.0, 28.0, 32.0, 33.0, 23.0, 21.0, 13.0, 20.0, 17.0, 6.0, 10.0, 8.0, 8.0, 8.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.341796875, -2.26312255859375, -2.1844482421875, -2.10577392578125, -2.027099609375, -1.94842529296875, -1.8697509765625, -1.79107666015625, -1.71240234375, -1.63372802734375, -1.5550537109375, -1.47637939453125, -1.397705078125, -1.31903076171875, -1.2403564453125, -1.16168212890625, -1.0830078125, -1.00433349609375, -0.9256591796875, -0.84698486328125, -0.768310546875, -0.68963623046875, -0.6109619140625, -0.53228759765625, -0.45361328125, -0.37493896484375, -0.2962646484375, -0.21759033203125, -0.138916015625, -0.06024169921875, 0.0184326171875, 0.09710693359375, 0.17578125, 0.25445556640625, 0.3331298828125, 0.41180419921875, 0.490478515625, 0.56915283203125, 0.6478271484375, 0.72650146484375, 0.80517578125, 0.88385009765625, 0.9625244140625, 1.04119873046875, 1.119873046875, 1.19854736328125, 1.2772216796875, 1.35589599609375, 1.4345703125, 1.51324462890625, 1.5919189453125, 1.67059326171875, 1.749267578125, 1.82794189453125, 1.9066162109375, 1.98529052734375, 2.06396484375, 2.14263916015625, 2.2213134765625, 2.29998779296875, 2.378662109375, 2.45733642578125, 2.5360107421875, 2.61468505859375, 2.693359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 12.0, 18.0, 30.0, 47.0, 59.0, 71.0, 105.0, 175.0, 283.0, 395.0, 666.0, 1028.0, 1521.0, 2429.0, 3941.0, 6661.0, 11105.0, 18817.0, 32862.0, 59243.0, 104756.0, 175690.0, 223606.0, 170880.0, 100598.0, 56842.0, 31578.0, 18182.0, 10521.0, 6192.0, 3799.0, 2311.0, 1498.0, 912.0, 593.0, 361.0, 230.0, 163.0, 111.0, 77.0, 56.0, 39.0, 22.0, 32.0, 13.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0], "bins": [-2.177734375, -2.1163330078125, -2.054931640625, -1.9935302734375, -1.93212890625, -1.8707275390625, -1.809326171875, -1.7479248046875, -1.6865234375, -1.6251220703125, -1.563720703125, -1.5023193359375, -1.44091796875, -1.3795166015625, -1.318115234375, -1.2567138671875, -1.1953125, -1.1339111328125, -1.072509765625, -1.0111083984375, -0.94970703125, -0.8883056640625, -0.826904296875, -0.7655029296875, -0.7041015625, -0.6427001953125, -0.581298828125, -0.5198974609375, -0.45849609375, -0.3970947265625, -0.335693359375, -0.2742919921875, -0.212890625, -0.1514892578125, -0.090087890625, -0.0286865234375, 0.03271484375, 0.0941162109375, 0.155517578125, 0.2169189453125, 0.2783203125, 0.3397216796875, 0.401123046875, 0.4625244140625, 0.52392578125, 0.5853271484375, 0.646728515625, 0.7081298828125, 0.76953125, 0.8309326171875, 0.892333984375, 0.9537353515625, 1.01513671875, 1.0765380859375, 1.137939453125, 1.1993408203125, 1.2607421875, 1.3221435546875, 1.383544921875, 1.4449462890625, 1.50634765625, 1.5677490234375, 1.629150390625, 1.6905517578125, 1.751953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 10.0, 19.0, 12.0, 12.0, 23.0, 19.0, 21.0, 31.0, 26.0, 29.0, 36.0, 34.0, 47.0, 37.0, 42.0, 43.0, 47.0, 43.0, 42.0, 46.0, 43.0, 34.0, 41.0, 39.0, 27.0, 33.0, 27.0, 17.0, 19.0, 24.0, 15.0, 12.0, 8.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6181640625, -1.5682220458984375, -1.518280029296875, -1.4683380126953125, -1.41839599609375, -1.3684539794921875, -1.318511962890625, -1.2685699462890625, -1.2186279296875, -1.1686859130859375, -1.118743896484375, -1.0688018798828125, -1.01885986328125, -0.9689178466796875, -0.918975830078125, -0.8690338134765625, -0.819091796875, -0.7691497802734375, -0.719207763671875, -0.6692657470703125, -0.61932373046875, -0.5693817138671875, -0.519439697265625, -0.4694976806640625, -0.4195556640625, -0.3696136474609375, -0.319671630859375, -0.2697296142578125, -0.21978759765625, -0.1698455810546875, -0.119903564453125, -0.0699615478515625, -0.02001953125, 0.0299224853515625, 0.079864501953125, 0.1298065185546875, 0.17974853515625, 0.2296905517578125, 0.279632568359375, 0.3295745849609375, 0.3795166015625, 0.4294586181640625, 0.479400634765625, 0.5293426513671875, 0.57928466796875, 0.6292266845703125, 0.679168701171875, 0.7291107177734375, 0.779052734375, 0.8289947509765625, 0.878936767578125, 0.9288787841796875, 0.97882080078125, 1.0287628173828125, 1.078704833984375, 1.1286468505859375, 1.1785888671875, 1.2285308837890625, 1.278472900390625, 1.3284149169921875, 1.37835693359375, 1.4282989501953125, 1.478240966796875, 1.5281829833984375, 1.578125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 2.0, 9.0, 9.0, 7.0, 19.0, 26.0, 44.0, 53.0, 78.0, 105.0, 173.0, 252.0, 409.0, 641.0, 1067.0, 1704.0, 3017.0, 5186.0, 9448.0, 17829.0, 35635.0, 72871.0, 148866.0, 255185.0, 236320.0, 129870.0, 63173.0, 30868.0, 15912.0, 8389.0, 4518.0, 2635.0, 1576.0, 939.0, 615.0, 386.0, 227.0, 174.0, 116.0, 61.0, 42.0, 32.0, 19.0, 11.0, 18.0, 6.0, 7.0, 3.0, 5.0, 0.0, 2.0, 3.0, 1.0], "bins": [-1.072265625, -1.0415420532226562, -1.0108184814453125, -0.9800949096679688, -0.949371337890625, -0.9186477661132812, -0.8879241943359375, -0.8572006225585938, -0.82647705078125, -0.7957534790039062, -0.7650299072265625, -0.7343063354492188, -0.703582763671875, -0.6728591918945312, -0.6421356201171875, -0.6114120483398438, -0.5806884765625, -0.5499649047851562, -0.5192413330078125, -0.48851776123046875, -0.457794189453125, -0.42707061767578125, -0.3963470458984375, -0.36562347412109375, -0.33489990234375, -0.30417633056640625, -0.2734527587890625, -0.24272918701171875, -0.212005615234375, -0.18128204345703125, -0.1505584716796875, -0.11983489990234375, -0.089111328125, -0.05838775634765625, -0.0276641845703125, 0.00305938720703125, 0.033782958984375, 0.06450653076171875, 0.0952301025390625, 0.12595367431640625, 0.15667724609375, 0.18740081787109375, 0.2181243896484375, 0.24884796142578125, 0.279571533203125, 0.31029510498046875, 0.3410186767578125, 0.37174224853515625, 0.4024658203125, 0.43318939208984375, 0.4639129638671875, 0.49463653564453125, 0.525360107421875, 0.5560836791992188, 0.5868072509765625, 0.6175308227539062, 0.64825439453125, 0.6789779663085938, 0.7097015380859375, 0.7404251098632812, 0.771148681640625, 0.8018722534179688, 0.8325958251953125, 0.8633193969726562, 0.89404296875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 5.0, 11.0, 7.0, 6.0, 16.0, 18.0, 22.0, 24.0, 32.0, 27.0, 38.0, 47.0, 49.0, 41.0, 52.0, 48.0, 49.0, 63.0, 48.0, 56.0, 48.0, 38.0, 39.0, 34.0, 20.0, 25.0, 25.0, 17.0, 16.0, 9.0, 9.0, 7.0, 4.0, 4.0, 7.0, 3.0, 7.0, 3.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.403425216674805e-05, -3.2986514270305634e-05, -3.193877637386322e-05, -3.089103847742081e-05, -2.9843300580978394e-05, -2.879556268453598e-05, -2.7747824788093567e-05, -2.6700086891651154e-05, -2.565234899520874e-05, -2.4604611098766327e-05, -2.3556873202323914e-05, -2.25091353058815e-05, -2.1461397409439087e-05, -2.0413659512996674e-05, -1.936592161655426e-05, -1.8318183720111847e-05, -1.7270445823669434e-05, -1.622270792722702e-05, -1.5174970030784607e-05, -1.4127232134342194e-05, -1.307949423789978e-05, -1.2031756341457367e-05, -1.0984018445014954e-05, -9.93628054857254e-06, -8.888542652130127e-06, -7.840804755687714e-06, -6.7930668592453e-06, -5.745328962802887e-06, -4.697591066360474e-06, -3.6498531699180603e-06, -2.602115273475647e-06, -1.5543773770332336e-06, -5.066394805908203e-07, 5.41098415851593e-07, 1.5888363122940063e-06, 2.6365742087364197e-06, 3.684312105178833e-06, 4.732050001621246e-06, 5.77978789806366e-06, 6.827525794506073e-06, 7.875263690948486e-06, 8.9230015873909e-06, 9.970739483833313e-06, 1.1018477380275726e-05, 1.206621527671814e-05, 1.3113953173160553e-05, 1.4161691069602966e-05, 1.520942896604538e-05, 1.6257166862487793e-05, 1.7304904758930206e-05, 1.835264265537262e-05, 1.9400380551815033e-05, 2.0448118448257446e-05, 2.149585634469986e-05, 2.2543594241142273e-05, 2.3591332137584686e-05, 2.46390700340271e-05, 2.5686807930469513e-05, 2.6734545826911926e-05, 2.778228372335434e-05, 2.8830021619796753e-05, 2.9877759516239166e-05, 3.092549741268158e-05, 3.197323530912399e-05, 3.3020973205566406e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 10.0, 16.0, 29.0, 43.0, 65.0, 94.0, 118.0, 189.0, 327.0, 442.0, 784.0, 1069.0, 1642.0, 2452.0, 4033.0, 6280.0, 9955.0, 16278.0, 26101.0, 42756.0, 69272.0, 105356.0, 145060.0, 164909.0, 149266.0, 109645.0, 72729.0, 45253.0, 27882.0, 17230.0, 10631.0, 6713.0, 4154.0, 2756.0, 1755.0, 1113.0, 707.0, 465.0, 320.0, 185.0, 151.0, 106.0, 70.0, 37.0, 25.0, 25.0, 16.0, 4.0, 8.0, 9.0, 3.0, 2.0, 2.0], "bins": [-0.6728515625, -0.65338134765625, -0.6339111328125, -0.61444091796875, -0.594970703125, -0.57550048828125, -0.5560302734375, -0.53656005859375, -0.51708984375, -0.49761962890625, -0.4781494140625, -0.45867919921875, -0.439208984375, -0.41973876953125, -0.4002685546875, -0.38079833984375, -0.361328125, -0.34185791015625, -0.3223876953125, -0.30291748046875, -0.283447265625, -0.26397705078125, -0.2445068359375, -0.22503662109375, -0.20556640625, -0.18609619140625, -0.1666259765625, -0.14715576171875, -0.127685546875, -0.10821533203125, -0.0887451171875, -0.06927490234375, -0.0498046875, -0.03033447265625, -0.0108642578125, 0.00860595703125, 0.028076171875, 0.04754638671875, 0.0670166015625, 0.08648681640625, 0.10595703125, 0.12542724609375, 0.1448974609375, 0.16436767578125, 0.183837890625, 0.20330810546875, 0.2227783203125, 0.24224853515625, 0.26171875, 0.28118896484375, 0.3006591796875, 0.32012939453125, 0.339599609375, 0.35906982421875, 0.3785400390625, 0.39801025390625, 0.41748046875, 0.43695068359375, 0.4564208984375, 0.47589111328125, 0.495361328125, 0.51483154296875, 0.5343017578125, 0.55377197265625, 0.5732421875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 2.0, 9.0, 10.0, 7.0, 9.0, 18.0, 24.0, 25.0, 30.0, 29.0, 27.0, 33.0, 35.0, 40.0, 36.0, 49.0, 53.0, 46.0, 50.0, 44.0, 50.0, 48.0, 48.0, 42.0, 40.0, 29.0, 20.0, 32.0, 16.0, 10.0, 16.0, 10.0, 8.0, 11.0, 10.0, 5.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1639404296875, -0.15859031677246094, -0.15324020385742188, -0.1478900909423828, -0.14253997802734375, -0.1371898651123047, -0.13183975219726562, -0.12648963928222656, -0.1211395263671875, -0.11578941345214844, -0.11043930053710938, -0.10508918762207031, -0.09973907470703125, -0.09438896179199219, -0.08903884887695312, -0.08368873596191406, -0.078338623046875, -0.07298851013183594, -0.06763839721679688, -0.06228828430175781, -0.05693817138671875, -0.05158805847167969, -0.046237945556640625, -0.04088783264160156, -0.0355377197265625, -0.030187606811523438, -0.024837493896484375, -0.019487380981445312, -0.01413726806640625, -0.008787155151367188, -0.003437042236328125, 0.0019130706787109375, 0.00726318359375, 0.012613296508789062, 0.017963409423828125, 0.023313522338867188, 0.02866363525390625, 0.03401374816894531, 0.039363861083984375, 0.04471397399902344, 0.0500640869140625, 0.05541419982910156, 0.060764312744140625, 0.06611442565917969, 0.07146453857421875, 0.07681465148925781, 0.08216476440429688, 0.08751487731933594, 0.092864990234375, 0.09821510314941406, 0.10356521606445312, 0.10891532897949219, 0.11426544189453125, 0.11961555480957031, 0.12496566772460938, 0.13031578063964844, 0.1356658935546875, 0.14101600646972656, 0.14636611938476562, 0.1517162322998047, 0.15706634521484375, 0.1624164581298828, 0.16776657104492188, 0.17311668395996094, 0.178466796875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 5.0, 7.0, 9.0, 10.0, 10.0, 12.0, 20.0, 16.0, 21.0, 31.0, 54.0, 57.0, 76.0, 96.0, 109.0, 83.0, 81.0, 81.0, 64.0, 46.0, 27.0, 17.0, 13.0, 12.0, 17.0, 6.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.372339725494385, -5.190568447113037, -5.008797645568848, -4.8270263671875, -4.645255088806152, -4.463484287261963, -4.281713008880615, -4.099942207336426, -3.918170928955078, -3.7363998889923096, -3.554628849029541, -3.3728575706481934, -3.191086530685425, -3.0093154907226562, -2.8275442123413086, -2.64577317237854, -2.4640021324157715, -2.282231092453003, -2.1004600524902344, -1.9186887741088867, -1.7369177341461182, -1.5551466941833496, -1.3733755350112915, -1.1916043758392334, -1.0098333358764648, -0.8280622363090515, -0.6462911367416382, -0.46452003717422485, -0.2827489376068115, -0.1009778380393982, 0.08079326152801514, 0.26256442070007324, 0.4443359375, 0.6261070370674133, 0.8078781366348267, 0.98964923620224, 1.1714203357696533, 1.3531913757324219, 1.53496253490448, 1.716733694076538, 1.8985047340393066, 2.080275774002075, 2.2620468139648438, 2.4438180923461914, 2.62558913230896, 2.8073601722717285, 2.989131450653076, 3.1709024906158447, 3.3526735305786133, 3.534444570541382, 3.7162156105041504, 3.897986888885498, 4.0797576904296875, 4.261528968811035, 4.443300247192383, 4.6250715255737305, 4.80684232711792, 4.988613605499268, 5.170384407043457, 5.352155685424805, 5.533926963806152, 5.715697765350342, 5.8974690437316895, 6.079239845275879, 6.261011123657227]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 6.0, 3.0, 5.0, 8.0, 11.0, 10.0, 11.0, 11.0, 9.0, 20.0, 11.0, 19.0, 22.0, 20.0, 24.0, 40.0, 30.0, 38.0, 39.0, 34.0, 38.0, 40.0, 45.0, 34.0, 41.0, 44.0, 31.0, 35.0, 37.0, 31.0, 23.0, 29.0, 29.0, 23.0, 24.0, 22.0, 24.0, 15.0, 8.0, 13.0, 8.0, 7.0, 4.0, 7.0, 8.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.2398760318756104, -2.172515869140625, -2.1051554679870605, -2.037795305252075, -1.9704349040985107, -1.9030747413635254, -1.8357144594192505, -1.7683541774749756, -1.7009938955307007, -1.6336336135864258, -1.5662733316421509, -1.498913049697876, -1.4315528869628906, -1.3641924858093262, -1.2968323230743408, -1.229472041130066, -1.162111759185791, -1.0947514772415161, -1.0273911952972412, -0.9600309729576111, -0.8926706910133362, -0.8253104090690613, -0.7579501867294312, -0.6905899047851562, -0.6232296228408813, -0.5558693408966064, -0.48850908875465393, -0.4211488366127014, -0.3537885546684265, -0.2864282727241516, -0.2190680205821991, -0.15170776844024658, -0.08434772491455078, -0.016987457871437073, 0.050372809171676636, 0.11773307621479034, 0.18509334325790405, 0.25245362520217896, 0.31981387734413147, 0.387174129486084, 0.4545344114303589, 0.5218946933746338, 0.5892549753189087, 0.6566151976585388, 0.7239754796028137, 0.7913357615470886, 0.8586959838867188, 0.9260562658309937, 0.9934165477752686, 1.0607768297195435, 1.1281371116638184, 1.1954973936080933, 1.2628576755523682, 1.3302178382873535, 1.3975781202316284, 1.4649384021759033, 1.5322986841201782, 1.5996589660644531, 1.667019248008728, 1.734379529953003, 1.8017396926879883, 1.8691000938415527, 1.936460256576538, 2.0038204193115234, 2.071180820465088]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 3.0, 4.0, 10.0, 17.0, 18.0, 29.0, 26.0, 50.0, 64.0, 113.0, 174.0, 242.0, 369.0, 548.0, 864.0, 1386.0, 2143.0, 3369.0, 5240.0, 8687.0, 14063.0, 23336.0, 38441.0, 61782.0, 94571.0, 133030.0, 158621.0, 154403.0, 122135.0, 84094.0, 54217.0, 33342.0, 20316.0, 12308.0, 7403.0, 4768.0, 2959.0, 1873.0, 1209.0, 801.0, 505.0, 349.0, 217.0, 161.0, 96.0, 67.0, 42.0, 38.0, 14.0, 11.0, 11.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.974609375, -1.908477783203125, -1.84234619140625, -1.776214599609375, -1.7100830078125, -1.643951416015625, -1.57781982421875, -1.511688232421875, -1.445556640625, -1.379425048828125, -1.31329345703125, -1.247161865234375, -1.1810302734375, -1.114898681640625, -1.04876708984375, -0.982635498046875, -0.91650390625, -0.850372314453125, -0.78424072265625, -0.718109130859375, -0.6519775390625, -0.585845947265625, -0.51971435546875, -0.453582763671875, -0.387451171875, -0.321319580078125, -0.25518798828125, -0.189056396484375, -0.1229248046875, -0.056793212890625, 0.00933837890625, 0.075469970703125, 0.1416015625, 0.207733154296875, 0.27386474609375, 0.339996337890625, 0.4061279296875, 0.472259521484375, 0.53839111328125, 0.604522705078125, 0.670654296875, 0.736785888671875, 0.80291748046875, 0.869049072265625, 0.9351806640625, 1.001312255859375, 1.06744384765625, 1.133575439453125, 1.19970703125, 1.265838623046875, 1.33197021484375, 1.398101806640625, 1.4642333984375, 1.530364990234375, 1.59649658203125, 1.662628173828125, 1.728759765625, 1.794891357421875, 1.86102294921875, 1.927154541015625, 1.9932861328125, 2.059417724609375, 2.12554931640625, 2.191680908203125, 2.2578125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 3.0, 6.0, 5.0, 10.0, 9.0, 14.0, 10.0, 16.0, 17.0, 18.0, 20.0, 23.0, 25.0, 30.0, 31.0, 35.0, 47.0, 49.0, 47.0, 33.0, 41.0, 41.0, 36.0, 40.0, 35.0, 42.0, 36.0, 36.0, 31.0, 28.0, 30.0, 23.0, 23.0, 18.0, 17.0, 11.0, 10.0, 13.0, 6.0, 8.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.607421875, -2.52935791015625, -2.4512939453125, -2.37322998046875, -2.295166015625, -2.21710205078125, -2.1390380859375, -2.06097412109375, -1.98291015625, -1.90484619140625, -1.8267822265625, -1.74871826171875, -1.670654296875, -1.59259033203125, -1.5145263671875, -1.43646240234375, -1.3583984375, -1.28033447265625, -1.2022705078125, -1.12420654296875, -1.046142578125, -0.96807861328125, -0.8900146484375, -0.81195068359375, -0.73388671875, -0.65582275390625, -0.5777587890625, -0.49969482421875, -0.421630859375, -0.34356689453125, -0.2655029296875, -0.18743896484375, -0.109375, -0.03131103515625, 0.0467529296875, 0.12481689453125, 0.202880859375, 0.28094482421875, 0.3590087890625, 0.43707275390625, 0.51513671875, 0.59320068359375, 0.6712646484375, 0.74932861328125, 0.827392578125, 0.90545654296875, 0.9835205078125, 1.06158447265625, 1.1396484375, 1.21771240234375, 1.2957763671875, 1.37384033203125, 1.451904296875, 1.52996826171875, 1.6080322265625, 1.68609619140625, 1.76416015625, 1.84222412109375, 1.9202880859375, 1.99835205078125, 2.076416015625, 2.15447998046875, 2.2325439453125, 2.31060791015625, 2.388671875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 7.0, 25.0, 20.0, 32.0, 63.0, 73.0, 154.0, 179.0, 281.0, 486.0, 820.0, 1297.0, 2066.0, 3593.0, 6196.0, 10643.0, 18891.0, 32343.0, 56093.0, 92004.0, 137933.0, 173000.0, 169817.0, 131374.0, 86443.0, 52234.0, 30594.0, 17655.0, 10064.0, 5596.0, 3365.0, 2068.0, 1164.0, 737.0, 429.0, 270.0, 186.0, 109.0, 67.0, 52.0, 41.0, 32.0, 12.0, 15.0, 13.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.351715087890625, -2.27569580078125, -2.199676513671875, -2.1236572265625, -2.047637939453125, -1.97161865234375, -1.895599365234375, -1.819580078125, -1.743560791015625, -1.66754150390625, -1.591522216796875, -1.5155029296875, -1.439483642578125, -1.36346435546875, -1.287445068359375, -1.21142578125, -1.135406494140625, -1.05938720703125, -0.983367919921875, -0.9073486328125, -0.831329345703125, -0.75531005859375, -0.679290771484375, -0.603271484375, -0.527252197265625, -0.45123291015625, -0.375213623046875, -0.2991943359375, -0.223175048828125, -0.14715576171875, -0.071136474609375, 0.0048828125, 0.080902099609375, 0.15692138671875, 0.232940673828125, 0.3089599609375, 0.384979248046875, 0.46099853515625, 0.537017822265625, 0.613037109375, 0.689056396484375, 0.76507568359375, 0.841094970703125, 0.9171142578125, 0.993133544921875, 1.06915283203125, 1.145172119140625, 1.22119140625, 1.297210693359375, 1.37322998046875, 1.449249267578125, 1.5252685546875, 1.601287841796875, 1.67730712890625, 1.753326416015625, 1.829345703125, 1.905364990234375, 1.98138427734375, 2.057403564453125, 2.1334228515625, 2.209442138671875, 2.28546142578125, 2.361480712890625, 2.4375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 11.0, 11.0, 11.0, 12.0, 12.0, 11.0, 12.0, 26.0, 25.0, 21.0, 23.0, 33.0, 29.0, 39.0, 38.0, 39.0, 37.0, 52.0, 45.0, 59.0, 51.0, 36.0, 44.0, 36.0, 29.0, 40.0, 32.0, 19.0, 26.0, 22.0, 13.0, 22.0, 16.0, 10.0, 15.0, 11.0, 4.0, 4.0, 10.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6123046875, -1.5637969970703125, -1.515289306640625, -1.4667816162109375, -1.41827392578125, -1.3697662353515625, -1.321258544921875, -1.2727508544921875, -1.2242431640625, -1.1757354736328125, -1.127227783203125, -1.0787200927734375, -1.03021240234375, -0.9817047119140625, -0.933197021484375, -0.8846893310546875, -0.836181640625, -0.7876739501953125, -0.739166259765625, -0.6906585693359375, -0.64215087890625, -0.5936431884765625, -0.545135498046875, -0.4966278076171875, -0.4481201171875, -0.3996124267578125, -0.351104736328125, -0.3025970458984375, -0.25408935546875, -0.2055816650390625, -0.157073974609375, -0.1085662841796875, -0.06005859375, -0.0115509033203125, 0.036956787109375, 0.0854644775390625, 0.13397216796875, 0.1824798583984375, 0.230987548828125, 0.2794952392578125, 0.3280029296875, 0.3765106201171875, 0.425018310546875, 0.4735260009765625, 0.52203369140625, 0.5705413818359375, 0.619049072265625, 0.6675567626953125, 0.716064453125, 0.7645721435546875, 0.813079833984375, 0.8615875244140625, 0.91009521484375, 0.9586029052734375, 1.007110595703125, 1.0556182861328125, 1.1041259765625, 1.1526336669921875, 1.201141357421875, 1.2496490478515625, 1.29815673828125, 1.3466644287109375, 1.395172119140625, 1.4436798095703125, 1.4921875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 15.0, 16.0, 34.0, 47.0, 76.0, 115.0, 209.0, 279.0, 423.0, 648.0, 1016.0, 1592.0, 2517.0, 3896.0, 6359.0, 10181.0, 16972.0, 28853.0, 49085.0, 84335.0, 140201.0, 192452.0, 187133.0, 130793.0, 78368.0, 45421.0, 26282.0, 15669.0, 9589.0, 5805.0, 3694.0, 2365.0, 1432.0, 942.0, 621.0, 385.0, 244.0, 154.0, 114.0, 72.0, 53.0, 35.0, 20.0, 8.0, 12.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2294921875, -1.19097900390625, -1.1524658203125, -1.11395263671875, -1.075439453125, -1.03692626953125, -0.9984130859375, -0.95989990234375, -0.92138671875, -0.88287353515625, -0.8443603515625, -0.80584716796875, -0.767333984375, -0.72882080078125, -0.6903076171875, -0.65179443359375, -0.61328125, -0.57476806640625, -0.5362548828125, -0.49774169921875, -0.459228515625, -0.42071533203125, -0.3822021484375, -0.34368896484375, -0.30517578125, -0.26666259765625, -0.2281494140625, -0.18963623046875, -0.151123046875, -0.11260986328125, -0.0740966796875, -0.03558349609375, 0.0029296875, 0.04144287109375, 0.0799560546875, 0.11846923828125, 0.156982421875, 0.19549560546875, 0.2340087890625, 0.27252197265625, 0.31103515625, 0.34954833984375, 0.3880615234375, 0.42657470703125, 0.465087890625, 0.50360107421875, 0.5421142578125, 0.58062744140625, 0.619140625, 0.65765380859375, 0.6961669921875, 0.73468017578125, 0.773193359375, 0.81170654296875, 0.8502197265625, 0.88873291015625, 0.92724609375, 0.96575927734375, 1.0042724609375, 1.04278564453125, 1.081298828125, 1.11981201171875, 1.1583251953125, 1.19683837890625, 1.2353515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 4.0, 5.0, 11.0, 12.0, 9.0, 19.0, 26.0, 31.0, 46.0, 72.0, 65.0, 68.0, 82.0, 96.0, 96.0, 72.0, 57.0, 44.0, 32.0, 29.0, 27.0, 25.0, 17.0, 13.0, 13.0, 2.0, 6.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00014781951904296875, -0.00014281272888183594, -0.00013780593872070312, -0.0001327991485595703, -0.0001277923583984375, -0.0001227855682373047, -0.00011777877807617188, -0.00011277198791503906, -0.00010776519775390625, -0.00010275840759277344, -9.775161743164062e-05, -9.274482727050781e-05, -8.7738037109375e-05, -8.273124694824219e-05, -7.772445678710938e-05, -7.271766662597656e-05, -6.771087646484375e-05, -6.270408630371094e-05, -5.7697296142578125e-05, -5.269050598144531e-05, -4.76837158203125e-05, -4.267692565917969e-05, -3.7670135498046875e-05, -3.266334533691406e-05, -2.765655517578125e-05, -2.2649765014648438e-05, -1.7642974853515625e-05, -1.2636184692382812e-05, -7.62939453125e-06, -2.6226043701171875e-06, 2.384185791015625e-06, 7.3909759521484375e-06, 1.239776611328125e-05, 1.7404556274414062e-05, 2.2411346435546875e-05, 2.7418136596679688e-05, 3.24249267578125e-05, 3.743171691894531e-05, 4.2438507080078125e-05, 4.744529724121094e-05, 5.245208740234375e-05, 5.745887756347656e-05, 6.246566772460938e-05, 6.747245788574219e-05, 7.2479248046875e-05, 7.748603820800781e-05, 8.249282836914062e-05, 8.749961853027344e-05, 9.250640869140625e-05, 9.751319885253906e-05, 0.00010251998901367188, 0.00010752677917480469, 0.0001125335693359375, 0.00011754035949707031, 0.00012254714965820312, 0.00012755393981933594, 0.00013256072998046875, 0.00013756752014160156, 0.00014257431030273438, 0.0001475811004638672, 0.000152587890625, 0.0001575946807861328, 0.00016260147094726562, 0.00016760826110839844, 0.00017261505126953125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 7.0, 6.0, 11.0, 18.0, 22.0, 34.0, 48.0, 67.0, 113.0, 145.0, 206.0, 257.0, 383.0, 541.0, 755.0, 1055.0, 1488.0, 2184.0, 3131.0, 4567.0, 6608.0, 10149.0, 15523.0, 23798.0, 37209.0, 58330.0, 88184.0, 123415.0, 151065.0, 150234.0, 121166.0, 85797.0, 56516.0, 36240.0, 23165.0, 15134.0, 9765.0, 6538.0, 4428.0, 3098.0, 2091.0, 1530.0, 997.0, 744.0, 515.0, 398.0, 269.0, 176.0, 130.0, 92.0, 71.0, 44.0, 46.0, 20.0, 10.0, 12.0, 8.0, 8.0, 5.0, 0.0, 3.0], "bins": [-0.95458984375, -0.9247283935546875, -0.894866943359375, -0.8650054931640625, -0.83514404296875, -0.8052825927734375, -0.775421142578125, -0.7455596923828125, -0.7156982421875, -0.6858367919921875, -0.655975341796875, -0.6261138916015625, -0.59625244140625, -0.5663909912109375, -0.536529541015625, -0.5066680908203125, -0.476806640625, -0.4469451904296875, -0.417083740234375, -0.3872222900390625, -0.35736083984375, -0.3274993896484375, -0.297637939453125, -0.2677764892578125, -0.2379150390625, -0.2080535888671875, -0.178192138671875, -0.1483306884765625, -0.11846923828125, -0.0886077880859375, -0.058746337890625, -0.0288848876953125, 0.0009765625, 0.0308380126953125, 0.060699462890625, 0.0905609130859375, 0.12042236328125, 0.1502838134765625, 0.180145263671875, 0.2100067138671875, 0.2398681640625, 0.2697296142578125, 0.299591064453125, 0.3294525146484375, 0.35931396484375, 0.3891754150390625, 0.419036865234375, 0.4488983154296875, 0.478759765625, 0.5086212158203125, 0.538482666015625, 0.5683441162109375, 0.59820556640625, 0.6280670166015625, 0.657928466796875, 0.6877899169921875, 0.7176513671875, 0.7475128173828125, 0.777374267578125, 0.8072357177734375, 0.83709716796875, 0.8669586181640625, 0.896820068359375, 0.9266815185546875, 0.95654296875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 2.0, 7.0, 8.0, 6.0, 8.0, 8.0, 11.0, 12.0, 13.0, 18.0, 20.0, 23.0, 21.0, 18.0, 35.0, 52.0, 31.0, 47.0, 46.0, 42.0, 31.0, 39.0, 45.0, 42.0, 46.0, 32.0, 32.0, 38.0, 38.0, 35.0, 19.0, 30.0, 22.0, 19.0, 21.0, 15.0, 16.0, 8.0, 7.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.2327880859375, -0.2254810333251953, -0.21817398071289062, -0.21086692810058594, -0.20355987548828125, -0.19625282287597656, -0.18894577026367188, -0.1816387176513672, -0.1743316650390625, -0.1670246124267578, -0.15971755981445312, -0.15241050720214844, -0.14510345458984375, -0.13779640197753906, -0.13048934936523438, -0.12318229675292969, -0.115875244140625, -0.10856819152832031, -0.10126113891601562, -0.09395408630371094, -0.08664703369140625, -0.07933998107910156, -0.07203292846679688, -0.06472587585449219, -0.0574188232421875, -0.05011177062988281, -0.042804718017578125, -0.03549766540527344, -0.02819061279296875, -0.020883560180664062, -0.013576507568359375, -0.0062694549560546875, 0.00103759765625, 0.008344650268554688, 0.015651702880859375, 0.022958755493164062, 0.03026580810546875, 0.03757286071777344, 0.044879913330078125, 0.05218696594238281, 0.0594940185546875, 0.06680107116699219, 0.07410812377929688, 0.08141517639160156, 0.08872222900390625, 0.09602928161621094, 0.10333633422851562, 0.11064338684082031, 0.117950439453125, 0.1252574920654297, 0.13256454467773438, 0.13987159729003906, 0.14717864990234375, 0.15448570251464844, 0.16179275512695312, 0.1690998077392578, 0.1764068603515625, 0.1837139129638672, 0.19102096557617188, 0.19832801818847656, 0.20563507080078125, 0.21294212341308594, 0.22024917602539062, 0.2275562286376953, 0.23486328125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 11.0, 8.0, 13.0, 13.0, 7.0, 18.0, 24.0, 27.0, 53.0, 62.0, 76.0, 88.0, 117.0, 88.0, 97.0, 66.0, 61.0, 53.0, 22.0, 29.0, 12.0, 11.0, 16.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64752197265625, -5.456513404846191, -5.265504837036133, -5.074496269226074, -4.883487701416016, -4.692479133605957, -4.501470565795898, -4.31046199798584, -4.119453430175781, -3.9284448623657227, -3.737436294555664, -3.5464277267456055, -3.355419158935547, -3.1644105911254883, -2.9734020233154297, -2.782393455505371, -2.5913851261138916, -2.400376558303833, -2.2093679904937744, -2.018359422683716, -1.8273508548736572, -1.6363422870635986, -1.4453338384628296, -1.254325270652771, -1.0633167028427124, -0.8723081350326538, -0.6812995672225952, -0.4902910590171814, -0.2992824912071228, -0.10827392339706421, 0.08273458480834961, 0.2737431526184082, 0.4647517204284668, 0.6557602882385254, 0.846768856048584, 1.0377774238586426, 1.2287859916687012, 1.4197945594787598, 1.6108030080795288, 1.8018115758895874, 1.992820143699646, 2.183828592300415, 2.3748371601104736, 2.5658457279205322, 2.756854295730591, 2.9478628635406494, 3.138871431350708, 3.3298799991607666, 3.520888566970825, 3.711897134780884, 3.9029057025909424, 4.093914031982422, 4.2849225997924805, 4.475931167602539, 4.666939735412598, 4.857948303222656, 5.048956871032715, 5.239965438842773, 5.430974006652832, 5.621982574462891, 5.812991142272949, 6.003999710083008, 6.195008277893066, 6.386016845703125, 6.577025413513184]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 9.0, 4.0, 10.0, 8.0, 18.0, 18.0, 18.0, 20.0, 22.0, 18.0, 25.0, 23.0, 27.0, 28.0, 47.0, 44.0, 33.0, 43.0, 40.0, 38.0, 44.0, 42.0, 31.0, 39.0, 47.0, 24.0, 28.0, 29.0, 28.0, 34.0, 24.0, 22.0, 25.0, 18.0, 14.0, 13.0, 4.0, 8.0, 6.0, 3.0, 4.0, 5.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.291991949081421, -2.221914529800415, -2.151837110519409, -2.0817599296569824, -2.0116825103759766, -1.9416050910949707, -1.8715276718139648, -1.801450252532959, -1.7313729524612427, -1.6612955331802368, -1.5912182331085205, -1.5211408138275146, -1.4510633945465088, -1.3809860944747925, -1.3109086751937866, -1.2408313751220703, -1.1707539558410645, -1.1006765365600586, -1.0305992364883423, -0.9605218172073364, -0.8904444575309753, -0.8203670978546143, -0.7502896785736084, -0.6802123188972473, -0.6101349592208862, -0.5400575995445251, -0.4699802100658417, -0.3999028205871582, -0.3298254609107971, -0.25974810123443604, -0.18967071175575256, -0.11959332227706909, -0.049515724182128906, 0.02056165039539337, 0.09063902497291565, 0.16071639955043793, 0.2307937741279602, 0.3008711338043213, 0.37094852328300476, 0.44102591276168823, 0.5111032724380493, 0.5811806321144104, 0.6512579917907715, 0.7213354110717773, 0.7914127707481384, 0.8614901304244995, 0.9315675497055054, 1.0016448497772217, 1.0717222690582275, 1.1417996883392334, 1.2118769884109497, 1.2819544076919556, 1.3520317077636719, 1.4221091270446777, 1.4921865463256836, 1.5622639656066895, 1.6323412656784058, 1.7024186849594116, 1.772495985031128, 1.8425734043121338, 1.9126508235931396, 1.982728123664856, 2.0528054237365723, 2.122882843017578, 2.192960262298584]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 6.0, 14.0, 16.0, 36.0, 42.0, 60.0, 89.0, 117.0, 177.0, 233.0, 303.0, 433.0, 604.0, 878.0, 1235.0, 1785.0, 2785.0, 4087.0, 6494.0, 10523.0, 17979.0, 33068.0, 67799.0, 159752.0, 434541.0, 1100285.0, 1323447.0, 622068.0, 221104.0, 88091.0, 40430.0, 21355.0, 12404.0, 7486.0, 4613.0, 3123.0, 2062.0, 1444.0, 954.0, 680.0, 499.0, 344.0, 244.0, 160.0, 123.0, 92.0, 79.0, 45.0, 36.0, 25.0, 9.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0], "bins": [-4.3828125, -4.25067138671875, -4.1185302734375, -3.98638916015625, -3.854248046875, -3.72210693359375, -3.5899658203125, -3.45782470703125, -3.32568359375, -3.19354248046875, -3.0614013671875, -2.92926025390625, -2.797119140625, -2.66497802734375, -2.5328369140625, -2.40069580078125, -2.2685546875, -2.13641357421875, -2.0042724609375, -1.87213134765625, -1.739990234375, -1.60784912109375, -1.4757080078125, -1.34356689453125, -1.21142578125, -1.07928466796875, -0.9471435546875, -0.81500244140625, -0.682861328125, -0.55072021484375, -0.4185791015625, -0.28643798828125, -0.154296875, -0.02215576171875, 0.1099853515625, 0.24212646484375, 0.374267578125, 0.50640869140625, 0.6385498046875, 0.77069091796875, 0.90283203125, 1.03497314453125, 1.1671142578125, 1.29925537109375, 1.431396484375, 1.56353759765625, 1.6956787109375, 1.82781982421875, 1.9599609375, 2.09210205078125, 2.2242431640625, 2.35638427734375, 2.488525390625, 2.62066650390625, 2.7528076171875, 2.88494873046875, 3.01708984375, 3.14923095703125, 3.2813720703125, 3.41351318359375, 3.545654296875, 3.67779541015625, 3.8099365234375, 3.94207763671875, 4.07421875]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 4.0, 7.0, 12.0, 8.0, 15.0, 12.0, 14.0, 15.0, 27.0, 18.0, 31.0, 36.0, 25.0, 29.0, 32.0, 36.0, 55.0, 40.0, 31.0, 40.0, 42.0, 41.0, 42.0, 34.0, 36.0, 30.0, 30.0, 36.0, 24.0, 27.0, 28.0, 19.0, 31.0, 14.0, 16.0, 9.0, 11.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8017578125, -1.745574951171875, -1.68939208984375, -1.633209228515625, -1.5770263671875, -1.520843505859375, -1.46466064453125, -1.408477783203125, -1.352294921875, -1.296112060546875, -1.23992919921875, -1.183746337890625, -1.1275634765625, -1.071380615234375, -1.01519775390625, -0.959014892578125, -0.90283203125, -0.846649169921875, -0.79046630859375, -0.734283447265625, -0.6781005859375, -0.621917724609375, -0.56573486328125, -0.509552001953125, -0.453369140625, -0.397186279296875, -0.34100341796875, -0.284820556640625, -0.2286376953125, -0.172454833984375, -0.11627197265625, -0.060089111328125, -0.00390625, 0.052276611328125, 0.10845947265625, 0.164642333984375, 0.2208251953125, 0.277008056640625, 0.33319091796875, 0.389373779296875, 0.445556640625, 0.501739501953125, 0.55792236328125, 0.614105224609375, 0.6702880859375, 0.726470947265625, 0.78265380859375, 0.838836669921875, 0.89501953125, 0.951202392578125, 1.00738525390625, 1.063568115234375, 1.1197509765625, 1.175933837890625, 1.23211669921875, 1.288299560546875, 1.344482421875, 1.400665283203125, 1.45684814453125, 1.513031005859375, 1.5692138671875, 1.625396728515625, 1.68157958984375, 1.737762451171875, 1.7939453125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 5.0, 7.0, 6.0, 16.0, 18.0, 32.0, 40.0, 59.0, 89.0, 149.0, 187.0, 280.0, 403.0, 637.0, 1031.0, 1643.0, 2655.0, 4457.0, 7663.0, 13879.0, 25974.0, 52771.0, 116763.0, 296557.0, 861412.0, 1575927.0, 758207.0, 263519.0, 106191.0, 48556.0, 24115.0, 13062.0, 7154.0, 4157.0, 2505.0, 1443.0, 970.0, 543.0, 407.0, 266.0, 179.0, 100.0, 78.0, 61.0, 35.0, 34.0, 20.0, 14.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.37890625, -5.20782470703125, -5.0367431640625, -4.86566162109375, -4.694580078125, -4.52349853515625, -4.3524169921875, -4.18133544921875, -4.01025390625, -3.83917236328125, -3.6680908203125, -3.49700927734375, -3.325927734375, -3.15484619140625, -2.9837646484375, -2.81268310546875, -2.6416015625, -2.47052001953125, -2.2994384765625, -2.12835693359375, -1.957275390625, -1.78619384765625, -1.6151123046875, -1.44403076171875, -1.27294921875, -1.10186767578125, -0.9307861328125, -0.75970458984375, -0.588623046875, -0.41754150390625, -0.2464599609375, -0.07537841796875, 0.095703125, 0.26678466796875, 0.4378662109375, 0.60894775390625, 0.780029296875, 0.95111083984375, 1.1221923828125, 1.29327392578125, 1.46435546875, 1.63543701171875, 1.8065185546875, 1.97760009765625, 2.148681640625, 2.31976318359375, 2.4908447265625, 2.66192626953125, 2.8330078125, 3.00408935546875, 3.1751708984375, 3.34625244140625, 3.517333984375, 3.68841552734375, 3.8594970703125, 4.03057861328125, 4.20166015625, 4.37274169921875, 4.5438232421875, 4.71490478515625, 4.885986328125, 5.05706787109375, 5.2281494140625, 5.39923095703125, 5.5703125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 13.0, 13.0, 14.0, 16.0, 21.0, 25.0, 41.0, 56.0, 59.0, 84.0, 128.0, 152.0, 212.0, 277.0, 355.0, 385.0, 421.0, 383.0, 306.0, 266.0, 189.0, 139.0, 124.0, 130.0, 62.0, 52.0, 37.0, 27.0, 17.0, 16.0, 12.0, 9.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.7646484375, -1.71734619140625, -1.6700439453125, -1.62274169921875, -1.575439453125, -1.52813720703125, -1.4808349609375, -1.43353271484375, -1.38623046875, -1.33892822265625, -1.2916259765625, -1.24432373046875, -1.197021484375, -1.14971923828125, -1.1024169921875, -1.05511474609375, -1.0078125, -0.96051025390625, -0.9132080078125, -0.86590576171875, -0.818603515625, -0.77130126953125, -0.7239990234375, -0.67669677734375, -0.62939453125, -0.58209228515625, -0.5347900390625, -0.48748779296875, -0.440185546875, -0.39288330078125, -0.3455810546875, -0.29827880859375, -0.2509765625, -0.20367431640625, -0.1563720703125, -0.10906982421875, -0.061767578125, -0.01446533203125, 0.0328369140625, 0.08013916015625, 0.12744140625, 0.17474365234375, 0.2220458984375, 0.26934814453125, 0.316650390625, 0.36395263671875, 0.4112548828125, 0.45855712890625, 0.505859375, 0.55316162109375, 0.6004638671875, 0.64776611328125, 0.695068359375, 0.74237060546875, 0.7896728515625, 0.83697509765625, 0.88427734375, 0.93157958984375, 0.9788818359375, 1.02618408203125, 1.073486328125, 1.12078857421875, 1.1680908203125, 1.21539306640625, 1.2626953125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 5.0, 9.0, 10.0, 14.0, 8.0, 22.0, 22.0, 26.0, 36.0, 46.0, 48.0, 72.0, 98.0, 97.0, 93.0, 63.0, 76.0, 58.0, 49.0, 32.0, 24.0, 16.0, 17.0, 14.0, 6.0, 12.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.629872798919678, -5.445515155792236, -5.261157512664795, -5.0767998695373535, -4.892442226409912, -4.708084583282471, -4.523726463317871, -4.33936882019043, -4.155011177062988, -3.970653533935547, -3.7862958908081055, -3.601938247680664, -3.4175806045532227, -3.2332229614257812, -3.0488650798797607, -2.8645074367523193, -2.680150032043457, -2.4957923889160156, -2.311434745788574, -2.127077102661133, -1.9427193403244019, -1.7583616971969604, -1.5740039348602295, -1.389646291732788, -1.2052886486053467, -1.0209310054779053, -0.8365733027458191, -0.6522156000137329, -0.4678579568862915, -0.2835003137588501, -0.09914255142211914, 0.08521509170532227, 0.26957225799560547, 0.45392993092536926, 0.6382876038551331, 0.8226453065872192, 1.0070029497146606, 1.191360592842102, 1.375718355178833, 1.5600759983062744, 1.7444336414337158, 1.9287912845611572, 2.1131489276885986, 2.297506809234619, 2.4818644523620605, 2.666222095489502, 2.8505797386169434, 3.0349373817443848, 3.219295024871826, 3.4036526679992676, 3.588010311126709, 3.7723679542541504, 3.956725597381592, 4.141083240509033, 4.325441360473633, 4.509799003601074, 4.694156646728516, 4.878514289855957, 5.062871932983398, 5.24722957611084, 5.431587219238281, 5.615944862365723, 5.800302505493164, 5.9846601486206055, 6.169017791748047]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 9.0, 7.0, 10.0, 10.0, 15.0, 25.0, 13.0, 20.0, 26.0, 22.0, 30.0, 34.0, 39.0, 33.0, 47.0, 39.0, 40.0, 36.0, 39.0, 37.0, 57.0, 52.0, 34.0, 32.0, 31.0, 31.0, 28.0, 27.0, 29.0, 27.0, 17.0, 18.0, 15.0, 12.0, 13.0, 6.0, 10.0, 9.0, 6.0, 2.0, 1.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.5577101707458496, -2.480426073074341, -2.403141975402832, -2.3258578777313232, -2.2485737800598145, -2.1712896823883057, -2.094005584716797, -2.016721487045288, -1.9394373893737793, -1.8621532917022705, -1.7848691940307617, -1.707585096359253, -1.6303009986877441, -1.5530169010162354, -1.4757328033447266, -1.3984487056732178, -1.3211647272109985, -1.2438806295394897, -1.166596531867981, -1.0893124341964722, -1.0120283365249634, -0.9347442388534546, -0.8574602007865906, -0.7801761031150818, -0.702892005443573, -0.6256079077720642, -0.5483238101005554, -0.471039742231369, -0.39375564455986023, -0.31647154688835144, -0.23918747901916504, -0.16190338134765625, -0.08461928367614746, -0.007335193455219269, 0.06994889676570892, 0.14723297953605652, 0.2245170772075653, 0.3018011748790741, 0.3790852427482605, 0.4563693404197693, 0.5336534380912781, 0.6109375357627869, 0.6882216334342957, 0.7655056715011597, 0.8427897691726685, 0.9200738668441772, 0.997357964515686, 1.0746420621871948, 1.1519261598587036, 1.2292102575302124, 1.3064943552017212, 1.38377845287323, 1.4610625505447388, 1.5383466482162476, 1.6156306266784668, 1.6929147243499756, 1.7701988220214844, 1.8474829196929932, 1.924767017364502, 2.0020511150360107, 2.0793352127075195, 2.1566193103790283, 2.233903408050537, 2.311187505722046, 2.3884716033935547]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 8.0, 16.0, 19.0, 35.0, 48.0, 69.0, 96.0, 141.0, 172.0, 261.0, 389.0, 546.0, 853.0, 1293.0, 2098.0, 3356.0, 5278.0, 8480.0, 14745.0, 24784.0, 43174.0, 74627.0, 124234.0, 178948.0, 192954.0, 148303.0, 92567.0, 53633.0, 31156.0, 18129.0, 10789.0, 6340.0, 3925.0, 2394.0, 1649.0, 1016.0, 648.0, 431.0, 316.0, 212.0, 129.0, 87.0, 62.0, 45.0, 38.0, 27.0, 5.0, 7.0, 11.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.58984375, -1.537200927734375, -1.48455810546875, -1.431915283203125, -1.3792724609375, -1.326629638671875, -1.27398681640625, -1.221343994140625, -1.168701171875, -1.116058349609375, -1.06341552734375, -1.010772705078125, -0.9581298828125, -0.905487060546875, -0.85284423828125, -0.800201416015625, -0.74755859375, -0.694915771484375, -0.64227294921875, -0.589630126953125, -0.5369873046875, -0.484344482421875, -0.43170166015625, -0.379058837890625, -0.326416015625, -0.273773193359375, -0.22113037109375, -0.168487548828125, -0.1158447265625, -0.063201904296875, -0.01055908203125, 0.042083740234375, 0.0947265625, 0.147369384765625, 0.20001220703125, 0.252655029296875, 0.3052978515625, 0.357940673828125, 0.41058349609375, 0.463226318359375, 0.515869140625, 0.568511962890625, 0.62115478515625, 0.673797607421875, 0.7264404296875, 0.779083251953125, 0.83172607421875, 0.884368896484375, 0.93701171875, 0.989654541015625, 1.04229736328125, 1.094940185546875, 1.1475830078125, 1.200225830078125, 1.25286865234375, 1.305511474609375, 1.358154296875, 1.410797119140625, 1.46343994140625, 1.516082763671875, 1.5687255859375, 1.621368408203125, 1.67401123046875, 1.726654052734375, 1.779296875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 13.0, 10.0, 14.0, 18.0, 23.0, 22.0, 31.0, 21.0, 18.0, 40.0, 24.0, 34.0, 34.0, 34.0, 36.0, 47.0, 45.0, 35.0, 38.0, 45.0, 46.0, 33.0, 31.0, 31.0, 38.0, 24.0, 28.0, 24.0, 25.0, 20.0, 12.0, 16.0, 16.0, 9.0, 8.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.5078125, -2.4259033203125, -2.343994140625, -2.2620849609375, -2.18017578125, -2.0982666015625, -2.016357421875, -1.9344482421875, -1.8525390625, -1.7706298828125, -1.688720703125, -1.6068115234375, -1.52490234375, -1.4429931640625, -1.361083984375, -1.2791748046875, -1.197265625, -1.1153564453125, -1.033447265625, -0.9515380859375, -0.86962890625, -0.7877197265625, -0.705810546875, -0.6239013671875, -0.5419921875, -0.4600830078125, -0.378173828125, -0.2962646484375, -0.21435546875, -0.1324462890625, -0.050537109375, 0.0313720703125, 0.11328125, 0.1951904296875, 0.277099609375, 0.3590087890625, 0.44091796875, 0.5228271484375, 0.604736328125, 0.6866455078125, 0.7685546875, 0.8504638671875, 0.932373046875, 1.0142822265625, 1.09619140625, 1.1781005859375, 1.260009765625, 1.3419189453125, 1.423828125, 1.5057373046875, 1.587646484375, 1.6695556640625, 1.75146484375, 1.8333740234375, 1.915283203125, 1.9971923828125, 2.0791015625, 2.1610107421875, 2.242919921875, 2.3248291015625, 2.40673828125, 2.4886474609375, 2.570556640625, 2.6524658203125, 2.734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 13.0, 10.0, 22.0, 34.0, 62.0, 83.0, 116.0, 184.0, 280.0, 401.0, 675.0, 1051.0, 1761.0, 2814.0, 4762.0, 8264.0, 15173.0, 27803.0, 52551.0, 101907.0, 190408.0, 256518.0, 178435.0, 95789.0, 48904.0, 26193.0, 14117.0, 7997.0, 4625.0, 2823.0, 1761.0, 1060.0, 677.0, 449.0, 296.0, 170.0, 128.0, 80.0, 47.0, 36.0, 28.0, 24.0, 10.0, 2.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.5703125, -2.49346923828125, -2.4166259765625, -2.33978271484375, -2.262939453125, -2.18609619140625, -2.1092529296875, -2.03240966796875, -1.95556640625, -1.87872314453125, -1.8018798828125, -1.72503662109375, -1.648193359375, -1.57135009765625, -1.4945068359375, -1.41766357421875, -1.3408203125, -1.26397705078125, -1.1871337890625, -1.11029052734375, -1.033447265625, -0.95660400390625, -0.8797607421875, -0.80291748046875, -0.72607421875, -0.64923095703125, -0.5723876953125, -0.49554443359375, -0.418701171875, -0.34185791015625, -0.2650146484375, -0.18817138671875, -0.111328125, -0.03448486328125, 0.0423583984375, 0.11920166015625, 0.196044921875, 0.27288818359375, 0.3497314453125, 0.42657470703125, 0.50341796875, 0.58026123046875, 0.6571044921875, 0.73394775390625, 0.810791015625, 0.88763427734375, 0.9644775390625, 1.04132080078125, 1.1181640625, 1.19500732421875, 1.2718505859375, 1.34869384765625, 1.425537109375, 1.50238037109375, 1.5792236328125, 1.65606689453125, 1.73291015625, 1.80975341796875, 1.8865966796875, 1.96343994140625, 2.040283203125, 2.11712646484375, 2.1939697265625, 2.27081298828125, 2.34765625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 7.0, 10.0, 12.0, 16.0, 17.0, 21.0, 21.0, 26.0, 26.0, 36.0, 32.0, 33.0, 43.0, 37.0, 35.0, 37.0, 38.0, 41.0, 56.0, 45.0, 51.0, 51.0, 32.0, 39.0, 44.0, 30.0, 25.0, 19.0, 17.0, 24.0, 15.0, 11.0, 15.0, 12.0, 11.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.478515625, -1.42303466796875, -1.3675537109375, -1.31207275390625, -1.256591796875, -1.20111083984375, -1.1456298828125, -1.09014892578125, -1.03466796875, -0.97918701171875, -0.9237060546875, -0.86822509765625, -0.812744140625, -0.75726318359375, -0.7017822265625, -0.64630126953125, -0.5908203125, -0.53533935546875, -0.4798583984375, -0.42437744140625, -0.368896484375, -0.31341552734375, -0.2579345703125, -0.20245361328125, -0.14697265625, -0.09149169921875, -0.0360107421875, 0.01947021484375, 0.074951171875, 0.13043212890625, 0.1859130859375, 0.24139404296875, 0.296875, 0.35235595703125, 0.4078369140625, 0.46331787109375, 0.518798828125, 0.57427978515625, 0.6297607421875, 0.68524169921875, 0.74072265625, 0.79620361328125, 0.8516845703125, 0.90716552734375, 0.962646484375, 1.01812744140625, 1.0736083984375, 1.12908935546875, 1.1845703125, 1.24005126953125, 1.2955322265625, 1.35101318359375, 1.406494140625, 1.46197509765625, 1.5174560546875, 1.57293701171875, 1.62841796875, 1.68389892578125, 1.7393798828125, 1.79486083984375, 1.850341796875, 1.90582275390625, 1.9613037109375, 2.01678466796875, 2.072265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 7.0, 8.0, 14.0, 17.0, 25.0, 28.0, 37.0, 56.0, 84.0, 107.0, 146.0, 208.0, 266.0, 416.0, 629.0, 1005.0, 1734.0, 3486.0, 8558.0, 25626.0, 100561.0, 424736.0, 361739.0, 82331.0, 21619.0, 7362.0, 3175.0, 1684.0, 948.0, 607.0, 384.0, 285.0, 181.0, 140.0, 104.0, 67.0, 48.0, 29.0, 38.0, 13.0, 13.0, 9.0, 11.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.34375, -2.267974853515625, -2.19219970703125, -2.116424560546875, -2.0406494140625, -1.964874267578125, -1.88909912109375, -1.813323974609375, -1.737548828125, -1.661773681640625, -1.58599853515625, -1.510223388671875, -1.4344482421875, -1.358673095703125, -1.28289794921875, -1.207122802734375, -1.13134765625, -1.055572509765625, -0.97979736328125, -0.904022216796875, -0.8282470703125, -0.752471923828125, -0.67669677734375, -0.600921630859375, -0.525146484375, -0.449371337890625, -0.37359619140625, -0.297821044921875, -0.2220458984375, -0.146270751953125, -0.07049560546875, 0.005279541015625, 0.0810546875, 0.156829833984375, 0.23260498046875, 0.308380126953125, 0.3841552734375, 0.459930419921875, 0.53570556640625, 0.611480712890625, 0.687255859375, 0.763031005859375, 0.83880615234375, 0.914581298828125, 0.9903564453125, 1.066131591796875, 1.14190673828125, 1.217681884765625, 1.29345703125, 1.369232177734375, 1.44500732421875, 1.520782470703125, 1.5965576171875, 1.672332763671875, 1.74810791015625, 1.823883056640625, 1.899658203125, 1.975433349609375, 2.05120849609375, 2.126983642578125, 2.2027587890625, 2.278533935546875, 2.35430908203125, 2.430084228515625, 2.505859375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 11.0, 11.0, 17.0, 29.0, 28.0, 59.0, 76.0, 117.0, 157.0, 123.0, 118.0, 78.0, 55.0, 38.0, 24.0, 23.0, 13.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.98377799987793e-05, -9.640119969844818e-05, -9.296461939811707e-05, -8.952803909778595e-05, -8.609145879745483e-05, -8.265487849712372e-05, -7.92182981967926e-05, -7.578171789646149e-05, -7.234513759613037e-05, -6.890855729579926e-05, -6.547197699546814e-05, -6.203539669513702e-05, -5.859881639480591e-05, -5.516223609447479e-05, -5.172565579414368e-05, -4.828907549381256e-05, -4.4852495193481445e-05, -4.141591489315033e-05, -3.7979334592819214e-05, -3.45427542924881e-05, -3.110617399215698e-05, -2.7669593691825867e-05, -2.423301339149475e-05, -2.0796433091163635e-05, -1.735985279083252e-05, -1.3923272490501404e-05, -1.0486692190170288e-05, -7.050111889839172e-06, -3.6135315895080566e-06, -1.7695128917694092e-07, 3.259629011154175e-06, 6.6962093114852905e-06, 1.0132789611816406e-05, 1.3569369912147522e-05, 1.7005950212478638e-05, 2.0442530512809753e-05, 2.387911081314087e-05, 2.7315691113471985e-05, 3.07522714138031e-05, 3.4188851714134216e-05, 3.762543201446533e-05, 4.106201231479645e-05, 4.4498592615127563e-05, 4.793517291545868e-05, 5.1371753215789795e-05, 5.480833351612091e-05, 5.8244913816452026e-05, 6.168149411678314e-05, 6.511807441711426e-05, 6.855465471744537e-05, 7.199123501777649e-05, 7.54278153181076e-05, 7.886439561843872e-05, 8.230097591876984e-05, 8.573755621910095e-05, 8.917413651943207e-05, 9.261071681976318e-05, 9.60472971200943e-05, 9.948387742042542e-05, 0.00010292045772075653, 0.00010635703802108765, 0.00010979361832141876, 0.00011323019862174988, 0.000116666778922081, 0.00012010335922241211]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 0.0, 3.0, 2.0, 5.0, 6.0, 5.0, 10.0, 20.0, 14.0, 39.0, 31.0, 49.0, 85.0, 109.0, 162.0, 244.0, 379.0, 591.0, 1030.0, 1858.0, 3665.0, 8172.0, 20552.0, 56226.0, 158642.0, 333831.0, 280779.0, 113755.0, 40263.0, 15066.0, 6172.0, 2828.0, 1547.0, 883.0, 503.0, 314.0, 234.0, 158.0, 85.0, 71.0, 44.0, 37.0, 24.0, 21.0, 14.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5126953125, -1.465179443359375, -1.41766357421875, -1.370147705078125, -1.3226318359375, -1.275115966796875, -1.22760009765625, -1.180084228515625, -1.132568359375, -1.085052490234375, -1.03753662109375, -0.990020751953125, -0.9425048828125, -0.894989013671875, -0.84747314453125, -0.799957275390625, -0.75244140625, -0.704925537109375, -0.65740966796875, -0.609893798828125, -0.5623779296875, -0.514862060546875, -0.46734619140625, -0.419830322265625, -0.372314453125, -0.324798583984375, -0.27728271484375, -0.229766845703125, -0.1822509765625, -0.134735107421875, -0.08721923828125, -0.039703369140625, 0.0078125, 0.055328369140625, 0.10284423828125, 0.150360107421875, 0.1978759765625, 0.245391845703125, 0.29290771484375, 0.340423583984375, 0.387939453125, 0.435455322265625, 0.48297119140625, 0.530487060546875, 0.5780029296875, 0.625518798828125, 0.67303466796875, 0.720550537109375, 0.76806640625, 0.815582275390625, 0.86309814453125, 0.910614013671875, 0.9581298828125, 1.005645751953125, 1.05316162109375, 1.100677490234375, 1.148193359375, 1.195709228515625, 1.24322509765625, 1.290740966796875, 1.3382568359375, 1.385772705078125, 1.43328857421875, 1.480804443359375, 1.5283203125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 5.0, 14.0, 13.0, 25.0, 38.0, 32.0, 60.0, 73.0, 79.0, 98.0, 95.0, 77.0, 92.0, 70.0, 60.0, 52.0, 25.0, 21.0, 20.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.482177734375, -0.4699516296386719, -0.45772552490234375, -0.4454994201660156, -0.4332733154296875, -0.4210472106933594, -0.40882110595703125, -0.3965950012207031, -0.384368896484375, -0.3721427917480469, -0.35991668701171875, -0.3476905822753906, -0.3354644775390625, -0.3232383728027344, -0.31101226806640625, -0.2987861633300781, -0.28656005859375, -0.2743339538574219, -0.26210784912109375, -0.24988174438476562, -0.2376556396484375, -0.22542953491210938, -0.21320343017578125, -0.20097732543945312, -0.188751220703125, -0.17652511596679688, -0.16429901123046875, -0.15207290649414062, -0.1398468017578125, -0.12762069702148438, -0.11539459228515625, -0.10316848754882812, -0.0909423828125, -0.07871627807617188, -0.06649017333984375, -0.054264068603515625, -0.0420379638671875, -0.029811859130859375, -0.01758575439453125, -0.005359649658203125, 0.006866455078125, 0.019092559814453125, 0.03131866455078125, 0.043544769287109375, 0.0557708740234375, 0.06799697875976562, 0.08022308349609375, 0.09244918823242188, 0.10467529296875, 0.11690139770507812, 0.12912750244140625, 0.14135360717773438, 0.1535797119140625, 0.16580581665039062, 0.17803192138671875, 0.19025802612304688, 0.202484130859375, 0.21471023559570312, 0.22693634033203125, 0.23916244506835938, 0.2513885498046875, 0.2636146545410156, 0.27584075927734375, 0.2880668640136719, 0.30029296875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 5.0, 7.0, 5.0, 8.0, 10.0, 11.0, 13.0, 22.0, 20.0, 27.0, 42.0, 56.0, 48.0, 87.0, 88.0, 103.0, 95.0, 75.0, 62.0, 49.0, 47.0, 26.0, 20.0, 18.0, 18.0, 7.0, 11.0, 8.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.888411045074463, -5.7000813484191895, -5.511752128601074, -5.323422431945801, -5.1350932121276855, -4.946763515472412, -4.758434295654297, -4.570104598999023, -4.38177490234375, -4.193445205688477, -4.005115985870361, -3.816786289215088, -3.6284570693969727, -3.440127372741699, -3.251797914505005, -3.0634684562683105, -2.8751392364501953, -2.686809778213501, -2.4984803199768066, -2.310150623321533, -2.121821403503418, -1.933491826057434, -1.7451622486114502, -1.5568327903747559, -1.3685033321380615, -1.1801738739013672, -0.9918443560600281, -0.803514838218689, -0.6151853799819946, -0.4268559217453003, -0.2385263442993164, -0.05019688606262207, 0.13813257217407227, 0.326462060213089, 0.5147915482521057, 0.7031210660934448, 0.8914505243301392, 1.0797799825668335, 1.2681095600128174, 1.4564390182495117, 1.644768476486206, 1.8330979347229004, 2.0214273929595947, 2.209756851196289, 2.3980865478515625, 2.5864157676696777, 2.774745464324951, 2.9630749225616455, 3.15140438079834, 3.339733839035034, 3.5280632972717285, 3.716392993927002, 3.904722213745117, 4.093051910400391, 4.281381607055664, 4.469710826873779, 4.6580400466918945, 4.846369743347168, 5.034698963165283, 5.223028659820557, 5.411357879638672, 5.599687576293945, 5.788017272949219, 5.976346492767334, 6.164676189422607]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 1.0, 3.0, 9.0, 9.0, 11.0, 9.0, 21.0, 22.0, 22.0, 24.0, 22.0, 28.0, 24.0, 40.0, 37.0, 42.0, 43.0, 41.0, 38.0, 42.0, 35.0, 57.0, 54.0, 35.0, 34.0, 30.0, 33.0, 34.0, 25.0, 27.0, 28.0, 20.0, 19.0, 15.0, 11.0, 10.0, 13.0, 6.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.561657190322876, -2.4844746589660645, -2.407291889190674, -2.3301093578338623, -2.252926826477051, -2.17574405670166, -2.0985615253448486, -2.021378993988037, -1.944196343421936, -1.867013692855835, -1.7898311614990234, -1.7126485109329224, -1.6354658603668213, -1.5582833290100098, -1.4811006784439087, -1.4039180278778076, -1.326735496520996, -1.249552845954895, -1.1723703145980835, -1.0951876640319824, -1.018005132675171, -0.9408224821090698, -0.8636398315429688, -0.7864572405815125, -0.7092746496200562, -0.6320920586585999, -0.5549094676971436, -0.4777268171310425, -0.4005442261695862, -0.3233616352081299, -0.2461790144443512, -0.1689963936805725, -0.09181404113769531, -0.01463143527507782, 0.06255117058753967, 0.13973377645015717, 0.21691638231277466, 0.29409897327423096, 0.37128159403800964, 0.44846421480178833, 0.5256468057632446, 0.6028293967247009, 0.6800119876861572, 0.7571946382522583, 0.8343772292137146, 0.9115598201751709, 0.988742470741272, 1.065925121307373, 1.1431076526641846, 1.2202903032302856, 1.2974728345870972, 1.3746554851531982, 1.4518380165100098, 1.5290206670761108, 1.606203317642212, 1.6833858489990234, 1.7605684995651245, 1.8377511501312256, 1.914933681488037, 1.9921163320541382, 2.0692989826202393, 2.146481513977051, 2.2236640453338623, 2.300846815109253, 2.3780293464660645]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 6.0, 11.0, 11.0, 29.0, 34.0, 61.0, 79.0, 129.0, 166.0, 271.0, 406.0, 581.0, 790.0, 1298.0, 2133.0, 3277.0, 5247.0, 8718.0, 14123.0, 23841.0, 39772.0, 65644.0, 103395.0, 145436.0, 170429.0, 155819.0, 115644.0, 74993.0, 45820.0, 27484.0, 16392.0, 9909.0, 6025.0, 3874.0, 2279.0, 1472.0, 1040.0, 664.0, 415.0, 276.0, 182.0, 133.0, 93.0, 56.0, 38.0, 25.0, 15.0, 10.0, 14.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.53125, -2.453704833984375, -2.37615966796875, -2.298614501953125, -2.2210693359375, -2.143524169921875, -2.06597900390625, -1.988433837890625, -1.910888671875, -1.833343505859375, -1.75579833984375, -1.678253173828125, -1.6007080078125, -1.523162841796875, -1.44561767578125, -1.368072509765625, -1.29052734375, -1.212982177734375, -1.13543701171875, -1.057891845703125, -0.9803466796875, -0.902801513671875, -0.82525634765625, -0.747711181640625, -0.670166015625, -0.592620849609375, -0.51507568359375, -0.437530517578125, -0.3599853515625, -0.282440185546875, -0.20489501953125, -0.127349853515625, -0.0498046875, 0.027740478515625, 0.10528564453125, 0.182830810546875, 0.2603759765625, 0.337921142578125, 0.41546630859375, 0.493011474609375, 0.570556640625, 0.648101806640625, 0.72564697265625, 0.803192138671875, 0.8807373046875, 0.958282470703125, 1.03582763671875, 1.113372802734375, 1.19091796875, 1.268463134765625, 1.34600830078125, 1.423553466796875, 1.5010986328125, 1.578643798828125, 1.65618896484375, 1.733734130859375, 1.811279296875, 1.888824462890625, 1.96636962890625, 2.043914794921875, 2.1214599609375, 2.199005126953125, 2.27655029296875, 2.354095458984375, 2.431640625]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 7.0, 3.0, 3.0, 8.0, 12.0, 24.0, 15.0, 21.0, 22.0, 26.0, 35.0, 25.0, 35.0, 38.0, 54.0, 29.0, 36.0, 47.0, 66.0, 50.0, 52.0, 42.0, 41.0, 29.0, 29.0, 33.0, 29.0, 38.0, 21.0, 26.0, 21.0, 13.0, 15.0, 15.0, 13.0, 7.0, 7.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9296875, -2.8380126953125, -2.746337890625, -2.6546630859375, -2.56298828125, -2.4713134765625, -2.379638671875, -2.2879638671875, -2.1962890625, -2.1046142578125, -2.012939453125, -1.9212646484375, -1.82958984375, -1.7379150390625, -1.646240234375, -1.5545654296875, -1.462890625, -1.3712158203125, -1.279541015625, -1.1878662109375, -1.09619140625, -1.0045166015625, -0.912841796875, -0.8211669921875, -0.7294921875, -0.6378173828125, -0.546142578125, -0.4544677734375, -0.36279296875, -0.2711181640625, -0.179443359375, -0.0877685546875, 0.00390625, 0.0955810546875, 0.187255859375, 0.2789306640625, 0.37060546875, 0.4622802734375, 0.553955078125, 0.6456298828125, 0.7373046875, 0.8289794921875, 0.920654296875, 1.0123291015625, 1.10400390625, 1.1956787109375, 1.287353515625, 1.3790283203125, 1.470703125, 1.5623779296875, 1.654052734375, 1.7457275390625, 1.83740234375, 1.9290771484375, 2.020751953125, 2.1124267578125, 2.2041015625, 2.2957763671875, 2.387451171875, 2.4791259765625, 2.57080078125, 2.6624755859375, 2.754150390625, 2.8458251953125, 2.9375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 11.0, 6.0, 13.0, 19.0, 13.0, 29.0, 37.0, 61.0, 69.0, 94.0, 172.0, 283.0, 443.0, 707.0, 1200.0, 2067.0, 3437.0, 5976.0, 11374.0, 21297.0, 40693.0, 78621.0, 138556.0, 202703.0, 208139.0, 149228.0, 85923.0, 45498.0, 23467.0, 12367.0, 6813.0, 3721.0, 2100.0, 1249.0, 789.0, 471.0, 315.0, 198.0, 135.0, 100.0, 54.0, 35.0, 28.0, 20.0, 13.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.14453125, -3.03997802734375, -2.9354248046875, -2.83087158203125, -2.726318359375, -2.62176513671875, -2.5172119140625, -2.41265869140625, -2.30810546875, -2.20355224609375, -2.0989990234375, -1.99444580078125, -1.889892578125, -1.78533935546875, -1.6807861328125, -1.57623291015625, -1.4716796875, -1.36712646484375, -1.2625732421875, -1.15802001953125, -1.053466796875, -0.94891357421875, -0.8443603515625, -0.73980712890625, -0.63525390625, -0.53070068359375, -0.4261474609375, -0.32159423828125, -0.217041015625, -0.11248779296875, -0.0079345703125, 0.09661865234375, 0.201171875, 0.30572509765625, 0.4102783203125, 0.51483154296875, 0.619384765625, 0.72393798828125, 0.8284912109375, 0.93304443359375, 1.03759765625, 1.14215087890625, 1.2467041015625, 1.35125732421875, 1.455810546875, 1.56036376953125, 1.6649169921875, 1.76947021484375, 1.8740234375, 1.97857666015625, 2.0831298828125, 2.18768310546875, 2.292236328125, 2.39678955078125, 2.5013427734375, 2.60589599609375, 2.71044921875, 2.81500244140625, 2.9195556640625, 3.02410888671875, 3.128662109375, 3.23321533203125, 3.3377685546875, 3.44232177734375, 3.546875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 7.0, 6.0, 6.0, 10.0, 12.0, 20.0, 18.0, 18.0, 25.0, 19.0, 23.0, 26.0, 34.0, 40.0, 35.0, 35.0, 37.0, 44.0, 36.0, 36.0, 39.0, 43.0, 36.0, 45.0, 44.0, 38.0, 29.0, 26.0, 29.0, 25.0, 21.0, 21.0, 23.0, 21.0, 11.0, 11.0, 12.0, 8.0, 5.0, 4.0, 2.0, 5.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6611328125, -1.6121826171875, -1.563232421875, -1.5142822265625, -1.46533203125, -1.4163818359375, -1.367431640625, -1.3184814453125, -1.26953125, -1.2205810546875, -1.171630859375, -1.1226806640625, -1.07373046875, -1.0247802734375, -0.975830078125, -0.9268798828125, -0.8779296875, -0.8289794921875, -0.780029296875, -0.7310791015625, -0.68212890625, -0.6331787109375, -0.584228515625, -0.5352783203125, -0.486328125, -0.4373779296875, -0.388427734375, -0.3394775390625, -0.29052734375, -0.2415771484375, -0.192626953125, -0.1436767578125, -0.0947265625, -0.0457763671875, 0.003173828125, 0.0521240234375, 0.10107421875, 0.1500244140625, 0.198974609375, 0.2479248046875, 0.296875, 0.3458251953125, 0.394775390625, 0.4437255859375, 0.49267578125, 0.5416259765625, 0.590576171875, 0.6395263671875, 0.6884765625, 0.7374267578125, 0.786376953125, 0.8353271484375, 0.88427734375, 0.9332275390625, 0.982177734375, 1.0311279296875, 1.080078125, 1.1290283203125, 1.177978515625, 1.2269287109375, 1.27587890625, 1.3248291015625, 1.373779296875, 1.4227294921875, 1.4716796875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 9.0, 11.0, 12.0, 18.0, 28.0, 39.0, 41.0, 69.0, 121.0, 155.0, 260.0, 451.0, 700.0, 1294.0, 2622.0, 5432.0, 12208.0, 30480.0, 83799.0, 227310.0, 361301.0, 202228.0, 72008.0, 26629.0, 10948.0, 4912.0, 2359.0, 1215.0, 732.0, 431.0, 253.0, 165.0, 106.0, 54.0, 40.0, 38.0, 30.0, 13.0, 8.0, 5.0, 4.0, 0.0, 8.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.328125, -2.2490234375, -2.169921875, -2.0908203125, -2.01171875, -1.9326171875, -1.853515625, -1.7744140625, -1.6953125, -1.6162109375, -1.537109375, -1.4580078125, -1.37890625, -1.2998046875, -1.220703125, -1.1416015625, -1.0625, -0.9833984375, -0.904296875, -0.8251953125, -0.74609375, -0.6669921875, -0.587890625, -0.5087890625, -0.4296875, -0.3505859375, -0.271484375, -0.1923828125, -0.11328125, -0.0341796875, 0.044921875, 0.1240234375, 0.203125, 0.2822265625, 0.361328125, 0.4404296875, 0.51953125, 0.5986328125, 0.677734375, 0.7568359375, 0.8359375, 0.9150390625, 0.994140625, 1.0732421875, 1.15234375, 1.2314453125, 1.310546875, 1.3896484375, 1.46875, 1.5478515625, 1.626953125, 1.7060546875, 1.78515625, 1.8642578125, 1.943359375, 2.0224609375, 2.1015625, 2.1806640625, 2.259765625, 2.3388671875, 2.41796875, 2.4970703125, 2.576171875, 2.6552734375, 2.734375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 8.0, 9.0, 12.0, 28.0, 29.0, 48.0, 71.0, 77.0, 96.0, 103.0, 106.0, 101.0, 73.0, 65.0, 35.0, 28.0, 25.0, 21.0, 11.0, 8.0, 10.0, 5.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002073049545288086, -0.0002006329596042633, -0.00019396096467971802, -0.00018728896975517273, -0.00018061697483062744, -0.00017394497990608215, -0.00016727298498153687, -0.00016060099005699158, -0.0001539289951324463, -0.000147257000207901, -0.0001405850052833557, -0.00013391301035881042, -0.00012724101543426514, -0.00012056902050971985, -0.00011389702558517456, -0.00010722503066062927, -0.00010055303573608398, -9.38810408115387e-05, -8.720904588699341e-05, -8.053705096244812e-05, -7.386505603790283e-05, -6.719306111335754e-05, -6.0521066188812256e-05, -5.384907126426697e-05, -4.717707633972168e-05, -4.050508141517639e-05, -3.3833086490631104e-05, -2.7161091566085815e-05, -2.0489096641540527e-05, -1.381710171699524e-05, -7.145106792449951e-06, -4.731118679046631e-07, 6.198883056640625e-06, 1.2870877981185913e-05, 1.95428729057312e-05, 2.621486783027649e-05, 3.288686275482178e-05, 3.9558857679367065e-05, 4.6230852603912354e-05, 5.290284752845764e-05, 5.957484245300293e-05, 6.624683737754822e-05, 7.29188323020935e-05, 7.95908272266388e-05, 8.626282215118408e-05, 9.293481707572937e-05, 9.960681200027466e-05, 0.00010627880692481995, 0.00011295080184936523, 0.00011962279677391052, 0.0001262947916984558, 0.0001329667866230011, 0.0001396387815475464, 0.00014631077647209167, 0.00015298277139663696, 0.00015965476632118225, 0.00016632676124572754, 0.00017299875617027283, 0.00017967075109481812, 0.0001863427460193634, 0.0001930147409439087, 0.00019968673586845398, 0.00020635873079299927, 0.00021303072571754456, 0.00021970272064208984]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 9.0, 13.0, 17.0, 31.0, 48.0, 66.0, 99.0, 148.0, 229.0, 340.0, 497.0, 804.0, 1247.0, 2001.0, 3338.0, 5502.0, 9183.0, 15690.0, 27373.0, 49470.0, 88406.0, 148808.0, 205393.0, 191846.0, 126957.0, 73580.0, 41069.0, 23013.0, 13212.0, 7766.0, 4673.0, 2819.0, 1801.0, 1123.0, 658.0, 452.0, 315.0, 187.0, 122.0, 77.0, 62.0, 44.0, 29.0, 12.0, 9.0, 11.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.4541015625, -1.4111328125, -1.3681640625, -1.3251953125, -1.2822265625, -1.2392578125, -1.1962890625, -1.1533203125, -1.1103515625, -1.0673828125, -1.0244140625, -0.9814453125, -0.9384765625, -0.8955078125, -0.8525390625, -0.8095703125, -0.7666015625, -0.7236328125, -0.6806640625, -0.6376953125, -0.5947265625, -0.5517578125, -0.5087890625, -0.4658203125, -0.4228515625, -0.3798828125, -0.3369140625, -0.2939453125, -0.2509765625, -0.2080078125, -0.1650390625, -0.1220703125, -0.0791015625, -0.0361328125, 0.0068359375, 0.0498046875, 0.0927734375, 0.1357421875, 0.1787109375, 0.2216796875, 0.2646484375, 0.3076171875, 0.3505859375, 0.3935546875, 0.4365234375, 0.4794921875, 0.5224609375, 0.5654296875, 0.6083984375, 0.6513671875, 0.6943359375, 0.7373046875, 0.7802734375, 0.8232421875, 0.8662109375, 0.9091796875, 0.9521484375, 0.9951171875, 1.0380859375, 1.0810546875, 1.1240234375, 1.1669921875, 1.2099609375, 1.2529296875, 1.2958984375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 3.0, 6.0, 4.0, 5.0, 10.0, 13.0, 18.0, 21.0, 30.0, 25.0, 42.0, 42.0, 47.0, 60.0, 40.0, 76.0, 60.0, 77.0, 69.0, 47.0, 50.0, 42.0, 42.0, 34.0, 24.0, 26.0, 19.0, 16.0, 12.0, 8.0, 11.0, 4.0, 4.0, 0.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412109375, -0.4001312255859375, -0.388153076171875, -0.3761749267578125, -0.36419677734375, -0.3522186279296875, -0.340240478515625, -0.3282623291015625, -0.3162841796875, -0.3043060302734375, -0.292327880859375, -0.2803497314453125, -0.26837158203125, -0.2563934326171875, -0.244415283203125, -0.2324371337890625, -0.220458984375, -0.2084808349609375, -0.196502685546875, -0.1845245361328125, -0.17254638671875, -0.1605682373046875, -0.148590087890625, -0.1366119384765625, -0.1246337890625, -0.1126556396484375, -0.100677490234375, -0.0886993408203125, -0.07672119140625, -0.0647430419921875, -0.052764892578125, -0.0407867431640625, -0.02880859375, -0.0168304443359375, -0.004852294921875, 0.0071258544921875, 0.01910400390625, 0.0310821533203125, 0.043060302734375, 0.0550384521484375, 0.0670166015625, 0.0789947509765625, 0.090972900390625, 0.1029510498046875, 0.11492919921875, 0.1269073486328125, 0.138885498046875, 0.1508636474609375, 0.162841796875, 0.1748199462890625, 0.186798095703125, 0.1987762451171875, 0.21075439453125, 0.2227325439453125, 0.234710693359375, 0.2466888427734375, 0.2586669921875, 0.2706451416015625, 0.282623291015625, 0.2946014404296875, 0.30657958984375, 0.3185577392578125, 0.330535888671875, 0.3425140380859375, 0.3544921875]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 1.0, 5.0, 5.0, 9.0, 9.0, 15.0, 15.0, 13.0, 26.0, 31.0, 31.0, 42.0, 50.0, 65.0, 93.0, 83.0, 98.0, 89.0, 63.0, 57.0, 48.0, 34.0, 27.0, 19.0, 15.0, 13.0, 7.0, 10.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.055029392242432, -5.875762462615967, -5.696495532989502, -5.517228603363037, -5.337961673736572, -5.158694744110107, -4.979427814483643, -4.800160884857178, -4.620893955230713, -4.441627025604248, -4.262360095977783, -4.083093166351318, -3.9038262367248535, -3.7245593070983887, -3.545292377471924, -3.366025447845459, -3.186758518218994, -3.0074915885925293, -2.8282246589660645, -2.6489577293395996, -2.4696907997131348, -2.29042387008667, -2.111156940460205, -1.9318900108337402, -1.7526230812072754, -1.5733561515808105, -1.3940892219543457, -1.2148222923278809, -1.035555362701416, -0.8562884330749512, -0.6770215034484863, -0.4977545738220215, -0.31848812103271484, -0.13922119140625, 0.040045738220214844, 0.2193126678466797, 0.39857959747314453, 0.5778465270996094, 0.7571134567260742, 0.9363803863525391, 1.115647315979004, 1.2949142456054688, 1.4741811752319336, 1.6534481048583984, 1.8327150344848633, 2.011981964111328, 2.191248893737793, 2.370515823364258, 2.5497827529907227, 2.7290496826171875, 2.9083166122436523, 3.087583541870117, 3.266850471496582, 3.446117401123047, 3.6253843307495117, 3.8046512603759766, 3.9839181900024414, 4.163185119628906, 4.342452049255371, 4.521718978881836, 4.700985908508301, 4.880252838134766, 5.0595197677612305, 5.238786697387695, 5.41805362701416]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 7.0, 6.0, 9.0, 12.0, 13.0, 15.0, 15.0, 21.0, 24.0, 18.0, 33.0, 26.0, 30.0, 28.0, 40.0, 41.0, 47.0, 34.0, 43.0, 48.0, 45.0, 43.0, 43.0, 38.0, 32.0, 36.0, 25.0, 14.0, 23.0, 30.0, 22.0, 18.0, 23.0, 19.0, 12.0, 10.0, 8.0, 12.0, 15.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0], "bins": [-2.5916800498962402, -2.515676259994507, -2.4396724700927734, -2.363668441772461, -2.2876646518707275, -2.211660861968994, -2.1356570720672607, -2.0596532821655273, -1.9836493730545044, -1.907645583152771, -1.831641674041748, -1.7556378841400146, -1.6796340942382812, -1.6036301851272583, -1.527626395225525, -1.451622486114502, -1.3756186962127686, -1.2996149063110352, -1.2236109972000122, -1.1476072072982788, -1.0716032981872559, -0.9955995082855225, -0.9195957183837891, -0.8435918688774109, -0.7675880193710327, -0.6915841698646545, -0.6155803203582764, -0.539576530456543, -0.4635726809501648, -0.3875688314437866, -0.31156501173973083, -0.23556119203567505, -0.15955734252929688, -0.0835535079240799, -0.007549673318862915, 0.06845416128635406, 0.14445799589157104, 0.22046184539794922, 0.296465665102005, 0.3724694848060608, 0.44847333431243896, 0.5244771838188171, 0.6004810333251953, 0.6764848232269287, 0.7524886727333069, 0.8284925222396851, 0.9044963121414185, 0.9805001616477966, 1.0565040111541748, 1.1325078010559082, 1.2085117101669312, 1.2845155000686646, 1.3605194091796875, 1.436523199081421, 1.5125269889831543, 1.5885307788848877, 1.6645346879959106, 1.740538477897644, 1.816542387008667, 1.8925461769104004, 1.9685499668121338, 2.044553756713867, 2.1205577850341797, 2.196561574935913, 2.2725653648376465]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 3.0, 9.0, 13.0, 29.0, 19.0, 46.0, 89.0, 145.0, 266.0, 452.0, 764.0, 1358.0, 2439.0, 4644.0, 9027.0, 18040.0, 41123.0, 109517.0, 368495.0, 1326791.0, 1587015.0, 491653.0, 138018.0, 49592.0, 21493.0, 10405.0, 5500.0, 2949.0, 1737.0, 1056.0, 619.0, 377.0, 224.0, 140.0, 95.0, 53.0, 30.0, 20.0, 10.0, 13.0, 9.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.453125, -6.263916015625, -6.07470703125, -5.885498046875, -5.6962890625, -5.507080078125, -5.31787109375, -5.128662109375, -4.939453125, -4.750244140625, -4.56103515625, -4.371826171875, -4.1826171875, -3.993408203125, -3.80419921875, -3.614990234375, -3.42578125, -3.236572265625, -3.04736328125, -2.858154296875, -2.6689453125, -2.479736328125, -2.29052734375, -2.101318359375, -1.912109375, -1.722900390625, -1.53369140625, -1.344482421875, -1.1552734375, -0.966064453125, -0.77685546875, -0.587646484375, -0.3984375, -0.209228515625, -0.02001953125, 0.169189453125, 0.3583984375, 0.547607421875, 0.73681640625, 0.926025390625, 1.115234375, 1.304443359375, 1.49365234375, 1.682861328125, 1.8720703125, 2.061279296875, 2.25048828125, 2.439697265625, 2.62890625, 2.818115234375, 3.00732421875, 3.196533203125, 3.3857421875, 3.574951171875, 3.76416015625, 3.953369140625, 4.142578125, 4.331787109375, 4.52099609375, 4.710205078125, 4.8994140625, 5.088623046875, 5.27783203125, 5.467041015625, 5.65625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 8.0, 9.0, 13.0, 11.0, 8.0, 18.0, 17.0, 20.0, 27.0, 16.0, 30.0, 24.0, 47.0, 29.0, 50.0, 34.0, 51.0, 57.0, 53.0, 54.0, 52.0, 46.0, 43.0, 38.0, 29.0, 28.0, 21.0, 24.0, 24.0, 16.0, 18.0, 19.0, 15.0, 13.0, 13.0, 7.0, 4.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.287109375, -2.220703125, -2.154296875, -2.087890625, -2.021484375, -1.955078125, -1.888671875, -1.822265625, -1.755859375, -1.689453125, -1.623046875, -1.556640625, -1.490234375, -1.423828125, -1.357421875, -1.291015625, -1.224609375, -1.158203125, -1.091796875, -1.025390625, -0.958984375, -0.892578125, -0.826171875, -0.759765625, -0.693359375, -0.626953125, -0.560546875, -0.494140625, -0.427734375, -0.361328125, -0.294921875, -0.228515625, -0.162109375, -0.095703125, -0.029296875, 0.037109375, 0.103515625, 0.169921875, 0.236328125, 0.302734375, 0.369140625, 0.435546875, 0.501953125, 0.568359375, 0.634765625, 0.701171875, 0.767578125, 0.833984375, 0.900390625, 0.966796875, 1.033203125, 1.099609375, 1.166015625, 1.232421875, 1.298828125, 1.365234375, 1.431640625, 1.498046875, 1.564453125, 1.630859375, 1.697265625, 1.763671875, 1.830078125, 1.896484375, 1.962890625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 6.0, 4.0, 8.0, 14.0, 25.0, 19.0, 22.0, 51.0, 60.0, 78.0, 128.0, 193.0, 308.0, 494.0, 822.0, 1358.0, 2309.0, 4015.0, 7283.0, 14437.0, 30445.0, 71489.0, 201332.0, 700038.0, 1847631.0, 902720.0, 251582.0, 85940.0, 35411.0, 16280.0, 8720.0, 4635.0, 2557.0, 1494.0, 891.0, 528.0, 330.0, 227.0, 123.0, 88.0, 48.0, 47.0, 24.0, 25.0, 20.0, 6.0, 13.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.80859375, -7.5828857421875, -7.357177734375, -7.1314697265625, -6.90576171875, -6.6800537109375, -6.454345703125, -6.2286376953125, -6.0029296875, -5.7772216796875, -5.551513671875, -5.3258056640625, -5.10009765625, -4.8743896484375, -4.648681640625, -4.4229736328125, -4.197265625, -3.9715576171875, -3.745849609375, -3.5201416015625, -3.29443359375, -3.0687255859375, -2.843017578125, -2.6173095703125, -2.3916015625, -2.1658935546875, -1.940185546875, -1.7144775390625, -1.48876953125, -1.2630615234375, -1.037353515625, -0.8116455078125, -0.5859375, -0.3602294921875, -0.134521484375, 0.0911865234375, 0.31689453125, 0.5426025390625, 0.768310546875, 0.9940185546875, 1.2197265625, 1.4454345703125, 1.671142578125, 1.8968505859375, 2.12255859375, 2.3482666015625, 2.573974609375, 2.7996826171875, 3.025390625, 3.2510986328125, 3.476806640625, 3.7025146484375, 3.92822265625, 4.1539306640625, 4.379638671875, 4.6053466796875, 4.8310546875, 5.0567626953125, 5.282470703125, 5.5081787109375, 5.73388671875, 5.9595947265625, 6.185302734375, 6.4110107421875, 6.63671875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 7.0, 13.0, 12.0, 24.0, 23.0, 24.0, 45.0, 53.0, 69.0, 118.0, 161.0, 228.0, 295.0, 355.0, 477.0, 455.0, 412.0, 373.0, 243.0, 187.0, 145.0, 113.0, 64.0, 43.0, 38.0, 23.0, 23.0, 11.0, 13.0, 6.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.390625, -2.3328094482421875, -2.274993896484375, -2.2171783447265625, -2.15936279296875, -2.1015472412109375, -2.043731689453125, -1.9859161376953125, -1.9281005859375, -1.8702850341796875, -1.812469482421875, -1.7546539306640625, -1.69683837890625, -1.6390228271484375, -1.581207275390625, -1.5233917236328125, -1.465576171875, -1.4077606201171875, -1.349945068359375, -1.2921295166015625, -1.23431396484375, -1.1764984130859375, -1.118682861328125, -1.0608673095703125, -1.0030517578125, -0.9452362060546875, -0.887420654296875, -0.8296051025390625, -0.77178955078125, -0.7139739990234375, -0.656158447265625, -0.5983428955078125, -0.54052734375, -0.4827117919921875, -0.424896240234375, -0.3670806884765625, -0.30926513671875, -0.2514495849609375, -0.193634033203125, -0.1358184814453125, -0.0780029296875, -0.0201873779296875, 0.037628173828125, 0.0954437255859375, 0.15325927734375, 0.2110748291015625, 0.268890380859375, 0.3267059326171875, 0.384521484375, 0.4423370361328125, 0.500152587890625, 0.5579681396484375, 0.61578369140625, 0.6735992431640625, 0.731414794921875, 0.7892303466796875, 0.8470458984375, 0.9048614501953125, 0.962677001953125, 1.0204925537109375, 1.07830810546875, 1.1361236572265625, 1.193939208984375, 1.2517547607421875, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 4.0, 4.0, 9.0, 5.0, 9.0, 5.0, 6.0, 7.0, 13.0, 18.0, 19.0, 16.0, 35.0, 31.0, 39.0, 38.0, 53.0, 70.0, 71.0, 83.0, 70.0, 55.0, 51.0, 51.0, 40.0, 29.0, 31.0, 25.0, 22.0, 13.0, 20.0, 6.0, 7.0, 11.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-5.197975158691406, -5.046141147613525, -4.894307613372803, -4.742473602294922, -4.590640068054199, -4.438806056976318, -4.2869720458984375, -4.135138511657715, -3.983304500579834, -3.8314707279205322, -3.6796369552612305, -3.5278029441833496, -3.375969171524048, -3.224135398864746, -3.0723016262054443, -2.9204678535461426, -2.768634080886841, -2.616800308227539, -2.4649665355682373, -2.3131327629089355, -2.1612987518310547, -2.009464979171753, -1.8576312065124512, -1.7057973146438599, -1.553963541984558, -1.4021297693252563, -1.250295877456665, -1.0984621047973633, -0.9466282725334167, -0.7947944402694702, -0.6429606676101685, -0.49112677574157715, -0.3392930030822754, -0.18745918571949005, -0.03562536835670471, 0.11620843410491943, 0.26804226636886597, 0.4198760986328125, 0.5717098712921143, 0.7235437631607056, 0.8753775358200073, 1.027211308479309, 1.1790452003479004, 1.3308789730072021, 1.482712745666504, 1.6345466375350952, 1.786380410194397, 1.9382143020629883, 2.09004807472229, 2.241881847381592, 2.3937156200408936, 2.5455493927001953, 2.697383403778076, 2.849217176437378, 3.0010509490966797, 3.1528849601745605, 3.304718494415283, 3.456552267074585, 3.6083860397338867, 3.7602200508117676, 3.9120538234710693, 4.063887596130371, 4.215721130371094, 4.367555141448975, 4.5193891525268555]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 7.0, 11.0, 19.0, 12.0, 25.0, 24.0, 19.0, 29.0, 21.0, 32.0, 28.0, 28.0, 48.0, 31.0, 47.0, 36.0, 46.0, 53.0, 38.0, 32.0, 43.0, 49.0, 26.0, 37.0, 29.0, 32.0, 22.0, 33.0, 19.0, 18.0, 15.0, 14.0, 14.0, 6.0, 8.0, 5.0, 5.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.438157558441162, -2.3558928966522217, -2.2736284732818604, -2.19136381149292, -2.1090993881225586, -2.026834726333618, -1.9445700645446777, -1.8623055219650269, -1.780040979385376, -1.697776436805725, -1.6155118942260742, -1.5332472324371338, -1.450982689857483, -1.368718147277832, -1.2864534854888916, -1.2041889429092407, -1.1219244003295898, -1.039659857749939, -0.9573952555656433, -0.8751306533813477, -0.7928661108016968, -0.7106015682220459, -0.6283369660377502, -0.5460723638534546, -0.4638078212738037, -0.38154324889183044, -0.2992786765098572, -0.2170141041278839, -0.13474953174591064, -0.05248495936393738, 0.02977961301803589, 0.11204421520233154, 0.19430851936340332, 0.2765730917453766, 0.35883766412734985, 0.4411022365093231, 0.5233668088912964, 0.6056313514709473, 0.6878959536552429, 0.7701605558395386, 0.8524250984191895, 0.9346896409988403, 1.0169541835784912, 1.0992188453674316, 1.1814833879470825, 1.2637479305267334, 1.3460125923156738, 1.4282771348953247, 1.5105416774749756, 1.5928062200546265, 1.6750707626342773, 1.7573354244232178, 1.8395999670028687, 1.9218645095825195, 2.00412917137146, 2.0863938331604004, 2.1686582565307617, 2.250922918319702, 2.3331873416900635, 2.415452003479004, 2.4977164268493652, 2.5799810886383057, 2.662245750427246, 2.7445101737976074, 2.826774835586548]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 21.0, 17.0, 27.0, 52.0, 62.0, 87.0, 109.0, 160.0, 265.0, 474.0, 630.0, 1055.0, 1661.0, 2647.0, 4717.0, 8375.0, 15956.0, 31627.0, 67340.0, 144404.0, 257538.0, 249241.0, 134951.0, 62909.0, 29786.0, 14748.0, 8128.0, 4435.0, 2635.0, 1578.0, 980.0, 677.0, 442.0, 260.0, 170.0, 113.0, 79.0, 42.0, 36.0, 33.0, 25.0, 13.0, 9.0, 9.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.806640625, -2.715972900390625, -2.62530517578125, -2.534637451171875, -2.4439697265625, -2.353302001953125, -2.26263427734375, -2.171966552734375, -2.081298828125, -1.990631103515625, -1.89996337890625, -1.809295654296875, -1.7186279296875, -1.627960205078125, -1.53729248046875, -1.446624755859375, -1.35595703125, -1.265289306640625, -1.17462158203125, -1.083953857421875, -0.9932861328125, -0.902618408203125, -0.81195068359375, -0.721282958984375, -0.630615234375, -0.539947509765625, -0.44927978515625, -0.358612060546875, -0.2679443359375, -0.177276611328125, -0.08660888671875, 0.004058837890625, 0.0947265625, 0.185394287109375, 0.27606201171875, 0.366729736328125, 0.4573974609375, 0.548065185546875, 0.63873291015625, 0.729400634765625, 0.820068359375, 0.910736083984375, 1.00140380859375, 1.092071533203125, 1.1827392578125, 1.273406982421875, 1.36407470703125, 1.454742431640625, 1.54541015625, 1.636077880859375, 1.72674560546875, 1.817413330078125, 1.9080810546875, 1.998748779296875, 2.08941650390625, 2.180084228515625, 2.270751953125, 2.361419677734375, 2.45208740234375, 2.542755126953125, 2.6334228515625, 2.724090576171875, 2.81475830078125, 2.905426025390625, 2.99609375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 10.0, 5.0, 6.0, 10.0, 12.0, 13.0, 22.0, 16.0, 28.0, 13.0, 28.0, 33.0, 27.0, 29.0, 25.0, 38.0, 41.0, 44.0, 42.0, 49.0, 43.0, 34.0, 37.0, 40.0, 45.0, 33.0, 37.0, 36.0, 27.0, 21.0, 24.0, 16.0, 24.0, 21.0, 8.0, 11.0, 13.0, 13.0, 6.0, 6.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.705078125, -2.612457275390625, -2.51983642578125, -2.427215576171875, -2.3345947265625, -2.241973876953125, -2.14935302734375, -2.056732177734375, -1.964111328125, -1.871490478515625, -1.77886962890625, -1.686248779296875, -1.5936279296875, -1.501007080078125, -1.40838623046875, -1.315765380859375, -1.22314453125, -1.130523681640625, -1.03790283203125, -0.945281982421875, -0.8526611328125, -0.760040283203125, -0.66741943359375, -0.574798583984375, -0.482177734375, -0.389556884765625, -0.29693603515625, -0.204315185546875, -0.1116943359375, -0.019073486328125, 0.07354736328125, 0.166168212890625, 0.2587890625, 0.351409912109375, 0.44403076171875, 0.536651611328125, 0.6292724609375, 0.721893310546875, 0.81451416015625, 0.907135009765625, 0.999755859375, 1.092376708984375, 1.18499755859375, 1.277618408203125, 1.3702392578125, 1.462860107421875, 1.55548095703125, 1.648101806640625, 1.74072265625, 1.833343505859375, 1.92596435546875, 2.018585205078125, 2.1112060546875, 2.203826904296875, 2.29644775390625, 2.389068603515625, 2.481689453125, 2.574310302734375, 2.66693115234375, 2.759552001953125, 2.8521728515625, 2.944793701171875, 3.03741455078125, 3.130035400390625, 3.22265625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 5.0, 6.0, 12.0, 13.0, 17.0, 13.0, 27.0, 28.0, 54.0, 54.0, 81.0, 108.0, 129.0, 196.0, 270.0, 346.0, 485.0, 800.0, 1133.0, 1820.0, 3196.0, 6181.0, 13469.0, 35790.0, 117295.0, 385936.0, 330729.0, 95112.0, 30142.0, 11609.0, 5427.0, 2981.0, 1667.0, 1063.0, 682.0, 453.0, 313.0, 226.0, 179.0, 126.0, 90.0, 60.0, 68.0, 39.0, 24.0, 27.0, 21.0, 13.0, 11.0, 15.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.28515625, -5.11956787109375, -4.9539794921875, -4.78839111328125, -4.622802734375, -4.45721435546875, -4.2916259765625, -4.12603759765625, -3.96044921875, -3.79486083984375, -3.6292724609375, -3.46368408203125, -3.298095703125, -3.13250732421875, -2.9669189453125, -2.80133056640625, -2.6357421875, -2.47015380859375, -2.3045654296875, -2.13897705078125, -1.973388671875, -1.80780029296875, -1.6422119140625, -1.47662353515625, -1.31103515625, -1.14544677734375, -0.9798583984375, -0.81427001953125, -0.648681640625, -0.48309326171875, -0.3175048828125, -0.15191650390625, 0.013671875, 0.17926025390625, 0.3448486328125, 0.51043701171875, 0.676025390625, 0.84161376953125, 1.0072021484375, 1.17279052734375, 1.33837890625, 1.50396728515625, 1.6695556640625, 1.83514404296875, 2.000732421875, 2.16632080078125, 2.3319091796875, 2.49749755859375, 2.6630859375, 2.82867431640625, 2.9942626953125, 3.15985107421875, 3.325439453125, 3.49102783203125, 3.6566162109375, 3.82220458984375, 3.98779296875, 4.15338134765625, 4.3189697265625, 4.48455810546875, 4.650146484375, 4.81573486328125, 4.9813232421875, 5.14691162109375, 5.3125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 11.0, 5.0, 18.0, 20.0, 15.0, 22.0, 24.0, 25.0, 24.0, 34.0, 30.0, 43.0, 49.0, 31.0, 53.0, 51.0, 42.0, 47.0, 45.0, 48.0, 37.0, 35.0, 37.0, 33.0, 26.0, 35.0, 20.0, 21.0, 15.0, 24.0, 13.0, 12.0, 4.0, 6.0, 7.0, 10.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.71484375, -1.657135009765625, -1.59942626953125, -1.541717529296875, -1.4840087890625, -1.426300048828125, -1.36859130859375, -1.310882568359375, -1.253173828125, -1.195465087890625, -1.13775634765625, -1.080047607421875, -1.0223388671875, -0.964630126953125, -0.90692138671875, -0.849212646484375, -0.79150390625, -0.733795166015625, -0.67608642578125, -0.618377685546875, -0.5606689453125, -0.502960205078125, -0.44525146484375, -0.387542724609375, -0.329833984375, -0.272125244140625, -0.21441650390625, -0.156707763671875, -0.0989990234375, -0.041290283203125, 0.01641845703125, 0.074127197265625, 0.1318359375, 0.189544677734375, 0.24725341796875, 0.304962158203125, 0.3626708984375, 0.420379638671875, 0.47808837890625, 0.535797119140625, 0.593505859375, 0.651214599609375, 0.70892333984375, 0.766632080078125, 0.8243408203125, 0.882049560546875, 0.93975830078125, 0.997467041015625, 1.05517578125, 1.112884521484375, 1.17059326171875, 1.228302001953125, 1.2860107421875, 1.343719482421875, 1.40142822265625, 1.459136962890625, 1.516845703125, 1.574554443359375, 1.63226318359375, 1.689971923828125, 1.7476806640625, 1.805389404296875, 1.86309814453125, 1.920806884765625, 1.978515625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 22.0, 19.0, 29.0, 55.0, 62.0, 100.0, 112.0, 134.0, 227.0, 275.0, 437.0, 618.0, 890.0, 1404.0, 2101.0, 3505.0, 6386.0, 34551.0, 907845.0, 71046.0, 7559.0, 3896.0, 2376.0, 1498.0, 969.0, 763.0, 466.0, 331.0, 232.0, 179.0, 125.0, 74.0, 66.0, 58.0, 39.0, 26.0, 19.0, 14.0, 13.0, 5.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6328125, -9.3179931640625, -9.003173828125, -8.6883544921875, -8.37353515625, -8.0587158203125, -7.743896484375, -7.4290771484375, -7.1142578125, -6.7994384765625, -6.484619140625, -6.1697998046875, -5.85498046875, -5.5401611328125, -5.225341796875, -4.9105224609375, -4.595703125, -4.2808837890625, -3.966064453125, -3.6512451171875, -3.33642578125, -3.0216064453125, -2.706787109375, -2.3919677734375, -2.0771484375, -1.7623291015625, -1.447509765625, -1.1326904296875, -0.81787109375, -0.5030517578125, -0.188232421875, 0.1265869140625, 0.44140625, 0.7562255859375, 1.071044921875, 1.3858642578125, 1.70068359375, 2.0155029296875, 2.330322265625, 2.6451416015625, 2.9599609375, 3.2747802734375, 3.589599609375, 3.9044189453125, 4.21923828125, 4.5340576171875, 4.848876953125, 5.1636962890625, 5.478515625, 5.7933349609375, 6.108154296875, 6.4229736328125, 6.73779296875, 7.0526123046875, 7.367431640625, 7.6822509765625, 7.9970703125, 8.3118896484375, 8.626708984375, 8.9415283203125, 9.25634765625, 9.5711669921875, 9.885986328125, 10.2008056640625, 10.515625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 23.0, 162.0, 553.0, 192.0, 31.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006341934204101562, -0.0006158500909805298, -0.0005975067615509033, -0.0005791634321212769, -0.0005608201026916504, -0.0005424767732620239, -0.0005241334438323975, -0.000505790114402771, -0.00048744678497314453, -0.00046910345554351807, -0.0004507601261138916, -0.00043241679668426514, -0.00041407346725463867, -0.0003957301378250122, -0.00037738680839538574, -0.0003590434789657593, -0.0003407001495361328, -0.00032235682010650635, -0.0003040134906768799, -0.0002856701612472534, -0.00026732683181762695, -0.0002489835023880005, -0.00023064017295837402, -0.00021229684352874756, -0.0001939535140991211, -0.00017561018466949463, -0.00015726685523986816, -0.0001389235258102417, -0.00012058019638061523, -0.00010223686695098877, -8.38935375213623e-05, -6.555020809173584e-05, -4.7206878662109375e-05, -2.886354923248291e-05, -1.0520219802856445e-05, 7.82310962677002e-06, 2.6166439056396484e-05, 4.450976848602295e-05, 6.285309791564941e-05, 8.119642734527588e-05, 9.953975677490234e-05, 0.00011788308620452881, 0.00013622641563415527, 0.00015456974506378174, 0.0001729130744934082, 0.00019125640392303467, 0.00020959973335266113, 0.0002279430627822876, 0.00024628639221191406, 0.00026462972164154053, 0.000282973051071167, 0.00030131638050079346, 0.0003196597099304199, 0.0003380030393600464, 0.00035634636878967285, 0.0003746896982192993, 0.0003930330276489258, 0.00041137635707855225, 0.0004297196865081787, 0.0004480630159378052, 0.00046640634536743164, 0.0004847496747970581, 0.0005030930042266846, 0.000521436333656311, 0.0005397796630859375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 12.0, 19.0, 27.0, 31.0, 41.0, 66.0, 94.0, 101.0, 168.0, 226.0, 313.0, 397.0, 553.0, 735.0, 1140.0, 1555.0, 2318.0, 3326.0, 5464.0, 18184.0, 704234.0, 284076.0, 10717.0, 4752.0, 3000.0, 2015.0, 1367.0, 967.0, 717.0, 543.0, 388.0, 268.0, 204.0, 164.0, 109.0, 66.0, 56.0, 34.0, 20.0, 26.0, 20.0, 8.0, 8.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.796875, -7.5357666015625, -7.274658203125, -7.0135498046875, -6.75244140625, -6.4913330078125, -6.230224609375, -5.9691162109375, -5.7080078125, -5.4468994140625, -5.185791015625, -4.9246826171875, -4.66357421875, -4.4024658203125, -4.141357421875, -3.8802490234375, -3.619140625, -3.3580322265625, -3.096923828125, -2.8358154296875, -2.57470703125, -2.3135986328125, -2.052490234375, -1.7913818359375, -1.5302734375, -1.2691650390625, -1.008056640625, -0.7469482421875, -0.48583984375, -0.2247314453125, 0.036376953125, 0.2974853515625, 0.55859375, 0.8197021484375, 1.080810546875, 1.3419189453125, 1.60302734375, 1.8641357421875, 2.125244140625, 2.3863525390625, 2.6474609375, 2.9085693359375, 3.169677734375, 3.4307861328125, 3.69189453125, 3.9530029296875, 4.214111328125, 4.4752197265625, 4.736328125, 4.9974365234375, 5.258544921875, 5.5196533203125, 5.78076171875, 6.0418701171875, 6.302978515625, 6.5640869140625, 6.8251953125, 7.0863037109375, 7.347412109375, 7.6085205078125, 7.86962890625, 8.1307373046875, 8.391845703125, 8.6529541015625, 8.9140625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 29.0, 193.0, 537.0, 169.0, 30.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.302734375, -3.2169189453125, -3.131103515625, -3.0452880859375, -2.95947265625, -2.8736572265625, -2.787841796875, -2.7020263671875, -2.6162109375, -2.5303955078125, -2.444580078125, -2.3587646484375, -2.27294921875, -2.1871337890625, -2.101318359375, -2.0155029296875, -1.9296875, -1.8438720703125, -1.758056640625, -1.6722412109375, -1.58642578125, -1.5006103515625, -1.414794921875, -1.3289794921875, -1.2431640625, -1.1573486328125, -1.071533203125, -0.9857177734375, -0.89990234375, -0.8140869140625, -0.728271484375, -0.6424560546875, -0.556640625, -0.4708251953125, -0.385009765625, -0.2991943359375, -0.21337890625, -0.1275634765625, -0.041748046875, 0.0440673828125, 0.1298828125, 0.2156982421875, 0.301513671875, 0.3873291015625, 0.47314453125, 0.5589599609375, 0.644775390625, 0.7305908203125, 0.81640625, 0.9022216796875, 0.988037109375, 1.0738525390625, 1.15966796875, 1.2454833984375, 1.331298828125, 1.4171142578125, 1.5029296875, 1.5887451171875, 1.674560546875, 1.7603759765625, 1.84619140625, 1.9320068359375, 2.017822265625, 2.1036376953125, 2.189453125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 1.0, 7.0, 5.0, 11.0, 11.0, 11.0, 10.0, 14.0, 16.0, 23.0, 29.0, 41.0, 38.0, 46.0, 58.0, 60.0, 70.0, 79.0, 61.0, 68.0, 55.0, 51.0, 40.0, 29.0, 27.0, 25.0, 18.0, 14.0, 13.0, 11.0, 8.0, 5.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.277956008911133, -5.12339973449707, -4.968843936920166, -4.8142876625061035, -4.659731864929199, -4.505175590515137, -4.350619792938232, -4.19606351852417, -4.041507720947266, -3.8869516849517822, -3.732395648956299, -3.5778396129608154, -3.423283576965332, -3.2687273025512695, -3.114171266555786, -2.9596152305603027, -2.8050589561462402, -2.650502920150757, -2.4959468841552734, -2.34139084815979, -2.1868348121643066, -2.032278537750244, -1.8777225017547607, -1.7231664657592773, -1.568610429763794, -1.4140543937683105, -1.2594983577728271, -1.1049422025680542, -0.9503861665725708, -0.7958301305770874, -0.6412740349769592, -0.48671793937683105, -0.33216142654418945, -0.17760536074638367, -0.02304929494857788, 0.1315067708492279, 0.2860628366470337, 0.4406188726425171, 0.5951749682426453, 0.7497310638427734, 0.9042870998382568, 1.0588431358337402, 1.2133991718292236, 1.3679553270339966, 1.52251136302948, 1.6770673990249634, 1.8316235542297363, 1.9861795902252197, 2.140735626220703, 2.2952916622161865, 2.44984769821167, 2.6044037342071533, 2.7589597702026367, 2.913516044616699, 3.0680720806121826, 3.222628116607666, 3.3771841526031494, 3.531740188598633, 3.686296224594116, 3.8408522605895996, 3.995408535003662, 4.149964332580566, 4.304520606994629, 4.459076881408691, 4.613632678985596]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 9.0, 4.0, 5.0, 5.0, 12.0, 12.0, 11.0, 11.0, 19.0, 20.0, 28.0, 26.0, 25.0, 32.0, 34.0, 33.0, 30.0, 34.0, 31.0, 38.0, 38.0, 43.0, 41.0, 49.0, 39.0, 39.0, 40.0, 40.0, 25.0, 24.0, 27.0, 22.0, 29.0, 15.0, 14.0, 10.0, 10.0, 20.0, 7.0, 8.0, 8.0, 10.0, 9.0, 6.0, 0.0, 4.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3807549476623535, -2.3013877868652344, -2.222020387649536, -2.142653226852417, -2.0632858276367188, -1.9839186668395996, -1.9045515060424805, -1.8251842260360718, -1.745816946029663, -1.6664496660232544, -1.5870823860168457, -1.5077152252197266, -1.4283479452133179, -1.3489806652069092, -1.26961350440979, -1.1902462244033813, -1.1108789443969727, -1.031511664390564, -0.9521444439888, -0.8727772235870361, -0.7934099435806274, -0.7140426635742188, -0.6346754431724548, -0.5553082227706909, -0.4759409427642822, -0.3965736925601959, -0.3172064423561096, -0.23783919215202332, -0.158471941947937, -0.07910469174385071, 0.0002625584602355957, 0.07962977886199951, 0.1589970588684082, 0.2383643090724945, 0.3177315592765808, 0.3970988094806671, 0.4764660596847534, 0.5558333396911621, 0.635200560092926, 0.7145677804946899, 0.7939350605010986, 0.8733023405075073, 0.9526695609092712, 1.0320367813110352, 1.1114040613174438, 1.1907713413238525, 1.2701385021209717, 1.3495057821273804, 1.428873062133789, 1.5082403421401978, 1.5876076221466064, 1.6669747829437256, 1.7463420629501343, 1.825709342956543, 1.905076503753662, 1.9844437837600708, 2.0638110637664795, 2.1431782245635986, 2.222545623779297, 2.301912784576416, 2.381279945373535, 2.4606473445892334, 2.5400145053863525, 2.619381904602051, 2.69874906539917]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 6.0, 2.0, 10.0, 12.0, 6.0, 14.0, 22.0, 35.0, 41.0, 66.0, 80.0, 140.0, 158.0, 251.0, 347.0, 502.0, 779.0, 1171.0, 1981.0, 3311.0, 6081.0, 11944.0, 24931.0, 55586.0, 124908.0, 235782.0, 268324.0, 167008.0, 76616.0, 33935.0, 15667.0, 7777.0, 4274.0, 2492.0, 1423.0, 880.0, 567.0, 451.0, 308.0, 186.0, 146.0, 101.0, 71.0, 46.0, 29.0, 22.0, 26.0, 11.0, 8.0, 12.0, 4.0, 8.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-5.03515625, -4.88348388671875, -4.7318115234375, -4.58013916015625, -4.428466796875, -4.27679443359375, -4.1251220703125, -3.97344970703125, -3.82177734375, -3.67010498046875, -3.5184326171875, -3.36676025390625, -3.215087890625, -3.06341552734375, -2.9117431640625, -2.76007080078125, -2.6083984375, -2.45672607421875, -2.3050537109375, -2.15338134765625, -2.001708984375, -1.85003662109375, -1.6983642578125, -1.54669189453125, -1.39501953125, -1.24334716796875, -1.0916748046875, -0.94000244140625, -0.788330078125, -0.63665771484375, -0.4849853515625, -0.33331298828125, -0.181640625, -0.02996826171875, 0.1217041015625, 0.27337646484375, 0.425048828125, 0.57672119140625, 0.7283935546875, 0.88006591796875, 1.03173828125, 1.18341064453125, 1.3350830078125, 1.48675537109375, 1.638427734375, 1.79010009765625, 1.9417724609375, 2.09344482421875, 2.2451171875, 2.39678955078125, 2.5484619140625, 2.70013427734375, 2.851806640625, 3.00347900390625, 3.1551513671875, 3.30682373046875, 3.45849609375, 3.61016845703125, 3.7618408203125, 3.91351318359375, 4.065185546875, 4.21685791015625, 4.3685302734375, 4.52020263671875, 4.671875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 6.0, 11.0, 8.0, 14.0, 11.0, 14.0, 16.0, 27.0, 25.0, 26.0, 27.0, 33.0, 27.0, 43.0, 33.0, 35.0, 38.0, 46.0, 59.0, 42.0, 42.0, 45.0, 51.0, 41.0, 36.0, 29.0, 33.0, 30.0, 23.0, 17.0, 22.0, 21.0, 9.0, 9.0, 17.0, 5.0, 7.0, 4.0, 8.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.508697509765625, -2.41192626953125, -2.315155029296875, -2.2183837890625, -2.121612548828125, -2.02484130859375, -1.928070068359375, -1.831298828125, -1.734527587890625, -1.63775634765625, -1.540985107421875, -1.4442138671875, -1.347442626953125, -1.25067138671875, -1.153900146484375, -1.05712890625, -0.960357666015625, -0.86358642578125, -0.766815185546875, -0.6700439453125, -0.573272705078125, -0.47650146484375, -0.379730224609375, -0.282958984375, -0.186187744140625, -0.08941650390625, 0.007354736328125, 0.1041259765625, 0.200897216796875, 0.29766845703125, 0.394439697265625, 0.4912109375, 0.587982177734375, 0.68475341796875, 0.781524658203125, 0.8782958984375, 0.975067138671875, 1.07183837890625, 1.168609619140625, 1.265380859375, 1.362152099609375, 1.45892333984375, 1.555694580078125, 1.6524658203125, 1.749237060546875, 1.84600830078125, 1.942779541015625, 2.03955078125, 2.136322021484375, 2.23309326171875, 2.329864501953125, 2.4266357421875, 2.523406982421875, 2.62017822265625, 2.716949462890625, 2.813720703125, 2.910491943359375, 3.00726318359375, 3.104034423828125, 3.2008056640625, 3.297576904296875, 3.39434814453125, 3.491119384765625, 3.587890625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 6.0, 8.0, 10.0, 13.0, 27.0, 38.0, 44.0, 72.0, 125.0, 163.0, 240.0, 358.0, 557.0, 992.0, 1393.0, 2497.0, 4580.0, 9332.0, 21957.0, 63990.0, 209844.0, 400344.0, 220450.0, 67799.0, 22875.0, 9434.0, 4675.0, 2587.0, 1479.0, 906.0, 627.0, 390.0, 250.0, 150.0, 108.0, 77.0, 53.0, 33.0, 35.0, 17.0, 7.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.90911865234375, -6.6580810546875, -6.40704345703125, -6.156005859375, -5.90496826171875, -5.6539306640625, -5.40289306640625, -5.15185546875, -4.90081787109375, -4.6497802734375, -4.39874267578125, -4.147705078125, -3.89666748046875, -3.6456298828125, -3.39459228515625, -3.1435546875, -2.89251708984375, -2.6414794921875, -2.39044189453125, -2.139404296875, -1.88836669921875, -1.6373291015625, -1.38629150390625, -1.13525390625, -0.88421630859375, -0.6331787109375, -0.38214111328125, -0.131103515625, 0.11993408203125, 0.3709716796875, 0.62200927734375, 0.873046875, 1.12408447265625, 1.3751220703125, 1.62615966796875, 1.877197265625, 2.12823486328125, 2.3792724609375, 2.63031005859375, 2.88134765625, 3.13238525390625, 3.3834228515625, 3.63446044921875, 3.885498046875, 4.13653564453125, 4.3875732421875, 4.63861083984375, 4.8896484375, 5.14068603515625, 5.3917236328125, 5.64276123046875, 5.893798828125, 6.14483642578125, 6.3958740234375, 6.64691162109375, 6.89794921875, 7.14898681640625, 7.4000244140625, 7.65106201171875, 7.902099609375, 8.15313720703125, 8.4041748046875, 8.65521240234375, 8.90625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 3.0, 9.0, 11.0, 9.0, 11.0, 16.0, 17.0, 25.0, 28.0, 25.0, 22.0, 31.0, 34.0, 35.0, 41.0, 53.0, 42.0, 53.0, 39.0, 47.0, 39.0, 42.0, 42.0, 36.0, 41.0, 32.0, 22.0, 30.0, 23.0, 20.0, 17.0, 18.0, 15.0, 9.0, 10.0, 11.0, 7.0, 8.0, 7.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.021484375, -1.957275390625, -1.89306640625, -1.828857421875, -1.7646484375, -1.700439453125, -1.63623046875, -1.572021484375, -1.5078125, -1.443603515625, -1.37939453125, -1.315185546875, -1.2509765625, -1.186767578125, -1.12255859375, -1.058349609375, -0.994140625, -0.929931640625, -0.86572265625, -0.801513671875, -0.7373046875, -0.673095703125, -0.60888671875, -0.544677734375, -0.48046875, -0.416259765625, -0.35205078125, -0.287841796875, -0.2236328125, -0.159423828125, -0.09521484375, -0.031005859375, 0.033203125, 0.097412109375, 0.16162109375, 0.225830078125, 0.2900390625, 0.354248046875, 0.41845703125, 0.482666015625, 0.546875, 0.611083984375, 0.67529296875, 0.739501953125, 0.8037109375, 0.867919921875, 0.93212890625, 0.996337890625, 1.060546875, 1.124755859375, 1.18896484375, 1.253173828125, 1.3173828125, 1.381591796875, 1.44580078125, 1.510009765625, 1.57421875, 1.638427734375, 1.70263671875, 1.766845703125, 1.8310546875, 1.895263671875, 1.95947265625, 2.023681640625, 2.087890625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 6.0, 9.0, 7.0, 15.0, 22.0, 30.0, 41.0, 58.0, 80.0, 92.0, 138.0, 171.0, 234.0, 343.0, 458.0, 590.0, 885.0, 1192.0, 1696.0, 2456.0, 3677.0, 6112.0, 11893.0, 34299.0, 182188.0, 599343.0, 144457.0, 29651.0, 10915.0, 5814.0, 3580.0, 2309.0, 1610.0, 1165.0, 802.0, 612.0, 426.0, 321.0, 235.0, 167.0, 127.0, 101.0, 72.0, 48.0, 32.0, 25.0, 16.0, 17.0, 6.0, 4.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.19921875, -5.98126220703125, -5.7633056640625, -5.54534912109375, -5.327392578125, -5.10943603515625, -4.8914794921875, -4.67352294921875, -4.45556640625, -4.23760986328125, -4.0196533203125, -3.80169677734375, -3.583740234375, -3.36578369140625, -3.1478271484375, -2.92987060546875, -2.7119140625, -2.49395751953125, -2.2760009765625, -2.05804443359375, -1.840087890625, -1.62213134765625, -1.4041748046875, -1.18621826171875, -0.96826171875, -0.75030517578125, -0.5323486328125, -0.31439208984375, -0.096435546875, 0.12152099609375, 0.3394775390625, 0.55743408203125, 0.775390625, 0.99334716796875, 1.2113037109375, 1.42926025390625, 1.647216796875, 1.86517333984375, 2.0831298828125, 2.30108642578125, 2.51904296875, 2.73699951171875, 2.9549560546875, 3.17291259765625, 3.390869140625, 3.60882568359375, 3.8267822265625, 4.04473876953125, 4.2626953125, 4.48065185546875, 4.6986083984375, 4.91656494140625, 5.134521484375, 5.35247802734375, 5.5704345703125, 5.78839111328125, 6.00634765625, 6.22430419921875, 6.4422607421875, 6.66021728515625, 6.878173828125, 7.09613037109375, 7.3140869140625, 7.53204345703125, 7.75]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 7.0, 5.0, 4.0, 13.0, 23.0, 44.0, 120.0, 194.0, 230.0, 163.0, 79.0, 33.0, 22.0, 12.0, 9.0, 4.0, 11.0, 2.0, 6.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000713348388671875, -0.0006926059722900391, -0.0006718635559082031, -0.0006511211395263672, -0.0006303787231445312, -0.0006096363067626953, -0.0005888938903808594, -0.0005681514739990234, -0.0005474090576171875, -0.0005266666412353516, -0.0005059242248535156, -0.0004851818084716797, -0.00046443939208984375, -0.0004436969757080078, -0.0004229545593261719, -0.00040221214294433594, -0.0003814697265625, -0.00036072731018066406, -0.0003399848937988281, -0.0003192424774169922, -0.00029850006103515625, -0.0002777576446533203, -0.0002570152282714844, -0.00023627281188964844, -0.0002155303955078125, -0.00019478797912597656, -0.00017404556274414062, -0.0001533031463623047, -0.00013256072998046875, -0.00011181831359863281, -9.107589721679688e-05, -7.033348083496094e-05, -4.9591064453125e-05, -2.8848648071289062e-05, -8.106231689453125e-06, 1.2636184692382812e-05, 3.337860107421875e-05, 5.412101745605469e-05, 7.486343383789062e-05, 9.560585021972656e-05, 0.0001163482666015625, 0.00013709068298339844, 0.00015783309936523438, 0.0001785755157470703, 0.00019931793212890625, 0.0002200603485107422, 0.00024080276489257812, 0.00026154518127441406, 0.00028228759765625, 0.00030303001403808594, 0.0003237724304199219, 0.0003445148468017578, 0.00036525726318359375, 0.0003859996795654297, 0.0004067420959472656, 0.00042748451232910156, 0.0004482269287109375, 0.00046896934509277344, 0.0004897117614746094, 0.0005104541778564453, 0.0005311965942382812, 0.0005519390106201172, 0.0005726814270019531, 0.0005934238433837891, 0.000614166259765625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 7.0, 25.0, 22.0, 26.0, 42.0, 44.0, 97.0, 111.0, 162.0, 207.0, 329.0, 457.0, 663.0, 988.0, 1400.0, 2080.0, 3215.0, 5023.0, 8563.0, 17220.0, 45539.0, 175271.0, 480203.0, 209659.0, 52946.0, 19323.0, 9295.0, 5328.0, 3354.0, 2164.0, 1437.0, 979.0, 712.0, 495.0, 333.0, 246.0, 181.0, 127.0, 75.0, 59.0, 36.0, 30.0, 29.0, 9.0, 12.0, 6.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.6484375, -4.496337890625, -4.34423828125, -4.192138671875, -4.0400390625, -3.887939453125, -3.73583984375, -3.583740234375, -3.431640625, -3.279541015625, -3.12744140625, -2.975341796875, -2.8232421875, -2.671142578125, -2.51904296875, -2.366943359375, -2.21484375, -2.062744140625, -1.91064453125, -1.758544921875, -1.6064453125, -1.454345703125, -1.30224609375, -1.150146484375, -0.998046875, -0.845947265625, -0.69384765625, -0.541748046875, -0.3896484375, -0.237548828125, -0.08544921875, 0.066650390625, 0.21875, 0.370849609375, 0.52294921875, 0.675048828125, 0.8271484375, 0.979248046875, 1.13134765625, 1.283447265625, 1.435546875, 1.587646484375, 1.73974609375, 1.891845703125, 2.0439453125, 2.196044921875, 2.34814453125, 2.500244140625, 2.65234375, 2.804443359375, 2.95654296875, 3.108642578125, 3.2607421875, 3.412841796875, 3.56494140625, 3.717041015625, 3.869140625, 4.021240234375, 4.17333984375, 4.325439453125, 4.4775390625, 4.629638671875, 4.78173828125, 4.933837890625, 5.0859375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 4.0, 7.0, 1.0, 12.0, 9.0, 26.0, 36.0, 44.0, 59.0, 82.0, 102.0, 142.0, 126.0, 103.0, 72.0, 51.0, 36.0, 17.0, 14.0, 10.0, 6.0, 5.0, 2.0, 2.0, 6.0, 5.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99853515625, -0.9623489379882812, -0.9261627197265625, -0.8899765014648438, -0.853790283203125, -0.8176040649414062, -0.7814178466796875, -0.7452316284179688, -0.70904541015625, -0.6728591918945312, -0.6366729736328125, -0.6004867553710938, -0.564300537109375, -0.5281143188476562, -0.4919281005859375, -0.45574188232421875, -0.4195556640625, -0.38336944580078125, -0.3471832275390625, -0.31099700927734375, -0.274810791015625, -0.23862457275390625, -0.2024383544921875, -0.16625213623046875, -0.13006591796875, -0.09387969970703125, -0.0576934814453125, -0.02150726318359375, 0.014678955078125, 0.05086517333984375, 0.0870513916015625, 0.12323760986328125, 0.159423828125, 0.19561004638671875, 0.2317962646484375, 0.26798248291015625, 0.304168701171875, 0.34035491943359375, 0.3765411376953125, 0.41272735595703125, 0.44891357421875, 0.48509979248046875, 0.5212860107421875, 0.5574722290039062, 0.593658447265625, 0.6298446655273438, 0.6660308837890625, 0.7022171020507812, 0.7384033203125, 0.7745895385742188, 0.8107757568359375, 0.8469619750976562, 0.883148193359375, 0.9193344116210938, 0.9555206298828125, 0.9917068481445312, 1.02789306640625, 1.0640792846679688, 1.1002655029296875, 1.1364517211914062, 1.172637939453125, 1.2088241577148438, 1.2450103759765625, 1.2811965942382812, 1.3173828125]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 6.0, 11.0, 8.0, 5.0, 12.0, 12.0, 19.0, 17.0, 26.0, 17.0, 30.0, 39.0, 50.0, 48.0, 71.0, 69.0, 72.0, 72.0, 60.0, 53.0, 41.0, 48.0, 30.0, 34.0, 26.0, 20.0, 16.0, 11.0, 14.0, 9.0, 9.0, 4.0, 2.0, 1.0, 6.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0], "bins": [-5.73045015335083, -5.577670574188232, -5.424890518188477, -5.272110939025879, -5.119331359863281, -4.966551780700684, -4.813771724700928, -4.66099214553833, -4.508212566375732, -4.355432987213135, -4.202652931213379, -4.049873352050781, -3.8970937728881836, -3.744313955307007, -3.59153413772583, -3.4387545585632324, -3.2859747409820557, -3.133194923400879, -2.9804153442382812, -2.8276355266571045, -2.674855947494507, -2.52207612991333, -2.3692965507507324, -2.2165167331695557, -2.063736915588379, -1.9109572172164917, -1.7581775188446045, -1.6053977012634277, -1.45261812210083, -1.2998383045196533, -1.1470586061477661, -0.9942789077758789, -0.8414993286132812, -0.688719630241394, -0.5359399318695068, -0.38316017389297485, -0.23038047552108765, -0.07760077714920044, 0.07517898082733154, 0.22795867919921875, 0.38073837757110596, 0.5335180759429932, 0.6862977743148804, 0.8390775322914124, 0.9918572306632996, 1.144636869430542, 1.2974166870117188, 1.450196385383606, 1.6029760837554932, 1.7557557821273804, 1.9085354804992676, 2.0613152980804443, 2.214094877243042, 2.3668746948242188, 2.5196542739868164, 2.672434091567993, 2.82521390914917, 2.9779937267303467, 3.1307733058929443, 3.283553123474121, 3.4363327026367188, 3.5891125202178955, 3.7418923377990723, 3.89467191696167, 4.047451496124268]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 5.0, 8.0, 7.0, 14.0, 14.0, 29.0, 18.0, 10.0, 24.0, 27.0, 25.0, 26.0, 33.0, 43.0, 36.0, 42.0, 40.0, 51.0, 35.0, 37.0, 40.0, 40.0, 40.0, 38.0, 43.0, 35.0, 32.0, 28.0, 28.0, 21.0, 20.0, 18.0, 17.0, 8.0, 15.0, 10.0, 8.0, 7.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.605104923248291, -2.5159752368927, -2.4268453121185303, -2.3377156257629395, -2.2485859394073486, -2.159456253051758, -2.070326328277588, -1.981196641921997, -1.8920668363571167, -1.8029370307922363, -1.7138073444366455, -1.6246775388717651, -1.5355477333068848, -1.446418046951294, -1.3572882413864136, -1.2681584358215332, -1.1790287494659424, -1.089898943901062, -1.0007692575454712, -0.9116394519805908, -0.8225097060203552, -0.7333799600601196, -0.6442501544952393, -0.5551204085350037, -0.46599066257476807, -0.37686091661453247, -0.2877311408519745, -0.1986013650894165, -0.10947161912918091, -0.020341873168945312, 0.06878793239593506, 0.15791767835617065, 0.24704766273498535, 0.33617740869522095, 0.42530718445777893, 0.5144369602203369, 0.6035667061805725, 0.6926964521408081, 0.7818262577056885, 0.8709560036659241, 0.9600857496261597, 1.04921555519104, 1.1383452415466309, 1.2274750471115112, 1.3166048526763916, 1.4057345390319824, 1.4948643445968628, 1.5839941501617432, 1.673123836517334, 1.7622536420822144, 1.8513833284378052, 1.9405131340026855, 2.0296428203582764, 2.118772506713867, 2.207902431488037, 2.297032117843628, 2.3861618041992188, 2.4752914905548096, 2.5644214153289795, 2.6535511016845703, 2.742680788040161, 2.831810474395752, 2.920940399169922, 3.0100700855255127, 3.0992000102996826]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 4.0, 3.0, 8.0, 15.0, 20.0, 26.0, 37.0, 57.0, 81.0, 108.0, 170.0, 226.0, 345.0, 524.0, 819.0, 1251.0, 2077.0, 3552.0, 6018.0, 10991.0, 21512.0, 47169.0, 118820.0, 367913.0, 1174520.0, 1550455.0, 580295.0, 174880.0, 66219.0, 30141.0, 15215.0, 8276.0, 4736.0, 2836.0, 1802.0, 1097.0, 720.0, 399.0, 294.0, 214.0, 152.0, 92.0, 65.0, 45.0, 24.0, 26.0, 7.0, 10.0, 7.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.58203125, -6.38372802734375, -6.1854248046875, -5.98712158203125, -5.788818359375, -5.59051513671875, -5.3922119140625, -5.19390869140625, -4.99560546875, -4.79730224609375, -4.5989990234375, -4.40069580078125, -4.202392578125, -4.00408935546875, -3.8057861328125, -3.60748291015625, -3.4091796875, -3.21087646484375, -3.0125732421875, -2.81427001953125, -2.615966796875, -2.41766357421875, -2.2193603515625, -2.02105712890625, -1.82275390625, -1.62445068359375, -1.4261474609375, -1.22784423828125, -1.029541015625, -0.83123779296875, -0.6329345703125, -0.43463134765625, -0.236328125, -0.03802490234375, 0.1602783203125, 0.35858154296875, 0.556884765625, 0.75518798828125, 0.9534912109375, 1.15179443359375, 1.35009765625, 1.54840087890625, 1.7467041015625, 1.94500732421875, 2.143310546875, 2.34161376953125, 2.5399169921875, 2.73822021484375, 2.9365234375, 3.13482666015625, 3.3331298828125, 3.53143310546875, 3.729736328125, 3.92803955078125, 4.1263427734375, 4.32464599609375, 4.52294921875, 4.72125244140625, 4.9195556640625, 5.11785888671875, 5.316162109375, 5.51446533203125, 5.7127685546875, 5.91107177734375, 6.109375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 10.0, 3.0, 3.0, 6.0, 8.0, 11.0, 10.0, 19.0, 15.0, 22.0, 23.0, 20.0, 22.0, 24.0, 37.0, 29.0, 40.0, 34.0, 25.0, 40.0, 45.0, 39.0, 51.0, 37.0, 42.0, 28.0, 35.0, 25.0, 30.0, 28.0, 36.0, 26.0, 30.0, 22.0, 25.0, 19.0, 13.0, 14.0, 7.0, 11.0, 10.0, 3.0, 4.0, 3.0, 5.0, 3.0, 9.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8583984375, -1.7924957275390625, -1.726593017578125, -1.6606903076171875, -1.59478759765625, -1.5288848876953125, -1.462982177734375, -1.3970794677734375, -1.3311767578125, -1.2652740478515625, -1.199371337890625, -1.1334686279296875, -1.06756591796875, -1.0016632080078125, -0.935760498046875, -0.8698577880859375, -0.803955078125, -0.7380523681640625, -0.672149658203125, -0.6062469482421875, -0.54034423828125, -0.4744415283203125, -0.408538818359375, -0.3426361083984375, -0.2767333984375, -0.2108306884765625, -0.144927978515625, -0.0790252685546875, -0.01312255859375, 0.0527801513671875, 0.118682861328125, 0.1845855712890625, 0.25048828125, 0.3163909912109375, 0.382293701171875, 0.4481964111328125, 0.51409912109375, 0.5800018310546875, 0.645904541015625, 0.7118072509765625, 0.7777099609375, 0.8436126708984375, 0.909515380859375, 0.9754180908203125, 1.04132080078125, 1.1072235107421875, 1.173126220703125, 1.2390289306640625, 1.304931640625, 1.3708343505859375, 1.436737060546875, 1.5026397705078125, 1.56854248046875, 1.6344451904296875, 1.700347900390625, 1.7662506103515625, 1.8321533203125, 1.8980560302734375, 1.963958740234375, 2.0298614501953125, 2.09576416015625, 2.1616668701171875, 2.227569580078125, 2.2934722900390625, 2.359375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 0.0, 15.0, 8.0, 11.0, 13.0, 33.0, 49.0, 69.0, 92.0, 155.0, 230.0, 357.0, 579.0, 904.0, 1529.0, 2548.0, 4605.0, 8334.0, 16477.0, 34899.0, 82963.0, 231175.0, 763806.0, 1769328.0, 855195.0, 254962.0, 90093.0, 37323.0, 17622.0, 8889.0, 4821.0, 2837.0, 1657.0, 979.0, 585.0, 374.0, 258.0, 158.0, 108.0, 82.0, 59.0, 31.0, 30.0, 20.0, 5.0, 7.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.140625, -7.89794921875, -7.6552734375, -7.41259765625, -7.169921875, -6.92724609375, -6.6845703125, -6.44189453125, -6.19921875, -5.95654296875, -5.7138671875, -5.47119140625, -5.228515625, -4.98583984375, -4.7431640625, -4.50048828125, -4.2578125, -4.01513671875, -3.7724609375, -3.52978515625, -3.287109375, -3.04443359375, -2.8017578125, -2.55908203125, -2.31640625, -2.07373046875, -1.8310546875, -1.58837890625, -1.345703125, -1.10302734375, -0.8603515625, -0.61767578125, -0.375, -0.13232421875, 0.1103515625, 0.35302734375, 0.595703125, 0.83837890625, 1.0810546875, 1.32373046875, 1.56640625, 1.80908203125, 2.0517578125, 2.29443359375, 2.537109375, 2.77978515625, 3.0224609375, 3.26513671875, 3.5078125, 3.75048828125, 3.9931640625, 4.23583984375, 4.478515625, 4.72119140625, 4.9638671875, 5.20654296875, 5.44921875, 5.69189453125, 5.9345703125, 6.17724609375, 6.419921875, 6.66259765625, 6.9052734375, 7.14794921875, 7.390625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 8.0, 8.0, 11.0, 12.0, 6.0, 20.0, 21.0, 32.0, 36.0, 42.0, 52.0, 83.0, 109.0, 151.0, 173.0, 233.0, 316.0, 358.0, 388.0, 359.0, 353.0, 299.0, 241.0, 197.0, 131.0, 122.0, 75.0, 65.0, 51.0, 33.0, 22.0, 18.0, 12.0, 17.0, 6.0, 5.0, 4.0, 5.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-2.232421875, -2.17645263671875, -2.1204833984375, -2.06451416015625, -2.008544921875, -1.95257568359375, -1.8966064453125, -1.84063720703125, -1.78466796875, -1.72869873046875, -1.6727294921875, -1.61676025390625, -1.560791015625, -1.50482177734375, -1.4488525390625, -1.39288330078125, -1.3369140625, -1.28094482421875, -1.2249755859375, -1.16900634765625, -1.113037109375, -1.05706787109375, -1.0010986328125, -0.94512939453125, -0.88916015625, -0.83319091796875, -0.7772216796875, -0.72125244140625, -0.665283203125, -0.60931396484375, -0.5533447265625, -0.49737548828125, -0.44140625, -0.38543701171875, -0.3294677734375, -0.27349853515625, -0.217529296875, -0.16156005859375, -0.1055908203125, -0.04962158203125, 0.00634765625, 0.06231689453125, 0.1182861328125, 0.17425537109375, 0.230224609375, 0.28619384765625, 0.3421630859375, 0.39813232421875, 0.4541015625, 0.51007080078125, 0.5660400390625, 0.62200927734375, 0.677978515625, 0.73394775390625, 0.7899169921875, 0.84588623046875, 0.90185546875, 0.95782470703125, 1.0137939453125, 1.06976318359375, 1.125732421875, 1.18170166015625, 1.2376708984375, 1.29364013671875, 1.349609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 7.0, 6.0, 5.0, 7.0, 6.0, 8.0, 5.0, 11.0, 14.0, 25.0, 14.0, 20.0, 31.0, 33.0, 52.0, 54.0, 60.0, 71.0, 77.0, 86.0, 52.0, 62.0, 53.0, 45.0, 42.0, 38.0, 21.0, 14.0, 18.0, 13.0, 6.0, 6.0, 6.0, 6.0, 7.0, 7.0, 5.0, 3.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.286518096923828, -5.108894348144531, -4.931271076202393, -4.753647804260254, -4.576024055480957, -4.39840030670166, -4.2207770347595215, -4.043153762817383, -3.865530014038086, -3.687906503677368, -3.5102829933166504, -3.3326594829559326, -3.155035972595215, -2.977412462234497, -2.7997889518737793, -2.6221654415130615, -2.4445419311523438, -2.266918420791626, -2.089294910430908, -1.9116714000701904, -1.7340478897094727, -1.5564243793487549, -1.378800868988037, -1.2011773586273193, -1.0235538482666016, -0.8459303379058838, -0.668306827545166, -0.49068331718444824, -0.31305980682373047, -0.1354362964630127, 0.04218721389770508, 0.21981072425842285, 0.3974342346191406, 0.5750577449798584, 0.7526812553405762, 0.930304765701294, 1.1079282760620117, 1.2855517864227295, 1.4631752967834473, 1.640798807144165, 1.8184223175048828, 1.9960458278656006, 2.1736693382263184, 2.351292848587036, 2.528916358947754, 2.7065398693084717, 2.8841633796691895, 3.0617868900299072, 3.239410400390625, 3.4170339107513428, 3.5946574211120605, 3.7722809314727783, 3.949904441833496, 4.127528190612793, 4.305151462554932, 4.48277473449707, 4.660398483276367, 4.838022232055664, 5.015645503997803, 5.193268775939941, 5.370892524719238, 5.548516273498535, 5.726139545440674, 5.9037628173828125, 6.081386566162109]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 6.0, 9.0, 4.0, 11.0, 12.0, 11.0, 13.0, 14.0, 18.0, 23.0, 13.0, 27.0, 25.0, 25.0, 33.0, 37.0, 34.0, 30.0, 30.0, 34.0, 46.0, 41.0, 44.0, 46.0, 38.0, 37.0, 31.0, 30.0, 36.0, 23.0, 31.0, 29.0, 22.0, 25.0, 9.0, 12.0, 13.0, 15.0, 11.0, 8.0, 6.0, 9.0, 11.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4830620288848877, -2.3990890979766846, -2.3151161670684814, -2.231142997741699, -2.147170066833496, -2.063197135925293, -1.9792242050170898, -1.8952511548995972, -1.8112781047821045, -1.7273051738739014, -1.6433321237564087, -1.5593591928482056, -1.475386142730713, -1.3914132118225098, -1.3074402809143066, -1.223467230796814, -1.1394942998886108, -1.0555213689804077, -0.971548318862915, -0.8875753879547119, -0.8036023378372192, -0.7196294069290161, -0.6356564164161682, -0.5516834259033203, -0.4677104353904724, -0.3837374448776245, -0.2997644543647766, -0.2157914936542511, -0.1318185031414032, -0.0478455126285553, 0.036127448081970215, 0.12010043859481812, 0.20407342910766602, 0.2880464196205139, 0.3720194101333618, 0.45599237084388733, 0.5399653911590576, 0.6239383220672607, 0.7079113125801086, 0.7918843030929565, 0.8758572936058044, 0.9598302841186523, 1.0438032150268555, 1.1277762651443481, 1.2117491960525513, 1.295722246170044, 1.379695177078247, 1.4636681079864502, 1.5476411581039429, 1.631614089012146, 1.7155871391296387, 1.7995600700378418, 1.8835331201553345, 1.9675060510635376, 2.0514791011810303, 2.1354520320892334, 2.2194249629974365, 2.3033978939056396, 2.3873708248138428, 2.471343994140625, 2.555316925048828, 2.6392898559570312, 2.7232627868652344, 2.8072357177734375, 2.8912088871002197]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 3.0, 9.0, 10.0, 14.0, 12.0, 18.0, 24.0, 37.0, 49.0, 60.0, 94.0, 127.0, 169.0, 231.0, 358.0, 475.0, 732.0, 1116.0, 1905.0, 3258.0, 5963.0, 11664.0, 24401.0, 56747.0, 138646.0, 288283.0, 279849.0, 131826.0, 53590.0, 23490.0, 11302.0, 5631.0, 3185.0, 1815.0, 1144.0, 672.0, 438.0, 338.0, 248.0, 164.0, 138.0, 84.0, 64.0, 57.0, 37.0, 25.0, 14.0, 9.0, 8.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.50390625, -3.386993408203125, -3.27008056640625, -3.153167724609375, -3.0362548828125, -2.919342041015625, -2.80242919921875, -2.685516357421875, -2.568603515625, -2.451690673828125, -2.33477783203125, -2.217864990234375, -2.1009521484375, -1.984039306640625, -1.86712646484375, -1.750213623046875, -1.63330078125, -1.516387939453125, -1.39947509765625, -1.282562255859375, -1.1656494140625, -1.048736572265625, -0.93182373046875, -0.814910888671875, -0.697998046875, -0.581085205078125, -0.46417236328125, -0.347259521484375, -0.2303466796875, -0.113433837890625, 0.00347900390625, 0.120391845703125, 0.2373046875, 0.354217529296875, 0.47113037109375, 0.588043212890625, 0.7049560546875, 0.821868896484375, 0.93878173828125, 1.055694580078125, 1.172607421875, 1.289520263671875, 1.40643310546875, 1.523345947265625, 1.6402587890625, 1.757171630859375, 1.87408447265625, 1.990997314453125, 2.10791015625, 2.224822998046875, 2.34173583984375, 2.458648681640625, 2.5755615234375, 2.692474365234375, 2.80938720703125, 2.926300048828125, 3.043212890625, 3.160125732421875, 3.27703857421875, 3.393951416015625, 3.5108642578125, 3.627777099609375, 3.74468994140625, 3.861602783203125, 3.978515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 1.0, 4.0, 6.0, 6.0, 10.0, 8.0, 11.0, 13.0, 11.0, 10.0, 19.0, 20.0, 16.0, 25.0, 22.0, 32.0, 34.0, 34.0, 26.0, 39.0, 36.0, 48.0, 31.0, 30.0, 49.0, 36.0, 40.0, 43.0, 42.0, 40.0, 28.0, 29.0, 30.0, 15.0, 22.0, 17.0, 14.0, 13.0, 12.0, 14.0, 10.0, 14.0, 11.0, 8.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.931640625, -2.8360595703125, -2.740478515625, -2.6448974609375, -2.54931640625, -2.4537353515625, -2.358154296875, -2.2625732421875, -2.1669921875, -2.0714111328125, -1.975830078125, -1.8802490234375, -1.78466796875, -1.6890869140625, -1.593505859375, -1.4979248046875, -1.40234375, -1.3067626953125, -1.211181640625, -1.1156005859375, -1.02001953125, -0.9244384765625, -0.828857421875, -0.7332763671875, -0.6376953125, -0.5421142578125, -0.446533203125, -0.3509521484375, -0.25537109375, -0.1597900390625, -0.064208984375, 0.0313720703125, 0.126953125, 0.2225341796875, 0.318115234375, 0.4136962890625, 0.50927734375, 0.6048583984375, 0.700439453125, 0.7960205078125, 0.8916015625, 0.9871826171875, 1.082763671875, 1.1783447265625, 1.27392578125, 1.3695068359375, 1.465087890625, 1.5606689453125, 1.65625, 1.7518310546875, 1.847412109375, 1.9429931640625, 2.03857421875, 2.1341552734375, 2.229736328125, 2.3253173828125, 2.4208984375, 2.5164794921875, 2.612060546875, 2.7076416015625, 2.80322265625, 2.8988037109375, 2.994384765625, 3.0899658203125, 3.185546875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 10.0, 7.0, 12.0, 14.0, 40.0, 41.0, 43.0, 50.0, 89.0, 117.0, 167.0, 258.0, 362.0, 592.0, 1214.0, 3702.0, 17594.0, 168468.0, 738297.0, 100082.0, 11926.0, 2802.0, 1028.0, 512.0, 309.0, 222.0, 158.0, 124.0, 81.0, 61.0, 47.0, 37.0, 18.0, 15.0, 10.0, 9.0, 5.0, 6.0, 8.0, 4.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.0234375, -12.6214599609375, -12.219482421875, -11.8175048828125, -11.41552734375, -11.0135498046875, -10.611572265625, -10.2095947265625, -9.8076171875, -9.4056396484375, -9.003662109375, -8.6016845703125, -8.19970703125, -7.7977294921875, -7.395751953125, -6.9937744140625, -6.591796875, -6.1898193359375, -5.787841796875, -5.3858642578125, -4.98388671875, -4.5819091796875, -4.179931640625, -3.7779541015625, -3.3759765625, -2.9739990234375, -2.572021484375, -2.1700439453125, -1.76806640625, -1.3660888671875, -0.964111328125, -0.5621337890625, -0.16015625, 0.2418212890625, 0.643798828125, 1.0457763671875, 1.44775390625, 1.8497314453125, 2.251708984375, 2.6536865234375, 3.0556640625, 3.4576416015625, 3.859619140625, 4.2615966796875, 4.66357421875, 5.0655517578125, 5.467529296875, 5.8695068359375, 6.271484375, 6.6734619140625, 7.075439453125, 7.4774169921875, 7.87939453125, 8.2813720703125, 8.683349609375, 9.0853271484375, 9.4873046875, 9.8892822265625, 10.291259765625, 10.6932373046875, 11.09521484375, 11.4971923828125, 11.899169921875, 12.3011474609375, 12.703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 7.0, 4.0, 6.0, 19.0, 12.0, 14.0, 17.0, 19.0, 20.0, 33.0, 32.0, 30.0, 40.0, 36.0, 43.0, 53.0, 42.0, 49.0, 54.0, 49.0, 44.0, 37.0, 36.0, 43.0, 29.0, 26.0, 30.0, 35.0, 29.0, 23.0, 16.0, 15.0, 13.0, 9.0, 4.0, 12.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.04296875, -1.97772216796875, -1.9124755859375, -1.84722900390625, -1.781982421875, -1.71673583984375, -1.6514892578125, -1.58624267578125, -1.52099609375, -1.45574951171875, -1.3905029296875, -1.32525634765625, -1.260009765625, -1.19476318359375, -1.1295166015625, -1.06427001953125, -0.9990234375, -0.93377685546875, -0.8685302734375, -0.80328369140625, -0.738037109375, -0.67279052734375, -0.6075439453125, -0.54229736328125, -0.47705078125, -0.41180419921875, -0.3465576171875, -0.28131103515625, -0.216064453125, -0.15081787109375, -0.0855712890625, -0.02032470703125, 0.044921875, 0.11016845703125, 0.1754150390625, 0.24066162109375, 0.305908203125, 0.37115478515625, 0.4364013671875, 0.50164794921875, 0.56689453125, 0.63214111328125, 0.6973876953125, 0.76263427734375, 0.827880859375, 0.89312744140625, 0.9583740234375, 1.02362060546875, 1.0888671875, 1.15411376953125, 1.2193603515625, 1.28460693359375, 1.349853515625, 1.41510009765625, 1.4803466796875, 1.54559326171875, 1.61083984375, 1.67608642578125, 1.7413330078125, 1.80657958984375, 1.871826171875, 1.93707275390625, 2.0023193359375, 2.06756591796875, 2.1328125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 8.0, 11.0, 21.0, 22.0, 31.0, 44.0, 46.0, 58.0, 73.0, 88.0, 122.0, 163.0, 231.0, 307.0, 425.0, 652.0, 967.0, 1953.0, 4611.0, 17348.0, 119472.0, 684660.0, 182133.0, 23631.0, 5780.0, 2100.0, 1094.0, 649.0, 483.0, 327.0, 246.0, 179.0, 136.0, 114.0, 75.0, 65.0, 59.0, 31.0, 34.0, 20.0, 22.0, 15.0, 12.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.58203125, -4.4322509765625, -4.282470703125, -4.1326904296875, -3.98291015625, -3.8331298828125, -3.683349609375, -3.5335693359375, -3.3837890625, -3.2340087890625, -3.084228515625, -2.9344482421875, -2.78466796875, -2.6348876953125, -2.485107421875, -2.3353271484375, -2.185546875, -2.0357666015625, -1.885986328125, -1.7362060546875, -1.58642578125, -1.4366455078125, -1.286865234375, -1.1370849609375, -0.9873046875, -0.8375244140625, -0.687744140625, -0.5379638671875, -0.38818359375, -0.2384033203125, -0.088623046875, 0.0611572265625, 0.2109375, 0.3607177734375, 0.510498046875, 0.6602783203125, 0.81005859375, 0.9598388671875, 1.109619140625, 1.2593994140625, 1.4091796875, 1.5589599609375, 1.708740234375, 1.8585205078125, 2.00830078125, 2.1580810546875, 2.307861328125, 2.4576416015625, 2.607421875, 2.7572021484375, 2.906982421875, 3.0567626953125, 3.20654296875, 3.3563232421875, 3.506103515625, 3.6558837890625, 3.8056640625, 3.9554443359375, 4.105224609375, 4.2550048828125, 4.40478515625, 4.5545654296875, 4.704345703125, 4.8541259765625, 5.00390625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 8.0, 7.0, 20.0, 43.0, 127.0, 215.0, 252.0, 152.0, 80.0, 42.0, 15.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0003457069396972656, -0.0003379005938768387, -0.00033009424805641174, -0.0003222879022359848, -0.00031448155641555786, -0.0003066752105951309, -0.000298868864774704, -0.00029106251895427704, -0.0002832561731338501, -0.00027544982731342316, -0.0002676434814929962, -0.0002598371356725693, -0.00025203078985214233, -0.0002442244440317154, -0.00023641809821128845, -0.0002286117523908615, -0.00022080540657043457, -0.00021299906075000763, -0.0002051927149295807, -0.00019738636910915375, -0.0001895800232887268, -0.00018177367746829987, -0.00017396733164787292, -0.00016616098582744598, -0.00015835464000701904, -0.0001505482941865921, -0.00014274194836616516, -0.00013493560254573822, -0.00012712925672531128, -0.00011932291090488434, -0.0001115165650844574, -0.00010371021926403046, -9.590387344360352e-05, -8.809752762317657e-05, -8.029118180274963e-05, -7.248483598232269e-05, -6.467849016189575e-05, -5.687214434146881e-05, -4.906579852104187e-05, -4.125945270061493e-05, -3.345310688018799e-05, -2.5646761059761047e-05, -1.7840415239334106e-05, -1.0034069418907166e-05, -2.2277235984802246e-06, 5.578622221946716e-06, 1.3384968042373657e-05, 2.1191313862800598e-05, 2.899765968322754e-05, 3.680400550365448e-05, 4.461035132408142e-05, 5.241669714450836e-05, 6.02230429649353e-05, 6.802938878536224e-05, 7.583573460578918e-05, 8.364208042621613e-05, 9.144842624664307e-05, 9.925477206707001e-05, 0.00010706111788749695, 0.00011486746370792389, 0.00012267380952835083, 0.00013048015534877777, 0.0001382865011692047, 0.00014609284698963165, 0.0001538991928100586]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 10.0, 4.0, 7.0, 16.0, 14.0, 20.0, 17.0, 41.0, 42.0, 49.0, 73.0, 96.0, 126.0, 176.0, 244.0, 295.0, 379.0, 502.0, 686.0, 990.0, 1451.0, 2395.0, 4420.0, 11119.0, 42361.0, 227320.0, 529209.0, 173113.0, 33147.0, 9207.0, 3821.0, 2145.0, 1412.0, 974.0, 695.0, 499.0, 369.0, 259.0, 182.0, 165.0, 140.0, 107.0, 68.0, 51.0, 20.0, 26.0, 21.0, 20.0, 11.0, 12.0, 9.0, 6.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0], "bins": [-3.109375, -3.010406494140625, -2.91143798828125, -2.812469482421875, -2.7135009765625, -2.614532470703125, -2.51556396484375, -2.416595458984375, -2.317626953125, -2.218658447265625, -2.11968994140625, -2.020721435546875, -1.9217529296875, -1.822784423828125, -1.72381591796875, -1.624847412109375, -1.52587890625, -1.426910400390625, -1.32794189453125, -1.228973388671875, -1.1300048828125, -1.031036376953125, -0.93206787109375, -0.833099365234375, -0.734130859375, -0.635162353515625, -0.53619384765625, -0.437225341796875, -0.3382568359375, -0.239288330078125, -0.14031982421875, -0.041351318359375, 0.0576171875, 0.156585693359375, 0.25555419921875, 0.354522705078125, 0.4534912109375, 0.552459716796875, 0.65142822265625, 0.750396728515625, 0.849365234375, 0.948333740234375, 1.04730224609375, 1.146270751953125, 1.2452392578125, 1.344207763671875, 1.44317626953125, 1.542144775390625, 1.64111328125, 1.740081787109375, 1.83905029296875, 1.938018798828125, 2.0369873046875, 2.135955810546875, 2.23492431640625, 2.333892822265625, 2.432861328125, 2.531829833984375, 2.63079833984375, 2.729766845703125, 2.8287353515625, 2.927703857421875, 3.02667236328125, 3.125640869140625, 3.224609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 10.0, 14.0, 32.0, 53.0, 88.0, 149.0, 177.0, 169.0, 116.0, 86.0, 34.0, 25.0, 9.0, 11.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7822265625, -0.7559356689453125, -0.729644775390625, -0.7033538818359375, -0.67706298828125, -0.6507720947265625, -0.624481201171875, -0.5981903076171875, -0.5718994140625, -0.5456085205078125, -0.519317626953125, -0.4930267333984375, -0.46673583984375, -0.4404449462890625, -0.414154052734375, -0.3878631591796875, -0.361572265625, -0.3352813720703125, -0.308990478515625, -0.2826995849609375, -0.25640869140625, -0.2301177978515625, -0.203826904296875, -0.1775360107421875, -0.1512451171875, -0.1249542236328125, -0.098663330078125, -0.0723724365234375, -0.04608154296875, -0.0197906494140625, 0.006500244140625, 0.0327911376953125, 0.05908203125, 0.0853729248046875, 0.111663818359375, 0.1379547119140625, 0.16424560546875, 0.1905364990234375, 0.216827392578125, 0.2431182861328125, 0.2694091796875, 0.2957000732421875, 0.321990966796875, 0.3482818603515625, 0.37457275390625, 0.4008636474609375, 0.427154541015625, 0.4534454345703125, 0.479736328125, 0.5060272216796875, 0.532318115234375, 0.5586090087890625, 0.58489990234375, 0.6111907958984375, 0.637481689453125, 0.6637725830078125, 0.6900634765625, 0.7163543701171875, 0.742645263671875, 0.7689361572265625, 0.79522705078125, 0.8215179443359375, 0.847808837890625, 0.8740997314453125, 0.900390625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 7.0, 7.0, 9.0, 11.0, 13.0, 18.0, 12.0, 19.0, 32.0, 39.0, 38.0, 62.0, 55.0, 73.0, 86.0, 85.0, 57.0, 70.0, 67.0, 42.0, 35.0, 37.0, 20.0, 12.0, 20.0, 10.0, 10.0, 9.0, 5.0, 3.0, 7.0, 5.0, 4.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.620943069458008, -5.432906150817871, -5.244869232177734, -5.056832313537598, -4.868794918060303, -4.680757999420166, -4.492721080780029, -4.304684162139893, -4.116646766662598, -3.928609848022461, -3.740572690963745, -3.5525357723236084, -3.3644986152648926, -3.176461696624756, -2.988424777984619, -2.8003878593444824, -2.6123509407043457, -2.424314022064209, -2.236276865005493, -2.0482399463653564, -1.8602029085159302, -1.672165870666504, -1.4841289520263672, -1.296091914176941, -1.1080548763275146, -0.9200178384780884, -0.7319808602333069, -0.5439438819885254, -0.3559068441390991, -0.16786980628967285, 0.020167112350463867, 0.20820415019989014, 0.3962407112121582, 0.5842777490615845, 0.772314727306366, 0.9603517055511475, 1.1483887434005737, 1.33642578125, 1.5244626998901367, 1.712499737739563, 1.9005367755889893, 2.088573694229126, 2.276610851287842, 2.4646477699279785, 2.6526846885681152, 2.840721845626831, 3.0287587642669678, 3.2167959213256836, 3.4048328399658203, 3.592869758605957, 3.780906915664673, 3.9689438343048096, 4.156980991363525, 4.345017910003662, 4.533054828643799, 4.7210917472839355, 4.9091291427612305, 5.097166061401367, 5.285202980041504, 5.473239898681641, 5.6612772941589355, 5.849314212799072, 6.037351131439209, 6.225388050079346, 6.413424968719482]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 7.0, 15.0, 7.0, 12.0, 16.0, 17.0, 20.0, 19.0, 18.0, 31.0, 25.0, 29.0, 26.0, 35.0, 31.0, 33.0, 34.0, 42.0, 40.0, 35.0, 47.0, 40.0, 36.0, 39.0, 29.0, 30.0, 35.0, 25.0, 31.0, 25.0, 28.0, 12.0, 15.0, 11.0, 11.0, 9.0, 17.0, 6.0, 3.0, 11.0, 6.0, 8.0, 8.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.442962169647217, -2.36234974861145, -2.2817375659942627, -2.201125144958496, -2.1205127239227295, -2.039900302886963, -1.9592881202697754, -1.8786756992340088, -1.7980633974075317, -1.7174510955810547, -1.636838674545288, -1.556226372718811, -1.475614070892334, -1.3950016498565674, -1.3143893480300903, -1.2337770462036133, -1.1531646251678467, -1.0725523233413696, -0.991939902305603, -0.911327600479126, -0.8307152390480042, -0.7501028776168823, -0.6694905757904053, -0.5888782143592834, -0.5082658529281616, -0.4276534914970398, -0.34704115986824036, -0.2664288282394409, -0.1858164668083191, -0.10520410537719727, -0.024591773748397827, 0.05602055788040161, 0.13663268089294434, 0.21724502742290497, 0.2978573739528656, 0.37846970558166504, 0.45908206701278687, 0.5396944284439087, 0.6203067302703857, 0.7009190917015076, 0.7815314531326294, 0.8621438145637512, 0.942756175994873, 1.02336847782135, 1.1039807796478271, 1.1845932006835938, 1.2652055025100708, 1.3458178043365479, 1.4264302253723145, 1.5070425271987915, 1.587654948234558, 1.6682672500610352, 1.7488796710968018, 1.8294919729232788, 1.9101042747497559, 1.9907166957855225, 2.071329116821289, 2.1519415378570557, 2.232553720474243, 2.3131661415100098, 2.3937785625457764, 2.474390983581543, 2.5550031661987305, 2.635615587234497, 2.7162277698516846]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 8.0, 10.0, 13.0, 16.0, 29.0, 29.0, 52.0, 51.0, 95.0, 145.0, 210.0, 324.0, 524.0, 817.0, 1236.0, 2090.0, 3567.0, 6426.0, 12313.0, 24309.0, 51174.0, 108314.0, 204311.0, 261583.0, 185774.0, 94408.0, 44624.0, 21270.0, 10620.0, 5939.0, 3228.0, 1845.0, 1210.0, 660.0, 441.0, 277.0, 188.0, 151.0, 76.0, 59.0, 43.0, 38.0, 15.0, 22.0, 7.0, 5.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0], "bins": [-6.796875, -6.60491943359375, -6.4129638671875, -6.22100830078125, -6.029052734375, -5.83709716796875, -5.6451416015625, -5.45318603515625, -5.26123046875, -5.06927490234375, -4.8773193359375, -4.68536376953125, -4.493408203125, -4.30145263671875, -4.1094970703125, -3.91754150390625, -3.7255859375, -3.53363037109375, -3.3416748046875, -3.14971923828125, -2.957763671875, -2.76580810546875, -2.5738525390625, -2.38189697265625, -2.18994140625, -1.99798583984375, -1.8060302734375, -1.61407470703125, -1.422119140625, -1.23016357421875, -1.0382080078125, -0.84625244140625, -0.654296875, -0.46234130859375, -0.2703857421875, -0.07843017578125, 0.113525390625, 0.30548095703125, 0.4974365234375, 0.68939208984375, 0.88134765625, 1.07330322265625, 1.2652587890625, 1.45721435546875, 1.649169921875, 1.84112548828125, 2.0330810546875, 2.22503662109375, 2.4169921875, 2.60894775390625, 2.8009033203125, 2.99285888671875, 3.184814453125, 3.37677001953125, 3.5687255859375, 3.76068115234375, 3.95263671875, 4.14459228515625, 4.3365478515625, 4.52850341796875, 4.720458984375, 4.91241455078125, 5.1043701171875, 5.29632568359375, 5.48828125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 7.0, 14.0, 14.0, 13.0, 20.0, 22.0, 10.0, 19.0, 23.0, 23.0, 33.0, 27.0, 28.0, 35.0, 34.0, 43.0, 44.0, 43.0, 45.0, 37.0, 35.0, 37.0, 43.0, 31.0, 33.0, 34.0, 34.0, 33.0, 21.0, 20.0, 20.0, 14.0, 16.0, 17.0, 12.0, 9.0, 7.0, 10.0, 8.0, 10.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.88671875, -2.7872314453125, -2.687744140625, -2.5882568359375, -2.48876953125, -2.3892822265625, -2.289794921875, -2.1903076171875, -2.0908203125, -1.9913330078125, -1.891845703125, -1.7923583984375, -1.69287109375, -1.5933837890625, -1.493896484375, -1.3944091796875, -1.294921875, -1.1954345703125, -1.095947265625, -0.9964599609375, -0.89697265625, -0.7974853515625, -0.697998046875, -0.5985107421875, -0.4990234375, -0.3995361328125, -0.300048828125, -0.2005615234375, -0.10107421875, -0.0015869140625, 0.097900390625, 0.1973876953125, 0.296875, 0.3963623046875, 0.495849609375, 0.5953369140625, 0.69482421875, 0.7943115234375, 0.893798828125, 0.9932861328125, 1.0927734375, 1.1922607421875, 1.291748046875, 1.3912353515625, 1.49072265625, 1.5902099609375, 1.689697265625, 1.7891845703125, 1.888671875, 1.9881591796875, 2.087646484375, 2.1871337890625, 2.28662109375, 2.3861083984375, 2.485595703125, 2.5850830078125, 2.6845703125, 2.7840576171875, 2.883544921875, 2.9830322265625, 3.08251953125, 3.1820068359375, 3.281494140625, 3.3809814453125, 3.48046875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 13.0, 14.0, 28.0, 28.0, 47.0, 89.0, 116.0, 212.0, 301.0, 504.0, 839.0, 1321.0, 2217.0, 3879.0, 6822.0, 13027.0, 25606.0, 53181.0, 108715.0, 199481.0, 253470.0, 184485.0, 97092.0, 46745.0, 23422.0, 11816.0, 6360.0, 3501.0, 2060.0, 1153.0, 711.0, 459.0, 285.0, 183.0, 124.0, 72.0, 55.0, 43.0, 26.0, 17.0, 11.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.78515625, -5.58160400390625, -5.3780517578125, -5.17449951171875, -4.970947265625, -4.76739501953125, -4.5638427734375, -4.36029052734375, -4.15673828125, -3.95318603515625, -3.7496337890625, -3.54608154296875, -3.342529296875, -3.13897705078125, -2.9354248046875, -2.73187255859375, -2.5283203125, -2.32476806640625, -2.1212158203125, -1.91766357421875, -1.714111328125, -1.51055908203125, -1.3070068359375, -1.10345458984375, -0.89990234375, -0.69635009765625, -0.4927978515625, -0.28924560546875, -0.085693359375, 0.11785888671875, 0.3214111328125, 0.52496337890625, 0.728515625, 0.93206787109375, 1.1356201171875, 1.33917236328125, 1.542724609375, 1.74627685546875, 1.9498291015625, 2.15338134765625, 2.35693359375, 2.56048583984375, 2.7640380859375, 2.96759033203125, 3.171142578125, 3.37469482421875, 3.5782470703125, 3.78179931640625, 3.9853515625, 4.18890380859375, 4.3924560546875, 4.59600830078125, 4.799560546875, 5.00311279296875, 5.2066650390625, 5.41021728515625, 5.61376953125, 5.81732177734375, 6.0208740234375, 6.22442626953125, 6.427978515625, 6.63153076171875, 6.8350830078125, 7.03863525390625, 7.2421875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 8.0, 5.0, 4.0, 11.0, 6.0, 16.0, 15.0, 12.0, 15.0, 18.0, 20.0, 16.0, 29.0, 20.0, 25.0, 29.0, 31.0, 31.0, 42.0, 27.0, 43.0, 47.0, 35.0, 44.0, 46.0, 30.0, 35.0, 30.0, 44.0, 41.0, 33.0, 26.0, 25.0, 21.0, 18.0, 17.0, 17.0, 17.0, 10.0, 12.0, 8.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.79296875, -1.73211669921875, -1.6712646484375, -1.61041259765625, -1.549560546875, -1.48870849609375, -1.4278564453125, -1.36700439453125, -1.30615234375, -1.24530029296875, -1.1844482421875, -1.12359619140625, -1.062744140625, -1.00189208984375, -0.9410400390625, -0.88018798828125, -0.8193359375, -0.75848388671875, -0.6976318359375, -0.63677978515625, -0.575927734375, -0.51507568359375, -0.4542236328125, -0.39337158203125, -0.33251953125, -0.27166748046875, -0.2108154296875, -0.14996337890625, -0.089111328125, -0.02825927734375, 0.0325927734375, 0.09344482421875, 0.154296875, 0.21514892578125, 0.2760009765625, 0.33685302734375, 0.397705078125, 0.45855712890625, 0.5194091796875, 0.58026123046875, 0.64111328125, 0.70196533203125, 0.7628173828125, 0.82366943359375, 0.884521484375, 0.94537353515625, 1.0062255859375, 1.06707763671875, 1.1279296875, 1.18878173828125, 1.2496337890625, 1.31048583984375, 1.371337890625, 1.43218994140625, 1.4930419921875, 1.55389404296875, 1.61474609375, 1.67559814453125, 1.7364501953125, 1.79730224609375, 1.858154296875, 1.91900634765625, 1.9798583984375, 2.04071044921875, 2.1015625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 12.0, 10.0, 21.0, 21.0, 33.0, 58.0, 83.0, 102.0, 215.0, 328.0, 526.0, 770.0, 1316.0, 2108.0, 3576.0, 6107.0, 11034.0, 21281.0, 47231.0, 127784.0, 371090.0, 285133.0, 93182.0, 36813.0, 17543.0, 9218.0, 5145.0, 2993.0, 1807.0, 1135.0, 689.0, 443.0, 255.0, 182.0, 120.0, 61.0, 50.0, 24.0, 23.0, 11.0, 11.0, 6.0, 6.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.4140625, -8.14990234375, -7.8857421875, -7.62158203125, -7.357421875, -7.09326171875, -6.8291015625, -6.56494140625, -6.30078125, -6.03662109375, -5.7724609375, -5.50830078125, -5.244140625, -4.97998046875, -4.7158203125, -4.45166015625, -4.1875, -3.92333984375, -3.6591796875, -3.39501953125, -3.130859375, -2.86669921875, -2.6025390625, -2.33837890625, -2.07421875, -1.81005859375, -1.5458984375, -1.28173828125, -1.017578125, -0.75341796875, -0.4892578125, -0.22509765625, 0.0390625, 0.30322265625, 0.5673828125, 0.83154296875, 1.095703125, 1.35986328125, 1.6240234375, 1.88818359375, 2.15234375, 2.41650390625, 2.6806640625, 2.94482421875, 3.208984375, 3.47314453125, 3.7373046875, 4.00146484375, 4.265625, 4.52978515625, 4.7939453125, 5.05810546875, 5.322265625, 5.58642578125, 5.8505859375, 6.11474609375, 6.37890625, 6.64306640625, 6.9072265625, 7.17138671875, 7.435546875, 7.69970703125, 7.9638671875, 8.22802734375, 8.4921875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 6.0, 13.0, 10.0, 23.0, 27.0, 42.0, 56.0, 82.0, 121.0, 134.0, 149.0, 91.0, 77.0, 40.0, 29.0, 22.0, 20.0, 13.0, 7.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009045600891113281, -0.000870920717716217, -0.000837281346321106, -0.0008036419749259949, -0.0007700026035308838, -0.0007363632321357727, -0.0007027238607406616, -0.0006690844893455505, -0.0006354451179504395, -0.0006018057465553284, -0.0005681663751602173, -0.0005345270037651062, -0.0005008876323699951, -0.00046724826097488403, -0.00043360888957977295, -0.00039996951818466187, -0.0003663301467895508, -0.0003326907753944397, -0.0002990514039993286, -0.00026541203260421753, -0.00023177266120910645, -0.00019813328981399536, -0.00016449391841888428, -0.0001308545470237732, -9.721517562866211e-05, -6.357580423355103e-05, -2.993643283843994e-05, 3.7029385566711426e-06, 3.7342309951782227e-05, 7.098168134689331e-05, 0.0001046210527420044, 0.00013826042413711548, 0.00017189979553222656, 0.00020553916692733765, 0.00023917853832244873, 0.0002728179097175598, 0.0003064572811126709, 0.000340096652507782, 0.00037373602390289307, 0.00040737539529800415, 0.00044101476669311523, 0.0004746541380882263, 0.0005082935094833374, 0.0005419328808784485, 0.0005755722522735596, 0.0006092116236686707, 0.0006428509950637817, 0.0006764903664588928, 0.0007101297378540039, 0.000743769109249115, 0.0007774084806442261, 0.0008110478520393372, 0.0008446872234344482, 0.0008783265948295593, 0.0009119659662246704, 0.0009456053376197815, 0.0009792447090148926, 0.0010128840804100037, 0.0010465234518051147, 0.0010801628232002258, 0.001113802194595337, 0.001147441565990448, 0.001181080937385559, 0.0012147203087806702, 0.0012483596801757812]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 5.0, 15.0, 17.0, 26.0, 26.0, 50.0, 53.0, 96.0, 147.0, 217.0, 317.0, 509.0, 823.0, 1275.0, 2127.0, 3688.0, 6368.0, 12008.0, 23704.0, 52408.0, 139832.0, 354427.0, 272863.0, 97276.0, 39471.0, 18559.0, 9440.0, 5159.0, 2871.0, 1692.0, 1031.0, 715.0, 422.0, 278.0, 196.0, 134.0, 88.0, 62.0, 48.0, 41.0, 16.0, 11.0, 14.0, 7.0, 7.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.9921875, -6.78546142578125, -6.5787353515625, -6.37200927734375, -6.165283203125, -5.95855712890625, -5.7518310546875, -5.54510498046875, -5.33837890625, -5.13165283203125, -4.9249267578125, -4.71820068359375, -4.511474609375, -4.30474853515625, -4.0980224609375, -3.89129638671875, -3.6845703125, -3.47784423828125, -3.2711181640625, -3.06439208984375, -2.857666015625, -2.65093994140625, -2.4442138671875, -2.23748779296875, -2.03076171875, -1.82403564453125, -1.6173095703125, -1.41058349609375, -1.203857421875, -0.99713134765625, -0.7904052734375, -0.58367919921875, -0.376953125, -0.17022705078125, 0.0364990234375, 0.24322509765625, 0.449951171875, 0.65667724609375, 0.8634033203125, 1.07012939453125, 1.27685546875, 1.48358154296875, 1.6903076171875, 1.89703369140625, 2.103759765625, 2.31048583984375, 2.5172119140625, 2.72393798828125, 2.9306640625, 3.13739013671875, 3.3441162109375, 3.55084228515625, 3.757568359375, 3.96429443359375, 4.1710205078125, 4.37774658203125, 4.58447265625, 4.79119873046875, 4.9979248046875, 5.20465087890625, 5.411376953125, 5.61810302734375, 5.8248291015625, 6.03155517578125, 6.23828125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 8.0, 8.0, 11.0, 10.0, 13.0, 18.0, 21.0, 24.0, 24.0, 29.0, 48.0, 63.0, 50.0, 61.0, 69.0, 69.0, 74.0, 52.0, 54.0, 33.0, 45.0, 28.0, 26.0, 36.0, 17.0, 19.0, 13.0, 14.0, 16.0, 9.0, 7.0, 6.0, 9.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.392578125, -1.3511505126953125, -1.309722900390625, -1.2682952880859375, -1.22686767578125, -1.1854400634765625, -1.144012451171875, -1.1025848388671875, -1.0611572265625, -1.0197296142578125, -0.978302001953125, -0.9368743896484375, -0.89544677734375, -0.8540191650390625, -0.812591552734375, -0.7711639404296875, -0.729736328125, -0.6883087158203125, -0.646881103515625, -0.6054534912109375, -0.56402587890625, -0.5225982666015625, -0.481170654296875, -0.4397430419921875, -0.3983154296875, -0.3568878173828125, -0.315460205078125, -0.2740325927734375, -0.23260498046875, -0.1911773681640625, -0.149749755859375, -0.1083221435546875, -0.06689453125, -0.0254669189453125, 0.015960693359375, 0.0573883056640625, 0.09881591796875, 0.1402435302734375, 0.181671142578125, 0.2230987548828125, 0.2645263671875, 0.3059539794921875, 0.347381591796875, 0.3888092041015625, 0.43023681640625, 0.4716644287109375, 0.513092041015625, 0.5545196533203125, 0.595947265625, 0.6373748779296875, 0.678802490234375, 0.7202301025390625, 0.76165771484375, 0.8030853271484375, 0.844512939453125, 0.8859405517578125, 0.9273681640625, 0.9687957763671875, 1.010223388671875, 1.0516510009765625, 1.09307861328125, 1.1345062255859375, 1.175933837890625, 1.2173614501953125, 1.2587890625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 6.0, 2.0, 6.0, 8.0, 5.0, 8.0, 6.0, 12.0, 16.0, 13.0, 16.0, 26.0, 33.0, 47.0, 52.0, 51.0, 66.0, 62.0, 63.0, 62.0, 72.0, 54.0, 51.0, 41.0, 31.0, 28.0, 27.0, 22.0, 21.0, 19.0, 12.0, 9.0, 10.0, 13.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.625375270843506, -5.441492080688477, -5.257608890533447, -5.073725700378418, -4.889842987060547, -4.705959796905518, -4.522076606750488, -4.338193416595459, -4.15431022644043, -3.9704270362854004, -3.78654408454895, -3.602660894393921, -3.4187779426574707, -3.2348947525024414, -3.051011562347412, -2.867128372192383, -2.6832456588745117, -2.4993624687194824, -2.3154795169830322, -2.131596326828003, -1.9477132558822632, -1.7638301849365234, -1.5799469947814941, -1.3960639238357544, -1.2121808528900146, -1.028297781944275, -0.8444146513938904, -0.6605315208435059, -0.4766484498977661, -0.29276537895202637, -0.10888218879699707, 0.07500088214874268, 0.2588839530944824, 0.44276705384254456, 0.6266501545906067, 0.8105332851409912, 0.994416356086731, 1.1782994270324707, 1.3621826171875, 1.5460656881332397, 1.7299487590789795, 1.9138318300247192, 2.097714900970459, 2.2815980911254883, 2.4654812812805176, 2.6493642330169678, 2.833247423171997, 3.0171303749084473, 3.2010135650634766, 3.384896755218506, 3.568779706954956, 3.7526628971099854, 3.9365458488464355, 4.120429039001465, 4.304312229156494, 4.488195419311523, 4.6720781326293945, 4.855961322784424, 5.039844512939453, 5.223727226257324, 5.4076104164123535, 5.591493606567383, 5.775376796722412, 5.959259986877441, 6.143143177032471]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 1.0, 10.0, 8.0, 10.0, 11.0, 16.0, 18.0, 17.0, 19.0, 24.0, 24.0, 25.0, 32.0, 32.0, 36.0, 32.0, 32.0, 39.0, 51.0, 47.0, 46.0, 59.0, 36.0, 38.0, 36.0, 30.0, 41.0, 28.0, 27.0, 20.0, 25.0, 22.0, 15.0, 18.0, 17.0, 9.0, 6.0, 7.0, 9.0, 2.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.908379077911377, -2.8105523586273193, -2.7127254009246826, -2.614898681640625, -2.5170717239379883, -2.4192450046539307, -2.321418285369873, -2.2235913276672363, -2.1257643699645996, -2.027937650680542, -1.9301106929779053, -1.8322839736938477, -1.734457015991211, -1.6366302967071533, -1.5388034582138062, -1.440976619720459, -1.3431499004364014, -1.2453230619430542, -1.147496223449707, -1.0496695041656494, -0.9518426060676575, -0.8540157675743103, -0.7561889886856079, -0.6583621501922607, -0.5605353116989136, -0.4627084732055664, -0.3648816645145416, -0.26705485582351685, -0.16922801733016968, -0.07140117883682251, 0.026425600051879883, 0.12425243854522705, 0.22207903861999512, 0.3199058771133423, 0.41773268580436707, 0.5155594944953918, 0.613386332988739, 0.7112131714820862, 0.8090399503707886, 0.9068667888641357, 1.004693627357483, 1.10252046585083, 1.2003473043441772, 1.2981741428375244, 1.396000862121582, 1.4938278198242188, 1.5916545391082764, 1.6894813776016235, 1.7873082160949707, 1.8851350545883179, 1.982961893081665, 2.0807886123657227, 2.1786155700683594, 2.276442289352417, 2.3742690086364746, 2.4720959663391113, 2.569922924041748, 2.6677496433258057, 2.7655766010284424, 2.8634033203125, 2.9612302780151367, 3.0590569972991943, 3.156883716583252, 3.2547106742858887, 3.3525373935699463]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 9.0, 10.0, 16.0, 17.0, 25.0, 41.0, 55.0, 75.0, 108.0, 167.0, 280.0, 400.0, 607.0, 860.0, 1378.0, 2176.0, 3554.0, 5933.0, 10584.0, 20502.0, 44055.0, 114643.0, 375865.0, 1273347.0, 1553615.0, 518301.0, 152762.0, 57156.0, 25392.0, 13132.0, 7462.0, 4423.0, 2649.0, 1698.0, 1077.0, 708.0, 421.0, 285.0, 198.0, 117.0, 68.0, 42.0, 24.0, 21.0, 12.0, 9.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6953125, -8.45465087890625, -8.2139892578125, -7.97332763671875, -7.732666015625, -7.49200439453125, -7.2513427734375, -7.01068115234375, -6.77001953125, -6.52935791015625, -6.2886962890625, -6.04803466796875, -5.807373046875, -5.56671142578125, -5.3260498046875, -5.08538818359375, -4.8447265625, -4.60406494140625, -4.3634033203125, -4.12274169921875, -3.882080078125, -3.64141845703125, -3.4007568359375, -3.16009521484375, -2.91943359375, -2.67877197265625, -2.4381103515625, -2.19744873046875, -1.956787109375, -1.71612548828125, -1.4754638671875, -1.23480224609375, -0.994140625, -0.75347900390625, -0.5128173828125, -0.27215576171875, -0.031494140625, 0.20916748046875, 0.4498291015625, 0.69049072265625, 0.93115234375, 1.17181396484375, 1.4124755859375, 1.65313720703125, 1.893798828125, 2.13446044921875, 2.3751220703125, 2.61578369140625, 2.8564453125, 3.09710693359375, 3.3377685546875, 3.57843017578125, 3.819091796875, 4.05975341796875, 4.3004150390625, 4.54107666015625, 4.78173828125, 5.02239990234375, 5.2630615234375, 5.50372314453125, 5.744384765625, 5.98504638671875, 6.2257080078125, 6.46636962890625, 6.70703125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 5.0, 10.0, 8.0, 13.0, 16.0, 9.0, 25.0, 17.0, 19.0, 33.0, 24.0, 34.0, 30.0, 29.0, 40.0, 39.0, 46.0, 36.0, 41.0, 36.0, 45.0, 48.0, 38.0, 32.0, 37.0, 36.0, 35.0, 34.0, 28.0, 30.0, 16.0, 13.0, 18.0, 13.0, 16.0, 3.0, 8.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.55859375, -2.4755859375, -2.392578125, -2.3095703125, -2.2265625, -2.1435546875, -2.060546875, -1.9775390625, -1.89453125, -1.8115234375, -1.728515625, -1.6455078125, -1.5625, -1.4794921875, -1.396484375, -1.3134765625, -1.23046875, -1.1474609375, -1.064453125, -0.9814453125, -0.8984375, -0.8154296875, -0.732421875, -0.6494140625, -0.56640625, -0.4833984375, -0.400390625, -0.3173828125, -0.234375, -0.1513671875, -0.068359375, 0.0146484375, 0.09765625, 0.1806640625, 0.263671875, 0.3466796875, 0.4296875, 0.5126953125, 0.595703125, 0.6787109375, 0.76171875, 0.8447265625, 0.927734375, 1.0107421875, 1.09375, 1.1767578125, 1.259765625, 1.3427734375, 1.42578125, 1.5087890625, 1.591796875, 1.6748046875, 1.7578125, 1.8408203125, 1.923828125, 2.0068359375, 2.08984375, 2.1728515625, 2.255859375, 2.3388671875, 2.421875, 2.5048828125, 2.587890625, 2.6708984375, 2.75390625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 10.0, 13.0, 26.0, 33.0, 63.0, 88.0, 130.0, 228.0, 327.0, 535.0, 888.0, 1429.0, 2395.0, 4095.0, 7325.0, 13889.0, 27653.0, 59971.0, 145815.0, 422512.0, 1331312.0, 1428569.0, 464860.0, 156811.0, 63235.0, 29032.0, 14427.0, 7635.0, 4379.0, 2504.0, 1491.0, 926.0, 592.0, 407.0, 257.0, 155.0, 94.0, 51.0, 34.0, 19.0, 19.0, 12.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.453125, -8.1807861328125, -7.908447265625, -7.6361083984375, -7.36376953125, -7.0914306640625, -6.819091796875, -6.5467529296875, -6.2744140625, -6.0020751953125, -5.729736328125, -5.4573974609375, -5.18505859375, -4.9127197265625, -4.640380859375, -4.3680419921875, -4.095703125, -3.8233642578125, -3.551025390625, -3.2786865234375, -3.00634765625, -2.7340087890625, -2.461669921875, -2.1893310546875, -1.9169921875, -1.6446533203125, -1.372314453125, -1.0999755859375, -0.82763671875, -0.5552978515625, -0.282958984375, -0.0106201171875, 0.26171875, 0.5340576171875, 0.806396484375, 1.0787353515625, 1.35107421875, 1.6234130859375, 1.895751953125, 2.1680908203125, 2.4404296875, 2.7127685546875, 2.985107421875, 3.2574462890625, 3.52978515625, 3.8021240234375, 4.074462890625, 4.3468017578125, 4.619140625, 4.8914794921875, 5.163818359375, 5.4361572265625, 5.70849609375, 5.9808349609375, 6.253173828125, 6.5255126953125, 6.7978515625, 7.0701904296875, 7.342529296875, 7.6148681640625, 7.88720703125, 8.1595458984375, 8.431884765625, 8.7042236328125, 8.9765625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 3.0, 5.0, 7.0, 3.0, 6.0, 14.0, 12.0, 17.0, 25.0, 23.0, 33.0, 34.0, 39.0, 63.0, 82.0, 115.0, 137.0, 201.0, 238.0, 286.0, 312.0, 375.0, 368.0, 320.0, 281.0, 204.0, 154.0, 149.0, 142.0, 107.0, 76.0, 61.0, 37.0, 30.0, 30.0, 12.0, 12.0, 13.0, 10.0, 10.0, 4.0, 8.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.125, -2.0672607421875, -2.009521484375, -1.9517822265625, -1.89404296875, -1.8363037109375, -1.778564453125, -1.7208251953125, -1.6630859375, -1.6053466796875, -1.547607421875, -1.4898681640625, -1.43212890625, -1.3743896484375, -1.316650390625, -1.2589111328125, -1.201171875, -1.1434326171875, -1.085693359375, -1.0279541015625, -0.97021484375, -0.9124755859375, -0.854736328125, -0.7969970703125, -0.7392578125, -0.6815185546875, -0.623779296875, -0.5660400390625, -0.50830078125, -0.4505615234375, -0.392822265625, -0.3350830078125, -0.27734375, -0.2196044921875, -0.161865234375, -0.1041259765625, -0.04638671875, 0.0113525390625, 0.069091796875, 0.1268310546875, 0.1845703125, 0.2423095703125, 0.300048828125, 0.3577880859375, 0.41552734375, 0.4732666015625, 0.531005859375, 0.5887451171875, 0.646484375, 0.7042236328125, 0.761962890625, 0.8197021484375, 0.87744140625, 0.9351806640625, 0.992919921875, 1.0506591796875, 1.1083984375, 1.1661376953125, 1.223876953125, 1.2816162109375, 1.33935546875, 1.3970947265625, 1.454833984375, 1.5125732421875, 1.5703125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 10.0, 11.0, 12.0, 12.0, 17.0, 12.0, 22.0, 25.0, 34.0, 39.0, 53.0, 49.0, 61.0, 85.0, 87.0, 70.0, 73.0, 64.0, 53.0, 35.0, 35.0, 32.0, 31.0, 23.0, 10.0, 11.0, 6.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.243377685546875, -7.0129170417785645, -6.782456874847412, -6.551996231079102, -6.321536064147949, -6.091075420379639, -5.860614776611328, -5.630154609680176, -5.399693965911865, -5.169233322143555, -4.938773155212402, -4.708312511444092, -4.477851867675781, -4.247391700744629, -4.016931056976318, -3.786470651626587, -3.5560102462768555, -3.325549840927124, -3.0950894355773926, -2.864628791809082, -2.6341683864593506, -2.403707981109619, -2.1732473373413086, -1.9427869319915771, -1.7123265266418457, -1.4818661212921143, -1.2514055967330933, -1.0209450721740723, -0.7904846668243408, -0.5600242614746094, -0.3295637369155884, -0.09910321235656738, 0.13135671615600586, 0.3618171811103821, 0.5922776460647583, 0.8227381110191345, 1.0531985759735107, 1.2836589813232422, 1.5141195058822632, 1.7445800304412842, 1.9750404357910156, 2.205500841140747, 2.4359612464904785, 2.666421890258789, 2.8968822956085205, 3.127342700958252, 3.3578033447265625, 3.588263750076294, 3.8187241554260254, 4.049184799194336, 4.279644966125488, 4.510105609893799, 4.740566253662109, 4.971026420593262, 5.201487064361572, 5.431947708129883, 5.662407875061035, 5.892868518829346, 6.123328685760498, 6.353789329528809, 6.584249496459961, 6.8147101402282715, 7.045170783996582, 7.275630950927734, 7.506091594696045]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 6.0, 5.0, 1.0, 4.0, 5.0, 5.0, 6.0, 7.0, 5.0, 10.0, 21.0, 21.0, 25.0, 21.0, 25.0, 22.0, 28.0, 28.0, 28.0, 22.0, 37.0, 37.0, 49.0, 38.0, 39.0, 34.0, 44.0, 43.0, 34.0, 34.0, 37.0, 26.0, 34.0, 35.0, 31.0, 38.0, 19.0, 18.0, 17.0, 11.0, 12.0, 14.0, 6.0, 3.0, 1.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0], "bins": [-3.1982321739196777, -3.10054087638855, -3.002849578857422, -2.905158042907715, -2.807466745376587, -2.709775447845459, -2.612084150314331, -2.514392852783203, -2.416701316833496, -2.319010019302368, -2.2213187217712402, -2.123627185821533, -2.0259358882904053, -1.9282445907592773, -1.8305532932281494, -1.7328619956970215, -1.6351706981658936, -1.5374794006347656, -1.4397879838943481, -1.3420966863632202, -1.2444052696228027, -1.1467139720916748, -1.0490226745605469, -0.9513313174247742, -0.8536399602890015, -0.7559486031532288, -0.658257246017456, -0.5605659484863281, -0.4628745913505554, -0.3651832342147827, -0.2674919366836548, -0.16980057954788208, -0.07210922241210938, 0.025582119822502136, 0.12327346205711365, 0.22096478939056396, 0.31865614652633667, 0.4163475036621094, 0.5140388011932373, 0.61173015832901, 0.7094215154647827, 0.8071128726005554, 0.9048042297363281, 1.002495527267456, 1.100186824798584, 1.1978782415390015, 1.2955695390701294, 1.3932609558105469, 1.4909522533416748, 1.5886435508728027, 1.6863349676132202, 1.7840262651443481, 1.8817176818847656, 1.9794089794158936, 2.0771002769470215, 2.1747915744781494, 2.2724828720092773, 2.3701741695404053, 2.467865467071533, 2.5655570030212402, 2.663248300552368, 2.760939598083496, 2.858630895614624, 2.956322193145752, 3.054013729095459]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 11.0, 22.0, 23.0, 29.0, 39.0, 76.0, 87.0, 139.0, 229.0, 311.0, 518.0, 891.0, 1508.0, 2974.0, 5881.0, 13006.0, 31590.0, 86067.0, 231365.0, 359243.0, 194408.0, 71460.0, 26466.0, 11027.0, 5074.0, 2569.0, 1383.0, 770.0, 520.0, 286.0, 192.0, 114.0, 84.0, 49.0, 44.0, 32.0, 16.0, 17.0, 10.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.79022216796875, -4.6273193359375, -4.46441650390625, -4.301513671875, -4.13861083984375, -3.9757080078125, -3.81280517578125, -3.64990234375, -3.48699951171875, -3.3240966796875, -3.16119384765625, -2.998291015625, -2.83538818359375, -2.6724853515625, -2.50958251953125, -2.3466796875, -2.18377685546875, -2.0208740234375, -1.85797119140625, -1.695068359375, -1.53216552734375, -1.3692626953125, -1.20635986328125, -1.04345703125, -0.88055419921875, -0.7176513671875, -0.55474853515625, -0.391845703125, -0.22894287109375, -0.0660400390625, 0.09686279296875, 0.259765625, 0.42266845703125, 0.5855712890625, 0.74847412109375, 0.911376953125, 1.07427978515625, 1.2371826171875, 1.40008544921875, 1.56298828125, 1.72589111328125, 1.8887939453125, 2.05169677734375, 2.214599609375, 2.37750244140625, 2.5404052734375, 2.70330810546875, 2.8662109375, 3.02911376953125, 3.1920166015625, 3.35491943359375, 3.517822265625, 3.68072509765625, 3.8436279296875, 4.00653076171875, 4.16943359375, 4.33233642578125, 4.4952392578125, 4.65814208984375, 4.821044921875, 4.98394775390625, 5.1468505859375, 5.30975341796875, 5.47265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 6.0, 2.0, 6.0, 5.0, 10.0, 9.0, 5.0, 11.0, 13.0, 23.0, 31.0, 31.0, 27.0, 25.0, 22.0, 40.0, 24.0, 52.0, 41.0, 43.0, 47.0, 39.0, 38.0, 48.0, 36.0, 29.0, 53.0, 37.0, 33.0, 42.0, 23.0, 24.0, 25.0, 24.0, 16.0, 17.0, 6.0, 9.0, 6.0, 2.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.046875, -3.926239013671875, -3.80560302734375, -3.684967041015625, -3.5643310546875, -3.443695068359375, -3.32305908203125, -3.202423095703125, -3.081787109375, -2.961151123046875, -2.84051513671875, -2.719879150390625, -2.5992431640625, -2.478607177734375, -2.35797119140625, -2.237335205078125, -2.11669921875, -1.996063232421875, -1.87542724609375, -1.754791259765625, -1.6341552734375, -1.513519287109375, -1.39288330078125, -1.272247314453125, -1.151611328125, -1.030975341796875, -0.91033935546875, -0.789703369140625, -0.6690673828125, -0.548431396484375, -0.42779541015625, -0.307159423828125, -0.1865234375, -0.065887451171875, 0.05474853515625, 0.175384521484375, 0.2960205078125, 0.416656494140625, 0.53729248046875, 0.657928466796875, 0.778564453125, 0.899200439453125, 1.01983642578125, 1.140472412109375, 1.2611083984375, 1.381744384765625, 1.50238037109375, 1.623016357421875, 1.74365234375, 1.864288330078125, 1.98492431640625, 2.105560302734375, 2.2261962890625, 2.346832275390625, 2.46746826171875, 2.588104248046875, 2.708740234375, 2.829376220703125, 2.95001220703125, 3.070648193359375, 3.1912841796875, 3.311920166015625, 3.43255615234375, 3.553192138671875, 3.673828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 11.0, 8.0, 20.0, 13.0, 30.0, 27.0, 44.0, 37.0, 66.0, 85.0, 112.0, 136.0, 183.0, 264.0, 358.0, 515.0, 787.0, 1306.0, 2373.0, 4704.0, 11358.0, 33748.0, 131269.0, 473098.0, 285011.0, 67132.0, 19836.0, 7573.0, 3293.0, 1767.0, 1020.0, 679.0, 434.0, 317.0, 226.0, 161.0, 129.0, 99.0, 79.0, 62.0, 45.0, 38.0, 25.0, 22.0, 11.0, 8.0, 16.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0], "bins": [-8.4921875, -8.24066162109375, -7.9891357421875, -7.73760986328125, -7.486083984375, -7.23455810546875, -6.9830322265625, -6.73150634765625, -6.47998046875, -6.22845458984375, -5.9769287109375, -5.72540283203125, -5.473876953125, -5.22235107421875, -4.9708251953125, -4.71929931640625, -4.4677734375, -4.21624755859375, -3.9647216796875, -3.71319580078125, -3.461669921875, -3.21014404296875, -2.9586181640625, -2.70709228515625, -2.45556640625, -2.20404052734375, -1.9525146484375, -1.70098876953125, -1.449462890625, -1.19793701171875, -0.9464111328125, -0.69488525390625, -0.443359375, -0.19183349609375, 0.0596923828125, 0.31121826171875, 0.562744140625, 0.81427001953125, 1.0657958984375, 1.31732177734375, 1.56884765625, 1.82037353515625, 2.0718994140625, 2.32342529296875, 2.574951171875, 2.82647705078125, 3.0780029296875, 3.32952880859375, 3.5810546875, 3.83258056640625, 4.0841064453125, 4.33563232421875, 4.587158203125, 4.83868408203125, 5.0902099609375, 5.34173583984375, 5.59326171875, 5.84478759765625, 6.0963134765625, 6.34783935546875, 6.599365234375, 6.85089111328125, 7.1024169921875, 7.35394287109375, 7.60546875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 3.0, 5.0, 5.0, 1.0, 10.0, 1.0, 19.0, 9.0, 13.0, 14.0, 21.0, 22.0, 18.0, 21.0, 32.0, 27.0, 41.0, 31.0, 33.0, 36.0, 37.0, 37.0, 37.0, 46.0, 40.0, 39.0, 32.0, 36.0, 28.0, 26.0, 27.0, 29.0, 25.0, 25.0, 28.0, 15.0, 21.0, 17.0, 20.0, 18.0, 9.0, 12.0, 4.0, 10.0, 6.0, 3.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.94140625, -1.879730224609375, -1.81805419921875, -1.756378173828125, -1.6947021484375, -1.633026123046875, -1.57135009765625, -1.509674072265625, -1.447998046875, -1.386322021484375, -1.32464599609375, -1.262969970703125, -1.2012939453125, -1.139617919921875, -1.07794189453125, -1.016265869140625, -0.95458984375, -0.892913818359375, -0.83123779296875, -0.769561767578125, -0.7078857421875, -0.646209716796875, -0.58453369140625, -0.522857666015625, -0.461181640625, -0.399505615234375, -0.33782958984375, -0.276153564453125, -0.2144775390625, -0.152801513671875, -0.09112548828125, -0.029449462890625, 0.0322265625, 0.093902587890625, 0.15557861328125, 0.217254638671875, 0.2789306640625, 0.340606689453125, 0.40228271484375, 0.463958740234375, 0.525634765625, 0.587310791015625, 0.64898681640625, 0.710662841796875, 0.7723388671875, 0.834014892578125, 0.89569091796875, 0.957366943359375, 1.01904296875, 1.080718994140625, 1.14239501953125, 1.204071044921875, 1.2657470703125, 1.327423095703125, 1.38909912109375, 1.450775146484375, 1.512451171875, 1.574127197265625, 1.63580322265625, 1.697479248046875, 1.7591552734375, 1.820831298828125, 1.88250732421875, 1.944183349609375, 2.005859375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 6.0, 11.0, 11.0, 25.0, 37.0, 50.0, 81.0, 104.0, 126.0, 207.0, 268.0, 407.0, 650.0, 996.0, 1675.0, 2833.0, 6073.0, 33199.0, 794492.0, 186127.0, 11302.0, 3862.0, 2226.0, 1228.0, 823.0, 574.0, 331.0, 232.0, 166.0, 143.0, 73.0, 65.0, 34.0, 28.0, 24.0, 13.0, 7.0, 10.0, 9.0, 10.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7734375, -8.457275390625, -8.14111328125, -7.824951171875, -7.5087890625, -7.192626953125, -6.87646484375, -6.560302734375, -6.244140625, -5.927978515625, -5.61181640625, -5.295654296875, -4.9794921875, -4.663330078125, -4.34716796875, -4.031005859375, -3.71484375, -3.398681640625, -3.08251953125, -2.766357421875, -2.4501953125, -2.134033203125, -1.81787109375, -1.501708984375, -1.185546875, -0.869384765625, -0.55322265625, -0.237060546875, 0.0791015625, 0.395263671875, 0.71142578125, 1.027587890625, 1.34375, 1.659912109375, 1.97607421875, 2.292236328125, 2.6083984375, 2.924560546875, 3.24072265625, 3.556884765625, 3.873046875, 4.189208984375, 4.50537109375, 4.821533203125, 5.1376953125, 5.453857421875, 5.77001953125, 6.086181640625, 6.40234375, 6.718505859375, 7.03466796875, 7.350830078125, 7.6669921875, 7.983154296875, 8.29931640625, 8.615478515625, 8.931640625, 9.247802734375, 9.56396484375, 9.880126953125, 10.1962890625, 10.512451171875, 10.82861328125, 11.144775390625, 11.4609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 17.0, 201.0, 528.0, 189.0, 30.0, 11.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005908012390136719, -0.0005707666277885437, -0.0005507320165634155, -0.0005306974053382874, -0.0005106627941131592, -0.000490628182888031, -0.00047059357166290283, -0.00045055896043777466, -0.0004305243492126465, -0.0004104897379875183, -0.00039045512676239014, -0.00037042051553726196, -0.0003503859043121338, -0.0003303512930870056, -0.00031031668186187744, -0.00029028207063674927, -0.0002702474594116211, -0.0002502128481864929, -0.00023017823696136475, -0.00021014362573623657, -0.0001901090145111084, -0.00017007440328598022, -0.00015003979206085205, -0.00013000518083572388, -0.0001099705696105957, -8.993595838546753e-05, -6.990134716033936e-05, -4.986673593521118e-05, -2.9832124710083008e-05, -9.797513484954834e-06, 1.023709774017334e-05, 3.0271708965301514e-05, 5.030632019042969e-05, 7.034093141555786e-05, 9.037554264068604e-05, 0.00011041015386581421, 0.00013044476509094238, 0.00015047937631607056, 0.00017051398754119873, 0.0001905485987663269, 0.00021058320999145508, 0.00023061782121658325, 0.0002506524324417114, 0.0002706870436668396, 0.0002907216548919678, 0.00031075626611709595, 0.0003307908773422241, 0.0003508254885673523, 0.00037086009979248047, 0.00039089471101760864, 0.0004109293222427368, 0.000430963933467865, 0.00045099854469299316, 0.00047103315591812134, 0.0004910677671432495, 0.0005111023783683777, 0.0005311369895935059, 0.000551171600818634, 0.0005712062120437622, 0.0005912408232688904, 0.0006112754344940186, 0.0006313100457191467, 0.0006513446569442749, 0.0006713792681694031, 0.0006914138793945312]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 7.0, 14.0, 30.0, 29.0, 40.0, 44.0, 75.0, 89.0, 122.0, 198.0, 244.0, 397.0, 465.0, 774.0, 1011.0, 1628.0, 2523.0, 4197.0, 10363.0, 108389.0, 788805.0, 107096.0, 10235.0, 4052.0, 2487.0, 1604.0, 1093.0, 710.0, 501.0, 367.0, 246.0, 175.0, 160.0, 105.0, 71.0, 54.0, 36.0, 26.0, 20.0, 15.0, 15.0, 10.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.65625, -7.420654296875, -7.18505859375, -6.949462890625, -6.7138671875, -6.478271484375, -6.24267578125, -6.007080078125, -5.771484375, -5.535888671875, -5.30029296875, -5.064697265625, -4.8291015625, -4.593505859375, -4.35791015625, -4.122314453125, -3.88671875, -3.651123046875, -3.41552734375, -3.179931640625, -2.9443359375, -2.708740234375, -2.47314453125, -2.237548828125, -2.001953125, -1.766357421875, -1.53076171875, -1.295166015625, -1.0595703125, -0.823974609375, -0.58837890625, -0.352783203125, -0.1171875, 0.118408203125, 0.35400390625, 0.589599609375, 0.8251953125, 1.060791015625, 1.29638671875, 1.531982421875, 1.767578125, 2.003173828125, 2.23876953125, 2.474365234375, 2.7099609375, 2.945556640625, 3.18115234375, 3.416748046875, 3.65234375, 3.887939453125, 4.12353515625, 4.359130859375, 4.5947265625, 4.830322265625, 5.06591796875, 5.301513671875, 5.537109375, 5.772705078125, 6.00830078125, 6.243896484375, 6.4794921875, 6.715087890625, 6.95068359375, 7.186279296875, 7.421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 10.0, 14.0, 71.0, 197.0, 285.0, 235.0, 112.0, 41.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.900390625, -1.8456268310546875, -1.790863037109375, -1.7360992431640625, -1.68133544921875, -1.6265716552734375, -1.571807861328125, -1.5170440673828125, -1.4622802734375, -1.4075164794921875, -1.352752685546875, -1.2979888916015625, -1.24322509765625, -1.1884613037109375, -1.133697509765625, -1.0789337158203125, -1.024169921875, -0.9694061279296875, -0.914642333984375, -0.8598785400390625, -0.80511474609375, -0.7503509521484375, -0.695587158203125, -0.6408233642578125, -0.5860595703125, -0.5312957763671875, -0.476531982421875, -0.4217681884765625, -0.36700439453125, -0.3122406005859375, -0.257476806640625, -0.2027130126953125, -0.14794921875, -0.0931854248046875, -0.038421630859375, 0.0163421630859375, 0.07110595703125, 0.1258697509765625, 0.180633544921875, 0.2353973388671875, 0.2901611328125, 0.3449249267578125, 0.399688720703125, 0.4544525146484375, 0.50921630859375, 0.5639801025390625, 0.618743896484375, 0.6735076904296875, 0.728271484375, 0.7830352783203125, 0.837799072265625, 0.8925628662109375, 0.94732666015625, 1.0020904541015625, 1.056854248046875, 1.1116180419921875, 1.1663818359375, 1.2211456298828125, 1.275909423828125, 1.3306732177734375, 1.38543701171875, 1.4402008056640625, 1.494964599609375, 1.5497283935546875, 1.6044921875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 8.0, 4.0, 5.0, 14.0, 8.0, 11.0, 10.0, 17.0, 17.0, 23.0, 19.0, 19.0, 33.0, 44.0, 46.0, 48.0, 68.0, 62.0, 65.0, 61.0, 52.0, 54.0, 62.0, 36.0, 45.0, 26.0, 24.0, 25.0, 22.0, 15.0, 13.0, 7.0, 2.0, 10.0, 6.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-5.988524436950684, -5.798193454742432, -5.60786247253418, -5.417531490325928, -5.227200508117676, -5.036870002746582, -4.84653902053833, -4.656208038330078, -4.465877056121826, -4.275546073913574, -4.085215091705322, -3.8948843479156494, -3.7045533657073975, -3.5142223834991455, -3.3238916397094727, -3.1335606575012207, -2.9432296752929688, -2.752898693084717, -2.562567710876465, -2.372236967086792, -2.18190598487854, -1.991575002670288, -1.8012441396713257, -1.6109132766723633, -1.4205822944641113, -1.2302513122558594, -1.039920449256897, -0.8495895266532898, -0.6592586040496826, -0.46892768144607544, -0.27859675884246826, -0.08826589584350586, 0.1020650863647461, 0.29239600896835327, 0.48272693157196045, 0.6730578541755676, 0.8633887767791748, 1.0537197589874268, 1.2440506219863892, 1.4343814849853516, 1.6247124671936035, 1.8150434494018555, 2.0053744316101074, 2.1957051753997803, 2.3860361576080322, 2.576367139816284, 2.766697883605957, 2.957028865814209, 3.147359848022461, 3.337690830230713, 3.528021812438965, 3.7183525562286377, 3.9086835384368896, 4.0990142822265625, 4.2893452644348145, 4.479676246643066, 4.670007228851318, 4.86033821105957, 5.050669193267822, 5.241000175476074, 5.431330680847168, 5.62166166305542, 5.811992645263672, 6.002323627471924, 6.192654609680176]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 4.0, 4.0, 1.0, 4.0, 9.0, 6.0, 2.0, 7.0, 13.0, 12.0, 20.0, 25.0, 24.0, 22.0, 28.0, 22.0, 29.0, 37.0, 25.0, 31.0, 31.0, 40.0, 43.0, 36.0, 42.0, 48.0, 40.0, 30.0, 31.0, 41.0, 32.0, 37.0, 28.0, 37.0, 34.0, 20.0, 16.0, 24.0, 10.0, 12.0, 10.0, 5.0, 3.0, 7.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.9983208179473877, -2.902001142501831, -2.8056814670562744, -2.709362030029297, -2.6130423545837402, -2.5167226791381836, -2.420403003692627, -2.3240833282470703, -2.2277638912200928, -2.131444215774536, -2.0351245403289795, -1.9388049840927124, -1.8424854278564453, -1.7461657524108887, -1.649846076965332, -1.553526520729065, -1.4572068452835083, -1.3608871698379517, -1.2645676136016846, -1.168247938156128, -1.0719283819198608, -0.9756087064743042, -0.8792890906333923, -0.7829694747924805, -0.6866498589515686, -0.5903302431106567, -0.4940106272697449, -0.3976909816265106, -0.30137136578559875, -0.2050517499446869, -0.10873210430145264, -0.012412488460540771, 0.0839071273803711, 0.18022674322128296, 0.2765463590621948, 0.3728660047054291, 0.46918562054634094, 0.5655052661895752, 0.6618248820304871, 0.7581444978713989, 0.8544641137123108, 0.9507837295532227, 1.0471034049987793, 1.1434229612350464, 1.239742636680603, 1.3360621929168701, 1.4323818683624268, 1.5287015438079834, 1.6250211000442505, 1.7213407754898071, 1.8176603317260742, 1.9139800071716309, 2.0102996826171875, 2.106619119644165, 2.2029387950897217, 2.2992584705352783, 2.395578145980835, 2.4918978214263916, 2.5882174968719482, 2.684536933898926, 2.7808566093444824, 2.877176284790039, 2.9734959602355957, 3.0698156356811523, 3.16613507270813]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 10.0, 14.0, 21.0, 19.0, 34.0, 51.0, 59.0, 110.0, 116.0, 208.0, 274.0, 417.0, 680.0, 955.0, 1586.0, 2423.0, 3994.0, 6679.0, 11276.0, 19859.0, 34348.0, 59740.0, 100481.0, 152976.0, 187586.0, 170327.0, 120076.0, 72417.0, 42102.0, 24561.0, 14069.0, 8074.0, 4843.0, 2895.0, 1773.0, 1229.0, 701.0, 528.0, 284.0, 216.0, 161.0, 116.0, 68.0, 60.0, 35.0, 26.0, 20.0, 14.0, 10.0, 4.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-4.5234375, -4.38067626953125, -4.2379150390625, -4.09515380859375, -3.952392578125, -3.80963134765625, -3.6668701171875, -3.52410888671875, -3.38134765625, -3.23858642578125, -3.0958251953125, -2.95306396484375, -2.810302734375, -2.66754150390625, -2.5247802734375, -2.38201904296875, -2.2392578125, -2.09649658203125, -1.9537353515625, -1.81097412109375, -1.668212890625, -1.52545166015625, -1.3826904296875, -1.23992919921875, -1.09716796875, -0.95440673828125, -0.8116455078125, -0.66888427734375, -0.526123046875, -0.38336181640625, -0.2406005859375, -0.09783935546875, 0.044921875, 0.18768310546875, 0.3304443359375, 0.47320556640625, 0.615966796875, 0.75872802734375, 0.9014892578125, 1.04425048828125, 1.18701171875, 1.32977294921875, 1.4725341796875, 1.61529541015625, 1.758056640625, 1.90081787109375, 2.0435791015625, 2.18634033203125, 2.3291015625, 2.47186279296875, 2.6146240234375, 2.75738525390625, 2.900146484375, 3.04290771484375, 3.1856689453125, 3.32843017578125, 3.47119140625, 3.61395263671875, 3.7567138671875, 3.89947509765625, 4.042236328125, 4.18499755859375, 4.3277587890625, 4.47052001953125, 4.61328125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 9.0, 2.0, 11.0, 5.0, 7.0, 12.0, 14.0, 15.0, 23.0, 20.0, 23.0, 32.0, 30.0, 33.0, 36.0, 37.0, 38.0, 50.0, 44.0, 34.0, 48.0, 45.0, 44.0, 47.0, 34.0, 40.0, 36.0, 37.0, 38.0, 27.0, 27.0, 23.0, 15.0, 12.0, 16.0, 12.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.295318603515625, -3.17462158203125, -3.053924560546875, -2.9332275390625, -2.812530517578125, -2.69183349609375, -2.571136474609375, -2.450439453125, -2.329742431640625, -2.20904541015625, -2.088348388671875, -1.9676513671875, -1.846954345703125, -1.72625732421875, -1.605560302734375, -1.48486328125, -1.364166259765625, -1.24346923828125, -1.122772216796875, -1.0020751953125, -0.881378173828125, -0.76068115234375, -0.639984130859375, -0.519287109375, -0.398590087890625, -0.27789306640625, -0.157196044921875, -0.0364990234375, 0.084197998046875, 0.20489501953125, 0.325592041015625, 0.4462890625, 0.566986083984375, 0.68768310546875, 0.808380126953125, 0.9290771484375, 1.049774169921875, 1.17047119140625, 1.291168212890625, 1.411865234375, 1.532562255859375, 1.65325927734375, 1.773956298828125, 1.8946533203125, 2.015350341796875, 2.13604736328125, 2.256744384765625, 2.37744140625, 2.498138427734375, 2.61883544921875, 2.739532470703125, 2.8602294921875, 2.980926513671875, 3.10162353515625, 3.222320556640625, 3.343017578125, 3.463714599609375, 3.58441162109375, 3.705108642578125, 3.8258056640625, 3.946502685546875, 4.06719970703125, 4.187896728515625, 4.30859375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 15.0, 29.0, 39.0, 63.0, 72.0, 114.0, 154.0, 290.0, 377.0, 629.0, 944.0, 1635.0, 2592.0, 4493.0, 7283.0, 12893.0, 22515.0, 40405.0, 72478.0, 124976.0, 182559.0, 199082.0, 154331.0, 96244.0, 53640.0, 29883.0, 16805.0, 9489.0, 5554.0, 3367.0, 2037.0, 1305.0, 789.0, 483.0, 322.0, 211.0, 140.0, 99.0, 61.0, 46.0, 27.0, 22.0, 18.0, 10.0, 8.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.16796875, -5.0076904296875, -4.847412109375, -4.6871337890625, -4.52685546875, -4.3665771484375, -4.206298828125, -4.0460205078125, -3.8857421875, -3.7254638671875, -3.565185546875, -3.4049072265625, -3.24462890625, -3.0843505859375, -2.924072265625, -2.7637939453125, -2.603515625, -2.4432373046875, -2.282958984375, -2.1226806640625, -1.96240234375, -1.8021240234375, -1.641845703125, -1.4815673828125, -1.3212890625, -1.1610107421875, -1.000732421875, -0.8404541015625, -0.68017578125, -0.5198974609375, -0.359619140625, -0.1993408203125, -0.0390625, 0.1212158203125, 0.281494140625, 0.4417724609375, 0.60205078125, 0.7623291015625, 0.922607421875, 1.0828857421875, 1.2431640625, 1.4034423828125, 1.563720703125, 1.7239990234375, 1.88427734375, 2.0445556640625, 2.204833984375, 2.3651123046875, 2.525390625, 2.6856689453125, 2.845947265625, 3.0062255859375, 3.16650390625, 3.3267822265625, 3.487060546875, 3.6473388671875, 3.8076171875, 3.9678955078125, 4.128173828125, 4.2884521484375, 4.44873046875, 4.6090087890625, 4.769287109375, 4.9295654296875, 5.08984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 5.0, 8.0, 15.0, 17.0, 17.0, 12.0, 23.0, 13.0, 15.0, 27.0, 31.0, 25.0, 29.0, 28.0, 34.0, 46.0, 44.0, 33.0, 38.0, 46.0, 51.0, 31.0, 38.0, 44.0, 34.0, 31.0, 39.0, 31.0, 15.0, 24.0, 16.0, 18.0, 18.0, 16.0, 13.0, 11.0, 9.0, 9.0, 5.0, 7.0, 7.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0234375, -1.956939697265625, -1.89044189453125, -1.823944091796875, -1.7574462890625, -1.690948486328125, -1.62445068359375, -1.557952880859375, -1.491455078125, -1.424957275390625, -1.35845947265625, -1.291961669921875, -1.2254638671875, -1.158966064453125, -1.09246826171875, -1.025970458984375, -0.95947265625, -0.892974853515625, -0.82647705078125, -0.759979248046875, -0.6934814453125, -0.626983642578125, -0.56048583984375, -0.493988037109375, -0.427490234375, -0.360992431640625, -0.29449462890625, -0.227996826171875, -0.1614990234375, -0.095001220703125, -0.02850341796875, 0.037994384765625, 0.1044921875, 0.170989990234375, 0.23748779296875, 0.303985595703125, 0.3704833984375, 0.436981201171875, 0.50347900390625, 0.569976806640625, 0.636474609375, 0.702972412109375, 0.76947021484375, 0.835968017578125, 0.9024658203125, 0.968963623046875, 1.03546142578125, 1.101959228515625, 1.16845703125, 1.234954833984375, 1.30145263671875, 1.367950439453125, 1.4344482421875, 1.500946044921875, 1.56744384765625, 1.633941650390625, 1.700439453125, 1.766937255859375, 1.83343505859375, 1.899932861328125, 1.9664306640625, 2.032928466796875, 2.09942626953125, 2.165924072265625, 2.232421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 1.0, 5.0, 8.0, 14.0, 12.0, 20.0, 18.0, 26.0, 47.0, 63.0, 94.0, 107.0, 192.0, 280.0, 455.0, 644.0, 1056.0, 1757.0, 2959.0, 5345.0, 9810.0, 19461.0, 48792.0, 213758.0, 551086.0, 122410.0, 35355.0, 15679.0, 8006.0, 4373.0, 2598.0, 1429.0, 934.0, 624.0, 367.0, 243.0, 193.0, 107.0, 64.0, 43.0, 43.0, 23.0, 20.0, 17.0, 9.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3125, -13.895751953125, -13.47900390625, -13.062255859375, -12.6455078125, -12.228759765625, -11.81201171875, -11.395263671875, -10.978515625, -10.561767578125, -10.14501953125, -9.728271484375, -9.3115234375, -8.894775390625, -8.47802734375, -8.061279296875, -7.64453125, -7.227783203125, -6.81103515625, -6.394287109375, -5.9775390625, -5.560791015625, -5.14404296875, -4.727294921875, -4.310546875, -3.893798828125, -3.47705078125, -3.060302734375, -2.6435546875, -2.226806640625, -1.81005859375, -1.393310546875, -0.9765625, -0.559814453125, -0.14306640625, 0.273681640625, 0.6904296875, 1.107177734375, 1.52392578125, 1.940673828125, 2.357421875, 2.774169921875, 3.19091796875, 3.607666015625, 4.0244140625, 4.441162109375, 4.85791015625, 5.274658203125, 5.69140625, 6.108154296875, 6.52490234375, 6.941650390625, 7.3583984375, 7.775146484375, 8.19189453125, 8.608642578125, 9.025390625, 9.442138671875, 9.85888671875, 10.275634765625, 10.6923828125, 11.109130859375, 11.52587890625, 11.942626953125, 12.359375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 9.0, 12.0, 13.0, 18.0, 24.0, 32.0, 49.0, 70.0, 113.0, 141.0, 139.0, 126.0, 82.0, 50.0, 19.0, 28.0, 11.0, 12.0, 7.0, 5.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009908676147460938, -0.00096091628074646, -0.0009309649467468262, -0.0009010136127471924, -0.0008710622787475586, -0.0008411109447479248, -0.000811159610748291, -0.0007812082767486572, -0.0007512569427490234, -0.0007213056087493896, -0.0006913542747497559, -0.0006614029407501221, -0.0006314516067504883, -0.0006015002727508545, -0.0005715489387512207, -0.0005415976047515869, -0.0005116462707519531, -0.00048169493675231934, -0.00045174360275268555, -0.00042179226875305176, -0.00039184093475341797, -0.0003618896007537842, -0.0003319382667541504, -0.0003019869327545166, -0.0002720355987548828, -0.00024208426475524902, -0.00021213293075561523, -0.00018218159675598145, -0.00015223026275634766, -0.00012227892875671387, -9.232759475708008e-05, -6.237626075744629e-05, -3.24249267578125e-05, -2.473592758178711e-06, 2.7477741241455078e-05, 5.742907524108887e-05, 8.738040924072266e-05, 0.00011733174324035645, 0.00014728307723999023, 0.00017723441123962402, 0.0002071857452392578, 0.0002371370792388916, 0.0002670884132385254, 0.0002970397472381592, 0.00032699108123779297, 0.00035694241523742676, 0.00038689374923706055, 0.00041684508323669434, 0.0004467964172363281, 0.0004767477512359619, 0.0005066990852355957, 0.0005366504192352295, 0.0005666017532348633, 0.0005965530872344971, 0.0006265044212341309, 0.0006564557552337646, 0.0006864070892333984, 0.0007163584232330322, 0.000746309757232666, 0.0007762610912322998, 0.0008062124252319336, 0.0008361637592315674, 0.0008661150932312012, 0.000896066427230835, 0.0009260177612304688]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 10.0, 9.0, 11.0, 20.0, 31.0, 34.0, 53.0, 78.0, 98.0, 159.0, 241.0, 288.0, 448.0, 662.0, 1049.0, 1725.0, 2780.0, 4765.0, 8628.0, 17504.0, 41027.0, 140454.0, 494248.0, 229069.0, 57460.0, 22154.0, 10602.0, 5833.0, 3290.0, 2029.0, 1243.0, 839.0, 549.0, 330.0, 260.0, 168.0, 125.0, 95.0, 58.0, 31.0, 23.0, 17.0, 14.0, 8.0, 15.0, 9.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-10.859375, -10.5367431640625, -10.214111328125, -9.8914794921875, -9.56884765625, -9.2462158203125, -8.923583984375, -8.6009521484375, -8.2783203125, -7.9556884765625, -7.633056640625, -7.3104248046875, -6.98779296875, -6.6651611328125, -6.342529296875, -6.0198974609375, -5.697265625, -5.3746337890625, -5.052001953125, -4.7293701171875, -4.40673828125, -4.0841064453125, -3.761474609375, -3.4388427734375, -3.1162109375, -2.7935791015625, -2.470947265625, -2.1483154296875, -1.82568359375, -1.5030517578125, -1.180419921875, -0.8577880859375, -0.53515625, -0.2125244140625, 0.110107421875, 0.4327392578125, 0.75537109375, 1.0780029296875, 1.400634765625, 1.7232666015625, 2.0458984375, 2.3685302734375, 2.691162109375, 3.0137939453125, 3.33642578125, 3.6590576171875, 3.981689453125, 4.3043212890625, 4.626953125, 4.9495849609375, 5.272216796875, 5.5948486328125, 5.91748046875, 6.2401123046875, 6.562744140625, 6.8853759765625, 7.2080078125, 7.5306396484375, 7.853271484375, 8.1759033203125, 8.49853515625, 8.8211669921875, 9.143798828125, 9.4664306640625, 9.7890625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 3.0, 9.0, 6.0, 9.0, 12.0, 18.0, 15.0, 19.0, 22.0, 36.0, 51.0, 53.0, 70.0, 103.0, 110.0, 82.0, 86.0, 63.0, 49.0, 38.0, 35.0, 30.0, 13.0, 16.0, 6.0, 9.0, 5.0, 2.0, 2.0, 3.0, 9.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.0859375, -2.0260162353515625, -1.966094970703125, -1.9061737060546875, -1.84625244140625, -1.7863311767578125, -1.726409912109375, -1.6664886474609375, -1.6065673828125, -1.5466461181640625, -1.486724853515625, -1.4268035888671875, -1.36688232421875, -1.3069610595703125, -1.247039794921875, -1.1871185302734375, -1.127197265625, -1.0672760009765625, -1.007354736328125, -0.9474334716796875, -0.88751220703125, -0.8275909423828125, -0.767669677734375, -0.7077484130859375, -0.6478271484375, -0.5879058837890625, -0.527984619140625, -0.4680633544921875, -0.40814208984375, -0.3482208251953125, -0.288299560546875, -0.2283782958984375, -0.16845703125, -0.1085357666015625, -0.048614501953125, 0.0113067626953125, 0.07122802734375, 0.1311492919921875, 0.191070556640625, 0.2509918212890625, 0.3109130859375, 0.3708343505859375, 0.430755615234375, 0.4906768798828125, 0.55059814453125, 0.6105194091796875, 0.670440673828125, 0.7303619384765625, 0.790283203125, 0.8502044677734375, 0.910125732421875, 0.9700469970703125, 1.02996826171875, 1.0898895263671875, 1.149810791015625, 1.2097320556640625, 1.2696533203125, 1.3295745849609375, 1.389495849609375, 1.4494171142578125, 1.50933837890625, 1.5692596435546875, 1.629180908203125, 1.6891021728515625, 1.7490234375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 6.0, 3.0, 8.0, 12.0, 12.0, 19.0, 14.0, 22.0, 15.0, 26.0, 40.0, 34.0, 50.0, 58.0, 65.0, 72.0, 72.0, 65.0, 74.0, 72.0, 50.0, 43.0, 27.0, 39.0, 25.0, 21.0, 10.0, 12.0, 7.0, 5.0, 7.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.956976890563965, -6.702872276306152, -6.44876766204834, -6.194663047790527, -5.940558433532715, -5.686453819274902, -5.432348728179932, -5.178244113922119, -4.924139499664307, -4.670034885406494, -4.415930271148682, -4.161825656890869, -3.9077208042144775, -3.653616189956665, -3.3995113372802734, -3.145406723022461, -2.8913021087646484, -2.637197494506836, -2.3830928802490234, -2.128988027572632, -1.8748834133148193, -1.6207787990570068, -1.3666740655899048, -1.1125693321228027, -0.8584647178649902, -0.604360044002533, -0.3502553701400757, -0.09615069627761841, 0.15795397758483887, 0.41205859184265137, 0.6661633253097534, 0.9202680587768555, 1.1743736267089844, 1.4284782409667969, 1.682582974433899, 1.936687707901001, 2.1907923221588135, 2.444896936416626, 2.6990017890930176, 2.95310640335083, 3.2072110176086426, 3.461315631866455, 3.7154202461242676, 3.969525098800659, 4.223629951477051, 4.477734565734863, 4.731839179992676, 4.985943794250488, 5.240048408508301, 5.494153022766113, 5.748257637023926, 6.002362251281738, 6.256466865539551, 6.510571479797363, 6.764676570892334, 7.0187811851501465, 7.272885799407959, 7.5269904136657715, 7.781095027923584, 8.035200119018555, 8.289304733276367, 8.54340934753418, 8.797513961791992, 9.051618576049805, 9.305723190307617]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 7.0, 11.0, 12.0, 15.0, 15.0, 19.0, 21.0, 29.0, 35.0, 35.0, 27.0, 32.0, 40.0, 39.0, 55.0, 33.0, 46.0, 36.0, 39.0, 36.0, 38.0, 48.0, 46.0, 31.0, 43.0, 21.0, 31.0, 23.0, 19.0, 9.0, 18.0, 12.0, 11.0, 9.0, 8.0, 6.0, 9.0, 1.0, 9.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3813626766204834, -3.2690913677215576, -3.156820058822632, -3.044548749923706, -2.9322774410247803, -2.8200061321258545, -2.7077348232269287, -2.595463514328003, -2.483192205429077, -2.3709208965301514, -2.2586495876312256, -2.1463782787323, -2.034106969833374, -1.9218356609344482, -1.8095643520355225, -1.6972930431365967, -1.5850216150283813, -1.4727503061294556, -1.3604789972305298, -1.248207688331604, -1.1359363794326782, -1.023664951324463, -0.9113937020301819, -0.7991223931312561, -0.6868510842323303, -0.5745797753334045, -0.46230846643447876, -0.3500371277332306, -0.2377658188343048, -0.12549448013305664, -0.01322317123413086, 0.09904813766479492, 0.2113194465637207, 0.3235907554626465, 0.43586206436157227, 0.548133373260498, 0.6604046821594238, 0.7726760506629944, 0.8849473595619202, 0.997218668460846, 1.109489917755127, 1.2217612266540527, 1.3340325355529785, 1.4463038444519043, 1.55857515335083, 1.6708464622497559, 1.7831177711486816, 1.8953890800476074, 2.007660388946533, 2.119931697845459, 2.2322030067443848, 2.3444743156433105, 2.4567456245422363, 2.569016933441162, 2.681288242340088, 2.7935595512390137, 2.9058310985565186, 3.0181024074554443, 3.13037371635437, 3.242645025253296, 3.3549163341522217, 3.4671876430511475, 3.5794589519500732, 3.691730260848999, 3.804001569747925]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 5.0, 12.0, 13.0, 13.0, 20.0, 33.0, 39.0, 46.0, 69.0, 113.0, 179.0, 246.0, 384.0, 521.0, 797.0, 1181.0, 1789.0, 2875.0, 4694.0, 7763.0, 13901.0, 26439.0, 55801.0, 139312.0, 419863.0, 1257042.0, 1432856.0, 528031.0, 168586.0, 65122.0, 29888.0, 15279.0, 8354.0, 4866.0, 2848.0, 1860.0, 1151.0, 728.0, 511.0, 346.0, 213.0, 155.0, 110.0, 85.0, 51.0, 40.0, 29.0, 10.0, 13.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.75, -8.485595703125, -8.22119140625, -7.956787109375, -7.6923828125, -7.427978515625, -7.16357421875, -6.899169921875, -6.634765625, -6.370361328125, -6.10595703125, -5.841552734375, -5.5771484375, -5.312744140625, -5.04833984375, -4.783935546875, -4.51953125, -4.255126953125, -3.99072265625, -3.726318359375, -3.4619140625, -3.197509765625, -2.93310546875, -2.668701171875, -2.404296875, -2.139892578125, -1.87548828125, -1.611083984375, -1.3466796875, -1.082275390625, -0.81787109375, -0.553466796875, -0.2890625, -0.024658203125, 0.23974609375, 0.504150390625, 0.7685546875, 1.032958984375, 1.29736328125, 1.561767578125, 1.826171875, 2.090576171875, 2.35498046875, 2.619384765625, 2.8837890625, 3.148193359375, 3.41259765625, 3.677001953125, 3.94140625, 4.205810546875, 4.47021484375, 4.734619140625, 4.9990234375, 5.263427734375, 5.52783203125, 5.792236328125, 6.056640625, 6.321044921875, 6.58544921875, 6.849853515625, 7.1142578125, 7.378662109375, 7.64306640625, 7.907470703125, 8.171875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 5.0, 7.0, 7.0, 9.0, 13.0, 11.0, 17.0, 29.0, 17.0, 14.0, 27.0, 33.0, 30.0, 26.0, 37.0, 45.0, 43.0, 31.0, 49.0, 47.0, 45.0, 40.0, 42.0, 48.0, 40.0, 35.0, 40.0, 24.0, 35.0, 26.0, 16.0, 15.0, 18.0, 10.0, 17.0, 8.0, 5.0, 13.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.21484375, -3.117340087890625, -3.01983642578125, -2.922332763671875, -2.8248291015625, -2.727325439453125, -2.62982177734375, -2.532318115234375, -2.434814453125, -2.337310791015625, -2.23980712890625, -2.142303466796875, -2.0447998046875, -1.947296142578125, -1.84979248046875, -1.752288818359375, -1.65478515625, -1.557281494140625, -1.45977783203125, -1.362274169921875, -1.2647705078125, -1.167266845703125, -1.06976318359375, -0.972259521484375, -0.874755859375, -0.777252197265625, -0.67974853515625, -0.582244873046875, -0.4847412109375, -0.387237548828125, -0.28973388671875, -0.192230224609375, -0.0947265625, 0.002777099609375, 0.10028076171875, 0.197784423828125, 0.2952880859375, 0.392791748046875, 0.49029541015625, 0.587799072265625, 0.685302734375, 0.782806396484375, 0.88031005859375, 0.977813720703125, 1.0753173828125, 1.172821044921875, 1.27032470703125, 1.367828369140625, 1.46533203125, 1.562835693359375, 1.66033935546875, 1.757843017578125, 1.8553466796875, 1.952850341796875, 2.05035400390625, 2.147857666015625, 2.245361328125, 2.342864990234375, 2.44036865234375, 2.537872314453125, 2.6353759765625, 2.732879638671875, 2.83038330078125, 2.927886962890625, 3.025390625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 8.0, 9.0, 20.0, 16.0, 34.0, 43.0, 67.0, 72.0, 127.0, 151.0, 188.0, 327.0, 483.0, 772.0, 1200.0, 1780.0, 3028.0, 5455.0, 9550.0, 17925.0, 34234.0, 70808.0, 162179.0, 424824.0, 1200365.0, 1381444.0, 520855.0, 192184.0, 82190.0, 38743.0, 19358.0, 10567.0, 5845.0, 3409.0, 2080.0, 1302.0, 845.0, 528.0, 411.0, 220.0, 182.0, 132.0, 81.0, 66.0, 50.0, 42.0, 21.0, 15.0, 14.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 4.0, 2.0], "bins": [-9.3828125, -9.0904541015625, -8.798095703125, -8.5057373046875, -8.21337890625, -7.9210205078125, -7.628662109375, -7.3363037109375, -7.0439453125, -6.7515869140625, -6.459228515625, -6.1668701171875, -5.87451171875, -5.5821533203125, -5.289794921875, -4.9974365234375, -4.705078125, -4.4127197265625, -4.120361328125, -3.8280029296875, -3.53564453125, -3.2432861328125, -2.950927734375, -2.6585693359375, -2.3662109375, -2.0738525390625, -1.781494140625, -1.4891357421875, -1.19677734375, -0.9044189453125, -0.612060546875, -0.3197021484375, -0.02734375, 0.2650146484375, 0.557373046875, 0.8497314453125, 1.14208984375, 1.4344482421875, 1.726806640625, 2.0191650390625, 2.3115234375, 2.6038818359375, 2.896240234375, 3.1885986328125, 3.48095703125, 3.7733154296875, 4.065673828125, 4.3580322265625, 4.650390625, 4.9427490234375, 5.235107421875, 5.5274658203125, 5.81982421875, 6.1121826171875, 6.404541015625, 6.6968994140625, 6.9892578125, 7.2816162109375, 7.573974609375, 7.8663330078125, 8.15869140625, 8.4510498046875, 8.743408203125, 9.0357666015625, 9.328125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 10.0, 11.0, 13.0, 18.0, 15.0, 32.0, 34.0, 48.0, 77.0, 97.0, 146.0, 203.0, 262.0, 333.0, 382.0, 416.0, 441.0, 336.0, 288.0, 225.0, 193.0, 129.0, 108.0, 57.0, 59.0, 33.0, 30.0, 24.0, 16.0, 9.0, 7.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.21875, -3.133209228515625, -3.04766845703125, -2.962127685546875, -2.8765869140625, -2.791046142578125, -2.70550537109375, -2.619964599609375, -2.534423828125, -2.448883056640625, -2.36334228515625, -2.277801513671875, -2.1922607421875, -2.106719970703125, -2.02117919921875, -1.935638427734375, -1.85009765625, -1.764556884765625, -1.67901611328125, -1.593475341796875, -1.5079345703125, -1.422393798828125, -1.33685302734375, -1.251312255859375, -1.165771484375, -1.080230712890625, -0.99468994140625, -0.909149169921875, -0.8236083984375, -0.738067626953125, -0.65252685546875, -0.566986083984375, -0.4814453125, -0.395904541015625, -0.31036376953125, -0.224822998046875, -0.1392822265625, -0.053741455078125, 0.03179931640625, 0.117340087890625, 0.202880859375, 0.288421630859375, 0.37396240234375, 0.459503173828125, 0.5450439453125, 0.630584716796875, 0.71612548828125, 0.801666259765625, 0.88720703125, 0.972747802734375, 1.05828857421875, 1.143829345703125, 1.2293701171875, 1.314910888671875, 1.40045166015625, 1.485992431640625, 1.571533203125, 1.657073974609375, 1.74261474609375, 1.828155517578125, 1.9136962890625, 1.999237060546875, 2.08477783203125, 2.170318603515625, 2.255859375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 10.0, 16.0, 17.0, 21.0, 29.0, 32.0, 39.0, 65.0, 63.0, 79.0, 80.0, 84.0, 75.0, 59.0, 62.0, 64.0, 37.0, 28.0, 27.0, 22.0, 16.0, 14.0, 7.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.55660343170166, -9.277507781982422, -8.998412132263184, -8.719316482543945, -8.44021987915039, -8.161124229431152, -7.882028579711914, -7.602932929992676, -7.3238372802734375, -7.044741630554199, -6.765645503997803, -6.4865498542785645, -6.207454204559326, -5.92835807800293, -5.649262428283691, -5.370166778564453, -5.091070652008057, -4.811975002288818, -4.532878875732422, -4.253783226013184, -3.9746875762939453, -3.695591688156128, -3.4164958000183105, -3.1374001502990723, -2.858304262161255, -2.5792083740234375, -2.300112724304199, -2.021016836166382, -1.741921067237854, -1.4628252983093262, -1.1837294101715088, -0.904633641242981, -0.6255378723144531, -0.3464420735836029, -0.06734627485275269, 0.21174955368041992, 0.49084532260894775, 0.7699410915374756, 1.049036979675293, 1.3281327486038208, 1.6072285175323486, 1.8863242864608765, 2.1654200553894043, 2.4445159435272217, 2.723611831665039, 3.0027074813842773, 3.2818033695220947, 3.560899257659912, 3.8399949073791504, 4.119090557098389, 4.398186683654785, 4.677282333374023, 4.956377983093262, 5.2354736328125, 5.5145697593688965, 5.793665409088135, 6.072761535644531, 6.3518571853637695, 6.630953311920166, 6.910048961639404, 7.189144611358643, 7.468240737915039, 7.747336387634277, 8.026432037353516, 8.305527687072754]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 10.0, 7.0, 10.0, 18.0, 14.0, 14.0, 19.0, 23.0, 27.0, 30.0, 33.0, 39.0, 39.0, 40.0, 40.0, 53.0, 44.0, 50.0, 42.0, 44.0, 51.0, 43.0, 35.0, 40.0, 39.0, 36.0, 28.0, 19.0, 24.0, 15.0, 10.0, 16.0, 7.0, 6.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.077478408813477, -3.9431145191192627, -3.808750867843628, -3.674386978149414, -3.5400233268737793, -3.4056594371795654, -3.2712955474853516, -3.136931896209717, -3.002568244934082, -2.868204355239868, -2.7338407039642334, -2.5994768142700195, -2.4651131629943848, -2.330749273300171, -2.196385383605957, -2.0620217323303223, -1.9276578426361084, -1.793294072151184, -1.6589303016662598, -1.524566411972046, -1.3902027606964111, -1.2558388710021973, -1.121475100517273, -0.9871113300323486, -0.8527475595474243, -0.7183837890625, -0.5840200185775757, -0.4496561884880066, -0.3152924180030823, -0.18092864751815796, -0.04656481742858887, 0.08779895305633545, 0.22216272354125977, 0.3565264940261841, 0.4908902943134308, 0.6252540946006775, 0.7596178650856018, 0.8939816355705261, 1.0283454656600952, 1.1627092361450195, 1.2970730066299438, 1.4314367771148682, 1.5658005475997925, 1.7001643180847168, 1.8345282077789307, 1.9688918590545654, 2.1032557487487793, 2.237619400024414, 2.371983289718628, 2.506347179412842, 2.6407108306884766, 2.7750747203826904, 2.909438371658325, 3.043802261352539, 3.178165912628174, 3.3125298023223877, 3.4468936920166016, 3.5812575817108154, 3.71562123298645, 3.849985122680664, 3.984348773956299, 4.118712425231934, 4.253076553344727, 4.387440204620361, 4.521803855895996]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 9.0, 16.0, 25.0, 28.0, 37.0, 68.0, 79.0, 121.0, 158.0, 274.0, 401.0, 636.0, 922.0, 1471.0, 2352.0, 3673.0, 6217.0, 10722.0, 18403.0, 32396.0, 57982.0, 102301.0, 165611.0, 207505.0, 175798.0, 112129.0, 63721.0, 35732.0, 20012.0, 11784.0, 6842.0, 4100.0, 2460.0, 1536.0, 1055.0, 654.0, 429.0, 296.0, 171.0, 122.0, 80.0, 71.0, 44.0, 34.0, 17.0, 21.0, 14.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.822265625, -2.72998046875, -2.6376953125, -2.54541015625, -2.453125, -2.36083984375, -2.2685546875, -2.17626953125, -2.083984375, -1.99169921875, -1.8994140625, -1.80712890625, -1.71484375, -1.62255859375, -1.5302734375, -1.43798828125, -1.345703125, -1.25341796875, -1.1611328125, -1.06884765625, -0.9765625, -0.88427734375, -0.7919921875, -0.69970703125, -0.607421875, -0.51513671875, -0.4228515625, -0.33056640625, -0.23828125, -0.14599609375, -0.0537109375, 0.03857421875, 0.130859375, 0.22314453125, 0.3154296875, 0.40771484375, 0.5, 0.59228515625, 0.6845703125, 0.77685546875, 0.869140625, 0.96142578125, 1.0537109375, 1.14599609375, 1.23828125, 1.33056640625, 1.4228515625, 1.51513671875, 1.607421875, 1.69970703125, 1.7919921875, 1.88427734375, 1.9765625, 2.06884765625, 2.1611328125, 2.25341796875, 2.345703125, 2.43798828125, 2.5302734375, 2.62255859375, 2.71484375, 2.80712890625, 2.8994140625, 2.99169921875, 3.083984375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 5.0, 6.0, 8.0, 9.0, 10.0, 17.0, 22.0, 27.0, 22.0, 32.0, 29.0, 32.0, 24.0, 42.0, 48.0, 43.0, 40.0, 45.0, 57.0, 41.0, 42.0, 43.0, 41.0, 48.0, 31.0, 46.0, 37.0, 27.0, 24.0, 19.0, 10.0, 12.0, 11.0, 14.0, 5.0, 7.0, 3.0, 7.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.5909423828125, -4.439697265625, -4.2884521484375, -4.13720703125, -3.9859619140625, -3.834716796875, -3.6834716796875, -3.5322265625, -3.3809814453125, -3.229736328125, -3.0784912109375, -2.92724609375, -2.7760009765625, -2.624755859375, -2.4735107421875, -2.322265625, -2.1710205078125, -2.019775390625, -1.8685302734375, -1.71728515625, -1.5660400390625, -1.414794921875, -1.2635498046875, -1.1123046875, -0.9610595703125, -0.809814453125, -0.6585693359375, -0.50732421875, -0.3560791015625, -0.204833984375, -0.0535888671875, 0.09765625, 0.2489013671875, 0.400146484375, 0.5513916015625, 0.70263671875, 0.8538818359375, 1.005126953125, 1.1563720703125, 1.3076171875, 1.4588623046875, 1.610107421875, 1.7613525390625, 1.91259765625, 2.0638427734375, 2.215087890625, 2.3663330078125, 2.517578125, 2.6688232421875, 2.820068359375, 2.9713134765625, 3.12255859375, 3.2738037109375, 3.425048828125, 3.5762939453125, 3.7275390625, 3.8787841796875, 4.030029296875, 4.1812744140625, 4.33251953125, 4.4837646484375, 4.635009765625, 4.7862548828125, 4.9375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 7.0, 8.0, 10.0, 13.0, 23.0, 31.0, 23.0, 53.0, 87.0, 131.0, 181.0, 314.0, 448.0, 722.0, 1145.0, 1783.0, 2761.0, 4676.0, 7914.0, 13679.0, 24098.0, 43638.0, 81320.0, 150105.0, 235005.0, 209150.0, 122133.0, 65761.0, 35290.0, 19651.0, 11280.0, 6613.0, 3922.0, 2385.0, 1503.0, 930.0, 630.0, 410.0, 255.0, 162.0, 109.0, 52.0, 50.0, 38.0, 15.0, 15.0, 14.0, 11.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310546875, -3.195709228515625, -3.08087158203125, -2.966033935546875, -2.8511962890625, -2.736358642578125, -2.62152099609375, -2.506683349609375, -2.391845703125, -2.277008056640625, -2.16217041015625, -2.047332763671875, -1.9324951171875, -1.817657470703125, -1.70281982421875, -1.587982177734375, -1.47314453125, -1.358306884765625, -1.24346923828125, -1.128631591796875, -1.0137939453125, -0.898956298828125, -0.78411865234375, -0.669281005859375, -0.554443359375, -0.439605712890625, -0.32476806640625, -0.209930419921875, -0.0950927734375, 0.019744873046875, 0.13458251953125, 0.249420166015625, 0.3642578125, 0.479095458984375, 0.59393310546875, 0.708770751953125, 0.8236083984375, 0.938446044921875, 1.05328369140625, 1.168121337890625, 1.282958984375, 1.397796630859375, 1.51263427734375, 1.627471923828125, 1.7423095703125, 1.857147216796875, 1.97198486328125, 2.086822509765625, 2.20166015625, 2.316497802734375, 2.43133544921875, 2.546173095703125, 2.6610107421875, 2.775848388671875, 2.89068603515625, 3.005523681640625, 3.120361328125, 3.235198974609375, 3.35003662109375, 3.464874267578125, 3.5797119140625, 3.694549560546875, 3.80938720703125, 3.924224853515625, 4.0390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 1.0, 7.0, 12.0, 5.0, 13.0, 13.0, 12.0, 19.0, 23.0, 30.0, 26.0, 32.0, 31.0, 27.0, 27.0, 42.0, 35.0, 50.0, 38.0, 41.0, 42.0, 46.0, 45.0, 52.0, 42.0, 39.0, 35.0, 32.0, 21.0, 25.0, 23.0, 16.0, 23.0, 15.0, 13.0, 4.0, 11.0, 7.0, 12.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0], "bins": [-2.615234375, -2.537750244140625, -2.46026611328125, -2.382781982421875, -2.3052978515625, -2.227813720703125, -2.15032958984375, -2.072845458984375, -1.995361328125, -1.917877197265625, -1.84039306640625, -1.762908935546875, -1.6854248046875, -1.607940673828125, -1.53045654296875, -1.452972412109375, -1.37548828125, -1.298004150390625, -1.22052001953125, -1.143035888671875, -1.0655517578125, -0.988067626953125, -0.91058349609375, -0.833099365234375, -0.755615234375, -0.678131103515625, -0.60064697265625, -0.523162841796875, -0.4456787109375, -0.368194580078125, -0.29071044921875, -0.213226318359375, -0.1357421875, -0.058258056640625, 0.01922607421875, 0.096710205078125, 0.1741943359375, 0.251678466796875, 0.32916259765625, 0.406646728515625, 0.484130859375, 0.561614990234375, 0.63909912109375, 0.716583251953125, 0.7940673828125, 0.871551513671875, 0.94903564453125, 1.026519775390625, 1.10400390625, 1.181488037109375, 1.25897216796875, 1.336456298828125, 1.4139404296875, 1.491424560546875, 1.56890869140625, 1.646392822265625, 1.723876953125, 1.801361083984375, 1.87884521484375, 1.956329345703125, 2.0338134765625, 2.111297607421875, 2.18878173828125, 2.266265869140625, 2.34375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 7.0, 19.0, 28.0, 33.0, 43.0, 60.0, 109.0, 122.0, 203.0, 279.0, 401.0, 606.0, 956.0, 1505.0, 2305.0, 3708.0, 5984.0, 10273.0, 17457.0, 30342.0, 54179.0, 98339.0, 170515.0, 229097.0, 179858.0, 104831.0, 58294.0, 32510.0, 18302.0, 10928.0, 6312.0, 3859.0, 2464.0, 1615.0, 978.0, 675.0, 400.0, 305.0, 194.0, 132.0, 98.0, 78.0, 41.0, 31.0, 14.0, 20.0, 9.0, 11.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.609375, -1.5599365234375, -1.510498046875, -1.4610595703125, -1.41162109375, -1.3621826171875, -1.312744140625, -1.2633056640625, -1.2138671875, -1.1644287109375, -1.114990234375, -1.0655517578125, -1.01611328125, -0.9666748046875, -0.917236328125, -0.8677978515625, -0.818359375, -0.7689208984375, -0.719482421875, -0.6700439453125, -0.62060546875, -0.5711669921875, -0.521728515625, -0.4722900390625, -0.4228515625, -0.3734130859375, -0.323974609375, -0.2745361328125, -0.22509765625, -0.1756591796875, -0.126220703125, -0.0767822265625, -0.02734375, 0.0220947265625, 0.071533203125, 0.1209716796875, 0.17041015625, 0.2198486328125, 0.269287109375, 0.3187255859375, 0.3681640625, 0.4176025390625, 0.467041015625, 0.5164794921875, 0.56591796875, 0.6153564453125, 0.664794921875, 0.7142333984375, 0.763671875, 0.8131103515625, 0.862548828125, 0.9119873046875, 0.96142578125, 1.0108642578125, 1.060302734375, 1.1097412109375, 1.1591796875, 1.2086181640625, 1.258056640625, 1.3074951171875, 1.35693359375, 1.4063720703125, 1.455810546875, 1.5052490234375, 1.5546875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 9.0, 19.0, 13.0, 20.0, 27.0, 26.0, 44.0, 72.0, 74.0, 62.0, 98.0, 92.0, 76.0, 73.0, 63.0, 46.0, 40.0, 31.0, 20.0, 19.0, 18.0, 16.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00013518333435058594, -0.0001317458227276802, -0.00012830831110477448, -0.00012487079948186874, -0.00012143328785896301, -0.00011799577623605728, -0.00011455826461315155, -0.00011112075299024582, -0.00010768324136734009, -0.00010424572974443436, -0.00010080821812152863, -9.73707064986229e-05, -9.393319487571716e-05, -9.049568325281143e-05, -8.70581716299057e-05, -8.362066000699997e-05, -8.018314838409424e-05, -7.674563676118851e-05, -7.330812513828278e-05, -6.987061351537704e-05, -6.643310189247131e-05, -6.299559026956558e-05, -5.955807864665985e-05, -5.612056702375412e-05, -5.268305540084839e-05, -4.924554377794266e-05, -4.5808032155036926e-05, -4.2370520532131195e-05, -3.8933008909225464e-05, -3.549549728631973e-05, -3.2057985663414e-05, -2.862047404050827e-05, -2.518296241760254e-05, -2.1745450794696808e-05, -1.8307939171791077e-05, -1.4870427548885345e-05, -1.1432915925979614e-05, -7.995404303073883e-06, -4.557892680168152e-06, -1.1203810572624207e-06, 2.3171305656433105e-06, 5.754642188549042e-06, 9.192153811454773e-06, 1.2629665434360504e-05, 1.6067177057266235e-05, 1.9504688680171967e-05, 2.2942200303077698e-05, 2.637971192598343e-05, 2.981722354888916e-05, 3.325473517179489e-05, 3.669224679470062e-05, 4.0129758417606354e-05, 4.3567270040512085e-05, 4.7004781663417816e-05, 5.044229328632355e-05, 5.387980490922928e-05, 5.731731653213501e-05, 6.075482815504074e-05, 6.419233977794647e-05, 6.76298514008522e-05, 7.106736302375793e-05, 7.450487464666367e-05, 7.79423862695694e-05, 8.137989789247513e-05, 8.481740951538086e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 8.0, 5.0, 12.0, 9.0, 12.0, 21.0, 26.0, 37.0, 45.0, 73.0, 90.0, 145.0, 235.0, 337.0, 512.0, 665.0, 1140.0, 1684.0, 2628.0, 3846.0, 6214.0, 9982.0, 16001.0, 26234.0, 43169.0, 69919.0, 106909.0, 148048.0, 169440.0, 149065.0, 108178.0, 70043.0, 43531.0, 26206.0, 16151.0, 10039.0, 6365.0, 3919.0, 2562.0, 1603.0, 1116.0, 755.0, 536.0, 295.0, 234.0, 168.0, 122.0, 65.0, 51.0, 39.0, 22.0, 18.0, 9.0, 9.0, 8.0, 6.0, 4.0, 1.0, 3.0, 3.0], "bins": [-1.2509765625, -1.212493896484375, -1.17401123046875, -1.135528564453125, -1.0970458984375, -1.058563232421875, -1.02008056640625, -0.981597900390625, -0.943115234375, -0.904632568359375, -0.86614990234375, -0.827667236328125, -0.7891845703125, -0.750701904296875, -0.71221923828125, -0.673736572265625, -0.63525390625, -0.596771240234375, -0.55828857421875, -0.519805908203125, -0.4813232421875, -0.442840576171875, -0.40435791015625, -0.365875244140625, -0.327392578125, -0.288909912109375, -0.25042724609375, -0.211944580078125, -0.1734619140625, -0.134979248046875, -0.09649658203125, -0.058013916015625, -0.01953125, 0.018951416015625, 0.05743408203125, 0.095916748046875, 0.1343994140625, 0.172882080078125, 0.21136474609375, 0.249847412109375, 0.288330078125, 0.326812744140625, 0.36529541015625, 0.403778076171875, 0.4422607421875, 0.480743408203125, 0.51922607421875, 0.557708740234375, 0.59619140625, 0.634674072265625, 0.67315673828125, 0.711639404296875, 0.7501220703125, 0.788604736328125, 0.82708740234375, 0.865570068359375, 0.904052734375, 0.942535400390625, 0.98101806640625, 1.019500732421875, 1.0579833984375, 1.096466064453125, 1.13494873046875, 1.173431396484375, 1.2119140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 11.0, 1.0, 11.0, 7.0, 15.0, 9.0, 19.0, 17.0, 23.0, 21.0, 29.0, 41.0, 46.0, 53.0, 43.0, 61.0, 56.0, 59.0, 62.0, 51.0, 56.0, 38.0, 51.0, 35.0, 36.0, 27.0, 22.0, 20.0, 16.0, 12.0, 14.0, 9.0, 5.0, 3.0, 7.0, 8.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393798828125, -0.3816986083984375, -0.369598388671875, -0.3574981689453125, -0.34539794921875, -0.3332977294921875, -0.321197509765625, -0.3090972900390625, -0.2969970703125, -0.2848968505859375, -0.272796630859375, -0.2606964111328125, -0.24859619140625, -0.2364959716796875, -0.224395751953125, -0.2122955322265625, -0.2001953125, -0.1880950927734375, -0.175994873046875, -0.1638946533203125, -0.15179443359375, -0.1396942138671875, -0.127593994140625, -0.1154937744140625, -0.1033935546875, -0.0912933349609375, -0.079193115234375, -0.0670928955078125, -0.05499267578125, -0.0428924560546875, -0.030792236328125, -0.0186920166015625, -0.006591796875, 0.0055084228515625, 0.017608642578125, 0.0297088623046875, 0.04180908203125, 0.0539093017578125, 0.066009521484375, 0.0781097412109375, 0.0902099609375, 0.1023101806640625, 0.114410400390625, 0.1265106201171875, 0.13861083984375, 0.1507110595703125, 0.162811279296875, 0.1749114990234375, 0.18701171875, 0.1991119384765625, 0.211212158203125, 0.2233123779296875, 0.23541259765625, 0.2475128173828125, 0.259613037109375, 0.2717132568359375, 0.2838134765625, 0.2959136962890625, 0.308013916015625, 0.3201141357421875, 0.33221435546875, 0.3443145751953125, 0.356414794921875, 0.3685150146484375, 0.380615234375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 3.0, 9.0, 6.0, 15.0, 22.0, 27.0, 27.0, 37.0, 48.0, 67.0, 74.0, 94.0, 92.0, 87.0, 62.0, 62.0, 81.0, 34.0, 31.0, 22.0, 27.0, 12.0, 12.0, 8.0, 6.0, 5.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.351263999938965, -10.052410125732422, -9.753556251525879, -9.454703330993652, -9.15584945678711, -8.856995582580566, -8.558141708374023, -8.25928783416748, -7.960434436798096, -7.661580562591553, -7.362727165222168, -7.063873291015625, -6.765019416809082, -6.466166019439697, -6.167312145233154, -5.8684587478637695, -5.569604873657227, -5.270750999450684, -4.971897602081299, -4.673043727874756, -4.374190330505371, -4.075336456298828, -3.776482582092285, -3.4776289463043213, -3.1787753105163574, -2.8799216747283936, -2.5810680389404297, -2.2822141647338867, -1.9833605289459229, -1.684506893157959, -1.3856531381607056, -1.0867993831634521, -0.7879457473754883, -0.48909205198287964, -0.190238356590271, 0.10861533880233765, 0.4074690341949463, 0.7063226699829102, 1.0051764249801636, 1.304030179977417, 1.6028838157653809, 1.9017374515533447, 2.2005910873413086, 2.4994449615478516, 2.7982985973358154, 3.0971522331237793, 3.3960061073303223, 3.694859743118286, 3.99371337890625, 4.292567253112793, 4.591420650482178, 4.890274524688721, 5.1891279220581055, 5.487981796264648, 5.786835670471191, 6.085689544677734, 6.384542942047119, 6.683396816253662, 6.982250213623047, 7.28110408782959, 7.579957962036133, 7.878811359405518, 8.177664756774902, 8.476518630981445, 8.775372505187988]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 6.0, 4.0, 11.0, 10.0, 7.0, 23.0, 7.0, 17.0, 20.0, 23.0, 23.0, 38.0, 29.0, 40.0, 43.0, 39.0, 42.0, 55.0, 40.0, 45.0, 43.0, 47.0, 40.0, 46.0, 38.0, 41.0, 36.0, 35.0, 29.0, 23.0, 16.0, 17.0, 12.0, 9.0, 13.0, 4.0, 11.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.968970775604248, -3.8381659984588623, -3.7073612213134766, -3.5765562057495117, -3.445751428604126, -3.3149466514587402, -3.1841416358947754, -3.0533368587493896, -2.922532081604004, -2.791727304458618, -2.6609225273132324, -2.5301175117492676, -2.399312734603882, -2.268507957458496, -2.1377029418945312, -2.0068981647491455, -1.8760933876037598, -1.745288610458374, -1.6144837141036987, -1.4836788177490234, -1.3528740406036377, -1.222069263458252, -1.0912643671035767, -0.9604595303535461, -0.8296546936035156, -0.6988498568534851, -0.5680450201034546, -0.4372401833534241, -0.30643534660339355, -0.17563050985336304, -0.04482567310333252, 0.085979163646698, 0.21678447723388672, 0.34758931398391724, 0.47839415073394775, 0.6091989874839783, 0.7400038242340088, 0.8708086609840393, 1.0016134977340698, 1.1324183940887451, 1.2632231712341309, 1.3940279483795166, 1.524832844734192, 1.6556377410888672, 1.786442518234253, 1.9172472953796387, 2.0480523109436035, 2.1788570880889893, 2.309661865234375, 2.4404666423797607, 2.5712714195251465, 2.7020764350891113, 2.832881212234497, 2.963685989379883, 3.0944910049438477, 3.2252957820892334, 3.356100559234619, 3.486905336380005, 3.6177101135253906, 3.7485151290893555, 3.879319906234741, 4.010124683380127, 4.140929698944092, 4.271734237670898, 4.402539253234863]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 11.0, 12.0, 18.0, 13.0, 25.0, 45.0, 51.0, 53.0, 89.0, 134.0, 159.0, 187.0, 333.0, 440.0, 665.0, 1100.0, 1932.0, 3557.0, 7745.0, 19677.0, 55696.0, 164182.0, 354967.0, 275401.0, 102461.0, 34522.0, 12786.0, 5408.0, 2640.0, 1358.0, 857.0, 568.0, 408.0, 292.0, 195.0, 144.0, 99.0, 69.0, 68.0, 48.0, 27.0, 34.0, 16.0, 17.0, 8.0, 9.0, 7.0, 5.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-11.0625, -10.7349853515625, -10.407470703125, -10.0799560546875, -9.75244140625, -9.4249267578125, -9.097412109375, -8.7698974609375, -8.4423828125, -8.1148681640625, -7.787353515625, -7.4598388671875, -7.13232421875, -6.8048095703125, -6.477294921875, -6.1497802734375, -5.822265625, -5.4947509765625, -5.167236328125, -4.8397216796875, -4.51220703125, -4.1846923828125, -3.857177734375, -3.5296630859375, -3.2021484375, -2.8746337890625, -2.547119140625, -2.2196044921875, -1.89208984375, -1.5645751953125, -1.237060546875, -0.9095458984375, -0.58203125, -0.2545166015625, 0.072998046875, 0.4005126953125, 0.72802734375, 1.0555419921875, 1.383056640625, 1.7105712890625, 2.0380859375, 2.3656005859375, 2.693115234375, 3.0206298828125, 3.34814453125, 3.6756591796875, 4.003173828125, 4.3306884765625, 4.658203125, 4.9857177734375, 5.313232421875, 5.6407470703125, 5.96826171875, 6.2957763671875, 6.623291015625, 6.9508056640625, 7.2783203125, 7.6058349609375, 7.933349609375, 8.2608642578125, 8.58837890625, 8.9158935546875, 9.243408203125, 9.5709228515625, 9.8984375]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 4.0, 11.0, 15.0, 9.0, 22.0, 16.0, 21.0, 27.0, 37.0, 33.0, 24.0, 45.0, 33.0, 52.0, 52.0, 42.0, 61.0, 53.0, 36.0, 41.0, 44.0, 36.0, 33.0, 41.0, 28.0, 22.0, 23.0, 21.0, 24.0, 14.0, 17.0, 11.0, 9.0, 11.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.0692138671875, -3.923583984375, -3.7779541015625, -3.63232421875, -3.4866943359375, -3.341064453125, -3.1954345703125, -3.0498046875, -2.9041748046875, -2.758544921875, -2.6129150390625, -2.46728515625, -2.3216552734375, -2.176025390625, -2.0303955078125, -1.884765625, -1.7391357421875, -1.593505859375, -1.4478759765625, -1.30224609375, -1.1566162109375, -1.010986328125, -0.8653564453125, -0.7197265625, -0.5740966796875, -0.428466796875, -0.2828369140625, -0.13720703125, 0.0084228515625, 0.154052734375, 0.2996826171875, 0.4453125, 0.5909423828125, 0.736572265625, 0.8822021484375, 1.02783203125, 1.1734619140625, 1.319091796875, 1.4647216796875, 1.6103515625, 1.7559814453125, 1.901611328125, 2.0472412109375, 2.19287109375, 2.3385009765625, 2.484130859375, 2.6297607421875, 2.775390625, 2.9210205078125, 3.066650390625, 3.2122802734375, 3.35791015625, 3.5035400390625, 3.649169921875, 3.7947998046875, 3.9404296875, 4.0860595703125, 4.231689453125, 4.3773193359375, 4.52294921875, 4.6685791015625, 4.814208984375, 4.9598388671875, 5.10546875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 8.0, 12.0, 10.0, 13.0, 12.0, 25.0, 23.0, 35.0, 50.0, 68.0, 88.0, 135.0, 163.0, 263.0, 406.0, 548.0, 862.0, 1353.0, 2362.0, 4281.0, 8122.0, 16671.0, 35666.0, 78921.0, 168934.0, 270276.0, 232070.0, 120641.0, 55103.0, 25088.0, 12028.0, 5923.0, 3146.0, 1828.0, 1072.0, 687.0, 475.0, 292.0, 239.0, 197.0, 130.0, 92.0, 73.0, 40.0, 36.0, 21.0, 18.0, 7.0, 13.0, 10.0, 7.0, 4.0, 5.0, 3.0, 5.0], "bins": [-8.96875, -8.7108154296875, -8.452880859375, -8.1949462890625, -7.93701171875, -7.6790771484375, -7.421142578125, -7.1632080078125, -6.9052734375, -6.6473388671875, -6.389404296875, -6.1314697265625, -5.87353515625, -5.6156005859375, -5.357666015625, -5.0997314453125, -4.841796875, -4.5838623046875, -4.325927734375, -4.0679931640625, -3.81005859375, -3.5521240234375, -3.294189453125, -3.0362548828125, -2.7783203125, -2.5203857421875, -2.262451171875, -2.0045166015625, -1.74658203125, -1.4886474609375, -1.230712890625, -0.9727783203125, -0.71484375, -0.4569091796875, -0.198974609375, 0.0589599609375, 0.31689453125, 0.5748291015625, 0.832763671875, 1.0906982421875, 1.3486328125, 1.6065673828125, 1.864501953125, 2.1224365234375, 2.38037109375, 2.6383056640625, 2.896240234375, 3.1541748046875, 3.412109375, 3.6700439453125, 3.927978515625, 4.1859130859375, 4.44384765625, 4.7017822265625, 4.959716796875, 5.2176513671875, 5.4755859375, 5.7335205078125, 5.991455078125, 6.2493896484375, 6.50732421875, 6.7652587890625, 7.023193359375, 7.2811279296875, 7.5390625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 4.0, 7.0, 12.0, 19.0, 17.0, 24.0, 17.0, 25.0, 24.0, 20.0, 29.0, 33.0, 36.0, 39.0, 43.0, 38.0, 45.0, 46.0, 45.0, 34.0, 43.0, 34.0, 31.0, 38.0, 34.0, 36.0, 24.0, 23.0, 37.0, 27.0, 14.0, 14.0, 14.0, 14.0, 12.0, 12.0, 9.0, 6.0, 1.0, 1.0, 2.0, 8.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.9375, -2.852081298828125, -2.76666259765625, -2.681243896484375, -2.5958251953125, -2.510406494140625, -2.42498779296875, -2.339569091796875, -2.254150390625, -2.168731689453125, -2.08331298828125, -1.997894287109375, -1.9124755859375, -1.827056884765625, -1.74163818359375, -1.656219482421875, -1.57080078125, -1.485382080078125, -1.39996337890625, -1.314544677734375, -1.2291259765625, -1.143707275390625, -1.05828857421875, -0.972869873046875, -0.887451171875, -0.802032470703125, -0.71661376953125, -0.631195068359375, -0.5457763671875, -0.460357666015625, -0.37493896484375, -0.289520263671875, -0.2041015625, -0.118682861328125, -0.03326416015625, 0.052154541015625, 0.1375732421875, 0.222991943359375, 0.30841064453125, 0.393829345703125, 0.479248046875, 0.564666748046875, 0.65008544921875, 0.735504150390625, 0.8209228515625, 0.906341552734375, 0.99176025390625, 1.077178955078125, 1.16259765625, 1.248016357421875, 1.33343505859375, 1.418853759765625, 1.5042724609375, 1.589691162109375, 1.67510986328125, 1.760528564453125, 1.845947265625, 1.931365966796875, 2.01678466796875, 2.102203369140625, 2.1876220703125, 2.273040771484375, 2.35845947265625, 2.443878173828125, 2.529296875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 9.0, 9.0, 15.0, 17.0, 27.0, 37.0, 62.0, 90.0, 107.0, 166.0, 265.0, 465.0, 643.0, 1059.0, 1711.0, 2841.0, 4747.0, 8449.0, 15988.0, 32192.0, 71610.0, 193823.0, 385903.0, 189544.0, 70908.0, 31399.0, 15945.0, 8382.0, 4746.0, 2796.0, 1652.0, 1048.0, 680.0, 418.0, 285.0, 153.0, 126.0, 61.0, 46.0, 32.0, 29.0, 19.0, 15.0, 6.0, 4.0, 5.0, 7.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.5626220703125, -6.332275390625, -6.1019287109375, -5.87158203125, -5.6412353515625, -5.410888671875, -5.1805419921875, -4.9501953125, -4.7198486328125, -4.489501953125, -4.2591552734375, -4.02880859375, -3.7984619140625, -3.568115234375, -3.3377685546875, -3.107421875, -2.8770751953125, -2.646728515625, -2.4163818359375, -2.18603515625, -1.9556884765625, -1.725341796875, -1.4949951171875, -1.2646484375, -1.0343017578125, -0.803955078125, -0.5736083984375, -0.34326171875, -0.1129150390625, 0.117431640625, 0.3477783203125, 0.578125, 0.8084716796875, 1.038818359375, 1.2691650390625, 1.49951171875, 1.7298583984375, 1.960205078125, 2.1905517578125, 2.4208984375, 2.6512451171875, 2.881591796875, 3.1119384765625, 3.34228515625, 3.5726318359375, 3.802978515625, 4.0333251953125, 4.263671875, 4.4940185546875, 4.724365234375, 4.9547119140625, 5.18505859375, 5.4154052734375, 5.645751953125, 5.8760986328125, 6.1064453125, 6.3367919921875, 6.567138671875, 6.7974853515625, 7.02783203125, 7.2581787109375, 7.488525390625, 7.7188720703125, 7.94921875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 7.0, 12.0, 13.0, 23.0, 24.0, 28.0, 44.0, 78.0, 127.0, 165.0, 159.0, 96.0, 56.0, 45.0, 27.0, 17.0, 17.0, 12.0, 8.0, 6.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010614395141601562, -0.0010290443897247314, -0.0009966492652893066, -0.0009642541408538818, -0.000931859016418457, -0.0008994638919830322, -0.0008670687675476074, -0.0008346736431121826, -0.0008022785186767578, -0.000769883394241333, -0.0007374882698059082, -0.0007050931453704834, -0.0006726980209350586, -0.0006403028964996338, -0.000607907772064209, -0.0005755126476287842, -0.0005431175231933594, -0.0005107223987579346, -0.00047832727432250977, -0.00044593214988708496, -0.00041353702545166016, -0.00038114190101623535, -0.00034874677658081055, -0.00031635165214538574, -0.00028395652770996094, -0.00025156140327453613, -0.00021916627883911133, -0.00018677115440368652, -0.00015437602996826172, -0.00012198090553283691, -8.958578109741211e-05, -5.7190656661987305e-05, -2.47955322265625e-05, 7.599592208862305e-06, 3.999471664428711e-05, 7.238984107971191e-05, 0.00010478496551513672, 0.00013718008995056152, 0.00016957521438598633, 0.00020197033882141113, 0.00023436546325683594, 0.00026676058769226074, 0.00029915571212768555, 0.00033155083656311035, 0.00036394596099853516, 0.00039634108543395996, 0.00042873620986938477, 0.00046113133430480957, 0.0004935264587402344, 0.0005259215831756592, 0.000558316707611084, 0.0005907118320465088, 0.0006231069564819336, 0.0006555020809173584, 0.0006878972053527832, 0.000720292329788208, 0.0007526874542236328, 0.0007850825786590576, 0.0008174777030944824, 0.0008498728275299072, 0.000882267951965332, 0.0009146630764007568, 0.0009470582008361816, 0.0009794533252716064, 0.0010118484497070312]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 17.0, 16.0, 26.0, 33.0, 57.0, 80.0, 121.0, 203.0, 280.0, 417.0, 723.0, 1166.0, 1919.0, 3243.0, 5707.0, 10731.0, 21895.0, 49174.0, 130659.0, 352938.0, 289148.0, 100778.0, 40016.0, 17833.0, 8987.0, 4955.0, 2932.0, 1674.0, 1016.0, 671.0, 404.0, 263.0, 158.0, 104.0, 63.0, 46.0, 37.0, 15.0, 11.0, 12.0, 8.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.31640625, -6.09765625, -5.87890625, -5.66015625, -5.44140625, -5.22265625, -5.00390625, -4.78515625, -4.56640625, -4.34765625, -4.12890625, -3.91015625, -3.69140625, -3.47265625, -3.25390625, -3.03515625, -2.81640625, -2.59765625, -2.37890625, -2.16015625, -1.94140625, -1.72265625, -1.50390625, -1.28515625, -1.06640625, -0.84765625, -0.62890625, -0.41015625, -0.19140625, 0.02734375, 0.24609375, 0.46484375, 0.68359375, 0.90234375, 1.12109375, 1.33984375, 1.55859375, 1.77734375, 1.99609375, 2.21484375, 2.43359375, 2.65234375, 2.87109375, 3.08984375, 3.30859375, 3.52734375, 3.74609375, 3.96484375, 4.18359375, 4.40234375, 4.62109375, 4.83984375, 5.05859375, 5.27734375, 5.49609375, 5.71484375, 5.93359375, 6.15234375, 6.37109375, 6.58984375, 6.80859375, 7.02734375, 7.24609375, 7.46484375, 7.68359375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 9.0, 4.0, 5.0, 16.0, 10.0, 6.0, 20.0, 16.0, 18.0, 25.0, 28.0, 39.0, 49.0, 47.0, 63.0, 66.0, 72.0, 74.0, 65.0, 65.0, 51.0, 39.0, 35.0, 29.0, 27.0, 21.0, 14.0, 21.0, 13.0, 15.0, 9.0, 4.0, 2.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.9833984375, -0.95294189453125, -0.9224853515625, -0.89202880859375, -0.861572265625, -0.83111572265625, -0.8006591796875, -0.77020263671875, -0.73974609375, -0.70928955078125, -0.6788330078125, -0.64837646484375, -0.617919921875, -0.58746337890625, -0.5570068359375, -0.52655029296875, -0.49609375, -0.46563720703125, -0.4351806640625, -0.40472412109375, -0.374267578125, -0.34381103515625, -0.3133544921875, -0.28289794921875, -0.25244140625, -0.22198486328125, -0.1915283203125, -0.16107177734375, -0.130615234375, -0.10015869140625, -0.0697021484375, -0.03924560546875, -0.0087890625, 0.02166748046875, 0.0521240234375, 0.08258056640625, 0.113037109375, 0.14349365234375, 0.1739501953125, 0.20440673828125, 0.23486328125, 0.26531982421875, 0.2957763671875, 0.32623291015625, 0.356689453125, 0.38714599609375, 0.4176025390625, 0.44805908203125, 0.478515625, 0.50897216796875, 0.5394287109375, 0.56988525390625, 0.600341796875, 0.63079833984375, 0.6612548828125, 0.69171142578125, 0.72216796875, 0.75262451171875, 0.7830810546875, 0.81353759765625, 0.843994140625, 0.87445068359375, 0.9049072265625, 0.93536376953125, 0.9658203125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 4.0, 7.0, 11.0, 12.0, 19.0, 21.0, 15.0, 21.0, 32.0, 41.0, 51.0, 49.0, 78.0, 87.0, 74.0, 67.0, 70.0, 65.0, 50.0, 42.0, 39.0, 27.0, 32.0, 13.0, 10.0, 19.0, 8.0, 6.0, 3.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.361222267150879, -9.09194564819336, -8.822669982910156, -8.553393363952637, -8.284116744995117, -8.014841079711914, -7.7455644607543945, -7.476287841796875, -7.207011699676514, -6.937735557556152, -6.668458938598633, -6.3991827964782715, -6.12990665435791, -5.860630035400391, -5.591353893280029, -5.322077751159668, -5.052801132202148, -4.783524990081787, -4.514248371124268, -4.244972229003906, -3.975695848464966, -3.7064194679260254, -3.437143325805664, -3.1678669452667236, -2.898590564727783, -2.6293141841888428, -2.3600378036499023, -2.090761661529541, -1.8214852809906006, -1.5522089004516602, -1.2829326391220093, -1.0136563777923584, -0.7443790435791016, -0.4751027226448059, -0.20582640171051025, 0.0634499192237854, 0.33272624015808105, 0.6020026206970215, 0.8712788820266724, 1.1405551433563232, 1.4098315238952637, 1.679107904434204, 1.948384165763855, 2.217660427093506, 2.4869368076324463, 2.7562131881713867, 3.025489330291748, 3.2947657108306885, 3.564042091369629, 3.8333184719085693, 4.10259485244751, 4.371870994567871, 4.641147613525391, 4.910423755645752, 5.179699897766113, 5.448976516723633, 5.718252658843994, 5.9875288009643555, 6.256805419921875, 6.526081562042236, 6.795357704162598, 7.064634323120117, 7.3339104652404785, 7.60318660736084, 7.872463226318359]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 1.0, 7.0, 10.0, 7.0, 11.0, 5.0, 7.0, 19.0, 15.0, 21.0, 20.0, 29.0, 31.0, 32.0, 35.0, 38.0, 32.0, 37.0, 41.0, 35.0, 40.0, 53.0, 38.0, 41.0, 37.0, 46.0, 36.0, 41.0, 34.0, 31.0, 23.0, 31.0, 19.0, 10.0, 18.0, 9.0, 10.0, 8.0, 8.0, 6.0, 10.0, 7.0, 3.0, 2.0, 0.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.97306752204895, -3.848686933517456, -3.724306106567383, -3.5999255180358887, -3.4755449295043945, -3.3511643409729004, -3.2267837524414062, -3.102402925491333, -2.978022336959839, -2.8536417484283447, -2.7292609214782715, -2.6048803329467773, -2.480499744415283, -2.356119155883789, -2.231738567352295, -2.1073577404022217, -1.9829771518707275, -1.8585965633392334, -1.7342158555984497, -1.609835147857666, -1.4854545593261719, -1.3610739707946777, -1.236693263053894, -1.1123125553131104, -0.9879319667816162, -0.8635513186454773, -0.7391706705093384, -0.6147900223731995, -0.49040937423706055, -0.36602872610092163, -0.24164807796478271, -0.1172674298286438, 0.007112979888916016, 0.13149362802505493, 0.25587427616119385, 0.38025492429733276, 0.5046355724334717, 0.6290162205696106, 0.7533968687057495, 0.8777775168418884, 1.0021581649780273, 1.1265387535095215, 1.2509194612503052, 1.3753001689910889, 1.499680757522583, 1.6240613460540771, 1.7484420537948608, 1.8728227615356445, 1.9972033500671387, 2.121583938598633, 2.245964527130127, 2.3703453540802, 2.4947259426116943, 2.6191065311431885, 2.7434873580932617, 2.867867946624756, 2.99224853515625, 3.116629123687744, 3.2410097122192383, 3.3653905391693115, 3.4897711277008057, 3.6141517162323, 3.738532543182373, 3.862913131713867, 3.9872937202453613]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 3.0, 10.0, 4.0, 14.0, 17.0, 21.0, 50.0, 53.0, 85.0, 113.0, 176.0, 247.0, 367.0, 537.0, 837.0, 1252.0, 1966.0, 2930.0, 4581.0, 7450.0, 12224.0, 21527.0, 40174.0, 82261.0, 192796.0, 513456.0, 1209359.0, 1215075.0, 517320.0, 192864.0, 81598.0, 40078.0, 21678.0, 12421.0, 7451.0, 4442.0, 2945.0, 1927.0, 1257.0, 854.0, 553.0, 416.0, 283.0, 183.0, 120.0, 105.0, 63.0, 42.0, 26.0, 27.0, 20.0, 8.0, 11.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-7.9921875, -7.734375, -7.4765625, -7.21875, -6.9609375, -6.703125, -6.4453125, -6.1875, -5.9296875, -5.671875, -5.4140625, -5.15625, -4.8984375, -4.640625, -4.3828125, -4.125, -3.8671875, -3.609375, -3.3515625, -3.09375, -2.8359375, -2.578125, -2.3203125, -2.0625, -1.8046875, -1.546875, -1.2890625, -1.03125, -0.7734375, -0.515625, -0.2578125, 0.0, 0.2578125, 0.515625, 0.7734375, 1.03125, 1.2890625, 1.546875, 1.8046875, 2.0625, 2.3203125, 2.578125, 2.8359375, 3.09375, 3.3515625, 3.609375, 3.8671875, 4.125, 4.3828125, 4.640625, 4.8984375, 5.15625, 5.4140625, 5.671875, 5.9296875, 6.1875, 6.4453125, 6.703125, 6.9609375, 7.21875, 7.4765625, 7.734375, 7.9921875, 8.25, 8.5078125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 8.0, 10.0, 5.0, 11.0, 8.0, 11.0, 25.0, 19.0, 23.0, 25.0, 33.0, 34.0, 31.0, 41.0, 49.0, 48.0, 51.0, 51.0, 52.0, 45.0, 54.0, 44.0, 35.0, 46.0, 37.0, 34.0, 34.0, 33.0, 20.0, 18.0, 11.0, 4.0, 8.0, 12.0, 8.0, 7.0, 7.0, 2.0, 3.0, 3.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.932525634765625, -3.81427001953125, -3.696014404296875, -3.5777587890625, -3.459503173828125, -3.34124755859375, -3.222991943359375, -3.104736328125, -2.986480712890625, -2.86822509765625, -2.749969482421875, -2.6317138671875, -2.513458251953125, -2.39520263671875, -2.276947021484375, -2.15869140625, -2.040435791015625, -1.92218017578125, -1.803924560546875, -1.6856689453125, -1.567413330078125, -1.44915771484375, -1.330902099609375, -1.212646484375, -1.094390869140625, -0.97613525390625, -0.857879638671875, -0.7396240234375, -0.621368408203125, -0.50311279296875, -0.384857177734375, -0.2666015625, -0.148345947265625, -0.03009033203125, 0.088165283203125, 0.2064208984375, 0.324676513671875, 0.44293212890625, 0.561187744140625, 0.679443359375, 0.797698974609375, 0.91595458984375, 1.034210205078125, 1.1524658203125, 1.270721435546875, 1.38897705078125, 1.507232666015625, 1.62548828125, 1.743743896484375, 1.86199951171875, 1.980255126953125, 2.0985107421875, 2.216766357421875, 2.33502197265625, 2.453277587890625, 2.571533203125, 2.689788818359375, 2.80804443359375, 2.926300048828125, 3.0445556640625, 3.162811279296875, 3.28106689453125, 3.399322509765625, 3.517578125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 6.0, 6.0, 9.0, 10.0, 7.0, 18.0, 34.0, 41.0, 46.0, 83.0, 119.0, 173.0, 267.0, 464.0, 717.0, 1159.0, 2026.0, 3808.0, 6938.0, 13926.0, 28623.0, 64548.0, 160039.0, 478464.0, 1474714.0, 1305951.0, 404950.0, 138701.0, 55728.0, 25575.0, 12296.0, 6247.0, 3407.0, 1967.0, 1178.0, 662.0, 462.0, 283.0, 183.0, 154.0, 104.0, 50.0, 42.0, 29.0, 28.0, 19.0, 10.0, 8.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.7225341796875, -11.343505859375, -10.9644775390625, -10.58544921875, -10.2064208984375, -9.827392578125, -9.4483642578125, -9.0693359375, -8.6903076171875, -8.311279296875, -7.9322509765625, -7.55322265625, -7.1741943359375, -6.795166015625, -6.4161376953125, -6.037109375, -5.6580810546875, -5.279052734375, -4.9000244140625, -4.52099609375, -4.1419677734375, -3.762939453125, -3.3839111328125, -3.0048828125, -2.6258544921875, -2.246826171875, -1.8677978515625, -1.48876953125, -1.1097412109375, -0.730712890625, -0.3516845703125, 0.02734375, 0.4063720703125, 0.785400390625, 1.1644287109375, 1.54345703125, 1.9224853515625, 2.301513671875, 2.6805419921875, 3.0595703125, 3.4385986328125, 3.817626953125, 4.1966552734375, 4.57568359375, 4.9547119140625, 5.333740234375, 5.7127685546875, 6.091796875, 6.4708251953125, 6.849853515625, 7.2288818359375, 7.60791015625, 7.9869384765625, 8.365966796875, 8.7449951171875, 9.1240234375, 9.5030517578125, 9.882080078125, 10.2611083984375, 10.64013671875, 11.0191650390625, 11.398193359375, 11.7772216796875, 12.15625]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 5.0, 12.0, 19.0, 7.0, 14.0, 18.0, 23.0, 34.0, 37.0, 47.0, 58.0, 82.0, 98.0, 125.0, 164.0, 196.0, 252.0, 313.0, 340.0, 357.0, 334.0, 301.0, 258.0, 203.0, 170.0, 138.0, 97.0, 92.0, 62.0, 53.0, 43.0, 29.0, 21.0, 16.0, 16.0, 9.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.9609375, -2.8836669921875, -2.806396484375, -2.7291259765625, -2.65185546875, -2.5745849609375, -2.497314453125, -2.4200439453125, -2.3427734375, -2.2655029296875, -2.188232421875, -2.1109619140625, -2.03369140625, -1.9564208984375, -1.879150390625, -1.8018798828125, -1.724609375, -1.6473388671875, -1.570068359375, -1.4927978515625, -1.41552734375, -1.3382568359375, -1.260986328125, -1.1837158203125, -1.1064453125, -1.0291748046875, -0.951904296875, -0.8746337890625, -0.79736328125, -0.7200927734375, -0.642822265625, -0.5655517578125, -0.48828125, -0.4110107421875, -0.333740234375, -0.2564697265625, -0.17919921875, -0.1019287109375, -0.024658203125, 0.0526123046875, 0.1298828125, 0.2071533203125, 0.284423828125, 0.3616943359375, 0.43896484375, 0.5162353515625, 0.593505859375, 0.6707763671875, 0.748046875, 0.8253173828125, 0.902587890625, 0.9798583984375, 1.05712890625, 1.1343994140625, 1.211669921875, 1.2889404296875, 1.3662109375, 1.4434814453125, 1.520751953125, 1.5980224609375, 1.67529296875, 1.7525634765625, 1.829833984375, 1.9071044921875, 1.984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 3.0, 3.0, 9.0, 4.0, 8.0, 9.0, 7.0, 16.0, 22.0, 32.0, 37.0, 49.0, 71.0, 72.0, 80.0, 90.0, 81.0, 84.0, 71.0, 64.0, 35.0, 37.0, 21.0, 24.0, 16.0, 16.0, 8.0, 6.0, 7.0, 4.0, 3.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-13.12568187713623, -12.796414375305176, -12.467145919799805, -12.13787841796875, -11.808609962463379, -11.479342460632324, -11.150074005126953, -10.820806503295898, -10.491539001464844, -10.162271499633789, -9.833003044128418, -9.503735542297363, -9.174467086791992, -8.845199584960938, -8.515931129455566, -8.186663627624512, -7.857395172119141, -7.528127193450928, -7.198859214782715, -6.869591236114502, -6.540323257446289, -6.211055755615234, -5.8817877769470215, -5.552519798278809, -5.223251819610596, -4.893983840942383, -4.56471586227417, -4.235447883605957, -3.9061801433563232, -3.5769121646881104, -3.2476444244384766, -2.9183764457702637, -2.589108943939209, -2.259840965270996, -1.9305731058120728, -1.6013052463531494, -1.2720372676849365, -0.9427692890167236, -0.6135014295578003, -0.28423357009887695, 0.04503440856933594, 0.37430232763290405, 0.7035702466964722, 1.0328381061553955, 1.3621060848236084, 1.6913740634918213, 2.020641803741455, 2.349909782409668, 2.679177761077881, 3.0084457397460938, 3.3377137184143066, 3.6669814586639404, 3.9962494373321533, 4.325517654418945, 4.65478515625, 4.984053134918213, 5.313321113586426, 5.642589092254639, 5.971857070922852, 6.3011250495910645, 6.630393028259277, 6.959660530090332, 7.288928508758545, 7.618196487426758, 7.947464466094971]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 6.0, 11.0, 8.0, 14.0, 17.0, 18.0, 21.0, 21.0, 23.0, 27.0, 34.0, 20.0, 52.0, 38.0, 49.0, 48.0, 48.0, 47.0, 53.0, 39.0, 45.0, 37.0, 34.0, 32.0, 34.0, 31.0, 27.0, 27.0, 21.0, 24.0, 23.0, 19.0, 13.0, 9.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7233405113220215, -4.575067520141602, -4.426794052124023, -4.2785210609436035, -4.130247592926025, -3.9819746017456055, -3.8337013721466064, -3.6854281425476074, -3.5371551513671875, -3.3888819217681885, -3.2406086921691895, -3.0923357009887695, -2.9440624713897705, -2.7957892417907715, -2.6475160121917725, -2.4992427825927734, -2.3509695529937744, -2.2026963233947754, -2.0544230937957764, -1.906149983406067, -1.7578768730163574, -1.6096036434173584, -1.4613304138183594, -1.31305730342865, -1.1647840738296509, -1.0165108442306519, -0.8682377338409424, -0.7199645042419434, -0.5716913342475891, -0.42341816425323486, -0.27514493465423584, -0.12687182426452637, 0.021401405334472656, 0.1696745902299881, 0.31794777512550354, 0.4662209749221802, 0.6144941449165344, 0.7627673149108887, 0.9110405445098877, 1.0593136548995972, 1.2075868844985962, 1.3558601140975952, 1.5041332244873047, 1.6524064540863037, 1.8006796836853027, 1.9489527940750122, 2.097226142883301, 2.2454991340637207, 2.3937723636627197, 2.5420455932617188, 2.6903188228607178, 2.838592052459717, 2.9868650436401367, 3.1351382732391357, 3.2834115028381348, 3.4316844940185547, 3.579957962036133, 3.728231191635132, 3.876504421234131, 4.024777412414551, 4.173050880432129, 4.321323871612549, 4.469596862792969, 4.617870330810547, 4.766143321990967]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 6.0, 5.0, 16.0, 17.0, 24.0, 43.0, 47.0, 77.0, 87.0, 141.0, 226.0, 269.0, 382.0, 590.0, 850.0, 1267.0, 1952.0, 2982.0, 4737.0, 7763.0, 13780.0, 24542.0, 47903.0, 97333.0, 190067.0, 259319.0, 189478.0, 97148.0, 47622.0, 24610.0, 13642.0, 8021.0, 4670.0, 2957.0, 1907.0, 1256.0, 848.0, 607.0, 395.0, 315.0, 210.0, 136.0, 87.0, 62.0, 37.0, 39.0, 28.0, 18.0, 12.0, 8.0, 11.0, 4.0, 2.0, 1.0, 4.0, 2.0], "bins": [-5.32421875, -5.165283203125, -5.00634765625, -4.847412109375, -4.6884765625, -4.529541015625, -4.37060546875, -4.211669921875, -4.052734375, -3.893798828125, -3.73486328125, -3.575927734375, -3.4169921875, -3.258056640625, -3.09912109375, -2.940185546875, -2.78125, -2.622314453125, -2.46337890625, -2.304443359375, -2.1455078125, -1.986572265625, -1.82763671875, -1.668701171875, -1.509765625, -1.350830078125, -1.19189453125, -1.032958984375, -0.8740234375, -0.715087890625, -0.55615234375, -0.397216796875, -0.23828125, -0.079345703125, 0.07958984375, 0.238525390625, 0.3974609375, 0.556396484375, 0.71533203125, 0.874267578125, 1.033203125, 1.192138671875, 1.35107421875, 1.510009765625, 1.6689453125, 1.827880859375, 1.98681640625, 2.145751953125, 2.3046875, 2.463623046875, 2.62255859375, 2.781494140625, 2.9404296875, 3.099365234375, 3.25830078125, 3.417236328125, 3.576171875, 3.735107421875, 3.89404296875, 4.052978515625, 4.2119140625, 4.370849609375, 4.52978515625, 4.688720703125, 4.84765625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 8.0, 10.0, 4.0, 11.0, 12.0, 7.0, 20.0, 15.0, 27.0, 24.0, 22.0, 30.0, 36.0, 45.0, 45.0, 48.0, 34.0, 52.0, 56.0, 61.0, 57.0, 34.0, 46.0, 45.0, 27.0, 30.0, 31.0, 32.0, 21.0, 19.0, 22.0, 19.0, 18.0, 11.0, 4.0, 8.0, 5.0, 8.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.859375, -5.68011474609375, -5.5008544921875, -5.32159423828125, -5.142333984375, -4.96307373046875, -4.7838134765625, -4.60455322265625, -4.42529296875, -4.24603271484375, -4.0667724609375, -3.88751220703125, -3.708251953125, -3.52899169921875, -3.3497314453125, -3.17047119140625, -2.9912109375, -2.81195068359375, -2.6326904296875, -2.45343017578125, -2.274169921875, -2.09490966796875, -1.9156494140625, -1.73638916015625, -1.55712890625, -1.37786865234375, -1.1986083984375, -1.01934814453125, -0.840087890625, -0.66082763671875, -0.4815673828125, -0.30230712890625, -0.123046875, 0.05621337890625, 0.2354736328125, 0.41473388671875, 0.593994140625, 0.77325439453125, 0.9525146484375, 1.13177490234375, 1.31103515625, 1.49029541015625, 1.6695556640625, 1.84881591796875, 2.028076171875, 2.20733642578125, 2.3865966796875, 2.56585693359375, 2.7451171875, 2.92437744140625, 3.1036376953125, 3.28289794921875, 3.462158203125, 3.64141845703125, 3.8206787109375, 3.99993896484375, 4.17919921875, 4.35845947265625, 4.5377197265625, 4.71697998046875, 4.896240234375, 5.07550048828125, 5.2547607421875, 5.43402099609375, 5.61328125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 10.0, 1.0, 9.0, 10.0, 24.0, 12.0, 15.0, 28.0, 36.0, 51.0, 72.0, 111.0, 159.0, 206.0, 309.0, 446.0, 728.0, 1213.0, 1977.0, 3889.0, 8436.0, 22352.0, 85325.0, 439977.0, 376280.0, 71297.0, 19465.0, 7481.0, 3462.0, 1990.0, 1147.0, 675.0, 412.0, 276.0, 186.0, 141.0, 93.0, 73.0, 39.0, 29.0, 31.0, 18.0, 16.0, 14.0, 12.0, 7.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.0859375, -12.67626953125, -12.2666015625, -11.85693359375, -11.447265625, -11.03759765625, -10.6279296875, -10.21826171875, -9.80859375, -9.39892578125, -8.9892578125, -8.57958984375, -8.169921875, -7.76025390625, -7.3505859375, -6.94091796875, -6.53125, -6.12158203125, -5.7119140625, -5.30224609375, -4.892578125, -4.48291015625, -4.0732421875, -3.66357421875, -3.25390625, -2.84423828125, -2.4345703125, -2.02490234375, -1.615234375, -1.20556640625, -0.7958984375, -0.38623046875, 0.0234375, 0.43310546875, 0.8427734375, 1.25244140625, 1.662109375, 2.07177734375, 2.4814453125, 2.89111328125, 3.30078125, 3.71044921875, 4.1201171875, 4.52978515625, 4.939453125, 5.34912109375, 5.7587890625, 6.16845703125, 6.578125, 6.98779296875, 7.3974609375, 7.80712890625, 8.216796875, 8.62646484375, 9.0361328125, 9.44580078125, 9.85546875, 10.26513671875, 10.6748046875, 11.08447265625, 11.494140625, 11.90380859375, 12.3134765625, 12.72314453125, 13.1328125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 9.0, 2.0, 8.0, 11.0, 13.0, 17.0, 12.0, 20.0, 21.0, 21.0, 25.0, 22.0, 48.0, 45.0, 55.0, 43.0, 64.0, 49.0, 54.0, 49.0, 47.0, 42.0, 40.0, 50.0, 34.0, 32.0, 22.0, 21.0, 26.0, 20.0, 18.0, 18.0, 12.0, 6.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25, -3.143341064453125, -3.03668212890625, -2.930023193359375, -2.8233642578125, -2.716705322265625, -2.61004638671875, -2.503387451171875, -2.396728515625, -2.290069580078125, -2.18341064453125, -2.076751708984375, -1.9700927734375, -1.863433837890625, -1.75677490234375, -1.650115966796875, -1.54345703125, -1.436798095703125, -1.33013916015625, -1.223480224609375, -1.1168212890625, -1.010162353515625, -0.90350341796875, -0.796844482421875, -0.690185546875, -0.583526611328125, -0.47686767578125, -0.370208740234375, -0.2635498046875, -0.156890869140625, -0.05023193359375, 0.056427001953125, 0.1630859375, 0.269744873046875, 0.37640380859375, 0.483062744140625, 0.5897216796875, 0.696380615234375, 0.80303955078125, 0.909698486328125, 1.016357421875, 1.123016357421875, 1.22967529296875, 1.336334228515625, 1.4429931640625, 1.549652099609375, 1.65631103515625, 1.762969970703125, 1.86962890625, 1.976287841796875, 2.08294677734375, 2.189605712890625, 2.2962646484375, 2.402923583984375, 2.50958251953125, 2.616241455078125, 2.722900390625, 2.829559326171875, 2.93621826171875, 3.042877197265625, 3.1495361328125, 3.256195068359375, 3.36285400390625, 3.469512939453125, 3.576171875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 9.0, 12.0, 21.0, 27.0, 33.0, 39.0, 59.0, 83.0, 135.0, 201.0, 277.0, 416.0, 620.0, 1053.0, 1670.0, 2665.0, 4663.0, 9227.0, 23993.0, 96279.0, 497865.0, 316457.0, 58290.0, 17006.0, 7439.0, 3811.0, 2198.0, 1399.0, 882.0, 573.0, 372.0, 260.0, 177.0, 106.0, 73.0, 63.0, 29.0, 31.0, 12.0, 12.0, 8.0, 10.0, 2.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.5379638671875, -6.325927734375, -6.1138916015625, -5.90185546875, -5.6898193359375, -5.477783203125, -5.2657470703125, -5.0537109375, -4.8416748046875, -4.629638671875, -4.4176025390625, -4.20556640625, -3.9935302734375, -3.781494140625, -3.5694580078125, -3.357421875, -3.1453857421875, -2.933349609375, -2.7213134765625, -2.50927734375, -2.2972412109375, -2.085205078125, -1.8731689453125, -1.6611328125, -1.4490966796875, -1.237060546875, -1.0250244140625, -0.81298828125, -0.6009521484375, -0.388916015625, -0.1768798828125, 0.03515625, 0.2471923828125, 0.459228515625, 0.6712646484375, 0.88330078125, 1.0953369140625, 1.307373046875, 1.5194091796875, 1.7314453125, 1.9434814453125, 2.155517578125, 2.3675537109375, 2.57958984375, 2.7916259765625, 3.003662109375, 3.2156982421875, 3.427734375, 3.6397705078125, 3.851806640625, 4.0638427734375, 4.27587890625, 4.4879150390625, 4.699951171875, 4.9119873046875, 5.1240234375, 5.3360595703125, 5.548095703125, 5.7601318359375, 5.97216796875, 6.1842041015625, 6.396240234375, 6.6082763671875, 6.8203125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 3.0, 9.0, 14.0, 25.0, 39.0, 81.0, 185.0, 245.0, 185.0, 94.0, 44.0, 24.0, 18.0, 13.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024020671844482422, -0.0002264995127916336, -0.000212792307138443, -0.00019908510148525238, -0.00018537789583206177, -0.00017167069017887115, -0.00015796348452568054, -0.00014425627887248993, -0.00013054907321929932, -0.0001168418675661087, -0.00010313466191291809, -8.942745625972748e-05, -7.572025060653687e-05, -6.201304495334625e-05, -4.830583930015564e-05, -3.459863364696503e-05, -2.0891427993774414e-05, -7.184222340583801e-06, 6.5229833126068115e-06, 2.0230188965797424e-05, 3.393739461898804e-05, 4.764460027217865e-05, 6.135180592536926e-05, 7.505901157855988e-05, 8.876621723175049e-05, 0.0001024734228849411, 0.00011618062853813171, 0.00012988783419132233, 0.00014359503984451294, 0.00015730224549770355, 0.00017100945115089417, 0.00018471665680408478, 0.0001984238624572754, 0.000212131068110466, 0.00022583827376365662, 0.00023954547941684723, 0.00025325268507003784, 0.00026695989072322845, 0.00028066709637641907, 0.0002943743020296097, 0.0003080815076828003, 0.0003217887133359909, 0.0003354959189891815, 0.00034920312464237213, 0.00036291033029556274, 0.00037661753594875336, 0.00039032474160194397, 0.0004040319472551346, 0.0004177391529083252, 0.0004314463585615158, 0.0004451535642147064, 0.00045886076986789703, 0.00047256797552108765, 0.00048627518117427826, 0.0004999823868274689, 0.0005136895924806595, 0.0005273967981338501, 0.0005411040037870407, 0.0005548112094402313, 0.0005685184150934219, 0.0005822256207466125, 0.0005959328263998032, 0.0006096400320529938, 0.0006233472377061844, 0.000637054443359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 14.0, 13.0, 25.0, 18.0, 35.0, 48.0, 67.0, 93.0, 127.0, 124.0, 210.0, 335.0, 468.0, 699.0, 1152.0, 1798.0, 3134.0, 5726.0, 12164.0, 40800.0, 275766.0, 559447.0, 106229.0, 21034.0, 8224.0, 4152.0, 2444.0, 1436.0, 906.0, 574.0, 361.0, 248.0, 195.0, 133.0, 95.0, 73.0, 44.0, 36.0, 28.0, 17.0, 11.0, 13.0, 12.0, 5.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.72265625, -7.4832763671875, -7.243896484375, -7.0045166015625, -6.76513671875, -6.5257568359375, -6.286376953125, -6.0469970703125, -5.8076171875, -5.5682373046875, -5.328857421875, -5.0894775390625, -4.85009765625, -4.6107177734375, -4.371337890625, -4.1319580078125, -3.892578125, -3.6531982421875, -3.413818359375, -3.1744384765625, -2.93505859375, -2.6956787109375, -2.456298828125, -2.2169189453125, -1.9775390625, -1.7381591796875, -1.498779296875, -1.2593994140625, -1.02001953125, -0.7806396484375, -0.541259765625, -0.3018798828125, -0.0625, 0.1768798828125, 0.416259765625, 0.6556396484375, 0.89501953125, 1.1343994140625, 1.373779296875, 1.6131591796875, 1.8525390625, 2.0919189453125, 2.331298828125, 2.5706787109375, 2.81005859375, 3.0494384765625, 3.288818359375, 3.5281982421875, 3.767578125, 4.0069580078125, 4.246337890625, 4.4857177734375, 4.72509765625, 4.9644775390625, 5.203857421875, 5.4432373046875, 5.6826171875, 5.9219970703125, 6.161376953125, 6.4007568359375, 6.64013671875, 6.8795166015625, 7.118896484375, 7.3582763671875, 7.59765625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 16.0, 19.0, 34.0, 58.0, 123.0, 125.0, 151.0, 149.0, 108.0, 75.0, 53.0, 25.0, 9.0, 8.0, 6.0, 10.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5224609375, -1.472900390625, -1.42333984375, -1.373779296875, -1.32421875, -1.274658203125, -1.22509765625, -1.175537109375, -1.1259765625, -1.076416015625, -1.02685546875, -0.977294921875, -0.927734375, -0.878173828125, -0.82861328125, -0.779052734375, -0.7294921875, -0.679931640625, -0.63037109375, -0.580810546875, -0.53125, -0.481689453125, -0.43212890625, -0.382568359375, -0.3330078125, -0.283447265625, -0.23388671875, -0.184326171875, -0.134765625, -0.085205078125, -0.03564453125, 0.013916015625, 0.0634765625, 0.113037109375, 0.16259765625, 0.212158203125, 0.26171875, 0.311279296875, 0.36083984375, 0.410400390625, 0.4599609375, 0.509521484375, 0.55908203125, 0.608642578125, 0.658203125, 0.707763671875, 0.75732421875, 0.806884765625, 0.8564453125, 0.906005859375, 0.95556640625, 1.005126953125, 1.0546875, 1.104248046875, 1.15380859375, 1.203369140625, 1.2529296875, 1.302490234375, 1.35205078125, 1.401611328125, 1.451171875, 1.500732421875, 1.55029296875, 1.599853515625, 1.6494140625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 3.0, 9.0, 15.0, 18.0, 20.0, 30.0, 38.0, 37.0, 59.0, 78.0, 82.0, 81.0, 74.0, 75.0, 69.0, 58.0, 51.0, 46.0, 30.0, 16.0, 14.0, 16.0, 11.0, 10.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-11.893698692321777, -11.58962345123291, -11.28554916381836, -10.981473922729492, -10.677399635314941, -10.373324394226074, -10.069250106811523, -9.765174865722656, -9.461099624633789, -9.157024383544922, -8.852950096130371, -8.548874855041504, -8.244800567626953, -7.940725326538086, -7.636650562286377, -7.332575798034668, -7.028501510620117, -6.724426746368408, -6.420351982116699, -6.11627721786499, -5.812202453613281, -5.508127212524414, -5.204052448272705, -4.899977684020996, -4.595902919769287, -4.291828155517578, -3.987753391265869, -3.683678388595581, -3.379603624343872, -3.075528860092163, -2.771453857421875, -2.467379093170166, -2.1633033752441406, -1.8592286109924316, -1.555153727531433, -1.2510788440704346, -0.9470040798187256, -0.6429293155670166, -0.33885443210601807, -0.03477954864501953, 0.26929521560668945, 0.5733700394630432, 0.877444863319397, 1.1815197467803955, 1.4855945110321045, 1.7896692752838135, 2.0937442779541016, 2.3978190422058105, 2.7018938064575195, 3.0059685707092285, 3.3100433349609375, 3.6141183376312256, 3.9181931018829346, 4.222268104553223, 4.526342868804932, 4.830417633056641, 5.13449239730835, 5.438567161560059, 5.742641925811768, 6.046716690063477, 6.350791931152344, 6.6548662185668945, 6.958941459655762, 7.263016223907471, 7.56709098815918]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 12.0, 15.0, 21.0, 18.0, 23.0, 23.0, 22.0, 34.0, 27.0, 45.0, 46.0, 44.0, 43.0, 48.0, 45.0, 56.0, 50.0, 42.0, 36.0, 29.0, 38.0, 32.0, 26.0, 31.0, 24.0, 31.0, 18.0, 24.0, 21.0, 11.0, 9.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.537633895874023, -4.39125919342041, -4.244884014129639, -4.098509311676025, -3.952134609222412, -3.8057596683502197, -3.6593847274780273, -3.513010025024414, -3.3666350841522217, -3.2202601432800293, -3.073885440826416, -2.9275104999542236, -2.7811355590820312, -2.634760856628418, -2.4883859157562256, -2.342010974884033, -2.19563627243042, -2.0492613315582275, -1.9028866291046143, -1.7565116882324219, -1.610136866569519, -1.4637620449066162, -1.3173871040344238, -1.171012282371521, -1.0246374607086182, -0.8782626390457153, -0.7318877577781677, -0.5855128765106201, -0.4391380548477173, -0.29276323318481445, -0.14638835191726685, -1.3470649719238281e-05, 0.1463608741760254, 0.2927357256412506, 0.43911057710647583, 0.5854854583740234, 0.7318602800369263, 0.8782351016998291, 1.0246100425720215, 1.1709848642349243, 1.3173596858978271, 1.46373450756073, 1.6101093292236328, 1.7564842700958252, 1.902859091758728, 2.049233913421631, 2.1956088542938232, 2.3419837951660156, 2.488358497619629, 2.6347334384918213, 2.7811081409454346, 2.927483081817627, 3.0738577842712402, 3.2202327251434326, 3.366607666015625, 3.5129823684692383, 3.6593573093414307, 3.805732250213623, 3.9521069526672363, 4.09848165512085, 4.244856834411621, 4.391231536865234, 4.537606239318848, 4.683981418609619, 4.830356121063232]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 10.0, 15.0, 31.0, 34.0, 58.0, 71.0, 139.0, 197.0, 248.0, 402.0, 644.0, 1011.0, 1495.0, 2534.0, 4377.0, 6932.0, 11809.0, 20406.0, 34578.0, 57549.0, 93620.0, 140528.0, 177464.0, 167944.0, 125155.0, 80519.0, 49265.0, 28906.0, 17390.0, 10013.0, 5927.0, 3425.0, 2106.0, 1350.0, 810.0, 506.0, 346.0, 228.0, 151.0, 108.0, 78.0, 56.0, 35.0, 24.0, 19.0, 11.0, 12.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.35546875, -4.2142333984375, -4.072998046875, -3.9317626953125, -3.79052734375, -3.6492919921875, -3.508056640625, -3.3668212890625, -3.2255859375, -3.0843505859375, -2.943115234375, -2.8018798828125, -2.66064453125, -2.5194091796875, -2.378173828125, -2.2369384765625, -2.095703125, -1.9544677734375, -1.813232421875, -1.6719970703125, -1.53076171875, -1.3895263671875, -1.248291015625, -1.1070556640625, -0.9658203125, -0.8245849609375, -0.683349609375, -0.5421142578125, -0.40087890625, -0.2596435546875, -0.118408203125, 0.0228271484375, 0.1640625, 0.3052978515625, 0.446533203125, 0.5877685546875, 0.72900390625, 0.8702392578125, 1.011474609375, 1.1527099609375, 1.2939453125, 1.4351806640625, 1.576416015625, 1.7176513671875, 1.85888671875, 2.0001220703125, 2.141357421875, 2.2825927734375, 2.423828125, 2.5650634765625, 2.706298828125, 2.8475341796875, 2.98876953125, 3.1300048828125, 3.271240234375, 3.4124755859375, 3.5537109375, 3.6949462890625, 3.836181640625, 3.9774169921875, 4.11865234375, 4.2598876953125, 4.401123046875, 4.5423583984375, 4.68359375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 8.0, 14.0, 10.0, 14.0, 14.0, 17.0, 19.0, 14.0, 22.0, 22.0, 28.0, 41.0, 28.0, 45.0, 40.0, 48.0, 59.0, 38.0, 42.0, 48.0, 41.0, 43.0, 35.0, 39.0, 26.0, 24.0, 34.0, 23.0, 24.0, 30.0, 16.0, 18.0, 15.0, 14.0, 10.0, 5.0, 8.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.46875, -5.31475830078125, -5.1607666015625, -5.00677490234375, -4.852783203125, -4.69879150390625, -4.5447998046875, -4.39080810546875, -4.23681640625, -4.08282470703125, -3.9288330078125, -3.77484130859375, -3.620849609375, -3.46685791015625, -3.3128662109375, -3.15887451171875, -3.0048828125, -2.85089111328125, -2.6968994140625, -2.54290771484375, -2.388916015625, -2.23492431640625, -2.0809326171875, -1.92694091796875, -1.77294921875, -1.61895751953125, -1.4649658203125, -1.31097412109375, -1.156982421875, -1.00299072265625, -0.8489990234375, -0.69500732421875, -0.541015625, -0.38702392578125, -0.2330322265625, -0.07904052734375, 0.074951171875, 0.22894287109375, 0.3829345703125, 0.53692626953125, 0.69091796875, 0.84490966796875, 0.9989013671875, 1.15289306640625, 1.306884765625, 1.46087646484375, 1.6148681640625, 1.76885986328125, 1.9228515625, 2.07684326171875, 2.2308349609375, 2.38482666015625, 2.538818359375, 2.69281005859375, 2.8468017578125, 3.00079345703125, 3.15478515625, 3.30877685546875, 3.4627685546875, 3.61676025390625, 3.770751953125, 3.92474365234375, 4.0787353515625, 4.23272705078125, 4.38671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 14.0, 14.0, 15.0, 27.0, 49.0, 52.0, 87.0, 133.0, 168.0, 266.0, 416.0, 714.0, 1132.0, 1876.0, 3123.0, 5437.0, 9409.0, 16758.0, 29994.0, 54468.0, 97164.0, 156958.0, 202810.0, 183164.0, 122926.0, 71247.0, 39212.0, 21587.0, 12024.0, 6919.0, 4074.0, 2438.0, 1430.0, 886.0, 538.0, 355.0, 215.0, 133.0, 86.0, 79.0, 49.0, 24.0, 22.0, 21.0, 16.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.23583984375, -5.0654296875, -4.89501953125, -4.724609375, -4.55419921875, -4.3837890625, -4.21337890625, -4.04296875, -3.87255859375, -3.7021484375, -3.53173828125, -3.361328125, -3.19091796875, -3.0205078125, -2.85009765625, -2.6796875, -2.50927734375, -2.3388671875, -2.16845703125, -1.998046875, -1.82763671875, -1.6572265625, -1.48681640625, -1.31640625, -1.14599609375, -0.9755859375, -0.80517578125, -0.634765625, -0.46435546875, -0.2939453125, -0.12353515625, 0.046875, 0.21728515625, 0.3876953125, 0.55810546875, 0.728515625, 0.89892578125, 1.0693359375, 1.23974609375, 1.41015625, 1.58056640625, 1.7509765625, 1.92138671875, 2.091796875, 2.26220703125, 2.4326171875, 2.60302734375, 2.7734375, 2.94384765625, 3.1142578125, 3.28466796875, 3.455078125, 3.62548828125, 3.7958984375, 3.96630859375, 4.13671875, 4.30712890625, 4.4775390625, 4.64794921875, 4.818359375, 4.98876953125, 5.1591796875, 5.32958984375, 5.5]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 6.0, 6.0, 5.0, 12.0, 13.0, 13.0, 8.0, 20.0, 17.0, 19.0, 24.0, 23.0, 23.0, 46.0, 20.0, 43.0, 37.0, 38.0, 40.0, 45.0, 54.0, 48.0, 41.0, 38.0, 36.0, 31.0, 43.0, 41.0, 35.0, 21.0, 24.0, 14.0, 9.0, 22.0, 17.0, 12.0, 14.0, 9.0, 13.0, 9.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.818878173828125, -2.72955322265625, -2.640228271484375, -2.5509033203125, -2.461578369140625, -2.37225341796875, -2.282928466796875, -2.193603515625, -2.104278564453125, -2.01495361328125, -1.925628662109375, -1.8363037109375, -1.746978759765625, -1.65765380859375, -1.568328857421875, -1.47900390625, -1.389678955078125, -1.30035400390625, -1.211029052734375, -1.1217041015625, -1.032379150390625, -0.94305419921875, -0.853729248046875, -0.764404296875, -0.675079345703125, -0.58575439453125, -0.496429443359375, -0.4071044921875, -0.317779541015625, -0.22845458984375, -0.139129638671875, -0.0498046875, 0.039520263671875, 0.12884521484375, 0.218170166015625, 0.3074951171875, 0.396820068359375, 0.48614501953125, 0.575469970703125, 0.664794921875, 0.754119873046875, 0.84344482421875, 0.932769775390625, 1.0220947265625, 1.111419677734375, 1.20074462890625, 1.290069580078125, 1.37939453125, 1.468719482421875, 1.55804443359375, 1.647369384765625, 1.7366943359375, 1.826019287109375, 1.91534423828125, 2.004669189453125, 2.093994140625, 2.183319091796875, 2.27264404296875, 2.361968994140625, 2.4512939453125, 2.540618896484375, 2.62994384765625, 2.719268798828125, 2.80859375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 9.0, 12.0, 17.0, 17.0, 30.0, 46.0, 70.0, 67.0, 125.0, 181.0, 297.0, 437.0, 627.0, 1041.0, 1652.0, 2610.0, 4252.0, 6894.0, 12085.0, 21672.0, 40283.0, 78046.0, 148786.0, 232130.0, 217766.0, 130105.0, 67757.0, 35138.0, 19239.0, 10649.0, 6326.0, 3723.0, 2265.0, 1451.0, 884.0, 610.0, 394.0, 259.0, 197.0, 113.0, 89.0, 65.0, 48.0, 32.0, 17.0, 14.0, 9.0, 6.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.25, -4.12078857421875, -3.9915771484375, -3.86236572265625, -3.733154296875, -3.60394287109375, -3.4747314453125, -3.34552001953125, -3.21630859375, -3.08709716796875, -2.9578857421875, -2.82867431640625, -2.699462890625, -2.57025146484375, -2.4410400390625, -2.31182861328125, -2.1826171875, -2.05340576171875, -1.9241943359375, -1.79498291015625, -1.665771484375, -1.53656005859375, -1.4073486328125, -1.27813720703125, -1.14892578125, -1.01971435546875, -0.8905029296875, -0.76129150390625, -0.632080078125, -0.50286865234375, -0.3736572265625, -0.24444580078125, -0.115234375, 0.01397705078125, 0.1431884765625, 0.27239990234375, 0.401611328125, 0.53082275390625, 0.6600341796875, 0.78924560546875, 0.91845703125, 1.04766845703125, 1.1768798828125, 1.30609130859375, 1.435302734375, 1.56451416015625, 1.6937255859375, 1.82293701171875, 1.9521484375, 2.08135986328125, 2.2105712890625, 2.33978271484375, 2.468994140625, 2.59820556640625, 2.7274169921875, 2.85662841796875, 2.98583984375, 3.11505126953125, 3.2442626953125, 3.37347412109375, 3.502685546875, 3.63189697265625, 3.7611083984375, 3.89031982421875, 4.01953125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 9.0, 9.0, 7.0, 11.0, 12.0, 24.0, 25.0, 30.0, 50.0, 51.0, 65.0, 68.0, 82.0, 69.0, 63.0, 67.0, 68.0, 53.0, 59.0, 25.0, 22.0, 19.0, 19.0, 16.0, 7.0, 11.0, 4.0, 5.0, 6.0, 2.0, 6.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00027680397033691406, -0.00026660412549972534, -0.0002564042806625366, -0.0002462044358253479, -0.00023600459098815918, -0.00022580474615097046, -0.00021560490131378174, -0.00020540505647659302, -0.0001952052116394043, -0.00018500536680221558, -0.00017480552196502686, -0.00016460567712783813, -0.00015440583229064941, -0.0001442059874534607, -0.00013400614261627197, -0.00012380629777908325, -0.00011360645294189453, -0.00010340660810470581, -9.320676326751709e-05, -8.300691843032837e-05, -7.280707359313965e-05, -6.260722875595093e-05, -5.240738391876221e-05, -4.2207539081573486e-05, -3.2007694244384766e-05, -2.1807849407196045e-05, -1.1608004570007324e-05, -1.4081597328186035e-06, 8.791685104370117e-06, 1.8991529941558838e-05, 2.919137477874756e-05, 3.939121961593628e-05, 4.9591064453125e-05, 5.979090929031372e-05, 6.999075412750244e-05, 8.019059896469116e-05, 9.039044380187988e-05, 0.0001005902886390686, 0.00011079013347625732, 0.00012098997831344604, 0.00013118982315063477, 0.00014138966798782349, 0.0001515895128250122, 0.00016178935766220093, 0.00017198920249938965, 0.00018218904733657837, 0.0001923888921737671, 0.0002025887370109558, 0.00021278858184814453, 0.00022298842668533325, 0.00023318827152252197, 0.0002433881163597107, 0.0002535879611968994, 0.00026378780603408813, 0.00027398765087127686, 0.0002841874957084656, 0.0002943873405456543, 0.000304587185382843, 0.00031478703022003174, 0.00032498687505722046, 0.0003351867198944092, 0.0003453865647315979, 0.0003555864095687866, 0.00036578625440597534, 0.00037598609924316406]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 5.0, 4.0, 2.0, 11.0, 6.0, 16.0, 23.0, 33.0, 37.0, 51.0, 73.0, 97.0, 166.0, 261.0, 321.0, 503.0, 713.0, 1060.0, 1631.0, 2358.0, 3835.0, 6320.0, 10322.0, 17482.0, 30725.0, 55655.0, 101648.0, 171735.0, 219903.0, 177756.0, 106941.0, 58756.0, 32398.0, 18612.0, 10691.0, 6486.0, 4105.0, 2696.0, 1669.0, 1123.0, 725.0, 465.0, 335.0, 244.0, 168.0, 120.0, 81.0, 51.0, 41.0, 32.0, 21.0, 22.0, 10.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.796875, -3.676513671875, -3.55615234375, -3.435791015625, -3.3154296875, -3.195068359375, -3.07470703125, -2.954345703125, -2.833984375, -2.713623046875, -2.59326171875, -2.472900390625, -2.3525390625, -2.232177734375, -2.11181640625, -1.991455078125, -1.87109375, -1.750732421875, -1.63037109375, -1.510009765625, -1.3896484375, -1.269287109375, -1.14892578125, -1.028564453125, -0.908203125, -0.787841796875, -0.66748046875, -0.547119140625, -0.4267578125, -0.306396484375, -0.18603515625, -0.065673828125, 0.0546875, 0.175048828125, 0.29541015625, 0.415771484375, 0.5361328125, 0.656494140625, 0.77685546875, 0.897216796875, 1.017578125, 1.137939453125, 1.25830078125, 1.378662109375, 1.4990234375, 1.619384765625, 1.73974609375, 1.860107421875, 1.98046875, 2.100830078125, 2.22119140625, 2.341552734375, 2.4619140625, 2.582275390625, 2.70263671875, 2.822998046875, 2.943359375, 3.063720703125, 3.18408203125, 3.304443359375, 3.4248046875, 3.545166015625, 3.66552734375, 3.785888671875, 3.90625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 16.0, 12.0, 9.0, 15.0, 20.0, 26.0, 30.0, 30.0, 41.0, 36.0, 54.0, 41.0, 42.0, 39.0, 48.0, 56.0, 62.0, 69.0, 45.0, 46.0, 42.0, 38.0, 26.0, 29.0, 17.0, 24.0, 13.0, 15.0, 7.0, 6.0, 12.0, 4.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92138671875, -0.8920135498046875, -0.862640380859375, -0.8332672119140625, -0.80389404296875, -0.7745208740234375, -0.745147705078125, -0.7157745361328125, -0.6864013671875, -0.6570281982421875, -0.627655029296875, -0.5982818603515625, -0.56890869140625, -0.5395355224609375, -0.510162353515625, -0.4807891845703125, -0.451416015625, -0.4220428466796875, -0.392669677734375, -0.3632965087890625, -0.33392333984375, -0.3045501708984375, -0.275177001953125, -0.2458038330078125, -0.2164306640625, -0.1870574951171875, -0.157684326171875, -0.1283111572265625, -0.09893798828125, -0.0695648193359375, -0.040191650390625, -0.0108184814453125, 0.0185546875, 0.0479278564453125, 0.077301025390625, 0.1066741943359375, 0.13604736328125, 0.1654205322265625, 0.194793701171875, 0.2241668701171875, 0.2535400390625, 0.2829132080078125, 0.312286376953125, 0.3416595458984375, 0.37103271484375, 0.4004058837890625, 0.429779052734375, 0.4591522216796875, 0.488525390625, 0.5178985595703125, 0.547271728515625, 0.5766448974609375, 0.60601806640625, 0.6353912353515625, 0.664764404296875, 0.6941375732421875, 0.7235107421875, 0.7528839111328125, 0.782257080078125, 0.8116302490234375, 0.84100341796875, 0.8703765869140625, 0.899749755859375, 0.9291229248046875, 0.95849609375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 5.0, 9.0, 9.0, 16.0, 14.0, 17.0, 18.0, 20.0, 30.0, 57.0, 46.0, 70.0, 95.0, 75.0, 75.0, 76.0, 63.0, 70.0, 47.0, 39.0, 33.0, 35.0, 17.0, 8.0, 11.0, 7.0, 7.0, 12.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.502902030944824, -12.192047119140625, -11.88119125366211, -11.57033634185791, -11.259481430053711, -10.948625564575195, -10.637770652770996, -10.326915740966797, -10.016059875488281, -9.705204963684082, -9.394349098205566, -9.083494186401367, -8.772638320922852, -8.461783409118652, -8.150928497314453, -7.840073108673096, -7.529217720031738, -7.218362331390381, -6.907506942749023, -6.596652030944824, -6.285796642303467, -5.974941253662109, -5.66408634185791, -5.353230953216553, -5.042375564575195, -4.731520175933838, -4.4206647872924805, -4.109809875488281, -3.798954486846924, -3.4880990982055664, -3.177243947982788, -2.8663887977600098, -2.5555338859558105, -2.244678497314453, -1.9338233470916748, -1.622968077659607, -1.312112808227539, -1.0012575387954712, -0.6904022693634033, -0.379547119140625, -0.06869173049926758, 0.2421635389328003, 0.5530188083648682, 0.863874077796936, 1.174729347229004, 1.4855846166610718, 1.7964398860931396, 2.107295036315918, 2.4181504249572754, 2.729005813598633, 3.039860963821411, 3.3507161140441895, 3.661571502685547, 3.9724268913269043, 4.283282279968262, 4.594137191772461, 4.904992580413818, 5.215847969055176, 5.526702880859375, 5.837558269500732, 6.14841365814209, 6.459269046783447, 6.770124435424805, 7.080979347229004, 7.391834735870361]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 6.0, 6.0, 12.0, 12.0, 13.0, 22.0, 20.0, 19.0, 20.0, 25.0, 28.0, 40.0, 32.0, 40.0, 38.0, 50.0, 41.0, 48.0, 47.0, 49.0, 53.0, 46.0, 33.0, 36.0, 39.0, 26.0, 30.0, 23.0, 23.0, 11.0, 17.0, 21.0, 16.0, 11.0, 9.0, 7.0, 5.0, 4.0, 5.0, 4.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55970573425293, -4.413398742675781, -4.267091751098633, -4.120784759521484, -3.974478006362915, -3.8281710147857666, -3.6818642616271973, -3.535557270050049, -3.3892502784729004, -3.242943286895752, -3.0966362953186035, -2.950329542160034, -2.8040225505828857, -2.6577155590057373, -2.511408805847168, -2.3651018142700195, -2.218794822692871, -2.0724878311157227, -1.9261809587478638, -1.7798740863800049, -1.6335670948028564, -1.487260103225708, -1.3409532308578491, -1.1946463584899902, -1.0483393669128418, -0.9020324349403381, -0.7557255029678345, -0.6094185709953308, -0.46311163902282715, -0.3168047070503235, -0.17049777507781982, -0.024190902709960938, 0.1221156120300293, 0.26842254400253296, 0.4147294759750366, 0.5610364079475403, 0.707343339920044, 0.8536502718925476, 0.9999572038650513, 1.1462640762329102, 1.2925710678100586, 1.438878059387207, 1.585184931755066, 1.7314918041229248, 1.8777987957000732, 2.0241057872772217, 2.170412540435791, 2.3167195320129395, 2.463026523590088, 2.6093335151672363, 2.7556405067443848, 2.901947259902954, 3.0482542514801025, 3.194561243057251, 3.3408679962158203, 3.4871749877929688, 3.633481979370117, 3.7797889709472656, 3.926095962524414, 4.0724029541015625, 4.218709945678711, 4.365016460418701, 4.51132345199585, 4.657630443572998, 4.8039374351501465]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 7.0, 19.0, 30.0, 43.0, 60.0, 64.0, 138.0, 200.0, 303.0, 419.0, 662.0, 943.0, 1490.0, 2312.0, 3700.0, 6039.0, 10041.0, 17556.0, 32840.0, 68120.0, 163997.0, 464194.0, 1205593.0, 1310406.0, 545341.0, 193945.0, 79481.0, 37752.0, 19703.0, 11244.0, 6609.0, 3960.0, 2432.0, 1544.0, 1062.0, 636.0, 447.0, 311.0, 193.0, 130.0, 97.0, 68.0, 61.0, 25.0, 19.0, 12.0, 10.0, 12.0, 9.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.0, -8.6904296875, -8.380859375, -8.0712890625, -7.76171875, -7.4521484375, -7.142578125, -6.8330078125, -6.5234375, -6.2138671875, -5.904296875, -5.5947265625, -5.28515625, -4.9755859375, -4.666015625, -4.3564453125, -4.046875, -3.7373046875, -3.427734375, -3.1181640625, -2.80859375, -2.4990234375, -2.189453125, -1.8798828125, -1.5703125, -1.2607421875, -0.951171875, -0.6416015625, -0.33203125, -0.0224609375, 0.287109375, 0.5966796875, 0.90625, 1.2158203125, 1.525390625, 1.8349609375, 2.14453125, 2.4541015625, 2.763671875, 3.0732421875, 3.3828125, 3.6923828125, 4.001953125, 4.3115234375, 4.62109375, 4.9306640625, 5.240234375, 5.5498046875, 5.859375, 6.1689453125, 6.478515625, 6.7880859375, 7.09765625, 7.4072265625, 7.716796875, 8.0263671875, 8.3359375, 8.6455078125, 8.955078125, 9.2646484375, 9.57421875, 9.8837890625, 10.193359375, 10.5029296875, 10.8125]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 7.0, 12.0, 9.0, 12.0, 14.0, 12.0, 9.0, 23.0, 32.0, 28.0, 26.0, 30.0, 41.0, 41.0, 45.0, 36.0, 43.0, 52.0, 45.0, 45.0, 52.0, 41.0, 44.0, 40.0, 37.0, 26.0, 30.0, 27.0, 18.0, 15.0, 27.0, 13.0, 14.0, 15.0, 4.0, 9.0, 8.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.685546875, -3.563385009765625, -3.44122314453125, -3.319061279296875, -3.1968994140625, -3.074737548828125, -2.95257568359375, -2.830413818359375, -2.708251953125, -2.586090087890625, -2.46392822265625, -2.341766357421875, -2.2196044921875, -2.097442626953125, -1.97528076171875, -1.853118896484375, -1.73095703125, -1.608795166015625, -1.48663330078125, -1.364471435546875, -1.2423095703125, -1.120147705078125, -0.99798583984375, -0.875823974609375, -0.753662109375, -0.631500244140625, -0.50933837890625, -0.387176513671875, -0.2650146484375, -0.142852783203125, -0.02069091796875, 0.101470947265625, 0.2236328125, 0.345794677734375, 0.46795654296875, 0.590118408203125, 0.7122802734375, 0.834442138671875, 0.95660400390625, 1.078765869140625, 1.200927734375, 1.323089599609375, 1.44525146484375, 1.567413330078125, 1.6895751953125, 1.811737060546875, 1.93389892578125, 2.056060791015625, 2.17822265625, 2.300384521484375, 2.42254638671875, 2.544708251953125, 2.6668701171875, 2.789031982421875, 2.91119384765625, 3.033355712890625, 3.155517578125, 3.277679443359375, 3.39984130859375, 3.522003173828125, 3.6441650390625, 3.766326904296875, 3.88848876953125, 4.010650634765625, 4.1328125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 8.0, 8.0, 23.0, 25.0, 32.0, 63.0, 87.0, 124.0, 183.0, 260.0, 374.0, 591.0, 898.0, 1410.0, 2296.0, 3676.0, 6267.0, 11005.0, 19586.0, 36817.0, 74005.0, 157721.0, 387037.0, 1013603.0, 1379014.0, 636536.0, 243816.0, 105425.0, 51402.0, 26392.0, 14341.0, 8209.0, 4867.0, 2889.0, 1825.0, 1194.0, 716.0, 477.0, 333.0, 222.0, 156.0, 109.0, 74.0, 55.0, 36.0, 31.0, 16.0, 19.0, 15.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.09375, -10.749755859375, -10.40576171875, -10.061767578125, -9.7177734375, -9.373779296875, -9.02978515625, -8.685791015625, -8.341796875, -7.997802734375, -7.65380859375, -7.309814453125, -6.9658203125, -6.621826171875, -6.27783203125, -5.933837890625, -5.58984375, -5.245849609375, -4.90185546875, -4.557861328125, -4.2138671875, -3.869873046875, -3.52587890625, -3.181884765625, -2.837890625, -2.493896484375, -2.14990234375, -1.805908203125, -1.4619140625, -1.117919921875, -0.77392578125, -0.429931640625, -0.0859375, 0.258056640625, 0.60205078125, 0.946044921875, 1.2900390625, 1.634033203125, 1.97802734375, 2.322021484375, 2.666015625, 3.010009765625, 3.35400390625, 3.697998046875, 4.0419921875, 4.385986328125, 4.72998046875, 5.073974609375, 5.41796875, 5.761962890625, 6.10595703125, 6.449951171875, 6.7939453125, 7.137939453125, 7.48193359375, 7.825927734375, 8.169921875, 8.513916015625, 8.85791015625, 9.201904296875, 9.5458984375, 9.889892578125, 10.23388671875, 10.577880859375, 10.921875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 13.0, 10.0, 23.0, 17.0, 15.0, 24.0, 51.0, 52.0, 56.0, 80.0, 98.0, 127.0, 170.0, 214.0, 252.0, 305.0, 348.0, 355.0, 290.0, 283.0, 265.0, 216.0, 165.0, 160.0, 108.0, 75.0, 61.0, 69.0, 38.0, 31.0, 24.0, 16.0, 12.0, 8.0, 2.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.717315673828125, -2.62994384765625, -2.542572021484375, -2.4552001953125, -2.367828369140625, -2.28045654296875, -2.193084716796875, -2.105712890625, -2.018341064453125, -1.93096923828125, -1.843597412109375, -1.7562255859375, -1.668853759765625, -1.58148193359375, -1.494110107421875, -1.40673828125, -1.319366455078125, -1.23199462890625, -1.144622802734375, -1.0572509765625, -0.969879150390625, -0.88250732421875, -0.795135498046875, -0.707763671875, -0.620391845703125, -0.53302001953125, -0.445648193359375, -0.3582763671875, -0.270904541015625, -0.18353271484375, -0.096160888671875, -0.0087890625, 0.078582763671875, 0.16595458984375, 0.253326416015625, 0.3406982421875, 0.428070068359375, 0.51544189453125, 0.602813720703125, 0.690185546875, 0.777557373046875, 0.86492919921875, 0.952301025390625, 1.0396728515625, 1.127044677734375, 1.21441650390625, 1.301788330078125, 1.38916015625, 1.476531982421875, 1.56390380859375, 1.651275634765625, 1.7386474609375, 1.826019287109375, 1.91339111328125, 2.000762939453125, 2.088134765625, 2.175506591796875, 2.26287841796875, 2.350250244140625, 2.4376220703125, 2.524993896484375, 2.61236572265625, 2.699737548828125, 2.787109375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 8.0, 8.0, 10.0, 11.0, 21.0, 25.0, 37.0, 37.0, 54.0, 65.0, 65.0, 93.0, 93.0, 99.0, 101.0, 75.0, 57.0, 26.0, 24.0, 12.0, 23.0, 11.0, 10.0, 12.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.812979698181152, -10.431965827941895, -10.050951957702637, -9.669939041137695, -9.288925170898438, -8.90791130065918, -8.526897430419922, -8.145883560180664, -7.764869689941406, -7.383855819702148, -7.002842426300049, -6.621828556060791, -6.240814685821533, -5.859801292419434, -5.478787422180176, -5.097773551940918, -4.716760158538818, -4.3357462882995605, -3.954732656478882, -3.573719024658203, -3.1927051544189453, -2.8116915225982666, -2.430677890777588, -2.04966402053833, -1.6686503887176514, -1.287636637687683, -0.9066229462623596, -0.5256092548370361, -0.14459550380706787, 0.2364182472229004, 0.6174318790435791, 0.9984457492828369, 1.3794593811035156, 1.7604731321334839, 2.141486883163452, 2.522500514984131, 2.9035143852233887, 3.2845280170440674, 3.665541648864746, 4.046555519104004, 4.427569389343262, 4.8085832595825195, 5.189596652984619, 5.570610523223877, 5.951624393463135, 6.332637786865234, 6.713651657104492, 7.09466552734375, 7.47567892074585, 7.856692790985107, 8.237706184387207, 8.618720054626465, 8.999733924865723, 9.38074779510498, 9.761760711669922, 10.14277458190918, 10.523788452148438, 10.904802322387695, 11.285816192626953, 11.666830062866211, 12.047842979431152, 12.42885684967041, 12.809870719909668, 13.190884590148926, 13.571898460388184]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 4.0, 2.0, 7.0, 7.0, 7.0, 10.0, 15.0, 12.0, 26.0, 29.0, 24.0, 28.0, 29.0, 56.0, 37.0, 51.0, 44.0, 44.0, 55.0, 48.0, 38.0, 49.0, 40.0, 50.0, 38.0, 35.0, 33.0, 28.0, 24.0, 30.0, 19.0, 17.0, 16.0, 10.0, 12.0, 5.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.688699722290039, -5.51816463470459, -5.347629547119141, -5.177094459533691, -5.006559371948242, -4.836024284362793, -4.665489196777344, -4.4949541091918945, -4.324419021606445, -4.153883934020996, -3.983348846435547, -3.8128137588500977, -3.6422786712646484, -3.471743583679199, -3.30120849609375, -3.130673408508301, -2.9601383209228516, -2.7896032333374023, -2.619068145751953, -2.448533058166504, -2.2779979705810547, -2.1074628829956055, -1.9369277954101562, -1.766392707824707, -1.5958576202392578, -1.4253225326538086, -1.2547874450683594, -1.0842523574829102, -0.9137172698974609, -0.7431821823120117, -0.5726470947265625, -0.4021120071411133, -0.23157691955566406, -0.061041831970214844, 0.10949325561523438, 0.2800283432006836, 0.4505634307861328, 0.621098518371582, 0.7916336059570312, 0.9621686935424805, 1.1327037811279297, 1.303238868713379, 1.4737739562988281, 1.6443090438842773, 1.8148441314697266, 1.9853792190551758, 2.155914306640625, 2.326449394226074, 2.4969844818115234, 2.6675195693969727, 2.838054656982422, 3.008589744567871, 3.1791248321533203, 3.3496599197387695, 3.5201950073242188, 3.690730094909668, 3.861265182495117, 4.031800270080566, 4.202335357666016, 4.372870445251465, 4.543405532836914, 4.713940620422363, 4.8844757080078125, 5.055010795593262, 5.225545883178711]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 10.0, 10.0, 14.0, 24.0, 25.0, 57.0, 70.0, 81.0, 154.0, 265.0, 336.0, 491.0, 808.0, 1172.0, 1861.0, 3026.0, 4665.0, 7697.0, 12686.0, 21605.0, 35995.0, 60638.0, 99437.0, 149626.0, 184632.0, 166201.0, 116209.0, 72299.0, 43508.0, 25441.0, 15251.0, 9129.0, 5644.0, 3391.0, 2101.0, 1301.0, 889.0, 601.0, 414.0, 247.0, 173.0, 108.0, 94.0, 49.0, 29.0, 29.0, 19.0, 11.0, 10.0, 7.0, 5.0, 8.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.61328125, -3.502685546875, -3.39208984375, -3.281494140625, -3.1708984375, -3.060302734375, -2.94970703125, -2.839111328125, -2.728515625, -2.617919921875, -2.50732421875, -2.396728515625, -2.2861328125, -2.175537109375, -2.06494140625, -1.954345703125, -1.84375, -1.733154296875, -1.62255859375, -1.511962890625, -1.4013671875, -1.290771484375, -1.18017578125, -1.069580078125, -0.958984375, -0.848388671875, -0.73779296875, -0.627197265625, -0.5166015625, -0.406005859375, -0.29541015625, -0.184814453125, -0.07421875, 0.036376953125, 0.14697265625, 0.257568359375, 0.3681640625, 0.478759765625, 0.58935546875, 0.699951171875, 0.810546875, 0.921142578125, 1.03173828125, 1.142333984375, 1.2529296875, 1.363525390625, 1.47412109375, 1.584716796875, 1.6953125, 1.805908203125, 1.91650390625, 2.027099609375, 2.1376953125, 2.248291015625, 2.35888671875, 2.469482421875, 2.580078125, 2.690673828125, 2.80126953125, 2.911865234375, 3.0224609375, 3.133056640625, 3.24365234375, 3.354248046875, 3.46484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 3.0, 10.0, 7.0, 13.0, 15.0, 10.0, 14.0, 28.0, 27.0, 33.0, 34.0, 39.0, 43.0, 49.0, 39.0, 49.0, 53.0, 50.0, 46.0, 52.0, 41.0, 34.0, 44.0, 49.0, 36.0, 26.0, 21.0, 26.0, 23.0, 21.0, 19.0, 6.0, 10.0, 8.0, 7.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.5703125, -6.37530517578125, -6.1802978515625, -5.98529052734375, -5.790283203125, -5.59527587890625, -5.4002685546875, -5.20526123046875, -5.01025390625, -4.81524658203125, -4.6202392578125, -4.42523193359375, -4.230224609375, -4.03521728515625, -3.8402099609375, -3.64520263671875, -3.4501953125, -3.25518798828125, -3.0601806640625, -2.86517333984375, -2.670166015625, -2.47515869140625, -2.2801513671875, -2.08514404296875, -1.89013671875, -1.69512939453125, -1.5001220703125, -1.30511474609375, -1.110107421875, -0.91510009765625, -0.7200927734375, -0.52508544921875, -0.330078125, -0.13507080078125, 0.0599365234375, 0.25494384765625, 0.449951171875, 0.64495849609375, 0.8399658203125, 1.03497314453125, 1.22998046875, 1.42498779296875, 1.6199951171875, 1.81500244140625, 2.010009765625, 2.20501708984375, 2.4000244140625, 2.59503173828125, 2.7900390625, 2.98504638671875, 3.1800537109375, 3.37506103515625, 3.570068359375, 3.76507568359375, 3.9600830078125, 4.15509033203125, 4.35009765625, 4.54510498046875, 4.7401123046875, 4.93511962890625, 5.130126953125, 5.32513427734375, 5.5201416015625, 5.71514892578125, 5.91015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 11.0, 12.0, 10.0, 15.0, 24.0, 31.0, 47.0, 71.0, 121.0, 187.0, 291.0, 487.0, 655.0, 1175.0, 2177.0, 3724.0, 6837.0, 13089.0, 25992.0, 55005.0, 120289.0, 251163.0, 286763.0, 147555.0, 67094.0, 31551.0, 15617.0, 7979.0, 4372.0, 2497.0, 1456.0, 841.0, 522.0, 300.0, 187.0, 132.0, 97.0, 67.0, 41.0, 26.0, 17.0, 7.0, 11.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.625, -6.425048828125, -6.22509765625, -6.025146484375, -5.8251953125, -5.625244140625, -5.42529296875, -5.225341796875, -5.025390625, -4.825439453125, -4.62548828125, -4.425537109375, -4.2255859375, -4.025634765625, -3.82568359375, -3.625732421875, -3.42578125, -3.225830078125, -3.02587890625, -2.825927734375, -2.6259765625, -2.426025390625, -2.22607421875, -2.026123046875, -1.826171875, -1.626220703125, -1.42626953125, -1.226318359375, -1.0263671875, -0.826416015625, -0.62646484375, -0.426513671875, -0.2265625, -0.026611328125, 0.17333984375, 0.373291015625, 0.5732421875, 0.773193359375, 0.97314453125, 1.173095703125, 1.373046875, 1.572998046875, 1.77294921875, 1.972900390625, 2.1728515625, 2.372802734375, 2.57275390625, 2.772705078125, 2.97265625, 3.172607421875, 3.37255859375, 3.572509765625, 3.7724609375, 3.972412109375, 4.17236328125, 4.372314453125, 4.572265625, 4.772216796875, 4.97216796875, 5.172119140625, 5.3720703125, 5.572021484375, 5.77197265625, 5.971923828125, 6.171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 11.0, 6.0, 5.0, 5.0, 11.0, 4.0, 12.0, 10.0, 19.0, 9.0, 16.0, 26.0, 19.0, 21.0, 41.0, 27.0, 34.0, 43.0, 34.0, 43.0, 50.0, 40.0, 35.0, 26.0, 38.0, 38.0, 46.0, 32.0, 37.0, 26.0, 26.0, 29.0, 27.0, 26.0, 19.0, 21.0, 20.0, 14.0, 9.0, 10.0, 10.0, 10.0, 4.0, 5.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-3.0234375, -2.935546875, -2.84765625, -2.759765625, -2.671875, -2.583984375, -2.49609375, -2.408203125, -2.3203125, -2.232421875, -2.14453125, -2.056640625, -1.96875, -1.880859375, -1.79296875, -1.705078125, -1.6171875, -1.529296875, -1.44140625, -1.353515625, -1.265625, -1.177734375, -1.08984375, -1.001953125, -0.9140625, -0.826171875, -0.73828125, -0.650390625, -0.5625, -0.474609375, -0.38671875, -0.298828125, -0.2109375, -0.123046875, -0.03515625, 0.052734375, 0.140625, 0.228515625, 0.31640625, 0.404296875, 0.4921875, 0.580078125, 0.66796875, 0.755859375, 0.84375, 0.931640625, 1.01953125, 1.107421875, 1.1953125, 1.283203125, 1.37109375, 1.458984375, 1.546875, 1.634765625, 1.72265625, 1.810546875, 1.8984375, 1.986328125, 2.07421875, 2.162109375, 2.25, 2.337890625, 2.42578125, 2.513671875, 2.6015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 4.0, 4.0, 8.0, 15.0, 27.0, 43.0, 70.0, 123.0, 190.0, 318.0, 491.0, 808.0, 1404.0, 2547.0, 4592.0, 8628.0, 16626.0, 35058.0, 78198.0, 179955.0, 316637.0, 219883.0, 97171.0, 42843.0, 20232.0, 10173.0, 5300.0, 2913.0, 1736.0, 1013.0, 603.0, 357.0, 218.0, 142.0, 82.0, 59.0, 35.0, 20.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.12689208984375, -3.0213623046875, -2.91583251953125, -2.810302734375, -2.70477294921875, -2.5992431640625, -2.49371337890625, -2.38818359375, -2.28265380859375, -2.1771240234375, -2.07159423828125, -1.966064453125, -1.86053466796875, -1.7550048828125, -1.64947509765625, -1.5439453125, -1.43841552734375, -1.3328857421875, -1.22735595703125, -1.121826171875, -1.01629638671875, -0.9107666015625, -0.80523681640625, -0.69970703125, -0.59417724609375, -0.4886474609375, -0.38311767578125, -0.277587890625, -0.17205810546875, -0.0665283203125, 0.03900146484375, 0.14453125, 0.25006103515625, 0.3555908203125, 0.46112060546875, 0.566650390625, 0.67218017578125, 0.7777099609375, 0.88323974609375, 0.98876953125, 1.09429931640625, 1.1998291015625, 1.30535888671875, 1.410888671875, 1.51641845703125, 1.6219482421875, 1.72747802734375, 1.8330078125, 1.93853759765625, 2.0440673828125, 2.14959716796875, 2.255126953125, 2.36065673828125, 2.4661865234375, 2.57171630859375, 2.67724609375, 2.78277587890625, 2.8883056640625, 2.99383544921875, 3.099365234375, 3.20489501953125, 3.3104248046875, 3.41595458984375, 3.521484375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 6.0, 3.0, 15.0, 12.0, 18.0, 34.0, 32.0, 40.0, 39.0, 44.0, 64.0, 60.0, 74.0, 63.0, 67.0, 74.0, 61.0, 57.0, 39.0, 44.0, 31.0, 24.0, 13.0, 12.0, 9.0, 14.0, 5.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.934736251831055e-05, -8.594151586294174e-05, -8.253566920757294e-05, -7.912982255220413e-05, -7.572397589683533e-05, -7.231812924146652e-05, -6.891228258609772e-05, -6.550643593072891e-05, -6.210058927536011e-05, -5.86947426199913e-05, -5.52888959646225e-05, -5.188304930925369e-05, -4.847720265388489e-05, -4.507135599851608e-05, -4.166550934314728e-05, -3.825966268777847e-05, -3.485381603240967e-05, -3.144796937704086e-05, -2.8042122721672058e-05, -2.4636276066303253e-05, -2.1230429410934448e-05, -1.7824582755565643e-05, -1.4418736100196838e-05, -1.1012889444828033e-05, -7.6070427894592285e-06, -4.201196134090424e-06, -7.953494787216187e-07, 2.6104971766471863e-06, 6.016343832015991e-06, 9.422190487384796e-06, 1.2828037142753601e-05, 1.6233883798122406e-05, 1.963973045349121e-05, 2.3045577108860016e-05, 2.645142376422882e-05, 2.9857270419597626e-05, 3.326311707496643e-05, 3.6668963730335236e-05, 4.007481038570404e-05, 4.3480657041072845e-05, 4.688650369644165e-05, 5.0292350351810455e-05, 5.369819700717926e-05, 5.7104043662548065e-05, 6.050989031791687e-05, 6.391573697328568e-05, 6.732158362865448e-05, 7.072743028402328e-05, 7.413327693939209e-05, 7.75391235947609e-05, 8.09449702501297e-05, 8.43508169054985e-05, 8.775666356086731e-05, 9.116251021623611e-05, 9.456835687160492e-05, 9.797420352697372e-05, 0.00010138005018234253, 0.00010478589683771133, 0.00010819174349308014, 0.00011159759014844894, 0.00011500343680381775, 0.00011840928345918655, 0.00012181513011455536, 0.00012522097676992416, 0.00012862682342529297]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [5.0, 2.0, 10.0, 9.0, 14.0, 28.0, 39.0, 46.0, 72.0, 93.0, 120.0, 180.0, 245.0, 399.0, 550.0, 787.0, 1169.0, 1839.0, 2571.0, 4180.0, 6029.0, 9455.0, 14868.0, 23101.0, 36863.0, 58082.0, 89746.0, 129795.0, 162055.0, 157524.0, 121070.0, 82160.0, 52688.0, 33383.0, 20723.0, 13337.0, 8571.0, 5496.0, 3602.0, 2468.0, 1633.0, 1109.0, 740.0, 506.0, 383.0, 235.0, 176.0, 123.0, 90.0, 66.0, 41.0, 30.0, 19.0, 19.0, 9.0, 10.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7919921875, -1.7299652099609375, -1.667938232421875, -1.6059112548828125, -1.54388427734375, -1.4818572998046875, -1.419830322265625, -1.3578033447265625, -1.2957763671875, -1.2337493896484375, -1.171722412109375, -1.1096954345703125, -1.04766845703125, -0.9856414794921875, -0.923614501953125, -0.8615875244140625, -0.799560546875, -0.7375335693359375, -0.675506591796875, -0.6134796142578125, -0.55145263671875, -0.4894256591796875, -0.427398681640625, -0.3653717041015625, -0.3033447265625, -0.2413177490234375, -0.179290771484375, -0.1172637939453125, -0.05523681640625, 0.0067901611328125, 0.068817138671875, 0.1308441162109375, 0.19287109375, 0.2548980712890625, 0.316925048828125, 0.3789520263671875, 0.44097900390625, 0.5030059814453125, 0.565032958984375, 0.6270599365234375, 0.6890869140625, 0.7511138916015625, 0.813140869140625, 0.8751678466796875, 0.93719482421875, 0.9992218017578125, 1.061248779296875, 1.1232757568359375, 1.185302734375, 1.2473297119140625, 1.309356689453125, 1.3713836669921875, 1.43341064453125, 1.4954376220703125, 1.557464599609375, 1.6194915771484375, 1.6815185546875, 1.7435455322265625, 1.805572509765625, 1.8675994873046875, 1.92962646484375, 1.9916534423828125, 2.053680419921875, 2.1157073974609375, 2.177734375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 6.0, 8.0, 8.0, 14.0, 15.0, 23.0, 26.0, 26.0, 36.0, 42.0, 50.0, 62.0, 62.0, 51.0, 87.0, 64.0, 65.0, 49.0, 58.0, 33.0, 36.0, 38.0, 23.0, 19.0, 17.0, 12.0, 8.0, 13.0, 12.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8056640625, -0.7835235595703125, -0.761383056640625, -0.7392425537109375, -0.71710205078125, -0.6949615478515625, -0.672821044921875, -0.6506805419921875, -0.6285400390625, -0.6063995361328125, -0.584259033203125, -0.5621185302734375, -0.53997802734375, -0.5178375244140625, -0.495697021484375, -0.4735565185546875, -0.451416015625, -0.4292755126953125, -0.407135009765625, -0.3849945068359375, -0.36285400390625, -0.3407135009765625, -0.318572998046875, -0.2964324951171875, -0.2742919921875, -0.2521514892578125, -0.230010986328125, -0.2078704833984375, -0.18572998046875, -0.1635894775390625, -0.141448974609375, -0.1193084716796875, -0.09716796875, -0.0750274658203125, -0.052886962890625, -0.0307464599609375, -0.00860595703125, 0.0135345458984375, 0.035675048828125, 0.0578155517578125, 0.0799560546875, 0.1020965576171875, 0.124237060546875, 0.1463775634765625, 0.16851806640625, 0.1906585693359375, 0.212799072265625, 0.2349395751953125, 0.257080078125, 0.2792205810546875, 0.301361083984375, 0.3235015869140625, 0.34564208984375, 0.3677825927734375, 0.389923095703125, 0.4120635986328125, 0.4342041015625, 0.4563446044921875, 0.478485107421875, 0.5006256103515625, 0.52276611328125, 0.5449066162109375, 0.567047119140625, 0.5891876220703125, 0.611328125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 2.0, 10.0, 12.0, 11.0, 15.0, 30.0, 27.0, 38.0, 39.0, 67.0, 58.0, 79.0, 89.0, 107.0, 83.0, 74.0, 58.0, 46.0, 34.0, 27.0, 17.0, 17.0, 9.0, 8.0, 12.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.631583213806152, -10.2763090133667, -9.921034812927246, -9.565760612487793, -9.21048641204834, -8.855212211608887, -8.499937057495117, -8.144662857055664, -7.789389133453369, -7.434114933013916, -7.078840732574463, -6.723566055297852, -6.368291854858398, -6.013017654418945, -5.657743453979492, -5.302469253540039, -4.947195053100586, -4.591920852661133, -4.23664665222168, -3.8813722133636475, -3.5260980129241943, -3.170823812484741, -2.815549373626709, -2.460275173187256, -2.1050009727478027, -1.7497267723083496, -1.394452452659607, -1.0391781330108643, -0.6839039325714111, -0.328629732131958, 0.02664470672607422, 0.38191890716552734, 0.7371931076049805, 1.0924673080444336, 1.4477416276931763, 1.803015947341919, 2.158290147781372, 2.513564348220825, 2.8688387870788574, 3.2241129875183105, 3.5793871879577637, 3.934661388397217, 4.28993558883667, 4.645210266113281, 5.000484466552734, 5.3557586669921875, 5.711032867431641, 6.066307067871094, 6.421581268310547, 6.77685546875, 7.132129669189453, 7.487403869628906, 7.842678070068359, 8.197952270507812, 8.553226470947266, 8.908500671386719, 9.263774871826172, 9.619049072265625, 9.974323272705078, 10.329597473144531, 10.684871673583984, 11.040145874023438, 11.39542007446289, 11.750694274902344, 12.105969429016113]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 5.0, 5.0, 6.0, 7.0, 14.0, 10.0, 15.0, 11.0, 34.0, 19.0, 31.0, 26.0, 33.0, 46.0, 47.0, 43.0, 41.0, 55.0, 48.0, 47.0, 48.0, 40.0, 42.0, 44.0, 43.0, 31.0, 32.0, 32.0, 25.0, 17.0, 21.0, 14.0, 22.0, 12.0, 10.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.483592987060547, -5.317099571228027, -5.150606155395508, -4.984112739562988, -4.817619323730469, -4.651125907897949, -4.48463249206543, -4.318138599395752, -4.151645183563232, -3.985151767730713, -3.8186583518981934, -3.652164936065674, -3.485671281814575, -3.3191778659820557, -3.152684450149536, -2.9861907958984375, -2.819697618484497, -2.6532042026519775, -2.486710786819458, -2.3202171325683594, -2.15372371673584, -1.9872303009033203, -1.8207368850708008, -1.6542433500289917, -1.4877499341964722, -1.3212565183639526, -1.1547629833221436, -0.988269567489624, -0.8217760920524597, -0.6552826166152954, -0.4887892007827759, -0.3222956657409668, -0.15580224990844727, 0.010691210627555847, 0.17718467116355896, 0.3436781167984009, 0.5101715922355652, 0.6766650676727295, 0.843158483505249, 1.009652018547058, 1.1761454343795776, 1.3426388502120972, 1.5091323852539062, 1.6756258010864258, 1.8421192169189453, 2.008612632751465, 2.1751060485839844, 2.341599702835083, 2.5080931186676025, 2.674586534500122, 2.8410799503326416, 3.0075736045837402, 3.1740670204162598, 3.3405604362487793, 3.507053852081299, 3.6735472679138184, 3.840040683746338, 4.006534099578857, 4.173027515411377, 4.3395209312438965, 4.506014347076416, 4.672508239746094, 4.839001655578613, 5.005495071411133, 5.171988487243652]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 5.0, 14.0, 23.0, 19.0, 34.0, 45.0, 91.0, 142.0, 236.0, 335.0, 567.0, 1013.0, 1541.0, 2530.0, 4334.0, 7110.0, 12259.0, 19948.0, 33004.0, 53764.0, 84936.0, 123766.0, 156783.0, 161887.0, 133449.0, 94122.0, 61337.0, 37597.0, 22808.0, 13847.0, 8274.0, 5013.0, 2954.0, 1792.0, 1152.0, 688.0, 428.0, 266.0, 157.0, 90.0, 76.0, 31.0, 32.0, 20.0, 18.0, 9.0, 8.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.58544921875, -3.4482421875, -3.31103515625, -3.173828125, -3.03662109375, -2.8994140625, -2.76220703125, -2.625, -2.48779296875, -2.3505859375, -2.21337890625, -2.076171875, -1.93896484375, -1.8017578125, -1.66455078125, -1.52734375, -1.39013671875, -1.2529296875, -1.11572265625, -0.978515625, -0.84130859375, -0.7041015625, -0.56689453125, -0.4296875, -0.29248046875, -0.1552734375, -0.01806640625, 0.119140625, 0.25634765625, 0.3935546875, 0.53076171875, 0.66796875, 0.80517578125, 0.9423828125, 1.07958984375, 1.216796875, 1.35400390625, 1.4912109375, 1.62841796875, 1.765625, 1.90283203125, 2.0400390625, 2.17724609375, 2.314453125, 2.45166015625, 2.5888671875, 2.72607421875, 2.86328125, 3.00048828125, 3.1376953125, 3.27490234375, 3.412109375, 3.54931640625, 3.6865234375, 3.82373046875, 3.9609375, 4.09814453125, 4.2353515625, 4.37255859375, 4.509765625, 4.64697265625, 4.7841796875, 4.92138671875, 5.05859375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 0.0, 5.0, 4.0, 6.0, 8.0, 8.0, 15.0, 8.0, 11.0, 25.0, 22.0, 15.0, 22.0, 27.0, 27.0, 21.0, 31.0, 50.0, 33.0, 38.0, 42.0, 46.0, 46.0, 45.0, 32.0, 35.0, 34.0, 34.0, 35.0, 38.0, 38.0, 25.0, 32.0, 16.0, 16.0, 16.0, 20.0, 14.0, 15.0, 9.0, 6.0, 3.0, 5.0, 5.0, 6.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.33984375, -5.18145751953125, -5.0230712890625, -4.86468505859375, -4.706298828125, -4.54791259765625, -4.3895263671875, -4.23114013671875, -4.07275390625, -3.91436767578125, -3.7559814453125, -3.59759521484375, -3.439208984375, -3.28082275390625, -3.1224365234375, -2.96405029296875, -2.8056640625, -2.64727783203125, -2.4888916015625, -2.33050537109375, -2.172119140625, -2.01373291015625, -1.8553466796875, -1.69696044921875, -1.53857421875, -1.38018798828125, -1.2218017578125, -1.06341552734375, -0.905029296875, -0.74664306640625, -0.5882568359375, -0.42987060546875, -0.271484375, -0.11309814453125, 0.0452880859375, 0.20367431640625, 0.362060546875, 0.52044677734375, 0.6788330078125, 0.83721923828125, 0.99560546875, 1.15399169921875, 1.3123779296875, 1.47076416015625, 1.629150390625, 1.78753662109375, 1.9459228515625, 2.10430908203125, 2.2626953125, 2.42108154296875, 2.5794677734375, 2.73785400390625, 2.896240234375, 3.05462646484375, 3.2130126953125, 3.37139892578125, 3.52978515625, 3.68817138671875, 3.8465576171875, 4.00494384765625, 4.163330078125, 4.32171630859375, 4.4801025390625, 4.63848876953125, 4.796875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 8.0, 2.0, 7.0, 8.0, 25.0, 33.0, 55.0, 82.0, 104.0, 150.0, 220.0, 365.0, 564.0, 864.0, 1500.0, 2223.0, 3523.0, 5621.0, 9100.0, 14962.0, 24045.0, 39149.0, 61849.0, 93204.0, 128973.0, 153893.0, 150124.0, 122145.0, 86647.0, 56326.0, 35329.0, 21524.0, 13520.0, 8391.0, 5107.0, 3232.0, 2079.0, 1255.0, 813.0, 528.0, 342.0, 249.0, 144.0, 106.0, 65.0, 44.0, 30.0, 15.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.1953125, -4.05499267578125, -3.9146728515625, -3.77435302734375, -3.634033203125, -3.49371337890625, -3.3533935546875, -3.21307373046875, -3.07275390625, -2.93243408203125, -2.7921142578125, -2.65179443359375, -2.511474609375, -2.37115478515625, -2.2308349609375, -2.09051513671875, -1.9501953125, -1.80987548828125, -1.6695556640625, -1.52923583984375, -1.388916015625, -1.24859619140625, -1.1082763671875, -0.96795654296875, -0.82763671875, -0.68731689453125, -0.5469970703125, -0.40667724609375, -0.266357421875, -0.12603759765625, 0.0142822265625, 0.15460205078125, 0.294921875, 0.43524169921875, 0.5755615234375, 0.71588134765625, 0.856201171875, 0.99652099609375, 1.1368408203125, 1.27716064453125, 1.41748046875, 1.55780029296875, 1.6981201171875, 1.83843994140625, 1.978759765625, 2.11907958984375, 2.2593994140625, 2.39971923828125, 2.5400390625, 2.68035888671875, 2.8206787109375, 2.96099853515625, 3.101318359375, 3.24163818359375, 3.3819580078125, 3.52227783203125, 3.66259765625, 3.80291748046875, 3.9432373046875, 4.08355712890625, 4.223876953125, 4.36419677734375, 4.5045166015625, 4.64483642578125, 4.78515625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 8.0, 11.0, 10.0, 14.0, 14.0, 15.0, 16.0, 30.0, 31.0, 31.0, 26.0, 35.0, 44.0, 35.0, 38.0, 32.0, 36.0, 42.0, 54.0, 41.0, 48.0, 48.0, 32.0, 45.0, 30.0, 38.0, 28.0, 24.0, 24.0, 12.0, 26.0, 16.0, 9.0, 13.0, 8.0, 8.0, 10.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.32421875, -3.21453857421875, -3.1048583984375, -2.99517822265625, -2.885498046875, -2.77581787109375, -2.6661376953125, -2.55645751953125, -2.44677734375, -2.33709716796875, -2.2274169921875, -2.11773681640625, -2.008056640625, -1.89837646484375, -1.7886962890625, -1.67901611328125, -1.5693359375, -1.45965576171875, -1.3499755859375, -1.24029541015625, -1.130615234375, -1.02093505859375, -0.9112548828125, -0.80157470703125, -0.69189453125, -0.58221435546875, -0.4725341796875, -0.36285400390625, -0.253173828125, -0.14349365234375, -0.0338134765625, 0.07586669921875, 0.185546875, 0.29522705078125, 0.4049072265625, 0.51458740234375, 0.624267578125, 0.73394775390625, 0.8436279296875, 0.95330810546875, 1.06298828125, 1.17266845703125, 1.2823486328125, 1.39202880859375, 1.501708984375, 1.61138916015625, 1.7210693359375, 1.83074951171875, 1.9404296875, 2.05010986328125, 2.1597900390625, 2.26947021484375, 2.379150390625, 2.48883056640625, 2.5985107421875, 2.70819091796875, 2.81787109375, 2.92755126953125, 3.0372314453125, 3.14691162109375, 3.256591796875, 3.36627197265625, 3.4759521484375, 3.58563232421875, 3.6953125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 6.0, 6.0, 18.0, 19.0, 33.0, 45.0, 48.0, 96.0, 99.0, 159.0, 224.0, 356.0, 481.0, 814.0, 1266.0, 1973.0, 3181.0, 5377.0, 9807.0, 18131.0, 35374.0, 72297.0, 145626.0, 238246.0, 233197.0, 138637.0, 68695.0, 33836.0, 17331.0, 9298.0, 5264.0, 3137.0, 1877.0, 1206.0, 771.0, 509.0, 321.0, 247.0, 139.0, 120.0, 79.0, 64.0, 37.0, 26.0, 22.0, 10.0, 11.0, 7.0, 11.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.85546875, -3.73095703125, -3.6064453125, -3.48193359375, -3.357421875, -3.23291015625, -3.1083984375, -2.98388671875, -2.859375, -2.73486328125, -2.6103515625, -2.48583984375, -2.361328125, -2.23681640625, -2.1123046875, -1.98779296875, -1.86328125, -1.73876953125, -1.6142578125, -1.48974609375, -1.365234375, -1.24072265625, -1.1162109375, -0.99169921875, -0.8671875, -0.74267578125, -0.6181640625, -0.49365234375, -0.369140625, -0.24462890625, -0.1201171875, 0.00439453125, 0.12890625, 0.25341796875, 0.3779296875, 0.50244140625, 0.626953125, 0.75146484375, 0.8759765625, 1.00048828125, 1.125, 1.24951171875, 1.3740234375, 1.49853515625, 1.623046875, 1.74755859375, 1.8720703125, 1.99658203125, 2.12109375, 2.24560546875, 2.3701171875, 2.49462890625, 2.619140625, 2.74365234375, 2.8681640625, 2.99267578125, 3.1171875, 3.24169921875, 3.3662109375, 3.49072265625, 3.615234375, 3.73974609375, 3.8642578125, 3.98876953125, 4.11328125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 7.0, 18.0, 15.0, 20.0, 25.0, 38.0, 37.0, 41.0, 58.0, 70.0, 73.0, 73.0, 79.0, 87.0, 72.0, 68.0, 53.0, 33.0, 30.0, 22.0, 18.0, 11.0, 11.0, 11.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003662109375, -0.00035634636878967285, -0.0003464818000793457, -0.00033661723136901855, -0.0003267526626586914, -0.00031688809394836426, -0.0003070235252380371, -0.00029715895652770996, -0.0002872943878173828, -0.00027742981910705566, -0.0002675652503967285, -0.00025770068168640137, -0.0002478361129760742, -0.00023797154426574707, -0.00022810697555541992, -0.00021824240684509277, -0.00020837783813476562, -0.00019851326942443848, -0.00018864870071411133, -0.00017878413200378418, -0.00016891956329345703, -0.00015905499458312988, -0.00014919042587280273, -0.00013932585716247559, -0.00012946128845214844, -0.00011959671974182129, -0.00010973215103149414, -9.986758232116699e-05, -9.000301361083984e-05, -8.01384449005127e-05, -7.027387619018555e-05, -6.04093074798584e-05, -5.054473876953125e-05, -4.06801700592041e-05, -3.081560134887695e-05, -2.0951032638549805e-05, -1.1086463928222656e-05, -1.2218952178955078e-06, 8.64267349243164e-06, 1.850724220275879e-05, 2.8371810913085938e-05, 3.8236379623413086e-05, 4.8100948333740234e-05, 5.796551704406738e-05, 6.783008575439453e-05, 7.769465446472168e-05, 8.755922317504883e-05, 9.742379188537598e-05, 0.00010728836059570312, 0.00011715292930603027, 0.00012701749801635742, 0.00013688206672668457, 0.00014674663543701172, 0.00015661120414733887, 0.00016647577285766602, 0.00017634034156799316, 0.0001862049102783203, 0.00019606947898864746, 0.0002059340476989746, 0.00021579861640930176, 0.0002256631851196289, 0.00023552775382995605, 0.0002453923225402832, 0.00025525689125061035, 0.0002651214599609375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 8.0, 14.0, 13.0, 25.0, 34.0, 56.0, 72.0, 131.0, 138.0, 254.0, 334.0, 545.0, 894.0, 1525.0, 2566.0, 4535.0, 8530.0, 17106.0, 37292.0, 89262.0, 205849.0, 306395.0, 208744.0, 89828.0, 37322.0, 17052.0, 8757.0, 4554.0, 2645.0, 1483.0, 926.0, 554.0, 363.0, 211.0, 166.0, 98.0, 65.0, 50.0, 34.0, 31.0, 24.0, 18.0, 10.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.3046875, -5.1463623046875, -4.988037109375, -4.8297119140625, -4.67138671875, -4.5130615234375, -4.354736328125, -4.1964111328125, -4.0380859375, -3.8797607421875, -3.721435546875, -3.5631103515625, -3.40478515625, -3.2464599609375, -3.088134765625, -2.9298095703125, -2.771484375, -2.6131591796875, -2.454833984375, -2.2965087890625, -2.13818359375, -1.9798583984375, -1.821533203125, -1.6632080078125, -1.5048828125, -1.3465576171875, -1.188232421875, -1.0299072265625, -0.87158203125, -0.7132568359375, -0.554931640625, -0.3966064453125, -0.23828125, -0.0799560546875, 0.078369140625, 0.2366943359375, 0.39501953125, 0.5533447265625, 0.711669921875, 0.8699951171875, 1.0283203125, 1.1866455078125, 1.344970703125, 1.5032958984375, 1.66162109375, 1.8199462890625, 1.978271484375, 2.1365966796875, 2.294921875, 2.4532470703125, 2.611572265625, 2.7698974609375, 2.92822265625, 3.0865478515625, 3.244873046875, 3.4031982421875, 3.5615234375, 3.7198486328125, 3.878173828125, 4.0364990234375, 4.19482421875, 4.3531494140625, 4.511474609375, 4.6697998046875, 4.828125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 13.0, 7.0, 17.0, 16.0, 23.0, 24.0, 40.0, 42.0, 53.0, 47.0, 69.0, 66.0, 72.0, 58.0, 66.0, 73.0, 46.0, 54.0, 37.0, 37.0, 23.0, 23.0, 14.0, 16.0, 9.0, 6.0, 12.0, 4.0, 3.0, 3.0, 8.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88916015625, -0.8572311401367188, -0.8253021240234375, -0.7933731079101562, -0.761444091796875, -0.7295150756835938, -0.6975860595703125, -0.6656570434570312, -0.63372802734375, -0.6017990112304688, -0.5698699951171875, -0.5379409790039062, -0.506011962890625, -0.47408294677734375, -0.4421539306640625, -0.41022491455078125, -0.3782958984375, -0.34636688232421875, -0.3144378662109375, -0.28250885009765625, -0.250579833984375, -0.21865081787109375, -0.1867218017578125, -0.15479278564453125, -0.12286376953125, -0.09093475341796875, -0.0590057373046875, -0.02707672119140625, 0.004852294921875, 0.03678131103515625, 0.0687103271484375, 0.10063934326171875, 0.132568359375, 0.16449737548828125, 0.1964263916015625, 0.22835540771484375, 0.260284423828125, 0.29221343994140625, 0.3241424560546875, 0.35607147216796875, 0.38800048828125, 0.41992950439453125, 0.4518585205078125, 0.48378753662109375, 0.515716552734375, 0.5476455688476562, 0.5795745849609375, 0.6115036010742188, 0.6434326171875, 0.6753616333007812, 0.7072906494140625, 0.7392196655273438, 0.771148681640625, 0.8030776977539062, 0.8350067138671875, 0.8669357299804688, 0.89886474609375, 0.9307937622070312, 0.9627227783203125, 0.9946517944335938, 1.026580810546875, 1.0585098266601562, 1.0904388427734375, 1.1223678588867188, 1.154296875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 4.0, 9.0, 6.0, 7.0, 13.0, 8.0, 15.0, 23.0, 34.0, 38.0, 32.0, 52.0, 68.0, 54.0, 71.0, 94.0, 89.0, 60.0, 73.0, 56.0, 44.0, 21.0, 30.0, 24.0, 16.0, 15.0, 11.0, 6.0, 5.0, 4.0, 5.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.061903953552246, -10.731118202209473, -10.4003324508667, -10.069546699523926, -9.738760948181152, -9.407975196838379, -9.077189445495605, -8.746404647827148, -8.415618896484375, -8.084833145141602, -7.754047393798828, -7.423261642456055, -7.092475891113281, -6.761690139770508, -6.430904865264893, -6.100119113922119, -5.7693328857421875, -5.438547134399414, -5.107761383056641, -4.776975631713867, -4.446189880371094, -4.11540412902832, -3.784618854522705, -3.4538331031799316, -3.123047351837158, -2.7922616004943848, -2.4614758491516113, -2.130690336227417, -1.7999045848846436, -1.4691188335418701, -1.1383332014083862, -0.8075475692749023, -0.4767608642578125, -0.14597517251968384, 0.18481051921844482, 0.5155962109565735, 0.8463819026947021, 1.1771676540374756, 1.5079532861709595, 1.8387389183044434, 2.169524669647217, 2.5003104209899902, 2.8310961723327637, 3.161881685256958, 3.4926674365997314, 3.823453187942505, 4.154238700866699, 4.485024452209473, 4.815810203552246, 5.1465959548950195, 5.477381706237793, 5.808167457580566, 6.13895320892334, 6.469738960266113, 6.8005242347717285, 7.131309986114502, 7.462095737457275, 7.792881488800049, 8.123666763305664, 8.454452514648438, 8.785238265991211, 9.116024017333984, 9.446809768676758, 9.777595520019531, 10.108381271362305]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 0.0, 4.0, 6.0, 6.0, 12.0, 12.0, 13.0, 18.0, 21.0, 28.0, 31.0, 28.0, 30.0, 44.0, 41.0, 49.0, 48.0, 54.0, 44.0, 40.0, 49.0, 50.0, 45.0, 34.0, 34.0, 40.0, 36.0, 36.0, 21.0, 29.0, 27.0, 14.0, 21.0, 9.0, 10.0, 6.0, 8.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.117946147918701, -5.9360456466674805, -5.754145622253418, -5.5722455978393555, -5.390345096588135, -5.208444595336914, -5.026544570922852, -4.844644546508789, -4.662744045257568, -4.480843544006348, -4.298943519592285, -4.117043495178223, -3.935142993927002, -3.7532427310943604, -3.5713424682617188, -3.389442205429077, -3.2075419425964355, -3.025641679763794, -2.8437414169311523, -2.6618411540985107, -2.479940891265869, -2.2980406284332275, -2.116140365600586, -1.9342401027679443, -1.7523398399353027, -1.5704395771026611, -1.3885393142700195, -1.206639051437378, -1.0247387886047363, -0.8428385257720947, -0.6609382629394531, -0.4790380001068115, -0.2971377372741699, -0.11523747444152832, 0.06666278839111328, 0.24856305122375488, 0.4304633140563965, 0.6123635768890381, 0.7942638397216797, 0.9761641025543213, 1.158064365386963, 1.3399646282196045, 1.521864891052246, 1.7037651538848877, 1.8856654167175293, 2.067565679550171, 2.2494659423828125, 2.431366205215454, 2.6132664680480957, 2.7951667308807373, 2.977066993713379, 3.1589672565460205, 3.340867519378662, 3.5227677822113037, 3.7046680450439453, 3.886568307876587, 4.0684685707092285, 4.250369071960449, 4.432269096374512, 4.614169120788574, 4.796069622039795, 4.977970123291016, 5.159870147705078, 5.341770172119141, 5.523670673370361]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 8.0, 18.0, 12.0, 22.0, 26.0, 38.0, 51.0, 78.0, 91.0, 149.0, 198.0, 282.0, 395.0, 508.0, 748.0, 1043.0, 1529.0, 2151.0, 3141.0, 4786.0, 7277.0, 11099.0, 17800.0, 29867.0, 52267.0, 99836.0, 212961.0, 488188.0, 991615.0, 1108405.0, 620312.0, 269284.0, 121712.0, 60907.0, 33565.0, 19399.0, 12015.0, 7524.0, 4923.0, 3273.0, 2114.0, 1430.0, 1035.0, 676.0, 462.0, 332.0, 227.0, 158.0, 115.0, 89.0, 55.0, 35.0, 22.0, 15.0, 9.0, 8.0, 1.0, 3.0], "bins": [-9.8046875, -9.525634765625, -9.24658203125, -8.967529296875, -8.6884765625, -8.409423828125, -8.13037109375, -7.851318359375, -7.572265625, -7.293212890625, -7.01416015625, -6.735107421875, -6.4560546875, -6.177001953125, -5.89794921875, -5.618896484375, -5.33984375, -5.060791015625, -4.78173828125, -4.502685546875, -4.2236328125, -3.944580078125, -3.66552734375, -3.386474609375, -3.107421875, -2.828369140625, -2.54931640625, -2.270263671875, -1.9912109375, -1.712158203125, -1.43310546875, -1.154052734375, -0.875, -0.595947265625, -0.31689453125, -0.037841796875, 0.2412109375, 0.520263671875, 0.79931640625, 1.078369140625, 1.357421875, 1.636474609375, 1.91552734375, 2.194580078125, 2.4736328125, 2.752685546875, 3.03173828125, 3.310791015625, 3.58984375, 3.868896484375, 4.14794921875, 4.427001953125, 4.7060546875, 4.985107421875, 5.26416015625, 5.543212890625, 5.822265625, 6.101318359375, 6.38037109375, 6.659423828125, 6.9384765625, 7.217529296875, 7.49658203125, 7.775634765625, 8.0546875]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 8.0, 8.0, 10.0, 8.0, 5.0, 15.0, 8.0, 11.0, 18.0, 26.0, 28.0, 34.0, 25.0, 33.0, 38.0, 38.0, 45.0, 36.0, 39.0, 49.0, 52.0, 36.0, 41.0, 39.0, 38.0, 33.0, 36.0, 47.0, 28.0, 28.0, 21.0, 22.0, 20.0, 23.0, 11.0, 10.0, 6.0, 11.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.3203125, -4.18255615234375, -4.0447998046875, -3.90704345703125, -3.769287109375, -3.63153076171875, -3.4937744140625, -3.35601806640625, -3.21826171875, -3.08050537109375, -2.9427490234375, -2.80499267578125, -2.667236328125, -2.52947998046875, -2.3917236328125, -2.25396728515625, -2.1162109375, -1.97845458984375, -1.8406982421875, -1.70294189453125, -1.565185546875, -1.42742919921875, -1.2896728515625, -1.15191650390625, -1.01416015625, -0.87640380859375, -0.7386474609375, -0.60089111328125, -0.463134765625, -0.32537841796875, -0.1876220703125, -0.04986572265625, 0.087890625, 0.22564697265625, 0.3634033203125, 0.50115966796875, 0.638916015625, 0.77667236328125, 0.9144287109375, 1.05218505859375, 1.18994140625, 1.32769775390625, 1.4654541015625, 1.60321044921875, 1.740966796875, 1.87872314453125, 2.0164794921875, 2.15423583984375, 2.2919921875, 2.42974853515625, 2.5675048828125, 2.70526123046875, 2.843017578125, 2.98077392578125, 3.1185302734375, 3.25628662109375, 3.39404296875, 3.53179931640625, 3.6695556640625, 3.80731201171875, 3.945068359375, 4.08282470703125, 4.2205810546875, 4.35833740234375, 4.49609375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 10.0, 15.0, 17.0, 38.0, 49.0, 70.0, 98.0, 148.0, 242.0, 393.0, 586.0, 945.0, 1556.0, 2529.0, 4464.0, 7835.0, 14393.0, 27298.0, 54841.0, 115622.0, 271931.0, 718681.0, 1444586.0, 910539.0, 340123.0, 140848.0, 65644.0, 32248.0, 16867.0, 8933.0, 5149.0, 2873.0, 1809.0, 1068.0, 649.0, 403.0, 300.0, 155.0, 128.0, 68.0, 41.0, 24.0, 21.0, 21.0, 10.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.1875, -12.7568359375, -12.326171875, -11.8955078125, -11.46484375, -11.0341796875, -10.603515625, -10.1728515625, -9.7421875, -9.3115234375, -8.880859375, -8.4501953125, -8.01953125, -7.5888671875, -7.158203125, -6.7275390625, -6.296875, -5.8662109375, -5.435546875, -5.0048828125, -4.57421875, -4.1435546875, -3.712890625, -3.2822265625, -2.8515625, -2.4208984375, -1.990234375, -1.5595703125, -1.12890625, -0.6982421875, -0.267578125, 0.1630859375, 0.59375, 1.0244140625, 1.455078125, 1.8857421875, 2.31640625, 2.7470703125, 3.177734375, 3.6083984375, 4.0390625, 4.4697265625, 4.900390625, 5.3310546875, 5.76171875, 6.1923828125, 6.623046875, 7.0537109375, 7.484375, 7.9150390625, 8.345703125, 8.7763671875, 9.20703125, 9.6376953125, 10.068359375, 10.4990234375, 10.9296875, 11.3603515625, 11.791015625, 12.2216796875, 12.65234375, 13.0830078125, 13.513671875, 13.9443359375, 14.375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 10.0, 7.0, 14.0, 16.0, 14.0, 10.0, 38.0, 36.0, 49.0, 64.0, 86.0, 122.0, 181.0, 222.0, 255.0, 277.0, 362.0, 377.0, 374.0, 332.0, 252.0, 238.0, 174.0, 156.0, 88.0, 81.0, 59.0, 60.0, 30.0, 35.0, 12.0, 14.0, 12.0, 10.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.054473876953125, -3.93707275390625, -3.819671630859375, -3.7022705078125, -3.584869384765625, -3.46746826171875, -3.350067138671875, -3.232666015625, -3.115264892578125, -2.99786376953125, -2.880462646484375, -2.7630615234375, -2.645660400390625, -2.52825927734375, -2.410858154296875, -2.29345703125, -2.176055908203125, -2.05865478515625, -1.941253662109375, -1.8238525390625, -1.706451416015625, -1.58905029296875, -1.471649169921875, -1.354248046875, -1.236846923828125, -1.11944580078125, -1.002044677734375, -0.8846435546875, -0.767242431640625, -0.64984130859375, -0.532440185546875, -0.4150390625, -0.297637939453125, -0.18023681640625, -0.062835693359375, 0.0545654296875, 0.171966552734375, 0.28936767578125, 0.406768798828125, 0.524169921875, 0.641571044921875, 0.75897216796875, 0.876373291015625, 0.9937744140625, 1.111175537109375, 1.22857666015625, 1.345977783203125, 1.46337890625, 1.580780029296875, 1.69818115234375, 1.815582275390625, 1.9329833984375, 2.050384521484375, 2.16778564453125, 2.285186767578125, 2.402587890625, 2.519989013671875, 2.63739013671875, 2.754791259765625, 2.8721923828125, 2.989593505859375, 3.10699462890625, 3.224395751953125, 3.341796875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 7.0, 10.0, 8.0, 20.0, 16.0, 26.0, 28.0, 48.0, 44.0, 68.0, 76.0, 76.0, 95.0, 97.0, 84.0, 55.0, 51.0, 46.0, 31.0, 28.0, 28.0, 15.0, 9.0, 6.0, 7.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.99500846862793, -13.552582740783691, -13.110156059265137, -12.667730331420898, -12.225303649902344, -11.782877922058105, -11.340452194213867, -10.898025512695312, -10.455599784851074, -10.013174057006836, -9.570747375488281, -9.128321647644043, -8.685894966125488, -8.24346923828125, -7.8010430335998535, -7.358616828918457, -6.9161906242370605, -6.473764419555664, -6.031338214874268, -5.588912010192871, -5.146486282348633, -4.704060077667236, -4.26163387298584, -3.8192079067230225, -3.376781702041626, -2.9343554973602295, -2.491929531097412, -2.0495033264160156, -1.6070772409439087, -1.1646511554718018, -0.7222249507904053, -0.2797989845275879, 0.1626272201538086, 0.6050533056259155, 1.0474793910980225, 1.489905595779419, 1.9323316812515259, 2.374757766723633, 2.8171839714050293, 3.2596099376678467, 3.702036142349243, 4.1444621086120605, 4.586888313293457, 5.0293145179748535, 5.47174072265625, 5.914166450500488, 6.356593132019043, 6.799018859863281, 7.241445064544678, 7.683871269226074, 8.126296997070312, 8.568723678588867, 9.011149406433105, 9.453575134277344, 9.896001815795898, 10.338427543640137, 10.780854225158691, 11.22327995300293, 11.665706634521484, 12.108132362365723, 12.550559043884277, 12.992984771728516, 13.43541145324707, 13.877837181091309, 14.320262908935547]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 5.0, 2.0, 6.0, 3.0, 4.0, 15.0, 12.0, 15.0, 19.0, 17.0, 19.0, 27.0, 34.0, 40.0, 35.0, 34.0, 42.0, 39.0, 57.0, 44.0, 46.0, 47.0, 37.0, 42.0, 39.0, 45.0, 32.0, 35.0, 37.0, 25.0, 22.0, 27.0, 20.0, 16.0, 15.0, 9.0, 6.0, 11.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.9950385093688965, -5.804609298706055, -5.614180088043213, -5.423750877380371, -5.233321666717529, -5.0428924560546875, -4.852463722229004, -4.662034034729004, -4.47160530090332, -4.2811760902404785, -4.090746879577637, -3.900317668914795, -3.709888458251953, -3.5194592475891113, -3.3290302753448486, -3.138601064682007, -2.948171615600586, -2.757742404937744, -2.5673131942749023, -2.3768839836120605, -2.1864547729492188, -1.9960256814956665, -1.8055965900421143, -1.6151673793792725, -1.4247381687164307, -1.2343089580535889, -1.043879747390747, -0.8534506559371948, -0.663021445274353, -0.47259223461151123, -0.282163143157959, -0.09173393249511719, 0.0986948013305664, 0.2891239821910858, 0.4795531630516052, 0.6699823141098022, 0.860411524772644, 1.0508407354354858, 1.241269826889038, 1.4316990375518799, 1.6221282482147217, 1.8125574588775635, 2.0029866695404053, 2.193415641784668, 2.3838448524475098, 2.5742740631103516, 2.7647032737731934, 2.955132484436035, 3.145561695098877, 3.3359909057617188, 3.5264201164245605, 3.7168493270874023, 3.907278537750244, 4.097707748413086, 4.2881364822387695, 4.4785661697387695, 4.668994903564453, 4.859424114227295, 5.049853324890137, 5.2402825355529785, 5.43071174621582, 5.621140956878662, 5.811570167541504, 6.0019989013671875, 6.1924285888671875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 6.0, 15.0, 25.0, 39.0, 55.0, 72.0, 100.0, 159.0, 248.0, 404.0, 642.0, 987.0, 1517.0, 2394.0, 3928.0, 6487.0, 10779.0, 18343.0, 30869.0, 53496.0, 89019.0, 136943.0, 176511.0, 174710.0, 132587.0, 84493.0, 50418.0, 29610.0, 17097.0, 10187.0, 6157.0, 3751.0, 2372.0, 1495.0, 916.0, 570.0, 387.0, 250.0, 168.0, 109.0, 74.0, 50.0, 36.0, 27.0, 20.0, 7.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0], "bins": [-4.3984375, -4.26495361328125, -4.1314697265625, -3.99798583984375, -3.864501953125, -3.73101806640625, -3.5975341796875, -3.46405029296875, -3.33056640625, -3.19708251953125, -3.0635986328125, -2.93011474609375, -2.796630859375, -2.66314697265625, -2.5296630859375, -2.39617919921875, -2.2626953125, -2.12921142578125, -1.9957275390625, -1.86224365234375, -1.728759765625, -1.59527587890625, -1.4617919921875, -1.32830810546875, -1.19482421875, -1.06134033203125, -0.9278564453125, -0.79437255859375, -0.660888671875, -0.52740478515625, -0.3939208984375, -0.26043701171875, -0.126953125, 0.00653076171875, 0.1400146484375, 0.27349853515625, 0.406982421875, 0.54046630859375, 0.6739501953125, 0.80743408203125, 0.94091796875, 1.07440185546875, 1.2078857421875, 1.34136962890625, 1.474853515625, 1.60833740234375, 1.7418212890625, 1.87530517578125, 2.0087890625, 2.14227294921875, 2.2757568359375, 2.40924072265625, 2.542724609375, 2.67620849609375, 2.8096923828125, 2.94317626953125, 3.07666015625, 3.21014404296875, 3.3436279296875, 3.47711181640625, 3.610595703125, 3.74407958984375, 3.8775634765625, 4.01104736328125, 4.14453125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 11.0, 5.0, 8.0, 5.0, 13.0, 10.0, 22.0, 16.0, 13.0, 21.0, 23.0, 28.0, 26.0, 46.0, 37.0, 23.0, 33.0, 50.0, 41.0, 33.0, 51.0, 34.0, 41.0, 42.0, 50.0, 42.0, 40.0, 24.0, 30.0, 29.0, 24.0, 25.0, 20.0, 22.0, 14.0, 8.0, 11.0, 6.0, 8.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.2265625, -6.02252197265625, -5.8184814453125, -5.61444091796875, -5.410400390625, -5.20635986328125, -5.0023193359375, -4.79827880859375, -4.59423828125, -4.39019775390625, -4.1861572265625, -3.98211669921875, -3.778076171875, -3.57403564453125, -3.3699951171875, -3.16595458984375, -2.9619140625, -2.75787353515625, -2.5538330078125, -2.34979248046875, -2.145751953125, -1.94171142578125, -1.7376708984375, -1.53363037109375, -1.32958984375, -1.12554931640625, -0.9215087890625, -0.71746826171875, -0.513427734375, -0.30938720703125, -0.1053466796875, 0.09869384765625, 0.302734375, 0.50677490234375, 0.7108154296875, 0.91485595703125, 1.118896484375, 1.32293701171875, 1.5269775390625, 1.73101806640625, 1.93505859375, 2.13909912109375, 2.3431396484375, 2.54718017578125, 2.751220703125, 2.95526123046875, 3.1593017578125, 3.36334228515625, 3.5673828125, 3.77142333984375, 3.9754638671875, 4.17950439453125, 4.383544921875, 4.58758544921875, 4.7916259765625, 4.99566650390625, 5.19970703125, 5.40374755859375, 5.6077880859375, 5.81182861328125, 6.015869140625, 6.21990966796875, 6.4239501953125, 6.62799072265625, 6.83203125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 13.0, 15.0, 28.0, 31.0, 33.0, 74.0, 101.0, 152.0, 228.0, 360.0, 591.0, 946.0, 1602.0, 2944.0, 5375.0, 10122.0, 20147.0, 43467.0, 99095.0, 221042.0, 311107.0, 179972.0, 79674.0, 35710.0, 16741.0, 8448.0, 4314.0, 2512.0, 1415.0, 859.0, 525.0, 293.0, 202.0, 125.0, 92.0, 57.0, 42.0, 32.0, 22.0, 14.0, 15.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.835693359375, -7.57763671875, -7.319580078125, -7.0615234375, -6.803466796875, -6.54541015625, -6.287353515625, -6.029296875, -5.771240234375, -5.51318359375, -5.255126953125, -4.9970703125, -4.739013671875, -4.48095703125, -4.222900390625, -3.96484375, -3.706787109375, -3.44873046875, -3.190673828125, -2.9326171875, -2.674560546875, -2.41650390625, -2.158447265625, -1.900390625, -1.642333984375, -1.38427734375, -1.126220703125, -0.8681640625, -0.610107421875, -0.35205078125, -0.093994140625, 0.1640625, 0.422119140625, 0.68017578125, 0.938232421875, 1.1962890625, 1.454345703125, 1.71240234375, 1.970458984375, 2.228515625, 2.486572265625, 2.74462890625, 3.002685546875, 3.2607421875, 3.518798828125, 3.77685546875, 4.034912109375, 4.29296875, 4.551025390625, 4.80908203125, 5.067138671875, 5.3251953125, 5.583251953125, 5.84130859375, 6.099365234375, 6.357421875, 6.615478515625, 6.87353515625, 7.131591796875, 7.3896484375, 7.647705078125, 7.90576171875, 8.163818359375, 8.421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 4.0, 6.0, 9.0, 8.0, 6.0, 6.0, 16.0, 17.0, 14.0, 19.0, 23.0, 28.0, 27.0, 27.0, 49.0, 37.0, 38.0, 35.0, 47.0, 39.0, 42.0, 36.0, 47.0, 39.0, 51.0, 36.0, 39.0, 40.0, 26.0, 28.0, 31.0, 32.0, 19.0, 12.0, 7.0, 15.0, 8.0, 6.0, 9.0, 3.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.625, -3.50299072265625, -3.3809814453125, -3.25897216796875, -3.136962890625, -3.01495361328125, -2.8929443359375, -2.77093505859375, -2.64892578125, -2.52691650390625, -2.4049072265625, -2.28289794921875, -2.160888671875, -2.03887939453125, -1.9168701171875, -1.79486083984375, -1.6728515625, -1.55084228515625, -1.4288330078125, -1.30682373046875, -1.184814453125, -1.06280517578125, -0.9407958984375, -0.81878662109375, -0.69677734375, -0.57476806640625, -0.4527587890625, -0.33074951171875, -0.208740234375, -0.08673095703125, 0.0352783203125, 0.15728759765625, 0.279296875, 0.40130615234375, 0.5233154296875, 0.64532470703125, 0.767333984375, 0.88934326171875, 1.0113525390625, 1.13336181640625, 1.25537109375, 1.37738037109375, 1.4993896484375, 1.62139892578125, 1.743408203125, 1.86541748046875, 1.9874267578125, 2.10943603515625, 2.2314453125, 2.35345458984375, 2.4754638671875, 2.59747314453125, 2.719482421875, 2.84149169921875, 2.9635009765625, 3.08551025390625, 3.20751953125, 3.32952880859375, 3.4515380859375, 3.57354736328125, 3.695556640625, 3.81756591796875, 3.9395751953125, 4.06158447265625, 4.18359375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 6.0, 14.0, 9.0, 20.0, 23.0, 47.0, 79.0, 92.0, 132.0, 231.0, 382.0, 639.0, 1214.0, 2165.0, 4554.0, 10361.0, 26007.0, 75152.0, 237460.0, 422367.0, 174519.0, 56131.0, 20590.0, 8229.0, 3792.0, 1891.0, 976.0, 583.0, 321.0, 208.0, 111.0, 65.0, 55.0, 40.0, 27.0, 19.0, 13.0, 8.0, 4.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.171875, -5.981201171875, -5.79052734375, -5.599853515625, -5.4091796875, -5.218505859375, -5.02783203125, -4.837158203125, -4.646484375, -4.455810546875, -4.26513671875, -4.074462890625, -3.8837890625, -3.693115234375, -3.50244140625, -3.311767578125, -3.12109375, -2.930419921875, -2.73974609375, -2.549072265625, -2.3583984375, -2.167724609375, -1.97705078125, -1.786376953125, -1.595703125, -1.405029296875, -1.21435546875, -1.023681640625, -0.8330078125, -0.642333984375, -0.45166015625, -0.260986328125, -0.0703125, 0.120361328125, 0.31103515625, 0.501708984375, 0.6923828125, 0.883056640625, 1.07373046875, 1.264404296875, 1.455078125, 1.645751953125, 1.83642578125, 2.027099609375, 2.2177734375, 2.408447265625, 2.59912109375, 2.789794921875, 2.98046875, 3.171142578125, 3.36181640625, 3.552490234375, 3.7431640625, 3.933837890625, 4.12451171875, 4.315185546875, 4.505859375, 4.696533203125, 4.88720703125, 5.077880859375, 5.2685546875, 5.459228515625, 5.64990234375, 5.840576171875, 6.03125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 13.0, 10.0, 15.0, 20.0, 30.0, 40.0, 33.0, 70.0, 48.0, 68.0, 105.0, 91.0, 82.0, 69.0, 59.0, 55.0, 39.0, 22.0, 22.0, 19.0, 18.0, 12.0, 14.0, 5.0, 7.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001690387725830078, -0.00016395747661590576, -0.0001588761806488037, -0.00015379488468170166, -0.0001487135887145996, -0.00014363229274749756, -0.0001385509967803955, -0.00013346970081329346, -0.0001283884048461914, -0.00012330710887908936, -0.0001182258129119873, -0.00011314451694488525, -0.0001080632209777832, -0.00010298192501068115, -9.79006290435791e-05, -9.281933307647705e-05, -8.7738037109375e-05, -8.265674114227295e-05, -7.75754451751709e-05, -7.249414920806885e-05, -6.74128532409668e-05, -6.233155727386475e-05, -5.7250261306762695e-05, -5.2168965339660645e-05, -4.7087669372558594e-05, -4.200637340545654e-05, -3.692507743835449e-05, -3.184378147125244e-05, -2.676248550415039e-05, -2.168118953704834e-05, -1.659989356994629e-05, -1.1518597602844238e-05, -6.4373016357421875e-06, -1.3560056686401367e-06, 3.725290298461914e-06, 8.806586265563965e-06, 1.3887882232666016e-05, 1.8969178199768066e-05, 2.4050474166870117e-05, 2.9131770133972168e-05, 3.421306610107422e-05, 3.929436206817627e-05, 4.437565803527832e-05, 4.945695400238037e-05, 5.453824996948242e-05, 5.961954593658447e-05, 6.470084190368652e-05, 6.978213787078857e-05, 7.486343383789062e-05, 7.994472980499268e-05, 8.502602577209473e-05, 9.010732173919678e-05, 9.518861770629883e-05, 0.00010026991367340088, 0.00010535120964050293, 0.00011043250560760498, 0.00011551380157470703, 0.00012059509754180908, 0.00012567639350891113, 0.00013075768947601318, 0.00013583898544311523, 0.00014092028141021729, 0.00014600157737731934, 0.0001510828733444214, 0.00015616416931152344]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 10.0, 17.0, 27.0, 37.0, 55.0, 81.0, 136.0, 207.0, 316.0, 465.0, 739.0, 1212.0, 2066.0, 3468.0, 5875.0, 10673.0, 19693.0, 38785.0, 77278.0, 152815.0, 240747.0, 224640.0, 131127.0, 65641.0, 32850.0, 17273.0, 9342.0, 5212.0, 3012.0, 1827.0, 1085.0, 624.0, 423.0, 279.0, 174.0, 113.0, 72.0, 45.0, 26.0, 31.0, 20.0, 15.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59765625, -3.4686279296875, -3.339599609375, -3.2105712890625, -3.08154296875, -2.9525146484375, -2.823486328125, -2.6944580078125, -2.5654296875, -2.4364013671875, -2.307373046875, -2.1783447265625, -2.04931640625, -1.9202880859375, -1.791259765625, -1.6622314453125, -1.533203125, -1.4041748046875, -1.275146484375, -1.1461181640625, -1.01708984375, -0.8880615234375, -0.759033203125, -0.6300048828125, -0.5009765625, -0.3719482421875, -0.242919921875, -0.1138916015625, 0.01513671875, 0.1441650390625, 0.273193359375, 0.4022216796875, 0.53125, 0.6602783203125, 0.789306640625, 0.9183349609375, 1.04736328125, 1.1763916015625, 1.305419921875, 1.4344482421875, 1.5634765625, 1.6925048828125, 1.821533203125, 1.9505615234375, 2.07958984375, 2.2086181640625, 2.337646484375, 2.4666748046875, 2.595703125, 2.7247314453125, 2.853759765625, 2.9827880859375, 3.11181640625, 3.2408447265625, 3.369873046875, 3.4989013671875, 3.6279296875, 3.7569580078125, 3.885986328125, 4.0150146484375, 4.14404296875, 4.2730712890625, 4.402099609375, 4.5311279296875, 4.66015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 5.0, 6.0, 6.0, 9.0, 12.0, 13.0, 19.0, 20.0, 30.0, 28.0, 36.0, 42.0, 41.0, 35.0, 42.0, 60.0, 54.0, 69.0, 56.0, 62.0, 46.0, 55.0, 42.0, 36.0, 27.0, 27.0, 26.0, 17.0, 16.0, 6.0, 14.0, 13.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7822265625, -0.7569961547851562, -0.7317657470703125, -0.7065353393554688, -0.681304931640625, -0.6560745239257812, -0.6308441162109375, -0.6056137084960938, -0.58038330078125, -0.5551528930664062, -0.5299224853515625, -0.5046920776367188, -0.479461669921875, -0.45423126220703125, -0.4290008544921875, -0.40377044677734375, -0.3785400390625, -0.35330963134765625, -0.3280792236328125, -0.30284881591796875, -0.277618408203125, -0.25238800048828125, -0.2271575927734375, -0.20192718505859375, -0.17669677734375, -0.15146636962890625, -0.1262359619140625, -0.10100555419921875, -0.075775146484375, -0.05054473876953125, -0.0253143310546875, -8.392333984375e-05, 0.025146484375, 0.05037689208984375, 0.0756072998046875, 0.10083770751953125, 0.126068115234375, 0.15129852294921875, 0.1765289306640625, 0.20175933837890625, 0.22698974609375, 0.25222015380859375, 0.2774505615234375, 0.30268096923828125, 0.327911376953125, 0.35314178466796875, 0.3783721923828125, 0.40360260009765625, 0.4288330078125, 0.45406341552734375, 0.4792938232421875, 0.5045242309570312, 0.529754638671875, 0.5549850463867188, 0.5802154541015625, 0.6054458618164062, 0.63067626953125, 0.6559066772460938, 0.6811370849609375, 0.7063674926757812, 0.731597900390625, 0.7568283081054688, 0.7820587158203125, 0.8072891235351562, 0.83251953125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 9.0, 16.0, 19.0, 14.0, 26.0, 33.0, 47.0, 63.0, 68.0, 77.0, 93.0, 104.0, 75.0, 66.0, 67.0, 44.0, 39.0, 27.0, 28.0, 17.0, 19.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.733867645263672, -13.294132232666016, -12.854395866394043, -12.414660453796387, -11.974924087524414, -11.535188674926758, -11.095453262329102, -10.655716896057129, -10.215980529785156, -9.7762451171875, -9.336508750915527, -8.896773338317871, -8.457036972045898, -8.017301559448242, -7.577565670013428, -7.137829780578613, -6.698094367980957, -6.258358478546143, -5.818622589111328, -5.378887176513672, -4.939150810241699, -4.499415397644043, -4.0596795082092285, -3.619943618774414, -3.1802077293395996, -2.740471839904785, -2.3007359504699707, -1.8610002994537354, -1.421264410018921, -0.9815285205841064, -0.5417928695678711, -0.10205698013305664, 0.3376779556274414, 0.7774137854576111, 1.2171496152877808, 1.6568853855133057, 2.09662127494812, 2.5363571643829346, 2.97609281539917, 3.4158287048339844, 3.855564594268799, 4.295300483703613, 4.735036373138428, 5.174772262573242, 5.614507675170898, 6.054244041442871, 6.493979454040527, 6.933715343475342, 7.373451232910156, 7.813187122344971, 8.252923011779785, 8.692658424377441, 9.132394790649414, 9.57213020324707, 10.011865615844727, 10.4516019821167, 10.891338348388672, 11.331073760986328, 11.7708101272583, 12.210545539855957, 12.65028190612793, 13.090017318725586, 13.529752731323242, 13.969489097595215, 14.409224510192871]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 4.0, 1.0, 5.0, 6.0, 10.0, 16.0, 16.0, 17.0, 19.0, 19.0, 33.0, 31.0, 41.0, 30.0, 32.0, 34.0, 50.0, 46.0, 55.0, 37.0, 41.0, 54.0, 33.0, 43.0, 41.0, 36.0, 26.0, 36.0, 36.0, 22.0, 22.0, 24.0, 13.0, 12.0, 14.0, 9.0, 8.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.688053131103516, -5.50318717956543, -5.318321228027344, -5.133455276489258, -4.948589324951172, -4.763723373413086, -4.578857421875, -4.393991470336914, -4.209125518798828, -4.024259567260742, -3.8393936157226562, -3.6545276641845703, -3.4696617126464844, -3.2847957611083984, -3.0999298095703125, -2.9150638580322266, -2.7301979064941406, -2.5453319549560547, -2.3604660034179688, -2.175600051879883, -1.9907341003417969, -1.805868148803711, -1.621002197265625, -1.436136245727539, -1.2512702941894531, -1.0664043426513672, -0.8815383911132812, -0.6966724395751953, -0.5118064880371094, -0.32694053649902344, -0.1420745849609375, 0.04279136657714844, 0.22765779495239258, 0.4125237464904785, 0.5973896980285645, 0.7822556495666504, 0.9671216011047363, 1.1519875526428223, 1.3368535041809082, 1.5217194557189941, 1.70658540725708, 1.891451358795166, 2.076317310333252, 2.261183261871338, 2.446049213409424, 2.6309151649475098, 2.8157811164855957, 3.0006470680236816, 3.1855130195617676, 3.3703789710998535, 3.5552449226379395, 3.7401108741760254, 3.9249768257141113, 4.109842777252197, 4.294708728790283, 4.479574680328369, 4.664440631866455, 4.849306583404541, 5.034172534942627, 5.219038486480713, 5.403904438018799, 5.588770389556885, 5.773636341094971, 5.958502292633057, 6.143368244171143]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 12.0, 11.0, 12.0, 33.0, 47.0, 74.0, 102.0, 159.0, 220.0, 329.0, 473.0, 729.0, 1051.0, 1591.0, 2198.0, 3513.0, 5275.0, 7945.0, 12098.0, 18441.0, 27389.0, 40776.0, 59595.0, 83175.0, 109153.0, 128030.0, 131419.0, 116185.0, 91674.0, 66913.0, 46354.0, 31443.0, 20802.0, 13801.0, 9211.0, 5999.0, 4044.0, 2779.0, 1793.0, 1210.0, 775.0, 539.0, 379.0, 273.0, 186.0, 104.0, 85.0, 46.0, 43.0, 26.0, 17.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0], "bins": [-4.00390625, -3.879425048828125, -3.75494384765625, -3.630462646484375, -3.5059814453125, -3.381500244140625, -3.25701904296875, -3.132537841796875, -3.008056640625, -2.883575439453125, -2.75909423828125, -2.634613037109375, -2.5101318359375, -2.385650634765625, -2.26116943359375, -2.136688232421875, -2.01220703125, -1.887725830078125, -1.76324462890625, -1.638763427734375, -1.5142822265625, -1.389801025390625, -1.26531982421875, -1.140838623046875, -1.016357421875, -0.891876220703125, -0.76739501953125, -0.642913818359375, -0.5184326171875, -0.393951416015625, -0.26947021484375, -0.144989013671875, -0.0205078125, 0.103973388671875, 0.22845458984375, 0.352935791015625, 0.4774169921875, 0.601898193359375, 0.72637939453125, 0.850860595703125, 0.975341796875, 1.099822998046875, 1.22430419921875, 1.348785400390625, 1.4732666015625, 1.597747802734375, 1.72222900390625, 1.846710205078125, 1.97119140625, 2.095672607421875, 2.22015380859375, 2.344635009765625, 2.4691162109375, 2.593597412109375, 2.71807861328125, 2.842559814453125, 2.967041015625, 3.091522216796875, 3.21600341796875, 3.340484619140625, 3.4649658203125, 3.589447021484375, 3.71392822265625, 3.838409423828125, 3.962890625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 7.0, 1.0, 1.0, 6.0, 9.0, 13.0, 12.0, 18.0, 22.0, 15.0, 21.0, 24.0, 26.0, 21.0, 31.0, 36.0, 26.0, 44.0, 36.0, 41.0, 49.0, 39.0, 40.0, 32.0, 41.0, 26.0, 38.0, 41.0, 39.0, 22.0, 31.0, 22.0, 25.0, 22.0, 23.0, 25.0, 9.0, 14.0, 7.0, 16.0, 5.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.74609375, -5.560546875, -5.375, -5.189453125, -5.00390625, -4.818359375, -4.6328125, -4.447265625, -4.26171875, -4.076171875, -3.890625, -3.705078125, -3.51953125, -3.333984375, -3.1484375, -2.962890625, -2.77734375, -2.591796875, -2.40625, -2.220703125, -2.03515625, -1.849609375, -1.6640625, -1.478515625, -1.29296875, -1.107421875, -0.921875, -0.736328125, -0.55078125, -0.365234375, -0.1796875, 0.005859375, 0.19140625, 0.376953125, 0.5625, 0.748046875, 0.93359375, 1.119140625, 1.3046875, 1.490234375, 1.67578125, 1.861328125, 2.046875, 2.232421875, 2.41796875, 2.603515625, 2.7890625, 2.974609375, 3.16015625, 3.345703125, 3.53125, 3.716796875, 3.90234375, 4.087890625, 4.2734375, 4.458984375, 4.64453125, 4.830078125, 5.015625, 5.201171875, 5.38671875, 5.572265625, 5.7578125, 5.943359375, 6.12890625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 11.0, 9.0, 17.0, 36.0, 45.0, 48.0, 89.0, 158.0, 247.0, 394.0, 654.0, 995.0, 1656.0, 2763.0, 4984.0, 8253.0, 14433.0, 25269.0, 44635.0, 75405.0, 119711.0, 164255.0, 179151.0, 150880.0, 104150.0, 63365.0, 36861.0, 21022.0, 12074.0, 6872.0, 4045.0, 2378.0, 1425.0, 887.0, 503.0, 349.0, 175.0, 129.0, 85.0, 43.0, 24.0, 26.0, 14.0, 7.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3671875, -5.1842041015625, -5.001220703125, -4.8182373046875, -4.63525390625, -4.4522705078125, -4.269287109375, -4.0863037109375, -3.9033203125, -3.7203369140625, -3.537353515625, -3.3543701171875, -3.17138671875, -2.9884033203125, -2.805419921875, -2.6224365234375, -2.439453125, -2.2564697265625, -2.073486328125, -1.8905029296875, -1.70751953125, -1.5245361328125, -1.341552734375, -1.1585693359375, -0.9755859375, -0.7926025390625, -0.609619140625, -0.4266357421875, -0.24365234375, -0.0606689453125, 0.122314453125, 0.3052978515625, 0.48828125, 0.6712646484375, 0.854248046875, 1.0372314453125, 1.22021484375, 1.4031982421875, 1.586181640625, 1.7691650390625, 1.9521484375, 2.1351318359375, 2.318115234375, 2.5010986328125, 2.68408203125, 2.8670654296875, 3.050048828125, 3.2330322265625, 3.416015625, 3.5989990234375, 3.781982421875, 3.9649658203125, 4.14794921875, 4.3309326171875, 4.513916015625, 4.6968994140625, 4.8798828125, 5.0628662109375, 5.245849609375, 5.4288330078125, 5.61181640625, 5.7947998046875, 5.977783203125, 6.1607666015625, 6.34375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 7.0, 11.0, 14.0, 21.0, 18.0, 22.0, 21.0, 32.0, 23.0, 40.0, 40.0, 41.0, 49.0, 50.0, 39.0, 41.0, 39.0, 48.0, 57.0, 47.0, 44.0, 42.0, 37.0, 32.0, 22.0, 25.0, 25.0, 15.0, 16.0, 14.0, 11.0, 13.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-4.828125, -4.7001953125, -4.572265625, -4.4443359375, -4.31640625, -4.1884765625, -4.060546875, -3.9326171875, -3.8046875, -3.6767578125, -3.548828125, -3.4208984375, -3.29296875, -3.1650390625, -3.037109375, -2.9091796875, -2.78125, -2.6533203125, -2.525390625, -2.3974609375, -2.26953125, -2.1416015625, -2.013671875, -1.8857421875, -1.7578125, -1.6298828125, -1.501953125, -1.3740234375, -1.24609375, -1.1181640625, -0.990234375, -0.8623046875, -0.734375, -0.6064453125, -0.478515625, -0.3505859375, -0.22265625, -0.0947265625, 0.033203125, 0.1611328125, 0.2890625, 0.4169921875, 0.544921875, 0.6728515625, 0.80078125, 0.9287109375, 1.056640625, 1.1845703125, 1.3125, 1.4404296875, 1.568359375, 1.6962890625, 1.82421875, 1.9521484375, 2.080078125, 2.2080078125, 2.3359375, 2.4638671875, 2.591796875, 2.7197265625, 2.84765625, 2.9755859375, 3.103515625, 3.2314453125, 3.359375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 12.0, 10.0, 17.0, 23.0, 24.0, 37.0, 48.0, 80.0, 127.0, 170.0, 220.0, 393.0, 555.0, 815.0, 1400.0, 2303.0, 4264.0, 8591.0, 19492.0, 51076.0, 156812.0, 380633.0, 272211.0, 90463.0, 31770.0, 12918.0, 6025.0, 3034.0, 1868.0, 1088.0, 660.0, 443.0, 283.0, 183.0, 139.0, 86.0, 88.0, 58.0, 35.0, 24.0, 26.0, 10.0, 5.0, 5.0, 10.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.6015625, -8.3389892578125, -8.076416015625, -7.8138427734375, -7.55126953125, -7.2886962890625, -7.026123046875, -6.7635498046875, -6.5009765625, -6.2384033203125, -5.975830078125, -5.7132568359375, -5.45068359375, -5.1881103515625, -4.925537109375, -4.6629638671875, -4.400390625, -4.1378173828125, -3.875244140625, -3.6126708984375, -3.35009765625, -3.0875244140625, -2.824951171875, -2.5623779296875, -2.2998046875, -2.0372314453125, -1.774658203125, -1.5120849609375, -1.24951171875, -0.9869384765625, -0.724365234375, -0.4617919921875, -0.19921875, 0.0633544921875, 0.325927734375, 0.5885009765625, 0.85107421875, 1.1136474609375, 1.376220703125, 1.6387939453125, 1.9013671875, 2.1639404296875, 2.426513671875, 2.6890869140625, 2.95166015625, 3.2142333984375, 3.476806640625, 3.7393798828125, 4.001953125, 4.2645263671875, 4.527099609375, 4.7896728515625, 5.05224609375, 5.3148193359375, 5.577392578125, 5.8399658203125, 6.1025390625, 6.3651123046875, 6.627685546875, 6.8902587890625, 7.15283203125, 7.4154052734375, 7.677978515625, 7.9405517578125, 8.203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 0.0, 2.0, 9.0, 10.0, 9.0, 13.0, 21.0, 28.0, 39.0, 66.0, 70.0, 101.0, 130.0, 107.0, 108.0, 79.0, 54.0, 46.0, 23.0, 22.0, 14.0, 8.0, 14.0, 5.0, 1.0, 6.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000812530517578125, -0.0007899180054664612, -0.0007673054933547974, -0.0007446929812431335, -0.0007220804691314697, -0.0006994679570198059, -0.0006768554449081421, -0.0006542429327964783, -0.0006316304206848145, -0.0006090179085731506, -0.0005864053964614868, -0.000563792884349823, -0.0005411803722381592, -0.0005185678601264954, -0.0004959553480148315, -0.0004733428359031677, -0.0004507303237915039, -0.0004281178116798401, -0.00040550529956817627, -0.00038289278745651245, -0.00036028027534484863, -0.0003376677632331848, -0.000315055251121521, -0.0002924427390098572, -0.00026983022689819336, -0.00024721771478652954, -0.00022460520267486572, -0.0002019926905632019, -0.00017938017845153809, -0.00015676766633987427, -0.00013415515422821045, -0.00011154264211654663, -8.893013000488281e-05, -6.6317617893219e-05, -4.3705105781555176e-05, -2.1092593669891357e-05, 1.519918441772461e-06, 2.413243055343628e-05, 4.67449426651001e-05, 6.935745477676392e-05, 9.196996688842773e-05, 0.00011458247900009155, 0.00013719499111175537, 0.0001598075032234192, 0.000182420015335083, 0.00020503252744674683, 0.00022764503955841064, 0.00025025755167007446, 0.0002728700637817383, 0.0002954825758934021, 0.0003180950880050659, 0.00034070760011672974, 0.00036332011222839355, 0.0003859326243400574, 0.0004085451364517212, 0.000431157648563385, 0.00045377016067504883, 0.00047638267278671265, 0.0004989951848983765, 0.0005216076970100403, 0.0005442202091217041, 0.0005668327212333679, 0.0005894452333450317, 0.0006120577454566956, 0.0006346702575683594]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 17.0, 15.0, 26.0, 28.0, 57.0, 66.0, 79.0, 118.0, 200.0, 280.0, 420.0, 591.0, 1057.0, 1858.0, 3423.0, 6717.0, 15138.0, 38718.0, 117998.0, 344243.0, 336731.0, 114192.0, 37242.0, 14724.0, 6555.0, 3283.0, 1767.0, 1039.0, 640.0, 393.0, 275.0, 184.0, 154.0, 94.0, 55.0, 53.0, 34.0, 22.0, 12.0, 14.0, 15.0, 10.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.201416015625, -7.91845703125, -7.635498046875, -7.3525390625, -7.069580078125, -6.78662109375, -6.503662109375, -6.220703125, -5.937744140625, -5.65478515625, -5.371826171875, -5.0888671875, -4.805908203125, -4.52294921875, -4.239990234375, -3.95703125, -3.674072265625, -3.39111328125, -3.108154296875, -2.8251953125, -2.542236328125, -2.25927734375, -1.976318359375, -1.693359375, -1.410400390625, -1.12744140625, -0.844482421875, -0.5615234375, -0.278564453125, 0.00439453125, 0.287353515625, 0.5703125, 0.853271484375, 1.13623046875, 1.419189453125, 1.7021484375, 1.985107421875, 2.26806640625, 2.551025390625, 2.833984375, 3.116943359375, 3.39990234375, 3.682861328125, 3.9658203125, 4.248779296875, 4.53173828125, 4.814697265625, 5.09765625, 5.380615234375, 5.66357421875, 5.946533203125, 6.2294921875, 6.512451171875, 6.79541015625, 7.078369140625, 7.361328125, 7.644287109375, 7.92724609375, 8.210205078125, 8.4931640625, 8.776123046875, 9.05908203125, 9.342041015625, 9.625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 3.0, 16.0, 9.0, 13.0, 28.0, 42.0, 71.0, 83.0, 83.0, 109.0, 81.0, 106.0, 80.0, 67.0, 50.0, 32.0, 32.0, 24.0, 16.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.0424957275390625, -1.979522705078125, -1.9165496826171875, -1.85357666015625, -1.7906036376953125, -1.727630615234375, -1.6646575927734375, -1.6016845703125, -1.5387115478515625, -1.475738525390625, -1.4127655029296875, -1.34979248046875, -1.2868194580078125, -1.223846435546875, -1.1608734130859375, -1.097900390625, -1.0349273681640625, -0.971954345703125, -0.9089813232421875, -0.84600830078125, -0.7830352783203125, -0.720062255859375, -0.6570892333984375, -0.5941162109375, -0.5311431884765625, -0.468170166015625, -0.4051971435546875, -0.34222412109375, -0.2792510986328125, -0.216278076171875, -0.1533050537109375, -0.09033203125, -0.0273590087890625, 0.035614013671875, 0.0985870361328125, 0.16156005859375, 0.2245330810546875, 0.287506103515625, 0.3504791259765625, 0.4134521484375, 0.4764251708984375, 0.539398193359375, 0.6023712158203125, 0.66534423828125, 0.7283172607421875, 0.791290283203125, 0.8542633056640625, 0.917236328125, 0.9802093505859375, 1.043182373046875, 1.1061553955078125, 1.16912841796875, 1.2321014404296875, 1.295074462890625, 1.3580474853515625, 1.4210205078125, 1.4839935302734375, 1.546966552734375, 1.6099395751953125, 1.67291259765625, 1.7358856201171875, 1.798858642578125, 1.8618316650390625, 1.9248046875]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 6.0, 14.0, 18.0, 21.0, 25.0, 35.0, 37.0, 41.0, 66.0, 75.0, 88.0, 67.0, 78.0, 83.0, 59.0, 48.0, 51.0, 40.0, 33.0, 21.0, 22.0, 16.0, 8.0, 7.0, 6.0, 12.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.37030029296875, -12.950541496276855, -12.530782699584961, -12.11102294921875, -11.691264152526855, -11.271505355834961, -10.85174560546875, -10.431986808776855, -10.012228012084961, -9.592469215393066, -9.172710418701172, -8.752950668334961, -8.333191871643066, -7.913433074951172, -7.493673801422119, -7.073914527893066, -6.654155731201172, -6.234396934509277, -5.814637660980225, -5.394878387451172, -4.975119590759277, -4.555360794067383, -4.13560152053833, -3.7158424854278564, -3.296083450317383, -2.876324415206909, -2.4565653800964355, -2.036806344985962, -1.6170473098754883, -1.1972882747650146, -0.777529239654541, -0.3577702045440674, 0.061987876892089844, 0.4817469120025635, 0.9015059471130371, 1.3212649822235107, 1.7410240173339844, 2.160783052444458, 2.5805420875549316, 3.0003011226654053, 3.420060157775879, 3.8398191928863525, 4.259578227996826, 4.679337501525879, 5.099096298217773, 5.518855094909668, 5.938614368438721, 6.358373641967773, 6.778132438659668, 7.1978912353515625, 7.617650508880615, 8.037409782409668, 8.457168579101562, 8.876927375793457, 9.296686172485352, 9.716445922851562, 10.136204719543457, 10.555963516235352, 10.975723266601562, 11.395482063293457, 11.815240859985352, 12.234999656677246, 12.65475845336914, 13.074518203735352, 13.494277000427246]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 11.0, 10.0, 19.0, 10.0, 10.0, 17.0, 14.0, 29.0, 30.0, 35.0, 35.0, 34.0, 41.0, 35.0, 38.0, 38.0, 33.0, 49.0, 38.0, 53.0, 46.0, 40.0, 46.0, 42.0, 42.0, 19.0, 25.0, 27.0, 29.0, 10.0, 18.0, 18.0, 17.0, 7.0, 5.0, 4.0, 6.0, 7.0, 1.0, 1.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.933358192443848, -5.739931106567383, -5.54650354385376, -5.353076457977295, -5.15964937210083, -4.966222286224365, -4.772794723510742, -4.579367637634277, -4.3859405517578125, -4.192513465881348, -3.9990861415863037, -3.8056588172912598, -3.612231731414795, -3.418804407119751, -3.225377082824707, -3.031949996948242, -2.8385226726531982, -2.6450953483581543, -2.4516682624816895, -2.2582409381866455, -2.0648138523101807, -1.8713865280151367, -1.6779593229293823, -1.484532117843628, -1.2911049127578735, -1.0976777076721191, -0.9042505025863647, -0.7108232378959656, -0.5173960328102112, -0.3239688277244568, -0.13054156303405762, 0.06288564205169678, 0.25631284713745117, 0.44974005222320557, 0.64316725730896, 0.8365945219993591, 1.0300216674804688, 1.2234489917755127, 1.416876196861267, 1.6103034019470215, 1.8037306070327759, 1.9971578121185303, 2.190585136413574, 2.384012222290039, 2.577439546585083, 2.770866632461548, 2.964293956756592, 3.1577210426330566, 3.3511483669281006, 3.5445756912231445, 3.7380027770996094, 3.9314301013946533, 4.124857425689697, 4.318284511566162, 4.511711597442627, 4.70513916015625, 4.898566246032715, 5.09199333190918, 5.285420894622803, 5.478847980499268, 5.672275066375732, 5.865702152252197, 6.05912971496582, 6.252556800842285, 6.44598388671875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 9.0, 13.0, 12.0, 16.0, 26.0, 39.0, 59.0, 70.0, 109.0, 150.0, 248.0, 306.0, 436.0, 670.0, 974.0, 1513.0, 2265.0, 3380.0, 5380.0, 8326.0, 13677.0, 22856.0, 39802.0, 75978.0, 164131.0, 405289.0, 961322.0, 1255328.0, 703873.0, 277230.0, 117426.0, 56193.0, 30384.0, 17318.0, 10646.0, 6554.0, 4171.0, 2716.0, 1829.0, 1175.0, 819.0, 525.0, 326.0, 232.0, 159.0, 102.0, 65.0, 59.0, 37.0, 17.0, 19.0, 13.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.65625, -12.276123046875, -11.89599609375, -11.515869140625, -11.1357421875, -10.755615234375, -10.37548828125, -9.995361328125, -9.615234375, -9.235107421875, -8.85498046875, -8.474853515625, -8.0947265625, -7.714599609375, -7.33447265625, -6.954345703125, -6.57421875, -6.194091796875, -5.81396484375, -5.433837890625, -5.0537109375, -4.673583984375, -4.29345703125, -3.913330078125, -3.533203125, -3.153076171875, -2.77294921875, -2.392822265625, -2.0126953125, -1.632568359375, -1.25244140625, -0.872314453125, -0.4921875, -0.112060546875, 0.26806640625, 0.648193359375, 1.0283203125, 1.408447265625, 1.78857421875, 2.168701171875, 2.548828125, 2.928955078125, 3.30908203125, 3.689208984375, 4.0693359375, 4.449462890625, 4.82958984375, 5.209716796875, 5.58984375, 5.969970703125, 6.35009765625, 6.730224609375, 7.1103515625, 7.490478515625, 7.87060546875, 8.250732421875, 8.630859375, 9.010986328125, 9.39111328125, 9.771240234375, 10.1513671875, 10.531494140625, 10.91162109375, 11.291748046875, 11.671875]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 6.0, 3.0, 16.0, 11.0, 13.0, 15.0, 20.0, 19.0, 29.0, 26.0, 20.0, 37.0, 36.0, 34.0, 35.0, 31.0, 52.0, 28.0, 36.0, 40.0, 30.0, 43.0, 37.0, 43.0, 43.0, 35.0, 44.0, 23.0, 31.0, 25.0, 25.0, 15.0, 12.0, 12.0, 13.0, 10.0, 11.0, 10.0, 7.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 1.0], "bins": [-5.921875, -5.75885009765625, -5.5958251953125, -5.43280029296875, -5.269775390625, -5.10675048828125, -4.9437255859375, -4.78070068359375, -4.61767578125, -4.45465087890625, -4.2916259765625, -4.12860107421875, -3.965576171875, -3.80255126953125, -3.6395263671875, -3.47650146484375, -3.3134765625, -3.15045166015625, -2.9874267578125, -2.82440185546875, -2.661376953125, -2.49835205078125, -2.3353271484375, -2.17230224609375, -2.00927734375, -1.84625244140625, -1.6832275390625, -1.52020263671875, -1.357177734375, -1.19415283203125, -1.0311279296875, -0.86810302734375, -0.705078125, -0.54205322265625, -0.3790283203125, -0.21600341796875, -0.052978515625, 0.11004638671875, 0.2730712890625, 0.43609619140625, 0.59912109375, 0.76214599609375, 0.9251708984375, 1.08819580078125, 1.251220703125, 1.41424560546875, 1.5772705078125, 1.74029541015625, 1.9033203125, 2.06634521484375, 2.2293701171875, 2.39239501953125, 2.555419921875, 2.71844482421875, 2.8814697265625, 3.04449462890625, 3.20751953125, 3.37054443359375, 3.5335693359375, 3.69659423828125, 3.859619140625, 4.02264404296875, 4.1856689453125, 4.34869384765625, 4.51171875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 7.0, 24.0, 17.0, 23.0, 25.0, 48.0, 48.0, 104.0, 205.0, 356.0, 560.0, 966.0, 1524.0, 2818.0, 5094.0, 9271.0, 18142.0, 37189.0, 80404.0, 190863.0, 508315.0, 1335446.0, 1232195.0, 454399.0, 171921.0, 73825.0, 34057.0, 16613.0, 8671.0, 4634.0, 2657.0, 1553.0, 877.0, 569.0, 292.0, 170.0, 149.0, 94.0, 53.0, 35.0, 17.0, 12.0, 10.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.390625, -16.789794921875, -16.18896484375, -15.588134765625, -14.9873046875, -14.386474609375, -13.78564453125, -13.184814453125, -12.583984375, -11.983154296875, -11.38232421875, -10.781494140625, -10.1806640625, -9.579833984375, -8.97900390625, -8.378173828125, -7.77734375, -7.176513671875, -6.57568359375, -5.974853515625, -5.3740234375, -4.773193359375, -4.17236328125, -3.571533203125, -2.970703125, -2.369873046875, -1.76904296875, -1.168212890625, -0.5673828125, 0.033447265625, 0.63427734375, 1.235107421875, 1.8359375, 2.436767578125, 3.03759765625, 3.638427734375, 4.2392578125, 4.840087890625, 5.44091796875, 6.041748046875, 6.642578125, 7.243408203125, 7.84423828125, 8.445068359375, 9.0458984375, 9.646728515625, 10.24755859375, 10.848388671875, 11.44921875, 12.050048828125, 12.65087890625, 13.251708984375, 13.8525390625, 14.453369140625, 15.05419921875, 15.655029296875, 16.255859375, 16.856689453125, 17.45751953125, 18.058349609375, 18.6591796875, 19.260009765625, 19.86083984375, 20.461669921875, 21.0625]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 11.0, 11.0, 14.0, 24.0, 26.0, 39.0, 50.0, 51.0, 67.0, 97.0, 128.0, 186.0, 219.0, 278.0, 309.0, 375.0, 364.0, 335.0, 328.0, 245.0, 211.0, 165.0, 141.0, 101.0, 71.0, 73.0, 48.0, 27.0, 20.0, 23.0, 12.0, 4.0, 10.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.94921875, -4.80078125, -4.65234375, -4.50390625, -4.35546875, -4.20703125, -4.05859375, -3.91015625, -3.76171875, -3.61328125, -3.46484375, -3.31640625, -3.16796875, -3.01953125, -2.87109375, -2.72265625, -2.57421875, -2.42578125, -2.27734375, -2.12890625, -1.98046875, -1.83203125, -1.68359375, -1.53515625, -1.38671875, -1.23828125, -1.08984375, -0.94140625, -0.79296875, -0.64453125, -0.49609375, -0.34765625, -0.19921875, -0.05078125, 0.09765625, 0.24609375, 0.39453125, 0.54296875, 0.69140625, 0.83984375, 0.98828125, 1.13671875, 1.28515625, 1.43359375, 1.58203125, 1.73046875, 1.87890625, 2.02734375, 2.17578125, 2.32421875, 2.47265625, 2.62109375, 2.76953125, 2.91796875, 3.06640625, 3.21484375, 3.36328125, 3.51171875, 3.66015625, 3.80859375, 3.95703125, 4.10546875, 4.25390625, 4.40234375, 4.55078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 5.0, 6.0, 4.0, 10.0, 8.0, 7.0, 11.0, 18.0, 21.0, 31.0, 31.0, 36.0, 49.0, 47.0, 62.0, 74.0, 68.0, 69.0, 62.0, 64.0, 57.0, 55.0, 44.0, 30.0, 30.0, 22.0, 18.0, 8.0, 11.0, 9.0, 6.0, 10.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-15.632526397705078, -15.172147750854492, -14.711769104003906, -14.25139045715332, -13.79101276397705, -13.330634117126465, -12.870255470275879, -12.409876823425293, -11.949499130249023, -11.489120483398438, -11.028741836547852, -10.568363189697266, -10.107985496520996, -9.64760684967041, -9.187228202819824, -8.726849555969238, -8.266470909118652, -7.806092262268066, -7.345714092254639, -6.885335445404053, -6.424957275390625, -5.964578628540039, -5.504199981689453, -5.043821334838867, -4.5834431648254395, -4.1230645179748535, -3.662686347961426, -3.20230770111084, -2.741929292678833, -2.281550884246826, -1.8211722373962402, -1.3607938289642334, -0.9004154205322266, -0.44003695249557495, 0.02034151554107666, 0.48072004318237305, 0.9410984516143799, 1.4014768600463867, 1.8618555068969727, 2.3222339153289795, 2.7826123237609863, 3.242990732192993, 3.703369140625, 4.163747787475586, 4.624126434326172, 5.0845046043396, 5.5448832511901855, 6.005261421203613, 6.465640068054199, 6.926018714904785, 7.386396884918213, 7.846775531768799, 8.307153701782227, 8.767532348632812, 9.227910995483398, 9.688289642333984, 10.14866828918457, 10.609046936035156, 11.069425582885742, 11.529804229736328, 11.990181922912598, 12.450560569763184, 12.91093921661377, 13.371317863464355, 13.831695556640625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 4.0, 7.0, 7.0, 7.0, 12.0, 12.0, 10.0, 7.0, 20.0, 24.0, 20.0, 24.0, 21.0, 34.0, 36.0, 38.0, 44.0, 49.0, 33.0, 42.0, 39.0, 47.0, 40.0, 47.0, 46.0, 34.0, 46.0, 29.0, 24.0, 39.0, 30.0, 22.0, 19.0, 16.0, 22.0, 14.0, 8.0, 8.0, 6.0, 9.0, 2.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.317469596862793, -8.085326194763184, -7.853183746337891, -7.621040344238281, -7.38889741897583, -7.156754493713379, -6.924611568450928, -6.692468643188477, -6.460325241088867, -6.228182315826416, -5.996039390563965, -5.7638959884643555, -5.531753063201904, -5.299610137939453, -5.067467212677002, -4.835324287414551, -4.6031813621521, -4.371038436889648, -4.138895511627197, -3.906752347946167, -3.6746091842651367, -3.4424662590026855, -3.2103233337402344, -2.978180408477783, -2.746037244796753, -2.5138943195343018, -2.2817511558532715, -2.0496082305908203, -1.8174651861190796, -1.5853221416473389, -1.3531792163848877, -1.121036171913147, -0.888892650604248, -0.6567496061325073, -0.4246066212654114, -0.19246363639831543, 0.03967940807342529, 0.271822452545166, 0.5039653778076172, 0.7361084222793579, 0.9682514667510986, 1.2003945112228394, 1.43253755569458, 1.6646804809570312, 1.896823525428772, 2.1289665699005127, 2.361109495162964, 2.593252658843994, 2.8253955841064453, 3.0575385093688965, 3.2896816730499268, 3.521824598312378, 3.753967761993408, 3.9861106872558594, 4.2182536125183105, 4.450396537780762, 4.682539939880371, 4.914682865142822, 5.146825790405273, 5.378969192504883, 5.611112117767334, 5.843255043029785, 6.075397968292236, 6.3075408935546875, 6.539683818817139]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 6.0, 6.0, 8.0, 23.0, 25.0, 36.0, 51.0, 74.0, 99.0, 143.0, 219.0, 315.0, 502.0, 731.0, 1195.0, 1832.0, 2886.0, 4707.0, 7986.0, 13558.0, 23564.0, 40651.0, 70868.0, 117599.0, 173285.0, 193757.0, 154204.0, 99839.0, 58696.0, 33534.0, 19596.0, 11060.0, 6653.0, 4033.0, 2384.0, 1557.0, 1004.0, 612.0, 398.0, 292.0, 189.0, 99.0, 89.0, 66.0, 35.0, 29.0, 24.0, 17.0, 5.0, 7.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.484375, -5.29736328125, -5.1103515625, -4.92333984375, -4.736328125, -4.54931640625, -4.3623046875, -4.17529296875, -3.98828125, -3.80126953125, -3.6142578125, -3.42724609375, -3.240234375, -3.05322265625, -2.8662109375, -2.67919921875, -2.4921875, -2.30517578125, -2.1181640625, -1.93115234375, -1.744140625, -1.55712890625, -1.3701171875, -1.18310546875, -0.99609375, -0.80908203125, -0.6220703125, -0.43505859375, -0.248046875, -0.06103515625, 0.1259765625, 0.31298828125, 0.5, 0.68701171875, 0.8740234375, 1.06103515625, 1.248046875, 1.43505859375, 1.6220703125, 1.80908203125, 1.99609375, 2.18310546875, 2.3701171875, 2.55712890625, 2.744140625, 2.93115234375, 3.1181640625, 3.30517578125, 3.4921875, 3.67919921875, 3.8662109375, 4.05322265625, 4.240234375, 4.42724609375, 4.6142578125, 4.80126953125, 4.98828125, 5.17529296875, 5.3623046875, 5.54931640625, 5.736328125, 5.92333984375, 6.1103515625, 6.29736328125, 6.484375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 8.0, 5.0, 8.0, 7.0, 12.0, 13.0, 12.0, 16.0, 17.0, 20.0, 15.0, 25.0, 22.0, 33.0, 35.0, 43.0, 46.0, 35.0, 41.0, 39.0, 38.0, 33.0, 51.0, 43.0, 46.0, 39.0, 31.0, 34.0, 40.0, 34.0, 28.0, 27.0, 23.0, 20.0, 12.0, 14.0, 9.0, 7.0, 3.0, 7.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.09375, -8.84014892578125, -8.5865478515625, -8.33294677734375, -8.079345703125, -7.82574462890625, -7.5721435546875, -7.31854248046875, -7.06494140625, -6.81134033203125, -6.5577392578125, -6.30413818359375, -6.050537109375, -5.79693603515625, -5.5433349609375, -5.28973388671875, -5.0361328125, -4.78253173828125, -4.5289306640625, -4.27532958984375, -4.021728515625, -3.76812744140625, -3.5145263671875, -3.26092529296875, -3.00732421875, -2.75372314453125, -2.5001220703125, -2.24652099609375, -1.992919921875, -1.73931884765625, -1.4857177734375, -1.23211669921875, -0.978515625, -0.72491455078125, -0.4713134765625, -0.21771240234375, 0.035888671875, 0.28948974609375, 0.5430908203125, 0.79669189453125, 1.05029296875, 1.30389404296875, 1.5574951171875, 1.81109619140625, 2.064697265625, 2.31829833984375, 2.5718994140625, 2.82550048828125, 3.0791015625, 3.33270263671875, 3.5863037109375, 3.83990478515625, 4.093505859375, 4.34710693359375, 4.6007080078125, 4.85430908203125, 5.10791015625, 5.36151123046875, 5.6151123046875, 5.86871337890625, 6.122314453125, 6.37591552734375, 6.6295166015625, 6.88311767578125, 7.13671875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 9.0, 11.0, 10.0, 10.0, 34.0, 32.0, 56.0, 68.0, 98.0, 133.0, 235.0, 356.0, 636.0, 1069.0, 1997.0, 3640.0, 7035.0, 14932.0, 33017.0, 79231.0, 191615.0, 331404.0, 218372.0, 91837.0, 38298.0, 17053.0, 8014.0, 4146.0, 2121.0, 1189.0, 689.0, 425.0, 224.0, 185.0, 111.0, 74.0, 52.0, 36.0, 23.0, 19.0, 13.0, 15.0, 11.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.015625, -11.6468505859375, -11.278076171875, -10.9093017578125, -10.54052734375, -10.1717529296875, -9.802978515625, -9.4342041015625, -9.0654296875, -8.6966552734375, -8.327880859375, -7.9591064453125, -7.59033203125, -7.2215576171875, -6.852783203125, -6.4840087890625, -6.115234375, -5.7464599609375, -5.377685546875, -5.0089111328125, -4.64013671875, -4.2713623046875, -3.902587890625, -3.5338134765625, -3.1650390625, -2.7962646484375, -2.427490234375, -2.0587158203125, -1.68994140625, -1.3211669921875, -0.952392578125, -0.5836181640625, -0.21484375, 0.1539306640625, 0.522705078125, 0.8914794921875, 1.26025390625, 1.6290283203125, 1.997802734375, 2.3665771484375, 2.7353515625, 3.1041259765625, 3.472900390625, 3.8416748046875, 4.21044921875, 4.5792236328125, 4.947998046875, 5.3167724609375, 5.685546875, 6.0543212890625, 6.423095703125, 6.7918701171875, 7.16064453125, 7.5294189453125, 7.898193359375, 8.2669677734375, 8.6357421875, 9.0045166015625, 9.373291015625, 9.7420654296875, 10.11083984375, 10.4796142578125, 10.848388671875, 11.2171630859375, 11.5859375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 7.0, 14.0, 20.0, 15.0, 22.0, 17.0, 16.0, 23.0, 31.0, 28.0, 34.0, 25.0, 33.0, 28.0, 35.0, 40.0, 25.0, 47.0, 37.0, 40.0, 37.0, 45.0, 46.0, 32.0, 30.0, 29.0, 29.0, 34.0, 25.0, 30.0, 16.0, 20.0, 19.0, 11.0, 8.0, 11.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.4296875, -4.28924560546875, -4.1488037109375, -4.00836181640625, -3.867919921875, -3.72747802734375, -3.5870361328125, -3.44659423828125, -3.30615234375, -3.16571044921875, -3.0252685546875, -2.88482666015625, -2.744384765625, -2.60394287109375, -2.4635009765625, -2.32305908203125, -2.1826171875, -2.04217529296875, -1.9017333984375, -1.76129150390625, -1.620849609375, -1.48040771484375, -1.3399658203125, -1.19952392578125, -1.05908203125, -0.91864013671875, -0.7781982421875, -0.63775634765625, -0.497314453125, -0.35687255859375, -0.2164306640625, -0.07598876953125, 0.064453125, 0.20489501953125, 0.3453369140625, 0.48577880859375, 0.626220703125, 0.76666259765625, 0.9071044921875, 1.04754638671875, 1.18798828125, 1.32843017578125, 1.4688720703125, 1.60931396484375, 1.749755859375, 1.89019775390625, 2.0306396484375, 2.17108154296875, 2.3115234375, 2.45196533203125, 2.5924072265625, 2.73284912109375, 2.873291015625, 3.01373291015625, 3.1541748046875, 3.29461669921875, 3.43505859375, 3.57550048828125, 3.7159423828125, 3.85638427734375, 3.996826171875, 4.13726806640625, 4.2777099609375, 4.41815185546875, 4.55859375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 5.0, 9.0, 5.0, 6.0, 8.0, 12.0, 16.0, 38.0, 36.0, 62.0, 83.0, 121.0, 181.0, 253.0, 432.0, 649.0, 1094.0, 1687.0, 2664.0, 4745.0, 8054.0, 14797.0, 27565.0, 52915.0, 103753.0, 198371.0, 265688.0, 174625.0, 89650.0, 45479.0, 23997.0, 13270.0, 7397.0, 4157.0, 2484.0, 1521.0, 934.0, 639.0, 388.0, 222.0, 169.0, 116.0, 76.0, 59.0, 40.0, 27.0, 17.0, 13.0, 9.0, 15.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.78460693359375, -4.6160888671875, -4.44757080078125, -4.279052734375, -4.11053466796875, -3.9420166015625, -3.77349853515625, -3.60498046875, -3.43646240234375, -3.2679443359375, -3.09942626953125, -2.930908203125, -2.76239013671875, -2.5938720703125, -2.42535400390625, -2.2568359375, -2.08831787109375, -1.9197998046875, -1.75128173828125, -1.582763671875, -1.41424560546875, -1.2457275390625, -1.07720947265625, -0.90869140625, -0.74017333984375, -0.5716552734375, -0.40313720703125, -0.234619140625, -0.06610107421875, 0.1024169921875, 0.27093505859375, 0.439453125, 0.60797119140625, 0.7764892578125, 0.94500732421875, 1.113525390625, 1.28204345703125, 1.4505615234375, 1.61907958984375, 1.78759765625, 1.95611572265625, 2.1246337890625, 2.29315185546875, 2.461669921875, 2.63018798828125, 2.7987060546875, 2.96722412109375, 3.1357421875, 3.30426025390625, 3.4727783203125, 3.64129638671875, 3.809814453125, 3.97833251953125, 4.1468505859375, 4.31536865234375, 4.48388671875, 4.65240478515625, 4.8209228515625, 4.98944091796875, 5.157958984375, 5.32647705078125, 5.4949951171875, 5.66351318359375, 5.83203125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 4.0, 8.0, 6.0, 9.0, 10.0, 5.0, 9.0, 13.0, 21.0, 14.0, 17.0, 19.0, 26.0, 32.0, 32.0, 36.0, 48.0, 48.0, 63.0, 56.0, 53.0, 47.0, 66.0, 56.0, 37.0, 37.0, 31.0, 32.0, 31.0, 21.0, 13.0, 13.0, 16.0, 15.0, 9.0, 8.0, 12.0, 3.0, 6.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.00018489360809326172, -0.00017954781651496887, -0.00017420202493667603, -0.00016885623335838318, -0.00016351044178009033, -0.00015816465020179749, -0.00015281885862350464, -0.0001474730670452118, -0.00014212727546691895, -0.0001367814838886261, -0.00013143569231033325, -0.0001260899007320404, -0.00012074410915374756, -0.00011539831757545471, -0.00011005252599716187, -0.00010470673441886902, -9.936094284057617e-05, -9.401515126228333e-05, -8.866935968399048e-05, -8.332356810569763e-05, -7.797777652740479e-05, -7.263198494911194e-05, -6.728619337081909e-05, -6.194040179252625e-05, -5.65946102142334e-05, -5.124881863594055e-05, -4.5903027057647705e-05, -4.055723547935486e-05, -3.521144390106201e-05, -2.9865652322769165e-05, -2.451986074447632e-05, -1.917406916618347e-05, -1.3828277587890625e-05, -8.482486009597778e-06, -3.1366944313049316e-06, 2.209097146987915e-06, 7.554888725280762e-06, 1.2900680303573608e-05, 1.8246471881866455e-05, 2.3592263460159302e-05, 2.893805503845215e-05, 3.4283846616744995e-05, 3.962963819503784e-05, 4.497542977333069e-05, 5.0321221351623535e-05, 5.566701292991638e-05, 6.101280450820923e-05, 6.635859608650208e-05, 7.170438766479492e-05, 7.705017924308777e-05, 8.239597082138062e-05, 8.774176239967346e-05, 9.308755397796631e-05, 9.843334555625916e-05, 0.000103779137134552, 0.00010912492871284485, 0.0001144707202911377, 0.00011981651186943054, 0.0001251623034477234, 0.00013050809502601624, 0.00013585388660430908, 0.00014119967818260193, 0.00014654546976089478, 0.00015189126133918762, 0.00015723705291748047]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 9.0, 11.0, 13.0, 10.0, 17.0, 32.0, 40.0, 62.0, 82.0, 137.0, 180.0, 305.0, 548.0, 792.0, 1378.0, 2526.0, 4371.0, 8286.0, 15551.0, 30493.0, 61665.0, 123120.0, 216355.0, 246987.0, 163892.0, 84190.0, 41818.0, 21115.0, 10999.0, 5826.0, 3159.0, 1809.0, 1072.0, 615.0, 366.0, 226.0, 177.0, 113.0, 59.0, 48.0, 28.0, 25.0, 12.0, 3.0, 9.0, 10.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.78125, -5.58343505859375, -5.3856201171875, -5.18780517578125, -4.989990234375, -4.79217529296875, -4.5943603515625, -4.39654541015625, -4.19873046875, -4.00091552734375, -3.8031005859375, -3.60528564453125, -3.407470703125, -3.20965576171875, -3.0118408203125, -2.81402587890625, -2.6162109375, -2.41839599609375, -2.2205810546875, -2.02276611328125, -1.824951171875, -1.62713623046875, -1.4293212890625, -1.23150634765625, -1.03369140625, -0.83587646484375, -0.6380615234375, -0.44024658203125, -0.242431640625, -0.04461669921875, 0.1531982421875, 0.35101318359375, 0.548828125, 0.74664306640625, 0.9444580078125, 1.14227294921875, 1.340087890625, 1.53790283203125, 1.7357177734375, 1.93353271484375, 2.13134765625, 2.32916259765625, 2.5269775390625, 2.72479248046875, 2.922607421875, 3.12042236328125, 3.3182373046875, 3.51605224609375, 3.7138671875, 3.91168212890625, 4.1094970703125, 4.30731201171875, 4.505126953125, 4.70294189453125, 4.9007568359375, 5.09857177734375, 5.29638671875, 5.49420166015625, 5.6920166015625, 5.88983154296875, 6.087646484375, 6.28546142578125, 6.4832763671875, 6.68109130859375, 6.87890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 10.0, 10.0, 8.0, 14.0, 18.0, 18.0, 25.0, 32.0, 35.0, 33.0, 46.0, 54.0, 60.0, 65.0, 64.0, 67.0, 66.0, 47.0, 53.0, 59.0, 29.0, 37.0, 34.0, 24.0, 19.0, 21.0, 13.0, 4.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.5947265625, -1.5515899658203125, -1.508453369140625, -1.4653167724609375, -1.42218017578125, -1.3790435791015625, -1.335906982421875, -1.2927703857421875, -1.2496337890625, -1.2064971923828125, -1.163360595703125, -1.1202239990234375, -1.07708740234375, -1.0339508056640625, -0.990814208984375, -0.9476776123046875, -0.904541015625, -0.8614044189453125, -0.818267822265625, -0.7751312255859375, -0.73199462890625, -0.6888580322265625, -0.645721435546875, -0.6025848388671875, -0.5594482421875, -0.5163116455078125, -0.473175048828125, -0.4300384521484375, -0.38690185546875, -0.3437652587890625, -0.300628662109375, -0.2574920654296875, -0.21435546875, -0.1712188720703125, -0.128082275390625, -0.0849456787109375, -0.04180908203125, 0.0013275146484375, 0.044464111328125, 0.0876007080078125, 0.1307373046875, 0.1738739013671875, 0.217010498046875, 0.2601470947265625, 0.30328369140625, 0.3464202880859375, 0.389556884765625, 0.4326934814453125, 0.475830078125, 0.5189666748046875, 0.562103271484375, 0.6052398681640625, 0.64837646484375, 0.6915130615234375, 0.734649658203125, 0.7777862548828125, 0.8209228515625, 0.8640594482421875, 0.907196044921875, 0.9503326416015625, 0.99346923828125, 1.0366058349609375, 1.079742431640625, 1.1228790283203125, 1.166015625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 6.0, 4.0, 7.0, 8.0, 5.0, 14.0, 13.0, 21.0, 16.0, 27.0, 30.0, 39.0, 43.0, 69.0, 72.0, 72.0, 73.0, 71.0, 67.0, 63.0, 64.0, 36.0, 41.0, 30.0, 30.0, 15.0, 11.0, 10.0, 10.0, 10.0, 5.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.333417892456055, -16.847332000732422, -16.36124610900879, -15.875160217285156, -15.389074325561523, -14.90298843383789, -14.416901588439941, -13.930815696716309, -13.444729804992676, -12.958643913269043, -12.47255802154541, -11.986472129821777, -11.500385284423828, -11.014299392700195, -10.528213500976562, -10.04212760925293, -9.556041717529297, -9.069955825805664, -8.583869934082031, -8.097784042358398, -7.611697673797607, -7.125611782073975, -6.639525413513184, -6.153439521789551, -5.667353630065918, -5.181267738342285, -4.695181846618652, -4.209095478057861, -3.7230095863342285, -3.2369236946105957, -2.750837564468384, -2.264751434326172, -1.778665542602539, -1.2925795316696167, -0.8064935207366943, -0.320407509803772, 0.1656785011291504, 0.6517643928527832, 1.1378505229949951, 1.623936653137207, 2.11002254486084, 2.5961084365844727, 3.0821945667266846, 3.5682806968688965, 4.054366588592529, 4.540452480316162, 5.026538848876953, 5.512624740600586, 5.998710632324219, 6.484796524047852, 6.970882415771484, 7.456968784332275, 7.943054676055908, 8.429140090942383, 8.915226936340332, 9.401312828063965, 9.887398719787598, 10.37348461151123, 10.859570503234863, 11.345656394958496, 11.831743240356445, 12.317829132080078, 12.803915023803711, 13.290000915527344, 13.776086807250977]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 3.0, 8.0, 11.0, 7.0, 12.0, 11.0, 19.0, 11.0, 23.0, 22.0, 33.0, 21.0, 28.0, 39.0, 43.0, 38.0, 39.0, 41.0, 46.0, 37.0, 53.0, 40.0, 50.0, 37.0, 30.0, 49.0, 35.0, 23.0, 23.0, 35.0, 22.0, 23.0, 23.0, 14.0, 12.0, 10.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-8.575113296508789, -8.342183113098145, -8.109253883361816, -7.876323699951172, -7.643393516540527, -7.410463809967041, -7.177534103393555, -6.94460391998291, -6.711674213409424, -6.4787445068359375, -6.245814323425293, -6.012884616851807, -5.77995491027832, -5.547024726867676, -5.3140950202941895, -5.081165313720703, -4.848235130310059, -4.615305423736572, -4.382375240325928, -4.149445533752441, -3.916515588760376, -3.6835856437683105, -3.450655937194824, -3.217725992202759, -2.9847960472106934, -2.751866102218628, -2.5189361572265625, -2.286006450653076, -2.0530765056610107, -1.8201465606689453, -1.5872167348861694, -1.3542869091033936, -1.12135648727417, -0.8884266018867493, -0.6554967164993286, -0.42256683111190796, -0.1896369457244873, 0.043292999267578125, 0.276222825050354, 0.5091526508331299, 0.7420825958251953, 0.975012481212616, 1.2079423666000366, 1.4408721923828125, 1.673802137374878, 1.9067320823669434, 2.1396617889404297, 2.372591733932495, 2.6055216789245605, 2.838451623916626, 3.0713815689086914, 3.3043112754821777, 3.537241220474243, 3.7701711654663086, 4.003100872039795, 4.236030578613281, 4.468960762023926, 4.701890468597412, 4.934820652008057, 5.167750358581543, 5.4006805419921875, 5.633610248565674, 5.86653995513916, 6.099470138549805, 6.332399845123291]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 6.0, 9.0, 12.0, 15.0, 20.0, 25.0, 48.0, 67.0, 112.0, 157.0, 248.0, 355.0, 532.0, 816.0, 1261.0, 1861.0, 3029.0, 4567.0, 6979.0, 10845.0, 16962.0, 25887.0, 39450.0, 58966.0, 84292.0, 111546.0, 134028.0, 137246.0, 119845.0, 93015.0, 66691.0, 45033.0, 29945.0, 19247.0, 12556.0, 8091.0, 5100.0, 3274.0, 2175.0, 1446.0, 980.0, 592.0, 409.0, 267.0, 175.0, 124.0, 90.0, 64.0, 40.0, 22.0, 18.0, 8.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-5.4765625, -5.3114013671875, -5.146240234375, -4.9810791015625, -4.81591796875, -4.6507568359375, -4.485595703125, -4.3204345703125, -4.1552734375, -3.9901123046875, -3.824951171875, -3.6597900390625, -3.49462890625, -3.3294677734375, -3.164306640625, -2.9991455078125, -2.833984375, -2.6688232421875, -2.503662109375, -2.3385009765625, -2.17333984375, -2.0081787109375, -1.843017578125, -1.6778564453125, -1.5126953125, -1.3475341796875, -1.182373046875, -1.0172119140625, -0.85205078125, -0.6868896484375, -0.521728515625, -0.3565673828125, -0.19140625, -0.0262451171875, 0.138916015625, 0.3040771484375, 0.46923828125, 0.6343994140625, 0.799560546875, 0.9647216796875, 1.1298828125, 1.2950439453125, 1.460205078125, 1.6253662109375, 1.79052734375, 1.9556884765625, 2.120849609375, 2.2860107421875, 2.451171875, 2.6163330078125, 2.781494140625, 2.9466552734375, 3.11181640625, 3.2769775390625, 3.442138671875, 3.6072998046875, 3.7724609375, 3.9376220703125, 4.102783203125, 4.2679443359375, 4.43310546875, 4.5982666015625, 4.763427734375, 4.9285888671875, 5.09375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 1.0, 4.0, 5.0, 10.0, 10.0, 12.0, 9.0, 13.0, 16.0, 19.0, 22.0, 24.0, 19.0, 20.0, 22.0, 36.0, 30.0, 30.0, 34.0, 37.0, 37.0, 33.0, 42.0, 45.0, 44.0, 32.0, 40.0, 40.0, 36.0, 40.0, 28.0, 24.0, 25.0, 28.0, 24.0, 14.0, 16.0, 13.0, 10.0, 10.0, 4.0, 11.0, 4.0, 4.0, 3.0, 5.0, 2.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-7.52734375, -7.2979736328125, -7.068603515625, -6.8392333984375, -6.60986328125, -6.3804931640625, -6.151123046875, -5.9217529296875, -5.6923828125, -5.4630126953125, -5.233642578125, -5.0042724609375, -4.77490234375, -4.5455322265625, -4.316162109375, -4.0867919921875, -3.857421875, -3.6280517578125, -3.398681640625, -3.1693115234375, -2.93994140625, -2.7105712890625, -2.481201171875, -2.2518310546875, -2.0224609375, -1.7930908203125, -1.563720703125, -1.3343505859375, -1.10498046875, -0.8756103515625, -0.646240234375, -0.4168701171875, -0.1875, 0.0418701171875, 0.271240234375, 0.5006103515625, 0.72998046875, 0.9593505859375, 1.188720703125, 1.4180908203125, 1.6474609375, 1.8768310546875, 2.106201171875, 2.3355712890625, 2.56494140625, 2.7943115234375, 3.023681640625, 3.2530517578125, 3.482421875, 3.7117919921875, 3.941162109375, 4.1705322265625, 4.39990234375, 4.6292724609375, 4.858642578125, 5.0880126953125, 5.3173828125, 5.5467529296875, 5.776123046875, 6.0054931640625, 6.23486328125, 6.4642333984375, 6.693603515625, 6.9229736328125, 7.15234375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 12.0, 23.0, 35.0, 58.0, 67.0, 89.0, 149.0, 250.0, 355.0, 652.0, 931.0, 1474.0, 2300.0, 3742.0, 6085.0, 10023.0, 16055.0, 25993.0, 41208.0, 64266.0, 95372.0, 130257.0, 153547.0, 147081.0, 118362.0, 83285.0, 54571.0, 34895.0, 21887.0, 13383.0, 8327.0, 5187.0, 3119.0, 1963.0, 1271.0, 797.0, 516.0, 337.0, 205.0, 116.0, 88.0, 70.0, 51.0, 29.0, 16.0, 15.0, 11.0, 3.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.7734375, -6.560546875, -6.34765625, -6.134765625, -5.921875, -5.708984375, -5.49609375, -5.283203125, -5.0703125, -4.857421875, -4.64453125, -4.431640625, -4.21875, -4.005859375, -3.79296875, -3.580078125, -3.3671875, -3.154296875, -2.94140625, -2.728515625, -2.515625, -2.302734375, -2.08984375, -1.876953125, -1.6640625, -1.451171875, -1.23828125, -1.025390625, -0.8125, -0.599609375, -0.38671875, -0.173828125, 0.0390625, 0.251953125, 0.46484375, 0.677734375, 0.890625, 1.103515625, 1.31640625, 1.529296875, 1.7421875, 1.955078125, 2.16796875, 2.380859375, 2.59375, 2.806640625, 3.01953125, 3.232421875, 3.4453125, 3.658203125, 3.87109375, 4.083984375, 4.296875, 4.509765625, 4.72265625, 4.935546875, 5.1484375, 5.361328125, 5.57421875, 5.787109375, 6.0, 6.212890625, 6.42578125, 6.638671875, 6.8515625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 9.0, 13.0, 16.0, 15.0, 22.0, 21.0, 20.0, 26.0, 19.0, 32.0, 30.0, 46.0, 26.0, 57.0, 49.0, 35.0, 36.0, 49.0, 43.0, 49.0, 44.0, 42.0, 49.0, 29.0, 25.0, 26.0, 33.0, 21.0, 16.0, 22.0, 16.0, 10.0, 9.0, 8.0, 10.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17578125, -5.00189208984375, -4.8280029296875, -4.65411376953125, -4.480224609375, -4.30633544921875, -4.1324462890625, -3.95855712890625, -3.78466796875, -3.61077880859375, -3.4368896484375, -3.26300048828125, -3.089111328125, -2.91522216796875, -2.7413330078125, -2.56744384765625, -2.3935546875, -2.21966552734375, -2.0457763671875, -1.87188720703125, -1.697998046875, -1.52410888671875, -1.3502197265625, -1.17633056640625, -1.00244140625, -0.82855224609375, -0.6546630859375, -0.48077392578125, -0.306884765625, -0.13299560546875, 0.0408935546875, 0.21478271484375, 0.388671875, 0.56256103515625, 0.7364501953125, 0.91033935546875, 1.084228515625, 1.25811767578125, 1.4320068359375, 1.60589599609375, 1.77978515625, 1.95367431640625, 2.1275634765625, 2.30145263671875, 2.475341796875, 2.64923095703125, 2.8231201171875, 2.99700927734375, 3.1708984375, 3.34478759765625, 3.5186767578125, 3.69256591796875, 3.866455078125, 4.04034423828125, 4.2142333984375, 4.38812255859375, 4.56201171875, 4.73590087890625, 4.9097900390625, 5.08367919921875, 5.257568359375, 5.43145751953125, 5.6053466796875, 5.77923583984375, 5.953125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 8.0, 10.0, 11.0, 27.0, 21.0, 36.0, 48.0, 58.0, 86.0, 120.0, 203.0, 259.0, 363.0, 582.0, 902.0, 1425.0, 2425.0, 4085.0, 7105.0, 12878.0, 25155.0, 55333.0, 133804.0, 289125.0, 280073.0, 127341.0, 53050.0, 24415.0, 12575.0, 6739.0, 3857.0, 2305.0, 1440.0, 877.0, 587.0, 351.0, 259.0, 189.0, 103.0, 77.0, 73.0, 52.0, 37.0, 30.0, 14.0, 12.0, 9.0, 5.0, 3.0, 5.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.9866943359375, -8.676513671875, -8.3663330078125, -8.05615234375, -7.7459716796875, -7.435791015625, -7.1256103515625, -6.8154296875, -6.5052490234375, -6.195068359375, -5.8848876953125, -5.57470703125, -5.2645263671875, -4.954345703125, -4.6441650390625, -4.333984375, -4.0238037109375, -3.713623046875, -3.4034423828125, -3.09326171875, -2.7830810546875, -2.472900390625, -2.1627197265625, -1.8525390625, -1.5423583984375, -1.232177734375, -0.9219970703125, -0.61181640625, -0.3016357421875, 0.008544921875, 0.3187255859375, 0.62890625, 0.9390869140625, 1.249267578125, 1.5594482421875, 1.86962890625, 2.1798095703125, 2.489990234375, 2.8001708984375, 3.1103515625, 3.4205322265625, 3.730712890625, 4.0408935546875, 4.35107421875, 4.6612548828125, 4.971435546875, 5.2816162109375, 5.591796875, 5.9019775390625, 6.212158203125, 6.5223388671875, 6.83251953125, 7.1427001953125, 7.452880859375, 7.7630615234375, 8.0732421875, 8.3834228515625, 8.693603515625, 9.0037841796875, 9.31396484375, 9.6241455078125, 9.934326171875, 10.2445068359375, 10.5546875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 7.0, 16.0, 14.0, 18.0, 29.0, 37.0, 28.0, 57.0, 79.0, 89.0, 92.0, 96.0, 98.0, 74.0, 53.0, 37.0, 36.0, 25.0, 18.0, 6.0, 10.0, 7.0, 15.0, 5.0, 4.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0008573532104492188, -0.0008311942219734192, -0.0008050352334976196, -0.0007788762450218201, -0.0007527172565460205, -0.000726558268070221, -0.0007003992795944214, -0.0006742402911186218, -0.0006480813026428223, -0.0006219223141670227, -0.0005957633256912231, -0.0005696043372154236, -0.000543445348739624, -0.0005172863602638245, -0.0004911273717880249, -0.00046496838331222534, -0.0004388093948364258, -0.0004126504063606262, -0.00038649141788482666, -0.0003603324294090271, -0.00033417344093322754, -0.000308014452457428, -0.0002818554639816284, -0.00025569647550582886, -0.0002295374870300293, -0.00020337849855422974, -0.00017721951007843018, -0.00015106052160263062, -0.00012490153312683105, -9.87425446510315e-05, -7.258355617523193e-05, -4.642456769943237e-05, -2.0265579223632812e-05, 5.893409252166748e-06, 3.205239772796631e-05, 5.821138620376587e-05, 8.437037467956543e-05, 0.00011052936315536499, 0.00013668835163116455, 0.0001628473401069641, 0.00018900632858276367, 0.00021516531705856323, 0.0002413243055343628, 0.00026748329401016235, 0.0002936422824859619, 0.0003198012709617615, 0.00034596025943756104, 0.0003721192479133606, 0.00039827823638916016, 0.0004244372248649597, 0.0004505962133407593, 0.00047675520181655884, 0.0005029141902923584, 0.000529073178768158, 0.0005552321672439575, 0.0005813911557197571, 0.0006075501441955566, 0.0006337091326713562, 0.0006598681211471558, 0.0006860271096229553, 0.0007121860980987549, 0.0007383450865745544, 0.000764504075050354, 0.0007906630635261536, 0.0008168220520019531]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 1.0, 6.0, 6.0, 15.0, 16.0, 16.0, 34.0, 36.0, 53.0, 65.0, 114.0, 136.0, 236.0, 334.0, 489.0, 761.0, 1201.0, 2061.0, 3331.0, 5828.0, 11516.0, 23965.0, 55591.0, 142390.0, 327396.0, 277693.0, 109549.0, 43708.0, 19579.0, 9470.0, 5146.0, 2795.0, 1782.0, 1089.0, 701.0, 457.0, 307.0, 194.0, 126.0, 111.0, 68.0, 53.0, 43.0, 22.0, 16.0, 16.0, 8.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.0546875, -11.69873046875, -11.3427734375, -10.98681640625, -10.630859375, -10.27490234375, -9.9189453125, -9.56298828125, -9.20703125, -8.85107421875, -8.4951171875, -8.13916015625, -7.783203125, -7.42724609375, -7.0712890625, -6.71533203125, -6.359375, -6.00341796875, -5.6474609375, -5.29150390625, -4.935546875, -4.57958984375, -4.2236328125, -3.86767578125, -3.51171875, -3.15576171875, -2.7998046875, -2.44384765625, -2.087890625, -1.73193359375, -1.3759765625, -1.02001953125, -0.6640625, -0.30810546875, 0.0478515625, 0.40380859375, 0.759765625, 1.11572265625, 1.4716796875, 1.82763671875, 2.18359375, 2.53955078125, 2.8955078125, 3.25146484375, 3.607421875, 3.96337890625, 4.3193359375, 4.67529296875, 5.03125, 5.38720703125, 5.7431640625, 6.09912109375, 6.455078125, 6.81103515625, 7.1669921875, 7.52294921875, 7.87890625, 8.23486328125, 8.5908203125, 8.94677734375, 9.302734375, 9.65869140625, 10.0146484375, 10.37060546875, 10.7265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 11.0, 14.0, 22.0, 28.0, 36.0, 46.0, 47.0, 61.0, 78.0, 81.0, 84.0, 94.0, 73.0, 57.0, 66.0, 52.0, 29.0, 31.0, 23.0, 15.0, 18.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.671875, -1.59844970703125, -1.5250244140625, -1.45159912109375, -1.378173828125, -1.30474853515625, -1.2313232421875, -1.15789794921875, -1.08447265625, -1.01104736328125, -0.9376220703125, -0.86419677734375, -0.790771484375, -0.71734619140625, -0.6439208984375, -0.57049560546875, -0.4970703125, -0.42364501953125, -0.3502197265625, -0.27679443359375, -0.203369140625, -0.12994384765625, -0.0565185546875, 0.01690673828125, 0.09033203125, 0.16375732421875, 0.2371826171875, 0.31060791015625, 0.384033203125, 0.45745849609375, 0.5308837890625, 0.60430908203125, 0.677734375, 0.75115966796875, 0.8245849609375, 0.89801025390625, 0.971435546875, 1.04486083984375, 1.1182861328125, 1.19171142578125, 1.26513671875, 1.33856201171875, 1.4119873046875, 1.48541259765625, 1.558837890625, 1.63226318359375, 1.7056884765625, 1.77911376953125, 1.8525390625, 1.92596435546875, 1.9993896484375, 2.07281494140625, 2.146240234375, 2.21966552734375, 2.2930908203125, 2.36651611328125, 2.43994140625, 2.51336669921875, 2.5867919921875, 2.66021728515625, 2.733642578125, 2.80706787109375, 2.8804931640625, 2.95391845703125, 3.02734375]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 8.0, 5.0, 11.0, 11.0, 13.0, 21.0, 23.0, 17.0, 43.0, 53.0, 59.0, 54.0, 83.0, 84.0, 73.0, 71.0, 78.0, 63.0, 48.0, 34.0, 30.0, 31.0, 22.0, 12.0, 15.0, 9.0, 6.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.73642349243164, -16.196664810180664, -15.656905174255371, -15.117145538330078, -14.577386856079102, -14.037627220153809, -13.497867584228516, -12.958108901977539, -12.418349266052246, -11.878589630126953, -11.338830947875977, -10.799071311950684, -10.25931167602539, -9.719552993774414, -9.179793357849121, -8.640033721923828, -8.100275039672852, -7.560515880584717, -7.020756721496582, -6.480997085571289, -5.941237926483154, -5.4014787673950195, -4.861719131469727, -4.321959972381592, -3.782200813293457, -3.2424416542053223, -2.7026822566986084, -2.1629228591918945, -1.6231637001037598, -1.083404541015625, -0.5436451435089111, -0.0038857460021972656, 0.5358753204345703, 1.0756345987319946, 1.615393877029419, 2.155153274536133, 2.6949124336242676, 3.2346715927124023, 3.774430990219116, 4.31419038772583, 4.853949546813965, 5.3937087059021, 5.933467864990234, 6.473227500915527, 7.012986660003662, 7.552745819091797, 8.09250545501709, 8.632265090942383, 9.17202377319336, 9.711783409118652, 10.251542091369629, 10.791301727294922, 11.331060409545898, 11.870820045471191, 12.410579681396484, 12.950338363647461, 13.490097999572754, 14.029857635498047, 14.569616317749023, 15.109375953674316, 15.64913558959961, 16.188894271850586, 16.728652954101562, 17.268413543701172, 17.80817222595215]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 7.0, 6.0, 15.0, 19.0, 13.0, 19.0, 13.0, 23.0, 26.0, 25.0, 36.0, 36.0, 43.0, 40.0, 42.0, 46.0, 43.0, 45.0, 46.0, 47.0, 45.0, 37.0, 35.0, 39.0, 30.0, 25.0, 36.0, 21.0, 28.0, 20.0, 20.0, 10.0, 16.0, 11.0, 10.0, 3.0, 5.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.566052436828613, -9.3101806640625, -9.054309844970703, -8.79843807220459, -8.542567253112793, -8.28669548034668, -8.030824661254883, -7.7749528884887695, -7.5190815925598145, -7.263210296630859, -7.007339000701904, -6.751467704772949, -6.495595932006836, -6.239725112915039, -5.983853340148926, -5.727982044219971, -5.472110748291016, -5.2162394523620605, -4.9603681564331055, -4.70449686050415, -4.448625564575195, -4.192753791809082, -3.936882495880127, -3.681011199951172, -3.425139904022217, -3.1692686080932617, -2.9133973121643066, -2.6575257778167725, -2.4016544818878174, -2.1457831859588623, -1.8899117708206177, -1.634040355682373, -1.3781685829162598, -1.1222972869873047, -0.8664258718490601, -0.6105545163154602, -0.35468316078186035, -0.09881186485290527, 0.15705955028533936, 0.412930965423584, 0.6688022613525391, 0.9246736168861389, 1.1805449724197388, 1.4364163875579834, 1.6922876834869385, 1.9481589794158936, 2.2040305137634277, 2.459901809692383, 2.715773105621338, 2.971644401550293, 3.227515697479248, 3.4833872318267822, 3.7392585277557373, 3.9951298236846924, 4.251001358032227, 4.506872653961182, 4.762743949890137, 5.018615245819092, 5.274486541748047, 5.530357837677002, 5.786229133605957, 6.04210090637207, 6.297972202301025, 6.5538434982299805, 6.8097147941589355]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 8.0, 8.0, 12.0, 14.0, 20.0, 36.0, 42.0, 56.0, 78.0, 103.0, 160.0, 219.0, 304.0, 532.0, 785.0, 1234.0, 1985.0, 3156.0, 5143.0, 8544.0, 14507.0, 25415.0, 47169.0, 94114.0, 216844.0, 551145.0, 1181798.0, 1133725.0, 513823.0, 200304.0, 88159.0, 44227.0, 24311.0, 14138.0, 8316.0, 5172.0, 3143.0, 1985.0, 1262.0, 808.0, 513.0, 294.0, 224.0, 153.0, 103.0, 77.0, 40.0, 29.0, 21.0, 10.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-18.359375, -17.834228515625, -17.30908203125, -16.783935546875, -16.2587890625, -15.733642578125, -15.20849609375, -14.683349609375, -14.158203125, -13.633056640625, -13.10791015625, -12.582763671875, -12.0576171875, -11.532470703125, -11.00732421875, -10.482177734375, -9.95703125, -9.431884765625, -8.90673828125, -8.381591796875, -7.8564453125, -7.331298828125, -6.80615234375, -6.281005859375, -5.755859375, -5.230712890625, -4.70556640625, -4.180419921875, -3.6552734375, -3.130126953125, -2.60498046875, -2.079833984375, -1.5546875, -1.029541015625, -0.50439453125, 0.020751953125, 0.5458984375, 1.071044921875, 1.59619140625, 2.121337890625, 2.646484375, 3.171630859375, 3.69677734375, 4.221923828125, 4.7470703125, 5.272216796875, 5.79736328125, 6.322509765625, 6.84765625, 7.372802734375, 7.89794921875, 8.423095703125, 8.9482421875, 9.473388671875, 9.99853515625, 10.523681640625, 11.048828125, 11.573974609375, 12.09912109375, 12.624267578125, 13.1494140625, 13.674560546875, 14.19970703125, 14.724853515625, 15.25]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 5.0, 10.0, 15.0, 15.0, 12.0, 18.0, 15.0, 13.0, 17.0, 29.0, 37.0, 26.0, 32.0, 49.0, 31.0, 33.0, 37.0, 45.0, 61.0, 38.0, 46.0, 45.0, 41.0, 35.0, 27.0, 35.0, 32.0, 19.0, 25.0, 18.0, 21.0, 16.0, 26.0, 16.0, 14.0, 10.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.65234375, -7.419677734375, -7.18701171875, -6.954345703125, -6.7216796875, -6.489013671875, -6.25634765625, -6.023681640625, -5.791015625, -5.558349609375, -5.32568359375, -5.093017578125, -4.8603515625, -4.627685546875, -4.39501953125, -4.162353515625, -3.9296875, -3.697021484375, -3.46435546875, -3.231689453125, -2.9990234375, -2.766357421875, -2.53369140625, -2.301025390625, -2.068359375, -1.835693359375, -1.60302734375, -1.370361328125, -1.1376953125, -0.905029296875, -0.67236328125, -0.439697265625, -0.20703125, 0.025634765625, 0.25830078125, 0.490966796875, 0.7236328125, 0.956298828125, 1.18896484375, 1.421630859375, 1.654296875, 1.886962890625, 2.11962890625, 2.352294921875, 2.5849609375, 2.817626953125, 3.05029296875, 3.282958984375, 3.515625, 3.748291015625, 3.98095703125, 4.213623046875, 4.4462890625, 4.678955078125, 4.91162109375, 5.144287109375, 5.376953125, 5.609619140625, 5.84228515625, 6.074951171875, 6.3076171875, 6.540283203125, 6.77294921875, 7.005615234375, 7.23828125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 6.0, 3.0, 9.0, 10.0, 14.0, 20.0, 26.0, 51.0, 80.0, 128.0, 215.0, 306.0, 505.0, 793.0, 1358.0, 2275.0, 3757.0, 6677.0, 11790.0, 22556.0, 44100.0, 93383.0, 214359.0, 543641.0, 1270206.0, 1155821.0, 467473.0, 186766.0, 82719.0, 39374.0, 20180.0, 10800.0, 6163.0, 3468.0, 1944.0, 1233.0, 742.0, 462.0, 274.0, 179.0, 136.0, 91.0, 63.0, 42.0, 28.0, 19.0, 16.0, 7.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-25.390625, -24.619384765625, -23.84814453125, -23.076904296875, -22.3056640625, -21.534423828125, -20.76318359375, -19.991943359375, -19.220703125, -18.449462890625, -17.67822265625, -16.906982421875, -16.1357421875, -15.364501953125, -14.59326171875, -13.822021484375, -13.05078125, -12.279541015625, -11.50830078125, -10.737060546875, -9.9658203125, -9.194580078125, -8.42333984375, -7.652099609375, -6.880859375, -6.109619140625, -5.33837890625, -4.567138671875, -3.7958984375, -3.024658203125, -2.25341796875, -1.482177734375, -0.7109375, 0.060302734375, 0.83154296875, 1.602783203125, 2.3740234375, 3.145263671875, 3.91650390625, 4.687744140625, 5.458984375, 6.230224609375, 7.00146484375, 7.772705078125, 8.5439453125, 9.315185546875, 10.08642578125, 10.857666015625, 11.62890625, 12.400146484375, 13.17138671875, 13.942626953125, 14.7138671875, 15.485107421875, 16.25634765625, 17.027587890625, 17.798828125, 18.570068359375, 19.34130859375, 20.112548828125, 20.8837890625, 21.655029296875, 22.42626953125, 23.197509765625, 23.96875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 5.0, 8.0, 12.0, 14.0, 3.0, 12.0, 10.0, 22.0, 23.0, 35.0, 28.0, 45.0, 68.0, 74.0, 93.0, 111.0, 132.0, 172.0, 205.0, 217.0, 256.0, 263.0, 292.0, 264.0, 247.0, 250.0, 215.0, 176.0, 155.0, 138.0, 128.0, 73.0, 76.0, 65.0, 45.0, 36.0, 30.0, 16.0, 18.0, 10.0, 7.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.10845947265625, -4.9473876953125, -4.78631591796875, -4.625244140625, -4.46417236328125, -4.3031005859375, -4.14202880859375, -3.98095703125, -3.81988525390625, -3.6588134765625, -3.49774169921875, -3.336669921875, -3.17559814453125, -3.0145263671875, -2.85345458984375, -2.6923828125, -2.53131103515625, -2.3702392578125, -2.20916748046875, -2.048095703125, -1.88702392578125, -1.7259521484375, -1.56488037109375, -1.40380859375, -1.24273681640625, -1.0816650390625, -0.92059326171875, -0.759521484375, -0.59844970703125, -0.4373779296875, -0.27630615234375, -0.115234375, 0.04583740234375, 0.2069091796875, 0.36798095703125, 0.529052734375, 0.69012451171875, 0.8511962890625, 1.01226806640625, 1.17333984375, 1.33441162109375, 1.4954833984375, 1.65655517578125, 1.817626953125, 1.97869873046875, 2.1397705078125, 2.30084228515625, 2.4619140625, 2.62298583984375, 2.7840576171875, 2.94512939453125, 3.106201171875, 3.26727294921875, 3.4283447265625, 3.58941650390625, 3.75048828125, 3.91156005859375, 4.0726318359375, 4.23370361328125, 4.394775390625, 4.55584716796875, 4.7169189453125, 4.87799072265625, 5.0390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 13.0, 9.0, 9.0, 19.0, 18.0, 27.0, 32.0, 28.0, 26.0, 48.0, 51.0, 51.0, 66.0, 82.0, 63.0, 60.0, 59.0, 49.0, 51.0, 43.0, 33.0, 29.0, 24.0, 20.0, 16.0, 11.0, 8.0, 7.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-20.241504669189453, -19.626298904418945, -19.011093139648438, -18.395885467529297, -17.78067970275879, -17.16547393798828, -16.550268173217773, -15.935062408447266, -15.319856643676758, -14.70465087890625, -14.089444160461426, -13.474238395690918, -12.85903263092041, -12.243825912475586, -11.628620147705078, -11.01341438293457, -10.398207664489746, -9.783001899719238, -9.167795181274414, -8.552589416503906, -7.937383651733398, -7.322177410125732, -6.706971168518066, -6.091765403747559, -5.476559162139893, -4.861352920532227, -4.246147155761719, -3.6309409141540527, -3.015734910964966, -2.400528907775879, -1.785322666168213, -1.170116901397705, -0.5549106597900391, 0.06029540300369263, 0.6755014657974243, 1.2907075881958008, 1.9059135913848877, 2.5211195945739746, 3.1363258361816406, 3.7515316009521484, 4.3667378425598145, 4.9819440841674805, 5.597149848937988, 6.212356090545654, 6.82756233215332, 7.442768096923828, 8.057973861694336, 8.673179626464844, 9.288386344909668, 9.903592109680176, 10.518798828125, 11.134004592895508, 11.749210357666016, 12.364416122436523, 12.979622840881348, 13.594828605651855, 14.21003532409668, 14.825241088867188, 15.440447807312012, 16.055652618408203, 16.670860290527344, 17.28606605529785, 17.90127182006836, 18.516477584838867, 19.131683349609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 8.0, 11.0, 11.0, 7.0, 14.0, 16.0, 17.0, 27.0, 18.0, 26.0, 39.0, 40.0, 44.0, 44.0, 44.0, 33.0, 44.0, 39.0, 48.0, 41.0, 51.0, 41.0, 39.0, 44.0, 35.0, 30.0, 22.0, 30.0, 12.0, 20.0, 17.0, 18.0, 9.0, 11.0, 11.0, 9.0, 9.0, 9.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.59255313873291, -11.275200843811035, -10.95784854888916, -10.640496253967285, -10.32314395904541, -10.005791664123535, -9.68843936920166, -9.371086120605469, -9.053733825683594, -8.736381530761719, -8.419029235839844, -8.101676940917969, -7.784324645996094, -7.466972351074219, -7.1496195793151855, -6.8322672843933105, -6.514915466308594, -6.197563171386719, -5.880210876464844, -5.562858581542969, -5.245506286621094, -4.928153991699219, -4.6108012199401855, -4.2934489250183105, -3.9760966300964355, -3.6587443351745605, -3.3413920402526855, -3.0240395069122314, -2.7066872119903564, -2.3893349170684814, -2.0719823837280273, -1.7546300888061523, -1.4372777938842773, -1.1199254989624023, -0.8025730848312378, -0.485220730304718, -0.16786837577819824, 0.14948391914367676, 0.4668363332748413, 0.7841887474060059, 1.1015410423278809, 1.4188933372497559, 1.7362457513809204, 2.053598165512085, 2.37095046043396, 2.688302755355835, 3.005655288696289, 3.323007583618164, 3.640359878540039, 3.957712173461914, 4.275064468383789, 4.592416763305664, 4.909769058227539, 5.227121353149414, 5.544474124908447, 5.861826419830322, 6.179178714752197, 6.496531009674072, 6.813883304595947, 7.131235599517822, 7.4485883712768555, 7.7659406661987305, 8.083292961120605, 8.40064525604248, 8.717997550964355]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 14.0, 16.0, 17.0, 30.0, 57.0, 62.0, 126.0, 227.0, 346.0, 526.0, 839.0, 1317.0, 2145.0, 3342.0, 5547.0, 9150.0, 15381.0, 26133.0, 44264.0, 73417.0, 118131.0, 167633.0, 184893.0, 148584.0, 98102.0, 59713.0, 35274.0, 21039.0, 12743.0, 7445.0, 4528.0, 2805.0, 1745.0, 1072.0, 667.0, 420.0, 288.0, 193.0, 122.0, 65.0, 49.0, 27.0, 31.0, 11.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.88671875, -7.63470458984375, -7.3826904296875, -7.13067626953125, -6.878662109375, -6.62664794921875, -6.3746337890625, -6.12261962890625, -5.87060546875, -5.61859130859375, -5.3665771484375, -5.11456298828125, -4.862548828125, -4.61053466796875, -4.3585205078125, -4.10650634765625, -3.8544921875, -3.60247802734375, -3.3504638671875, -3.09844970703125, -2.846435546875, -2.59442138671875, -2.3424072265625, -2.09039306640625, -1.83837890625, -1.58636474609375, -1.3343505859375, -1.08233642578125, -0.830322265625, -0.57830810546875, -0.3262939453125, -0.07427978515625, 0.177734375, 0.42974853515625, 0.6817626953125, 0.93377685546875, 1.185791015625, 1.43780517578125, 1.6898193359375, 1.94183349609375, 2.19384765625, 2.44586181640625, 2.6978759765625, 2.94989013671875, 3.201904296875, 3.45391845703125, 3.7059326171875, 3.95794677734375, 4.2099609375, 4.46197509765625, 4.7139892578125, 4.96600341796875, 5.218017578125, 5.47003173828125, 5.7220458984375, 5.97406005859375, 6.22607421875, 6.47808837890625, 6.7301025390625, 6.98211669921875, 7.234130859375, 7.48614501953125, 7.7381591796875, 7.99017333984375, 8.2421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 4.0, 1.0, 2.0, 6.0, 8.0, 8.0, 11.0, 15.0, 10.0, 17.0, 15.0, 19.0, 27.0, 20.0, 41.0, 46.0, 41.0, 42.0, 41.0, 42.0, 34.0, 44.0, 37.0, 47.0, 41.0, 41.0, 45.0, 44.0, 38.0, 30.0, 26.0, 26.0, 26.0, 21.0, 11.0, 15.0, 17.0, 16.0, 7.0, 9.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.2578125, -11.8857421875, -11.513671875, -11.1416015625, -10.76953125, -10.3974609375, -10.025390625, -9.6533203125, -9.28125, -8.9091796875, -8.537109375, -8.1650390625, -7.79296875, -7.4208984375, -7.048828125, -6.6767578125, -6.3046875, -5.9326171875, -5.560546875, -5.1884765625, -4.81640625, -4.4443359375, -4.072265625, -3.7001953125, -3.328125, -2.9560546875, -2.583984375, -2.2119140625, -1.83984375, -1.4677734375, -1.095703125, -0.7236328125, -0.3515625, 0.0205078125, 0.392578125, 0.7646484375, 1.13671875, 1.5087890625, 1.880859375, 2.2529296875, 2.625, 2.9970703125, 3.369140625, 3.7412109375, 4.11328125, 4.4853515625, 4.857421875, 5.2294921875, 5.6015625, 5.9736328125, 6.345703125, 6.7177734375, 7.08984375, 7.4619140625, 7.833984375, 8.2060546875, 8.578125, 8.9501953125, 9.322265625, 9.6943359375, 10.06640625, 10.4384765625, 10.810546875, 11.1826171875, 11.5546875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 22.0, 17.0, 39.0, 45.0, 53.0, 98.0, 118.0, 204.0, 250.0, 420.0, 593.0, 892.0, 1432.0, 2241.0, 3555.0, 5867.0, 10082.0, 17960.0, 32683.0, 62385.0, 118457.0, 210496.0, 244593.0, 155528.0, 82444.0, 42791.0, 23024.0, 12705.0, 7499.0, 4394.0, 2685.0, 1716.0, 1092.0, 715.0, 450.0, 315.0, 228.0, 148.0, 98.0, 72.0, 43.0, 33.0, 22.0, 15.0, 12.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0], "bins": [-13.78125, -13.389892578125, -12.99853515625, -12.607177734375, -12.2158203125, -11.824462890625, -11.43310546875, -11.041748046875, -10.650390625, -10.259033203125, -9.86767578125, -9.476318359375, -9.0849609375, -8.693603515625, -8.30224609375, -7.910888671875, -7.51953125, -7.128173828125, -6.73681640625, -6.345458984375, -5.9541015625, -5.562744140625, -5.17138671875, -4.780029296875, -4.388671875, -3.997314453125, -3.60595703125, -3.214599609375, -2.8232421875, -2.431884765625, -2.04052734375, -1.649169921875, -1.2578125, -0.866455078125, -0.47509765625, -0.083740234375, 0.3076171875, 0.698974609375, 1.09033203125, 1.481689453125, 1.873046875, 2.264404296875, 2.65576171875, 3.047119140625, 3.4384765625, 3.829833984375, 4.22119140625, 4.612548828125, 5.00390625, 5.395263671875, 5.78662109375, 6.177978515625, 6.5693359375, 6.960693359375, 7.35205078125, 7.743408203125, 8.134765625, 8.526123046875, 8.91748046875, 9.308837890625, 9.7001953125, 10.091552734375, 10.48291015625, 10.874267578125, 11.265625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 5.0, 7.0, 12.0, 10.0, 17.0, 12.0, 13.0, 11.0, 19.0, 18.0, 27.0, 29.0, 38.0, 27.0, 31.0, 34.0, 41.0, 38.0, 41.0, 42.0, 39.0, 43.0, 38.0, 48.0, 43.0, 35.0, 37.0, 38.0, 25.0, 21.0, 17.0, 25.0, 17.0, 21.0, 10.0, 14.0, 9.0, 7.0, 5.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.484375, -6.27813720703125, -6.0718994140625, -5.86566162109375, -5.659423828125, -5.45318603515625, -5.2469482421875, -5.04071044921875, -4.83447265625, -4.62823486328125, -4.4219970703125, -4.21575927734375, -4.009521484375, -3.80328369140625, -3.5970458984375, -3.39080810546875, -3.1845703125, -2.97833251953125, -2.7720947265625, -2.56585693359375, -2.359619140625, -2.15338134765625, -1.9471435546875, -1.74090576171875, -1.53466796875, -1.32843017578125, -1.1221923828125, -0.91595458984375, -0.709716796875, -0.50347900390625, -0.2972412109375, -0.09100341796875, 0.115234375, 0.32147216796875, 0.5277099609375, 0.73394775390625, 0.940185546875, 1.14642333984375, 1.3526611328125, 1.55889892578125, 1.76513671875, 1.97137451171875, 2.1776123046875, 2.38385009765625, 2.590087890625, 2.79632568359375, 3.0025634765625, 3.20880126953125, 3.4150390625, 3.62127685546875, 3.8275146484375, 4.03375244140625, 4.239990234375, 4.44622802734375, 4.6524658203125, 4.85870361328125, 5.06494140625, 5.27117919921875, 5.4774169921875, 5.68365478515625, 5.889892578125, 6.09613037109375, 6.3023681640625, 6.50860595703125, 6.71484375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 11.0, 7.0, 22.0, 50.0, 69.0, 75.0, 161.0, 267.0, 434.0, 878.0, 1527.0, 2742.0, 5206.0, 10013.0, 20684.0, 44233.0, 99072.0, 222108.0, 313572.0, 178331.0, 78450.0, 35851.0, 16850.0, 8274.0, 4359.0, 2372.0, 1222.0, 687.0, 430.0, 251.0, 133.0, 78.0, 48.0, 28.0, 22.0, 15.0, 6.0, 6.0, 5.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.328125, -8.04443359375, -7.7607421875, -7.47705078125, -7.193359375, -6.90966796875, -6.6259765625, -6.34228515625, -6.05859375, -5.77490234375, -5.4912109375, -5.20751953125, -4.923828125, -4.64013671875, -4.3564453125, -4.07275390625, -3.7890625, -3.50537109375, -3.2216796875, -2.93798828125, -2.654296875, -2.37060546875, -2.0869140625, -1.80322265625, -1.51953125, -1.23583984375, -0.9521484375, -0.66845703125, -0.384765625, -0.10107421875, 0.1826171875, 0.46630859375, 0.75, 1.03369140625, 1.3173828125, 1.60107421875, 1.884765625, 2.16845703125, 2.4521484375, 2.73583984375, 3.01953125, 3.30322265625, 3.5869140625, 3.87060546875, 4.154296875, 4.43798828125, 4.7216796875, 5.00537109375, 5.2890625, 5.57275390625, 5.8564453125, 6.14013671875, 6.423828125, 6.70751953125, 6.9912109375, 7.27490234375, 7.55859375, 7.84228515625, 8.1259765625, 8.40966796875, 8.693359375, 8.97705078125, 9.2607421875, 9.54443359375, 9.828125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 10.0, 4.0, 10.0, 14.0, 12.0, 12.0, 14.0, 23.0, 32.0, 26.0, 32.0, 33.0, 45.0, 51.0, 46.0, 74.0, 56.0, 70.0, 64.0, 64.0, 47.0, 37.0, 46.0, 29.0, 27.0, 30.0, 20.0, 17.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002321004867553711, -0.00022402219474315643, -0.00021594390273094177, -0.0002078656107187271, -0.00019978731870651245, -0.0001917090266942978, -0.00018363073468208313, -0.00017555244266986847, -0.0001674741506576538, -0.00015939585864543915, -0.0001513175666332245, -0.00014323927462100983, -0.00013516098260879517, -0.0001270826905965805, -0.00011900439858436584, -0.00011092610657215118, -0.00010284781455993652, -9.476952254772186e-05, -8.66912305355072e-05, -7.861293852329254e-05, -7.053464651107788e-05, -6.245635449886322e-05, -5.437806248664856e-05, -4.62997704744339e-05, -3.822147846221924e-05, -3.0143186450004578e-05, -2.2064894437789917e-05, -1.3986602425575256e-05, -5.908310413360596e-06, 2.169981598854065e-06, 1.0248273611068726e-05, 1.8326565623283386e-05, 2.6404857635498047e-05, 3.448314964771271e-05, 4.256144165992737e-05, 5.063973367214203e-05, 5.871802568435669e-05, 6.679631769657135e-05, 7.487460970878601e-05, 8.295290172100067e-05, 9.103119373321533e-05, 9.910948574542999e-05, 0.00010718777775764465, 0.00011526606976985931, 0.00012334436178207397, 0.00013142265379428864, 0.0001395009458065033, 0.00014757923781871796, 0.00015565752983093262, 0.00016373582184314728, 0.00017181411385536194, 0.0001798924058675766, 0.00018797069787979126, 0.00019604898989200592, 0.00020412728190422058, 0.00021220557391643524, 0.0002202838659286499, 0.00022836215794086456, 0.00023644044995307922, 0.0002445187419652939, 0.00025259703397750854, 0.0002606753259897232, 0.00026875361800193787, 0.0002768319100141525, 0.0002849102020263672]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 12.0, 6.0, 20.0, 21.0, 22.0, 37.0, 61.0, 73.0, 120.0, 147.0, 189.0, 287.0, 421.0, 571.0, 790.0, 1254.0, 1771.0, 2597.0, 3986.0, 6299.0, 10032.0, 16211.0, 27030.0, 44712.0, 73456.0, 114021.0, 158309.0, 174443.0, 146089.0, 100924.0, 63429.0, 38519.0, 23188.0, 14210.0, 8689.0, 5575.0, 3533.0, 2301.0, 1564.0, 1093.0, 771.0, 501.0, 383.0, 239.0, 207.0, 127.0, 91.0, 74.0, 45.0, 32.0, 29.0, 13.0, 15.0, 12.0, 1.0, 4.0, 2.0, 4.0, 2.0], "bins": [-6.27734375, -6.08331298828125, -5.8892822265625, -5.69525146484375, -5.501220703125, -5.30718994140625, -5.1131591796875, -4.91912841796875, -4.72509765625, -4.53106689453125, -4.3370361328125, -4.14300537109375, -3.948974609375, -3.75494384765625, -3.5609130859375, -3.36688232421875, -3.1728515625, -2.97882080078125, -2.7847900390625, -2.59075927734375, -2.396728515625, -2.20269775390625, -2.0086669921875, -1.81463623046875, -1.62060546875, -1.42657470703125, -1.2325439453125, -1.03851318359375, -0.844482421875, -0.65045166015625, -0.4564208984375, -0.26239013671875, -0.068359375, 0.12567138671875, 0.3197021484375, 0.51373291015625, 0.707763671875, 0.90179443359375, 1.0958251953125, 1.28985595703125, 1.48388671875, 1.67791748046875, 1.8719482421875, 2.06597900390625, 2.260009765625, 2.45404052734375, 2.6480712890625, 2.84210205078125, 3.0361328125, 3.23016357421875, 3.4241943359375, 3.61822509765625, 3.812255859375, 4.00628662109375, 4.2003173828125, 4.39434814453125, 4.58837890625, 4.78240966796875, 4.9764404296875, 5.17047119140625, 5.364501953125, 5.55853271484375, 5.7525634765625, 5.94659423828125, 6.140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 4.0, 3.0, 10.0, 11.0, 13.0, 14.0, 20.0, 28.0, 24.0, 19.0, 41.0, 47.0, 43.0, 50.0, 43.0, 58.0, 55.0, 44.0, 54.0, 49.0, 46.0, 40.0, 44.0, 43.0, 33.0, 28.0, 28.0, 18.0, 14.0, 20.0, 11.0, 11.0, 5.0, 4.0, 2.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5888671875, -1.5374603271484375, -1.486053466796875, -1.4346466064453125, -1.38323974609375, -1.3318328857421875, -1.280426025390625, -1.2290191650390625, -1.1776123046875, -1.1262054443359375, -1.074798583984375, -1.0233917236328125, -0.97198486328125, -0.9205780029296875, -0.869171142578125, -0.8177642822265625, -0.766357421875, -0.7149505615234375, -0.663543701171875, -0.6121368408203125, -0.56072998046875, -0.5093231201171875, -0.457916259765625, -0.4065093994140625, -0.3551025390625, -0.3036956787109375, -0.252288818359375, -0.2008819580078125, -0.14947509765625, -0.0980682373046875, -0.046661376953125, 0.0047454833984375, 0.05615234375, 0.1075592041015625, 0.158966064453125, 0.2103729248046875, 0.26177978515625, 0.3131866455078125, 0.364593505859375, 0.4160003662109375, 0.4674072265625, 0.5188140869140625, 0.570220947265625, 0.6216278076171875, 0.67303466796875, 0.7244415283203125, 0.775848388671875, 0.8272552490234375, 0.878662109375, 0.9300689697265625, 0.981475830078125, 1.0328826904296875, 1.08428955078125, 1.1356964111328125, 1.187103271484375, 1.2385101318359375, 1.2899169921875, 1.3413238525390625, 1.392730712890625, 1.4441375732421875, 1.49554443359375, 1.5469512939453125, 1.598358154296875, 1.6497650146484375, 1.701171875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 7.0, 6.0, 5.0, 9.0, 4.0, 12.0, 16.0, 18.0, 16.0, 38.0, 34.0, 22.0, 40.0, 47.0, 49.0, 53.0, 70.0, 70.0, 73.0, 60.0, 57.0, 51.0, 43.0, 37.0, 33.0, 28.0, 19.0, 25.0, 8.0, 10.0, 9.0, 10.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.470176696777344, -18.85137176513672, -18.232566833496094, -17.6137638092041, -16.994958877563477, -16.37615394592285, -15.757349967956543, -15.138545989990234, -14.51974105834961, -13.900936126708984, -13.282132148742676, -12.663328170776367, -12.044523239135742, -11.425718307495117, -10.806914329528809, -10.1881103515625, -9.569305419921875, -8.95050048828125, -8.331696510314941, -7.712892055511475, -7.094087600708008, -6.475283145904541, -5.856478691101074, -5.237674236297607, -4.618869781494141, -4.000065326690674, -3.381260871887207, -2.7624564170837402, -2.1436519622802734, -1.5248475074768066, -0.9060430526733398, -0.28723859786987305, 0.33156585693359375, 0.9503703117370605, 1.5691747665405273, 2.187979221343994, 2.806783676147461, 3.4255881309509277, 4.0443925857543945, 4.663197040557861, 5.282001495361328, 5.900805950164795, 6.519610404968262, 7.1384148597717285, 7.757219314575195, 8.37602424621582, 8.994828224182129, 9.613632202148438, 10.232437133789062, 10.851242065429688, 11.470046043395996, 12.088850021362305, 12.70765495300293, 13.326459884643555, 13.945263862609863, 14.564067840576172, 15.182872772216797, 15.801677703857422, 16.420482635498047, 17.03928565979004, 17.658090591430664, 18.27689552307129, 18.89569854736328, 19.514503479003906, 20.13330841064453]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 7.0, 10.0, 9.0, 14.0, 14.0, 20.0, 17.0, 18.0, 27.0, 34.0, 39.0, 34.0, 52.0, 41.0, 40.0, 44.0, 43.0, 41.0, 53.0, 37.0, 45.0, 45.0, 41.0, 37.0, 30.0, 26.0, 24.0, 24.0, 20.0, 17.0, 17.0, 12.0, 10.0, 12.0, 4.0, 14.0, 10.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.650531768798828, -11.330387115478516, -11.01024341583252, -10.690098762512207, -10.369955062866211, -10.049810409545898, -9.729666709899902, -9.40952205657959, -9.089378356933594, -8.769233703613281, -8.449090003967285, -8.128945350646973, -7.808801651000977, -7.488656997680664, -7.16851282119751, -6.8483686447143555, -6.528223991394043, -6.208079814910889, -5.887935638427734, -5.56779146194458, -5.247647285461426, -4.927502632141113, -4.607358455657959, -4.287214279174805, -3.9670701026916504, -3.646925926208496, -3.326781749725342, -3.0066373348236084, -2.686493158340454, -2.3663489818573, -2.0462045669555664, -1.726060390472412, -1.4059162139892578, -1.0857720375061035, -0.7656277418136597, -0.4454835057258606, -0.12533926963806152, 0.19480490684509277, 0.5149492025375366, 0.8350934982299805, 1.1552376747131348, 1.475381851196289, 1.795526146888733, 2.1156704425811768, 2.435814619064331, 2.7559587955474854, 3.0761032104492188, 3.396247386932373, 3.7163915634155273, 4.036535739898682, 4.356679916381836, 4.67682409286499, 4.9969682693481445, 5.317112922668457, 5.637257099151611, 5.957401275634766, 6.27754545211792, 6.597689628601074, 6.9178338050842285, 7.237977981567383, 7.558122634887695, 7.878266334533691, 8.198410987854004, 8.5185546875, 8.838699340820312]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 13.0, 13.0, 19.0, 29.0, 48.0, 56.0, 103.0, 128.0, 174.0, 253.0, 468.0, 741.0, 1172.0, 2057.0, 3601.0, 6878.0, 12836.0, 25296.0, 48083.0, 88966.0, 150710.0, 204652.0, 197436.0, 137256.0, 78317.0, 42070.0, 21959.0, 11232.0, 5845.0, 3260.0, 1862.0, 1082.0, 657.0, 408.0, 308.0, 174.0, 104.0, 87.0, 56.0, 43.0, 34.0, 31.0, 14.0, 10.0, 6.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.375, -12.0203857421875, -11.665771484375, -11.3111572265625, -10.95654296875, -10.6019287109375, -10.247314453125, -9.8927001953125, -9.5380859375, -9.1834716796875, -8.828857421875, -8.4742431640625, -8.11962890625, -7.7650146484375, -7.410400390625, -7.0557861328125, -6.701171875, -6.3465576171875, -5.991943359375, -5.6373291015625, -5.28271484375, -4.9281005859375, -4.573486328125, -4.2188720703125, -3.8642578125, -3.5096435546875, -3.155029296875, -2.8004150390625, -2.44580078125, -2.0911865234375, -1.736572265625, -1.3819580078125, -1.02734375, -0.6727294921875, -0.318115234375, 0.0364990234375, 0.39111328125, 0.7457275390625, 1.100341796875, 1.4549560546875, 1.8095703125, 2.1641845703125, 2.518798828125, 2.8734130859375, 3.22802734375, 3.5826416015625, 3.937255859375, 4.2918701171875, 4.646484375, 5.0010986328125, 5.355712890625, 5.7103271484375, 6.06494140625, 6.4195556640625, 6.774169921875, 7.1287841796875, 7.4833984375, 7.8380126953125, 8.192626953125, 8.5472412109375, 8.90185546875, 9.2564697265625, 9.611083984375, 9.9656982421875, 10.3203125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 5.0, 8.0, 4.0, 6.0, 6.0, 11.0, 10.0, 11.0, 15.0, 14.0, 14.0, 19.0, 32.0, 30.0, 25.0, 36.0, 51.0, 39.0, 43.0, 43.0, 53.0, 55.0, 42.0, 42.0, 43.0, 43.0, 36.0, 30.0, 32.0, 33.0, 28.0, 18.0, 19.0, 20.0, 12.0, 24.0, 9.0, 9.0, 11.0, 6.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.28125, -12.9163818359375, -12.551513671875, -12.1866455078125, -11.82177734375, -11.4569091796875, -11.092041015625, -10.7271728515625, -10.3623046875, -9.9974365234375, -9.632568359375, -9.2677001953125, -8.90283203125, -8.5379638671875, -8.173095703125, -7.8082275390625, -7.443359375, -7.0784912109375, -6.713623046875, -6.3487548828125, -5.98388671875, -5.6190185546875, -5.254150390625, -4.8892822265625, -4.5244140625, -4.1595458984375, -3.794677734375, -3.4298095703125, -3.06494140625, -2.7000732421875, -2.335205078125, -1.9703369140625, -1.60546875, -1.2406005859375, -0.875732421875, -0.5108642578125, -0.14599609375, 0.2188720703125, 0.583740234375, 0.9486083984375, 1.3134765625, 1.6783447265625, 2.043212890625, 2.4080810546875, 2.77294921875, 3.1378173828125, 3.502685546875, 3.8675537109375, 4.232421875, 4.5972900390625, 4.962158203125, 5.3270263671875, 5.69189453125, 6.0567626953125, 6.421630859375, 6.7864990234375, 7.1513671875, 7.5162353515625, 7.881103515625, 8.2459716796875, 8.61083984375, 8.9757080078125, 9.340576171875, 9.7054443359375, 10.0703125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 10.0, 25.0, 28.0, 30.0, 62.0, 67.0, 129.0, 193.0, 261.0, 381.0, 585.0, 901.0, 1476.0, 2244.0, 4048.0, 6862.0, 12175.0, 22179.0, 41852.0, 77759.0, 135479.0, 196176.0, 203594.0, 149212.0, 87230.0, 47491.0, 25054.0, 13851.0, 7558.0, 4286.0, 2596.0, 1702.0, 1016.0, 638.0, 448.0, 314.0, 194.0, 121.0, 99.0, 73.0, 42.0, 34.0, 19.0, 20.0, 10.0, 4.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.7421875, -13.3140869140625, -12.885986328125, -12.4578857421875, -12.02978515625, -11.6016845703125, -11.173583984375, -10.7454833984375, -10.3173828125, -9.8892822265625, -9.461181640625, -9.0330810546875, -8.60498046875, -8.1768798828125, -7.748779296875, -7.3206787109375, -6.892578125, -6.4644775390625, -6.036376953125, -5.6082763671875, -5.18017578125, -4.7520751953125, -4.323974609375, -3.8958740234375, -3.4677734375, -3.0396728515625, -2.611572265625, -2.1834716796875, -1.75537109375, -1.3272705078125, -0.899169921875, -0.4710693359375, -0.04296875, 0.3851318359375, 0.813232421875, 1.2413330078125, 1.66943359375, 2.0975341796875, 2.525634765625, 2.9537353515625, 3.3818359375, 3.8099365234375, 4.238037109375, 4.6661376953125, 5.09423828125, 5.5223388671875, 5.950439453125, 6.3785400390625, 6.806640625, 7.2347412109375, 7.662841796875, 8.0909423828125, 8.51904296875, 8.9471435546875, 9.375244140625, 9.8033447265625, 10.2314453125, 10.6595458984375, 11.087646484375, 11.5157470703125, 11.94384765625, 12.3719482421875, 12.800048828125, 13.2281494140625, 13.65625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 5.0, 5.0, 5.0, 5.0, 9.0, 9.0, 8.0, 13.0, 8.0, 15.0, 15.0, 17.0, 10.0, 26.0, 26.0, 29.0, 29.0, 25.0, 32.0, 39.0, 29.0, 38.0, 36.0, 36.0, 41.0, 34.0, 27.0, 35.0, 39.0, 31.0, 32.0, 39.0, 36.0, 36.0, 30.0, 17.0, 20.0, 19.0, 13.0, 12.0, 10.0, 13.0, 7.0, 7.0, 8.0, 8.0, 7.0, 8.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-6.01953125, -5.82232666015625, -5.6251220703125, -5.42791748046875, -5.230712890625, -5.03350830078125, -4.8363037109375, -4.63909912109375, -4.44189453125, -4.24468994140625, -4.0474853515625, -3.85028076171875, -3.653076171875, -3.45587158203125, -3.2586669921875, -3.06146240234375, -2.8642578125, -2.66705322265625, -2.4698486328125, -2.27264404296875, -2.075439453125, -1.87823486328125, -1.6810302734375, -1.48382568359375, -1.28662109375, -1.08941650390625, -0.8922119140625, -0.69500732421875, -0.497802734375, -0.30059814453125, -0.1033935546875, 0.09381103515625, 0.291015625, 0.48822021484375, 0.6854248046875, 0.88262939453125, 1.079833984375, 1.27703857421875, 1.4742431640625, 1.67144775390625, 1.86865234375, 2.06585693359375, 2.2630615234375, 2.46026611328125, 2.657470703125, 2.85467529296875, 3.0518798828125, 3.24908447265625, 3.4462890625, 3.64349365234375, 3.8406982421875, 4.03790283203125, 4.235107421875, 4.43231201171875, 4.6295166015625, 4.82672119140625, 5.02392578125, 5.22113037109375, 5.4183349609375, 5.61553955078125, 5.812744140625, 6.00994873046875, 6.2071533203125, 6.40435791015625, 6.6015625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 3.0, 5.0, 12.0, 17.0, 28.0, 31.0, 63.0, 75.0, 108.0, 195.0, 345.0, 538.0, 911.0, 1595.0, 2808.0, 5993.0, 23303.0, 351878.0, 611217.0, 34473.0, 7508.0, 3142.0, 1636.0, 1018.0, 623.0, 358.0, 248.0, 141.0, 94.0, 65.0, 28.0, 26.0, 18.0, 17.0, 16.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-70.75, -68.89306640625, -67.0361328125, -65.17919921875, -63.322265625, -61.46533203125, -59.6083984375, -57.75146484375, -55.89453125, -54.03759765625, -52.1806640625, -50.32373046875, -48.466796875, -46.60986328125, -44.7529296875, -42.89599609375, -41.0390625, -39.18212890625, -37.3251953125, -35.46826171875, -33.611328125, -31.75439453125, -29.8974609375, -28.04052734375, -26.18359375, -24.32666015625, -22.4697265625, -20.61279296875, -18.755859375, -16.89892578125, -15.0419921875, -13.18505859375, -11.328125, -9.47119140625, -7.6142578125, -5.75732421875, -3.900390625, -2.04345703125, -0.1865234375, 1.67041015625, 3.52734375, 5.38427734375, 7.2412109375, 9.09814453125, 10.955078125, 12.81201171875, 14.6689453125, 16.52587890625, 18.3828125, 20.23974609375, 22.0966796875, 23.95361328125, 25.810546875, 27.66748046875, 29.5244140625, 31.38134765625, 33.23828125, 35.09521484375, 36.9521484375, 38.80908203125, 40.666015625, 42.52294921875, 44.3798828125, 46.23681640625, 48.09375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 10.0, 17.0, 35.0, 95.0, 193.0, 297.0, 194.0, 80.0, 40.0, 16.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002716064453125, -0.0025949478149414062, -0.0024738311767578125, -0.0023527145385742188, -0.002231597900390625, -0.0021104812622070312, -0.0019893646240234375, -0.0018682479858398438, -0.00174713134765625, -0.0016260147094726562, -0.0015048980712890625, -0.0013837814331054688, -0.001262664794921875, -0.0011415481567382812, -0.0010204315185546875, -0.0008993148803710938, -0.0007781982421875, -0.0006570816040039062, -0.0005359649658203125, -0.00041484832763671875, -0.000293731689453125, -0.00017261505126953125, -5.14984130859375e-05, 6.961822509765625e-05, 0.00019073486328125, 0.00031185150146484375, 0.0004329681396484375, 0.0005540847778320312, 0.000675201416015625, 0.0007963180541992188, 0.0009174346923828125, 0.0010385513305664062, 0.00115966796875, 0.0012807846069335938, 0.0014019012451171875, 0.0015230178833007812, 0.001644134521484375, 0.0017652511596679688, 0.0018863677978515625, 0.0020074844360351562, 0.00212860107421875, 0.0022497177124023438, 0.0023708343505859375, 0.0024919509887695312, 0.002613067626953125, 0.0027341842651367188, 0.0028553009033203125, 0.0029764175415039062, 0.0030975341796875, 0.0032186508178710938, 0.0033397674560546875, 0.0034608840942382812, 0.003582000732421875, 0.0037031173706054688, 0.0038242340087890625, 0.003945350646972656, 0.00406646728515625, 0.004187583923339844, 0.0043087005615234375, 0.004429817199707031, 0.004550933837890625, 0.004672050476074219, 0.0047931671142578125, 0.004914283752441406, 0.005035400390625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 4.0, 2.0, 7.0, 8.0, 10.0, 13.0, 8.0, 22.0, 27.0, 40.0, 55.0, 68.0, 75.0, 118.0, 146.0, 195.0, 247.0, 342.0, 455.0, 545.0, 720.0, 1003.0, 1332.0, 2021.0, 3235.0, 5794.0, 12521.0, 37406.0, 206977.0, 589976.0, 132010.0, 28243.0, 10266.0, 4867.0, 2833.0, 1870.0, 1223.0, 946.0, 688.0, 550.0, 409.0, 293.0, 226.0, 194.0, 131.0, 107.0, 84.0, 64.0, 57.0, 37.0, 22.0, 14.0, 16.0, 11.0, 8.0, 10.0, 4.0, 4.0, 2.0, 2.0, 3.0], "bins": [-34.09375, -33.041015625, -31.98828125, -30.935546875, -29.8828125, -28.830078125, -27.77734375, -26.724609375, -25.671875, -24.619140625, -23.56640625, -22.513671875, -21.4609375, -20.408203125, -19.35546875, -18.302734375, -17.25, -16.197265625, -15.14453125, -14.091796875, -13.0390625, -11.986328125, -10.93359375, -9.880859375, -8.828125, -7.775390625, -6.72265625, -5.669921875, -4.6171875, -3.564453125, -2.51171875, -1.458984375, -0.40625, 0.646484375, 1.69921875, 2.751953125, 3.8046875, 4.857421875, 5.91015625, 6.962890625, 8.015625, 9.068359375, 10.12109375, 11.173828125, 12.2265625, 13.279296875, 14.33203125, 15.384765625, 16.4375, 17.490234375, 18.54296875, 19.595703125, 20.6484375, 21.701171875, 22.75390625, 23.806640625, 24.859375, 25.912109375, 26.96484375, 28.017578125, 29.0703125, 30.123046875, 31.17578125, 32.228515625, 33.28125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 10.0, 4.0, 26.0, 27.0, 86.0, 153.0, 216.0, 224.0, 130.0, 52.0, 15.0, 14.0, 7.0, 6.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.5687255859375, -7.285888671875, -7.0030517578125, -6.72021484375, -6.4373779296875, -6.154541015625, -5.8717041015625, -5.5888671875, -5.3060302734375, -5.023193359375, -4.7403564453125, -4.45751953125, -4.1746826171875, -3.891845703125, -3.6090087890625, -3.326171875, -3.0433349609375, -2.760498046875, -2.4776611328125, -2.19482421875, -1.9119873046875, -1.629150390625, -1.3463134765625, -1.0634765625, -0.7806396484375, -0.497802734375, -0.2149658203125, 0.06787109375, 0.3507080078125, 0.633544921875, 0.9163818359375, 1.19921875, 1.4820556640625, 1.764892578125, 2.0477294921875, 2.33056640625, 2.6134033203125, 2.896240234375, 3.1790771484375, 3.4619140625, 3.7447509765625, 4.027587890625, 4.3104248046875, 4.59326171875, 4.8760986328125, 5.158935546875, 5.4417724609375, 5.724609375, 6.0074462890625, 6.290283203125, 6.5731201171875, 6.85595703125, 7.1387939453125, 7.421630859375, 7.7044677734375, 7.9873046875, 8.2701416015625, 8.552978515625, 8.8358154296875, 9.11865234375, 9.4014892578125, 9.684326171875, 9.9671630859375, 10.25]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 11.0, 10.0, 12.0, 11.0, 13.0, 22.0, 23.0, 29.0, 27.0, 33.0, 32.0, 54.0, 62.0, 55.0, 64.0, 58.0, 71.0, 44.0, 54.0, 37.0, 49.0, 34.0, 30.0, 25.0, 32.0, 17.0, 12.0, 12.0, 11.0, 7.0, 10.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.450876235961914, -18.82955551147461, -18.208234786987305, -17.5869140625, -16.965593338012695, -16.34427261352539, -15.722951889038086, -15.101631164550781, -14.480310440063477, -13.858989715576172, -13.237668991088867, -12.616348266601562, -11.995027542114258, -11.373706817626953, -10.752386093139648, -10.131065368652344, -9.509745597839355, -8.88842487335205, -8.267104148864746, -7.645783424377441, -7.024462699890137, -6.403141975402832, -5.7818217277526855, -5.160501003265381, -4.539180278778076, -3.9178595542907715, -3.296538829803467, -2.675218343734741, -2.0538976192474365, -1.4325768947601318, -0.8112564086914062, -0.18993568420410156, 0.4313850402832031, 1.0527057647705078, 1.674026370048523, 2.295346975326538, 2.9166676998138428, 3.5379884243011475, 4.159308910369873, 4.780629634857178, 5.401950359344482, 6.023271083831787, 6.644591808319092, 7.265912055969238, 7.887232780456543, 8.508553504943848, 9.129874229431152, 9.751194953918457, 10.372515678405762, 10.993836402893066, 11.615157127380371, 12.236477851867676, 12.85779857635498, 13.479119300842285, 14.100439071655273, 14.721759796142578, 15.343080520629883, 15.964401245117188, 16.585721969604492, 17.207042694091797, 17.8283634185791, 18.449684143066406, 19.07100486755371, 19.692325592041016, 20.31364631652832]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 3.0, 7.0, 4.0, 8.0, 15.0, 14.0, 15.0, 21.0, 24.0, 23.0, 25.0, 28.0, 30.0, 31.0, 46.0, 38.0, 47.0, 56.0, 43.0, 47.0, 51.0, 39.0, 40.0, 40.0, 38.0, 28.0, 27.0, 30.0, 31.0, 20.0, 15.0, 23.0, 16.0, 11.0, 16.0, 10.0, 6.0, 5.0, 6.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.02629566192627, -12.654746055603027, -12.283196449279785, -11.911645889282227, -11.540096282958984, -11.168546676635742, -10.7969970703125, -10.425447463989258, -10.053897857666016, -9.682348251342773, -9.310798645019531, -8.939249038696289, -8.56769847869873, -8.196148872375488, -7.824599266052246, -7.453049659729004, -7.081499099731445, -6.709949493408203, -6.338399410247803, -5.9668498039245605, -5.59529972076416, -5.223750114440918, -4.852200508117676, -4.480650901794434, -4.109100818634033, -3.737550973892212, -3.3660011291503906, -2.9944515228271484, -2.622901678085327, -2.251351833343506, -1.8798022270202637, -1.5082523822784424, -1.1367034912109375, -0.765153706073761, -0.3936039209365845, -0.022054195404052734, 0.34949564933776855, 0.7210454940795898, 1.092595100402832, 1.4641449451446533, 1.8356947898864746, 2.207244634628296, 2.578794479370117, 2.9503440856933594, 3.3218939304351807, 3.693443775177002, 4.064993381500244, 4.4365434646606445, 4.808093070983887, 5.179642677307129, 5.551192760467529, 5.9227423667907715, 6.294292449951172, 6.665842056274414, 7.037391662597656, 7.408941268920898, 7.780491352081299, 8.1520414352417, 8.523591041564941, 8.895140647888184, 9.266690254211426, 9.638240814208984, 10.009790420532227, 10.381340026855469, 10.752889633178711]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 10.0, 8.0, 9.0, 21.0, 24.0, 26.0, 36.0, 80.0, 95.0, 135.0, 211.0, 331.0, 536.0, 772.0, 1235.0, 2037.0, 3174.0, 5488.0, 9178.0, 15876.0, 27916.0, 52752.0, 108215.0, 257623.0, 681730.0, 1313093.0, 993303.0, 396094.0, 160655.0, 74826.0, 38319.0, 20841.0, 11929.0, 6906.0, 4102.0, 2469.0, 1558.0, 887.0, 613.0, 425.0, 270.0, 173.0, 98.0, 71.0, 43.0, 33.0, 17.0, 13.0, 11.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0], "bins": [-27.203125, -26.396484375, -25.58984375, -24.783203125, -23.9765625, -23.169921875, -22.36328125, -21.556640625, -20.75, -19.943359375, -19.13671875, -18.330078125, -17.5234375, -16.716796875, -15.91015625, -15.103515625, -14.296875, -13.490234375, -12.68359375, -11.876953125, -11.0703125, -10.263671875, -9.45703125, -8.650390625, -7.84375, -7.037109375, -6.23046875, -5.423828125, -4.6171875, -3.810546875, -3.00390625, -2.197265625, -1.390625, -0.583984375, 0.22265625, 1.029296875, 1.8359375, 2.642578125, 3.44921875, 4.255859375, 5.0625, 5.869140625, 6.67578125, 7.482421875, 8.2890625, 9.095703125, 9.90234375, 10.708984375, 11.515625, 12.322265625, 13.12890625, 13.935546875, 14.7421875, 15.548828125, 16.35546875, 17.162109375, 17.96875, 18.775390625, 19.58203125, 20.388671875, 21.1953125, 22.001953125, 22.80859375, 23.615234375, 24.421875]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 5.0, 14.0, 11.0, 12.0, 10.0, 17.0, 17.0, 27.0, 29.0, 21.0, 29.0, 38.0, 31.0, 41.0, 39.0, 45.0, 42.0, 57.0, 48.0, 45.0, 43.0, 43.0, 37.0, 38.0, 31.0, 28.0, 34.0, 22.0, 11.0, 26.0, 15.0, 19.0, 8.0, 12.0, 5.0, 8.0, 7.0, 5.0, 8.0, 3.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1796875, -12.800048828125, -12.42041015625, -12.040771484375, -11.6611328125, -11.281494140625, -10.90185546875, -10.522216796875, -10.142578125, -9.762939453125, -9.38330078125, -9.003662109375, -8.6240234375, -8.244384765625, -7.86474609375, -7.485107421875, -7.10546875, -6.725830078125, -6.34619140625, -5.966552734375, -5.5869140625, -5.207275390625, -4.82763671875, -4.447998046875, -4.068359375, -3.688720703125, -3.30908203125, -2.929443359375, -2.5498046875, -2.170166015625, -1.79052734375, -1.410888671875, -1.03125, -0.651611328125, -0.27197265625, 0.107666015625, 0.4873046875, 0.866943359375, 1.24658203125, 1.626220703125, 2.005859375, 2.385498046875, 2.76513671875, 3.144775390625, 3.5244140625, 3.904052734375, 4.28369140625, 4.663330078125, 5.04296875, 5.422607421875, 5.80224609375, 6.181884765625, 6.5615234375, 6.941162109375, 7.32080078125, 7.700439453125, 8.080078125, 8.459716796875, 8.83935546875, 9.218994140625, 9.5986328125, 9.978271484375, 10.35791015625, 10.737548828125, 11.1171875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 7.0, 2.0, 6.0, 11.0, 11.0, 17.0, 36.0, 34.0, 58.0, 84.0, 136.0, 176.0, 236.0, 410.0, 551.0, 868.0, 1266.0, 1882.0, 2961.0, 4711.0, 7242.0, 11778.0, 19245.0, 32410.0, 57609.0, 106099.0, 204501.0, 422066.0, 875165.0, 1135020.0, 652755.0, 308477.0, 153966.0, 81361.0, 45074.0, 25883.0, 15624.0, 9404.0, 5893.0, 3746.0, 2476.0, 1655.0, 1083.0, 773.0, 464.0, 339.0, 226.0, 145.0, 118.0, 78.0, 47.0, 34.0, 28.0, 20.0, 10.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.3125, -28.3447265625, -27.376953125, -26.4091796875, -25.44140625, -24.4736328125, -23.505859375, -22.5380859375, -21.5703125, -20.6025390625, -19.634765625, -18.6669921875, -17.69921875, -16.7314453125, -15.763671875, -14.7958984375, -13.828125, -12.8603515625, -11.892578125, -10.9248046875, -9.95703125, -8.9892578125, -8.021484375, -7.0537109375, -6.0859375, -5.1181640625, -4.150390625, -3.1826171875, -2.21484375, -1.2470703125, -0.279296875, 0.6884765625, 1.65625, 2.6240234375, 3.591796875, 4.5595703125, 5.52734375, 6.4951171875, 7.462890625, 8.4306640625, 9.3984375, 10.3662109375, 11.333984375, 12.3017578125, 13.26953125, 14.2373046875, 15.205078125, 16.1728515625, 17.140625, 18.1083984375, 19.076171875, 20.0439453125, 21.01171875, 21.9794921875, 22.947265625, 23.9150390625, 24.8828125, 25.8505859375, 26.818359375, 27.7861328125, 28.75390625, 29.7216796875, 30.689453125, 31.6572265625, 32.625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 13.0, 20.0, 15.0, 23.0, 29.0, 32.0, 53.0, 82.0, 107.0, 138.0, 169.0, 206.0, 251.0, 281.0, 338.0, 401.0, 346.0, 338.0, 256.0, 233.0, 182.0, 128.0, 103.0, 86.0, 65.0, 44.0, 33.0, 26.0, 16.0, 16.0, 13.0, 9.0, 6.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.1070556640625, -11.768798828125, -11.4305419921875, -11.09228515625, -10.7540283203125, -10.415771484375, -10.0775146484375, -9.7392578125, -9.4010009765625, -9.062744140625, -8.7244873046875, -8.38623046875, -8.0479736328125, -7.709716796875, -7.3714599609375, -7.033203125, -6.6949462890625, -6.356689453125, -6.0184326171875, -5.68017578125, -5.3419189453125, -5.003662109375, -4.6654052734375, -4.3271484375, -3.9888916015625, -3.650634765625, -3.3123779296875, -2.97412109375, -2.6358642578125, -2.297607421875, -1.9593505859375, -1.62109375, -1.2828369140625, -0.944580078125, -0.6063232421875, -0.26806640625, 0.0701904296875, 0.408447265625, 0.7467041015625, 1.0849609375, 1.4232177734375, 1.761474609375, 2.0997314453125, 2.43798828125, 2.7762451171875, 3.114501953125, 3.4527587890625, 3.791015625, 4.1292724609375, 4.467529296875, 4.8057861328125, 5.14404296875, 5.4822998046875, 5.820556640625, 6.1588134765625, 6.4970703125, 6.8353271484375, 7.173583984375, 7.5118408203125, 7.85009765625, 8.1883544921875, 8.526611328125, 8.8648681640625, 9.203125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 8.0, 6.0, 4.0, 9.0, 16.0, 25.0, 25.0, 19.0, 39.0, 48.0, 36.0, 53.0, 46.0, 53.0, 69.0, 70.0, 67.0, 65.0, 61.0, 58.0, 38.0, 38.0, 33.0, 22.0, 21.0, 17.0, 12.0, 7.0, 7.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.86573028564453, -32.743568420410156, -31.621408462524414, -30.499248504638672, -29.377086639404297, -28.254924774169922, -27.13276481628418, -26.010604858398438, -24.888442993164062, -23.766281127929688, -22.644121170043945, -21.521961212158203, -20.399799346923828, -19.277637481689453, -18.15547752380371, -17.03331756591797, -15.911155700683594, -14.788994789123535, -13.666833877563477, -12.544672966003418, -11.42251205444336, -10.3003511428833, -9.178190231323242, -8.056029319763184, -6.933868408203125, -5.811707496643066, -4.689546585083008, -3.567385673522949, -2.4452247619628906, -1.323063850402832, -0.20090293884277344, 0.9212579727172852, 2.0434226989746094, 3.165583610534668, 4.287744522094727, 5.409905433654785, 6.532066345214844, 7.654227256774902, 8.776388168334961, 9.89854907989502, 11.020709991455078, 12.142870903015137, 13.265031814575195, 14.387192726135254, 15.509353637695312, 16.631515502929688, 17.75367546081543, 18.875835418701172, 19.997997283935547, 21.120159149169922, 22.242319107055664, 23.364479064941406, 24.48664093017578, 25.608802795410156, 26.7309627532959, 27.85312271118164, 28.975284576416016, 30.09744644165039, 31.219606399536133, 32.341766357421875, 33.46392822265625, 34.586090087890625, 35.708251953125, 36.83041000366211, 37.952571868896484]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 11.0, 5.0, 9.0, 14.0, 19.0, 23.0, 14.0, 20.0, 30.0, 19.0, 25.0, 28.0, 38.0, 34.0, 51.0, 28.0, 39.0, 38.0, 40.0, 35.0, 43.0, 39.0, 40.0, 39.0, 41.0, 33.0, 25.0, 28.0, 29.0, 31.0, 17.0, 13.0, 12.0, 14.0, 12.0, 13.0, 8.0, 7.0, 4.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.0950870513916, -17.545516967773438, -16.995946884155273, -16.446378707885742, -15.896808624267578, -15.347238540649414, -14.79766845703125, -14.248098373413086, -13.698529243469238, -13.148959159851074, -12.599390029907227, -12.049819946289062, -11.500249862670898, -10.95068073272705, -10.401110649108887, -9.851541519165039, -9.301971435546875, -8.752401351928711, -8.202832221984863, -7.653262138366699, -7.103692531585693, -6.5541229248046875, -6.004552841186523, -5.454983234405518, -4.905413627624512, -4.355844020843506, -3.806274175643921, -3.256704330444336, -2.70713472366333, -2.157565116882324, -1.6079952716827393, -1.0584254264831543, -0.5088539123535156, 0.040715813636779785, 0.5902855396270752, 1.1398552656173706, 1.689424991607666, 2.238994598388672, 2.788564443588257, 3.338134288787842, 3.8877038955688477, 4.4372735023498535, 4.986843109130859, 5.536413192749023, 6.085982799530029, 6.635552406311035, 7.185122489929199, 7.734692096710205, 8.284261703491211, 8.833831787109375, 9.383400917053223, 9.932971000671387, 10.482540130615234, 11.032110214233398, 11.581680297851562, 12.131250381469727, 12.680819511413574, 13.230389595031738, 13.779958724975586, 14.32952880859375, 14.879098892211914, 15.428668022155762, 15.978238105773926, 16.527807235717773, 17.077377319335938]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 9.0, 19.0, 14.0, 37.0, 50.0, 71.0, 135.0, 220.0, 321.0, 557.0, 957.0, 1702.0, 2922.0, 5281.0, 9329.0, 17829.0, 34193.0, 66245.0, 124003.0, 202125.0, 228380.0, 161926.0, 91130.0, 47632.0, 24303.0, 13103.0, 6884.0, 3883.0, 2180.0, 1209.0, 683.0, 473.0, 277.0, 162.0, 121.0, 73.0, 38.0, 24.0, 13.0, 17.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-17.375, -16.8956298828125, -16.416259765625, -15.9368896484375, -15.45751953125, -14.9781494140625, -14.498779296875, -14.0194091796875, -13.5400390625, -13.0606689453125, -12.581298828125, -12.1019287109375, -11.62255859375, -11.1431884765625, -10.663818359375, -10.1844482421875, -9.705078125, -9.2257080078125, -8.746337890625, -8.2669677734375, -7.78759765625, -7.3082275390625, -6.828857421875, -6.3494873046875, -5.8701171875, -5.3907470703125, -4.911376953125, -4.4320068359375, -3.95263671875, -3.4732666015625, -2.993896484375, -2.5145263671875, -2.03515625, -1.5557861328125, -1.076416015625, -0.5970458984375, -0.11767578125, 0.3616943359375, 0.841064453125, 1.3204345703125, 1.7998046875, 2.2791748046875, 2.758544921875, 3.2379150390625, 3.71728515625, 4.1966552734375, 4.676025390625, 5.1553955078125, 5.634765625, 6.1141357421875, 6.593505859375, 7.0728759765625, 7.55224609375, 8.0316162109375, 8.510986328125, 8.9903564453125, 9.4697265625, 9.9490966796875, 10.428466796875, 10.9078369140625, 11.38720703125, 11.8665771484375, 12.345947265625, 12.8253173828125, 13.3046875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 2.0, 2.0, 6.0, 7.0, 17.0, 13.0, 15.0, 20.0, 20.0, 32.0, 30.0, 23.0, 35.0, 43.0, 47.0, 54.0, 48.0, 37.0, 67.0, 43.0, 48.0, 43.0, 31.0, 50.0, 42.0, 29.0, 26.0, 32.0, 35.0, 19.0, 14.0, 19.0, 14.0, 13.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.578125, -17.83056640625, -17.0830078125, -16.33544921875, -15.587890625, -14.84033203125, -14.0927734375, -13.34521484375, -12.59765625, -11.85009765625, -11.1025390625, -10.35498046875, -9.607421875, -8.85986328125, -8.1123046875, -7.36474609375, -6.6171875, -5.86962890625, -5.1220703125, -4.37451171875, -3.626953125, -2.87939453125, -2.1318359375, -1.38427734375, -0.63671875, 0.11083984375, 0.8583984375, 1.60595703125, 2.353515625, 3.10107421875, 3.8486328125, 4.59619140625, 5.34375, 6.09130859375, 6.8388671875, 7.58642578125, 8.333984375, 9.08154296875, 9.8291015625, 10.57666015625, 11.32421875, 12.07177734375, 12.8193359375, 13.56689453125, 14.314453125, 15.06201171875, 15.8095703125, 16.55712890625, 17.3046875, 18.05224609375, 18.7998046875, 19.54736328125, 20.294921875, 21.04248046875, 21.7900390625, 22.53759765625, 23.28515625, 24.03271484375, 24.7802734375, 25.52783203125, 26.275390625, 27.02294921875, 27.7705078125, 28.51806640625, 29.265625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 8.0, 13.0, 15.0, 24.0, 49.0, 64.0, 77.0, 140.0, 197.0, 346.0, 528.0, 963.0, 1622.0, 2829.0, 5269.0, 9744.0, 18875.0, 37940.0, 77966.0, 160928.0, 273967.0, 226684.0, 116296.0, 56047.0, 27347.0, 13790.0, 7349.0, 3958.0, 2219.0, 1317.0, 682.0, 487.0, 281.0, 182.0, 117.0, 83.0, 44.0, 36.0, 19.0, 16.0, 17.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0], "bins": [-25.265625, -24.5966796875, -23.927734375, -23.2587890625, -22.58984375, -21.9208984375, -21.251953125, -20.5830078125, -19.9140625, -19.2451171875, -18.576171875, -17.9072265625, -17.23828125, -16.5693359375, -15.900390625, -15.2314453125, -14.5625, -13.8935546875, -13.224609375, -12.5556640625, -11.88671875, -11.2177734375, -10.548828125, -9.8798828125, -9.2109375, -8.5419921875, -7.873046875, -7.2041015625, -6.53515625, -5.8662109375, -5.197265625, -4.5283203125, -3.859375, -3.1904296875, -2.521484375, -1.8525390625, -1.18359375, -0.5146484375, 0.154296875, 0.8232421875, 1.4921875, 2.1611328125, 2.830078125, 3.4990234375, 4.16796875, 4.8369140625, 5.505859375, 6.1748046875, 6.84375, 7.5126953125, 8.181640625, 8.8505859375, 9.51953125, 10.1884765625, 10.857421875, 11.5263671875, 12.1953125, 12.8642578125, 13.533203125, 14.2021484375, 14.87109375, 15.5400390625, 16.208984375, 16.8779296875, 17.546875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 13.0, 11.0, 5.0, 9.0, 16.0, 14.0, 29.0, 19.0, 37.0, 25.0, 19.0, 37.0, 31.0, 36.0, 47.0, 34.0, 41.0, 36.0, 37.0, 46.0, 41.0, 32.0, 38.0, 38.0, 34.0, 35.0, 25.0, 26.0, 16.0, 27.0, 20.0, 14.0, 20.0, 15.0, 12.0, 8.0, 7.0, 6.0, 8.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-11.015625, -10.676025390625, -10.33642578125, -9.996826171875, -9.6572265625, -9.317626953125, -8.97802734375, -8.638427734375, -8.298828125, -7.959228515625, -7.61962890625, -7.280029296875, -6.9404296875, -6.600830078125, -6.26123046875, -5.921630859375, -5.58203125, -5.242431640625, -4.90283203125, -4.563232421875, -4.2236328125, -3.884033203125, -3.54443359375, -3.204833984375, -2.865234375, -2.525634765625, -2.18603515625, -1.846435546875, -1.5068359375, -1.167236328125, -0.82763671875, -0.488037109375, -0.1484375, 0.191162109375, 0.53076171875, 0.870361328125, 1.2099609375, 1.549560546875, 1.88916015625, 2.228759765625, 2.568359375, 2.907958984375, 3.24755859375, 3.587158203125, 3.9267578125, 4.266357421875, 4.60595703125, 4.945556640625, 5.28515625, 5.624755859375, 5.96435546875, 6.303955078125, 6.6435546875, 6.983154296875, 7.32275390625, 7.662353515625, 8.001953125, 8.341552734375, 8.68115234375, 9.020751953125, 9.3603515625, 9.699951171875, 10.03955078125, 10.379150390625, 10.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 6.0, 15.0, 9.0, 18.0, 35.0, 45.0, 55.0, 82.0, 139.0, 154.0, 256.0, 375.0, 616.0, 923.0, 1444.0, 2152.0, 3517.0, 5841.0, 9504.0, 16428.0, 29815.0, 55261.0, 105261.0, 194545.0, 252568.0, 169099.0, 90123.0, 47717.0, 25706.0, 14628.0, 8393.0, 5037.0, 3054.0, 1956.0, 1313.0, 780.0, 519.0, 372.0, 248.0, 157.0, 123.0, 86.0, 55.0, 36.0, 29.0, 16.0, 13.0, 6.0, 13.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0], "bins": [-10.2265625, -9.920166015625, -9.61376953125, -9.307373046875, -9.0009765625, -8.694580078125, -8.38818359375, -8.081787109375, -7.775390625, -7.468994140625, -7.16259765625, -6.856201171875, -6.5498046875, -6.243408203125, -5.93701171875, -5.630615234375, -5.32421875, -5.017822265625, -4.71142578125, -4.405029296875, -4.0986328125, -3.792236328125, -3.48583984375, -3.179443359375, -2.873046875, -2.566650390625, -2.26025390625, -1.953857421875, -1.6474609375, -1.341064453125, -1.03466796875, -0.728271484375, -0.421875, -0.115478515625, 0.19091796875, 0.497314453125, 0.8037109375, 1.110107421875, 1.41650390625, 1.722900390625, 2.029296875, 2.335693359375, 2.64208984375, 2.948486328125, 3.2548828125, 3.561279296875, 3.86767578125, 4.174072265625, 4.48046875, 4.786865234375, 5.09326171875, 5.399658203125, 5.7060546875, 6.012451171875, 6.31884765625, 6.625244140625, 6.931640625, 7.238037109375, 7.54443359375, 7.850830078125, 8.1572265625, 8.463623046875, 8.77001953125, 9.076416015625, 9.3828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 5.0, 9.0, 9.0, 10.0, 7.0, 16.0, 18.0, 18.0, 28.0, 27.0, 28.0, 42.0, 52.0, 54.0, 81.0, 77.0, 75.0, 60.0, 59.0, 59.0, 59.0, 33.0, 37.0, 36.0, 19.0, 16.0, 12.0, 9.0, 9.0, 8.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00045609474182128906, -0.0004414990544319153, -0.0004269033670425415, -0.0004123076796531677, -0.00039771199226379395, -0.00038311630487442017, -0.0003685206174850464, -0.0003539249300956726, -0.00033932924270629883, -0.00032473355531692505, -0.00031013786792755127, -0.0002955421805381775, -0.0002809464931488037, -0.00026635080575942993, -0.00025175511837005615, -0.00023715943098068237, -0.0002225637435913086, -0.00020796805620193481, -0.00019337236881256104, -0.00017877668142318726, -0.00016418099403381348, -0.0001495853066444397, -0.00013498961925506592, -0.00012039393186569214, -0.00010579824447631836, -9.120255708694458e-05, -7.66068696975708e-05, -6.201118230819702e-05, -4.741549491882324e-05, -3.281980752944946e-05, -1.8224120140075684e-05, -3.6284327507019043e-06, 1.0967254638671875e-05, 2.5562942028045654e-05, 4.0158629417419434e-05, 5.475431680679321e-05, 6.935000419616699e-05, 8.394569158554077e-05, 9.854137897491455e-05, 0.00011313706636428833, 0.0001277327537536621, 0.0001423284411430359, 0.00015692412853240967, 0.00017151981592178345, 0.00018611550331115723, 0.000200711190700531, 0.00021530687808990479, 0.00022990256547927856, 0.00024449825286865234, 0.0002590939402580261, 0.0002736896276473999, 0.0002882853150367737, 0.00030288100242614746, 0.00031747668981552124, 0.000332072377204895, 0.0003466680645942688, 0.0003612637519836426, 0.00037585943937301636, 0.00039045512676239014, 0.0004050508141517639, 0.0004196465015411377, 0.0004342421889305115, 0.00044883787631988525, 0.00046343356370925903, 0.0004780292510986328]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 17.0, 28.0, 36.0, 38.0, 59.0, 115.0, 151.0, 235.0, 422.0, 630.0, 939.0, 1505.0, 2497.0, 4056.0, 6708.0, 11501.0, 20089.0, 36653.0, 66838.0, 124955.0, 204637.0, 225467.0, 152666.0, 84114.0, 45155.0, 24580.0, 13775.0, 8141.0, 4726.0, 2942.0, 1781.0, 1091.0, 677.0, 484.0, 292.0, 195.0, 122.0, 61.0, 44.0, 35.0, 28.0, 19.0, 12.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4239501953125, -10.066650390625, -9.7093505859375, -9.35205078125, -8.9947509765625, -8.637451171875, -8.2801513671875, -7.9228515625, -7.5655517578125, -7.208251953125, -6.8509521484375, -6.49365234375, -6.1363525390625, -5.779052734375, -5.4217529296875, -5.064453125, -4.7071533203125, -4.349853515625, -3.9925537109375, -3.63525390625, -3.2779541015625, -2.920654296875, -2.5633544921875, -2.2060546875, -1.8487548828125, -1.491455078125, -1.1341552734375, -0.77685546875, -0.4195556640625, -0.062255859375, 0.2950439453125, 0.65234375, 1.0096435546875, 1.366943359375, 1.7242431640625, 2.08154296875, 2.4388427734375, 2.796142578125, 3.1534423828125, 3.5107421875, 3.8680419921875, 4.225341796875, 4.5826416015625, 4.93994140625, 5.2972412109375, 5.654541015625, 6.0118408203125, 6.369140625, 6.7264404296875, 7.083740234375, 7.4410400390625, 7.79833984375, 8.1556396484375, 8.512939453125, 8.8702392578125, 9.2275390625, 9.5848388671875, 9.942138671875, 10.2994384765625, 10.65673828125, 11.0140380859375, 11.371337890625, 11.7286376953125, 12.0859375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 10.0, 4.0, 19.0, 12.0, 15.0, 20.0, 19.0, 30.0, 35.0, 37.0, 62.0, 56.0, 68.0, 79.0, 67.0, 72.0, 73.0, 41.0, 55.0, 45.0, 39.0, 36.0, 27.0, 15.0, 15.0, 8.0, 13.0, 8.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.73046875, -3.627716064453125, -3.52496337890625, -3.422210693359375, -3.3194580078125, -3.216705322265625, -3.11395263671875, -3.011199951171875, -2.908447265625, -2.805694580078125, -2.70294189453125, -2.600189208984375, -2.4974365234375, -2.394683837890625, -2.29193115234375, -2.189178466796875, -2.08642578125, -1.983673095703125, -1.88092041015625, -1.778167724609375, -1.6754150390625, -1.572662353515625, -1.46990966796875, -1.367156982421875, -1.264404296875, -1.161651611328125, -1.05889892578125, -0.956146240234375, -0.8533935546875, -0.750640869140625, -0.64788818359375, -0.545135498046875, -0.4423828125, -0.339630126953125, -0.23687744140625, -0.134124755859375, -0.0313720703125, 0.071380615234375, 0.17413330078125, 0.276885986328125, 0.379638671875, 0.482391357421875, 0.58514404296875, 0.687896728515625, 0.7906494140625, 0.893402099609375, 0.99615478515625, 1.098907470703125, 1.20166015625, 1.304412841796875, 1.40716552734375, 1.509918212890625, 1.6126708984375, 1.715423583984375, 1.81817626953125, 1.920928955078125, 2.023681640625, 2.126434326171875, 2.22918701171875, 2.331939697265625, 2.4346923828125, 2.537445068359375, 2.64019775390625, 2.742950439453125, 2.845703125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 7.0, 11.0, 19.0, 14.0, 27.0, 29.0, 38.0, 37.0, 44.0, 44.0, 50.0, 55.0, 63.0, 71.0, 52.0, 73.0, 54.0, 53.0, 50.0, 34.0, 32.0, 27.0, 24.0, 19.0, 17.0, 7.0, 4.0, 2.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.7175178527832, -32.60483932495117, -31.49216079711914, -30.379480361938477, -29.266801834106445, -28.154123306274414, -27.04144287109375, -25.92876434326172, -24.816085815429688, -23.703407287597656, -22.590728759765625, -21.47804832458496, -20.36536979675293, -19.2526912689209, -18.140010833740234, -17.027332305908203, -15.914653778076172, -14.80197525024414, -13.689295768737793, -12.576616287231445, -11.463937759399414, -10.351259231567383, -9.238579750061035, -8.125900268554688, -7.013221740722656, -5.900542736053467, -4.787863731384277, -3.675184726715088, -2.5625057220458984, -1.449826717376709, -0.33714771270751953, 0.7755312919616699, 1.8882102966308594, 3.000889301300049, 4.113568305969238, 5.226247310638428, 6.338926315307617, 7.451605319976807, 8.564284324645996, 9.676963806152344, 10.789642333984375, 11.902320861816406, 13.015000343322754, 14.127679824829102, 15.240358352661133, 16.353036880493164, 17.465717315673828, 18.57839584350586, 19.69107437133789, 20.803752899169922, 21.916431427001953, 23.029111862182617, 24.14179039001465, 25.25446891784668, 26.367149353027344, 27.479827880859375, 28.592506408691406, 29.705184936523438, 30.81786346435547, 31.930543899536133, 33.04322052001953, 34.15590286254883, 35.26858139038086, 36.38125991821289, 37.49393844604492]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 7.0, 10.0, 7.0, 22.0, 21.0, 17.0, 17.0, 27.0, 25.0, 25.0, 25.0, 29.0, 44.0, 34.0, 33.0, 44.0, 41.0, 33.0, 40.0, 45.0, 39.0, 40.0, 43.0, 41.0, 36.0, 28.0, 26.0, 26.0, 27.0, 19.0, 16.0, 15.0, 14.0, 16.0, 7.0, 13.0, 7.0, 3.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.160133361816406, -17.593490600585938, -17.02684783935547, -16.460205078125, -15.893562316894531, -15.326919555664062, -14.760276794433594, -14.193634033203125, -13.626991271972656, -13.060348510742188, -12.493705749511719, -11.92706298828125, -11.360420227050781, -10.793777465820312, -10.227134704589844, -9.660491943359375, -9.093849182128906, -8.527206420898438, -7.960563659667969, -7.3939208984375, -6.827278137207031, -6.2606353759765625, -5.693992614746094, -5.127349853515625, -4.560707092285156, -3.9940643310546875, -3.4274215698242188, -2.86077880859375, -2.2941360473632812, -1.7274932861328125, -1.1608505249023438, -0.594207763671875, -0.027566909790039062, 0.5390758514404297, 1.1057186126708984, 1.6723613739013672, 2.239004135131836, 2.8056468963623047, 3.3722896575927734, 3.938932418823242, 4.505575180053711, 5.07221794128418, 5.638860702514648, 6.205503463745117, 6.772146224975586, 7.338788986206055, 7.905431747436523, 8.472074508666992, 9.038717269897461, 9.60536003112793, 10.172002792358398, 10.738645553588867, 11.305288314819336, 11.871931076049805, 12.438573837280273, 13.005216598510742, 13.571859359741211, 14.13850212097168, 14.705144882202148, 15.271787643432617, 15.838430404663086, 16.405073165893555, 16.971715927124023, 17.538358688354492, 18.10500144958496]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 8.0, 19.0, 28.0, 38.0, 75.0, 110.0, 154.0, 201.0, 314.0, 503.0, 747.0, 1138.0, 1714.0, 2768.0, 4143.0, 6590.0, 10312.0, 16541.0, 25745.0, 40503.0, 61734.0, 91662.0, 125379.0, 149410.0, 145808.0, 118882.0, 84933.0, 57070.0, 37258.0, 23471.0, 14873.0, 9409.0, 6076.0, 3844.0, 2487.0, 1537.0, 1033.0, 660.0, 449.0, 312.0, 207.0, 139.0, 92.0, 42.0, 41.0, 26.0, 27.0, 15.0, 10.0, 6.0, 6.0, 4.0, 2.0, 2.0], "bins": [-12.890625, -12.5103759765625, -12.130126953125, -11.7498779296875, -11.36962890625, -10.9893798828125, -10.609130859375, -10.2288818359375, -9.8486328125, -9.4683837890625, -9.088134765625, -8.7078857421875, -8.32763671875, -7.9473876953125, -7.567138671875, -7.1868896484375, -6.806640625, -6.4263916015625, -6.046142578125, -5.6658935546875, -5.28564453125, -4.9053955078125, -4.525146484375, -4.1448974609375, -3.7646484375, -3.3843994140625, -3.004150390625, -2.6239013671875, -2.24365234375, -1.8634033203125, -1.483154296875, -1.1029052734375, -0.72265625, -0.3424072265625, 0.037841796875, 0.4180908203125, 0.79833984375, 1.1785888671875, 1.558837890625, 1.9390869140625, 2.3193359375, 2.6995849609375, 3.079833984375, 3.4600830078125, 3.84033203125, 4.2205810546875, 4.600830078125, 4.9810791015625, 5.361328125, 5.7415771484375, 6.121826171875, 6.5020751953125, 6.88232421875, 7.2625732421875, 7.642822265625, 8.0230712890625, 8.4033203125, 8.7835693359375, 9.163818359375, 9.5440673828125, 9.92431640625, 10.3045654296875, 10.684814453125, 11.0650634765625, 11.4453125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 7.0, 12.0, 12.0, 5.0, 11.0, 16.0, 15.0, 22.0, 29.0, 26.0, 26.0, 22.0, 43.0, 40.0, 34.0, 36.0, 39.0, 45.0, 37.0, 52.0, 50.0, 40.0, 41.0, 31.0, 39.0, 33.0, 30.0, 36.0, 26.0, 24.0, 17.0, 19.0, 15.0, 10.0, 11.0, 4.0, 13.0, 14.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-21.96875, -21.344482421875, -20.72021484375, -20.095947265625, -19.4716796875, -18.847412109375, -18.22314453125, -17.598876953125, -16.974609375, -16.350341796875, -15.72607421875, -15.101806640625, -14.4775390625, -13.853271484375, -13.22900390625, -12.604736328125, -11.98046875, -11.356201171875, -10.73193359375, -10.107666015625, -9.4833984375, -8.859130859375, -8.23486328125, -7.610595703125, -6.986328125, -6.362060546875, -5.73779296875, -5.113525390625, -4.4892578125, -3.864990234375, -3.24072265625, -2.616455078125, -1.9921875, -1.367919921875, -0.74365234375, -0.119384765625, 0.5048828125, 1.129150390625, 1.75341796875, 2.377685546875, 3.001953125, 3.626220703125, 4.25048828125, 4.874755859375, 5.4990234375, 6.123291015625, 6.74755859375, 7.371826171875, 7.99609375, 8.620361328125, 9.24462890625, 9.868896484375, 10.4931640625, 11.117431640625, 11.74169921875, 12.365966796875, 12.990234375, 13.614501953125, 14.23876953125, 14.863037109375, 15.4873046875, 16.111572265625, 16.73583984375, 17.360107421875, 17.984375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 6.0, 14.0, 12.0, 21.0, 37.0, 56.0, 82.0, 133.0, 202.0, 306.0, 447.0, 714.0, 1145.0, 1794.0, 3155.0, 5288.0, 9442.0, 17415.0, 32811.0, 65955.0, 134851.0, 239416.0, 245658.0, 143252.0, 69862.0, 34698.0, 18026.0, 9847.0, 5463.0, 3244.0, 1955.0, 1233.0, 717.0, 434.0, 339.0, 157.0, 131.0, 67.0, 59.0, 43.0, 28.0, 16.0, 8.0, 7.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.8125, -36.70166015625, -35.5908203125, -34.47998046875, -33.369140625, -32.25830078125, -31.1474609375, -30.03662109375, -28.92578125, -27.81494140625, -26.7041015625, -25.59326171875, -24.482421875, -23.37158203125, -22.2607421875, -21.14990234375, -20.0390625, -18.92822265625, -17.8173828125, -16.70654296875, -15.595703125, -14.48486328125, -13.3740234375, -12.26318359375, -11.15234375, -10.04150390625, -8.9306640625, -7.81982421875, -6.708984375, -5.59814453125, -4.4873046875, -3.37646484375, -2.265625, -1.15478515625, -0.0439453125, 1.06689453125, 2.177734375, 3.28857421875, 4.3994140625, 5.51025390625, 6.62109375, 7.73193359375, 8.8427734375, 9.95361328125, 11.064453125, 12.17529296875, 13.2861328125, 14.39697265625, 15.5078125, 16.61865234375, 17.7294921875, 18.84033203125, 19.951171875, 21.06201171875, 22.1728515625, 23.28369140625, 24.39453125, 25.50537109375, 26.6162109375, 27.72705078125, 28.837890625, 29.94873046875, 31.0595703125, 32.17041015625, 33.28125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 8.0, 3.0, 8.0, 7.0, 6.0, 9.0, 11.0, 21.0, 21.0, 29.0, 23.0, 31.0, 49.0, 34.0, 39.0, 46.0, 40.0, 45.0, 33.0, 42.0, 54.0, 35.0, 52.0, 38.0, 47.0, 36.0, 32.0, 31.0, 29.0, 23.0, 28.0, 25.0, 14.0, 16.0, 7.0, 12.0, 7.0, 4.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.66064453125, -15.1337890625, -14.60693359375, -14.080078125, -13.55322265625, -13.0263671875, -12.49951171875, -11.97265625, -11.44580078125, -10.9189453125, -10.39208984375, -9.865234375, -9.33837890625, -8.8115234375, -8.28466796875, -7.7578125, -7.23095703125, -6.7041015625, -6.17724609375, -5.650390625, -5.12353515625, -4.5966796875, -4.06982421875, -3.54296875, -3.01611328125, -2.4892578125, -1.96240234375, -1.435546875, -0.90869140625, -0.3818359375, 0.14501953125, 0.671875, 1.19873046875, 1.7255859375, 2.25244140625, 2.779296875, 3.30615234375, 3.8330078125, 4.35986328125, 4.88671875, 5.41357421875, 5.9404296875, 6.46728515625, 6.994140625, 7.52099609375, 8.0478515625, 8.57470703125, 9.1015625, 9.62841796875, 10.1552734375, 10.68212890625, 11.208984375, 11.73583984375, 12.2626953125, 12.78955078125, 13.31640625, 13.84326171875, 14.3701171875, 14.89697265625, 15.423828125, 15.95068359375, 16.4775390625, 17.00439453125, 17.53125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 12.0, 7.0, 13.0, 27.0, 30.0, 44.0, 63.0, 118.0, 172.0, 315.0, 600.0, 1082.0, 2218.0, 4950.0, 15451.0, 86390.0, 637277.0, 253902.0, 31380.0, 8088.0, 3131.0, 1523.0, 749.0, 405.0, 222.0, 114.0, 90.0, 53.0, 35.0, 28.0, 14.0, 12.0, 9.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.3125, -77.931640625, -75.55078125, -73.169921875, -70.7890625, -68.408203125, -66.02734375, -63.646484375, -61.265625, -58.884765625, -56.50390625, -54.123046875, -51.7421875, -49.361328125, -46.98046875, -44.599609375, -42.21875, -39.837890625, -37.45703125, -35.076171875, -32.6953125, -30.314453125, -27.93359375, -25.552734375, -23.171875, -20.791015625, -18.41015625, -16.029296875, -13.6484375, -11.267578125, -8.88671875, -6.505859375, -4.125, -1.744140625, 0.63671875, 3.017578125, 5.3984375, 7.779296875, 10.16015625, 12.541015625, 14.921875, 17.302734375, 19.68359375, 22.064453125, 24.4453125, 26.826171875, 29.20703125, 31.587890625, 33.96875, 36.349609375, 38.73046875, 41.111328125, 43.4921875, 45.873046875, 48.25390625, 50.634765625, 53.015625, 55.396484375, 57.77734375, 60.158203125, 62.5390625, 64.919921875, 67.30078125, 69.681640625, 72.0625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 9.0, 8.0, 12.0, 22.0, 30.0, 57.0, 91.0, 141.0, 183.0, 159.0, 98.0, 80.0, 37.0, 19.0, 13.0, 10.0, 6.0, 6.0, 5.0, 3.0, 8.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00366973876953125, -0.0035080313682556152, -0.0033463239669799805, -0.0031846165657043457, -0.003022909164428711, -0.002861201763153076, -0.0026994943618774414, -0.0025377869606018066, -0.002376079559326172, -0.002214372158050537, -0.0020526647567749023, -0.0018909573554992676, -0.0017292499542236328, -0.001567542552947998, -0.0014058351516723633, -0.0012441277503967285, -0.0010824203491210938, -0.000920712947845459, -0.0007590055465698242, -0.0005972981452941895, -0.0004355907440185547, -0.0002738833427429199, -0.00011217594146728516, 4.953145980834961e-05, 0.00021123886108398438, 0.00037294626235961914, 0.0005346536636352539, 0.0006963610649108887, 0.0008580684661865234, 0.0010197758674621582, 0.001181483268737793, 0.0013431906700134277, 0.0015048980712890625, 0.0016666054725646973, 0.001828312873840332, 0.001990020275115967, 0.0021517276763916016, 0.0023134350776672363, 0.002475142478942871, 0.002636849880218506, 0.0027985572814941406, 0.0029602646827697754, 0.00312197208404541, 0.003283679485321045, 0.0034453868865966797, 0.0036070942878723145, 0.0037688016891479492, 0.003930509090423584, 0.004092216491699219, 0.0042539238929748535, 0.004415631294250488, 0.004577338695526123, 0.004739046096801758, 0.004900753498077393, 0.005062460899353027, 0.005224168300628662, 0.005385875701904297, 0.005547583103179932, 0.005709290504455566, 0.005870997905731201, 0.006032705307006836, 0.006194412708282471, 0.0063561201095581055, 0.00651782751083374, 0.006679534912109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 3.0, 7.0, 2.0, 19.0, 13.0, 18.0, 19.0, 41.0, 30.0, 62.0, 83.0, 106.0, 114.0, 169.0, 248.0, 350.0, 513.0, 743.0, 1260.0, 1826.0, 3090.0, 6423.0, 15059.0, 43647.0, 158424.0, 463033.0, 249513.0, 64134.0, 20973.0, 8319.0, 3819.0, 2250.0, 1335.0, 862.0, 584.0, 398.0, 303.0, 175.0, 162.0, 115.0, 82.0, 57.0, 44.0, 32.0, 31.0, 16.0, 8.0, 10.0, 10.0, 1.0, 8.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-42.3125, -41.01708984375, -39.7216796875, -38.42626953125, -37.130859375, -35.83544921875, -34.5400390625, -33.24462890625, -31.94921875, -30.65380859375, -29.3583984375, -28.06298828125, -26.767578125, -25.47216796875, -24.1767578125, -22.88134765625, -21.5859375, -20.29052734375, -18.9951171875, -17.69970703125, -16.404296875, -15.10888671875, -13.8134765625, -12.51806640625, -11.22265625, -9.92724609375, -8.6318359375, -7.33642578125, -6.041015625, -4.74560546875, -3.4501953125, -2.15478515625, -0.859375, 0.43603515625, 1.7314453125, 3.02685546875, 4.322265625, 5.61767578125, 6.9130859375, 8.20849609375, 9.50390625, 10.79931640625, 12.0947265625, 13.39013671875, 14.685546875, 15.98095703125, 17.2763671875, 18.57177734375, 19.8671875, 21.16259765625, 22.4580078125, 23.75341796875, 25.048828125, 26.34423828125, 27.6396484375, 28.93505859375, 30.23046875, 31.52587890625, 32.8212890625, 34.11669921875, 35.412109375, 36.70751953125, 38.0029296875, 39.29833984375, 40.59375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 9.0, 14.0, 20.0, 23.0, 31.0, 61.0, 79.0, 121.0, 135.0, 143.0, 126.0, 82.0, 40.0, 34.0, 19.0, 17.0, 13.0, 10.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.515625, -8.2315673828125, -7.947509765625, -7.6634521484375, -7.37939453125, -7.0953369140625, -6.811279296875, -6.5272216796875, -6.2431640625, -5.9591064453125, -5.675048828125, -5.3909912109375, -5.10693359375, -4.8228759765625, -4.538818359375, -4.2547607421875, -3.970703125, -3.6866455078125, -3.402587890625, -3.1185302734375, -2.83447265625, -2.5504150390625, -2.266357421875, -1.9822998046875, -1.6982421875, -1.4141845703125, -1.130126953125, -0.8460693359375, -0.56201171875, -0.2779541015625, 0.006103515625, 0.2901611328125, 0.57421875, 0.8582763671875, 1.142333984375, 1.4263916015625, 1.71044921875, 1.9945068359375, 2.278564453125, 2.5626220703125, 2.8466796875, 3.1307373046875, 3.414794921875, 3.6988525390625, 3.98291015625, 4.2669677734375, 4.551025390625, 4.8350830078125, 5.119140625, 5.4031982421875, 5.687255859375, 5.9713134765625, 6.25537109375, 6.5394287109375, 6.823486328125, 7.1075439453125, 7.3916015625, 7.6756591796875, 7.959716796875, 8.2437744140625, 8.52783203125, 8.8118896484375, 9.095947265625, 9.3800048828125, 9.6640625]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 1.0, 6.0, 4.0, 6.0, 8.0, 16.0, 7.0, 17.0, 17.0, 15.0, 19.0, 26.0, 28.0, 30.0, 29.0, 45.0, 43.0, 42.0, 59.0, 68.0, 55.0, 50.0, 52.0, 45.0, 47.0, 39.0, 39.0, 30.0, 31.0, 17.0, 24.0, 13.0, 15.0, 17.0, 7.0, 8.0, 6.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.053197860717773, -29.982011795043945, -28.91082763671875, -27.839641571044922, -26.768455505371094, -25.697269439697266, -24.626083374023438, -23.554899215698242, -22.483713150024414, -21.412527084350586, -20.34134292602539, -19.270156860351562, -18.198970794677734, -17.127784729003906, -16.056598663330078, -14.985414505004883, -13.914228439331055, -12.843042373657227, -11.771857261657715, -10.700672149658203, -9.629486083984375, -8.558300018310547, -7.487114906311035, -6.415929317474365, -5.344743728637695, -4.273558139801025, -3.2023725509643555, -2.1311869621276855, -1.0600013732910156, 0.011184215545654297, 1.0823698043823242, 2.153555393218994, 3.2247390747070312, 4.295924663543701, 5.367110252380371, 6.438295841217041, 7.509481430053711, 8.580667495727539, 9.65185260772705, 10.723037719726562, 11.79422378540039, 12.865409851074219, 13.93659496307373, 15.007780075073242, 16.07896614074707, 17.1501522064209, 18.221336364746094, 19.292522430419922, 20.36370849609375, 21.434894561767578, 22.506080627441406, 23.5772647857666, 24.64845085144043, 25.719636917114258, 26.790821075439453, 27.86200714111328, 28.93319320678711, 30.004379272460938, 31.075565338134766, 32.146751403808594, 33.217933654785156, 34.289119720458984, 35.36030578613281, 36.43149185180664, 37.50267791748047]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 10.0, 9.0, 16.0, 33.0, 20.0, 19.0, 31.0, 33.0, 37.0, 32.0, 47.0, 37.0, 50.0, 47.0, 33.0, 38.0, 56.0, 44.0, 44.0, 43.0, 40.0, 39.0, 42.0, 36.0, 26.0, 21.0, 21.0, 13.0, 12.0, 14.0, 9.0, 3.0, 4.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-36.294898986816406, -35.2972526550293, -34.29961013793945, -33.301963806152344, -32.304317474365234, -31.306673049926758, -30.30902862548828, -29.311382293701172, -28.313735961914062, -27.316091537475586, -26.318445205688477, -25.32080078125, -24.32315444946289, -23.325510025024414, -22.327865600585938, -21.330219268798828, -20.33257484436035, -19.334930419921875, -18.337284088134766, -17.33963966369629, -16.34199333190918, -15.344348907470703, -14.34670352935791, -13.349058151245117, -12.351412773132324, -11.353767395019531, -10.356122016906738, -9.358476638793945, -8.360832214355469, -7.363186359405518, -6.365541458129883, -5.36789608001709, -4.37025260925293, -3.3726072311401367, -2.374962091445923, -1.377316951751709, -0.379671573638916, 0.617973804473877, 1.6156187057495117, 2.6132640838623047, 3.6109094619750977, 4.608554840087891, 5.606200218200684, 6.603845119476318, 7.601490497589111, 8.599136352539062, 9.596780776977539, 10.594426155090332, 11.592071533203125, 12.589716911315918, 13.587362289428711, 14.585006713867188, 15.582653045654297, 16.580297470092773, 17.57794189453125, 18.57558822631836, 19.57323455810547, 20.570878982543945, 21.568525314331055, 22.56616973876953, 23.56381607055664, 24.561460494995117, 25.559104919433594, 26.556751251220703, 27.55439567565918]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 6.0, 2.0, 7.0, 5.0, 6.0, 7.0, 15.0, 8.0, 19.0, 21.0, 28.0, 35.0, 49.0, 47.0, 65.0, 103.0, 117.0, 152.0, 186.0, 270.0, 358.0, 628.0, 1983.0, 14659.0, 500941.0, 2281.0, 703.0, 399.0, 281.0, 197.0, 159.0, 101.0, 107.0, 85.0, 60.0, 45.0, 32.0, 23.0, 29.0, 9.0, 11.0, 8.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-592.6599731445312, -570.7471313476562, -548.834228515625, -526.92138671875, -505.008544921875, -483.0956726074219, -461.18280029296875, -439.26995849609375, -417.3570861816406, -395.4442138671875, -373.5313720703125, -351.6184997558594, -329.70562744140625, -307.79278564453125, -285.8799133300781, -263.967041015625, -242.05419921875, -220.14134216308594, -198.22848510742188, -176.31561279296875, -154.4027557373047, -132.48989868164062, -110.5770263671875, -88.66416931152344, -66.75131225585938, -44.83845138549805, -22.92559051513672, -1.012725830078125, 20.900131225585938, 42.81298828125, 64.72586059570312, 86.63871765136719, 108.5516357421875, 130.46449279785156, 152.37734985351562, 174.29022216796875, 196.2030792236328, 218.11593627929688, 240.02880859375, 261.941650390625, 283.8545227050781, 305.76739501953125, 327.68023681640625, 349.5931091308594, 371.5059814453125, 393.4188232421875, 415.3316955566406, 437.24456787109375, 459.15740966796875, 481.0702819824219, 502.9831237792969, 524.89599609375, 546.808837890625, 568.7216796875, 590.6345825195312, 612.5474243164062, 634.4603271484375, 656.3731689453125, 678.2860717773438, 700.1989135742188, 722.1117553710938, 744.024658203125, 765.9375, 787.850341796875, 809.76318359375]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 7.0, 9.0, 8.0, 9.0, 18.0, 26.0, 29.0, 19.0, 29.0, 27.0, 40.0, 35.0, 42.0, 43.0, 46.0, 46.0, 33.0, 1061.0, 55.0, 43.0, 52.0, 34.0, 43.0, 40.0, 44.0, 36.0, 27.0, 17.0, 24.0, 13.0, 15.0, 12.0, 9.0, 6.0, 7.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1188.595947265625, -1155.994140625, -1123.3922119140625, -1090.7904052734375, -1058.1884765625, -1025.586669921875, -992.9847412109375, -960.3829345703125, -927.781005859375, -895.1791381835938, -862.5772705078125, -829.9754028320312, -797.37353515625, -764.7716674804688, -732.1697998046875, -699.5679931640625, -666.9661254882812, -634.3642578125, -601.7623901367188, -569.1605224609375, -536.5586547851562, -503.956787109375, -471.3549499511719, -438.7530822753906, -406.1512145996094, -373.5493469238281, -340.9474792480469, -308.34564208984375, -275.7437744140625, -243.1418914794922, -210.5400390625, -177.93817138671875, -145.33624267578125, -112.734375, -80.13251495361328, -47.53065490722656, -14.928787231445312, 17.673080444335938, 50.274932861328125, 82.87680053710938, 115.47866821289062, 148.08053588867188, 180.68240356445312, 213.2842559814453, 245.88612365722656, 278.48797607421875, 311.08984375, 343.69171142578125, 376.2935791015625, 408.89544677734375, 441.497314453125, 474.09918212890625, 506.7010498046875, 539.3029174804688, 571.90478515625, 604.506591796875, 637.1085205078125, 669.7103881835938, 702.312255859375, 734.9141235351562, 767.5159912109375, 800.1178588867188, 832.7197265625, 865.321533203125, 897.9234008789062]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 6.0, 4.0, 7.0, 8.0, 17.0, 20.0, 28.0, 23.0, 43.0, 60.0, 74.0, 99.0, 134.0, 209.0, 341.0, 540.0, 791.0, 1275.0, 1886.0, 2935.0, 4775.0, 11038.0, 31183922.0, 27123.0, 13338.0, 3338.0, 1018.0, 424.0, 230.0, 187.0, 139.0, 91.0, 78.0, 84.0, 56.0, 36.0, 30.0, 28.0, 17.0, 22.0, 10.0, 7.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-655.300048828125, -633.9081420898438, -612.5162353515625, -591.1243896484375, -569.7324829101562, -548.340576171875, -526.9486694335938, -505.5567626953125, -484.16485595703125, -462.77294921875, -441.3810729980469, -419.9891662597656, -398.5972595214844, -377.20538330078125, -355.8134765625, -334.42156982421875, -313.0296936035156, -291.6377868652344, -270.24591064453125, -248.85400390625, -227.46209716796875, -206.07020568847656, -184.67831420898438, -163.28640747070312, -141.89451599121094, -120.50261688232422, -99.1107177734375, -77.71882629394531, -56.326927185058594, -34.935028076171875, -13.543136596679688, 7.8487701416015625, 29.24066162109375, 50.63256072998047, 72.02445983886719, 93.41635131835938, 114.8082504272461, 136.2001495361328, 157.592041015625, 178.98394775390625, 200.37583923339844, 221.76773071289062, 243.15963745117188, 264.551513671875, 285.94342041015625, 307.3353271484375, 328.72723388671875, 350.119140625, 371.5110168457031, 392.9029235839844, 414.2947998046875, 435.68670654296875, 457.07861328125, 478.47052001953125, 499.8623962402344, 521.2542724609375, 542.6461791992188, 564.0380859375, 585.4299926757812, 606.8218994140625, 628.2137451171875, 649.6056518554688, 670.99755859375, 692.3894653320312, 713.7813720703125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 12.0, 13.0, 27.0, 51.0, 57.0, 97.0, 145.0, 257.0, 384.0, 678.0, 1150.0, 1903.0, 3189.0, 5700.0, 10272.0, 18508.0, 35620.0, 68686.0, 138840.0, 297687.0, 713556.0, 1991883.0, 1810928.0, 645964.0, 276572.0, 130070.0, 64656.0, 33921.0, 17805.0, 9687.0, 5413.0, 3032.0, 1809.0, 1093.0, 605.0, 416.0, 266.0, 165.0, 115.0, 64.0, 50.0, 29.0, 21.0, 11.0, 6.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.59375, -38.39208984375, -37.1904296875, -35.98876953125, -34.787109375, -33.58544921875, -32.3837890625, -31.18212890625, -29.98046875, -28.77880859375, -27.5771484375, -26.37548828125, -25.173828125, -23.97216796875, -22.7705078125, -21.56884765625, -20.3671875, -19.16552734375, -17.9638671875, -16.76220703125, -15.560546875, -14.35888671875, -13.1572265625, -11.95556640625, -10.75390625, -9.55224609375, -8.3505859375, -7.14892578125, -5.947265625, -4.74560546875, -3.5439453125, -2.34228515625, -1.140625, 0.06103515625, 1.2626953125, 2.46435546875, 3.666015625, 4.86767578125, 6.0693359375, 7.27099609375, 8.47265625, 9.67431640625, 10.8759765625, 12.07763671875, 13.279296875, 14.48095703125, 15.6826171875, 16.88427734375, 18.0859375, 19.28759765625, 20.4892578125, 21.69091796875, 22.892578125, 24.09423828125, 25.2958984375, 26.49755859375, 27.69921875, 28.90087890625, 30.1025390625, 31.30419921875, 32.505859375, 33.70751953125, 34.9091796875, 36.11083984375, 37.3125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 9.0, 3.0, 15.0, 7.0, 17.0, 19.0, 14.0, 19.0, 46.0, 36.0, 52.0, 62.0, 77.0, 114.0, 163.0, 195.0, 250.0, 226.0, 177.0, 101.0, 90.0, 62.0, 51.0, 45.0, 26.0, 31.0, 17.0, 15.0, 11.0, 12.0, 12.0, 6.0, 8.0, 6.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.515625, -16.925048828125, -16.33447265625, -15.743896484375, -15.1533203125, -14.562744140625, -13.97216796875, -13.381591796875, -12.791015625, -12.200439453125, -11.60986328125, -11.019287109375, -10.4287109375, -9.838134765625, -9.24755859375, -8.656982421875, -8.06640625, -7.475830078125, -6.88525390625, -6.294677734375, -5.7041015625, -5.113525390625, -4.52294921875, -3.932373046875, -3.341796875, -2.751220703125, -2.16064453125, -1.570068359375, -0.9794921875, -0.388916015625, 0.20166015625, 0.792236328125, 1.3828125, 1.973388671875, 2.56396484375, 3.154541015625, 3.7451171875, 4.335693359375, 4.92626953125, 5.516845703125, 6.107421875, 6.697998046875, 7.28857421875, 7.879150390625, 8.4697265625, 9.060302734375, 9.65087890625, 10.241455078125, 10.83203125, 11.422607421875, 12.01318359375, 12.603759765625, 13.1943359375, 13.784912109375, 14.37548828125, 14.966064453125, 15.556640625, 16.147216796875, 16.73779296875, 17.328369140625, 17.9189453125, 18.509521484375, 19.10009765625, 19.690673828125, 20.28125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 5.0, 8.0, 7.0, 13.0, 18.0, 20.0, 46.0, 73.0, 99.0, 127.0, 141.0, 281.0, 474.0, 687.0, 1030.0, 1544.0, 2258.0, 3658.0, 5674.0, 9451.0, 15103.0, 24568.0, 40299.0, 64338.0, 109208.0, 186618.0, 338014.0, 694601.0, 1730024.0, 1633654.0, 653558.0, 324740.0, 181270.0, 105325.0, 63104.0, 38364.0, 23650.0, 14513.0, 9064.0, 5663.0, 3591.0, 2259.0, 1428.0, 949.0, 650.0, 444.0, 305.0, 174.0, 102.0, 90.0, 49.0, 29.0, 14.0, 25.0, 20.0, 6.0, 5.0, 9.0, 6.0, 3.0], "bins": [-17.609375, -17.0751953125, -16.541015625, -16.0068359375, -15.47265625, -14.9384765625, -14.404296875, -13.8701171875, -13.3359375, -12.8017578125, -12.267578125, -11.7333984375, -11.19921875, -10.6650390625, -10.130859375, -9.5966796875, -9.0625, -8.5283203125, -7.994140625, -7.4599609375, -6.92578125, -6.3916015625, -5.857421875, -5.3232421875, -4.7890625, -4.2548828125, -3.720703125, -3.1865234375, -2.65234375, -2.1181640625, -1.583984375, -1.0498046875, -0.515625, 0.0185546875, 0.552734375, 1.0869140625, 1.62109375, 2.1552734375, 2.689453125, 3.2236328125, 3.7578125, 4.2919921875, 4.826171875, 5.3603515625, 5.89453125, 6.4287109375, 6.962890625, 7.4970703125, 8.03125, 8.5654296875, 9.099609375, 9.6337890625, 10.16796875, 10.7021484375, 11.236328125, 11.7705078125, 12.3046875, 12.8388671875, 13.373046875, 13.9072265625, 14.44140625, 14.9755859375, 15.509765625, 16.0439453125, 16.578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 13.0, 14.0, 15.0, 12.0, 18.0, 20.0, 28.0, 38.0, 49.0, 51.0, 77.0, 101.0, 152.0, 214.0, 291.0, 255.0, 159.0, 103.0, 87.0, 62.0, 45.0, 45.0, 32.0, 17.0, 30.0, 22.0, 12.0, 9.0, 8.0, 8.0, 3.0, 5.0, 7.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.6875, -26.839599609375, -25.99169921875, -25.143798828125, -24.2958984375, -23.447998046875, -22.60009765625, -21.752197265625, -20.904296875, -20.056396484375, -19.20849609375, -18.360595703125, -17.5126953125, -16.664794921875, -15.81689453125, -14.968994140625, -14.12109375, -13.273193359375, -12.42529296875, -11.577392578125, -10.7294921875, -9.881591796875, -9.03369140625, -8.185791015625, -7.337890625, -6.489990234375, -5.64208984375, -4.794189453125, -3.9462890625, -3.098388671875, -2.25048828125, -1.402587890625, -0.5546875, 0.293212890625, 1.14111328125, 1.989013671875, 2.8369140625, 3.684814453125, 4.53271484375, 5.380615234375, 6.228515625, 7.076416015625, 7.92431640625, 8.772216796875, 9.6201171875, 10.468017578125, 11.31591796875, 12.163818359375, 13.01171875, 13.859619140625, 14.70751953125, 15.555419921875, 16.4033203125, 17.251220703125, 18.09912109375, 18.947021484375, 19.794921875, 20.642822265625, 21.49072265625, 22.338623046875, 23.1865234375, 24.034423828125, 24.88232421875, 25.730224609375, 26.578125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 9.0, 8.0, 8.0, 9.0, 19.0, 21.0, 28.0, 41.0, 80.0, 86.0, 175.0, 192.0, 361.0, 538.0, 846.0, 1461.0, 2666.0, 4837.0, 9754.0, 23439.0, 67704.0, 484936.0, 5559308.0, 84456.0, 26840.0, 11082.0, 5499.0, 2810.0, 1529.0, 978.0, 513.0, 386.0, 265.0, 171.0, 112.0, 57.0, 53.0, 42.0, 32.0, 29.0, 9.0, 11.0, 6.0, 9.0, 10.0, 1.0, 6.0, 0.0, 0.0, 0.0, 5.0, 4.0], "bins": [-89.5, -86.8740234375, -84.248046875, -81.6220703125, -78.99609375, -76.3701171875, -73.744140625, -71.1181640625, -68.4921875, -65.8662109375, -63.240234375, -60.6142578125, -57.98828125, -55.3623046875, -52.736328125, -50.1103515625, -47.484375, -44.8583984375, -42.232421875, -39.6064453125, -36.98046875, -34.3544921875, -31.728515625, -29.1025390625, -26.4765625, -23.8505859375, -21.224609375, -18.5986328125, -15.97265625, -13.3466796875, -10.720703125, -8.0947265625, -5.46875, -2.8427734375, -0.216796875, 2.4091796875, 5.03515625, 7.6611328125, 10.287109375, 12.9130859375, 15.5390625, 18.1650390625, 20.791015625, 23.4169921875, 26.04296875, 28.6689453125, 31.294921875, 33.9208984375, 36.546875, 39.1728515625, 41.798828125, 44.4248046875, 47.05078125, 49.6767578125, 52.302734375, 54.9287109375, 57.5546875, 60.1806640625, 62.806640625, 65.4326171875, 68.05859375, 70.6845703125, 73.310546875, 75.9365234375, 78.5625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 8.0, 6.0, 13.0, 12.0, 22.0, 22.0, 32.0, 39.0, 51.0, 53.0, 59.0, 84.0, 225.0, 537.0, 348.0, 123.0, 85.0, 55.0, 47.0, 31.0, 35.0, 26.0, 32.0, 19.0, 7.0, 10.0, 13.0, 9.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.5, -53.6298828125, -51.759765625, -49.8896484375, -48.01953125, -46.1494140625, -44.279296875, -42.4091796875, -40.5390625, -38.6689453125, -36.798828125, -34.9287109375, -33.05859375, -31.1884765625, -29.318359375, -27.4482421875, -25.578125, -23.7080078125, -21.837890625, -19.9677734375, -18.09765625, -16.2275390625, -14.357421875, -12.4873046875, -10.6171875, -8.7470703125, -6.876953125, -5.0068359375, -3.13671875, -1.2666015625, 0.603515625, 2.4736328125, 4.34375, 6.2138671875, 8.083984375, 9.9541015625, 11.82421875, 13.6943359375, 15.564453125, 17.4345703125, 19.3046875, 21.1748046875, 23.044921875, 24.9150390625, 26.78515625, 28.6552734375, 30.525390625, 32.3955078125, 34.265625, 36.1357421875, 38.005859375, 39.8759765625, 41.74609375, 43.6162109375, 45.486328125, 47.3564453125, 49.2265625, 51.0966796875, 52.966796875, 54.8369140625, 56.70703125, 58.5771484375, 60.447265625, 62.3173828125, 64.1875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 10.0, 12.0, 11.0, 16.0, 22.0, 33.0, 34.0, 53.0, 73.0, 92.0, 183.0, 162.0, 69.0, 51.0, 40.0, 39.0, 18.0, 23.0, 7.0, 7.0, 8.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1070.520751953125, -1032.02880859375, -993.5369262695312, -955.0450439453125, -916.5531616210938, -878.061279296875, -839.5693359375, -801.0774536132812, -762.5855712890625, -724.0936889648438, -685.6017456054688, -647.10986328125, -608.6179809570312, -570.1260986328125, -531.6341552734375, -493.14227294921875, -454.65032958984375, -416.1584167480469, -377.6665344238281, -339.17462158203125, -300.6827392578125, -262.1908264160156, -223.69891357421875, -185.20703125, -146.71511840820312, -108.22322082519531, -69.73131561279297, -31.239410400390625, 7.2524871826171875, 45.744384765625, 84.23629760742188, 122.72817993164062, 161.2200927734375, 199.7119903564453, 238.20388793945312, 276.69580078125, 315.18768310546875, 353.6795959472656, 392.1715087890625, 430.66339111328125, 469.1553039550781, 507.647216796875, 546.1390991210938, 584.6309814453125, 623.1229248046875, 661.6148071289062, 700.106689453125, 738.5986328125, 777.0905151367188, 815.5823974609375, 854.0743408203125, 892.5662231445312, 931.05810546875, 969.550048828125, 1008.0419311523438, 1046.5338134765625, 1085.0257568359375, 1123.5177001953125, 1162.009521484375, 1200.50146484375, 1238.993408203125, 1277.4852294921875, 1315.9771728515625, 1354.468994140625, 1392.9609375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 0.0, 4.0, 7.0, 5.0, 10.0, 12.0, 17.0, 16.0, 14.0, 11.0, 20.0, 26.0, 27.0, 23.0, 30.0, 37.0, 45.0, 76.0, 162.0, 113.0, 75.0, 30.0, 36.0, 28.0, 19.0, 25.0, 22.0, 18.0, 13.0, 17.0, 12.0, 12.0, 9.0, 12.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1685.51123046875, -1635.6361083984375, -1585.760986328125, -1535.8858642578125, -1486.0107421875, -1436.1357421875, -1386.2606201171875, -1336.385498046875, -1286.5103759765625, -1236.63525390625, -1186.7601318359375, -1136.885009765625, -1087.010009765625, -1037.1348876953125, -987.259765625, -937.3846435546875, -887.509521484375, -837.6343994140625, -787.75927734375, -737.8842163085938, -688.0090942382812, -638.1339721679688, -588.2589111328125, -538.3837890625, -488.5086669921875, -438.633544921875, -388.7584533691406, -338.88336181640625, -289.00823974609375, -239.1331329345703, -189.25802612304688, -139.3829345703125, -89.5078125, -39.63270568847656, 10.242401123046875, 60.11750793457031, 109.99261474609375, 159.8677215576172, 209.74282836914062, 259.617919921875, 309.4930419921875, 359.3681640625, 409.2432556152344, 459.11834716796875, 508.99346923828125, 558.8685913085938, 608.74365234375, 658.6187744140625, 708.493896484375, 758.3690185546875, 808.244140625, 858.1192016601562, 907.9943237304688, 957.8694458007812, 1007.7445068359375, 1057.61962890625, 1107.4947509765625, 1157.369873046875, 1207.2449951171875, 1257.1201171875, 1306.9951171875, 1356.8702392578125, 1406.745361328125, 1456.6204833984375, 1506.49560546875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 13.0, 9.0, 14.0, 20.0, 43.0, 58.0, 67.0, 107.0, 164.0, 250.0, 363.0, 540.0, 839.0, 1253.0, 2016.0, 3156.0, 5316.0, 9332.0, 18169.0, 42473.0, 134624.0, 1080310.0, 2625895.0, 162697.0, 51532.0, 22702.0, 12151.0, 7215.0, 4499.0, 2738.0, 1880.0, 1212.0, 805.0, 580.0, 353.0, 269.0, 191.0, 128.0, 83.0, 69.0, 46.0, 32.0, 20.0, 14.0, 13.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0], "bins": [-11.4453125, -11.088623046875, -10.73193359375, -10.375244140625, -10.0185546875, -9.661865234375, -9.30517578125, -8.948486328125, -8.591796875, -8.235107421875, -7.87841796875, -7.521728515625, -7.1650390625, -6.808349609375, -6.45166015625, -6.094970703125, -5.73828125, -5.381591796875, -5.02490234375, -4.668212890625, -4.3115234375, -3.954833984375, -3.59814453125, -3.241455078125, -2.884765625, -2.528076171875, -2.17138671875, -1.814697265625, -1.4580078125, -1.101318359375, -0.74462890625, -0.387939453125, -0.03125, 0.325439453125, 0.68212890625, 1.038818359375, 1.3955078125, 1.752197265625, 2.10888671875, 2.465576171875, 2.822265625, 3.178955078125, 3.53564453125, 3.892333984375, 4.2490234375, 4.605712890625, 4.96240234375, 5.319091796875, 5.67578125, 6.032470703125, 6.38916015625, 6.745849609375, 7.1025390625, 7.459228515625, 7.81591796875, 8.172607421875, 8.529296875, 8.885986328125, 9.24267578125, 9.599365234375, 9.9560546875, 10.312744140625, 10.66943359375, 11.026123046875, 11.3828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 7.0, 7.0, 8.0, 17.0, 24.0, 31.0, 42.0, 60.0, 97.0, 153.0, 181.0, 97.0, 59.0, 66.0, 24.0, 30.0, 15.0, 9.0, 12.0, 7.0, 6.0, 5.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.419921875, -1.3760986328125, -1.332275390625, -1.2884521484375, -1.24462890625, -1.2008056640625, -1.156982421875, -1.1131591796875, -1.0693359375, -1.0255126953125, -0.981689453125, -0.9378662109375, -0.89404296875, -0.8502197265625, -0.806396484375, -0.7625732421875, -0.71875, -0.6749267578125, -0.631103515625, -0.5872802734375, -0.54345703125, -0.4996337890625, -0.455810546875, -0.4119873046875, -0.3681640625, -0.3243408203125, -0.280517578125, -0.2366943359375, -0.19287109375, -0.1490478515625, -0.105224609375, -0.0614013671875, -0.017578125, 0.0262451171875, 0.070068359375, 0.1138916015625, 0.15771484375, 0.2015380859375, 0.245361328125, 0.2891845703125, 0.3330078125, 0.3768310546875, 0.420654296875, 0.4644775390625, 0.50830078125, 0.5521240234375, 0.595947265625, 0.6397705078125, 0.68359375, 0.7274169921875, 0.771240234375, 0.8150634765625, 0.85888671875, 0.9027099609375, 0.946533203125, 0.9903564453125, 1.0341796875, 1.0780029296875, 1.121826171875, 1.1656494140625, 1.20947265625, 1.2532958984375, 1.297119140625, 1.3409423828125, 1.384765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 7.0, 11.0, 14.0, 24.0, 28.0, 36.0, 54.0, 62.0, 113.0, 164.0, 232.0, 291.0, 483.0, 744.0, 1307.0, 2303.0, 4810.0, 10511.0, 26774.0, 83458.0, 376840.0, 2600137.0, 864165.0, 151712.0, 41788.0, 14897.0, 6360.0, 2953.0, 1582.0, 850.0, 544.0, 322.0, 196.0, 133.0, 92.0, 76.0, 53.0, 61.0, 25.0, 23.0, 9.0, 8.0, 8.0, 8.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.8203125, -10.4434814453125, -10.066650390625, -9.6898193359375, -9.31298828125, -8.9361572265625, -8.559326171875, -8.1824951171875, -7.8056640625, -7.4288330078125, -7.052001953125, -6.6751708984375, -6.29833984375, -5.9215087890625, -5.544677734375, -5.1678466796875, -4.791015625, -4.4141845703125, -4.037353515625, -3.6605224609375, -3.28369140625, -2.9068603515625, -2.530029296875, -2.1531982421875, -1.7763671875, -1.3995361328125, -1.022705078125, -0.6458740234375, -0.26904296875, 0.1077880859375, 0.484619140625, 0.8614501953125, 1.23828125, 1.6151123046875, 1.991943359375, 2.3687744140625, 2.74560546875, 3.1224365234375, 3.499267578125, 3.8760986328125, 4.2529296875, 4.6297607421875, 5.006591796875, 5.3834228515625, 5.76025390625, 6.1370849609375, 6.513916015625, 6.8907470703125, 7.267578125, 7.6444091796875, 8.021240234375, 8.3980712890625, 8.77490234375, 9.1517333984375, 9.528564453125, 9.9053955078125, 10.2822265625, 10.6590576171875, 11.035888671875, 11.4127197265625, 11.78955078125, 12.1663818359375, 12.543212890625, 12.9200439453125, 13.296875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 14.0, 11.0, 14.0, 18.0, 14.0, 21.0, 18.0, 20.0, 31.0, 52.0, 45.0, 64.0, 71.0, 82.0, 123.0, 142.0, 206.0, 251.0, 349.0, 682.0, 458.0, 295.0, 248.0, 173.0, 112.0, 104.0, 88.0, 52.0, 63.0, 42.0, 43.0, 40.0, 31.0, 16.0, 17.0, 11.0, 11.0, 9.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 3.0], "bins": [-3.84765625, -3.748016357421875, -3.64837646484375, -3.548736572265625, -3.4490966796875, -3.349456787109375, -3.24981689453125, -3.150177001953125, -3.050537109375, -2.950897216796875, -2.85125732421875, -2.751617431640625, -2.6519775390625, -2.552337646484375, -2.45269775390625, -2.353057861328125, -2.25341796875, -2.153778076171875, -2.05413818359375, -1.954498291015625, -1.8548583984375, -1.755218505859375, -1.65557861328125, -1.555938720703125, -1.456298828125, -1.356658935546875, -1.25701904296875, -1.157379150390625, -1.0577392578125, -0.958099365234375, -0.85845947265625, -0.758819580078125, -0.6591796875, -0.559539794921875, -0.45989990234375, -0.360260009765625, -0.2606201171875, -0.160980224609375, -0.06134033203125, 0.038299560546875, 0.137939453125, 0.237579345703125, 0.33721923828125, 0.436859130859375, 0.5364990234375, 0.636138916015625, 0.73577880859375, 0.835418701171875, 0.93505859375, 1.034698486328125, 1.13433837890625, 1.233978271484375, 1.3336181640625, 1.433258056640625, 1.53289794921875, 1.632537841796875, 1.732177734375, 1.831817626953125, 1.93145751953125, 2.031097412109375, 2.1307373046875, 2.230377197265625, 2.33001708984375, 2.429656982421875, 2.529296875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 8.0, 15.0, 18.0, 31.0, 33.0, 56.0, 90.0, 125.0, 155.0, 152.0, 91.0, 73.0, 49.0, 37.0, 20.0, 17.0, 8.0, 5.0, 6.0, 6.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.2535400390625, -35.95635223388672, -34.65916442871094, -33.361976623535156, -32.064788818359375, -30.76759910583496, -29.47041130065918, -28.173221588134766, -26.876033782958984, -25.578845977783203, -24.281658172607422, -22.98447036743164, -21.687280654907227, -20.390092849731445, -19.092905044555664, -17.79571533203125, -16.4985294342041, -15.20134162902832, -13.904152870178223, -12.606965065002441, -11.309776306152344, -10.012588500976562, -8.715400695800781, -7.418211936950684, -6.121024131774902, -4.823835849761963, -3.5266478061676025, -2.229459762573242, -0.9322714805603027, 0.3649168014526367, 1.662104606628418, 2.9592933654785156, 4.256481170654297, 5.553669452667236, 6.850857734680176, 8.148045539855957, 9.445234298706055, 10.742422103881836, 12.039609909057617, 13.336798667907715, 14.633986473083496, 15.931174278259277, 17.228363037109375, 18.525550842285156, 19.822738647460938, 21.11992645263672, 22.4171142578125, 23.714303970336914, 25.011491775512695, 26.308679580688477, 27.605867385864258, 28.903057098388672, 30.200244903564453, 31.497432708740234, 32.794620513916016, 34.0918083190918, 35.38899612426758, 36.68618392944336, 37.98337173461914, 39.28055953979492, 40.5777473449707, 41.87493896484375, 43.17212677001953, 44.46931457519531, 45.766502380371094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 8.0, 15.0, 15.0, 19.0, 23.0, 35.0, 47.0, 67.0, 64.0, 51.0, 54.0, 61.0, 65.0, 71.0, 63.0, 56.0, 51.0, 51.0, 46.0, 40.0, 33.0, 17.0, 20.0, 13.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.13752746582031, -36.99752426147461, -35.857521057128906, -34.7175178527832, -33.5775146484375, -32.4375114440918, -31.297508239746094, -30.15750503540039, -29.017501831054688, -27.877498626708984, -26.73749542236328, -25.597492218017578, -24.457489013671875, -23.317485809326172, -22.17748260498047, -21.037479400634766, -19.897476196289062, -18.75747299194336, -17.617469787597656, -16.477466583251953, -15.33746337890625, -14.197460174560547, -13.057456970214844, -11.91745376586914, -10.777450561523438, -9.637447357177734, -8.497444152832031, -7.357440948486328, -6.217437744140625, -5.077434539794922, -3.9374313354492188, -2.7974281311035156, -1.6574249267578125, -0.5174217224121094, 0.6225814819335938, 1.7625846862792969, 2.902587890625, 4.042591094970703, 5.182594299316406, 6.322597503662109, 7.4626007080078125, 8.602603912353516, 9.742607116699219, 10.882610321044922, 12.022613525390625, 13.162616729736328, 14.302619934082031, 15.442623138427734, 16.582626342773438, 17.72262954711914, 18.862632751464844, 20.002635955810547, 21.14263916015625, 22.282642364501953, 23.422645568847656, 24.56264877319336, 25.702651977539062, 26.842655181884766, 27.98265838623047, 29.122661590576172, 30.262664794921875, 31.402667999267578, 32.54267120361328, 33.682674407958984, 34.82267761230469]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 11.0, 6.0, 10.0, 19.0, 25.0, 26.0, 27.0, 50.0, 65.0, 93.0, 126.0, 159.0, 201.0, 293.0, 445.0, 672.0, 863.0, 1335.0, 1968.0, 3063.0, 4789.0, 8846.0, 16864.0, 36066.0, 87613.0, 301161.0, 390516.0, 106294.0, 42024.0, 19359.0, 9818.0, 5443.0, 3330.0, 2146.0, 1389.0, 935.0, 675.0, 496.0, 384.0, 258.0, 184.0, 141.0, 90.0, 67.0, 64.0, 39.0, 33.0, 17.0, 17.0, 15.0, 12.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.61328125, -6.4072265625, -6.201171875, -5.9951171875, -5.7890625, -5.5830078125, -5.376953125, -5.1708984375, -4.96484375, -4.7587890625, -4.552734375, -4.3466796875, -4.140625, -3.9345703125, -3.728515625, -3.5224609375, -3.31640625, -3.1103515625, -2.904296875, -2.6982421875, -2.4921875, -2.2861328125, -2.080078125, -1.8740234375, -1.66796875, -1.4619140625, -1.255859375, -1.0498046875, -0.84375, -0.6376953125, -0.431640625, -0.2255859375, -0.01953125, 0.1865234375, 0.392578125, 0.5986328125, 0.8046875, 1.0107421875, 1.216796875, 1.4228515625, 1.62890625, 1.8349609375, 2.041015625, 2.2470703125, 2.453125, 2.6591796875, 2.865234375, 3.0712890625, 3.27734375, 3.4833984375, 3.689453125, 3.8955078125, 4.1015625, 4.3076171875, 4.513671875, 4.7197265625, 4.92578125, 5.1318359375, 5.337890625, 5.5439453125, 5.75, 5.9560546875, 6.162109375, 6.3681640625, 6.57421875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 13.0, 14.0, 22.0, 22.0, 36.0, 30.0, 43.0, 52.0, 62.0, 82.0, 66.0, 65.0, 72.0, 62.0, 64.0, 49.0, 47.0, 31.0, 28.0, 30.0, 22.0, 13.0, 8.0, 10.0, 7.0, 7.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.28515625, -1.2445068359375, -1.203857421875, -1.1632080078125, -1.12255859375, -1.0819091796875, -1.041259765625, -1.0006103515625, -0.9599609375, -0.9193115234375, -0.878662109375, -0.8380126953125, -0.79736328125, -0.7567138671875, -0.716064453125, -0.6754150390625, -0.634765625, -0.5941162109375, -0.553466796875, -0.5128173828125, -0.47216796875, -0.4315185546875, -0.390869140625, -0.3502197265625, -0.3095703125, -0.2689208984375, -0.228271484375, -0.1876220703125, -0.14697265625, -0.1063232421875, -0.065673828125, -0.0250244140625, 0.015625, 0.0562744140625, 0.096923828125, 0.1375732421875, 0.17822265625, 0.2188720703125, 0.259521484375, 0.3001708984375, 0.3408203125, 0.3814697265625, 0.422119140625, 0.4627685546875, 0.50341796875, 0.5440673828125, 0.584716796875, 0.6253662109375, 0.666015625, 0.7066650390625, 0.747314453125, 0.7879638671875, 0.82861328125, 0.8692626953125, 0.909912109375, 0.9505615234375, 0.9912109375, 1.0318603515625, 1.072509765625, 1.1131591796875, 1.15380859375, 1.1944580078125, 1.235107421875, 1.2757568359375, 1.31640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 13.0, 14.0, 16.0, 17.0, 38.0, 37.0, 51.0, 68.0, 96.0, 142.0, 204.0, 268.0, 362.0, 547.0, 844.0, 1219.0, 1925.0, 3246.0, 5510.0, 9610.0, 18502.0, 38294.0, 89861.0, 293104.0, 381429.0, 109808.0, 44311.0, 21444.0, 11360.0, 6239.0, 3679.0, 2175.0, 1362.0, 871.0, 554.0, 382.0, 276.0, 195.0, 141.0, 98.0, 72.0, 55.0, 32.0, 16.0, 26.0, 8.0, 12.0, 8.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.55078125, -5.372314453125, -5.19384765625, -5.015380859375, -4.8369140625, -4.658447265625, -4.47998046875, -4.301513671875, -4.123046875, -3.944580078125, -3.76611328125, -3.587646484375, -3.4091796875, -3.230712890625, -3.05224609375, -2.873779296875, -2.6953125, -2.516845703125, -2.33837890625, -2.159912109375, -1.9814453125, -1.802978515625, -1.62451171875, -1.446044921875, -1.267578125, -1.089111328125, -0.91064453125, -0.732177734375, -0.5537109375, -0.375244140625, -0.19677734375, -0.018310546875, 0.16015625, 0.338623046875, 0.51708984375, 0.695556640625, 0.8740234375, 1.052490234375, 1.23095703125, 1.409423828125, 1.587890625, 1.766357421875, 1.94482421875, 2.123291015625, 2.3017578125, 2.480224609375, 2.65869140625, 2.837158203125, 3.015625, 3.194091796875, 3.37255859375, 3.551025390625, 3.7294921875, 3.907958984375, 4.08642578125, 4.264892578125, 4.443359375, 4.621826171875, 4.80029296875, 4.978759765625, 5.1572265625, 5.335693359375, 5.51416015625, 5.692626953125, 5.87109375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 5.0, 10.0, 16.0, 18.0, 21.0, 22.0, 24.0, 30.0, 34.0, 26.0, 37.0, 44.0, 50.0, 38.0, 52.0, 40.0, 48.0, 38.0, 35.0, 41.0, 45.0, 36.0, 31.0, 21.0, 30.0, 23.0, 24.0, 19.0, 16.0, 20.0, 15.0, 16.0, 10.0, 13.0, 7.0, 9.0, 4.0, 5.0, 1.0, 4.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.58245849609375, -6.3719482421875, -6.16143798828125, -5.950927734375, -5.74041748046875, -5.5299072265625, -5.31939697265625, -5.10888671875, -4.89837646484375, -4.6878662109375, -4.47735595703125, -4.266845703125, -4.05633544921875, -3.8458251953125, -3.63531494140625, -3.4248046875, -3.21429443359375, -3.0037841796875, -2.79327392578125, -2.582763671875, -2.37225341796875, -2.1617431640625, -1.95123291015625, -1.74072265625, -1.53021240234375, -1.3197021484375, -1.10919189453125, -0.898681640625, -0.68817138671875, -0.4776611328125, -0.26715087890625, -0.056640625, 0.15386962890625, 0.3643798828125, 0.57489013671875, 0.785400390625, 0.99591064453125, 1.2064208984375, 1.41693115234375, 1.62744140625, 1.83795166015625, 2.0484619140625, 2.25897216796875, 2.469482421875, 2.67999267578125, 2.8905029296875, 3.10101318359375, 3.3115234375, 3.52203369140625, 3.7325439453125, 3.94305419921875, 4.153564453125, 4.36407470703125, 4.5745849609375, 4.78509521484375, 4.99560546875, 5.20611572265625, 5.4166259765625, 5.62713623046875, 5.837646484375, 6.04815673828125, 6.2586669921875, 6.46917724609375, 6.6796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 8.0, 6.0, 11.0, 12.0, 18.0, 33.0, 40.0, 47.0, 90.0, 133.0, 190.0, 271.0, 503.0, 918.0, 1668.0, 3164.0, 6971.0, 18215.0, 57697.0, 261974.0, 511486.0, 129919.0, 33118.0, 11529.0, 4978.0, 2489.0, 1218.0, 728.0, 392.0, 270.0, 152.0, 90.0, 66.0, 44.0, 30.0, 25.0, 11.0, 7.0, 3.0, 6.0, 6.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.265625, -3.161224365234375, -3.05682373046875, -2.952423095703125, -2.8480224609375, -2.743621826171875, -2.63922119140625, -2.534820556640625, -2.430419921875, -2.326019287109375, -2.22161865234375, -2.117218017578125, -2.0128173828125, -1.908416748046875, -1.80401611328125, -1.699615478515625, -1.59521484375, -1.490814208984375, -1.38641357421875, -1.282012939453125, -1.1776123046875, -1.073211669921875, -0.96881103515625, -0.864410400390625, -0.760009765625, -0.655609130859375, -0.55120849609375, -0.446807861328125, -0.3424072265625, -0.238006591796875, -0.13360595703125, -0.029205322265625, 0.0751953125, 0.179595947265625, 0.28399658203125, 0.388397216796875, 0.4927978515625, 0.597198486328125, 0.70159912109375, 0.805999755859375, 0.910400390625, 1.014801025390625, 1.11920166015625, 1.223602294921875, 1.3280029296875, 1.432403564453125, 1.53680419921875, 1.641204833984375, 1.74560546875, 1.850006103515625, 1.95440673828125, 2.058807373046875, 2.1632080078125, 2.267608642578125, 2.37200927734375, 2.476409912109375, 2.580810546875, 2.685211181640625, 2.78961181640625, 2.894012451171875, 2.9984130859375, 3.102813720703125, 3.20721435546875, 3.311614990234375, 3.416015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 9.0, 4.0, 10.0, 9.0, 12.0, 28.0, 20.0, 23.0, 37.0, 36.0, 38.0, 60.0, 70.0, 91.0, 70.0, 78.0, 83.0, 74.0, 57.0, 40.0, 42.0, 27.0, 26.0, 17.0, 20.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.00013637542724609375, -0.00013278890401124954, -0.00012920238077640533, -0.00012561585754156113, -0.00012202933430671692, -0.00011844281107187271, -0.0001148562878370285, -0.0001112697646021843, -0.00010768324136734009, -0.00010409671813249588, -0.00010051019489765167, -9.692367166280746e-05, -9.333714842796326e-05, -8.975062519311905e-05, -8.616410195827484e-05, -8.257757872343063e-05, -7.899105548858643e-05, -7.540453225374222e-05, -7.181800901889801e-05, -6.82314857840538e-05, -6.46449625492096e-05, -6.105843931436539e-05, -5.747191607952118e-05, -5.388539284467697e-05, -5.0298869609832764e-05, -4.6712346374988556e-05, -4.312582314014435e-05, -3.953929990530014e-05, -3.595277667045593e-05, -3.2366253435611725e-05, -2.8779730200767517e-05, -2.519320696592331e-05, -2.16066837310791e-05, -1.8020160496234894e-05, -1.4433637261390686e-05, -1.0847114026546478e-05, -7.2605907917022705e-06, -3.6740675568580627e-06, -8.754432201385498e-08, 3.4989789128303528e-06, 7.0855021476745605e-06, 1.0672025382518768e-05, 1.4258548617362976e-05, 1.7845071852207184e-05, 2.143159508705139e-05, 2.50181183218956e-05, 2.8604641556739807e-05, 3.2191164791584015e-05, 3.577768802642822e-05, 3.936421126127243e-05, 4.295073449611664e-05, 4.6537257730960846e-05, 5.0123780965805054e-05, 5.371030420064926e-05, 5.729682743549347e-05, 6.088335067033768e-05, 6.446987390518188e-05, 6.805639714002609e-05, 7.16429203748703e-05, 7.522944360971451e-05, 7.881596684455872e-05, 8.240249007940292e-05, 8.598901331424713e-05, 8.957553654909134e-05, 9.316205978393555e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 13.0, 13.0, 9.0, 22.0, 22.0, 24.0, 41.0, 55.0, 90.0, 148.0, 168.0, 283.0, 436.0, 658.0, 1134.0, 1736.0, 3034.0, 5487.0, 10688.0, 22217.0, 52685.0, 143343.0, 355610.0, 274566.0, 100979.0, 38607.0, 17068.0, 8268.0, 4431.0, 2526.0, 1490.0, 878.0, 586.0, 373.0, 269.0, 173.0, 128.0, 77.0, 54.0, 47.0, 33.0, 23.0, 20.0, 8.0, 15.0, 11.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.063629150390625, -1.99444580078125, -1.925262451171875, -1.8560791015625, -1.786895751953125, -1.71771240234375, -1.648529052734375, -1.579345703125, -1.510162353515625, -1.44097900390625, -1.371795654296875, -1.3026123046875, -1.233428955078125, -1.16424560546875, -1.095062255859375, -1.02587890625, -0.956695556640625, -0.88751220703125, -0.818328857421875, -0.7491455078125, -0.679962158203125, -0.61077880859375, -0.541595458984375, -0.472412109375, -0.403228759765625, -0.33404541015625, -0.264862060546875, -0.1956787109375, -0.126495361328125, -0.05731201171875, 0.011871337890625, 0.0810546875, 0.150238037109375, 0.21942138671875, 0.288604736328125, 0.3577880859375, 0.426971435546875, 0.49615478515625, 0.565338134765625, 0.634521484375, 0.703704833984375, 0.77288818359375, 0.842071533203125, 0.9112548828125, 0.980438232421875, 1.04962158203125, 1.118804931640625, 1.18798828125, 1.257171630859375, 1.32635498046875, 1.395538330078125, 1.4647216796875, 1.533905029296875, 1.60308837890625, 1.672271728515625, 1.741455078125, 1.810638427734375, 1.87982177734375, 1.949005126953125, 2.0181884765625, 2.087371826171875, 2.15655517578125, 2.225738525390625, 2.294921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 9.0, 12.0, 12.0, 16.0, 14.0, 23.0, 17.0, 31.0, 22.0, 28.0, 34.0, 45.0, 34.0, 38.0, 62.0, 60.0, 44.0, 45.0, 47.0, 55.0, 45.0, 41.0, 40.0, 42.0, 20.0, 23.0, 20.0, 14.0, 14.0, 14.0, 8.0, 12.0, 7.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8251953125, -1.7693939208984375, -1.713592529296875, -1.6577911376953125, -1.60198974609375, -1.5461883544921875, -1.490386962890625, -1.4345855712890625, -1.3787841796875, -1.3229827880859375, -1.267181396484375, -1.2113800048828125, -1.15557861328125, -1.0997772216796875, -1.043975830078125, -0.9881744384765625, -0.932373046875, -0.8765716552734375, -0.820770263671875, -0.7649688720703125, -0.70916748046875, -0.6533660888671875, -0.597564697265625, -0.5417633056640625, -0.4859619140625, -0.4301605224609375, -0.374359130859375, -0.3185577392578125, -0.26275634765625, -0.2069549560546875, -0.151153564453125, -0.0953521728515625, -0.03955078125, 0.0162506103515625, 0.072052001953125, 0.1278533935546875, 0.18365478515625, 0.2394561767578125, 0.295257568359375, 0.3510589599609375, 0.4068603515625, 0.4626617431640625, 0.518463134765625, 0.5742645263671875, 0.63006591796875, 0.6858673095703125, 0.741668701171875, 0.7974700927734375, 0.853271484375, 0.9090728759765625, 0.964874267578125, 1.0206756591796875, 1.07647705078125, 1.1322784423828125, 1.188079833984375, 1.2438812255859375, 1.2996826171875, 1.3554840087890625, 1.411285400390625, 1.4670867919921875, 1.52288818359375, 1.5786895751953125, 1.634490966796875, 1.6902923583984375, 1.74609375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 3.0, 7.0, 9.0, 16.0, 31.0, 44.0, 90.0, 225.0, 268.0, 123.0, 73.0, 22.0, 27.0, 22.0, 15.0, 7.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.48335266113281, -49.89387512207031, -47.30439758300781, -44.71492004394531, -42.12544250488281, -39.53596496582031, -36.94648361206055, -34.35700607299805, -31.767528533935547, -29.178050994873047, -26.588573455810547, -23.999094009399414, -21.409616470336914, -18.820138931274414, -16.23065948486328, -13.641181945800781, -11.051704406738281, -8.462226867675781, -5.872748374938965, -3.2832703590393066, -0.6937923431396484, 1.8956851959228516, 4.485163688659668, 7.074642181396484, 9.664119720458984, 12.253597259521484, 14.8430757522583, 17.432554244995117, 20.022031784057617, 22.611509323120117, 25.20098876953125, 27.79046630859375, 30.37994384765625, 32.96942138671875, 35.55889892578125, 38.14837646484375, 40.73785400390625, 43.32733154296875, 45.916812896728516, 48.506290435791016, 51.095767974853516, 53.685245513916016, 56.274723052978516, 58.864200592041016, 61.45368194580078, 64.04315948486328, 66.63263702392578, 69.22211456298828, 71.81159210205078, 74.40106964111328, 76.99054718017578, 79.58002471923828, 82.16950225830078, 84.75897979736328, 87.34845733642578, 89.93794250488281, 92.52742004394531, 95.11689758300781, 97.70637512207031, 100.29585266113281, 102.88533020019531, 105.47480773925781, 108.06428527832031, 110.65376281738281, 113.24324035644531]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 9.0, 12.0, 19.0, 32.0, 47.0, 68.0, 74.0, 121.0, 113.0, 142.0, 109.0, 73.0, 46.0, 31.0, 21.0, 13.0, 14.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-124.30231475830078, -120.80897521972656, -117.31563568115234, -113.82229614257812, -110.3289566040039, -106.83561706542969, -103.34228515625, -99.84893798828125, -96.35560607910156, -92.86226654052734, -89.36892700195312, -85.8755874633789, -82.38224792480469, -78.88890838623047, -75.39556884765625, -71.90223693847656, -68.40888977050781, -64.9155502319336, -61.422210693359375, -57.928871154785156, -54.43553161621094, -50.94219207763672, -47.448856353759766, -43.95551681518555, -40.46217727661133, -36.96883773803711, -33.47549819946289, -29.982160568237305, -26.488821029663086, -22.995481491088867, -19.50214385986328, -16.008804321289062, -12.515457153320312, -9.022117614746094, -5.528779029846191, -2.035440444946289, 1.4578990936279297, 4.951238632202148, 8.444576263427734, 11.937915802001953, 15.431255340576172, 18.92459487915039, 22.41793441772461, 25.911272048950195, 29.404611587524414, 32.89794921875, 36.39128875732422, 39.88462829589844, 43.377967834472656, 46.871307373046875, 50.364646911621094, 53.85798645019531, 57.35132598876953, 60.84466552734375, 64.33799743652344, 67.83134460449219, 71.32467651367188, 74.8180160522461, 78.31135559082031, 81.80469512939453, 85.29803466796875, 88.79137420654297, 92.28471374511719, 95.77804565429688, 99.27139282226562]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 8.0, 4.0, 5.0, 5.0, 10.0, 15.0, 24.0, 27.0, 44.0, 58.0, 74.0, 102.0, 187.0, 295.0, 464.0, 798.0, 1488.0, 2891.0, 6654.0, 18095.0, 71599.0, 3099867.0, 904064.0, 60326.0, 16219.0, 5813.0, 2553.0, 1143.0, 604.0, 311.0, 181.0, 122.0, 82.0, 48.0, 38.0, 21.0, 11.0, 11.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-27.203125, -26.4462890625, -25.689453125, -24.9326171875, -24.17578125, -23.4189453125, -22.662109375, -21.9052734375, -21.1484375, -20.3916015625, -19.634765625, -18.8779296875, -18.12109375, -17.3642578125, -16.607421875, -15.8505859375, -15.09375, -14.3369140625, -13.580078125, -12.8232421875, -12.06640625, -11.3095703125, -10.552734375, -9.7958984375, -9.0390625, -8.2822265625, -7.525390625, -6.7685546875, -6.01171875, -5.2548828125, -4.498046875, -3.7412109375, -2.984375, -2.2275390625, -1.470703125, -0.7138671875, 0.04296875, 0.7998046875, 1.556640625, 2.3134765625, 3.0703125, 3.8271484375, 4.583984375, 5.3408203125, 6.09765625, 6.8544921875, 7.611328125, 8.3681640625, 9.125, 9.8818359375, 10.638671875, 11.3955078125, 12.15234375, 12.9091796875, 13.666015625, 14.4228515625, 15.1796875, 15.9365234375, 16.693359375, 17.4501953125, 18.20703125, 18.9638671875, 19.720703125, 20.4775390625, 21.234375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 9.0, 13.0, 15.0, 32.0, 30.0, 40.0, 67.0, 56.0, 70.0, 88.0, 91.0, 79.0, 72.0, 64.0, 52.0, 55.0, 35.0, 31.0, 20.0, 20.0, 8.0, 4.0, 11.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.85546875, -1.8031463623046875, -1.750823974609375, -1.6985015869140625, -1.64617919921875, -1.5938568115234375, -1.541534423828125, -1.4892120361328125, -1.4368896484375, -1.3845672607421875, -1.332244873046875, -1.2799224853515625, -1.22760009765625, -1.1752777099609375, -1.122955322265625, -1.0706329345703125, -1.018310546875, -0.9659881591796875, -0.913665771484375, -0.8613433837890625, -0.80902099609375, -0.7566986083984375, -0.704376220703125, -0.6520538330078125, -0.5997314453125, -0.5474090576171875, -0.495086669921875, -0.4427642822265625, -0.39044189453125, -0.3381195068359375, -0.285797119140625, -0.2334747314453125, -0.18115234375, -0.1288299560546875, -0.076507568359375, -0.0241851806640625, 0.02813720703125, 0.0804595947265625, 0.132781982421875, 0.1851043701171875, 0.2374267578125, 0.2897491455078125, 0.342071533203125, 0.3943939208984375, 0.44671630859375, 0.4990386962890625, 0.551361083984375, 0.6036834716796875, 0.656005859375, 0.7083282470703125, 0.760650634765625, 0.8129730224609375, 0.86529541015625, 0.9176177978515625, 0.969940185546875, 1.0222625732421875, 1.0745849609375, 1.1269073486328125, 1.179229736328125, 1.2315521240234375, 1.28387451171875, 1.3361968994140625, 1.388519287109375, 1.4408416748046875, 1.4931640625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 13.0, 9.0, 7.0, 18.0, 23.0, 17.0, 42.0, 56.0, 81.0, 127.0, 172.0, 274.0, 471.0, 791.0, 1276.0, 2067.0, 3882.0, 7446.0, 16485.0, 43699.0, 149074.0, 1169380.0, 2528113.0, 184176.0, 50227.0, 18509.0, 8076.0, 4011.0, 2228.0, 1352.0, 806.0, 496.0, 287.0, 176.0, 120.0, 89.0, 61.0, 44.0, 34.0, 14.0, 14.0, 11.0, 10.0, 7.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.625, -14.154296875, -13.68359375, -13.212890625, -12.7421875, -12.271484375, -11.80078125, -11.330078125, -10.859375, -10.388671875, -9.91796875, -9.447265625, -8.9765625, -8.505859375, -8.03515625, -7.564453125, -7.09375, -6.623046875, -6.15234375, -5.681640625, -5.2109375, -4.740234375, -4.26953125, -3.798828125, -3.328125, -2.857421875, -2.38671875, -1.916015625, -1.4453125, -0.974609375, -0.50390625, -0.033203125, 0.4375, 0.908203125, 1.37890625, 1.849609375, 2.3203125, 2.791015625, 3.26171875, 3.732421875, 4.203125, 4.673828125, 5.14453125, 5.615234375, 6.0859375, 6.556640625, 7.02734375, 7.498046875, 7.96875, 8.439453125, 8.91015625, 9.380859375, 9.8515625, 10.322265625, 10.79296875, 11.263671875, 11.734375, 12.205078125, 12.67578125, 13.146484375, 13.6171875, 14.087890625, 14.55859375, 15.029296875, 15.5]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 4.0, 5.0, 4.0, 5.0, 5.0, 12.0, 17.0, 23.0, 39.0, 40.0, 54.0, 80.0, 115.0, 261.0, 539.0, 1756.0, 461.0, 213.0, 140.0, 98.0, 57.0, 36.0, 28.0, 16.0, 12.0, 15.0, 9.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.66015625, -3.553680419921875, -3.44720458984375, -3.340728759765625, -3.2342529296875, -3.127777099609375, -3.02130126953125, -2.914825439453125, -2.808349609375, -2.701873779296875, -2.59539794921875, -2.488922119140625, -2.3824462890625, -2.275970458984375, -2.16949462890625, -2.063018798828125, -1.95654296875, -1.850067138671875, -1.74359130859375, -1.637115478515625, -1.5306396484375, -1.424163818359375, -1.31768798828125, -1.211212158203125, -1.104736328125, -0.998260498046875, -0.89178466796875, -0.785308837890625, -0.6788330078125, -0.572357177734375, -0.46588134765625, -0.359405517578125, -0.2529296875, -0.146453857421875, -0.03997802734375, 0.066497802734375, 0.1729736328125, 0.279449462890625, 0.38592529296875, 0.492401123046875, 0.598876953125, 0.705352783203125, 0.81182861328125, 0.918304443359375, 1.0247802734375, 1.131256103515625, 1.23773193359375, 1.344207763671875, 1.45068359375, 1.557159423828125, 1.66363525390625, 1.770111083984375, 1.8765869140625, 1.983062744140625, 2.08953857421875, 2.196014404296875, 2.302490234375, 2.408966064453125, 2.51544189453125, 2.621917724609375, 2.7283935546875, 2.834869384765625, 2.94134521484375, 3.047821044921875, 3.154296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 9.0, 16.0, 26.0, 49.0, 113.0, 208.0, 249.0, 196.0, 69.0, 31.0, 17.0, 8.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.77820587158203, -23.713666915893555, -22.649127960205078, -21.5845890045166, -20.520050048828125, -19.45551109313965, -18.390972137451172, -17.326431274414062, -16.26189422607422, -15.197355270385742, -14.132816314697266, -13.068277359008789, -12.003738403320312, -10.939199447631836, -9.874659538269043, -8.810120582580566, -7.745580673217773, -6.681041717529297, -5.61650276184082, -4.5519633293151855, -3.487424373626709, -2.4228854179382324, -1.3583459854125977, -0.2938070297241211, 0.7707319259643555, 1.8352710008621216, 2.8998100757598877, 3.9643492698669434, 5.02888822555542, 6.0934271812438965, 7.157966613769531, 8.222505569458008, 9.287044525146484, 10.351583480834961, 11.416122436523438, 12.480661392211914, 13.54520034790039, 14.609739303588867, 15.67427921295166, 16.738819122314453, 17.803356170654297, 18.867895126342773, 19.93243408203125, 20.996973037719727, 22.061511993408203, 23.12605094909668, 24.190589904785156, 25.255130767822266, 26.319669723510742, 27.38420867919922, 28.448747634887695, 29.513286590576172, 30.57782554626465, 31.642364501953125, 32.706905364990234, 33.77144241333008, 34.83598327636719, 35.9005241394043, 36.96506118774414, 38.02960205078125, 39.094139099121094, 40.1586799621582, 41.22321701049805, 42.287757873535156, 43.352294921875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 16.0, 17.0, 16.0, 19.0, 31.0, 29.0, 45.0, 51.0, 49.0, 43.0, 57.0, 70.0, 70.0, 69.0, 61.0, 42.0, 41.0, 45.0, 50.0, 33.0, 21.0, 21.0, 15.0, 11.0, 10.0, 7.0, 7.0, 6.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0], "bins": [-14.376716613769531, -13.967376708984375, -13.558037757873535, -13.148697853088379, -12.739357948303223, -12.330018997192383, -11.920679092407227, -11.51133918762207, -11.10200023651123, -10.692660331726074, -10.283321380615234, -9.873981475830078, -9.464641571044922, -9.055302619934082, -8.645962715148926, -8.236623764038086, -7.8272833824157715, -7.417943954467773, -7.008604049682617, -6.599264621734619, -6.189925193786621, -5.780585289001465, -5.371245861053467, -4.961906433105469, -4.5525665283203125, -4.1432271003723145, -3.7338874340057373, -3.32454776763916, -2.915208339691162, -2.505868673324585, -2.096529006958008, -1.6871895790100098, -1.2778501510620117, -0.8685106039047241, -0.45917099714279175, -0.049831390380859375, 0.3595081567764282, 0.7688477039337158, 1.178187370300293, 1.587526798248291, 1.9968664646148682, 2.4062061309814453, 2.8155455589294434, 3.2248852252960205, 3.6342248916625977, 4.043564319610596, 4.452903747558594, 4.86224365234375, 5.271583080291748, 5.680922508239746, 6.090262413024902, 6.4996018409729, 6.908941268920898, 7.318281173706055, 7.727620601654053, 8.13696002960205, 8.546299934387207, 8.955639839172363, 9.364978790283203, 9.77431869506836, 10.183658599853516, 10.592997550964355, 11.002337455749512, 11.411676406860352, 11.821016311645508]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 11.0, 15.0, 19.0, 30.0, 45.0, 45.0, 92.0, 111.0, 191.0, 305.0, 419.0, 739.0, 1161.0, 2020.0, 3535.0, 6729.0, 13687.0, 31756.0, 82926.0, 294741.0, 420142.0, 113506.0, 40885.0, 17128.0, 8041.0, 4194.0, 2293.0, 1391.0, 837.0, 559.0, 321.0, 199.0, 153.0, 90.0, 70.0, 41.0, 29.0, 29.0, 16.0, 13.0, 9.0, 10.0, 5.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.671875, -10.33984375, -10.0078125, -9.67578125, -9.34375, -9.01171875, -8.6796875, -8.34765625, -8.015625, -7.68359375, -7.3515625, -7.01953125, -6.6875, -6.35546875, -6.0234375, -5.69140625, -5.359375, -5.02734375, -4.6953125, -4.36328125, -4.03125, -3.69921875, -3.3671875, -3.03515625, -2.703125, -2.37109375, -2.0390625, -1.70703125, -1.375, -1.04296875, -0.7109375, -0.37890625, -0.046875, 0.28515625, 0.6171875, 0.94921875, 1.28125, 1.61328125, 1.9453125, 2.27734375, 2.609375, 2.94140625, 3.2734375, 3.60546875, 3.9375, 4.26953125, 4.6015625, 4.93359375, 5.265625, 5.59765625, 5.9296875, 6.26171875, 6.59375, 6.92578125, 7.2578125, 7.58984375, 7.921875, 8.25390625, 8.5859375, 8.91796875, 9.25, 9.58203125, 9.9140625, 10.24609375, 10.578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 13.0, 9.0, 22.0, 21.0, 26.0, 36.0, 37.0, 34.0, 47.0, 37.0, 45.0, 69.0, 64.0, 87.0, 65.0, 58.0, 40.0, 40.0, 46.0, 41.0, 29.0, 24.0, 24.0, 16.0, 15.0, 9.0, 5.0, 10.0, 7.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3447265625, -1.3038330078125, -1.262939453125, -1.2220458984375, -1.18115234375, -1.1402587890625, -1.099365234375, -1.0584716796875, -1.017578125, -0.9766845703125, -0.935791015625, -0.8948974609375, -0.85400390625, -0.8131103515625, -0.772216796875, -0.7313232421875, -0.6904296875, -0.6495361328125, -0.608642578125, -0.5677490234375, -0.52685546875, -0.4859619140625, -0.445068359375, -0.4041748046875, -0.36328125, -0.3223876953125, -0.281494140625, -0.2406005859375, -0.19970703125, -0.1588134765625, -0.117919921875, -0.0770263671875, -0.0361328125, 0.0047607421875, 0.045654296875, 0.0865478515625, 0.12744140625, 0.1683349609375, 0.209228515625, 0.2501220703125, 0.291015625, 0.3319091796875, 0.372802734375, 0.4136962890625, 0.45458984375, 0.4954833984375, 0.536376953125, 0.5772705078125, 0.6181640625, 0.6590576171875, 0.699951171875, 0.7408447265625, 0.78173828125, 0.8226318359375, 0.863525390625, 0.9044189453125, 0.9453125, 0.9862060546875, 1.027099609375, 1.0679931640625, 1.10888671875, 1.1497802734375, 1.190673828125, 1.2315673828125, 1.2724609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 6.0, 12.0, 9.0, 26.0, 36.0, 45.0, 54.0, 83.0, 121.0, 208.0, 260.0, 399.0, 638.0, 963.0, 1523.0, 2547.0, 4437.0, 8266.0, 16474.0, 36037.0, 90010.0, 280063.0, 387045.0, 125487.0, 48290.0, 21339.0, 10461.0, 5525.0, 3069.0, 1808.0, 1132.0, 702.0, 454.0, 294.0, 196.0, 134.0, 108.0, 74.0, 43.0, 45.0, 30.0, 20.0, 14.0, 16.0, 11.0, 6.0, 5.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.0234375, -6.79052734375, -6.5576171875, -6.32470703125, -6.091796875, -5.85888671875, -5.6259765625, -5.39306640625, -5.16015625, -4.92724609375, -4.6943359375, -4.46142578125, -4.228515625, -3.99560546875, -3.7626953125, -3.52978515625, -3.296875, -3.06396484375, -2.8310546875, -2.59814453125, -2.365234375, -2.13232421875, -1.8994140625, -1.66650390625, -1.43359375, -1.20068359375, -0.9677734375, -0.73486328125, -0.501953125, -0.26904296875, -0.0361328125, 0.19677734375, 0.4296875, 0.66259765625, 0.8955078125, 1.12841796875, 1.361328125, 1.59423828125, 1.8271484375, 2.06005859375, 2.29296875, 2.52587890625, 2.7587890625, 2.99169921875, 3.224609375, 3.45751953125, 3.6904296875, 3.92333984375, 4.15625, 4.38916015625, 4.6220703125, 4.85498046875, 5.087890625, 5.32080078125, 5.5537109375, 5.78662109375, 6.01953125, 6.25244140625, 6.4853515625, 6.71826171875, 6.951171875, 7.18408203125, 7.4169921875, 7.64990234375, 7.8828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 1.0, 9.0, 9.0, 16.0, 21.0, 31.0, 26.0, 45.0, 36.0, 40.0, 44.0, 45.0, 50.0, 59.0, 64.0, 61.0, 54.0, 57.0, 54.0, 45.0, 40.0, 38.0, 29.0, 23.0, 21.0, 21.0, 19.0, 11.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.609375, -6.38592529296875, -6.1624755859375, -5.93902587890625, -5.715576171875, -5.49212646484375, -5.2686767578125, -5.04522705078125, -4.82177734375, -4.59832763671875, -4.3748779296875, -4.15142822265625, -3.927978515625, -3.70452880859375, -3.4810791015625, -3.25762939453125, -3.0341796875, -2.81072998046875, -2.5872802734375, -2.36383056640625, -2.140380859375, -1.91693115234375, -1.6934814453125, -1.47003173828125, -1.24658203125, -1.02313232421875, -0.7996826171875, -0.57623291015625, -0.352783203125, -0.12933349609375, 0.0941162109375, 0.31756591796875, 0.541015625, 0.76446533203125, 0.9879150390625, 1.21136474609375, 1.434814453125, 1.65826416015625, 1.8817138671875, 2.10516357421875, 2.32861328125, 2.55206298828125, 2.7755126953125, 2.99896240234375, 3.222412109375, 3.44586181640625, 3.6693115234375, 3.89276123046875, 4.1162109375, 4.33966064453125, 4.5631103515625, 4.78656005859375, 5.010009765625, 5.23345947265625, 5.4569091796875, 5.68035888671875, 5.90380859375, 6.12725830078125, 6.3507080078125, 6.57415771484375, 6.797607421875, 7.02105712890625, 7.2445068359375, 7.46795654296875, 7.69140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 11.0, 9.0, 9.0, 25.0, 36.0, 62.0, 80.0, 151.0, 244.0, 381.0, 763.0, 1575.0, 3304.0, 8059.0, 20548.0, 61414.0, 194034.0, 408247.0, 233463.0, 74364.0, 24777.0, 9377.0, 3889.0, 1728.0, 874.0, 457.0, 273.0, 152.0, 81.0, 57.0, 43.0, 14.0, 13.0, 12.0, 5.0, 6.0, 6.0, 1.0, 6.0, 0.0, 1.0, 2.0], "bins": [-6.57421875, -6.40814208984375, -6.2420654296875, -6.07598876953125, -5.909912109375, -5.74383544921875, -5.5777587890625, -5.41168212890625, -5.24560546875, -5.07952880859375, -4.9134521484375, -4.74737548828125, -4.581298828125, -4.41522216796875, -4.2491455078125, -4.08306884765625, -3.9169921875, -3.75091552734375, -3.5848388671875, -3.41876220703125, -3.252685546875, -3.08660888671875, -2.9205322265625, -2.75445556640625, -2.58837890625, -2.42230224609375, -2.2562255859375, -2.09014892578125, -1.924072265625, -1.75799560546875, -1.5919189453125, -1.42584228515625, -1.259765625, -1.09368896484375, -0.9276123046875, -0.76153564453125, -0.595458984375, -0.42938232421875, -0.2633056640625, -0.09722900390625, 0.06884765625, 0.23492431640625, 0.4010009765625, 0.56707763671875, 0.733154296875, 0.89923095703125, 1.0653076171875, 1.23138427734375, 1.3974609375, 1.56353759765625, 1.7296142578125, 1.89569091796875, 2.061767578125, 2.22784423828125, 2.3939208984375, 2.55999755859375, 2.72607421875, 2.89215087890625, 3.0582275390625, 3.22430419921875, 3.390380859375, 3.55645751953125, 3.7225341796875, 3.88861083984375, 4.0546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 5.0, 10.0, 10.0, 36.0, 91.0, 285.0, 320.0, 132.0, 42.0, 18.0, 12.0, 6.0, 1.0, 3.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008087158203125, -0.0007819011807441711, -0.0007550865411758423, -0.0007282719016075134, -0.0007014572620391846, -0.0006746426224708557, -0.0006478279829025269, -0.000621013343334198, -0.0005941987037658691, -0.0005673840641975403, -0.0005405694246292114, -0.0005137547850608826, -0.0004869401454925537, -0.00046012550592422485, -0.000433310866355896, -0.00040649622678756714, -0.0003796815872192383, -0.0003528669476509094, -0.00032605230808258057, -0.0002992376685142517, -0.00027242302894592285, -0.000245608389377594, -0.00021879374980926514, -0.00019197911024093628, -0.00016516447067260742, -0.00013834983110427856, -0.00011153519153594971, -8.472055196762085e-05, -5.790591239929199e-05, -3.1091272830963135e-05, -4.276633262634277e-06, 2.253800630569458e-05, 4.935264587402344e-05, 7.61672854423523e-05, 0.00010298192501068115, 0.00012979656457901, 0.00015661120414733887, 0.00018342584371566772, 0.00021024048328399658, 0.00023705512285232544, 0.0002638697624206543, 0.00029068440198898315, 0.000317499041557312, 0.00034431368112564087, 0.0003711283206939697, 0.0003979429602622986, 0.00042475759983062744, 0.0004515722393989563, 0.00047838687896728516, 0.000505201518535614, 0.0005320161581039429, 0.0005588307976722717, 0.0005856454372406006, 0.0006124600768089294, 0.0006392747163772583, 0.0006660893559455872, 0.000692903995513916, 0.0007197186350822449, 0.0007465332746505737, 0.0007733479142189026, 0.0008001625537872314, 0.0008269771933555603, 0.0008537918329238892, 0.000880606472492218, 0.0009074211120605469]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 8.0, 7.0, 20.0, 26.0, 32.0, 46.0, 49.0, 92.0, 155.0, 226.0, 313.0, 465.0, 836.0, 1311.0, 2093.0, 3572.0, 5990.0, 10477.0, 19479.0, 37565.0, 76742.0, 152609.0, 248182.0, 227261.0, 127993.0, 63362.0, 31197.0, 16312.0, 9009.0, 5171.0, 2982.0, 1814.0, 1098.0, 705.0, 460.0, 289.0, 193.0, 142.0, 90.0, 57.0, 42.0, 23.0, 21.0, 9.0, 7.0, 11.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.353515625, -3.244873046875, -3.13623046875, -3.027587890625, -2.9189453125, -2.810302734375, -2.70166015625, -2.593017578125, -2.484375, -2.375732421875, -2.26708984375, -2.158447265625, -2.0498046875, -1.941162109375, -1.83251953125, -1.723876953125, -1.615234375, -1.506591796875, -1.39794921875, -1.289306640625, -1.1806640625, -1.072021484375, -0.96337890625, -0.854736328125, -0.74609375, -0.637451171875, -0.52880859375, -0.420166015625, -0.3115234375, -0.202880859375, -0.09423828125, 0.014404296875, 0.123046875, 0.231689453125, 0.34033203125, 0.448974609375, 0.5576171875, 0.666259765625, 0.77490234375, 0.883544921875, 0.9921875, 1.100830078125, 1.20947265625, 1.318115234375, 1.4267578125, 1.535400390625, 1.64404296875, 1.752685546875, 1.861328125, 1.969970703125, 2.07861328125, 2.187255859375, 2.2958984375, 2.404541015625, 2.51318359375, 2.621826171875, 2.73046875, 2.839111328125, 2.94775390625, 3.056396484375, 3.1650390625, 3.273681640625, 3.38232421875, 3.490966796875, 3.599609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 14.0, 7.0, 5.0, 7.0, 20.0, 9.0, 12.0, 24.0, 27.0, 36.0, 35.0, 42.0, 57.0, 48.0, 48.0, 57.0, 62.0, 59.0, 42.0, 46.0, 47.0, 46.0, 40.0, 26.0, 25.0, 27.0, 17.0, 23.0, 19.0, 4.0, 12.0, 7.0, 7.0, 10.0, 4.0, 3.0, 5.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.427734375, -3.3345947265625, -3.241455078125, -3.1483154296875, -3.05517578125, -2.9620361328125, -2.868896484375, -2.7757568359375, -2.6826171875, -2.5894775390625, -2.496337890625, -2.4031982421875, -2.31005859375, -2.2169189453125, -2.123779296875, -2.0306396484375, -1.9375, -1.8443603515625, -1.751220703125, -1.6580810546875, -1.56494140625, -1.4718017578125, -1.378662109375, -1.2855224609375, -1.1923828125, -1.0992431640625, -1.006103515625, -0.9129638671875, -0.81982421875, -0.7266845703125, -0.633544921875, -0.5404052734375, -0.447265625, -0.3541259765625, -0.260986328125, -0.1678466796875, -0.07470703125, 0.0184326171875, 0.111572265625, 0.2047119140625, 0.2978515625, 0.3909912109375, 0.484130859375, 0.5772705078125, 0.67041015625, 0.7635498046875, 0.856689453125, 0.9498291015625, 1.04296875, 1.1361083984375, 1.229248046875, 1.3223876953125, 1.41552734375, 1.5086669921875, 1.601806640625, 1.6949462890625, 1.7880859375, 1.8812255859375, 1.974365234375, 2.0675048828125, 2.16064453125, 2.2537841796875, 2.346923828125, 2.4400634765625, 2.533203125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 19.0, 32.0, 100.0, 225.0, 335.0, 198.0, 49.0, 26.0, 6.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.93316650390625, -162.01480102539062, -158.09642028808594, -154.1780548095703, -150.2596893310547, -146.34130859375, -142.42294311523438, -138.50457763671875, -134.58621215820312, -130.6678466796875, -126.74947357177734, -122.83110046386719, -118.91273498535156, -114.9943618774414, -111.07598876953125, -107.15762329101562, -103.23924255371094, -99.32086944580078, -95.40250396728516, -91.484130859375, -87.56576538085938, -83.64739227294922, -79.72901916503906, -75.81065368652344, -71.89228057861328, -67.97390747070312, -64.0555419921875, -60.137168884277344, -56.21879959106445, -52.30043029785156, -48.382057189941406, -44.463687896728516, -40.545326232910156, -36.626956939697266, -32.708587646484375, -28.79021453857422, -24.871845245361328, -20.953475952148438, -17.035104751586914, -13.11673355102539, -9.1983642578125, -5.279994010925293, -1.361623764038086, 2.556746482849121, 6.475116729736328, 10.393486022949219, 14.311857223510742, 18.230228424072266, 22.148597717285156, 26.066967010498047, 29.98533821105957, 33.903709411621094, 37.822078704833984, 41.740447998046875, 45.65882110595703, 49.57719039916992, 53.49555969238281, 57.4139289855957, 61.332298278808594, 65.25067138671875, 69.16903686523438, 73.08740997314453, 77.00578308105469, 80.92414855957031, 84.84252166748047]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 6.0, 11.0, 13.0, 17.0, 30.0, 31.0, 52.0, 69.0, 75.0, 93.0, 86.0, 95.0, 95.0, 68.0, 49.0, 53.0, 38.0, 28.0, 27.0, 21.0, 11.0, 11.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.6375732421875, -79.416748046875, -77.19591522216797, -74.97509002685547, -72.75425720214844, -70.53343200683594, -68.31260681152344, -66.0917739868164, -63.870948791503906, -61.65011978149414, -59.429290771484375, -57.208465576171875, -54.98763656616211, -52.766807556152344, -50.545982360839844, -48.32515335083008, -46.10432434082031, -43.88349533081055, -41.66266632080078, -39.44184112548828, -37.221012115478516, -35.00018310546875, -32.77935791015625, -30.558528900146484, -28.33769989013672, -26.116870880126953, -23.89604377746582, -21.675216674804688, -19.454387664794922, -17.233558654785156, -15.012731552124023, -12.791903495788574, -10.571067810058594, -8.350239753723145, -6.129411697387695, -3.908583641052246, -1.6877555847167969, 0.5330724716186523, 2.7539005279541016, 4.974728584289551, 7.195556640625, 9.41638469696045, 11.637212753295898, 13.858040809631348, 16.078868865966797, 18.299697875976562, 20.520524978637695, 22.741352081298828, 24.962181091308594, 27.18301010131836, 29.403837203979492, 31.624664306640625, 33.84549331665039, 36.066322326660156, 38.287147521972656, 40.50797653198242, 42.72880554199219, 44.94963455200195, 47.17046356201172, 49.39128875732422, 51.612117767333984, 53.83294677734375, 56.05377197265625, 58.274600982666016, 60.49542999267578]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 6.0, 11.0, 18.0, 28.0, 31.0, 38.0, 68.0, 93.0, 137.0, 170.0, 281.0, 396.0, 672.0, 1001.0, 1580.0, 2659.0, 4429.0, 8425.0, 17107.0, 41181.0, 149957.0, 3488489.0, 364948.0, 64484.0, 23540.0, 11024.0, 5777.0, 3130.0, 1807.0, 1089.0, 641.0, 387.0, 248.0, 166.0, 97.0, 54.0, 36.0, 25.0, 15.0, 10.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-29.65625, -28.889892578125, -28.12353515625, -27.357177734375, -26.5908203125, -25.824462890625, -25.05810546875, -24.291748046875, -23.525390625, -22.759033203125, -21.99267578125, -21.226318359375, -20.4599609375, -19.693603515625, -18.92724609375, -18.160888671875, -17.39453125, -16.628173828125, -15.86181640625, -15.095458984375, -14.3291015625, -13.562744140625, -12.79638671875, -12.030029296875, -11.263671875, -10.497314453125, -9.73095703125, -8.964599609375, -8.1982421875, -7.431884765625, -6.66552734375, -5.899169921875, -5.1328125, -4.366455078125, -3.60009765625, -2.833740234375, -2.0673828125, -1.301025390625, -0.53466796875, 0.231689453125, 0.998046875, 1.764404296875, 2.53076171875, 3.297119140625, 4.0634765625, 4.829833984375, 5.59619140625, 6.362548828125, 7.12890625, 7.895263671875, 8.66162109375, 9.427978515625, 10.1943359375, 10.960693359375, 11.72705078125, 12.493408203125, 13.259765625, 14.026123046875, 14.79248046875, 15.558837890625, 16.3251953125, 17.091552734375, 17.85791015625, 18.624267578125, 19.390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 8.0, 7.0, 8.0, 10.0, 16.0, 8.0, 12.0, 18.0, 25.0, 34.0, 39.0, 38.0, 35.0, 43.0, 50.0, 57.0, 34.0, 50.0, 55.0, 41.0, 48.0, 49.0, 59.0, 36.0, 29.0, 35.0, 34.0, 26.0, 22.0, 16.0, 16.0, 12.0, 10.0, 4.0, 10.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.3090362548828125, -1.271392822265625, -1.2337493896484375, -1.19610595703125, -1.1584625244140625, -1.120819091796875, -1.0831756591796875, -1.0455322265625, -1.0078887939453125, -0.970245361328125, -0.9326019287109375, -0.89495849609375, -0.8573150634765625, -0.819671630859375, -0.7820281982421875, -0.744384765625, -0.7067413330078125, -0.669097900390625, -0.6314544677734375, -0.59381103515625, -0.5561676025390625, -0.518524169921875, -0.4808807373046875, -0.4432373046875, -0.4055938720703125, -0.367950439453125, -0.3303070068359375, -0.29266357421875, -0.2550201416015625, -0.217376708984375, -0.1797332763671875, -0.14208984375, -0.1044464111328125, -0.066802978515625, -0.0291595458984375, 0.00848388671875, 0.0461273193359375, 0.083770751953125, 0.1214141845703125, 0.1590576171875, 0.1967010498046875, 0.234344482421875, 0.2719879150390625, 0.30963134765625, 0.3472747802734375, 0.384918212890625, 0.4225616455078125, 0.460205078125, 0.4978485107421875, 0.535491943359375, 0.5731353759765625, 0.61077880859375, 0.6484222412109375, 0.686065673828125, 0.7237091064453125, 0.7613525390625, 0.7989959716796875, 0.836639404296875, 0.8742828369140625, 0.91192626953125, 0.9495697021484375, 0.987213134765625, 1.0248565673828125, 1.0625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 7.0, 10.0, 11.0, 10.0, 7.0, 25.0, 29.0, 61.0, 118.0, 283.0, 1158.0, 8666.0, 259140.0, 3889365.0, 31822.0, 2666.0, 519.0, 165.0, 69.0, 42.0, 23.0, 18.0, 13.0, 12.0, 11.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.34375, -59.87353515625, -57.4033203125, -54.93310546875, -52.462890625, -49.99267578125, -47.5224609375, -45.05224609375, -42.58203125, -40.11181640625, -37.6416015625, -35.17138671875, -32.701171875, -30.23095703125, -27.7607421875, -25.29052734375, -22.8203125, -20.35009765625, -17.8798828125, -15.40966796875, -12.939453125, -10.46923828125, -7.9990234375, -5.52880859375, -3.05859375, -0.58837890625, 1.8818359375, 4.35205078125, 6.822265625, 9.29248046875, 11.7626953125, 14.23291015625, 16.703125, 19.17333984375, 21.6435546875, 24.11376953125, 26.583984375, 29.05419921875, 31.5244140625, 33.99462890625, 36.46484375, 38.93505859375, 41.4052734375, 43.87548828125, 46.345703125, 48.81591796875, 51.2861328125, 53.75634765625, 56.2265625, 58.69677734375, 61.1669921875, 63.63720703125, 66.107421875, 68.57763671875, 71.0478515625, 73.51806640625, 75.98828125, 78.45849609375, 80.9287109375, 83.39892578125, 85.869140625, 88.33935546875, 90.8095703125, 93.27978515625, 95.75]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 1.0, 2.0, 4.0, 10.0, 7.0, 16.0, 11.0, 17.0, 25.0, 43.0, 47.0, 85.0, 112.0, 219.0, 487.0, 1800.0, 520.0, 236.0, 148.0, 88.0, 59.0, 40.0, 20.0, 17.0, 9.0, 10.0, 8.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -5.030120849609375, -4.89617919921875, -4.762237548828125, -4.6282958984375, -4.494354248046875, -4.36041259765625, -4.226470947265625, -4.092529296875, -3.958587646484375, -3.82464599609375, -3.690704345703125, -3.5567626953125, -3.422821044921875, -3.28887939453125, -3.154937744140625, -3.02099609375, -2.887054443359375, -2.75311279296875, -2.619171142578125, -2.4852294921875, -2.351287841796875, -2.21734619140625, -2.083404541015625, -1.949462890625, -1.815521240234375, -1.68157958984375, -1.547637939453125, -1.4136962890625, -1.279754638671875, -1.14581298828125, -1.011871337890625, -0.8779296875, -0.743988037109375, -0.61004638671875, -0.476104736328125, -0.3421630859375, -0.208221435546875, -0.07427978515625, 0.059661865234375, 0.193603515625, 0.327545166015625, 0.46148681640625, 0.595428466796875, 0.7293701171875, 0.863311767578125, 0.99725341796875, 1.131195068359375, 1.26513671875, 1.399078369140625, 1.53302001953125, 1.666961669921875, 1.8009033203125, 1.934844970703125, 2.06878662109375, 2.202728271484375, 2.336669921875, 2.470611572265625, 2.60455322265625, 2.738494873046875, 2.8724365234375, 3.006378173828125, 3.14031982421875, 3.274261474609375, 3.408203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 13.0, 51.0, 130.0, 265.0, 299.0, 170.0, 53.0, 16.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.23458099365234, -62.9947624206543, -60.754947662353516, -58.51512908935547, -56.27531433105469, -54.03549575805664, -51.795677185058594, -49.55586242675781, -47.316043853759766, -45.07622528076172, -42.83641052246094, -40.59659194946289, -38.356773376464844, -36.11695861816406, -33.877140045166016, -31.6373233795166, -29.397506713867188, -27.157690048217773, -24.91787338256836, -22.678054809570312, -20.4382381439209, -18.198421478271484, -15.958603858947754, -13.718786239624023, -11.47896957397461, -9.239152908325195, -6.999335289001465, -4.759518146514893, -2.5197010040283203, -0.27988433837890625, 1.9599332809448242, 4.199750900268555, 6.4395751953125, 8.679391860961914, 10.919209480285645, 13.159027099609375, 15.398843765258789, 17.638660430908203, 19.87847900390625, 22.118295669555664, 24.358112335205078, 26.597929000854492, 28.837745666503906, 31.077564239501953, 33.3173828125, 35.55719757080078, 37.79701614379883, 40.036834716796875, 42.276649475097656, 44.5164680480957, 46.756282806396484, 48.99610137939453, 51.23591613769531, 53.47573471069336, 55.715553283691406, 57.95536804199219, 60.195186614990234, 62.43500518798828, 64.67481994628906, 66.91463470458984, 69.15445709228516, 71.39427185058594, 73.63408660888672, 75.87390899658203, 78.11372375488281]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 10.0, 13.0, 20.0, 20.0, 22.0, 27.0, 31.0, 45.0, 39.0, 50.0, 46.0, 48.0, 41.0, 46.0, 56.0, 60.0, 43.0, 37.0, 49.0, 33.0, 41.0, 38.0, 30.0, 35.0, 26.0, 16.0, 17.0, 13.0, 7.0, 3.0, 5.0, 3.0, 8.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.422658920288086, -12.934398651123047, -12.446139335632324, -11.957879066467285, -11.469618797302246, -10.981359481811523, -10.493099212646484, -10.004838943481445, -9.516578674316406, -9.028318405151367, -8.540059089660645, -8.051798820495605, -7.563538551330566, -7.0752787590026855, -6.587018966674805, -6.098758697509766, -5.610499382019043, -5.122239589691162, -4.633979320526123, -4.145719528198242, -3.6574594974517822, -3.1691994667053223, -2.6809396743774414, -2.1926796436309814, -1.7044196128845215, -1.2161595821380615, -0.7278996706008911, -0.2396397590637207, 0.24862027168273926, 0.7368803024291992, 1.22514009475708, 1.71340012550354, 2.20166015625, 2.68992018699646, 3.17818021774292, 3.666440010070801, 4.15470027923584, 4.642960071563721, 5.131219863891602, 5.619480133056641, 6.1077399253845215, 6.595999717712402, 7.084259986877441, 7.572519779205322, 8.060779571533203, 8.549039840698242, 9.037300109863281, 9.525559425354004, 10.013819694519043, 10.502079963684082, 10.990339279174805, 11.478599548339844, 11.966859817504883, 12.455120086669922, 12.943379402160645, 13.431639671325684, 13.919898986816406, 14.408159255981445, 14.896418571472168, 15.384678840637207, 15.872939109802246, 16.36119842529297, 16.849458694458008, 17.337718963623047, 17.825979232788086]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 7.0, 5.0, 11.0, 9.0, 19.0, 25.0, 34.0, 40.0, 69.0, 94.0, 180.0, 244.0, 338.0, 600.0, 855.0, 1451.0, 2389.0, 3961.0, 6913.0, 12193.0, 21682.0, 39041.0, 70440.0, 122395.0, 189976.0, 211799.0, 154422.0, 91926.0, 51248.0, 28265.0, 15826.0, 8867.0, 5187.0, 3023.0, 1884.0, 1139.0, 721.0, 453.0, 281.0, 190.0, 103.0, 77.0, 55.0, 41.0, 24.0, 17.0, 8.0, 12.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-7.78125, -7.5321044921875, -7.282958984375, -7.0338134765625, -6.78466796875, -6.5355224609375, -6.286376953125, -6.0372314453125, -5.7880859375, -5.5389404296875, -5.289794921875, -5.0406494140625, -4.79150390625, -4.5423583984375, -4.293212890625, -4.0440673828125, -3.794921875, -3.5457763671875, -3.296630859375, -3.0474853515625, -2.79833984375, -2.5491943359375, -2.300048828125, -2.0509033203125, -1.8017578125, -1.5526123046875, -1.303466796875, -1.0543212890625, -0.80517578125, -0.5560302734375, -0.306884765625, -0.0577392578125, 0.19140625, 0.4405517578125, 0.689697265625, 0.9388427734375, 1.18798828125, 1.4371337890625, 1.686279296875, 1.9354248046875, 2.1845703125, 2.4337158203125, 2.682861328125, 2.9320068359375, 3.18115234375, 3.4302978515625, 3.679443359375, 3.9285888671875, 4.177734375, 4.4268798828125, 4.676025390625, 4.9251708984375, 5.17431640625, 5.4234619140625, 5.672607421875, 5.9217529296875, 6.1708984375, 6.4200439453125, 6.669189453125, 6.9183349609375, 7.16748046875, 7.4166259765625, 7.665771484375, 7.9149169921875, 8.1640625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 9.0, 12.0, 15.0, 10.0, 19.0, 24.0, 34.0, 27.0, 31.0, 28.0, 29.0, 44.0, 51.0, 49.0, 48.0, 37.0, 62.0, 49.0, 53.0, 45.0, 42.0, 50.0, 32.0, 27.0, 40.0, 22.0, 18.0, 14.0, 15.0, 11.0, 10.0, 10.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.3046875, -1.267333984375, -1.22998046875, -1.192626953125, -1.1552734375, -1.117919921875, -1.08056640625, -1.043212890625, -1.005859375, -0.968505859375, -0.93115234375, -0.893798828125, -0.8564453125, -0.819091796875, -0.78173828125, -0.744384765625, -0.70703125, -0.669677734375, -0.63232421875, -0.594970703125, -0.5576171875, -0.520263671875, -0.48291015625, -0.445556640625, -0.408203125, -0.370849609375, -0.33349609375, -0.296142578125, -0.2587890625, -0.221435546875, -0.18408203125, -0.146728515625, -0.109375, -0.072021484375, -0.03466796875, 0.002685546875, 0.0400390625, 0.077392578125, 0.11474609375, 0.152099609375, 0.189453125, 0.226806640625, 0.26416015625, 0.301513671875, 0.3388671875, 0.376220703125, 0.41357421875, 0.450927734375, 0.48828125, 0.525634765625, 0.56298828125, 0.600341796875, 0.6376953125, 0.675048828125, 0.71240234375, 0.749755859375, 0.787109375, 0.824462890625, 0.86181640625, 0.899169921875, 0.9365234375, 0.973876953125, 1.01123046875, 1.048583984375, 1.0859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 5.0, 10.0, 13.0, 27.0, 54.0, 52.0, 87.0, 138.0, 284.0, 451.0, 696.0, 1370.0, 3116.0, 7278.0, 19834.0, 62603.0, 204592.0, 423607.0, 220103.0, 68242.0, 21594.0, 7677.0, 3290.0, 1550.0, 711.0, 435.0, 273.0, 161.0, 100.0, 78.0, 40.0, 19.0, 16.0, 24.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.203125, -19.6005859375, -18.998046875, -18.3955078125, -17.79296875, -17.1904296875, -16.587890625, -15.9853515625, -15.3828125, -14.7802734375, -14.177734375, -13.5751953125, -12.97265625, -12.3701171875, -11.767578125, -11.1650390625, -10.5625, -9.9599609375, -9.357421875, -8.7548828125, -8.15234375, -7.5498046875, -6.947265625, -6.3447265625, -5.7421875, -5.1396484375, -4.537109375, -3.9345703125, -3.33203125, -2.7294921875, -2.126953125, -1.5244140625, -0.921875, -0.3193359375, 0.283203125, 0.8857421875, 1.48828125, 2.0908203125, 2.693359375, 3.2958984375, 3.8984375, 4.5009765625, 5.103515625, 5.7060546875, 6.30859375, 6.9111328125, 7.513671875, 8.1162109375, 8.71875, 9.3212890625, 9.923828125, 10.5263671875, 11.12890625, 11.7314453125, 12.333984375, 12.9365234375, 13.5390625, 14.1416015625, 14.744140625, 15.3466796875, 15.94921875, 16.5517578125, 17.154296875, 17.7568359375, 18.359375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 8.0, 15.0, 11.0, 18.0, 23.0, 17.0, 19.0, 28.0, 32.0, 36.0, 34.0, 44.0, 48.0, 44.0, 35.0, 48.0, 55.0, 48.0, 36.0, 45.0, 41.0, 32.0, 39.0, 19.0, 35.0, 24.0, 29.0, 20.0, 13.0, 21.0, 12.0, 12.0, 7.0, 6.0, 3.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-9.2890625, -9.0228271484375, -8.756591796875, -8.4903564453125, -8.22412109375, -7.9578857421875, -7.691650390625, -7.4254150390625, -7.1591796875, -6.8929443359375, -6.626708984375, -6.3604736328125, -6.09423828125, -5.8280029296875, -5.561767578125, -5.2955322265625, -5.029296875, -4.7630615234375, -4.496826171875, -4.2305908203125, -3.96435546875, -3.6981201171875, -3.431884765625, -3.1656494140625, -2.8994140625, -2.6331787109375, -2.366943359375, -2.1007080078125, -1.83447265625, -1.5682373046875, -1.302001953125, -1.0357666015625, -0.76953125, -0.5032958984375, -0.237060546875, 0.0291748046875, 0.29541015625, 0.5616455078125, 0.827880859375, 1.0941162109375, 1.3603515625, 1.6265869140625, 1.892822265625, 2.1590576171875, 2.42529296875, 2.6915283203125, 2.957763671875, 3.2239990234375, 3.490234375, 3.7564697265625, 4.022705078125, 4.2889404296875, 4.55517578125, 4.8214111328125, 5.087646484375, 5.3538818359375, 5.6201171875, 5.8863525390625, 6.152587890625, 6.4188232421875, 6.68505859375, 6.9512939453125, 7.217529296875, 7.4837646484375, 7.75]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 11.0, 8.0, 17.0, 16.0, 21.0, 22.0, 48.0, 55.0, 79.0, 97.0, 167.0, 251.0, 354.0, 519.0, 920.0, 1470.0, 2660.0, 5275.0, 10636.0, 24627.0, 63314.0, 173313.0, 338018.0, 256450.0, 101316.0, 37451.0, 15429.0, 7251.0, 3555.0, 1944.0, 1159.0, 692.0, 451.0, 313.0, 179.0, 129.0, 86.0, 79.0, 38.0, 35.0, 29.0, 16.0, 18.0, 8.0, 10.0, 4.0, 2.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.95703125, -7.72113037109375, -7.4852294921875, -7.24932861328125, -7.013427734375, -6.77752685546875, -6.5416259765625, -6.30572509765625, -6.06982421875, -5.83392333984375, -5.5980224609375, -5.36212158203125, -5.126220703125, -4.89031982421875, -4.6544189453125, -4.41851806640625, -4.1826171875, -3.94671630859375, -3.7108154296875, -3.47491455078125, -3.239013671875, -3.00311279296875, -2.7672119140625, -2.53131103515625, -2.29541015625, -2.05950927734375, -1.8236083984375, -1.58770751953125, -1.351806640625, -1.11590576171875, -0.8800048828125, -0.64410400390625, -0.408203125, -0.17230224609375, 0.0635986328125, 0.29949951171875, 0.535400390625, 0.77130126953125, 1.0072021484375, 1.24310302734375, 1.47900390625, 1.71490478515625, 1.9508056640625, 2.18670654296875, 2.422607421875, 2.65850830078125, 2.8944091796875, 3.13031005859375, 3.3662109375, 3.60211181640625, 3.8380126953125, 4.07391357421875, 4.309814453125, 4.54571533203125, 4.7816162109375, 5.01751708984375, 5.25341796875, 5.48931884765625, 5.7252197265625, 5.96112060546875, 6.197021484375, 6.43292236328125, 6.6688232421875, 6.90472412109375, 7.140625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 4.0, 4.0, 5.0, 9.0, 10.0, 12.0, 13.0, 14.0, 19.0, 18.0, 33.0, 42.0, 46.0, 58.0, 63.0, 81.0, 95.0, 81.0, 72.0, 44.0, 49.0, 26.0, 36.0, 34.0, 25.0, 16.0, 17.0, 12.0, 13.0, 6.0, 9.0, 11.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010652542114257812, -0.001031726598739624, -0.0009981989860534668, -0.0009646713733673096, -0.0009311437606811523, -0.0008976161479949951, -0.0008640885353088379, -0.0008305609226226807, -0.0007970333099365234, -0.0007635056972503662, -0.000729978084564209, -0.0006964504718780518, -0.0006629228591918945, -0.0006293952465057373, -0.0005958676338195801, -0.0005623400211334229, -0.0005288124084472656, -0.0004952847957611084, -0.00046175718307495117, -0.00042822957038879395, -0.0003947019577026367, -0.0003611743450164795, -0.00032764673233032227, -0.00029411911964416504, -0.0002605915069580078, -0.00022706389427185059, -0.00019353628158569336, -0.00016000866889953613, -0.0001264810562133789, -9.295344352722168e-05, -5.942583084106445e-05, -2.5898218154907227e-05, 7.62939453125e-06, 4.1157007217407227e-05, 7.468461990356445e-05, 0.00010821223258972168, 0.0001417398452758789, 0.00017526745796203613, 0.00020879507064819336, 0.00024232268333435059, 0.0002758502960205078, 0.00030937790870666504, 0.00034290552139282227, 0.0003764331340789795, 0.0004099607467651367, 0.00044348835945129395, 0.00047701597213745117, 0.0005105435848236084, 0.0005440711975097656, 0.0005775988101959229, 0.0006111264228820801, 0.0006446540355682373, 0.0006781816482543945, 0.0007117092609405518, 0.000745236873626709, 0.0007787644863128662, 0.0008122920989990234, 0.0008458197116851807, 0.0008793473243713379, 0.0009128749370574951, 0.0009464025497436523, 0.0009799301624298096, 0.0010134577751159668, 0.001046985387802124, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 5.0, 11.0, 16.0, 14.0, 24.0, 50.0, 47.0, 72.0, 105.0, 113.0, 212.0, 313.0, 505.0, 856.0, 1767.0, 3433.0, 7406.0, 18071.0, 48541.0, 146933.0, 352729.0, 298393.0, 107318.0, 36185.0, 13665.0, 5691.0, 2671.0, 1332.0, 739.0, 399.0, 310.0, 189.0, 125.0, 83.0, 78.0, 47.0, 35.0, 21.0, 20.0, 10.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.054931640625, -5.82080078125, -5.586669921875, -5.3525390625, -5.118408203125, -4.88427734375, -4.650146484375, -4.416015625, -4.181884765625, -3.94775390625, -3.713623046875, -3.4794921875, -3.245361328125, -3.01123046875, -2.777099609375, -2.54296875, -2.308837890625, -2.07470703125, -1.840576171875, -1.6064453125, -1.372314453125, -1.13818359375, -0.904052734375, -0.669921875, -0.435791015625, -0.20166015625, 0.032470703125, 0.2666015625, 0.500732421875, 0.73486328125, 0.968994140625, 1.203125, 1.437255859375, 1.67138671875, 1.905517578125, 2.1396484375, 2.373779296875, 2.60791015625, 2.842041015625, 3.076171875, 3.310302734375, 3.54443359375, 3.778564453125, 4.0126953125, 4.246826171875, 4.48095703125, 4.715087890625, 4.94921875, 5.183349609375, 5.41748046875, 5.651611328125, 5.8857421875, 6.119873046875, 6.35400390625, 6.588134765625, 6.822265625, 7.056396484375, 7.29052734375, 7.524658203125, 7.7587890625, 7.992919921875, 8.22705078125, 8.461181640625, 8.6953125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 1.0, 8.0, 9.0, 9.0, 6.0, 10.0, 10.0, 8.0, 21.0, 28.0, 26.0, 27.0, 52.0, 37.0, 56.0, 64.0, 62.0, 72.0, 63.0, 73.0, 63.0, 51.0, 55.0, 33.0, 42.0, 22.0, 21.0, 16.0, 12.0, 15.0, 9.0, 6.0, 9.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.374664306640625, -3.23956298828125, -3.104461669921875, -2.9693603515625, -2.834259033203125, -2.69915771484375, -2.564056396484375, -2.428955078125, -2.293853759765625, -2.15875244140625, -2.023651123046875, -1.8885498046875, -1.753448486328125, -1.61834716796875, -1.483245849609375, -1.34814453125, -1.213043212890625, -1.07794189453125, -0.942840576171875, -0.8077392578125, -0.672637939453125, -0.53753662109375, -0.402435302734375, -0.267333984375, -0.132232666015625, 0.00286865234375, 0.137969970703125, 0.2730712890625, 0.408172607421875, 0.54327392578125, 0.678375244140625, 0.8134765625, 0.948577880859375, 1.08367919921875, 1.218780517578125, 1.3538818359375, 1.488983154296875, 1.62408447265625, 1.759185791015625, 1.894287109375, 2.029388427734375, 2.16448974609375, 2.299591064453125, 2.4346923828125, 2.569793701171875, 2.70489501953125, 2.839996337890625, 2.97509765625, 3.110198974609375, 3.24530029296875, 3.380401611328125, 3.5155029296875, 3.650604248046875, 3.78570556640625, 3.920806884765625, 4.055908203125, 4.191009521484375, 4.32611083984375, 4.461212158203125, 4.5963134765625, 4.731414794921875, 4.86651611328125, 5.001617431640625, 5.13671875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 5.0, 12.0, 7.0, 7.0, 14.0, 22.0, 15.0, 41.0, 53.0, 78.0, 92.0, 104.0, 114.0, 101.0, 103.0, 75.0, 47.0, 33.0, 22.0, 24.0, 20.0, 2.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.29010009765625, -73.40792083740234, -70.52574157714844, -67.64356994628906, -64.76139068603516, -61.87921142578125, -58.99703598022461, -56.11486053466797, -53.23268127441406, -50.350502014160156, -47.468326568603516, -44.586151123046875, -41.70397186279297, -38.82179260253906, -35.93961715698242, -33.05744171142578, -30.175262451171875, -27.2930850982666, -24.410907745361328, -21.528730392456055, -18.64655303955078, -15.764375686645508, -12.882198333740234, -10.000020980834961, -7.1178436279296875, -4.235666275024414, -1.3534889221191406, 1.5286884307861328, 4.410865783691406, 7.29304313659668, 10.175220489501953, 13.057397842407227, 15.9395751953125, 18.821752548217773, 21.703929901123047, 24.58610725402832, 27.468284606933594, 30.350461959838867, 33.23263931274414, 36.11481475830078, 38.99699401855469, 41.879173278808594, 44.761348724365234, 47.643524169921875, 50.52570343017578, 53.40788269042969, 56.29005813598633, 59.17223358154297, 62.054412841796875, 64.93659210205078, 67.81877136230469, 70.70094299316406, 73.58312225341797, 76.46530151367188, 79.34747314453125, 82.22965240478516, 85.11183166503906, 87.99401092529297, 90.87619018554688, 93.75836181640625, 96.64054107666016, 99.52272033691406, 102.40489196777344, 105.28707122802734, 108.16925048828125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 5.0, 10.0, 5.0, 4.0, 15.0, 6.0, 16.0, 32.0, 33.0, 34.0, 37.0, 52.0, 49.0, 41.0, 61.0, 60.0, 66.0, 63.0, 55.0, 46.0, 50.0, 43.0, 40.0, 35.0, 29.0, 19.0, 16.0, 15.0, 15.0, 12.0, 13.0, 4.0, 9.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.1854248046875, -80.8350601196289, -78.48469543457031, -76.13433074951172, -73.78396606445312, -71.43359375, -69.08323669433594, -66.73286437988281, -64.38249969482422, -62.032135009765625, -59.68177032470703, -57.33140563964844, -54.98103713989258, -52.630672454833984, -50.28030776977539, -47.92993927001953, -45.5795783996582, -43.22921371459961, -40.878849029541016, -38.528480529785156, -36.17811584472656, -33.82775115966797, -31.477386474609375, -29.12701988220215, -26.776655197143555, -24.42629051208496, -22.075923919677734, -19.72555923461914, -17.375194549560547, -15.02482795715332, -12.674463272094727, -10.3240966796875, -7.973731994628906, -5.623366355895996, -3.273001194000244, -0.9226360321044922, 1.427729606628418, 3.778095245361328, 6.128459930419922, 8.478826522827148, 10.829191207885742, 13.179556846618652, 15.529922485351562, 17.880287170410156, 20.23065185546875, 22.581018447875977, 24.93138313293457, 27.281749725341797, 29.63211441040039, 31.982479095458984, 34.33284378051758, 36.68321228027344, 39.03357696533203, 41.383941650390625, 43.73430633544922, 46.08467102050781, 48.435035705566406, 50.785400390625, 53.135765075683594, 55.48612976074219, 57.83649826049805, 60.18686294555664, 62.537227630615234, 64.8875961303711, 67.23796081542969]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 14.0, 19.0, 25.0, 39.0, 61.0, 85.0, 157.0, 360.0, 903.0, 3305.0, 16835.0, 184996.0, 3893348.0, 81661.0, 9747.0, 1817.0, 473.0, 171.0, 76.0, 40.0, 36.0, 20.0, 17.0, 17.0, 10.0, 7.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-96.9375, -94.41015625, -91.8828125, -89.35546875, -86.828125, -84.30078125, -81.7734375, -79.24609375, -76.71875, -74.19140625, -71.6640625, -69.13671875, -66.609375, -64.08203125, -61.5546875, -59.02734375, -56.5, -53.97265625, -51.4453125, -48.91796875, -46.390625, -43.86328125, -41.3359375, -38.80859375, -36.28125, -33.75390625, -31.2265625, -28.69921875, -26.171875, -23.64453125, -21.1171875, -18.58984375, -16.0625, -13.53515625, -11.0078125, -8.48046875, -5.953125, -3.42578125, -0.8984375, 1.62890625, 4.15625, 6.68359375, 9.2109375, 11.73828125, 14.265625, 16.79296875, 19.3203125, 21.84765625, 24.375, 26.90234375, 29.4296875, 31.95703125, 34.484375, 37.01171875, 39.5390625, 42.06640625, 44.59375, 47.12109375, 49.6484375, 52.17578125, 54.703125, 57.23046875, 59.7578125, 62.28515625, 64.8125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 8.0, 7.0, 14.0, 22.0, 13.0, 33.0, 19.0, 25.0, 46.0, 55.0, 51.0, 73.0, 64.0, 67.0, 60.0, 59.0, 65.0, 61.0, 40.0, 45.0, 37.0, 34.0, 21.0, 18.0, 16.0, 12.0, 8.0, 4.0, 8.0, 2.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.62109375, -2.5520477294921875, -2.483001708984375, -2.4139556884765625, -2.34490966796875, -2.2758636474609375, -2.206817626953125, -2.1377716064453125, -2.0687255859375, -1.9996795654296875, -1.930633544921875, -1.8615875244140625, -1.79254150390625, -1.7234954833984375, -1.654449462890625, -1.5854034423828125, -1.516357421875, -1.4473114013671875, -1.378265380859375, -1.3092193603515625, -1.24017333984375, -1.1711273193359375, -1.102081298828125, -1.0330352783203125, -0.9639892578125, -0.8949432373046875, -0.825897216796875, -0.7568511962890625, -0.68780517578125, -0.6187591552734375, -0.549713134765625, -0.4806671142578125, -0.41162109375, -0.3425750732421875, -0.273529052734375, -0.2044830322265625, -0.13543701171875, -0.0663909912109375, 0.002655029296875, 0.0717010498046875, 0.1407470703125, 0.2097930908203125, 0.278839111328125, 0.3478851318359375, 0.41693115234375, 0.4859771728515625, 0.555023193359375, 0.6240692138671875, 0.693115234375, 0.7621612548828125, 0.831207275390625, 0.9002532958984375, 0.96929931640625, 1.0383453369140625, 1.107391357421875, 1.1764373779296875, 1.2454833984375, 1.3145294189453125, 1.383575439453125, 1.4526214599609375, 1.52166748046875, 1.5907135009765625, 1.659759521484375, 1.7288055419921875, 1.7978515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 7.0, 9.0, 11.0, 24.0, 19.0, 28.0, 43.0, 70.0, 181.0, 547.0, 1833.0, 8102.0, 52656.0, 813669.0, 3206393.0, 93933.0, 12748.0, 2613.0, 780.0, 297.0, 123.0, 75.0, 35.0, 30.0, 19.0, 13.0, 8.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.34375, -44.49951171875, -42.6552734375, -40.81103515625, -38.966796875, -37.12255859375, -35.2783203125, -33.43408203125, -31.58984375, -29.74560546875, -27.9013671875, -26.05712890625, -24.212890625, -22.36865234375, -20.5244140625, -18.68017578125, -16.8359375, -14.99169921875, -13.1474609375, -11.30322265625, -9.458984375, -7.61474609375, -5.7705078125, -3.92626953125, -2.08203125, -0.23779296875, 1.6064453125, 3.45068359375, 5.294921875, 7.13916015625, 8.9833984375, 10.82763671875, 12.671875, 14.51611328125, 16.3603515625, 18.20458984375, 20.048828125, 21.89306640625, 23.7373046875, 25.58154296875, 27.42578125, 29.27001953125, 31.1142578125, 32.95849609375, 34.802734375, 36.64697265625, 38.4912109375, 40.33544921875, 42.1796875, 44.02392578125, 45.8681640625, 47.71240234375, 49.556640625, 51.40087890625, 53.2451171875, 55.08935546875, 56.93359375, 58.77783203125, 60.6220703125, 62.46630859375, 64.310546875, 66.15478515625, 67.9990234375, 69.84326171875, 71.6875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 4.0, 13.0, 10.0, 28.0, 27.0, 26.0, 52.0, 54.0, 71.0, 104.0, 137.0, 229.0, 381.0, 1411.0, 569.0, 267.0, 175.0, 122.0, 87.0, 63.0, 41.0, 37.0, 31.0, 25.0, 20.0, 14.0, 8.0, 10.0, 4.0, 6.0, 6.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.78125, -4.60858154296875, -4.4359130859375, -4.26324462890625, -4.090576171875, -3.91790771484375, -3.7452392578125, -3.57257080078125, -3.39990234375, -3.22723388671875, -3.0545654296875, -2.88189697265625, -2.709228515625, -2.53656005859375, -2.3638916015625, -2.19122314453125, -2.0185546875, -1.84588623046875, -1.6732177734375, -1.50054931640625, -1.327880859375, -1.15521240234375, -0.9825439453125, -0.80987548828125, -0.63720703125, -0.46453857421875, -0.2918701171875, -0.11920166015625, 0.053466796875, 0.22613525390625, 0.3988037109375, 0.57147216796875, 0.744140625, 0.91680908203125, 1.0894775390625, 1.26214599609375, 1.434814453125, 1.60748291015625, 1.7801513671875, 1.95281982421875, 2.12548828125, 2.29815673828125, 2.4708251953125, 2.64349365234375, 2.816162109375, 2.98883056640625, 3.1614990234375, 3.33416748046875, 3.5068359375, 3.67950439453125, 3.8521728515625, 4.02484130859375, 4.197509765625, 4.37017822265625, 4.5428466796875, 4.71551513671875, 4.88818359375, 5.06085205078125, 5.2335205078125, 5.40618896484375, 5.578857421875, 5.75152587890625, 5.9241943359375, 6.09686279296875, 6.26953125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 9.0, 8.0, 31.0, 39.0, 86.0, 108.0, 153.0, 168.0, 129.0, 98.0, 68.0, 43.0, 18.0, 9.0, 13.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-88.38987731933594, -86.43927001953125, -84.48865509033203, -82.53804779052734, -80.58744049072266, -78.63683319091797, -76.68621826171875, -74.73561096191406, -72.78500366210938, -70.83439636230469, -68.88378143310547, -66.93317413330078, -64.9825668334961, -63.03195571899414, -61.08134460449219, -59.1307373046875, -57.18012619018555, -55.229515075683594, -53.278907775878906, -51.32829666137695, -49.377689361572266, -47.42707824707031, -45.476470947265625, -43.52585983276367, -41.57524871826172, -39.624637603759766, -37.67403030395508, -35.723419189453125, -33.77281188964844, -31.822200775146484, -29.871591567993164, -27.920982360839844, -25.970375061035156, -24.019765853881836, -22.069156646728516, -20.118545532226562, -18.167938232421875, -16.217327117919922, -14.266717910766602, -12.316108703613281, -10.365499496459961, -8.41489028930664, -6.464280605316162, -4.513670921325684, -2.5630617141723633, -0.612452507019043, 1.3381576538085938, 3.288766860961914, 5.239376068115234, 7.189985275268555, 9.140594482421875, 11.091204643249512, 13.041813850402832, 14.992423057556152, 16.94303321838379, 18.89364242553711, 20.84425163269043, 22.79486083984375, 24.74547004699707, 26.69607925415039, 28.646690368652344, 30.59729766845703, 32.547908782958984, 34.49851989746094, 36.449127197265625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 10.0, 13.0, 16.0, 15.0, 16.0, 19.0, 21.0, 45.0, 42.0, 46.0, 52.0, 51.0, 55.0, 56.0, 39.0, 56.0, 52.0, 67.0, 48.0, 29.0, 32.0, 42.0, 36.0, 22.0, 17.0, 19.0, 17.0, 13.0, 16.0, 11.0, 6.0, 5.0, 5.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.370193481445312, -24.43484115600586, -23.49949073791504, -22.564138412475586, -21.628787994384766, -20.693435668945312, -19.75808334350586, -18.82273292541504, -17.88738250732422, -16.952030181884766, -16.016679763793945, -15.081327438354492, -14.145977020263672, -13.210624694824219, -12.275273323059082, -11.339921951293945, -10.404569625854492, -9.469218254089355, -8.533866882324219, -7.598515033721924, -6.663163661956787, -5.72781229019165, -4.7924604415893555, -3.8571090698242188, -2.921757698059082, -1.9864062070846558, -1.0510547161102295, -0.11570310592651367, 0.819648265838623, 1.7549996376037598, 2.6903514862060547, 3.6257028579711914, 4.561054229736328, 5.496405601501465, 6.431756973266602, 7.3671088218688965, 8.302459716796875, 9.237812042236328, 10.173163414001465, 11.108514785766602, 12.043866157531738, 12.979217529296875, 13.914568901062012, 14.849920272827148, 15.785272598266602, 16.720623016357422, 17.655975341796875, 18.591327667236328, 19.52667808532715, 20.4620304107666, 21.397380828857422, 22.332733154296875, 23.268083572387695, 24.20343589782715, 25.13878631591797, 26.074138641357422, 27.009490966796875, 27.944843292236328, 28.88019371032715, 29.8155460357666, 30.750896453857422, 31.686248779296875, 32.62160110473633, 33.55695343017578, 34.49230194091797]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 15.0, 18.0, 20.0, 34.0, 48.0, 57.0, 86.0, 98.0, 164.0, 240.0, 385.0, 579.0, 1025.0, 1844.0, 4270.0, 10299.0, 30075.0, 94134.0, 278708.0, 384147.0, 162029.0, 50984.0, 16872.0, 6198.0, 2717.0, 1339.0, 753.0, 431.0, 289.0, 215.0, 143.0, 80.0, 59.0, 49.0, 40.0, 28.0, 14.0, 13.0, 10.0, 5.0, 7.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.171875, -19.56494140625, -18.9580078125, -18.35107421875, -17.744140625, -17.13720703125, -16.5302734375, -15.92333984375, -15.31640625, -14.70947265625, -14.1025390625, -13.49560546875, -12.888671875, -12.28173828125, -11.6748046875, -11.06787109375, -10.4609375, -9.85400390625, -9.2470703125, -8.64013671875, -8.033203125, -7.42626953125, -6.8193359375, -6.21240234375, -5.60546875, -4.99853515625, -4.3916015625, -3.78466796875, -3.177734375, -2.57080078125, -1.9638671875, -1.35693359375, -0.75, -0.14306640625, 0.4638671875, 1.07080078125, 1.677734375, 2.28466796875, 2.8916015625, 3.49853515625, 4.10546875, 4.71240234375, 5.3193359375, 5.92626953125, 6.533203125, 7.14013671875, 7.7470703125, 8.35400390625, 8.9609375, 9.56787109375, 10.1748046875, 10.78173828125, 11.388671875, 11.99560546875, 12.6025390625, 13.20947265625, 13.81640625, 14.42333984375, 15.0302734375, 15.63720703125, 16.244140625, 16.85107421875, 17.4580078125, 18.06494140625, 18.671875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 10.0, 16.0, 32.0, 40.0, 34.0, 54.0, 53.0, 71.0, 85.0, 71.0, 88.0, 98.0, 74.0, 53.0, 45.0, 34.0, 32.0, 28.0, 24.0, 9.0, 15.0, 10.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.353515625, -3.257843017578125, -3.16217041015625, -3.066497802734375, -2.9708251953125, -2.875152587890625, -2.77947998046875, -2.683807373046875, -2.588134765625, -2.492462158203125, -2.39678955078125, -2.301116943359375, -2.2054443359375, -2.109771728515625, -2.01409912109375, -1.918426513671875, -1.82275390625, -1.727081298828125, -1.63140869140625, -1.535736083984375, -1.4400634765625, -1.344390869140625, -1.24871826171875, -1.153045654296875, -1.057373046875, -0.961700439453125, -0.86602783203125, -0.770355224609375, -0.6746826171875, -0.579010009765625, -0.48333740234375, -0.387664794921875, -0.2919921875, -0.196319580078125, -0.10064697265625, -0.004974365234375, 0.0906982421875, 0.186370849609375, 0.28204345703125, 0.377716064453125, 0.473388671875, 0.569061279296875, 0.66473388671875, 0.760406494140625, 0.8560791015625, 0.951751708984375, 1.04742431640625, 1.143096923828125, 1.23876953125, 1.334442138671875, 1.43011474609375, 1.525787353515625, 1.6214599609375, 1.717132568359375, 1.81280517578125, 1.908477783203125, 2.004150390625, 2.099822998046875, 2.19549560546875, 2.291168212890625, 2.3868408203125, 2.482513427734375, 2.57818603515625, 2.673858642578125, 2.76953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 13.0, 21.0, 33.0, 46.0, 51.0, 76.0, 102.0, 157.0, 212.0, 282.0, 420.0, 690.0, 1121.0, 2044.0, 3794.0, 8252.0, 19812.0, 52580.0, 144428.0, 334033.0, 290773.0, 115325.0, 42418.0, 16268.0, 7091.0, 3464.0, 1853.0, 1075.0, 690.0, 440.0, 279.0, 202.0, 144.0, 91.0, 61.0, 50.0, 40.0, 33.0, 26.0, 15.0, 9.0, 5.0, 10.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.78125, -14.251220703125, -13.72119140625, -13.191162109375, -12.6611328125, -12.131103515625, -11.60107421875, -11.071044921875, -10.541015625, -10.010986328125, -9.48095703125, -8.950927734375, -8.4208984375, -7.890869140625, -7.36083984375, -6.830810546875, -6.30078125, -5.770751953125, -5.24072265625, -4.710693359375, -4.1806640625, -3.650634765625, -3.12060546875, -2.590576171875, -2.060546875, -1.530517578125, -1.00048828125, -0.470458984375, 0.0595703125, 0.589599609375, 1.11962890625, 1.649658203125, 2.1796875, 2.709716796875, 3.23974609375, 3.769775390625, 4.2998046875, 4.829833984375, 5.35986328125, 5.889892578125, 6.419921875, 6.949951171875, 7.47998046875, 8.010009765625, 8.5400390625, 9.070068359375, 9.60009765625, 10.130126953125, 10.66015625, 11.190185546875, 11.72021484375, 12.250244140625, 12.7802734375, 13.310302734375, 13.84033203125, 14.370361328125, 14.900390625, 15.430419921875, 15.96044921875, 16.490478515625, 17.0205078125, 17.550537109375, 18.08056640625, 18.610595703125, 19.140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 7.0, 4.0, 8.0, 15.0, 10.0, 20.0, 24.0, 24.0, 23.0, 36.0, 35.0, 44.0, 54.0, 50.0, 67.0, 53.0, 54.0, 57.0, 66.0, 39.0, 48.0, 44.0, 30.0, 30.0, 32.0, 16.0, 26.0, 17.0, 14.0, 15.0, 11.0, 6.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.6796875, -13.2677001953125, -12.855712890625, -12.4437255859375, -12.03173828125, -11.6197509765625, -11.207763671875, -10.7957763671875, -10.3837890625, -9.9718017578125, -9.559814453125, -9.1478271484375, -8.73583984375, -8.3238525390625, -7.911865234375, -7.4998779296875, -7.087890625, -6.6759033203125, -6.263916015625, -5.8519287109375, -5.43994140625, -5.0279541015625, -4.615966796875, -4.2039794921875, -3.7919921875, -3.3800048828125, -2.968017578125, -2.5560302734375, -2.14404296875, -1.7320556640625, -1.320068359375, -0.9080810546875, -0.49609375, -0.0841064453125, 0.327880859375, 0.7398681640625, 1.15185546875, 1.5638427734375, 1.975830078125, 2.3878173828125, 2.7998046875, 3.2117919921875, 3.623779296875, 4.0357666015625, 4.44775390625, 4.8597412109375, 5.271728515625, 5.6837158203125, 6.095703125, 6.5076904296875, 6.919677734375, 7.3316650390625, 7.74365234375, 8.1556396484375, 8.567626953125, 8.9796142578125, 9.3916015625, 9.8035888671875, 10.215576171875, 10.6275634765625, 11.03955078125, 11.4515380859375, 11.863525390625, 12.2755126953125, 12.6875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 10.0, 10.0, 15.0, 15.0, 21.0, 30.0, 56.0, 76.0, 120.0, 168.0, 291.0, 534.0, 878.0, 1695.0, 3490.0, 8124.0, 21730.0, 67385.0, 224752.0, 407672.0, 212185.0, 63838.0, 20599.0, 7704.0, 3387.0, 1587.0, 841.0, 500.0, 282.0, 168.0, 106.0, 74.0, 55.0, 39.0, 30.0, 23.0, 12.0, 10.0, 11.0, 7.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.5546875, -8.291259765625, -8.02783203125, -7.764404296875, -7.5009765625, -7.237548828125, -6.97412109375, -6.710693359375, -6.447265625, -6.183837890625, -5.92041015625, -5.656982421875, -5.3935546875, -5.130126953125, -4.86669921875, -4.603271484375, -4.33984375, -4.076416015625, -3.81298828125, -3.549560546875, -3.2861328125, -3.022705078125, -2.75927734375, -2.495849609375, -2.232421875, -1.968994140625, -1.70556640625, -1.442138671875, -1.1787109375, -0.915283203125, -0.65185546875, -0.388427734375, -0.125, 0.138427734375, 0.40185546875, 0.665283203125, 0.9287109375, 1.192138671875, 1.45556640625, 1.718994140625, 1.982421875, 2.245849609375, 2.50927734375, 2.772705078125, 3.0361328125, 3.299560546875, 3.56298828125, 3.826416015625, 4.08984375, 4.353271484375, 4.61669921875, 4.880126953125, 5.1435546875, 5.406982421875, 5.67041015625, 5.933837890625, 6.197265625, 6.460693359375, 6.72412109375, 6.987548828125, 7.2509765625, 7.514404296875, 7.77783203125, 8.041259765625, 8.3046875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 7.0, 8.0, 5.0, 8.0, 10.0, 14.0, 16.0, 26.0, 27.0, 27.0, 30.0, 51.0, 56.0, 69.0, 82.0, 97.0, 94.0, 63.0, 58.0, 37.0, 37.0, 33.0, 29.0, 23.0, 13.0, 19.0, 15.0, 4.0, 5.0, 1.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011835098266601562, -0.0011445730924606323, -0.0011056363582611084, -0.0010666996240615845, -0.0010277628898620605, -0.0009888261556625366, -0.0009498894214630127, -0.0009109526872634888, -0.0008720159530639648, -0.0008330792188644409, -0.000794142484664917, -0.0007552057504653931, -0.0007162690162658691, -0.0006773322820663452, -0.0006383955478668213, -0.0005994588136672974, -0.0005605220794677734, -0.0005215853452682495, -0.0004826486110687256, -0.00044371187686920166, -0.00040477514266967773, -0.0003658384084701538, -0.0003269016742706299, -0.00028796494007110596, -0.00024902820587158203, -0.0002100914716720581, -0.00017115473747253418, -0.00013221800327301025, -9.328126907348633e-05, -5.43445348739624e-05, -1.5407800674438477e-05, 2.352893352508545e-05, 6.246566772460938e-05, 0.0001014024019241333, 0.00014033913612365723, 0.00017927587032318115, 0.00021821260452270508, 0.000257149338722229, 0.00029608607292175293, 0.00033502280712127686, 0.0003739595413208008, 0.0004128962755203247, 0.00045183300971984863, 0.0004907697439193726, 0.0005297064781188965, 0.0005686432123184204, 0.0006075799465179443, 0.0006465166807174683, 0.0006854534149169922, 0.0007243901491165161, 0.00076332688331604, 0.000802263617515564, 0.0008412003517150879, 0.0008801370859146118, 0.0009190738201141357, 0.0009580105543136597, 0.0009969472885131836, 0.0010358840227127075, 0.0010748207569122314, 0.0011137574911117554, 0.0011526942253112793, 0.0011916309595108032, 0.0012305676937103271, 0.001269504427909851, 0.001308441162109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 7.0, 6.0, 13.0, 14.0, 26.0, 32.0, 50.0, 60.0, 105.0, 170.0, 229.0, 361.0, 566.0, 1073.0, 2062.0, 4580.0, 11350.0, 34244.0, 131849.0, 422050.0, 318182.0, 82682.0, 23133.0, 8276.0, 3478.0, 1679.0, 936.0, 476.0, 277.0, 160.0, 128.0, 92.0, 51.0, 46.0, 23.0, 23.0, 15.0, 9.0, 12.0, 3.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.7890625, -8.4842529296875, -8.179443359375, -7.8746337890625, -7.56982421875, -7.2650146484375, -6.960205078125, -6.6553955078125, -6.3505859375, -6.0457763671875, -5.740966796875, -5.4361572265625, -5.13134765625, -4.8265380859375, -4.521728515625, -4.2169189453125, -3.912109375, -3.6072998046875, -3.302490234375, -2.9976806640625, -2.69287109375, -2.3880615234375, -2.083251953125, -1.7784423828125, -1.4736328125, -1.1688232421875, -0.864013671875, -0.5592041015625, -0.25439453125, 0.0504150390625, 0.355224609375, 0.6600341796875, 0.96484375, 1.2696533203125, 1.574462890625, 1.8792724609375, 2.18408203125, 2.4888916015625, 2.793701171875, 3.0985107421875, 3.4033203125, 3.7081298828125, 4.012939453125, 4.3177490234375, 4.62255859375, 4.9273681640625, 5.232177734375, 5.5369873046875, 5.841796875, 6.1466064453125, 6.451416015625, 6.7562255859375, 7.06103515625, 7.3658447265625, 7.670654296875, 7.9754638671875, 8.2802734375, 8.5850830078125, 8.889892578125, 9.1947021484375, 9.49951171875, 9.8043212890625, 10.109130859375, 10.4139404296875, 10.71875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 10.0, 11.0, 7.0, 27.0, 13.0, 32.0, 41.0, 34.0, 60.0, 63.0, 86.0, 85.0, 91.0, 89.0, 79.0, 53.0, 38.0, 52.0, 33.0, 14.0, 21.0, 8.0, 8.0, 8.0, 8.0, 5.0, 6.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1953125, -5.0108642578125, -4.826416015625, -4.6419677734375, -4.45751953125, -4.2730712890625, -4.088623046875, -3.9041748046875, -3.7197265625, -3.5352783203125, -3.350830078125, -3.1663818359375, -2.98193359375, -2.7974853515625, -2.613037109375, -2.4285888671875, -2.244140625, -2.0596923828125, -1.875244140625, -1.6907958984375, -1.50634765625, -1.3218994140625, -1.137451171875, -0.9530029296875, -0.7685546875, -0.5841064453125, -0.399658203125, -0.2152099609375, -0.03076171875, 0.1536865234375, 0.338134765625, 0.5225830078125, 0.70703125, 0.8914794921875, 1.075927734375, 1.2603759765625, 1.44482421875, 1.6292724609375, 1.813720703125, 1.9981689453125, 2.1826171875, 2.3670654296875, 2.551513671875, 2.7359619140625, 2.92041015625, 3.1048583984375, 3.289306640625, 3.4737548828125, 3.658203125, 3.8426513671875, 4.027099609375, 4.2115478515625, 4.39599609375, 4.5804443359375, 4.764892578125, 4.9493408203125, 5.1337890625, 5.3182373046875, 5.502685546875, 5.6871337890625, 5.87158203125, 6.0560302734375, 6.240478515625, 6.4249267578125, 6.609375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 13.0, 9.0, 17.0, 28.0, 41.0, 47.0, 58.0, 90.0, 96.0, 91.0, 116.0, 94.0, 85.0, 51.0, 41.0, 32.0, 21.0, 19.0, 14.0, 9.0, 0.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.33743286132812, -86.41983795166016, -83.50224304199219, -80.58464813232422, -77.66705322265625, -74.74945068359375, -71.83185577392578, -68.91426086425781, -65.99666595458984, -63.079071044921875, -60.161476135253906, -57.24387741088867, -54.3262825012207, -51.408687591552734, -48.4910888671875, -45.57349395751953, -42.65589904785156, -39.738304138183594, -36.820709228515625, -33.90311050415039, -30.985515594482422, -28.067920684814453, -25.15032386779785, -22.23272705078125, -19.31513214111328, -16.397537231445312, -13.479940414428711, -10.562344551086426, -7.644748687744141, -4.7271528244018555, -1.8095569610595703, 1.1080398559570312, 4.025634765625, 6.943230628967285, 9.86082649230957, 12.778422355651855, 15.69601821899414, 18.61361312866211, 21.53120994567871, 24.448806762695312, 27.36640167236328, 30.28399658203125, 33.20159149169922, 36.11919021606445, 39.03678512573242, 41.95438003540039, 44.871978759765625, 47.789573669433594, 50.70716857910156, 53.62476348876953, 56.5423583984375, 59.459957122802734, 62.3775520324707, 65.29515075683594, 68.2127456665039, 71.13034057617188, 74.04793548583984, 76.96553039550781, 79.88312530517578, 82.80072021484375, 85.71832275390625, 88.63591766357422, 91.55351257324219, 94.47110748291016, 97.38870239257812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 9.0, 9.0, 10.0, 16.0, 21.0, 25.0, 28.0, 45.0, 44.0, 42.0, 71.0, 67.0, 81.0, 64.0, 86.0, 68.0, 62.0, 49.0, 41.0, 33.0, 38.0, 23.0, 19.0, 11.0, 11.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-134.0576171875, -130.43565368652344, -126.81368255615234, -123.19171905517578, -119.56974792480469, -115.94778442382812, -112.32582092285156, -108.703857421875, -105.0818862915039, -101.45992279052734, -97.83795166015625, -94.21598815917969, -90.59402465820312, -86.97205352783203, -83.35009002685547, -79.72811889648438, -76.10615539550781, -72.48419189453125, -68.86222076416016, -65.2402572631836, -61.618289947509766, -57.99632263183594, -54.374359130859375, -50.75239181518555, -47.13042449951172, -43.50845718383789, -39.88648986816406, -36.2645263671875, -32.64255905151367, -29.020591735839844, -25.39862632751465, -21.776660919189453, -18.154693603515625, -14.532727241516113, -10.910760879516602, -7.28879451751709, -3.666828155517578, -0.04486083984375, 3.5771045684814453, 7.199069976806641, 10.821037292480469, 14.44300365447998, 18.064970016479492, 21.686935424804688, 25.308902740478516, 28.930870056152344, 32.552833557128906, 36.174800872802734, 39.79676818847656, 43.41873550415039, 47.04070281982422, 50.66266632080078, 54.28463363647461, 57.90660095214844, 61.528564453125, 65.15052795410156, 68.77249908447266, 72.39446258544922, 76.01643371582031, 79.63839721679688, 83.26036071777344, 86.88233184814453, 90.5042953491211, 94.12626647949219, 97.74822998046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 13.0, 22.0, 19.0, 23.0, 52.0, 73.0, 126.0, 171.0, 361.0, 974.0, 3379.0, 19623.0, 718167.0, 3419724.0, 25430.0, 4217.0, 1160.0, 380.0, 156.0, 86.0, 36.0, 25.0, 17.0, 15.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-107.1875, -104.638671875, -102.08984375, -99.541015625, -96.9921875, -94.443359375, -91.89453125, -89.345703125, -86.796875, -84.248046875, -81.69921875, -79.150390625, -76.6015625, -74.052734375, -71.50390625, -68.955078125, -66.40625, -63.857421875, -61.30859375, -58.759765625, -56.2109375, -53.662109375, -51.11328125, -48.564453125, -46.015625, -43.466796875, -40.91796875, -38.369140625, -35.8203125, -33.271484375, -30.72265625, -28.173828125, -25.625, -23.076171875, -20.52734375, -17.978515625, -15.4296875, -12.880859375, -10.33203125, -7.783203125, -5.234375, -2.685546875, -0.13671875, 2.412109375, 4.9609375, 7.509765625, 10.05859375, 12.607421875, 15.15625, 17.705078125, 20.25390625, 22.802734375, 25.3515625, 27.900390625, 30.44921875, 32.998046875, 35.546875, 38.095703125, 40.64453125, 43.193359375, 45.7421875, 48.291015625, 50.83984375, 53.388671875, 55.9375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 13.0, 12.0, 29.0, 21.0, 32.0, 40.0, 53.0, 59.0, 71.0, 72.0, 91.0, 88.0, 87.0, 78.0, 58.0, 51.0, 39.0, 29.0, 19.0, 16.0, 13.0, 8.0, 5.0, 10.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 5.0], "bins": [-5.42578125, -5.3023681640625, -5.178955078125, -5.0555419921875, -4.93212890625, -4.8087158203125, -4.685302734375, -4.5618896484375, -4.4384765625, -4.3150634765625, -4.191650390625, -4.0682373046875, -3.94482421875, -3.8214111328125, -3.697998046875, -3.5745849609375, -3.451171875, -3.3277587890625, -3.204345703125, -3.0809326171875, -2.95751953125, -2.8341064453125, -2.710693359375, -2.5872802734375, -2.4638671875, -2.3404541015625, -2.217041015625, -2.0936279296875, -1.97021484375, -1.8468017578125, -1.723388671875, -1.5999755859375, -1.4765625, -1.3531494140625, -1.229736328125, -1.1063232421875, -0.98291015625, -0.8594970703125, -0.736083984375, -0.6126708984375, -0.4892578125, -0.3658447265625, -0.242431640625, -0.1190185546875, 0.00439453125, 0.1278076171875, 0.251220703125, 0.3746337890625, 0.498046875, 0.6214599609375, 0.744873046875, 0.8682861328125, 0.99169921875, 1.1151123046875, 1.238525390625, 1.3619384765625, 1.4853515625, 1.6087646484375, 1.732177734375, 1.8555908203125, 1.97900390625, 2.1024169921875, 2.225830078125, 2.3492431640625, 2.47265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 5.0, 6.0, 15.0, 23.0, 53.0, 49.0, 76.0, 135.0, 183.0, 304.0, 451.0, 838.0, 1570.0, 2924.0, 6572.0, 15447.0, 43284.0, 154540.0, 1444293.0, 2280282.0, 168308.0, 45379.0, 16197.0, 6822.0, 3116.0, 1445.0, 806.0, 471.0, 269.0, 157.0, 84.0, 71.0, 43.0, 24.0, 19.0, 15.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-29.875, -29.128662109375, -28.38232421875, -27.635986328125, -26.8896484375, -26.143310546875, -25.39697265625, -24.650634765625, -23.904296875, -23.157958984375, -22.41162109375, -21.665283203125, -20.9189453125, -20.172607421875, -19.42626953125, -18.679931640625, -17.93359375, -17.187255859375, -16.44091796875, -15.694580078125, -14.9482421875, -14.201904296875, -13.45556640625, -12.709228515625, -11.962890625, -11.216552734375, -10.47021484375, -9.723876953125, -8.9775390625, -8.231201171875, -7.48486328125, -6.738525390625, -5.9921875, -5.245849609375, -4.49951171875, -3.753173828125, -3.0068359375, -2.260498046875, -1.51416015625, -0.767822265625, -0.021484375, 0.724853515625, 1.47119140625, 2.217529296875, 2.9638671875, 3.710205078125, 4.45654296875, 5.202880859375, 5.94921875, 6.695556640625, 7.44189453125, 8.188232421875, 8.9345703125, 9.680908203125, 10.42724609375, 11.173583984375, 11.919921875, 12.666259765625, 13.41259765625, 14.158935546875, 14.9052734375, 15.651611328125, 16.39794921875, 17.144287109375, 17.890625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 3.0, 7.0, 5.0, 12.0, 9.0, 14.0, 19.0, 38.0, 57.0, 66.0, 115.0, 207.0, 442.0, 1777.0, 639.0, 263.0, 153.0, 77.0, 56.0, 31.0, 28.0, 13.0, 12.0, 7.0, 5.0, 9.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.95703125, -7.70562744140625, -7.4542236328125, -7.20281982421875, -6.951416015625, -6.70001220703125, -6.4486083984375, -6.19720458984375, -5.94580078125, -5.69439697265625, -5.4429931640625, -5.19158935546875, -4.940185546875, -4.68878173828125, -4.4373779296875, -4.18597412109375, -3.9345703125, -3.68316650390625, -3.4317626953125, -3.18035888671875, -2.928955078125, -2.67755126953125, -2.4261474609375, -2.17474365234375, -1.92333984375, -1.67193603515625, -1.4205322265625, -1.16912841796875, -0.917724609375, -0.66632080078125, -0.4149169921875, -0.16351318359375, 0.087890625, 0.33929443359375, 0.5906982421875, 0.84210205078125, 1.093505859375, 1.34490966796875, 1.5963134765625, 1.84771728515625, 2.09912109375, 2.35052490234375, 2.6019287109375, 2.85333251953125, 3.104736328125, 3.35614013671875, 3.6075439453125, 3.85894775390625, 4.1103515625, 4.36175537109375, 4.6131591796875, 4.86456298828125, 5.115966796875, 5.36737060546875, 5.6187744140625, 5.87017822265625, 6.12158203125, 6.37298583984375, 6.6243896484375, 6.87579345703125, 7.127197265625, 7.37860107421875, 7.6300048828125, 7.88140869140625, 8.1328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 9.0, 11.0, 15.0, 34.0, 70.0, 107.0, 133.0, 165.0, 113.0, 135.0, 94.0, 31.0, 34.0, 19.0, 13.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.7917366027832, -58.12405014038086, -56.45635986328125, -54.788673400878906, -53.12098693847656, -51.45329666137695, -49.78561019897461, -48.117919921875, -46.450233459472656, -44.78254699707031, -43.1148567199707, -41.44717025756836, -39.77947998046875, -38.111793518066406, -36.44410705566406, -34.77642059326172, -33.10873031616211, -31.441041946411133, -29.773353576660156, -28.105667114257812, -26.437978744506836, -24.77029037475586, -23.102603912353516, -21.43491554260254, -19.767227172851562, -18.099538803100586, -16.43185043334961, -14.764163970947266, -13.096475601196289, -11.428787231445312, -9.761099815368652, -8.093412399291992, -6.425727844238281, -4.758039951324463, -3.0903520584106445, -1.4226641654968262, 0.2450237274169922, 1.9127120971679688, 3.580399513244629, 5.248086929321289, 6.915775299072266, 8.583463668823242, 10.251151084899902, 11.918838500976562, 13.586526870727539, 15.254215240478516, 16.92190170288086, 18.589590072631836, 20.257278442382812, 21.92496681213379, 23.592655181884766, 25.26034164428711, 26.928030014038086, 28.595718383789062, 30.263404846191406, 31.931093215942383, 33.59878158569336, 35.2664680480957, 36.93415832519531, 38.601844787597656, 40.26953125, 41.93722152709961, 43.60490798950195, 45.27259826660156, 46.940284729003906]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 4.0, 8.0, 5.0, 11.0, 8.0, 7.0, 20.0, 18.0, 23.0, 33.0, 40.0, 33.0, 36.0, 53.0, 43.0, 45.0, 41.0, 50.0, 52.0, 41.0, 51.0, 47.0, 42.0, 39.0, 45.0, 36.0, 20.0, 22.0, 30.0, 17.0, 15.0, 8.0, 11.0, 9.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.309494018554688, -21.565593719482422, -20.82169532775879, -20.077795028686523, -19.33389663696289, -18.589996337890625, -17.84609603881836, -17.102195739746094, -16.35829734802246, -15.614398002624512, -14.870498657226562, -14.126598358154297, -13.382699012756348, -12.638799667358398, -11.894899368286133, -11.151000022888184, -10.407100677490234, -9.663201332092285, -8.919301986694336, -8.17540168762207, -7.431502342224121, -6.687602996826172, -5.9437031745910645, -5.199803352355957, -4.455904006958008, -3.7120044231414795, -2.968104839324951, -2.224205255508423, -1.4803056716918945, -0.7364060878753662, 0.007493495941162109, 0.7513933181762695, 1.4952945709228516, 2.23919415473938, 2.983093738555908, 3.7269933223724365, 4.470892906188965, 5.214792251586914, 5.9586920738220215, 6.702591896057129, 7.446491241455078, 8.190390586853027, 8.934289932250977, 9.678190231323242, 10.422089576721191, 11.16598892211914, 11.909889221191406, 12.653788566589355, 13.397687911987305, 14.141587257385254, 14.885486602783203, 15.629386901855469, 16.373287200927734, 17.117185592651367, 17.861085891723633, 18.604984283447266, 19.34888458251953, 20.092784881591797, 20.83668327331543, 21.580583572387695, 22.324481964111328, 23.068382263183594, 23.81228256225586, 24.556182861328125, 25.300081253051758]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 9.0, 6.0, 7.0, 8.0, 15.0, 24.0, 31.0, 49.0, 50.0, 66.0, 81.0, 120.0, 144.0, 224.0, 327.0, 573.0, 887.0, 1723.0, 3765.0, 9208.0, 26493.0, 86191.0, 269275.0, 405311.0, 165477.0, 50170.0, 16234.0, 6142.0, 2510.0, 1236.0, 702.0, 460.0, 255.0, 188.0, 154.0, 121.0, 73.0, 59.0, 50.0, 51.0, 19.0, 11.0, 14.0, 14.0, 7.0, 8.0, 5.0, 5.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8671875, -15.3060302734375, -14.744873046875, -14.1837158203125, -13.62255859375, -13.0614013671875, -12.500244140625, -11.9390869140625, -11.3779296875, -10.8167724609375, -10.255615234375, -9.6944580078125, -9.13330078125, -8.5721435546875, -8.010986328125, -7.4498291015625, -6.888671875, -6.3275146484375, -5.766357421875, -5.2052001953125, -4.64404296875, -4.0828857421875, -3.521728515625, -2.9605712890625, -2.3994140625, -1.8382568359375, -1.277099609375, -0.7159423828125, -0.15478515625, 0.4063720703125, 0.967529296875, 1.5286865234375, 2.08984375, 2.6510009765625, 3.212158203125, 3.7733154296875, 4.33447265625, 4.8956298828125, 5.456787109375, 6.0179443359375, 6.5791015625, 7.1402587890625, 7.701416015625, 8.2625732421875, 8.82373046875, 9.3848876953125, 9.946044921875, 10.5072021484375, 11.068359375, 11.6295166015625, 12.190673828125, 12.7518310546875, 13.31298828125, 13.8741455078125, 14.435302734375, 14.9964599609375, 15.5576171875, 16.1187744140625, 16.679931640625, 17.2410888671875, 17.80224609375, 18.3634033203125, 18.924560546875, 19.4857177734375, 20.046875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 9.0, 17.0, 25.0, 37.0, 56.0, 60.0, 85.0, 91.0, 96.0, 97.0, 108.0, 79.0, 64.0, 39.0, 39.0, 34.0, 22.0, 11.0, 8.0, 5.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.953125, -5.808380126953125, -5.66363525390625, -5.518890380859375, -5.3741455078125, -5.229400634765625, -5.08465576171875, -4.939910888671875, -4.795166015625, -4.650421142578125, -4.50567626953125, -4.360931396484375, -4.2161865234375, -4.071441650390625, -3.92669677734375, -3.781951904296875, -3.63720703125, -3.492462158203125, -3.34771728515625, -3.202972412109375, -3.0582275390625, -2.913482666015625, -2.76873779296875, -2.623992919921875, -2.479248046875, -2.334503173828125, -2.18975830078125, -2.045013427734375, -1.9002685546875, -1.755523681640625, -1.61077880859375, -1.466033935546875, -1.3212890625, -1.176544189453125, -1.03179931640625, -0.887054443359375, -0.7423095703125, -0.597564697265625, -0.45281982421875, -0.308074951171875, -0.163330078125, -0.018585205078125, 0.12615966796875, 0.270904541015625, 0.4156494140625, 0.560394287109375, 0.70513916015625, 0.849884033203125, 0.99462890625, 1.139373779296875, 1.28411865234375, 1.428863525390625, 1.5736083984375, 1.718353271484375, 1.86309814453125, 2.007843017578125, 2.152587890625, 2.297332763671875, 2.44207763671875, 2.586822509765625, 2.7315673828125, 2.876312255859375, 3.02105712890625, 3.165802001953125, 3.310546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 10.0, 8.0, 7.0, 16.0, 13.0, 27.0, 31.0, 51.0, 67.0, 75.0, 103.0, 156.0, 205.0, 318.0, 409.0, 700.0, 1084.0, 1867.0, 3275.0, 6585.0, 13230.0, 29012.0, 68208.0, 155799.0, 298746.0, 252670.0, 119281.0, 51484.0, 22390.0, 10448.0, 5125.0, 2760.0, 1541.0, 956.0, 559.0, 371.0, 272.0, 192.0, 140.0, 99.0, 75.0, 46.0, 45.0, 20.0, 25.0, 11.0, 10.0, 12.0, 5.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.6484375, -10.3031005859375, -9.957763671875, -9.6124267578125, -9.26708984375, -8.9217529296875, -8.576416015625, -8.2310791015625, -7.8857421875, -7.5404052734375, -7.195068359375, -6.8497314453125, -6.50439453125, -6.1590576171875, -5.813720703125, -5.4683837890625, -5.123046875, -4.7777099609375, -4.432373046875, -4.0870361328125, -3.74169921875, -3.3963623046875, -3.051025390625, -2.7056884765625, -2.3603515625, -2.0150146484375, -1.669677734375, -1.3243408203125, -0.97900390625, -0.6336669921875, -0.288330078125, 0.0570068359375, 0.40234375, 0.7476806640625, 1.093017578125, 1.4383544921875, 1.78369140625, 2.1290283203125, 2.474365234375, 2.8197021484375, 3.1650390625, 3.5103759765625, 3.855712890625, 4.2010498046875, 4.54638671875, 4.8917236328125, 5.237060546875, 5.5823974609375, 5.927734375, 6.2730712890625, 6.618408203125, 6.9637451171875, 7.30908203125, 7.6544189453125, 7.999755859375, 8.3450927734375, 8.6904296875, 9.0357666015625, 9.381103515625, 9.7264404296875, 10.07177734375, 10.4171142578125, 10.762451171875, 11.1077880859375, 11.453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 4.0, 4.0, 2.0, 6.0, 17.0, 13.0, 22.0, 20.0, 26.0, 24.0, 30.0, 35.0, 41.0, 50.0, 46.0, 57.0, 52.0, 50.0, 57.0, 50.0, 51.0, 37.0, 55.0, 36.0, 36.0, 32.0, 29.0, 28.0, 25.0, 14.0, 18.0, 7.0, 3.0, 6.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.71875, -11.315185546875, -10.91162109375, -10.508056640625, -10.1044921875, -9.700927734375, -9.29736328125, -8.893798828125, -8.490234375, -8.086669921875, -7.68310546875, -7.279541015625, -6.8759765625, -6.472412109375, -6.06884765625, -5.665283203125, -5.26171875, -4.858154296875, -4.45458984375, -4.051025390625, -3.6474609375, -3.243896484375, -2.84033203125, -2.436767578125, -2.033203125, -1.629638671875, -1.22607421875, -0.822509765625, -0.4189453125, -0.015380859375, 0.38818359375, 0.791748046875, 1.1953125, 1.598876953125, 2.00244140625, 2.406005859375, 2.8095703125, 3.213134765625, 3.61669921875, 4.020263671875, 4.423828125, 4.827392578125, 5.23095703125, 5.634521484375, 6.0380859375, 6.441650390625, 6.84521484375, 7.248779296875, 7.65234375, 8.055908203125, 8.45947265625, 8.863037109375, 9.2666015625, 9.670166015625, 10.07373046875, 10.477294921875, 10.880859375, 11.284423828125, 11.68798828125, 12.091552734375, 12.4951171875, 12.898681640625, 13.30224609375, 13.705810546875, 14.109375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 3.0, 13.0, 10.0, 12.0, 13.0, 24.0, 42.0, 47.0, 97.0, 148.0, 269.0, 444.0, 873.0, 1961.0, 5188.0, 16260.0, 61534.0, 261244.0, 474401.0, 168134.0, 40118.0, 10935.0, 3673.0, 1447.0, 693.0, 377.0, 195.0, 125.0, 84.0, 51.0, 42.0, 30.0, 17.0, 12.0, 10.0, 8.0, 5.0, 3.0, 1.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.08203125, -6.86962890625, -6.6572265625, -6.44482421875, -6.232421875, -6.02001953125, -5.8076171875, -5.59521484375, -5.3828125, -5.17041015625, -4.9580078125, -4.74560546875, -4.533203125, -4.32080078125, -4.1083984375, -3.89599609375, -3.68359375, -3.47119140625, -3.2587890625, -3.04638671875, -2.833984375, -2.62158203125, -2.4091796875, -2.19677734375, -1.984375, -1.77197265625, -1.5595703125, -1.34716796875, -1.134765625, -0.92236328125, -0.7099609375, -0.49755859375, -0.28515625, -0.07275390625, 0.1396484375, 0.35205078125, 0.564453125, 0.77685546875, 0.9892578125, 1.20166015625, 1.4140625, 1.62646484375, 1.8388671875, 2.05126953125, 2.263671875, 2.47607421875, 2.6884765625, 2.90087890625, 3.11328125, 3.32568359375, 3.5380859375, 3.75048828125, 3.962890625, 4.17529296875, 4.3876953125, 4.60009765625, 4.8125, 5.02490234375, 5.2373046875, 5.44970703125, 5.662109375, 5.87451171875, 6.0869140625, 6.29931640625, 6.51171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 7.0, 9.0, 8.0, 21.0, 21.0, 17.0, 29.0, 37.0, 35.0, 43.0, 59.0, 67.0, 103.0, 113.0, 97.0, 53.0, 59.0, 53.0, 34.0, 18.0, 19.0, 16.0, 21.0, 9.0, 9.0, 7.0, 6.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010747909545898438, -0.0010450109839439392, -0.0010152310132980347, -0.0009854510426521301, -0.0009556710720062256, -0.000925891101360321, -0.0008961111307144165, -0.000866331160068512, -0.0008365511894226074, -0.0008067712187767029, -0.0007769912481307983, -0.0007472112774848938, -0.0007174313068389893, -0.0006876513361930847, -0.0006578713655471802, -0.0006280913949012756, -0.0005983114242553711, -0.0005685314536094666, -0.000538751482963562, -0.0005089715123176575, -0.00047919154167175293, -0.0004494115710258484, -0.00041963160037994385, -0.0003898516297340393, -0.00036007165908813477, -0.0003302916884422302, -0.0003005117177963257, -0.00027073174715042114, -0.0002409517765045166, -0.00021117180585861206, -0.00018139183521270752, -0.00015161186456680298, -0.00012183189392089844, -9.20519232749939e-05, -6.227195262908936e-05, -3.2491981983184814e-05, -2.7120113372802734e-06, 2.7067959308624268e-05, 5.684792995452881e-05, 8.662790060043335e-05, 0.00011640787124633789, 0.00014618784189224243, 0.00017596781253814697, 0.00020574778318405151, 0.00023552775382995605, 0.0002653077244758606, 0.00029508769512176514, 0.0003248676657676697, 0.0003546476364135742, 0.00038442760705947876, 0.0004142075777053833, 0.00044398754835128784, 0.0004737675189971924, 0.0005035474896430969, 0.0005333274602890015, 0.000563107430934906, 0.0005928874015808105, 0.0006226673722267151, 0.0006524473428726196, 0.0006822273135185242, 0.0007120072841644287, 0.0007417872548103333, 0.0007715672254562378, 0.0008013471961021423, 0.0008311271667480469]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 4.0, 6.0, 13.0, 26.0, 29.0, 49.0, 71.0, 119.0, 192.0, 302.0, 561.0, 1027.0, 2013.0, 4686.0, 12528.0, 40451.0, 166037.0, 482774.0, 249531.0, 59736.0, 17007.0, 6057.0, 2518.0, 1211.0, 626.0, 353.0, 218.0, 126.0, 89.0, 50.0, 42.0, 26.0, 22.0, 11.0, 6.0, 13.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.5234375, -6.310546875, -6.09765625, -5.884765625, -5.671875, -5.458984375, -5.24609375, -5.033203125, -4.8203125, -4.607421875, -4.39453125, -4.181640625, -3.96875, -3.755859375, -3.54296875, -3.330078125, -3.1171875, -2.904296875, -2.69140625, -2.478515625, -2.265625, -2.052734375, -1.83984375, -1.626953125, -1.4140625, -1.201171875, -0.98828125, -0.775390625, -0.5625, -0.349609375, -0.13671875, 0.076171875, 0.2890625, 0.501953125, 0.71484375, 0.927734375, 1.140625, 1.353515625, 1.56640625, 1.779296875, 1.9921875, 2.205078125, 2.41796875, 2.630859375, 2.84375, 3.056640625, 3.26953125, 3.482421875, 3.6953125, 3.908203125, 4.12109375, 4.333984375, 4.546875, 4.759765625, 4.97265625, 5.185546875, 5.3984375, 5.611328125, 5.82421875, 6.037109375, 6.25, 6.462890625, 6.67578125, 6.888671875, 7.1015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 6.0, 12.0, 23.0, 18.0, 31.0, 37.0, 40.0, 71.0, 77.0, 92.0, 102.0, 92.0, 99.0, 60.0, 53.0, 40.0, 25.0, 27.0, 22.0, 18.0, 10.0, 7.0, 13.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96484375, -4.80419921875, -4.6435546875, -4.48291015625, -4.322265625, -4.16162109375, -4.0009765625, -3.84033203125, -3.6796875, -3.51904296875, -3.3583984375, -3.19775390625, -3.037109375, -2.87646484375, -2.7158203125, -2.55517578125, -2.39453125, -2.23388671875, -2.0732421875, -1.91259765625, -1.751953125, -1.59130859375, -1.4306640625, -1.27001953125, -1.109375, -0.94873046875, -0.7880859375, -0.62744140625, -0.466796875, -0.30615234375, -0.1455078125, 0.01513671875, 0.17578125, 0.33642578125, 0.4970703125, 0.65771484375, 0.818359375, 0.97900390625, 1.1396484375, 1.30029296875, 1.4609375, 1.62158203125, 1.7822265625, 1.94287109375, 2.103515625, 2.26416015625, 2.4248046875, 2.58544921875, 2.74609375, 2.90673828125, 3.0673828125, 3.22802734375, 3.388671875, 3.54931640625, 3.7099609375, 3.87060546875, 4.03125, 4.19189453125, 4.3525390625, 4.51318359375, 4.673828125, 4.83447265625, 4.9951171875, 5.15576171875, 5.31640625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 18.0, 19.0, 31.0, 46.0, 87.0, 114.0, 130.0, 142.0, 132.0, 89.0, 66.0, 36.0, 23.0, 13.0, 13.0, 10.0, 3.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.98638916015625, -96.97216796875, -93.95795440673828, -90.94373321533203, -87.92951965332031, -84.91529846191406, -81.90108489990234, -78.8868637084961, -75.87265014648438, -72.85842895507812, -69.8442153930664, -66.82999420166016, -63.81578063964844, -60.80156326293945, -57.78734588623047, -54.77312469482422, -51.758907318115234, -48.74468994140625, -45.730472564697266, -42.71625518798828, -39.7020378112793, -36.68782043457031, -33.67359924316406, -30.65938377380371, -27.645166397094727, -24.630949020385742, -21.616731643676758, -18.60251235961914, -15.588295936584473, -12.574078559875488, -9.559860229492188, -6.545642852783203, -3.5314254760742188, -0.5172078609466553, 2.497009754180908, 5.511227607727051, 8.525444984436035, 11.53966236114502, 14.55388069152832, 17.568098068237305, 20.58231544494629, 23.596532821655273, 26.610750198364258, 29.624969482421875, 32.63918685913086, 35.653404235839844, 38.66762161254883, 41.68183898925781, 44.6960563659668, 47.71027374267578, 50.724491119384766, 53.73870849609375, 56.752925872802734, 59.76714324951172, 62.78136444091797, 65.79557800292969, 68.80979919433594, 71.82402038574219, 74.8382339477539, 77.85245513916016, 80.86666870117188, 83.88088989257812, 86.89510345458984, 89.9093246459961, 92.92353820800781]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 12.0, 6.0, 7.0, 10.0, 14.0, 9.0, 7.0, 14.0, 16.0, 25.0, 29.0, 25.0, 30.0, 35.0, 35.0, 32.0, 46.0, 41.0, 43.0, 37.0, 49.0, 47.0, 40.0, 46.0, 37.0, 29.0, 33.0, 24.0, 29.0, 25.0, 24.0, 20.0, 23.0, 24.0, 13.0, 12.0, 9.0, 9.0, 3.0, 10.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-58.398258209228516, -56.64570617675781, -54.89315414428711, -53.140602111816406, -51.3880500793457, -49.635498046875, -47.88294219970703, -46.130393981933594, -44.377838134765625, -42.62528610229492, -40.87273406982422, -39.120182037353516, -37.36763000488281, -35.61507797241211, -33.862525939941406, -32.10997009277344, -30.357421875, -28.604869842529297, -26.852317810058594, -25.09976577758789, -23.347213745117188, -21.594661712646484, -19.84210777282715, -18.089555740356445, -16.337003707885742, -14.584451675415039, -12.831899642944336, -11.079346656799316, -9.326794624328613, -7.57424259185791, -5.821689605712891, -4.0691375732421875, -2.3165817260742188, -0.5640294551849365, 1.1885228157043457, 2.941075325012207, 4.69362735748291, 6.446179389953613, 8.198732376098633, 9.951284408569336, 11.703836441040039, 13.456388473510742, 15.208940505981445, 16.96149444580078, 18.714046478271484, 20.466598510742188, 22.21915054321289, 23.971702575683594, 25.724254608154297, 27.476806640625, 29.229358673095703, 30.981910705566406, 32.73446273803711, 34.48701477050781, 36.23957061767578, 37.99211883544922, 39.74467468261719, 41.49722671508789, 43.249778747558594, 45.0023307800293, 46.7548828125, 48.5074348449707, 50.259986877441406, 52.012542724609375, 53.76509094238281]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 7.0, 9.0, 9.0, 12.0, 18.0, 14.0, 28.0, 29.0, 49.0, 34.0, 89.0, 95.0, 165.0, 227.0, 469.0, 945.0, 2102.0, 5526.0, 19738.0, 141334.0, 3878077.0, 117674.0, 18334.0, 5323.0, 1987.0, 901.0, 470.0, 243.0, 118.0, 97.0, 48.0, 28.0, 16.0, 21.0, 16.0, 9.0, 4.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.96875, -32.983154296875, -31.99755859375, -31.011962890625, -30.0263671875, -29.040771484375, -28.05517578125, -27.069580078125, -26.083984375, -25.098388671875, -24.11279296875, -23.127197265625, -22.1416015625, -21.156005859375, -20.17041015625, -19.184814453125, -18.19921875, -17.213623046875, -16.22802734375, -15.242431640625, -14.2568359375, -13.271240234375, -12.28564453125, -11.300048828125, -10.314453125, -9.328857421875, -8.34326171875, -7.357666015625, -6.3720703125, -5.386474609375, -4.40087890625, -3.415283203125, -2.4296875, -1.444091796875, -0.45849609375, 0.527099609375, 1.5126953125, 2.498291015625, 3.48388671875, 4.469482421875, 5.455078125, 6.440673828125, 7.42626953125, 8.411865234375, 9.3974609375, 10.383056640625, 11.36865234375, 12.354248046875, 13.33984375, 14.325439453125, 15.31103515625, 16.296630859375, 17.2822265625, 18.267822265625, 19.25341796875, 20.239013671875, 21.224609375, 22.210205078125, 23.19580078125, 24.181396484375, 25.1669921875, 26.152587890625, 27.13818359375, 28.123779296875, 29.109375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 10.0, 13.0, 23.0, 35.0, 39.0, 62.0, 71.0, 84.0, 88.0, 88.0, 101.0, 93.0, 68.0, 66.0, 45.0, 40.0, 32.0, 12.0, 14.0, 4.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.392303466796875, -5.24945068359375, -5.106597900390625, -4.9637451171875, -4.820892333984375, -4.67803955078125, -4.535186767578125, -4.392333984375, -4.249481201171875, -4.10662841796875, -3.963775634765625, -3.8209228515625, -3.678070068359375, -3.53521728515625, -3.392364501953125, -3.24951171875, -3.106658935546875, -2.96380615234375, -2.820953369140625, -2.6781005859375, -2.535247802734375, -2.39239501953125, -2.249542236328125, -2.106689453125, -1.963836669921875, -1.82098388671875, -1.678131103515625, -1.5352783203125, -1.392425537109375, -1.24957275390625, -1.106719970703125, -0.9638671875, -0.821014404296875, -0.67816162109375, -0.535308837890625, -0.3924560546875, -0.249603271484375, -0.10675048828125, 0.036102294921875, 0.178955078125, 0.321807861328125, 0.46466064453125, 0.607513427734375, 0.7503662109375, 0.893218994140625, 1.03607177734375, 1.178924560546875, 1.32177734375, 1.464630126953125, 1.60748291015625, 1.750335693359375, 1.8931884765625, 2.036041259765625, 2.17889404296875, 2.321746826171875, 2.464599609375, 2.607452392578125, 2.75030517578125, 2.893157958984375, 3.0360107421875, 3.178863525390625, 3.32171630859375, 3.464569091796875, 3.607421875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 8.0, 7.0, 11.0, 12.0, 20.0, 31.0, 33.0, 49.0, 84.0, 99.0, 159.0, 215.0, 368.0, 515.0, 858.0, 1302.0, 2307.0, 4306.0, 8595.0, 18249.0, 42779.0, 121659.0, 567417.0, 2998219.0, 288455.0, 80205.0, 30315.0, 13245.0, 6280.0, 3279.0, 1874.0, 1122.0, 686.0, 485.0, 342.0, 227.0, 124.0, 99.0, 78.0, 47.0, 33.0, 18.0, 25.0, 14.0, 7.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.9453125, -11.57568359375, -11.2060546875, -10.83642578125, -10.466796875, -10.09716796875, -9.7275390625, -9.35791015625, -8.98828125, -8.61865234375, -8.2490234375, -7.87939453125, -7.509765625, -7.14013671875, -6.7705078125, -6.40087890625, -6.03125, -5.66162109375, -5.2919921875, -4.92236328125, -4.552734375, -4.18310546875, -3.8134765625, -3.44384765625, -3.07421875, -2.70458984375, -2.3349609375, -1.96533203125, -1.595703125, -1.22607421875, -0.8564453125, -0.48681640625, -0.1171875, 0.25244140625, 0.6220703125, 0.99169921875, 1.361328125, 1.73095703125, 2.1005859375, 2.47021484375, 2.83984375, 3.20947265625, 3.5791015625, 3.94873046875, 4.318359375, 4.68798828125, 5.0576171875, 5.42724609375, 5.796875, 6.16650390625, 6.5361328125, 6.90576171875, 7.275390625, 7.64501953125, 8.0146484375, 8.38427734375, 8.75390625, 9.12353515625, 9.4931640625, 9.86279296875, 10.232421875, 10.60205078125, 10.9716796875, 11.34130859375, 11.7109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 1.0, 8.0, 7.0, 12.0, 10.0, 27.0, 28.0, 46.0, 55.0, 101.0, 144.0, 329.0, 1576.0, 1005.0, 300.0, 174.0, 83.0, 52.0, 35.0, 18.0, 14.0, 17.0, 7.0, 2.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.0234375, -5.8603515625, -5.697265625, -5.5341796875, -5.37109375, -5.2080078125, -5.044921875, -4.8818359375, -4.71875, -4.5556640625, -4.392578125, -4.2294921875, -4.06640625, -3.9033203125, -3.740234375, -3.5771484375, -3.4140625, -3.2509765625, -3.087890625, -2.9248046875, -2.76171875, -2.5986328125, -2.435546875, -2.2724609375, -2.109375, -1.9462890625, -1.783203125, -1.6201171875, -1.45703125, -1.2939453125, -1.130859375, -0.9677734375, -0.8046875, -0.6416015625, -0.478515625, -0.3154296875, -0.15234375, 0.0107421875, 0.173828125, 0.3369140625, 0.5, 0.6630859375, 0.826171875, 0.9892578125, 1.15234375, 1.3154296875, 1.478515625, 1.6416015625, 1.8046875, 1.9677734375, 2.130859375, 2.2939453125, 2.45703125, 2.6201171875, 2.783203125, 2.9462890625, 3.109375, 3.2724609375, 3.435546875, 3.5986328125, 3.76171875, 3.9248046875, 4.087890625, 4.2509765625, 4.4140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 17.0, 27.0, 53.0, 83.0, 118.0, 154.0, 166.0, 135.0, 95.0, 68.0, 34.0, 22.0, 17.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.474124908447266, -25.295629501342773, -24.11713409423828, -22.938640594482422, -21.76014518737793, -20.581649780273438, -19.403156280517578, -18.224660873413086, -17.046165466308594, -15.867670059204102, -14.689175605773926, -13.51068115234375, -12.332185745239258, -11.153690338134766, -9.97519588470459, -8.796701431274414, -7.618206024169922, -6.439711093902588, -5.261216163635254, -4.08272123336792, -2.904226303100586, -1.725731372833252, -0.547236442565918, 0.6312580108642578, 1.80975341796875, 2.988248348236084, 4.166743278503418, 5.345238208770752, 6.523733139038086, 7.70222806930542, 8.880722999572754, 10.05921745300293, 11.237716674804688, 12.41621208190918, 13.594706535339355, 14.773200988769531, 15.951696395874023, 17.130191802978516, 18.308685302734375, 19.487180709838867, 20.66567611694336, 21.84417152404785, 23.022666931152344, 24.201160430908203, 25.379655838012695, 26.558151245117188, 27.736644744873047, 28.91514015197754, 30.09363555908203, 31.272130966186523, 32.450626373291016, 33.629119873046875, 34.8076171875, 35.98611068725586, 37.16460418701172, 38.343101501464844, 39.5215950012207, 40.70008850097656, 41.87858581542969, 43.05707931518555, 44.235572814941406, 45.41407012939453, 46.59256362915039, 47.77105712890625, 48.949554443359375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 1.0, 6.0, 5.0, 4.0, 7.0, 8.0, 7.0, 7.0, 15.0, 17.0, 10.0, 18.0, 14.0, 26.0, 26.0, 27.0, 38.0, 33.0, 37.0, 31.0, 31.0, 40.0, 43.0, 43.0, 50.0, 48.0, 42.0, 49.0, 46.0, 40.0, 31.0, 36.0, 22.0, 19.0, 21.0, 17.0, 10.0, 18.0, 13.0, 7.0, 9.0, 6.0, 8.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-14.415864944458008, -13.992840766906738, -13.569816589355469, -13.1467924118042, -12.72376823425293, -12.300745010375977, -11.877720832824707, -11.454696655273438, -11.031672477722168, -10.608648300170898, -10.185624122619629, -9.76259994506836, -9.339576721191406, -8.91655158996582, -8.493528366088867, -8.070504188537598, -7.647480010986328, -7.224455833435059, -6.801431655883789, -6.378407955169678, -5.955383777618408, -5.532359600067139, -5.109335899353027, -4.686311721801758, -4.263287544250488, -3.8402633666992188, -3.4172394275665283, -2.994215488433838, -2.5711913108825684, -2.148167133331299, -1.7251431941986084, -1.302119255065918, -0.8790960311889648, -0.45607197284698486, -0.03304791450500488, 0.3899761438369751, 0.8130002021789551, 1.2360243797302246, 1.659048318862915, 2.0820722579956055, 2.505096435546875, 2.9281206130981445, 3.351144552230835, 3.7741684913635254, 4.197192668914795, 4.6202168464660645, 5.043240547180176, 5.466264724731445, 5.889288902282715, 6.312313079833984, 6.735337257385254, 7.158360958099365, 7.581385135650635, 8.004409790039062, 8.427433013916016, 8.850457191467285, 9.273481369018555, 9.696505546569824, 10.119529724121094, 10.542553901672363, 10.965578079223633, 11.388601303100586, 11.811625480651855, 12.234649658203125, 12.657673835754395]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 5.0, 1.0, 0.0, 6.0, 6.0, 13.0, 20.0, 20.0, 29.0, 33.0, 39.0, 44.0, 81.0, 109.0, 160.0, 218.0, 328.0, 537.0, 885.0, 1647.0, 3784.0, 10131.0, 32787.0, 121029.0, 404362.0, 336716.0, 94353.0, 25899.0, 8162.0, 3268.0, 1552.0, 823.0, 476.0, 345.0, 204.0, 145.0, 99.0, 60.0, 43.0, 45.0, 25.0, 13.0, 19.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.4873046875, -15.896484375, -15.3056640625, -14.71484375, -14.1240234375, -13.533203125, -12.9423828125, -12.3515625, -11.7607421875, -11.169921875, -10.5791015625, -9.98828125, -9.3974609375, -8.806640625, -8.2158203125, -7.625, -7.0341796875, -6.443359375, -5.8525390625, -5.26171875, -4.6708984375, -4.080078125, -3.4892578125, -2.8984375, -2.3076171875, -1.716796875, -1.1259765625, -0.53515625, 0.0556640625, 0.646484375, 1.2373046875, 1.828125, 2.4189453125, 3.009765625, 3.6005859375, 4.19140625, 4.7822265625, 5.373046875, 5.9638671875, 6.5546875, 7.1455078125, 7.736328125, 8.3271484375, 8.91796875, 9.5087890625, 10.099609375, 10.6904296875, 11.28125, 11.8720703125, 12.462890625, 13.0537109375, 13.64453125, 14.2353515625, 14.826171875, 15.4169921875, 16.0078125, 16.5986328125, 17.189453125, 17.7802734375, 18.37109375, 18.9619140625, 19.552734375, 20.1435546875, 20.734375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 11.0, 15.0, 22.0, 42.0, 59.0, 60.0, 99.0, 94.0, 104.0, 95.0, 105.0, 90.0, 56.0, 41.0, 37.0, 31.0, 14.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.97882080078125, -5.8209228515625, -5.66302490234375, -5.505126953125, -5.34722900390625, -5.1893310546875, -5.03143310546875, -4.87353515625, -4.71563720703125, -4.5577392578125, -4.39984130859375, -4.241943359375, -4.08404541015625, -3.9261474609375, -3.76824951171875, -3.6103515625, -3.45245361328125, -3.2945556640625, -3.13665771484375, -2.978759765625, -2.82086181640625, -2.6629638671875, -2.50506591796875, -2.34716796875, -2.18927001953125, -2.0313720703125, -1.87347412109375, -1.715576171875, -1.55767822265625, -1.3997802734375, -1.24188232421875, -1.083984375, -0.92608642578125, -0.7681884765625, -0.61029052734375, -0.452392578125, -0.29449462890625, -0.1365966796875, 0.02130126953125, 0.17919921875, 0.33709716796875, 0.4949951171875, 0.65289306640625, 0.810791015625, 0.96868896484375, 1.1265869140625, 1.28448486328125, 1.4423828125, 1.60028076171875, 1.7581787109375, 1.91607666015625, 2.073974609375, 2.23187255859375, 2.3897705078125, 2.54766845703125, 2.70556640625, 2.86346435546875, 3.0213623046875, 3.17926025390625, 3.337158203125, 3.49505615234375, 3.6529541015625, 3.81085205078125, 3.96875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 10.0, 14.0, 28.0, 35.0, 42.0, 46.0, 92.0, 97.0, 128.0, 196.0, 295.0, 404.0, 644.0, 938.0, 1625.0, 2637.0, 4689.0, 9090.0, 18631.0, 41945.0, 97222.0, 212453.0, 308669.0, 190477.0, 85668.0, 37119.0, 16499.0, 8104.0, 4151.0, 2390.0, 1378.0, 913.0, 610.0, 395.0, 272.0, 175.0, 127.0, 98.0, 65.0, 48.0, 38.0, 26.0, 21.0, 13.0, 11.0, 7.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0], "bins": [-9.8203125, -9.5264892578125, -9.232666015625, -8.9388427734375, -8.64501953125, -8.3511962890625, -8.057373046875, -7.7635498046875, -7.4697265625, -7.1759033203125, -6.882080078125, -6.5882568359375, -6.29443359375, -6.0006103515625, -5.706787109375, -5.4129638671875, -5.119140625, -4.8253173828125, -4.531494140625, -4.2376708984375, -3.94384765625, -3.6500244140625, -3.356201171875, -3.0623779296875, -2.7685546875, -2.4747314453125, -2.180908203125, -1.8870849609375, -1.59326171875, -1.2994384765625, -1.005615234375, -0.7117919921875, -0.41796875, -0.1241455078125, 0.169677734375, 0.4635009765625, 0.75732421875, 1.0511474609375, 1.344970703125, 1.6387939453125, 1.9326171875, 2.2264404296875, 2.520263671875, 2.8140869140625, 3.10791015625, 3.4017333984375, 3.695556640625, 3.9893798828125, 4.283203125, 4.5770263671875, 4.870849609375, 5.1646728515625, 5.45849609375, 5.7523193359375, 6.046142578125, 6.3399658203125, 6.6337890625, 6.9276123046875, 7.221435546875, 7.5152587890625, 7.80908203125, 8.1029052734375, 8.396728515625, 8.6905517578125, 8.984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 10.0, 12.0, 14.0, 17.0, 28.0, 15.0, 30.0, 34.0, 37.0, 40.0, 46.0, 56.0, 43.0, 62.0, 56.0, 46.0, 60.0, 64.0, 44.0, 48.0, 34.0, 33.0, 32.0, 25.0, 23.0, 18.0, 15.0, 6.0, 5.0, 5.0, 8.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-15.0078125, -14.62060546875, -14.2333984375, -13.84619140625, -13.458984375, -13.07177734375, -12.6845703125, -12.29736328125, -11.91015625, -11.52294921875, -11.1357421875, -10.74853515625, -10.361328125, -9.97412109375, -9.5869140625, -9.19970703125, -8.8125, -8.42529296875, -8.0380859375, -7.65087890625, -7.263671875, -6.87646484375, -6.4892578125, -6.10205078125, -5.71484375, -5.32763671875, -4.9404296875, -4.55322265625, -4.166015625, -3.77880859375, -3.3916015625, -3.00439453125, -2.6171875, -2.22998046875, -1.8427734375, -1.45556640625, -1.068359375, -0.68115234375, -0.2939453125, 0.09326171875, 0.48046875, 0.86767578125, 1.2548828125, 1.64208984375, 2.029296875, 2.41650390625, 2.8037109375, 3.19091796875, 3.578125, 3.96533203125, 4.3525390625, 4.73974609375, 5.126953125, 5.51416015625, 5.9013671875, 6.28857421875, 6.67578125, 7.06298828125, 7.4501953125, 7.83740234375, 8.224609375, 8.61181640625, 8.9990234375, 9.38623046875, 9.7734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 13.0, 5.0, 15.0, 16.0, 32.0, 53.0, 73.0, 120.0, 143.0, 313.0, 501.0, 1126.0, 2449.0, 6264.0, 19621.0, 68553.0, 272727.0, 453402.0, 161578.0, 41295.0, 12325.0, 4342.0, 1736.0, 826.0, 395.0, 226.0, 165.0, 75.0, 44.0, 36.0, 35.0, 19.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.57281494140625, -4.4112548828125, -4.24969482421875, -4.088134765625, -3.92657470703125, -3.7650146484375, -3.60345458984375, -3.44189453125, -3.28033447265625, -3.1187744140625, -2.95721435546875, -2.795654296875, -2.63409423828125, -2.4725341796875, -2.31097412109375, -2.1494140625, -1.98785400390625, -1.8262939453125, -1.66473388671875, -1.503173828125, -1.34161376953125, -1.1800537109375, -1.01849365234375, -0.85693359375, -0.69537353515625, -0.5338134765625, -0.37225341796875, -0.210693359375, -0.04913330078125, 0.1124267578125, 0.27398681640625, 0.435546875, 0.59710693359375, 0.7586669921875, 0.92022705078125, 1.081787109375, 1.24334716796875, 1.4049072265625, 1.56646728515625, 1.72802734375, 1.88958740234375, 2.0511474609375, 2.21270751953125, 2.374267578125, 2.53582763671875, 2.6973876953125, 2.85894775390625, 3.0205078125, 3.18206787109375, 3.3436279296875, 3.50518798828125, 3.666748046875, 3.82830810546875, 3.9898681640625, 4.15142822265625, 4.31298828125, 4.47454833984375, 4.6361083984375, 4.79766845703125, 4.959228515625, 5.12078857421875, 5.2823486328125, 5.44390869140625, 5.60546875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 5.0, 2.0, 15.0, 11.0, 8.0, 19.0, 20.0, 26.0, 44.0, 46.0, 52.0, 90.0, 121.0, 118.0, 115.0, 50.0, 51.0, 38.0, 36.0, 32.0, 20.0, 14.0, 7.0, 13.0, 4.0, 3.0, 5.0, 10.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.001033782958984375, -0.0010043010115623474, -0.0009748190641403198, -0.0009453371167182922, -0.0009158551692962646, -0.0008863732218742371, -0.0008568912744522095, -0.0008274093270301819, -0.0007979273796081543, -0.0007684454321861267, -0.0007389634847640991, -0.0007094815373420715, -0.0006799995899200439, -0.0006505176424980164, -0.0006210356950759888, -0.0005915537476539612, -0.0005620718002319336, -0.000532589852809906, -0.0005031079053878784, -0.00047362595796585083, -0.00044414401054382324, -0.00041466206312179565, -0.00038518011569976807, -0.0003556981682777405, -0.0003262162208557129, -0.0002967342734336853, -0.0002672523260116577, -0.00023777037858963013, -0.00020828843116760254, -0.00017880648374557495, -0.00014932453632354736, -0.00011984258890151978, -9.036064147949219e-05, -6.08786940574646e-05, -3.139674663543701e-05, -1.914799213409424e-06, 2.7567148208618164e-05, 5.704909563064575e-05, 8.653104305267334e-05, 0.00011601299047470093, 0.00014549493789672852, 0.0001749768853187561, 0.0002044588327407837, 0.00023394078016281128, 0.00026342272758483887, 0.00029290467500686646, 0.00032238662242889404, 0.00035186856985092163, 0.0003813505172729492, 0.0004108324646949768, 0.0004403144121170044, 0.000469796359539032, 0.0004992783069610596, 0.0005287602543830872, 0.0005582422018051147, 0.0005877241492271423, 0.0006172060966491699, 0.0006466880440711975, 0.0006761699914932251, 0.0007056519389152527, 0.0007351338863372803, 0.0007646158337593079, 0.0007940977811813354, 0.000823579728603363, 0.0008530616760253906]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 5.0, 5.0, 15.0, 17.0, 30.0, 34.0, 81.0, 99.0, 176.0, 285.0, 519.0, 979.0, 1924.0, 4634.0, 13255.0, 46353.0, 207464.0, 523924.0, 185949.0, 41957.0, 12266.0, 4367.0, 2007.0, 923.0, 495.0, 273.0, 199.0, 115.0, 72.0, 46.0, 22.0, 18.0, 10.0, 8.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.586181640625, -5.40283203125, -5.219482421875, -5.0361328125, -4.852783203125, -4.66943359375, -4.486083984375, -4.302734375, -4.119384765625, -3.93603515625, -3.752685546875, -3.5693359375, -3.385986328125, -3.20263671875, -3.019287109375, -2.8359375, -2.652587890625, -2.46923828125, -2.285888671875, -2.1025390625, -1.919189453125, -1.73583984375, -1.552490234375, -1.369140625, -1.185791015625, -1.00244140625, -0.819091796875, -0.6357421875, -0.452392578125, -0.26904296875, -0.085693359375, 0.09765625, 0.281005859375, 0.46435546875, 0.647705078125, 0.8310546875, 1.014404296875, 1.19775390625, 1.381103515625, 1.564453125, 1.747802734375, 1.93115234375, 2.114501953125, 2.2978515625, 2.481201171875, 2.66455078125, 2.847900390625, 3.03125, 3.214599609375, 3.39794921875, 3.581298828125, 3.7646484375, 3.947998046875, 4.13134765625, 4.314697265625, 4.498046875, 4.681396484375, 4.86474609375, 5.048095703125, 5.2314453125, 5.414794921875, 5.59814453125, 5.781494140625, 5.96484375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 6.0, 17.0, 27.0, 40.0, 56.0, 46.0, 76.0, 93.0, 101.0, 112.0, 80.0, 89.0, 62.0, 43.0, 31.0, 22.0, 25.0, 18.0, 10.0, 8.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.101318359375, -4.95654296875, -4.811767578125, -4.6669921875, -4.522216796875, -4.37744140625, -4.232666015625, -4.087890625, -3.943115234375, -3.79833984375, -3.653564453125, -3.5087890625, -3.364013671875, -3.21923828125, -3.074462890625, -2.9296875, -2.784912109375, -2.64013671875, -2.495361328125, -2.3505859375, -2.205810546875, -2.06103515625, -1.916259765625, -1.771484375, -1.626708984375, -1.48193359375, -1.337158203125, -1.1923828125, -1.047607421875, -0.90283203125, -0.758056640625, -0.61328125, -0.468505859375, -0.32373046875, -0.178955078125, -0.0341796875, 0.110595703125, 0.25537109375, 0.400146484375, 0.544921875, 0.689697265625, 0.83447265625, 0.979248046875, 1.1240234375, 1.268798828125, 1.41357421875, 1.558349609375, 1.703125, 1.847900390625, 1.99267578125, 2.137451171875, 2.2822265625, 2.427001953125, 2.57177734375, 2.716552734375, 2.861328125, 3.006103515625, 3.15087890625, 3.295654296875, 3.4404296875, 3.585205078125, 3.72998046875, 3.874755859375, 4.01953125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 12.0, 10.0, 10.0, 20.0, 22.0, 30.0, 33.0, 68.0, 68.0, 91.0, 76.0, 96.0, 67.0, 88.0, 75.0, 60.0, 47.0, 31.0, 23.0, 14.0, 6.0, 8.0, 15.0, 6.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-72.63877868652344, -70.62785339355469, -68.61692810058594, -66.60600280761719, -64.59507751464844, -62.58415222167969, -60.57322692871094, -58.56230163574219, -56.55137634277344, -54.54045104980469, -52.52952575683594, -50.51860046386719, -48.50767517089844, -46.49674987792969, -44.48582458496094, -42.47489929199219, -40.46397399902344, -38.45304870605469, -36.44212341308594, -34.43119812011719, -32.42027282714844, -30.409347534179688, -28.398422241210938, -26.387496948242188, -24.376571655273438, -22.365646362304688, -20.354721069335938, -18.343795776367188, -16.332870483398438, -14.321945190429688, -12.311019897460938, -10.300094604492188, -8.289169311523438, -6.2782440185546875, -4.2673187255859375, -2.2563934326171875, -0.2454681396484375, 1.7654571533203125, 3.7763824462890625, 5.7873077392578125, 7.7982330322265625, 9.809158325195312, 11.820083618164062, 13.831008911132812, 15.841934204101562, 17.852859497070312, 19.863784790039062, 21.874710083007812, 23.885635375976562, 25.896560668945312, 27.907485961914062, 29.918411254882812, 31.929336547851562, 33.94026184082031, 35.95118713378906, 37.96211242675781, 39.97303771972656, 41.98396301269531, 43.99488830566406, 46.00581359863281, 48.01673889160156, 50.02766418457031, 52.03858947753906, 54.04951477050781, 56.06044006347656]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 9.0, 7.0, 7.0, 11.0, 15.0, 14.0, 9.0, 26.0, 33.0, 29.0, 34.0, 31.0, 52.0, 60.0, 53.0, 63.0, 48.0, 52.0, 54.0, 50.0, 49.0, 44.0, 35.0, 39.0, 26.0, 26.0, 30.0, 15.0, 22.0, 8.0, 12.0, 7.0, 8.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.80264282226562, -68.59203338623047, -66.38142395019531, -64.17082214355469, -61.960208892822266, -59.749603271484375, -57.53899383544922, -55.32838439941406, -53.117774963378906, -50.90716552734375, -48.69655990600586, -46.4859504699707, -44.27534103393555, -42.064735412597656, -39.8541259765625, -37.643516540527344, -35.43291091918945, -33.2223014831543, -31.011693954467773, -28.80108642578125, -26.590476989746094, -24.37986946105957, -22.169261932373047, -19.95865249633789, -17.748044967651367, -15.537436485290527, -13.326828002929688, -11.116220474243164, -8.905611991882324, -6.695003509521484, -4.484395980834961, -2.273787498474121, -0.06317901611328125, 2.1474292278289795, 4.35803747177124, 6.568645477294922, 8.779253959655762, 10.989862442016602, 13.200469970703125, 15.411078453063965, 17.621686935424805, 19.832294464111328, 22.042903900146484, 24.253511428833008, 26.46411895751953, 28.674728393554688, 30.88533592224121, 33.095943450927734, 35.30655288696289, 37.51716232299805, 39.72776794433594, 41.938377380371094, 44.14898681640625, 46.359596252441406, 48.5702018737793, 50.78081130981445, 52.991416931152344, 55.2020263671875, 57.41263198852539, 59.62324142456055, 61.8338508605957, 64.0444564819336, 66.25506591796875, 68.4656753540039, 70.67628479003906]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 6.0, 4.0, 11.0, 15.0, 6.0, 22.0, 16.0, 27.0, 29.0, 38.0, 52.0, 58.0, 95.0, 118.0, 169.0, 195.0, 332.0, 547.0, 879.0, 1800.0, 3693.0, 8795.0, 25340.0, 107153.0, 3130368.0, 806389.0, 74670.0, 19887.0, 7083.0, 3144.0, 1407.0, 804.0, 396.0, 228.0, 143.0, 111.0, 64.0, 49.0, 27.0, 28.0, 25.0, 11.0, 18.0, 11.0, 6.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-25.6875, -24.9716796875, -24.255859375, -23.5400390625, -22.82421875, -22.1083984375, -21.392578125, -20.6767578125, -19.9609375, -19.2451171875, -18.529296875, -17.8134765625, -17.09765625, -16.3818359375, -15.666015625, -14.9501953125, -14.234375, -13.5185546875, -12.802734375, -12.0869140625, -11.37109375, -10.6552734375, -9.939453125, -9.2236328125, -8.5078125, -7.7919921875, -7.076171875, -6.3603515625, -5.64453125, -4.9287109375, -4.212890625, -3.4970703125, -2.78125, -2.0654296875, -1.349609375, -0.6337890625, 0.08203125, 0.7978515625, 1.513671875, 2.2294921875, 2.9453125, 3.6611328125, 4.376953125, 5.0927734375, 5.80859375, 6.5244140625, 7.240234375, 7.9560546875, 8.671875, 9.3876953125, 10.103515625, 10.8193359375, 11.53515625, 12.2509765625, 12.966796875, 13.6826171875, 14.3984375, 15.1142578125, 15.830078125, 16.5458984375, 17.26171875, 17.9775390625, 18.693359375, 19.4091796875, 20.125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 8.0, 9.0, 14.0, 24.0, 36.0, 59.0, 66.0, 92.0, 73.0, 87.0, 108.0, 95.0, 83.0, 60.0, 58.0, 44.0, 28.0, 21.0, 17.0, 5.0, 1.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.87890625, -5.732452392578125, -5.58599853515625, -5.439544677734375, -5.2930908203125, -5.146636962890625, -5.00018310546875, -4.853729248046875, -4.707275390625, -4.560821533203125, -4.41436767578125, -4.267913818359375, -4.1214599609375, -3.975006103515625, -3.82855224609375, -3.682098388671875, -3.53564453125, -3.389190673828125, -3.24273681640625, -3.096282958984375, -2.9498291015625, -2.803375244140625, -2.65692138671875, -2.510467529296875, -2.364013671875, -2.217559814453125, -2.07110595703125, -1.924652099609375, -1.7781982421875, -1.631744384765625, -1.48529052734375, -1.338836669921875, -1.1923828125, -1.045928955078125, -0.89947509765625, -0.753021240234375, -0.6065673828125, -0.460113525390625, -0.31365966796875, -0.167205810546875, -0.020751953125, 0.125701904296875, 0.27215576171875, 0.418609619140625, 0.5650634765625, 0.711517333984375, 0.85797119140625, 1.004425048828125, 1.15087890625, 1.297332763671875, 1.44378662109375, 1.590240478515625, 1.7366943359375, 1.883148193359375, 2.02960205078125, 2.176055908203125, 2.322509765625, 2.468963623046875, 2.61541748046875, 2.761871337890625, 2.9083251953125, 3.054779052734375, 3.20123291015625, 3.347686767578125, 3.494140625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 10.0, 8.0, 10.0, 19.0, 18.0, 24.0, 38.0, 57.0, 87.0, 103.0, 143.0, 205.0, 291.0, 445.0, 639.0, 946.0, 1613.0, 2855.0, 5705.0, 15919.0, 64204.0, 498362.0, 3310708.0, 232421.0, 39124.0, 10741.0, 4136.0, 2079.0, 1183.0, 713.0, 443.0, 301.0, 209.0, 166.0, 116.0, 69.0, 50.0, 39.0, 12.0, 23.0, 14.0, 11.0, 9.0, 8.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.132080078125, -17.51416015625, -16.896240234375, -16.2783203125, -15.660400390625, -15.04248046875, -14.424560546875, -13.806640625, -13.188720703125, -12.57080078125, -11.952880859375, -11.3349609375, -10.717041015625, -10.09912109375, -9.481201171875, -8.86328125, -8.245361328125, -7.62744140625, -7.009521484375, -6.3916015625, -5.773681640625, -5.15576171875, -4.537841796875, -3.919921875, -3.302001953125, -2.68408203125, -2.066162109375, -1.4482421875, -0.830322265625, -0.21240234375, 0.405517578125, 1.0234375, 1.641357421875, 2.25927734375, 2.877197265625, 3.4951171875, 4.113037109375, 4.73095703125, 5.348876953125, 5.966796875, 6.584716796875, 7.20263671875, 7.820556640625, 8.4384765625, 9.056396484375, 9.67431640625, 10.292236328125, 10.91015625, 11.528076171875, 12.14599609375, 12.763916015625, 13.3818359375, 13.999755859375, 14.61767578125, 15.235595703125, 15.853515625, 16.471435546875, 17.08935546875, 17.707275390625, 18.3251953125, 18.943115234375, 19.56103515625, 20.178955078125, 20.796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 4.0, 7.0, 12.0, 14.0, 31.0, 37.0, 84.0, 116.0, 244.0, 583.0, 1827.0, 563.0, 240.0, 113.0, 84.0, 38.0, 23.0, 16.0, 7.0, 10.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0625, -11.75714111328125, -11.4517822265625, -11.14642333984375, -10.841064453125, -10.53570556640625, -10.2303466796875, -9.92498779296875, -9.61962890625, -9.31427001953125, -9.0089111328125, -8.70355224609375, -8.398193359375, -8.09283447265625, -7.7874755859375, -7.48211669921875, -7.1767578125, -6.87139892578125, -6.5660400390625, -6.26068115234375, -5.955322265625, -5.64996337890625, -5.3446044921875, -5.03924560546875, -4.73388671875, -4.42852783203125, -4.1231689453125, -3.81781005859375, -3.512451171875, -3.20709228515625, -2.9017333984375, -2.59637451171875, -2.291015625, -1.98565673828125, -1.6802978515625, -1.37493896484375, -1.069580078125, -0.76422119140625, -0.4588623046875, -0.15350341796875, 0.15185546875, 0.45721435546875, 0.7625732421875, 1.06793212890625, 1.373291015625, 1.67864990234375, 1.9840087890625, 2.28936767578125, 2.5947265625, 2.90008544921875, 3.2054443359375, 3.51080322265625, 3.816162109375, 4.12152099609375, 4.4268798828125, 4.73223876953125, 5.03759765625, 5.34295654296875, 5.6483154296875, 5.95367431640625, 6.259033203125, 6.56439208984375, 6.8697509765625, 7.17510986328125, 7.48046875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 11.0, 9.0, 14.0, 23.0, 23.0, 59.0, 92.0, 115.0, 124.0, 134.0, 133.0, 93.0, 62.0, 36.0, 41.0, 10.0, 7.0, 8.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.80229568481445, -44.135501861572266, -42.46870803833008, -40.80191421508789, -39.1351203918457, -37.468326568603516, -35.80153274536133, -34.13473892211914, -32.46794509887695, -30.801151275634766, -29.134357452392578, -27.46756362915039, -25.800769805908203, -24.133975982666016, -22.467182159423828, -20.80038833618164, -19.133594512939453, -17.466800689697266, -15.800006866455078, -14.13321304321289, -12.466419219970703, -10.799625396728516, -9.132831573486328, -7.466037750244141, -5.799243927001953, -4.132450103759766, -2.465656280517578, -0.7988624572753906, 0.8679313659667969, 2.5347251892089844, 4.201519012451172, 5.868312835693359, 7.5351104736328125, 9.201904296875, 10.868698120117188, 12.535491943359375, 14.202285766601562, 15.86907958984375, 17.535873413085938, 19.202667236328125, 20.869461059570312, 22.5362548828125, 24.203048706054688, 25.869842529296875, 27.536636352539062, 29.20343017578125, 30.870223999023438, 32.537017822265625, 34.20381164550781, 35.87060546875, 37.53739929199219, 39.204193115234375, 40.87098693847656, 42.53778076171875, 44.20457458496094, 45.871368408203125, 47.53816223144531, 49.2049560546875, 50.87174987792969, 52.538543701171875, 54.20533752441406, 55.87213134765625, 57.53892517089844, 59.205718994140625, 60.87251281738281]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 8.0, 6.0, 17.0, 15.0, 14.0, 23.0, 31.0, 47.0, 55.0, 50.0, 63.0, 73.0, 71.0, 90.0, 85.0, 67.0, 63.0, 50.0, 47.0, 36.0, 27.0, 12.0, 18.0, 10.0, 3.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.92376708984375, -39.594913482666016, -38.266056060791016, -36.93720245361328, -35.60834884643555, -34.27949523925781, -32.95063781738281, -31.621784210205078, -30.29292869567871, -28.964073181152344, -27.63521957397461, -26.306364059448242, -24.977508544921875, -23.64865493774414, -22.319799423217773, -20.990943908691406, -19.662090301513672, -18.333234786987305, -17.00438117980957, -15.675525665283203, -14.346671104431152, -13.017816543579102, -11.688961029052734, -10.360106468200684, -9.031251907348633, -7.702397346496582, -6.373542308807373, -5.044687271118164, -3.7158327102661133, -2.3869781494140625, -1.0581231117248535, 0.27073192596435547, 1.5995864868164062, 2.928441286087036, 4.257296085357666, 5.586151123046875, 6.915005683898926, 8.243860244750977, 9.572715759277344, 10.901570320129395, 12.230424880981445, 13.559279441833496, 14.888134002685547, 16.216989517211914, 17.54584503173828, 18.874698638916016, 20.203554153442383, 21.53240966796875, 22.861263275146484, 24.19011878967285, 25.518972396850586, 26.847827911376953, 28.176681518554688, 29.505537033081055, 30.834392547607422, 32.163246154785156, 33.492103576660156, 34.82095718383789, 36.14981460571289, 37.478668212890625, 38.80752182006836, 40.136375427246094, 41.465232849121094, 42.79408645629883, 44.12294006347656]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 10.0, 10.0, 25.0, 36.0, 67.0, 97.0, 196.0, 340.0, 614.0, 1364.0, 4278.0, 31146.0, 485849.0, 486478.0, 30943.0, 4304.0, 1374.0, 638.0, 311.0, 214.0, 105.0, 62.0, 30.0, 30.0, 17.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-44.5625, -43.169921875, -41.77734375, -40.384765625, -38.9921875, -37.599609375, -36.20703125, -34.814453125, -33.421875, -32.029296875, -30.63671875, -29.244140625, -27.8515625, -26.458984375, -25.06640625, -23.673828125, -22.28125, -20.888671875, -19.49609375, -18.103515625, -16.7109375, -15.318359375, -13.92578125, -12.533203125, -11.140625, -9.748046875, -8.35546875, -6.962890625, -5.5703125, -4.177734375, -2.78515625, -1.392578125, 0.0, 1.392578125, 2.78515625, 4.177734375, 5.5703125, 6.962890625, 8.35546875, 9.748046875, 11.140625, 12.533203125, 13.92578125, 15.318359375, 16.7109375, 18.103515625, 19.49609375, 20.888671875, 22.28125, 23.673828125, 25.06640625, 26.458984375, 27.8515625, 29.244140625, 30.63671875, 32.029296875, 33.421875, 34.814453125, 36.20703125, 37.599609375, 38.9921875, 40.384765625, 41.77734375, 43.169921875, 44.5625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 7.0, 4.0, 6.0, 25.0, 38.0, 62.0, 81.0, 101.0, 101.0, 121.0, 117.0, 103.0, 75.0, 58.0, 44.0, 26.0, 17.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-7.44140625, -7.25787353515625, -7.0743408203125, -6.89080810546875, -6.707275390625, -6.52374267578125, -6.3402099609375, -6.15667724609375, -5.97314453125, -5.78961181640625, -5.6060791015625, -5.42254638671875, -5.239013671875, -5.05548095703125, -4.8719482421875, -4.68841552734375, -4.5048828125, -4.32135009765625, -4.1378173828125, -3.95428466796875, -3.770751953125, -3.58721923828125, -3.4036865234375, -3.22015380859375, -3.03662109375, -2.85308837890625, -2.6695556640625, -2.48602294921875, -2.302490234375, -2.11895751953125, -1.9354248046875, -1.75189208984375, -1.568359375, -1.38482666015625, -1.2012939453125, -1.01776123046875, -0.834228515625, -0.65069580078125, -0.4671630859375, -0.28363037109375, -0.10009765625, 0.08343505859375, 0.2669677734375, 0.45050048828125, 0.634033203125, 0.81756591796875, 1.0010986328125, 1.18463134765625, 1.3681640625, 1.55169677734375, 1.7352294921875, 1.91876220703125, 2.102294921875, 2.28582763671875, 2.4693603515625, 2.65289306640625, 2.83642578125, 3.01995849609375, 3.2034912109375, 3.38702392578125, 3.570556640625, 3.75408935546875, 3.9376220703125, 4.12115478515625, 4.3046875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 8.0, 6.0, 11.0, 26.0, 21.0, 29.0, 55.0, 65.0, 85.0, 157.0, 195.0, 319.0, 472.0, 709.0, 1209.0, 1927.0, 3280.0, 5762.0, 10473.0, 19632.0, 38146.0, 75359.0, 149239.0, 275539.0, 228385.0, 114982.0, 58195.0, 29249.0, 15266.0, 7982.0, 4628.0, 2589.0, 1597.0, 1043.0, 608.0, 401.0, 272.0, 198.0, 121.0, 95.0, 63.0, 44.0, 28.0, 22.0, 23.0, 17.0, 9.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.65625, -7.42291259765625, -7.1895751953125, -6.95623779296875, -6.722900390625, -6.48956298828125, -6.2562255859375, -6.02288818359375, -5.78955078125, -5.55621337890625, -5.3228759765625, -5.08953857421875, -4.856201171875, -4.62286376953125, -4.3895263671875, -4.15618896484375, -3.9228515625, -3.68951416015625, -3.4561767578125, -3.22283935546875, -2.989501953125, -2.75616455078125, -2.5228271484375, -2.28948974609375, -2.05615234375, -1.82281494140625, -1.5894775390625, -1.35614013671875, -1.122802734375, -0.88946533203125, -0.6561279296875, -0.42279052734375, -0.189453125, 0.04388427734375, 0.2772216796875, 0.51055908203125, 0.743896484375, 0.97723388671875, 1.2105712890625, 1.44390869140625, 1.67724609375, 1.91058349609375, 2.1439208984375, 2.37725830078125, 2.610595703125, 2.84393310546875, 3.0772705078125, 3.31060791015625, 3.5439453125, 3.77728271484375, 4.0106201171875, 4.24395751953125, 4.477294921875, 4.71063232421875, 4.9439697265625, 5.17730712890625, 5.41064453125, 5.64398193359375, 5.8773193359375, 6.11065673828125, 6.343994140625, 6.57733154296875, 6.8106689453125, 7.04400634765625, 7.27734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 2.0, 11.0, 8.0, 11.0, 26.0, 11.0, 13.0, 17.0, 19.0, 17.0, 34.0, 30.0, 37.0, 37.0, 49.0, 36.0, 39.0, 48.0, 39.0, 52.0, 47.0, 52.0, 38.0, 42.0, 36.0, 30.0, 27.0, 28.0, 22.0, 27.0, 21.0, 17.0, 15.0, 16.0, 10.0, 11.0, 6.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.640625, -10.3343505859375, -10.028076171875, -9.7218017578125, -9.41552734375, -9.1092529296875, -8.802978515625, -8.4967041015625, -8.1904296875, -7.8841552734375, -7.577880859375, -7.2716064453125, -6.96533203125, -6.6590576171875, -6.352783203125, -6.0465087890625, -5.740234375, -5.4339599609375, -5.127685546875, -4.8214111328125, -4.51513671875, -4.2088623046875, -3.902587890625, -3.5963134765625, -3.2900390625, -2.9837646484375, -2.677490234375, -2.3712158203125, -2.06494140625, -1.7586669921875, -1.452392578125, -1.1461181640625, -0.83984375, -0.5335693359375, -0.227294921875, 0.0789794921875, 0.38525390625, 0.6915283203125, 0.997802734375, 1.3040771484375, 1.6103515625, 1.9166259765625, 2.222900390625, 2.5291748046875, 2.83544921875, 3.1417236328125, 3.447998046875, 3.7542724609375, 4.060546875, 4.3668212890625, 4.673095703125, 4.9793701171875, 5.28564453125, 5.5919189453125, 5.898193359375, 6.2044677734375, 6.5107421875, 6.8170166015625, 7.123291015625, 7.4295654296875, 7.73583984375, 8.0421142578125, 8.348388671875, 8.6546630859375, 8.9609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 7.0, 9.0, 12.0, 23.0, 48.0, 79.0, 141.0, 335.0, 803.0, 2007.0, 6058.0, 24656.0, 151166.0, 594689.0, 222343.0, 34141.0, 7785.0, 2496.0, 943.0, 390.0, 181.0, 101.0, 44.0, 24.0, 21.0, 12.0, 13.0, 5.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8359375, -6.5882568359375, -6.340576171875, -6.0928955078125, -5.84521484375, -5.5975341796875, -5.349853515625, -5.1021728515625, -4.8544921875, -4.6068115234375, -4.359130859375, -4.1114501953125, -3.86376953125, -3.6160888671875, -3.368408203125, -3.1207275390625, -2.873046875, -2.6253662109375, -2.377685546875, -2.1300048828125, -1.88232421875, -1.6346435546875, -1.386962890625, -1.1392822265625, -0.8916015625, -0.6439208984375, -0.396240234375, -0.1485595703125, 0.09912109375, 0.3468017578125, 0.594482421875, 0.8421630859375, 1.08984375, 1.3375244140625, 1.585205078125, 1.8328857421875, 2.08056640625, 2.3282470703125, 2.575927734375, 2.8236083984375, 3.0712890625, 3.3189697265625, 3.566650390625, 3.8143310546875, 4.06201171875, 4.3096923828125, 4.557373046875, 4.8050537109375, 5.052734375, 5.3004150390625, 5.548095703125, 5.7957763671875, 6.04345703125, 6.2911376953125, 6.538818359375, 6.7864990234375, 7.0341796875, 7.2818603515625, 7.529541015625, 7.7772216796875, 8.02490234375, 8.2725830078125, 8.520263671875, 8.7679443359375, 9.015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 6.0, 3.0, 5.0, 6.0, 6.0, 7.0, 4.0, 9.0, 16.0, 8.0, 12.0, 11.0, 34.0, 32.0, 42.0, 46.0, 79.0, 83.0, 117.0, 108.0, 68.0, 71.0, 38.0, 33.0, 32.0, 20.0, 21.0, 12.0, 12.0, 8.0, 11.0, 3.0, 10.0, 6.0, 3.0, 7.0, 0.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007419586181640625, -0.0007184520363807678, -0.0006949454545974731, -0.0006714388728141785, -0.0006479322910308838, -0.0006244257092475891, -0.0006009191274642944, -0.0005774125456809998, -0.0005539059638977051, -0.0005303993821144104, -0.0005068928003311157, -0.00048338621854782104, -0.00045987963676452637, -0.0004363730549812317, -0.000412866473197937, -0.00038935989141464233, -0.00036585330963134766, -0.000342346727848053, -0.0003188401460647583, -0.0002953335642814636, -0.00027182698249816895, -0.00024832040071487427, -0.0002248138189315796, -0.0002013072371482849, -0.00017780065536499023, -0.00015429407358169556, -0.00013078749179840088, -0.0001072809100151062, -8.377432823181152e-05, -6.0267746448516846e-05, -3.676116466522217e-05, -1.325458288192749e-05, 1.0251998901367188e-05, 3.3758580684661865e-05, 5.726516246795654e-05, 8.077174425125122e-05, 0.0001042783260345459, 0.00012778490781784058, 0.00015129148960113525, 0.00017479807138442993, 0.0001983046531677246, 0.0002218112349510193, 0.00024531781673431396, 0.00026882439851760864, 0.0002923309803009033, 0.000315837562084198, 0.0003393441438674927, 0.00036285072565078735, 0.00038635730743408203, 0.0004098638892173767, 0.0004333704710006714, 0.00045687705278396606, 0.00048038363456726074, 0.0005038902163505554, 0.0005273967981338501, 0.0005509033799171448, 0.0005744099617004395, 0.0005979165434837341, 0.0006214231252670288, 0.0006449297070503235, 0.0006684362888336182, 0.0006919428706169128, 0.0007154494524002075, 0.0007389560341835022, 0.0007624626159667969]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 9.0, 19.0, 21.0, 40.0, 52.0, 81.0, 135.0, 235.0, 415.0, 829.0, 1986.0, 4742.0, 14601.0, 56731.0, 307096.0, 511809.0, 112260.0, 24795.0, 7440.0, 2709.0, 1178.0, 593.0, 316.0, 162.0, 112.0, 60.0, 32.0, 28.0, 23.0, 10.0, 10.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3046875, -6.0811767578125, -5.857666015625, -5.6341552734375, -5.41064453125, -5.1871337890625, -4.963623046875, -4.7401123046875, -4.5166015625, -4.2930908203125, -4.069580078125, -3.8460693359375, -3.62255859375, -3.3990478515625, -3.175537109375, -2.9520263671875, -2.728515625, -2.5050048828125, -2.281494140625, -2.0579833984375, -1.83447265625, -1.6109619140625, -1.387451171875, -1.1639404296875, -0.9404296875, -0.7169189453125, -0.493408203125, -0.2698974609375, -0.04638671875, 0.1771240234375, 0.400634765625, 0.6241455078125, 0.84765625, 1.0711669921875, 1.294677734375, 1.5181884765625, 1.74169921875, 1.9652099609375, 2.188720703125, 2.4122314453125, 2.6357421875, 2.8592529296875, 3.082763671875, 3.3062744140625, 3.52978515625, 3.7532958984375, 3.976806640625, 4.2003173828125, 4.423828125, 4.6473388671875, 4.870849609375, 5.0943603515625, 5.31787109375, 5.5413818359375, 5.764892578125, 5.9884033203125, 6.2119140625, 6.4354248046875, 6.658935546875, 6.8824462890625, 7.10595703125, 7.3294677734375, 7.552978515625, 7.7764892578125, 8.0]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 13.0, 19.0, 25.0, 36.0, 62.0, 81.0, 115.0, 171.0, 141.0, 98.0, 70.0, 55.0, 38.0, 19.0, 13.0, 10.0, 8.0, 2.0, 1.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.7264404296875, -7.491943359375, -7.2574462890625, -7.02294921875, -6.7884521484375, -6.553955078125, -6.3194580078125, -6.0849609375, -5.8504638671875, -5.615966796875, -5.3814697265625, -5.14697265625, -4.9124755859375, -4.677978515625, -4.4434814453125, -4.208984375, -3.9744873046875, -3.739990234375, -3.5054931640625, -3.27099609375, -3.0364990234375, -2.802001953125, -2.5675048828125, -2.3330078125, -2.0985107421875, -1.864013671875, -1.6295166015625, -1.39501953125, -1.1605224609375, -0.926025390625, -0.6915283203125, -0.45703125, -0.2225341796875, 0.011962890625, 0.2464599609375, 0.48095703125, 0.7154541015625, 0.949951171875, 1.1844482421875, 1.4189453125, 1.6534423828125, 1.887939453125, 2.1224365234375, 2.35693359375, 2.5914306640625, 2.825927734375, 3.0604248046875, 3.294921875, 3.5294189453125, 3.763916015625, 3.9984130859375, 4.23291015625, 4.4674072265625, 4.701904296875, 4.9364013671875, 5.1708984375, 5.4053955078125, 5.639892578125, 5.8743896484375, 6.10888671875, 6.3433837890625, 6.577880859375, 6.8123779296875, 7.046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 20.0, 11.0, 9.0, 28.0, 34.0, 69.0, 90.0, 150.0, 132.0, 150.0, 113.0, 77.0, 50.0, 26.0, 12.0, 15.0, 7.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.12527465820312, -73.14993286132812, -70.1745834350586, -67.1992416381836, -64.22389221191406, -61.24855041503906, -58.2732048034668, -55.29785919189453, -52.32251739501953, -49.347171783447266, -46.371826171875, -43.396484375, -40.421138763427734, -37.44579315185547, -34.4704475402832, -31.49510383605957, -28.519756317138672, -25.544410705566406, -22.569067001342773, -19.593721389770508, -16.618377685546875, -13.64303207397461, -10.667686462402344, -7.692342758178711, -4.716997146606445, -1.741652250289917, 1.2336926460266113, 4.209037780761719, 7.184382438659668, 10.159727096557617, 13.135072708129883, 16.110416412353516, 19.08576202392578, 22.061107635498047, 25.03645133972168, 28.011796951293945, 30.987140655517578, 33.962486267089844, 36.93783187866211, 39.913177490234375, 42.888519287109375, 45.86386489868164, 48.839210510253906, 51.814552307128906, 54.78989791870117, 57.76524353027344, 60.7405891418457, 63.71593475341797, 66.6912841796875, 69.6666259765625, 72.64197540283203, 75.61731719970703, 78.59266662597656, 81.56800842285156, 84.54335021972656, 87.5186996459961, 90.4940414428711, 93.4693832397461, 96.44473266601562, 99.42007446289062, 102.39542388916016, 105.37076568603516, 108.34611511230469, 111.32145690917969, 114.29679870605469]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 5.0, 16.0, 7.0, 16.0, 18.0, 15.0, 18.0, 31.0, 30.0, 37.0, 49.0, 54.0, 56.0, 52.0, 44.0, 61.0, 53.0, 53.0, 50.0, 55.0, 37.0, 44.0, 40.0, 34.0, 29.0, 22.0, 18.0, 7.0, 13.0, 10.0, 5.0, 8.0, 3.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.87411499023438, -78.74411010742188, -76.61410522460938, -74.48409271240234, -72.35408782958984, -70.22408294677734, -68.09407043457031, -65.96406555175781, -63.83406066894531, -61.70405578613281, -59.57404708862305, -57.44403839111328, -55.31403350830078, -53.18402862548828, -51.054019927978516, -48.92401123046875, -46.79400634765625, -44.66400146484375, -42.533992767333984, -40.40398406982422, -38.27397918701172, -36.14397430419922, -34.01396560668945, -31.88395881652832, -29.753952026367188, -27.623945236206055, -25.493938446044922, -23.36393165588379, -21.233924865722656, -19.103918075561523, -16.97391128540039, -14.843904495239258, -12.71390151977539, -10.583894729614258, -8.453887939453125, -6.323881149291992, -4.193874359130859, -2.0638675689697266, 0.06613922119140625, 2.196146011352539, 4.326152801513672, 6.456159591674805, 8.586166381835938, 10.71617317199707, 12.846179962158203, 14.976186752319336, 17.10619354248047, 19.2362003326416, 21.366207122802734, 23.496213912963867, 25.626220703125, 27.756227493286133, 29.886234283447266, 32.01624298095703, 34.14624786376953, 36.27625274658203, 38.4062614440918, 40.53627014160156, 42.66627502441406, 44.79627990722656, 46.92628860473633, 49.056297302246094, 51.186302185058594, 53.316307067871094, 55.44631576538086]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 9.0, 14.0, 11.0, 9.0, 24.0, 23.0, 38.0, 49.0, 85.0, 150.0, 285.0, 472.0, 1001.0, 2829.0, 11402.0, 143468.0, 3965297.0, 58640.0, 7079.0, 1831.0, 703.0, 345.0, 187.0, 101.0, 59.0, 42.0, 33.0, 19.0, 18.0, 13.0, 9.0, 4.0, 3.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.0, -34.63427734375, -33.2685546875, -31.90283203125, -30.537109375, -29.17138671875, -27.8056640625, -26.43994140625, -25.07421875, -23.70849609375, -22.3427734375, -20.97705078125, -19.611328125, -18.24560546875, -16.8798828125, -15.51416015625, -14.1484375, -12.78271484375, -11.4169921875, -10.05126953125, -8.685546875, -7.31982421875, -5.9541015625, -4.58837890625, -3.22265625, -1.85693359375, -0.4912109375, 0.87451171875, 2.240234375, 3.60595703125, 4.9716796875, 6.33740234375, 7.703125, 9.06884765625, 10.4345703125, 11.80029296875, 13.166015625, 14.53173828125, 15.8974609375, 17.26318359375, 18.62890625, 19.99462890625, 21.3603515625, 22.72607421875, 24.091796875, 25.45751953125, 26.8232421875, 28.18896484375, 29.5546875, 30.92041015625, 32.2861328125, 33.65185546875, 35.017578125, 36.38330078125, 37.7490234375, 39.11474609375, 40.48046875, 41.84619140625, 43.2119140625, 44.57763671875, 45.943359375, 47.30908203125, 48.6748046875, 50.04052734375, 51.40625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 11.0, 8.0, 25.0, 35.0, 61.0, 61.0, 89.0, 108.0, 115.0, 103.0, 96.0, 70.0, 68.0, 53.0, 32.0, 28.0, 10.0, 11.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.859375, -6.68304443359375, -6.5067138671875, -6.33038330078125, -6.154052734375, -5.97772216796875, -5.8013916015625, -5.62506103515625, -5.44873046875, -5.27239990234375, -5.0960693359375, -4.91973876953125, -4.743408203125, -4.56707763671875, -4.3907470703125, -4.21441650390625, -4.0380859375, -3.86175537109375, -3.6854248046875, -3.50909423828125, -3.332763671875, -3.15643310546875, -2.9801025390625, -2.80377197265625, -2.62744140625, -2.45111083984375, -2.2747802734375, -2.09844970703125, -1.922119140625, -1.74578857421875, -1.5694580078125, -1.39312744140625, -1.216796875, -1.04046630859375, -0.8641357421875, -0.68780517578125, -0.511474609375, -0.33514404296875, -0.1588134765625, 0.01751708984375, 0.19384765625, 0.37017822265625, 0.5465087890625, 0.72283935546875, 0.899169921875, 1.07550048828125, 1.2518310546875, 1.42816162109375, 1.6044921875, 1.78082275390625, 1.9571533203125, 2.13348388671875, 2.309814453125, 2.48614501953125, 2.6624755859375, 2.83880615234375, 3.01513671875, 3.19146728515625, 3.3677978515625, 3.54412841796875, 3.720458984375, 3.89678955078125, 4.0731201171875, 4.24945068359375, 4.42578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 5.0, 12.0, 12.0, 19.0, 17.0, 44.0, 36.0, 69.0, 88.0, 114.0, 165.0, 257.0, 423.0, 792.0, 1692.0, 4177.0, 11729.0, 40454.0, 203461.0, 3290072.0, 534963.0, 74410.0, 19708.0, 6288.0, 2512.0, 1170.0, 560.0, 328.0, 186.0, 128.0, 92.0, 73.0, 46.0, 39.0, 29.0, 25.0, 20.0, 10.0, 9.0, 11.0, 4.0, 10.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.3203125, -14.8214111328125, -14.322509765625, -13.8236083984375, -13.32470703125, -12.8258056640625, -12.326904296875, -11.8280029296875, -11.3291015625, -10.8302001953125, -10.331298828125, -9.8323974609375, -9.33349609375, -8.8345947265625, -8.335693359375, -7.8367919921875, -7.337890625, -6.8389892578125, -6.340087890625, -5.8411865234375, -5.34228515625, -4.8433837890625, -4.344482421875, -3.8455810546875, -3.3466796875, -2.8477783203125, -2.348876953125, -1.8499755859375, -1.35107421875, -0.8521728515625, -0.353271484375, 0.1456298828125, 0.64453125, 1.1434326171875, 1.642333984375, 2.1412353515625, 2.64013671875, 3.1390380859375, 3.637939453125, 4.1368408203125, 4.6357421875, 5.1346435546875, 5.633544921875, 6.1324462890625, 6.63134765625, 7.1302490234375, 7.629150390625, 8.1280517578125, 8.626953125, 9.1258544921875, 9.624755859375, 10.1236572265625, 10.62255859375, 11.1214599609375, 11.620361328125, 12.1192626953125, 12.6181640625, 13.1170654296875, 13.615966796875, 14.1148681640625, 14.61376953125, 15.1126708984375, 15.611572265625, 16.1104736328125, 16.609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 16.0, 16.0, 26.0, 34.0, 58.0, 111.0, 255.0, 889.0, 1883.0, 373.0, 178.0, 80.0, 54.0, 36.0, 19.0, 14.0, 14.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.88671875, -5.6328125, -5.37890625, -5.125, -4.87109375, -4.6171875, -4.36328125, -4.109375, -3.85546875, -3.6015625, -3.34765625, -3.09375, -2.83984375, -2.5859375, -2.33203125, -2.078125, -1.82421875, -1.5703125, -1.31640625, -1.0625, -0.80859375, -0.5546875, -0.30078125, -0.046875, 0.20703125, 0.4609375, 0.71484375, 0.96875, 1.22265625, 1.4765625, 1.73046875, 1.984375, 2.23828125, 2.4921875, 2.74609375, 3.0, 3.25390625, 3.5078125, 3.76171875, 4.015625, 4.26953125, 4.5234375, 4.77734375, 5.03125, 5.28515625, 5.5390625, 5.79296875, 6.046875, 6.30078125, 6.5546875, 6.80859375, 7.0625, 7.31640625, 7.5703125, 7.82421875, 8.078125, 8.33203125, 8.5859375, 8.83984375, 9.09375, 9.34765625, 9.6015625, 9.85546875, 10.109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 11.0, 10.0, 12.0, 18.0, 11.0, 30.0, 37.0, 37.0, 52.0, 50.0, 58.0, 72.0, 67.0, 74.0, 54.0, 73.0, 68.0, 47.0, 58.0, 35.0, 25.0, 16.0, 9.0, 15.0, 12.0, 9.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.55939483642578, -16.908037185668945, -16.25667953491211, -15.60532283782959, -14.95396614074707, -14.302608489990234, -13.651250839233398, -12.999893188476562, -12.348536491394043, -11.697178840637207, -11.045822143554688, -10.394464492797852, -9.743106842041016, -9.091750144958496, -8.44039249420166, -7.789035320281982, -7.137678146362305, -6.486320972442627, -5.834963798522949, -5.183606147766113, -4.5322489738464355, -3.880891799926758, -3.229534387588501, -2.578176975250244, -1.9268198013305664, -1.2754625082015991, -0.6241052150726318, 0.02725207805633545, 0.6786093711853027, 1.3299665451049805, 1.9813239574432373, 2.632681369781494, 3.284036636352539, 3.935393810272217, 4.5867509841918945, 5.2381086349487305, 5.889465808868408, 6.540822982788086, 7.192180633544922, 7.8435378074646, 8.494894981384277, 9.146252632141113, 9.797609329223633, 10.448966979980469, 11.100324630737305, 11.751681327819824, 12.40303897857666, 13.05439567565918, 13.705753326416016, 14.357110977172852, 15.008467674255371, 15.659825325012207, 16.311182022094727, 16.962539672851562, 17.6138973236084, 18.265254974365234, 18.916610717773438, 19.567968368530273, 20.21932601928711, 20.870681762695312, 21.52203941345215, 22.173397064208984, 22.82475471496582, 23.476112365722656, 24.127470016479492]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 1.0, 2.0, 9.0, 10.0, 14.0, 12.0, 12.0, 21.0, 25.0, 23.0, 23.0, 28.0, 39.0, 28.0, 30.0, 32.0, 41.0, 48.0, 34.0, 42.0, 41.0, 30.0, 46.0, 36.0, 48.0, 30.0, 29.0, 36.0, 25.0, 31.0, 27.0, 25.0, 26.0, 21.0, 17.0, 6.0, 12.0, 13.0, 3.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.76184844970703, -19.1953067779541, -18.628767013549805, -18.062225341796875, -17.495685577392578, -16.92914390563965, -16.36260414123535, -15.796062469482422, -15.229521751403809, -14.662981033325195, -14.096440315246582, -13.529899597167969, -12.963357925415039, -12.396818161010742, -11.830276489257812, -11.2637357711792, -10.697195053100586, -10.130654335021973, -9.56411361694336, -8.997572898864746, -8.431032180786133, -7.864490985870361, -7.29794979095459, -6.731409072875977, -6.164868354797363, -5.59832763671875, -5.031786918640137, -4.465245723724365, -3.898705005645752, -3.3321642875671387, -2.7656233310699463, -2.199082374572754, -1.6325416564941406, -1.0660008192062378, -0.49945998191833496, 0.06708085536956787, 0.6336216926574707, 1.200162410736084, 1.7667033672332764, 2.3332443237304688, 2.899785041809082, 3.4663257598876953, 4.032866477966309, 4.59940767288208, 5.165948390960693, 5.732489109039307, 6.299030303955078, 6.865571022033691, 7.432111740112305, 7.998652458190918, 8.565193176269531, 9.131733894348145, 9.698274612426758, 10.264816284179688, 10.8313570022583, 11.397897720336914, 11.964438438415527, 12.53097915649414, 13.097519874572754, 13.664060592651367, 14.230602264404297, 14.797142028808594, 15.363683700561523, 15.930224418640137, 16.49676513671875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 10.0, 12.0, 16.0, 28.0, 35.0, 67.0, 88.0, 167.0, 251.0, 434.0, 755.0, 1644.0, 4318.0, 17767.0, 113939.0, 604409.0, 256069.0, 36400.0, 7288.0, 2363.0, 1037.0, 536.0, 335.0, 206.0, 132.0, 75.0, 39.0, 35.0, 20.0, 25.0, 15.0, 9.0, 10.0, 5.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5625, -28.630126953125, -27.69775390625, -26.765380859375, -25.8330078125, -24.900634765625, -23.96826171875, -23.035888671875, -22.103515625, -21.171142578125, -20.23876953125, -19.306396484375, -18.3740234375, -17.441650390625, -16.50927734375, -15.576904296875, -14.64453125, -13.712158203125, -12.77978515625, -11.847412109375, -10.9150390625, -9.982666015625, -9.05029296875, -8.117919921875, -7.185546875, -6.253173828125, -5.32080078125, -4.388427734375, -3.4560546875, -2.523681640625, -1.59130859375, -0.658935546875, 0.2734375, 1.205810546875, 2.13818359375, 3.070556640625, 4.0029296875, 4.935302734375, 5.86767578125, 6.800048828125, 7.732421875, 8.664794921875, 9.59716796875, 10.529541015625, 11.4619140625, 12.394287109375, 13.32666015625, 14.259033203125, 15.19140625, 16.123779296875, 17.05615234375, 17.988525390625, 18.9208984375, 19.853271484375, 20.78564453125, 21.718017578125, 22.650390625, 23.582763671875, 24.51513671875, 25.447509765625, 26.3798828125, 27.312255859375, 28.24462890625, 29.177001953125, 30.109375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 10.0, 20.0, 27.0, 46.0, 55.0, 87.0, 88.0, 116.0, 121.0, 105.0, 85.0, 67.0, 48.0, 44.0, 41.0, 16.0, 7.0, 10.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.2421875, -7.0587158203125, -6.875244140625, -6.6917724609375, -6.50830078125, -6.3248291015625, -6.141357421875, -5.9578857421875, -5.7744140625, -5.5909423828125, -5.407470703125, -5.2239990234375, -5.04052734375, -4.8570556640625, -4.673583984375, -4.4901123046875, -4.306640625, -4.1231689453125, -3.939697265625, -3.7562255859375, -3.57275390625, -3.3892822265625, -3.205810546875, -3.0223388671875, -2.8388671875, -2.6553955078125, -2.471923828125, -2.2884521484375, -2.10498046875, -1.9215087890625, -1.738037109375, -1.5545654296875, -1.37109375, -1.1876220703125, -1.004150390625, -0.8206787109375, -0.63720703125, -0.4537353515625, -0.270263671875, -0.0867919921875, 0.0966796875, 0.2801513671875, 0.463623046875, 0.6470947265625, 0.83056640625, 1.0140380859375, 1.197509765625, 1.3809814453125, 1.564453125, 1.7479248046875, 1.931396484375, 2.1148681640625, 2.29833984375, 2.4818115234375, 2.665283203125, 2.8487548828125, 3.0322265625, 3.2156982421875, 3.399169921875, 3.5826416015625, 3.76611328125, 3.9495849609375, 4.133056640625, 4.3165283203125, 4.5]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 4.0, 8.0, 9.0, 16.0, 17.0, 20.0, 25.0, 46.0, 63.0, 80.0, 158.0, 219.0, 305.0, 492.0, 821.0, 1581.0, 3561.0, 8423.0, 23961.0, 74062.0, 235201.0, 431523.0, 179856.0, 56472.0, 18390.0, 6813.0, 2965.0, 1366.0, 719.0, 471.0, 245.0, 196.0, 155.0, 106.0, 73.0, 40.0, 28.0, 17.0, 17.0, 14.0, 12.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0078125, -9.642333984375, -9.27685546875, -8.911376953125, -8.5458984375, -8.180419921875, -7.81494140625, -7.449462890625, -7.083984375, -6.718505859375, -6.35302734375, -5.987548828125, -5.6220703125, -5.256591796875, -4.89111328125, -4.525634765625, -4.16015625, -3.794677734375, -3.42919921875, -3.063720703125, -2.6982421875, -2.332763671875, -1.96728515625, -1.601806640625, -1.236328125, -0.870849609375, -0.50537109375, -0.139892578125, 0.2255859375, 0.591064453125, 0.95654296875, 1.322021484375, 1.6875, 2.052978515625, 2.41845703125, 2.783935546875, 3.1494140625, 3.514892578125, 3.88037109375, 4.245849609375, 4.611328125, 4.976806640625, 5.34228515625, 5.707763671875, 6.0732421875, 6.438720703125, 6.80419921875, 7.169677734375, 7.53515625, 7.900634765625, 8.26611328125, 8.631591796875, 8.9970703125, 9.362548828125, 9.72802734375, 10.093505859375, 10.458984375, 10.824462890625, 11.18994140625, 11.555419921875, 11.9208984375, 12.286376953125, 12.65185546875, 13.017333984375, 13.3828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 4.0, 4.0, 5.0, 9.0, 8.0, 9.0, 14.0, 11.0, 18.0, 13.0, 22.0, 26.0, 19.0, 26.0, 35.0, 28.0, 43.0, 33.0, 47.0, 33.0, 38.0, 38.0, 38.0, 55.0, 47.0, 34.0, 37.0, 49.0, 28.0, 21.0, 34.0, 19.0, 38.0, 25.0, 17.0, 17.0, 13.0, 6.0, 7.0, 6.0, 3.0, 7.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.328125, -8.046630859375, -7.76513671875, -7.483642578125, -7.2021484375, -6.920654296875, -6.63916015625, -6.357666015625, -6.076171875, -5.794677734375, -5.51318359375, -5.231689453125, -4.9501953125, -4.668701171875, -4.38720703125, -4.105712890625, -3.82421875, -3.542724609375, -3.26123046875, -2.979736328125, -2.6982421875, -2.416748046875, -2.13525390625, -1.853759765625, -1.572265625, -1.290771484375, -1.00927734375, -0.727783203125, -0.4462890625, -0.164794921875, 0.11669921875, 0.398193359375, 0.6796875, 0.961181640625, 1.24267578125, 1.524169921875, 1.8056640625, 2.087158203125, 2.36865234375, 2.650146484375, 2.931640625, 3.213134765625, 3.49462890625, 3.776123046875, 4.0576171875, 4.339111328125, 4.62060546875, 4.902099609375, 5.18359375, 5.465087890625, 5.74658203125, 6.028076171875, 6.3095703125, 6.591064453125, 6.87255859375, 7.154052734375, 7.435546875, 7.717041015625, 7.99853515625, 8.280029296875, 8.5615234375, 8.843017578125, 9.12451171875, 9.406005859375, 9.6875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 9.0, 14.0, 24.0, 27.0, 33.0, 48.0, 51.0, 109.0, 136.0, 232.0, 413.0, 653.0, 1170.0, 2139.0, 3902.0, 7873.0, 15936.0, 34167.0, 77488.0, 188471.0, 332053.0, 217077.0, 90452.0, 39111.0, 18147.0, 8698.0, 4435.0, 2412.0, 1370.0, 720.0, 446.0, 270.0, 155.0, 111.0, 57.0, 42.0, 31.0, 15.0, 13.0, 6.0, 10.0, 7.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.18359375, -3.07598876953125, -2.9683837890625, -2.86077880859375, -2.753173828125, -2.64556884765625, -2.5379638671875, -2.43035888671875, -2.32275390625, -2.21514892578125, -2.1075439453125, -1.99993896484375, -1.892333984375, -1.78472900390625, -1.6771240234375, -1.56951904296875, -1.4619140625, -1.35430908203125, -1.2467041015625, -1.13909912109375, -1.031494140625, -0.92388916015625, -0.8162841796875, -0.70867919921875, -0.60107421875, -0.49346923828125, -0.3858642578125, -0.27825927734375, -0.170654296875, -0.06304931640625, 0.0445556640625, 0.15216064453125, 0.259765625, 0.36737060546875, 0.4749755859375, 0.58258056640625, 0.690185546875, 0.79779052734375, 0.9053955078125, 1.01300048828125, 1.12060546875, 1.22821044921875, 1.3358154296875, 1.44342041015625, 1.551025390625, 1.65863037109375, 1.7662353515625, 1.87384033203125, 1.9814453125, 2.08905029296875, 2.1966552734375, 2.30426025390625, 2.411865234375, 2.51947021484375, 2.6270751953125, 2.73468017578125, 2.84228515625, 2.94989013671875, 3.0574951171875, 3.16510009765625, 3.272705078125, 3.38031005859375, 3.4879150390625, 3.59552001953125, 3.703125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 7.0, 8.0, 8.0, 8.0, 8.0, 11.0, 11.0, 15.0, 18.0, 20.0, 23.0, 24.0, 37.0, 58.0, 65.0, 100.0, 119.0, 107.0, 76.0, 45.0, 42.0, 35.0, 23.0, 20.0, 17.0, 21.0, 10.0, 11.0, 17.0, 5.0, 7.0, 5.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008134841918945312, -0.0007884949445724487, -0.0007635056972503662, -0.0007385164499282837, -0.0007135272026062012, -0.0006885379552841187, -0.0006635487079620361, -0.0006385594606399536, -0.0006135702133178711, -0.0005885809659957886, -0.0005635917186737061, -0.0005386024713516235, -0.000513613224029541, -0.0004886239767074585, -0.000463634729385376, -0.00043864548206329346, -0.00041365623474121094, -0.0003886669874191284, -0.0003636777400970459, -0.0003386884927749634, -0.00031369924545288086, -0.00028870999813079834, -0.0002637207508087158, -0.0002387315034866333, -0.00021374225616455078, -0.00018875300884246826, -0.00016376376152038574, -0.00013877451419830322, -0.0001137852668762207, -8.879601955413818e-05, -6.380677223205566e-05, -3.8817524909973145e-05, -1.3828277587890625e-05, 1.1160969734191895e-05, 3.6150217056274414e-05, 6.113946437835693e-05, 8.612871170043945e-05, 0.00011111795902252197, 0.0001361072063446045, 0.000161096453666687, 0.00018608570098876953, 0.00021107494831085205, 0.00023606419563293457, 0.0002610534429550171, 0.0002860426902770996, 0.00031103193759918213, 0.00033602118492126465, 0.00036101043224334717, 0.0003859996795654297, 0.0004109889268875122, 0.0004359781742095947, 0.00046096742153167725, 0.00048595666885375977, 0.0005109459161758423, 0.0005359351634979248, 0.0005609244108200073, 0.0005859136581420898, 0.0006109029054641724, 0.0006358921527862549, 0.0006608814001083374, 0.0006858706474304199, 0.0007108598947525024, 0.000735849142074585, 0.0007608383893966675, 0.00078582763671875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 0.0, 4.0, 15.0, 11.0, 6.0, 22.0, 23.0, 47.0, 70.0, 94.0, 180.0, 244.0, 464.0, 840.0, 1582.0, 3738.0, 8667.0, 25188.0, 88610.0, 348953.0, 409906.0, 110872.0, 30517.0, 10364.0, 4132.0, 1864.0, 903.0, 465.0, 262.0, 177.0, 110.0, 73.0, 40.0, 41.0, 20.0, 12.0, 14.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.671875, -5.51019287109375, -5.3485107421875, -5.18682861328125, -5.025146484375, -4.86346435546875, -4.7017822265625, -4.54010009765625, -4.37841796875, -4.21673583984375, -4.0550537109375, -3.89337158203125, -3.731689453125, -3.57000732421875, -3.4083251953125, -3.24664306640625, -3.0849609375, -2.92327880859375, -2.7615966796875, -2.59991455078125, -2.438232421875, -2.27655029296875, -2.1148681640625, -1.95318603515625, -1.79150390625, -1.62982177734375, -1.4681396484375, -1.30645751953125, -1.144775390625, -0.98309326171875, -0.8214111328125, -0.65972900390625, -0.498046875, -0.33636474609375, -0.1746826171875, -0.01300048828125, 0.148681640625, 0.31036376953125, 0.4720458984375, 0.63372802734375, 0.79541015625, 0.95709228515625, 1.1187744140625, 1.28045654296875, 1.442138671875, 1.60382080078125, 1.7655029296875, 1.92718505859375, 2.0888671875, 2.25054931640625, 2.4122314453125, 2.57391357421875, 2.735595703125, 2.89727783203125, 3.0589599609375, 3.22064208984375, 3.38232421875, 3.54400634765625, 3.7056884765625, 3.86737060546875, 4.029052734375, 4.19073486328125, 4.3524169921875, 4.51409912109375, 4.67578125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 10.0, 13.0, 8.0, 13.0, 12.0, 16.0, 26.0, 36.0, 33.0, 47.0, 63.0, 56.0, 71.0, 65.0, 74.0, 74.0, 83.0, 49.0, 38.0, 53.0, 30.0, 27.0, 16.0, 20.0, 15.0, 8.0, 4.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.40625, -3.30523681640625, -3.2042236328125, -3.10321044921875, -3.002197265625, -2.90118408203125, -2.8001708984375, -2.69915771484375, -2.59814453125, -2.49713134765625, -2.3961181640625, -2.29510498046875, -2.194091796875, -2.09307861328125, -1.9920654296875, -1.89105224609375, -1.7900390625, -1.68902587890625, -1.5880126953125, -1.48699951171875, -1.385986328125, -1.28497314453125, -1.1839599609375, -1.08294677734375, -0.98193359375, -0.88092041015625, -0.7799072265625, -0.67889404296875, -0.577880859375, -0.47686767578125, -0.3758544921875, -0.27484130859375, -0.173828125, -0.07281494140625, 0.0281982421875, 0.12921142578125, 0.230224609375, 0.33123779296875, 0.4322509765625, 0.53326416015625, 0.63427734375, 0.73529052734375, 0.8363037109375, 0.93731689453125, 1.038330078125, 1.13934326171875, 1.2403564453125, 1.34136962890625, 1.4423828125, 1.54339599609375, 1.6444091796875, 1.74542236328125, 1.846435546875, 1.94744873046875, 2.0484619140625, 2.14947509765625, 2.25048828125, 2.35150146484375, 2.4525146484375, 2.55352783203125, 2.654541015625, 2.75555419921875, 2.8565673828125, 2.95758056640625, 3.05859375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 9.0, 20.0, 33.0, 44.0, 71.0, 103.0, 103.0, 111.0, 124.0, 100.0, 90.0, 65.0, 47.0, 16.0, 19.0, 14.0, 7.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.07290649414062, -86.70169067382812, -84.33047485351562, -81.95925903320312, -79.58804321289062, -77.21682739257812, -74.84561157226562, -72.47439575195312, -70.10317993164062, -67.73196411132812, -65.36074829101562, -62.989532470703125, -60.618316650390625, -58.247100830078125, -55.875885009765625, -53.504669189453125, -51.133453369140625, -48.762237548828125, -46.391021728515625, -44.019805908203125, -41.648590087890625, -39.277374267578125, -36.906158447265625, -34.534942626953125, -32.163726806640625, -29.792510986328125, -27.421295166015625, -25.050079345703125, -22.678863525390625, -20.307647705078125, -17.936431884765625, -15.565216064453125, -13.194000244140625, -10.822784423828125, -8.451568603515625, -6.080352783203125, -3.709136962890625, -1.337921142578125, 1.033294677734375, 3.404510498046875, 5.775726318359375, 8.146942138671875, 10.518157958984375, 12.889373779296875, 15.260589599609375, 17.631805419921875, 20.003021240234375, 22.374237060546875, 24.745452880859375, 27.116668701171875, 29.487884521484375, 31.859100341796875, 34.230316162109375, 36.601531982421875, 38.972747802734375, 41.343963623046875, 43.715179443359375, 46.086395263671875, 48.457611083984375, 50.828826904296875, 53.200042724609375, 55.571258544921875, 57.942474365234375, 60.313690185546875, 62.684906005859375]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 3.0, 5.0, 6.0, 12.0, 12.0, 11.0, 13.0, 21.0, 19.0, 27.0, 24.0, 29.0, 19.0, 31.0, 44.0, 35.0, 31.0, 57.0, 52.0, 47.0, 46.0, 42.0, 40.0, 42.0, 40.0, 34.0, 43.0, 32.0, 22.0, 25.0, 25.0, 20.0, 17.0, 14.0, 16.0, 7.0, 18.0, 4.0, 3.0, 5.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0], "bins": [-58.80186462402344, -57.26301193237305, -55.72415542602539, -54.185302734375, -52.64645004272461, -51.10759735107422, -49.56874084472656, -48.02988815307617, -46.49103546142578, -44.95218276977539, -43.413326263427734, -41.874473571777344, -40.33562088012695, -38.79676818847656, -37.257911682128906, -35.719058990478516, -34.18020248413086, -32.64134979248047, -31.102495193481445, -29.563640594482422, -28.02478790283203, -26.485933303833008, -24.947078704833984, -23.408226013183594, -21.86937141418457, -20.330516815185547, -18.791664123535156, -17.252809524536133, -15.713955879211426, -14.175102233886719, -12.636247634887695, -11.097393989562988, -9.558540344238281, -8.019686698913574, -6.480832576751709, -4.941978454589844, -3.4031248092651367, -1.8642711639404297, -0.32541656494140625, 1.2134370803833008, 2.752290725708008, 4.291144371032715, 5.82999849319458, 7.368852615356445, 8.907706260681152, 10.44655990600586, 11.985414505004883, 13.52426815032959, 15.063121795654297, 16.60197639465332, 18.14082908630371, 19.679683685302734, 21.218536376953125, 22.75739097595215, 24.296245574951172, 25.835098266601562, 27.373952865600586, 28.91280746459961, 30.45166015625, 31.990514755249023, 33.52936935424805, 35.06822204589844, 36.607078552246094, 38.145931243896484, 39.684783935546875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 5.0, 5.0, 10.0, 8.0, 10.0, 16.0, 17.0, 30.0, 38.0, 53.0, 72.0, 88.0, 116.0, 185.0, 299.0, 505.0, 908.0, 1823.0, 4622.0, 15132.0, 81091.0, 3539064.0, 494410.0, 40469.0, 9356.0, 3082.0, 1267.0, 584.0, 339.0, 198.0, 126.0, 85.0, 67.0, 48.0, 36.0, 22.0, 29.0, 15.0, 15.0, 10.0, 6.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-33.59375, -32.65576171875, -31.7177734375, -30.77978515625, -29.841796875, -28.90380859375, -27.9658203125, -27.02783203125, -26.08984375, -25.15185546875, -24.2138671875, -23.27587890625, -22.337890625, -21.39990234375, -20.4619140625, -19.52392578125, -18.5859375, -17.64794921875, -16.7099609375, -15.77197265625, -14.833984375, -13.89599609375, -12.9580078125, -12.02001953125, -11.08203125, -10.14404296875, -9.2060546875, -8.26806640625, -7.330078125, -6.39208984375, -5.4541015625, -4.51611328125, -3.578125, -2.64013671875, -1.7021484375, -0.76416015625, 0.173828125, 1.11181640625, 2.0498046875, 2.98779296875, 3.92578125, 4.86376953125, 5.8017578125, 6.73974609375, 7.677734375, 8.61572265625, 9.5537109375, 10.49169921875, 11.4296875, 12.36767578125, 13.3056640625, 14.24365234375, 15.181640625, 16.11962890625, 17.0576171875, 17.99560546875, 18.93359375, 19.87158203125, 20.8095703125, 21.74755859375, 22.685546875, 23.62353515625, 24.5615234375, 25.49951171875, 26.4375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 10.0, 7.0, 30.0, 40.0, 57.0, 71.0, 87.0, 107.0, 111.0, 93.0, 91.0, 79.0, 57.0, 49.0, 30.0, 29.0, 21.0, 13.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-6.8671875, -6.69061279296875, -6.5140380859375, -6.33746337890625, -6.160888671875, -5.98431396484375, -5.8077392578125, -5.63116455078125, -5.45458984375, -5.27801513671875, -5.1014404296875, -4.92486572265625, -4.748291015625, -4.57171630859375, -4.3951416015625, -4.21856689453125, -4.0419921875, -3.86541748046875, -3.6888427734375, -3.51226806640625, -3.335693359375, -3.15911865234375, -2.9825439453125, -2.80596923828125, -2.62939453125, -2.45281982421875, -2.2762451171875, -2.09967041015625, -1.923095703125, -1.74652099609375, -1.5699462890625, -1.39337158203125, -1.216796875, -1.04022216796875, -0.8636474609375, -0.68707275390625, -0.510498046875, -0.33392333984375, -0.1573486328125, 0.01922607421875, 0.19580078125, 0.37237548828125, 0.5489501953125, 0.72552490234375, 0.902099609375, 1.07867431640625, 1.2552490234375, 1.43182373046875, 1.6083984375, 1.78497314453125, 1.9615478515625, 2.13812255859375, 2.314697265625, 2.49127197265625, 2.6678466796875, 2.84442138671875, 3.02099609375, 3.19757080078125, 3.3741455078125, 3.55072021484375, 3.727294921875, 3.90386962890625, 4.0804443359375, 4.25701904296875, 4.43359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 3.0, 4.0, 8.0, 3.0, 11.0, 10.0, 8.0, 27.0, 13.0, 24.0, 47.0, 53.0, 68.0, 93.0, 137.0, 237.0, 430.0, 1084.0, 2894.0, 12222.0, 75819.0, 2204972.0, 1806991.0, 72336.0, 11882.0, 2863.0, 956.0, 406.0, 234.0, 133.0, 87.0, 54.0, 49.0, 28.0, 32.0, 16.0, 12.0, 6.0, 9.0, 3.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.71875, -22.977294921875, -22.23583984375, -21.494384765625, -20.7529296875, -20.011474609375, -19.27001953125, -18.528564453125, -17.787109375, -17.045654296875, -16.30419921875, -15.562744140625, -14.8212890625, -14.079833984375, -13.33837890625, -12.596923828125, -11.85546875, -11.114013671875, -10.37255859375, -9.631103515625, -8.8896484375, -8.148193359375, -7.40673828125, -6.665283203125, -5.923828125, -5.182373046875, -4.44091796875, -3.699462890625, -2.9580078125, -2.216552734375, -1.47509765625, -0.733642578125, 0.0078125, 0.749267578125, 1.49072265625, 2.232177734375, 2.9736328125, 3.715087890625, 4.45654296875, 5.197998046875, 5.939453125, 6.680908203125, 7.42236328125, 8.163818359375, 8.9052734375, 9.646728515625, 10.38818359375, 11.129638671875, 11.87109375, 12.612548828125, 13.35400390625, 14.095458984375, 14.8369140625, 15.578369140625, 16.31982421875, 17.061279296875, 17.802734375, 18.544189453125, 19.28564453125, 20.027099609375, 20.7685546875, 21.510009765625, 22.25146484375, 22.992919921875, 23.734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 16.0, 15.0, 37.0, 78.0, 124.0, 313.0, 1361.0, 1536.0, 341.0, 113.0, 57.0, 34.0, 21.0, 12.0, 4.0, 7.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.875, -18.48193359375, -18.0888671875, -17.69580078125, -17.302734375, -16.90966796875, -16.5166015625, -16.12353515625, -15.73046875, -15.33740234375, -14.9443359375, -14.55126953125, -14.158203125, -13.76513671875, -13.3720703125, -12.97900390625, -12.5859375, -12.19287109375, -11.7998046875, -11.40673828125, -11.013671875, -10.62060546875, -10.2275390625, -9.83447265625, -9.44140625, -9.04833984375, -8.6552734375, -8.26220703125, -7.869140625, -7.47607421875, -7.0830078125, -6.68994140625, -6.296875, -5.90380859375, -5.5107421875, -5.11767578125, -4.724609375, -4.33154296875, -3.9384765625, -3.54541015625, -3.15234375, -2.75927734375, -2.3662109375, -1.97314453125, -1.580078125, -1.18701171875, -0.7939453125, -0.40087890625, -0.0078125, 0.38525390625, 0.7783203125, 1.17138671875, 1.564453125, 1.95751953125, 2.3505859375, 2.74365234375, 3.13671875, 3.52978515625, 3.9228515625, 4.31591796875, 4.708984375, 5.10205078125, 5.4951171875, 5.88818359375, 6.28125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 14.0, 37.0, 57.0, 109.0, 160.0, 215.0, 179.0, 121.0, 62.0, 22.0, 12.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.28348541259766, -76.07717895507812, -73.87088012695312, -71.6645736694336, -69.45826721191406, -67.25196838378906, -65.04566192626953, -62.839359283447266, -60.633056640625, -58.426753997802734, -56.2204475402832, -54.01414489746094, -51.80784225463867, -49.601539611816406, -47.395233154296875, -45.18893051147461, -42.98262405395508, -40.77632141113281, -38.57001495361328, -36.363712310791016, -34.15740966796875, -31.95110511779785, -29.744800567626953, -27.538497924804688, -25.33219337463379, -23.12588882446289, -20.919586181640625, -18.713281631469727, -16.506977081298828, -14.300674438476562, -12.094369888305664, -9.888066291809082, -7.6817626953125, -5.475459098815918, -3.2691550254821777, -1.0628509521484375, 1.1434526443481445, 3.3497562408447266, 5.556060791015625, 7.762364387512207, 9.968667984008789, 12.174971580505371, 14.381275177001953, 16.58757972717285, 18.79388427734375, 21.000186920166016, 23.206491470336914, 25.412796020507812, 27.619098663330078, 29.825403213500977, 32.031707763671875, 34.23801040649414, 36.444313049316406, 38.65061950683594, 40.8569221496582, 43.06322479248047, 45.26953125, 47.475833892822266, 49.6821403503418, 51.88844299316406, 54.09474563598633, 56.301048278808594, 58.507354736328125, 60.71365737915039, 62.919960021972656]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 5.0, 10.0, 14.0, 17.0, 15.0, 23.0, 28.0, 32.0, 34.0, 63.0, 55.0, 61.0, 56.0, 71.0, 77.0, 66.0, 54.0, 65.0, 49.0, 38.0, 51.0, 21.0, 24.0, 25.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.172332763671875, -37.1909065246582, -36.209476470947266, -35.228050231933594, -34.246620178222656, -33.265193939208984, -32.28376388549805, -31.302335739135742, -30.320907592773438, -29.339479446411133, -28.358051300048828, -27.376623153686523, -26.39519500732422, -25.413766860961914, -24.43233871459961, -23.450910568237305, -22.469482421875, -21.488054275512695, -20.50662612915039, -19.525197982788086, -18.54376983642578, -17.562341690063477, -16.580913543701172, -15.599485397338867, -14.618059158325195, -13.63663101196289, -12.655202865600586, -11.673774719238281, -10.692346572875977, -9.710918426513672, -8.729490280151367, -7.748062610626221, -6.766633987426758, -5.785205841064453, -4.803777694702148, -3.822349786758423, -2.840921640396118, -1.8594937324523926, -0.8780655860900879, 0.1033625602722168, 1.0847907066345215, 2.066218852996826, 3.047646999359131, 4.029074668884277, 5.010502815246582, 5.991930961608887, 6.973359107971191, 7.954787254333496, 8.9362154006958, 9.917643547058105, 10.89907169342041, 11.880499839782715, 12.86192798614502, 13.843355178833008, 14.824783325195312, 15.806211471557617, 16.787639617919922, 17.769067764282227, 18.75049591064453, 19.731924057006836, 20.71335220336914, 21.694780349731445, 22.67620849609375, 23.657636642456055, 24.63906478881836]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 5.0, 11.0, 6.0, 20.0, 25.0, 28.0, 44.0, 59.0, 62.0, 138.0, 261.0, 437.0, 913.0, 2238.0, 7565.0, 40329.0, 448974.0, 492506.0, 42472.0, 8132.0, 2288.0, 924.0, 452.0, 252.0, 141.0, 90.0, 42.0, 51.0, 16.0, 14.0, 14.0, 6.0, 16.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.29638671875, -30.2177734375, -29.13916015625, -28.060546875, -26.98193359375, -25.9033203125, -24.82470703125, -23.74609375, -22.66748046875, -21.5888671875, -20.51025390625, -19.431640625, -18.35302734375, -17.2744140625, -16.19580078125, -15.1171875, -14.03857421875, -12.9599609375, -11.88134765625, -10.802734375, -9.72412109375, -8.6455078125, -7.56689453125, -6.48828125, -5.40966796875, -4.3310546875, -3.25244140625, -2.173828125, -1.09521484375, -0.0166015625, 1.06201171875, 2.140625, 3.21923828125, 4.2978515625, 5.37646484375, 6.455078125, 7.53369140625, 8.6123046875, 9.69091796875, 10.76953125, 11.84814453125, 12.9267578125, 14.00537109375, 15.083984375, 16.16259765625, 17.2412109375, 18.31982421875, 19.3984375, 20.47705078125, 21.5556640625, 22.63427734375, 23.712890625, 24.79150390625, 25.8701171875, 26.94873046875, 28.02734375, 29.10595703125, 30.1845703125, 31.26318359375, 32.341796875, 33.42041015625, 34.4990234375, 35.57763671875, 36.65625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 8.0, 7.0, 14.0, 42.0, 44.0, 59.0, 79.0, 90.0, 113.0, 92.0, 99.0, 83.0, 79.0, 51.0, 44.0, 32.0, 23.0, 15.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.8515625, -6.6734619140625, -6.495361328125, -6.3172607421875, -6.13916015625, -5.9610595703125, -5.782958984375, -5.6048583984375, -5.4267578125, -5.2486572265625, -5.070556640625, -4.8924560546875, -4.71435546875, -4.5362548828125, -4.358154296875, -4.1800537109375, -4.001953125, -3.8238525390625, -3.645751953125, -3.4676513671875, -3.28955078125, -3.1114501953125, -2.933349609375, -2.7552490234375, -2.5771484375, -2.3990478515625, -2.220947265625, -2.0428466796875, -1.86474609375, -1.6866455078125, -1.508544921875, -1.3304443359375, -1.15234375, -0.9742431640625, -0.796142578125, -0.6180419921875, -0.43994140625, -0.2618408203125, -0.083740234375, 0.0943603515625, 0.2724609375, 0.4505615234375, 0.628662109375, 0.8067626953125, 0.98486328125, 1.1629638671875, 1.341064453125, 1.5191650390625, 1.697265625, 1.8753662109375, 2.053466796875, 2.2315673828125, 2.40966796875, 2.5877685546875, 2.765869140625, 2.9439697265625, 3.1220703125, 3.3001708984375, 3.478271484375, 3.6563720703125, 3.83447265625, 4.0125732421875, 4.190673828125, 4.3687744140625, 4.546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 11.0, 18.0, 32.0, 29.0, 39.0, 85.0, 114.0, 164.0, 279.0, 455.0, 804.0, 1617.0, 4013.0, 12115.0, 46437.0, 213045.0, 576537.0, 144909.0, 32408.0, 9099.0, 3151.0, 1408.0, 682.0, 385.0, 237.0, 145.0, 99.0, 66.0, 47.0, 28.0, 25.0, 17.0, 10.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.359375, -11.890869140625, -11.42236328125, -10.953857421875, -10.4853515625, -10.016845703125, -9.54833984375, -9.079833984375, -8.611328125, -8.142822265625, -7.67431640625, -7.205810546875, -6.7373046875, -6.268798828125, -5.80029296875, -5.331787109375, -4.86328125, -4.394775390625, -3.92626953125, -3.457763671875, -2.9892578125, -2.520751953125, -2.05224609375, -1.583740234375, -1.115234375, -0.646728515625, -0.17822265625, 0.290283203125, 0.7587890625, 1.227294921875, 1.69580078125, 2.164306640625, 2.6328125, 3.101318359375, 3.56982421875, 4.038330078125, 4.5068359375, 4.975341796875, 5.44384765625, 5.912353515625, 6.380859375, 6.849365234375, 7.31787109375, 7.786376953125, 8.2548828125, 8.723388671875, 9.19189453125, 9.660400390625, 10.12890625, 10.597412109375, 11.06591796875, 11.534423828125, 12.0029296875, 12.471435546875, 12.93994140625, 13.408447265625, 13.876953125, 14.345458984375, 14.81396484375, 15.282470703125, 15.7509765625, 16.219482421875, 16.68798828125, 17.156494140625, 17.625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 5.0, 7.0, 14.0, 20.0, 18.0, 14.0, 17.0, 38.0, 34.0, 37.0, 43.0, 49.0, 46.0, 64.0, 53.0, 43.0, 69.0, 46.0, 55.0, 54.0, 53.0, 43.0, 37.0, 25.0, 31.0, 26.0, 15.0, 10.0, 11.0, 3.0, 12.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.2691650390625, -9.874267578125, -9.4793701171875, -9.08447265625, -8.6895751953125, -8.294677734375, -7.8997802734375, -7.5048828125, -7.1099853515625, -6.715087890625, -6.3201904296875, -5.92529296875, -5.5303955078125, -5.135498046875, -4.7406005859375, -4.345703125, -3.9508056640625, -3.555908203125, -3.1610107421875, -2.76611328125, -2.3712158203125, -1.976318359375, -1.5814208984375, -1.1865234375, -0.7916259765625, -0.396728515625, -0.0018310546875, 0.39306640625, 0.7879638671875, 1.182861328125, 1.5777587890625, 1.97265625, 2.3675537109375, 2.762451171875, 3.1573486328125, 3.55224609375, 3.9471435546875, 4.342041015625, 4.7369384765625, 5.1318359375, 5.5267333984375, 5.921630859375, 6.3165283203125, 6.71142578125, 7.1063232421875, 7.501220703125, 7.8961181640625, 8.291015625, 8.6859130859375, 9.080810546875, 9.4757080078125, 9.87060546875, 10.2655029296875, 10.660400390625, 11.0552978515625, 11.4501953125, 11.8450927734375, 12.239990234375, 12.6348876953125, 13.02978515625, 13.4246826171875, 13.819580078125, 14.2144775390625, 14.609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 10.0, 7.0, 13.0, 36.0, 40.0, 68.0, 117.0, 204.0, 374.0, 865.0, 2501.0, 7957.0, 33995.0, 206885.0, 641094.0, 121832.0, 23257.0, 5953.0, 1877.0, 699.0, 336.0, 161.0, 98.0, 60.0, 29.0, 28.0, 19.0, 9.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.93157958984375, -5.7225341796875, -5.51348876953125, -5.304443359375, -5.09539794921875, -4.8863525390625, -4.67730712890625, -4.46826171875, -4.25921630859375, -4.0501708984375, -3.84112548828125, -3.632080078125, -3.42303466796875, -3.2139892578125, -3.00494384765625, -2.7958984375, -2.58685302734375, -2.3778076171875, -2.16876220703125, -1.959716796875, -1.75067138671875, -1.5416259765625, -1.33258056640625, -1.12353515625, -0.91448974609375, -0.7054443359375, -0.49639892578125, -0.287353515625, -0.07830810546875, 0.1307373046875, 0.33978271484375, 0.548828125, 0.75787353515625, 0.9669189453125, 1.17596435546875, 1.385009765625, 1.59405517578125, 1.8031005859375, 2.01214599609375, 2.22119140625, 2.43023681640625, 2.6392822265625, 2.84832763671875, 3.057373046875, 3.26641845703125, 3.4754638671875, 3.68450927734375, 3.8935546875, 4.10260009765625, 4.3116455078125, 4.52069091796875, 4.729736328125, 4.93878173828125, 5.1478271484375, 5.35687255859375, 5.56591796875, 5.77496337890625, 5.9840087890625, 6.19305419921875, 6.402099609375, 6.61114501953125, 6.8201904296875, 7.02923583984375, 7.23828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 5.0, 9.0, 7.0, 2.0, 9.0, 12.0, 11.0, 12.0, 18.0, 24.0, 25.0, 40.0, 50.0, 102.0, 163.0, 157.0, 123.0, 48.0, 43.0, 26.0, 14.0, 12.0, 11.0, 18.0, 10.0, 10.0, 4.0, 4.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007829666137695312, -0.0007569491863250732, -0.0007309317588806152, -0.0007049143314361572, -0.0006788969039916992, -0.0006528794765472412, -0.0006268620491027832, -0.0006008446216583252, -0.0005748271942138672, -0.0005488097667694092, -0.0005227923393249512, -0.0004967749118804932, -0.00047075748443603516, -0.00044474005699157715, -0.00041872262954711914, -0.00039270520210266113, -0.0003666877746582031, -0.0003406703472137451, -0.0003146529197692871, -0.0002886354923248291, -0.0002626180648803711, -0.00023660063743591309, -0.00021058320999145508, -0.00018456578254699707, -0.00015854835510253906, -0.00013253092765808105, -0.00010651350021362305, -8.049607276916504e-05, -5.447864532470703e-05, -2.8461217880249023e-05, -2.4437904357910156e-06, 2.3573637008666992e-05, 4.9591064453125e-05, 7.560849189758301e-05, 0.00010162591934204102, 0.00012764334678649902, 0.00015366077423095703, 0.00017967820167541504, 0.00020569562911987305, 0.00023171305656433105, 0.00025773048400878906, 0.00028374791145324707, 0.0003097653388977051, 0.0003357827663421631, 0.0003618001937866211, 0.0003878176212310791, 0.0004138350486755371, 0.0004398524761199951, 0.0004658699035644531, 0.0004918873310089111, 0.0005179047584533691, 0.0005439221858978271, 0.0005699396133422852, 0.0005959570407867432, 0.0006219744682312012, 0.0006479918956756592, 0.0006740093231201172, 0.0007000267505645752, 0.0007260441780090332, 0.0007520616054534912, 0.0007780790328979492, 0.0008040964603424072, 0.0008301138877868652, 0.0008561313152313232, 0.0008821487426757812]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 2.0, 6.0, 7.0, 5.0, 6.0, 15.0, 14.0, 24.0, 31.0, 58.0, 75.0, 106.0, 227.0, 385.0, 905.0, 2379.0, 7843.0, 34605.0, 268790.0, 640473.0, 72333.0, 13916.0, 3754.0, 1322.0, 562.0, 277.0, 154.0, 111.0, 68.0, 28.0, 34.0, 24.0, 10.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.296875, -8.0677490234375, -7.838623046875, -7.6094970703125, -7.38037109375, -7.1512451171875, -6.922119140625, -6.6929931640625, -6.4638671875, -6.2347412109375, -6.005615234375, -5.7764892578125, -5.54736328125, -5.3182373046875, -5.089111328125, -4.8599853515625, -4.630859375, -4.4017333984375, -4.172607421875, -3.9434814453125, -3.71435546875, -3.4852294921875, -3.256103515625, -3.0269775390625, -2.7978515625, -2.5687255859375, -2.339599609375, -2.1104736328125, -1.88134765625, -1.6522216796875, -1.423095703125, -1.1939697265625, -0.96484375, -0.7357177734375, -0.506591796875, -0.2774658203125, -0.04833984375, 0.1807861328125, 0.409912109375, 0.6390380859375, 0.8681640625, 1.0972900390625, 1.326416015625, 1.5555419921875, 1.78466796875, 2.0137939453125, 2.242919921875, 2.4720458984375, 2.701171875, 2.9302978515625, 3.159423828125, 3.3885498046875, 3.61767578125, 3.8468017578125, 4.075927734375, 4.3050537109375, 4.5341796875, 4.7633056640625, 4.992431640625, 5.2215576171875, 5.45068359375, 5.6798095703125, 5.908935546875, 6.1380615234375, 6.3671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 2.0, 3.0, 9.0, 12.0, 6.0, 9.0, 13.0, 26.0, 33.0, 35.0, 68.0, 92.0, 131.0, 117.0, 125.0, 84.0, 63.0, 45.0, 29.0, 22.0, 18.0, 13.0, 7.0, 2.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.86944580078125, -3.7232666015625, -3.57708740234375, -3.430908203125, -3.28472900390625, -3.1385498046875, -2.99237060546875, -2.84619140625, -2.70001220703125, -2.5538330078125, -2.40765380859375, -2.261474609375, -2.11529541015625, -1.9691162109375, -1.82293701171875, -1.6767578125, -1.53057861328125, -1.3843994140625, -1.23822021484375, -1.092041015625, -0.94586181640625, -0.7996826171875, -0.65350341796875, -0.50732421875, -0.36114501953125, -0.2149658203125, -0.06878662109375, 0.077392578125, 0.22357177734375, 0.3697509765625, 0.51593017578125, 0.662109375, 0.80828857421875, 0.9544677734375, 1.10064697265625, 1.246826171875, 1.39300537109375, 1.5391845703125, 1.68536376953125, 1.83154296875, 1.97772216796875, 2.1239013671875, 2.27008056640625, 2.416259765625, 2.56243896484375, 2.7086181640625, 2.85479736328125, 3.0009765625, 3.14715576171875, 3.2933349609375, 3.43951416015625, 3.585693359375, 3.73187255859375, 3.8780517578125, 4.02423095703125, 4.17041015625, 4.31658935546875, 4.4627685546875, 4.60894775390625, 4.755126953125, 4.90130615234375, 5.0474853515625, 5.19366455078125, 5.33984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 18.0, 30.0, 34.0, 53.0, 68.0, 97.0, 116.0, 107.0, 108.0, 78.0, 76.0, 57.0, 46.0, 35.0, 17.0, 20.0, 5.0, 8.0, 3.0, 7.0, 2.0, 2.0, 1.0, 4.0], "bins": [-105.02230072021484, -102.8188247680664, -100.61534118652344, -98.411865234375, -96.20838928222656, -94.0049057006836, -91.80142974853516, -89.59794616699219, -87.39447021484375, -85.19099426269531, -82.98751068115234, -80.7840347290039, -78.58055114746094, -76.3770751953125, -74.17359924316406, -71.9701156616211, -69.76663970947266, -67.56316375732422, -65.35968017578125, -63.15620422363281, -60.95272445678711, -58.749244689941406, -56.54576873779297, -54.342288970947266, -52.13880920410156, -49.93532943725586, -47.731849670410156, -45.52837371826172, -43.324893951416016, -41.12141418457031, -38.917938232421875, -36.71445846557617, -34.510986328125, -32.3075065612793, -30.104028701782227, -27.900550842285156, -25.697071075439453, -23.49359130859375, -21.29011344909668, -19.08663558959961, -16.883155822753906, -14.67967700958252, -12.476198196411133, -10.272719383239746, -8.06924057006836, -5.865761756896973, -3.662282943725586, -1.4588041305541992, 0.7446746826171875, 2.948153495788574, 5.151632308959961, 7.355111122131348, 9.558589935302734, 11.762068748474121, 13.965547561645508, 16.169025421142578, 18.37250518798828, 20.575984954833984, 22.779462814331055, 24.982940673828125, 27.186420440673828, 29.38990020751953, 31.5933780670166, 33.79685592651367, 36.000335693359375]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 8.0, 14.0, 13.0, 12.0, 22.0, 22.0, 24.0, 22.0, 27.0, 33.0, 40.0, 49.0, 35.0, 48.0, 40.0, 42.0, 41.0, 57.0, 54.0, 41.0, 28.0, 35.0, 35.0, 37.0, 45.0, 29.0, 21.0, 21.0, 22.0, 12.0, 23.0, 6.0, 9.0, 3.0, 1.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-58.153343200683594, -56.416770935058594, -54.680198669433594, -52.943626403808594, -51.207054138183594, -49.470481872558594, -47.733909606933594, -45.99734115600586, -44.26076889038086, -42.52419662475586, -40.78762435913086, -39.05105209350586, -37.31447982788086, -35.577911376953125, -33.841339111328125, -32.104766845703125, -30.368192672729492, -28.631620407104492, -26.895048141479492, -25.158477783203125, -23.421905517578125, -21.685333251953125, -19.948760986328125, -18.212188720703125, -16.475616455078125, -14.739044189453125, -13.002472877502441, -11.265900611877441, -9.529329299926758, -7.792757034301758, -6.056184768676758, -4.319613456726074, -2.5830421447753906, -0.8464702367782593, 0.8901016712188721, 2.626673698425293, 4.363245487213135, 6.099817276000977, 7.836389541625977, 9.57296085357666, 11.30953311920166, 13.04610538482666, 14.782676696777344, 16.519248962402344, 18.255821228027344, 19.992393493652344, 21.728965759277344, 23.46553611755371, 25.20210838317871, 26.93868064880371, 28.67525291442871, 30.411823272705078, 32.14839553833008, 33.88496780395508, 35.62154006958008, 37.35811233520508, 39.09468460083008, 40.83125686645508, 42.56782913208008, 44.30440139770508, 46.04097366333008, 47.77754211425781, 49.51411437988281, 51.25068664550781, 52.98725891113281]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 9.0, 5.0, 6.0, 6.0, 10.0, 14.0, 6.0, 33.0, 25.0, 46.0, 56.0, 99.0, 122.0, 178.0, 325.0, 609.0, 1182.0, 2954.0, 9404.0, 46435.0, 3246499.0, 836754.0, 37144.0, 7863.0, 2438.0, 988.0, 420.0, 231.0, 153.0, 64.0, 58.0, 44.0, 31.0, 19.0, 16.0, 16.0, 4.0, 8.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-42.6875, -41.49951171875, -40.3115234375, -39.12353515625, -37.935546875, -36.74755859375, -35.5595703125, -34.37158203125, -33.18359375, -31.99560546875, -30.8076171875, -29.61962890625, -28.431640625, -27.24365234375, -26.0556640625, -24.86767578125, -23.6796875, -22.49169921875, -21.3037109375, -20.11572265625, -18.927734375, -17.73974609375, -16.5517578125, -15.36376953125, -14.17578125, -12.98779296875, -11.7998046875, -10.61181640625, -9.423828125, -8.23583984375, -7.0478515625, -5.85986328125, -4.671875, -3.48388671875, -2.2958984375, -1.10791015625, 0.080078125, 1.26806640625, 2.4560546875, 3.64404296875, 4.83203125, 6.02001953125, 7.2080078125, 8.39599609375, 9.583984375, 10.77197265625, 11.9599609375, 13.14794921875, 14.3359375, 15.52392578125, 16.7119140625, 17.89990234375, 19.087890625, 20.27587890625, 21.4638671875, 22.65185546875, 23.83984375, 25.02783203125, 26.2158203125, 27.40380859375, 28.591796875, 29.77978515625, 30.9677734375, 32.15576171875, 33.34375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 9.0, 16.0, 26.0, 35.0, 57.0, 61.0, 68.0, 95.0, 101.0, 93.0, 78.0, 83.0, 62.0, 56.0, 43.0, 30.0, 19.0, 23.0, 10.0, 9.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0], "bins": [-6.68359375, -6.51348876953125, -6.3433837890625, -6.17327880859375, -6.003173828125, -5.83306884765625, -5.6629638671875, -5.49285888671875, -5.32275390625, -5.15264892578125, -4.9825439453125, -4.81243896484375, -4.642333984375, -4.47222900390625, -4.3021240234375, -4.13201904296875, -3.9619140625, -3.79180908203125, -3.6217041015625, -3.45159912109375, -3.281494140625, -3.11138916015625, -2.9412841796875, -2.77117919921875, -2.60107421875, -2.43096923828125, -2.2608642578125, -2.09075927734375, -1.920654296875, -1.75054931640625, -1.5804443359375, -1.41033935546875, -1.240234375, -1.07012939453125, -0.9000244140625, -0.72991943359375, -0.559814453125, -0.38970947265625, -0.2196044921875, -0.04949951171875, 0.12060546875, 0.29071044921875, 0.4608154296875, 0.63092041015625, 0.801025390625, 0.97113037109375, 1.1412353515625, 1.31134033203125, 1.4814453125, 1.65155029296875, 1.8216552734375, 1.99176025390625, 2.161865234375, 2.33197021484375, 2.5020751953125, 2.67218017578125, 2.84228515625, 3.01239013671875, 3.1824951171875, 3.35260009765625, 3.522705078125, 3.69281005859375, 3.8629150390625, 4.03302001953125, 4.203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 13.0, 13.0, 25.0, 34.0, 51.0, 68.0, 85.0, 130.0, 197.0, 281.0, 375.0, 697.0, 1152.0, 2276.0, 4912.0, 12425.0, 39250.0, 192669.0, 3230851.0, 596519.0, 76805.0, 20802.0, 7473.0, 3236.0, 1567.0, 816.0, 462.0, 342.0, 253.0, 148.0, 89.0, 83.0, 53.0, 39.0, 21.0, 19.0, 12.0, 6.0, 5.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.43408203125, -15.8994140625, -15.36474609375, -14.830078125, -14.29541015625, -13.7607421875, -13.22607421875, -12.69140625, -12.15673828125, -11.6220703125, -11.08740234375, -10.552734375, -10.01806640625, -9.4833984375, -8.94873046875, -8.4140625, -7.87939453125, -7.3447265625, -6.81005859375, -6.275390625, -5.74072265625, -5.2060546875, -4.67138671875, -4.13671875, -3.60205078125, -3.0673828125, -2.53271484375, -1.998046875, -1.46337890625, -0.9287109375, -0.39404296875, 0.140625, 0.67529296875, 1.2099609375, 1.74462890625, 2.279296875, 2.81396484375, 3.3486328125, 3.88330078125, 4.41796875, 4.95263671875, 5.4873046875, 6.02197265625, 6.556640625, 7.09130859375, 7.6259765625, 8.16064453125, 8.6953125, 9.22998046875, 9.7646484375, 10.29931640625, 10.833984375, 11.36865234375, 11.9033203125, 12.43798828125, 12.97265625, 13.50732421875, 14.0419921875, 14.57666015625, 15.111328125, 15.64599609375, 16.1806640625, 16.71533203125, 17.25]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 14.0, 13.0, 16.0, 31.0, 48.0, 90.0, 132.0, 295.0, 738.0, 1674.0, 512.0, 204.0, 107.0, 54.0, 40.0, 24.0, 23.0, 8.0, 13.0, 7.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7650146484375, -8.530029296875, -8.2950439453125, -8.06005859375, -7.8250732421875, -7.590087890625, -7.3551025390625, -7.1201171875, -6.8851318359375, -6.650146484375, -6.4151611328125, -6.18017578125, -5.9451904296875, -5.710205078125, -5.4752197265625, -5.240234375, -5.0052490234375, -4.770263671875, -4.5352783203125, -4.30029296875, -4.0653076171875, -3.830322265625, -3.5953369140625, -3.3603515625, -3.1253662109375, -2.890380859375, -2.6553955078125, -2.42041015625, -2.1854248046875, -1.950439453125, -1.7154541015625, -1.48046875, -1.2454833984375, -1.010498046875, -0.7755126953125, -0.54052734375, -0.3055419921875, -0.070556640625, 0.1644287109375, 0.3994140625, 0.6343994140625, 0.869384765625, 1.1043701171875, 1.33935546875, 1.5743408203125, 1.809326171875, 2.0443115234375, 2.279296875, 2.5142822265625, 2.749267578125, 2.9842529296875, 3.21923828125, 3.4542236328125, 3.689208984375, 3.9241943359375, 4.1591796875, 4.3941650390625, 4.629150390625, 4.8641357421875, 5.09912109375, 5.3341064453125, 5.569091796875, 5.8040771484375, 6.0390625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 13.0, 11.0, 44.0, 101.0, 155.0, 209.0, 202.0, 141.0, 78.0, 31.0, 11.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.01611328125, -102.62124633789062, -100.22637939453125, -97.83151245117188, -95.4366455078125, -93.04177856445312, -90.64691162109375, -88.25204467773438, -85.857177734375, -83.46231079101562, -81.06744384765625, -78.67257690429688, -76.2777099609375, -73.88284301757812, -71.48797607421875, -69.09310913085938, -66.69824981689453, -64.30338287353516, -61.90851593017578, -59.513648986816406, -57.11878204345703, -54.723915100097656, -52.32905197143555, -49.93418502807617, -47.5393180847168, -45.14445114135742, -42.74958419799805, -40.35471725463867, -37.95985412597656, -35.56498718261719, -33.17012023925781, -30.775253295898438, -28.38037872314453, -25.985511779785156, -23.59064483642578, -21.19577980041504, -18.800912857055664, -16.40604591369629, -14.01117992401123, -11.616313934326172, -9.221446990966797, -6.82658052444458, -4.431714057922363, -2.0368475914001465, 0.3580188751220703, 2.7528858184814453, 5.147751808166504, 7.5426177978515625, 9.937484741210938, 12.332351684570312, 14.727217674255371, 17.12208366394043, 19.516950607299805, 21.91181755065918, 24.306682586669922, 26.701549530029297, 29.096416473388672, 31.491283416748047, 33.88615036010742, 36.2810173034668, 38.675880432128906, 41.07074737548828, 43.465614318847656, 45.86048126220703, 48.255348205566406]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 7.0, 12.0, 13.0, 15.0, 26.0, 33.0, 29.0, 31.0, 60.0, 55.0, 73.0, 76.0, 64.0, 48.0, 53.0, 69.0, 61.0, 64.0, 60.0, 49.0, 26.0, 12.0, 10.0, 15.0, 13.0, 8.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.578243255615234, -30.707008361816406, -29.835771560668945, -28.964536666870117, -28.093299865722656, -27.222064971923828, -26.350830078125, -25.47959327697754, -24.60835838317871, -23.737123489379883, -22.865886688232422, -21.994651794433594, -21.123414993286133, -20.252180099487305, -19.380943298339844, -18.509708404541016, -17.638473510742188, -16.76723861694336, -15.896001815795898, -15.02476692199707, -14.153531074523926, -13.282295227050781, -12.411059379577637, -11.539823532104492, -10.668586730957031, -9.797350883483887, -8.926115036010742, -8.054880142211914, -7.1836442947387695, -6.312408447265625, -5.4411725997924805, -4.569937229156494, -3.698701858520508, -2.8274662494659424, -1.9562305212020874, -1.0849947929382324, -0.213759183883667, 0.6574764251708984, 1.528712272644043, 2.3999476432800293, 3.271183490753174, 4.142419338226318, 5.013654708862305, 5.884890556335449, 6.756126403808594, 7.62736177444458, 8.498598098754883, 9.369832992553711, 10.241068840026855, 11.1123046875, 11.983540534973145, 12.854776382446289, 13.726011276245117, 14.597247123718262, 15.468482971191406, 16.339717864990234, 17.210954666137695, 18.082189559936523, 18.953426361083984, 19.824661254882812, 20.695898056030273, 21.5671329498291, 22.438369750976562, 23.30960464477539, 24.18083953857422]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 10.0, 18.0, 30.0, 53.0, 91.0, 148.0, 202.0, 363.0, 823.0, 2168.0, 9693.0, 67759.0, 767652.0, 173729.0, 19807.0, 3654.0, 1127.0, 500.0, 280.0, 171.0, 88.0, 66.0, 34.0, 28.0, 11.0, 9.0, 10.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.40625, -36.26220703125, -35.1181640625, -33.97412109375, -32.830078125, -31.68603515625, -30.5419921875, -29.39794921875, -28.25390625, -27.10986328125, -25.9658203125, -24.82177734375, -23.677734375, -22.53369140625, -21.3896484375, -20.24560546875, -19.1015625, -17.95751953125, -16.8134765625, -15.66943359375, -14.525390625, -13.38134765625, -12.2373046875, -11.09326171875, -9.94921875, -8.80517578125, -7.6611328125, -6.51708984375, -5.373046875, -4.22900390625, -3.0849609375, -1.94091796875, -0.796875, 0.34716796875, 1.4912109375, 2.63525390625, 3.779296875, 4.92333984375, 6.0673828125, 7.21142578125, 8.35546875, 9.49951171875, 10.6435546875, 11.78759765625, 12.931640625, 14.07568359375, 15.2197265625, 16.36376953125, 17.5078125, 18.65185546875, 19.7958984375, 20.93994140625, 22.083984375, 23.22802734375, 24.3720703125, 25.51611328125, 26.66015625, 27.80419921875, 28.9482421875, 30.09228515625, 31.236328125, 32.38037109375, 33.5244140625, 34.66845703125, 35.8125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 8.0, 26.0, 33.0, 39.0, 57.0, 76.0, 81.0, 86.0, 112.0, 93.0, 82.0, 71.0, 67.0, 47.0, 22.0, 31.0, 22.0, 16.0, 8.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.79296875, -6.6131591796875, -6.433349609375, -6.2535400390625, -6.07373046875, -5.8939208984375, -5.714111328125, -5.5343017578125, -5.3544921875, -5.1746826171875, -4.994873046875, -4.8150634765625, -4.63525390625, -4.4554443359375, -4.275634765625, -4.0958251953125, -3.916015625, -3.7362060546875, -3.556396484375, -3.3765869140625, -3.19677734375, -3.0169677734375, -2.837158203125, -2.6573486328125, -2.4775390625, -2.2977294921875, -2.117919921875, -1.9381103515625, -1.75830078125, -1.5784912109375, -1.398681640625, -1.2188720703125, -1.0390625, -0.8592529296875, -0.679443359375, -0.4996337890625, -0.31982421875, -0.1400146484375, 0.039794921875, 0.2196044921875, 0.3994140625, 0.5792236328125, 0.759033203125, 0.9388427734375, 1.11865234375, 1.2984619140625, 1.478271484375, 1.6580810546875, 1.837890625, 2.0177001953125, 2.197509765625, 2.3773193359375, 2.55712890625, 2.7369384765625, 2.916748046875, 3.0965576171875, 3.2763671875, 3.4561767578125, 3.635986328125, 3.8157958984375, 3.99560546875, 4.1754150390625, 4.355224609375, 4.5350341796875, 4.71484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 5.0, 6.0, 7.0, 6.0, 5.0, 9.0, 12.0, 34.0, 54.0, 61.0, 95.0, 150.0, 280.0, 608.0, 1223.0, 2617.0, 6506.0, 16878.0, 48325.0, 199023.0, 595093.0, 120419.0, 35170.0, 12890.0, 4920.0, 2022.0, 987.0, 509.0, 252.0, 143.0, 89.0, 47.0, 34.0, 29.0, 10.0, 10.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.18115234375, -12.7607421875, -12.34033203125, -11.919921875, -11.49951171875, -11.0791015625, -10.65869140625, -10.23828125, -9.81787109375, -9.3974609375, -8.97705078125, -8.556640625, -8.13623046875, -7.7158203125, -7.29541015625, -6.875, -6.45458984375, -6.0341796875, -5.61376953125, -5.193359375, -4.77294921875, -4.3525390625, -3.93212890625, -3.51171875, -3.09130859375, -2.6708984375, -2.25048828125, -1.830078125, -1.40966796875, -0.9892578125, -0.56884765625, -0.1484375, 0.27197265625, 0.6923828125, 1.11279296875, 1.533203125, 1.95361328125, 2.3740234375, 2.79443359375, 3.21484375, 3.63525390625, 4.0556640625, 4.47607421875, 4.896484375, 5.31689453125, 5.7373046875, 6.15771484375, 6.578125, 6.99853515625, 7.4189453125, 7.83935546875, 8.259765625, 8.68017578125, 9.1005859375, 9.52099609375, 9.94140625, 10.36181640625, 10.7822265625, 11.20263671875, 11.623046875, 12.04345703125, 12.4638671875, 12.88427734375, 13.3046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 9.0, 5.0, 17.0, 11.0, 15.0, 25.0, 35.0, 31.0, 36.0, 36.0, 52.0, 53.0, 46.0, 63.0, 60.0, 65.0, 56.0, 58.0, 55.0, 42.0, 47.0, 37.0, 32.0, 24.0, 18.0, 12.0, 13.0, 11.0, 7.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.0625, -12.6397705078125, -12.217041015625, -11.7943115234375, -11.37158203125, -10.9488525390625, -10.526123046875, -10.1033935546875, -9.6806640625, -9.2579345703125, -8.835205078125, -8.4124755859375, -7.98974609375, -7.5670166015625, -7.144287109375, -6.7215576171875, -6.298828125, -5.8760986328125, -5.453369140625, -5.0306396484375, -4.60791015625, -4.1851806640625, -3.762451171875, -3.3397216796875, -2.9169921875, -2.4942626953125, -2.071533203125, -1.6488037109375, -1.22607421875, -0.8033447265625, -0.380615234375, 0.0421142578125, 0.46484375, 0.8875732421875, 1.310302734375, 1.7330322265625, 2.15576171875, 2.5784912109375, 3.001220703125, 3.4239501953125, 3.8466796875, 4.2694091796875, 4.692138671875, 5.1148681640625, 5.53759765625, 5.9603271484375, 6.383056640625, 6.8057861328125, 7.228515625, 7.6512451171875, 8.073974609375, 8.4967041015625, 8.91943359375, 9.3421630859375, 9.764892578125, 10.1876220703125, 10.6103515625, 11.0330810546875, 11.455810546875, 11.8785400390625, 12.30126953125, 12.7239990234375, 13.146728515625, 13.5694580078125, 13.9921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 7.0, 11.0, 7.0, 10.0, 22.0, 20.0, 34.0, 36.0, 45.0, 85.0, 205.0, 620.0, 2215.0, 9230.0, 59198.0, 879662.0, 81737.0, 11574.0, 2584.0, 719.0, 218.0, 99.0, 60.0, 36.0, 31.0, 23.0, 21.0, 13.0, 9.0, 7.0, 11.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.3504638671875, -13.935302734375, -13.5201416015625, -13.10498046875, -12.6898193359375, -12.274658203125, -11.8594970703125, -11.4443359375, -11.0291748046875, -10.614013671875, -10.1988525390625, -9.78369140625, -9.3685302734375, -8.953369140625, -8.5382080078125, -8.123046875, -7.7078857421875, -7.292724609375, -6.8775634765625, -6.46240234375, -6.0472412109375, -5.632080078125, -5.2169189453125, -4.8017578125, -4.3865966796875, -3.971435546875, -3.5562744140625, -3.14111328125, -2.7259521484375, -2.310791015625, -1.8956298828125, -1.48046875, -1.0653076171875, -0.650146484375, -0.2349853515625, 0.18017578125, 0.5953369140625, 1.010498046875, 1.4256591796875, 1.8408203125, 2.2559814453125, 2.671142578125, 3.0863037109375, 3.50146484375, 3.9166259765625, 4.331787109375, 4.7469482421875, 5.162109375, 5.5772705078125, 5.992431640625, 6.4075927734375, 6.82275390625, 7.2379150390625, 7.653076171875, 8.0682373046875, 8.4833984375, 8.8985595703125, 9.313720703125, 9.7288818359375, 10.14404296875, 10.5592041015625, 10.974365234375, 11.3895263671875, 11.8046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 13.0, 7.0, 10.0, 9.0, 19.0, 17.0, 44.0, 230.0, 438.0, 89.0, 32.0, 19.0, 11.0, 15.0, 11.0, 9.0, 5.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0028972625732421875, -0.002830296754837036, -0.0027633309364318848, -0.0026963651180267334, -0.002629399299621582, -0.0025624334812164307, -0.0024954676628112793, -0.002428501844406128, -0.0023615360260009766, -0.002294570207595825, -0.002227604389190674, -0.0021606385707855225, -0.002093672752380371, -0.0020267069339752197, -0.0019597411155700684, -0.001892775297164917, -0.0018258094787597656, -0.0017588436603546143, -0.0016918778419494629, -0.0016249120235443115, -0.0015579462051391602, -0.0014909803867340088, -0.0014240145683288574, -0.001357048749923706, -0.0012900829315185547, -0.0012231171131134033, -0.001156151294708252, -0.0010891854763031006, -0.0010222196578979492, -0.0009552538394927979, -0.0008882880210876465, -0.0008213222026824951, -0.0007543563842773438, -0.0006873905658721924, -0.000620424747467041, -0.0005534589290618896, -0.0004864931106567383, -0.0004195272922515869, -0.00035256147384643555, -0.0002855956554412842, -0.0002186298370361328, -0.00015166401863098145, -8.469820022583008e-05, -1.773238182067871e-05, 4.9233436584472656e-05, 0.00011619925498962402, 0.0001831650733947754, 0.00025013089179992676, 0.0003170967102050781, 0.0003840625286102295, 0.00045102834701538086, 0.0005179941654205322, 0.0005849599838256836, 0.000651925802230835, 0.0007188916206359863, 0.0007858574390411377, 0.0008528232574462891, 0.0009197890758514404, 0.0009867548942565918, 0.0010537207126617432, 0.0011206865310668945, 0.001187652349472046, 0.0012546181678771973, 0.0013215839862823486, 0.0013885498046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 16.0, 18.0, 22.0, 22.0, 44.0, 55.0, 101.0, 198.0, 583.0, 2124.0, 12188.0, 116897.0, 868378.0, 40159.0, 5773.0, 1228.0, 340.0, 138.0, 89.0, 52.0, 35.0, 21.0, 18.0, 10.0, 12.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.25, -10.80517578125, -10.3603515625, -9.91552734375, -9.470703125, -9.02587890625, -8.5810546875, -8.13623046875, -7.69140625, -7.24658203125, -6.8017578125, -6.35693359375, -5.912109375, -5.46728515625, -5.0224609375, -4.57763671875, -4.1328125, -3.68798828125, -3.2431640625, -2.79833984375, -2.353515625, -1.90869140625, -1.4638671875, -1.01904296875, -0.57421875, -0.12939453125, 0.3154296875, 0.76025390625, 1.205078125, 1.64990234375, 2.0947265625, 2.53955078125, 2.984375, 3.42919921875, 3.8740234375, 4.31884765625, 4.763671875, 5.20849609375, 5.6533203125, 6.09814453125, 6.54296875, 6.98779296875, 7.4326171875, 7.87744140625, 8.322265625, 8.76708984375, 9.2119140625, 9.65673828125, 10.1015625, 10.54638671875, 10.9912109375, 11.43603515625, 11.880859375, 12.32568359375, 12.7705078125, 13.21533203125, 13.66015625, 14.10498046875, 14.5498046875, 14.99462890625, 15.439453125, 15.88427734375, 16.3291015625, 16.77392578125, 17.21875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 8.0, 7.0, 4.0, 10.0, 11.0, 15.0, 14.0, 25.0, 42.0, 91.0, 164.0, 189.0, 158.0, 90.0, 55.0, 25.0, 15.0, 14.0, 21.0, 7.0, 10.0, 8.0, 11.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5546875, -4.3525390625, -4.150390625, -3.9482421875, -3.74609375, -3.5439453125, -3.341796875, -3.1396484375, -2.9375, -2.7353515625, -2.533203125, -2.3310546875, -2.12890625, -1.9267578125, -1.724609375, -1.5224609375, -1.3203125, -1.1181640625, -0.916015625, -0.7138671875, -0.51171875, -0.3095703125, -0.107421875, 0.0947265625, 0.296875, 0.4990234375, 0.701171875, 0.9033203125, 1.10546875, 1.3076171875, 1.509765625, 1.7119140625, 1.9140625, 2.1162109375, 2.318359375, 2.5205078125, 2.72265625, 2.9248046875, 3.126953125, 3.3291015625, 3.53125, 3.7333984375, 3.935546875, 4.1376953125, 4.33984375, 4.5419921875, 4.744140625, 4.9462890625, 5.1484375, 5.3505859375, 5.552734375, 5.7548828125, 5.95703125, 6.1591796875, 6.361328125, 6.5634765625, 6.765625, 6.9677734375, 7.169921875, 7.3720703125, 7.57421875, 7.7763671875, 7.978515625, 8.1806640625, 8.3828125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 9.0, 17.0, 19.0, 31.0, 59.0, 56.0, 77.0, 109.0, 102.0, 100.0, 108.0, 88.0, 72.0, 53.0, 43.0, 31.0, 12.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.42281341552734, -99.05581665039062, -96.6888198852539, -94.32181549072266, -91.95481872558594, -89.58782196044922, -87.2208251953125, -84.85382080078125, -82.48682403564453, -80.11982727050781, -77.7528305053711, -75.38582611083984, -73.01882934570312, -70.6518325805664, -68.28483581542969, -65.91783142089844, -63.550838470458984, -61.183841705322266, -58.81684112548828, -56.44984436035156, -54.08284378051758, -51.71584701538086, -49.348846435546875, -46.981849670410156, -44.61485290527344, -42.24785614013672, -39.880855560302734, -37.513858795166016, -35.14685821533203, -32.77986145019531, -30.41286277770996, -28.04586410522461, -25.67886734008789, -23.31186866760254, -20.944869995117188, -18.57787322998047, -16.210872650146484, -13.84387493133545, -11.476877212524414, -9.109878540039062, -6.742879867553711, -4.375881195068359, -2.008882999420166, 0.35811519622802734, 2.725113868713379, 5.0921125411987305, 7.459110260009766, 9.826108932495117, 12.193107604980469, 14.56010627746582, 16.927104949951172, 19.29410171508789, 21.661102294921875, 24.028099060058594, 26.395097732543945, 28.762096405029297, 31.12909507751465, 33.49609375, 35.86309051513672, 38.2300910949707, 40.59708786010742, 42.964088439941406, 45.331085205078125, 47.698081970214844, 50.06508255004883]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 8.0, 16.0, 17.0, 16.0, 22.0, 13.0, 25.0, 30.0, 36.0, 43.0, 24.0, 37.0, 46.0, 38.0, 40.0, 36.0, 31.0, 57.0, 36.0, 47.0, 48.0, 43.0, 28.0, 39.0, 23.0, 27.0, 33.0, 24.0, 12.0, 18.0, 15.0, 13.0, 11.0, 7.0, 6.0, 5.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.16310501098633, -41.65765380859375, -40.152198791503906, -38.64674758911133, -37.141292572021484, -35.635841369628906, -34.13038635253906, -32.624935150146484, -31.119483947753906, -29.614030838012695, -28.108577728271484, -26.603126525878906, -25.097673416137695, -23.592220306396484, -22.086767196655273, -20.581314086914062, -19.07586097717285, -17.57040786743164, -16.06495475769043, -14.559502601623535, -13.05405044555664, -11.54859733581543, -10.043144226074219, -8.537692070007324, -7.032238960266113, -5.5267863273620605, -4.021333694458008, -2.515880584716797, -1.0104279518127441, 0.4950246810913086, 2.0004777908325195, 3.505929946899414, 5.011383056640625, 6.516835689544678, 8.02228832244873, 9.527741432189941, 11.033193588256836, 12.538646697998047, 14.044099807739258, 15.549551963806152, 17.055004119873047, 18.560457229614258, 20.06591033935547, 21.571361541748047, 23.076814651489258, 24.58226776123047, 26.08772087097168, 27.59317398071289, 29.0986270904541, 30.604080200195312, 32.10953140258789, 33.614986419677734, 35.12043762207031, 36.625892639160156, 38.131343841552734, 39.63679504394531, 41.142250061035156, 42.647701263427734, 44.15315628051758, 45.658607482910156, 47.1640625, 48.66951370239258, 50.174964904785156, 51.680419921875, 53.18587112426758]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 9.0, 13.0, 18.0, 16.0, 27.0, 36.0, 50.0, 83.0, 115.0, 179.0, 250.0, 472.0, 945.0, 2017.0, 5459.0, 22261.0, 165769.0, 3836547.0, 132034.0, 19604.0, 4888.0, 1740.0, 737.0, 394.0, 218.0, 131.0, 70.0, 53.0, 44.0, 24.0, 18.0, 15.0, 9.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -42.12939453125, -40.7900390625, -39.45068359375, -38.111328125, -36.77197265625, -35.4326171875, -34.09326171875, -32.75390625, -31.41455078125, -30.0751953125, -28.73583984375, -27.396484375, -26.05712890625, -24.7177734375, -23.37841796875, -22.0390625, -20.69970703125, -19.3603515625, -18.02099609375, -16.681640625, -15.34228515625, -14.0029296875, -12.66357421875, -11.32421875, -9.98486328125, -8.6455078125, -7.30615234375, -5.966796875, -4.62744140625, -3.2880859375, -1.94873046875, -0.609375, 0.72998046875, 2.0693359375, 3.40869140625, 4.748046875, 6.08740234375, 7.4267578125, 8.76611328125, 10.10546875, 11.44482421875, 12.7841796875, 14.12353515625, 15.462890625, 16.80224609375, 18.1416015625, 19.48095703125, 20.8203125, 22.15966796875, 23.4990234375, 24.83837890625, 26.177734375, 27.51708984375, 28.8564453125, 30.19580078125, 31.53515625, 32.87451171875, 34.2138671875, 35.55322265625, 36.892578125, 38.23193359375, 39.5712890625, 40.91064453125, 42.25]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 8.0, 10.0, 21.0, 20.0, 57.0, 38.0, 58.0, 68.0, 95.0, 80.0, 89.0, 88.0, 70.0, 77.0, 54.0, 50.0, 35.0, 35.0, 17.0, 10.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-6.8125, -6.63519287109375, -6.4578857421875, -6.28057861328125, -6.103271484375, -5.92596435546875, -5.7486572265625, -5.57135009765625, -5.39404296875, -5.21673583984375, -5.0394287109375, -4.86212158203125, -4.684814453125, -4.50750732421875, -4.3302001953125, -4.15289306640625, -3.9755859375, -3.79827880859375, -3.6209716796875, -3.44366455078125, -3.266357421875, -3.08905029296875, -2.9117431640625, -2.73443603515625, -2.55712890625, -2.37982177734375, -2.2025146484375, -2.02520751953125, -1.847900390625, -1.67059326171875, -1.4932861328125, -1.31597900390625, -1.138671875, -0.96136474609375, -0.7840576171875, -0.60675048828125, -0.429443359375, -0.25213623046875, -0.0748291015625, 0.10247802734375, 0.27978515625, 0.45709228515625, 0.6343994140625, 0.81170654296875, 0.989013671875, 1.16632080078125, 1.3436279296875, 1.52093505859375, 1.6982421875, 1.87554931640625, 2.0528564453125, 2.23016357421875, 2.407470703125, 2.58477783203125, 2.7620849609375, 2.93939208984375, 3.11669921875, 3.29400634765625, 3.4713134765625, 3.64862060546875, 3.825927734375, 4.00323486328125, 4.1805419921875, 4.35784912109375, 4.53515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 9.0, 7.0, 19.0, 23.0, 28.0, 44.0, 49.0, 66.0, 101.0, 152.0, 247.0, 362.0, 548.0, 1011.0, 1913.0, 4138.0, 9401.0, 24428.0, 72848.0, 309075.0, 3246492.0, 391994.0, 84159.0, 27283.0, 10510.0, 4377.0, 2133.0, 1096.0, 650.0, 369.0, 263.0, 161.0, 103.0, 62.0, 43.0, 28.0, 28.0, 17.0, 14.0, 9.0, 8.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.0003662109375, -14.492919921875, -13.9854736328125, -13.47802734375, -12.9705810546875, -12.463134765625, -11.9556884765625, -11.4482421875, -10.9407958984375, -10.433349609375, -9.9259033203125, -9.41845703125, -8.9110107421875, -8.403564453125, -7.8961181640625, -7.388671875, -6.8812255859375, -6.373779296875, -5.8663330078125, -5.35888671875, -4.8514404296875, -4.343994140625, -3.8365478515625, -3.3291015625, -2.8216552734375, -2.314208984375, -1.8067626953125, -1.29931640625, -0.7918701171875, -0.284423828125, 0.2230224609375, 0.73046875, 1.2379150390625, 1.745361328125, 2.2528076171875, 2.76025390625, 3.2677001953125, 3.775146484375, 4.2825927734375, 4.7900390625, 5.2974853515625, 5.804931640625, 6.3123779296875, 6.81982421875, 7.3272705078125, 7.834716796875, 8.3421630859375, 8.849609375, 9.3570556640625, 9.864501953125, 10.3719482421875, 10.87939453125, 11.3868408203125, 11.894287109375, 12.4017333984375, 12.9091796875, 13.4166259765625, 13.924072265625, 14.4315185546875, 14.93896484375, 15.4464111328125, 15.953857421875, 16.4613037109375, 16.96875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 10.0, 9.0, 16.0, 25.0, 35.0, 44.0, 60.0, 111.0, 204.0, 445.0, 1870.0, 660.0, 255.0, 124.0, 54.0, 43.0, 34.0, 24.0, 14.0, 9.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.71746826171875, -8.4583740234375, -8.19927978515625, -7.940185546875, -7.68109130859375, -7.4219970703125, -7.16290283203125, -6.90380859375, -6.64471435546875, -6.3856201171875, -6.12652587890625, -5.867431640625, -5.60833740234375, -5.3492431640625, -5.09014892578125, -4.8310546875, -4.57196044921875, -4.3128662109375, -4.05377197265625, -3.794677734375, -3.53558349609375, -3.2764892578125, -3.01739501953125, -2.75830078125, -2.49920654296875, -2.2401123046875, -1.98101806640625, -1.721923828125, -1.46282958984375, -1.2037353515625, -0.94464111328125, -0.685546875, -0.42645263671875, -0.1673583984375, 0.09173583984375, 0.350830078125, 0.60992431640625, 0.8690185546875, 1.12811279296875, 1.38720703125, 1.64630126953125, 1.9053955078125, 2.16448974609375, 2.423583984375, 2.68267822265625, 2.9417724609375, 3.20086669921875, 3.4599609375, 3.71905517578125, 3.9781494140625, 4.23724365234375, 4.496337890625, 4.75543212890625, 5.0145263671875, 5.27362060546875, 5.53271484375, 5.79180908203125, 6.0509033203125, 6.30999755859375, 6.569091796875, 6.82818603515625, 7.0872802734375, 7.34637451171875, 7.60546875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 8.0, 30.0, 55.0, 79.0, 141.0, 147.0, 185.0, 134.0, 111.0, 51.0, 28.0, 15.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.32022476196289, -61.35478210449219, -59.389339447021484, -57.42389678955078, -55.45845413208008, -53.493011474609375, -51.52757263183594, -49.56212615966797, -47.59668731689453, -45.63124465942383, -43.665802001953125, -41.70035934448242, -39.73491668701172, -37.769474029541016, -35.80403137207031, -33.838592529296875, -31.873146057128906, -29.907703399658203, -27.9422607421875, -25.976818084716797, -24.011375427246094, -22.04593276977539, -20.08049201965332, -18.115049362182617, -16.149606704711914, -14.184164047241211, -12.218721389770508, -10.253279685974121, -8.287837028503418, -6.322394371032715, -4.356952667236328, -2.391510009765625, -0.4260711669921875, 1.5393712520599365, 3.5048136711120605, 5.4702558517456055, 7.435698509216309, 9.401141166687012, 11.366582870483398, 13.332025527954102, 15.297468185424805, 17.262910842895508, 19.22835350036621, 21.19379425048828, 23.159236907958984, 25.124679565429688, 27.09012222290039, 29.055564880371094, 31.021007537841797, 32.9864501953125, 34.9518928527832, 36.917335510253906, 38.88277816772461, 40.84822082519531, 42.81365966796875, 44.77910614013672, 46.744544982910156, 48.70998764038086, 50.67543029785156, 52.640872955322266, 54.60631561279297, 56.57175827026367, 58.537200927734375, 60.50263977050781, 62.46808624267578]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 8.0, 1.0, 8.0, 8.0, 12.0, 6.0, 12.0, 17.0, 14.0, 21.0, 33.0, 25.0, 33.0, 34.0, 49.0, 55.0, 40.0, 49.0, 49.0, 49.0, 47.0, 43.0, 47.0, 45.0, 44.0, 36.0, 32.0, 28.0, 27.0, 27.0, 23.0, 15.0, 19.0, 17.0, 7.0, 9.0, 5.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.60849380493164, -22.891918182373047, -22.17534065246582, -21.458763122558594, -20.7421875, -20.025611877441406, -19.30903434753418, -18.592456817626953, -17.87588119506836, -17.159305572509766, -16.44272804260254, -15.726151466369629, -15.009574890136719, -14.292998313903809, -13.576421737670898, -12.859845161437988, -12.143268585205078, -11.426692008972168, -10.710115432739258, -9.993538856506348, -9.276962280273438, -8.560385704040527, -7.843809127807617, -7.127232551574707, -6.410655975341797, -5.694079399108887, -4.977502822875977, -4.260926246643066, -3.5443496704101562, -2.827773094177246, -2.111196517944336, -1.3946199417114258, -0.6780414581298828, 0.038535118103027344, 0.7551116943359375, 1.4716882705688477, 2.188264846801758, 2.904841423034668, 3.621417999267578, 4.337994575500488, 5.054571151733398, 5.771147727966309, 6.487724304199219, 7.204300880432129, 7.920877456665039, 8.63745403289795, 9.35403060913086, 10.07060718536377, 10.78718376159668, 11.50376033782959, 12.2203369140625, 12.93691349029541, 13.65349006652832, 14.37006664276123, 15.08664321899414, 15.80321979522705, 16.51979637145996, 17.236373901367188, 17.95294952392578, 18.669525146484375, 19.3861026763916, 20.102680206298828, 20.819255828857422, 21.535831451416016, 22.252408981323242]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 10.0, 10.0, 18.0, 38.0, 46.0, 78.0, 132.0, 219.0, 398.0, 837.0, 2102.0, 7579.0, 41339.0, 284588.0, 599753.0, 90906.0, 14639.0, 3416.0, 1172.0, 564.0, 283.0, 157.0, 112.0, 43.0, 43.0, 25.0, 12.0, 11.0, 7.0, 4.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.0, -25.10986328125, -24.2197265625, -23.32958984375, -22.439453125, -21.54931640625, -20.6591796875, -19.76904296875, -18.87890625, -17.98876953125, -17.0986328125, -16.20849609375, -15.318359375, -14.42822265625, -13.5380859375, -12.64794921875, -11.7578125, -10.86767578125, -9.9775390625, -9.08740234375, -8.197265625, -7.30712890625, -6.4169921875, -5.52685546875, -4.63671875, -3.74658203125, -2.8564453125, -1.96630859375, -1.076171875, -0.18603515625, 0.7041015625, 1.59423828125, 2.484375, 3.37451171875, 4.2646484375, 5.15478515625, 6.044921875, 6.93505859375, 7.8251953125, 8.71533203125, 9.60546875, 10.49560546875, 11.3857421875, 12.27587890625, 13.166015625, 14.05615234375, 14.9462890625, 15.83642578125, 16.7265625, 17.61669921875, 18.5068359375, 19.39697265625, 20.287109375, 21.17724609375, 22.0673828125, 22.95751953125, 23.84765625, 24.73779296875, 25.6279296875, 26.51806640625, 27.408203125, 28.29833984375, 29.1884765625, 30.07861328125, 30.96875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 11.0, 18.0, 15.0, 42.0, 41.0, 46.0, 77.0, 68.0, 79.0, 71.0, 95.0, 93.0, 71.0, 76.0, 56.0, 35.0, 33.0, 22.0, 14.0, 9.0, 11.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.9375, -6.7550048828125, -6.572509765625, -6.3900146484375, -6.20751953125, -6.0250244140625, -5.842529296875, -5.6600341796875, -5.4775390625, -5.2950439453125, -5.112548828125, -4.9300537109375, -4.74755859375, -4.5650634765625, -4.382568359375, -4.2000732421875, -4.017578125, -3.8350830078125, -3.652587890625, -3.4700927734375, -3.28759765625, -3.1051025390625, -2.922607421875, -2.7401123046875, -2.5576171875, -2.3751220703125, -2.192626953125, -2.0101318359375, -1.82763671875, -1.6451416015625, -1.462646484375, -1.2801513671875, -1.09765625, -0.9151611328125, -0.732666015625, -0.5501708984375, -0.36767578125, -0.1851806640625, -0.002685546875, 0.1798095703125, 0.3623046875, 0.5447998046875, 0.727294921875, 0.9097900390625, 1.09228515625, 1.2747802734375, 1.457275390625, 1.6397705078125, 1.822265625, 2.0047607421875, 2.187255859375, 2.3697509765625, 2.55224609375, 2.7347412109375, 2.917236328125, 3.0997314453125, 3.2822265625, 3.4647216796875, 3.647216796875, 3.8297119140625, 4.01220703125, 4.1947021484375, 4.377197265625, 4.5596923828125, 4.7421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 9.0, 12.0, 12.0, 17.0, 38.0, 37.0, 62.0, 64.0, 98.0, 137.0, 192.0, 265.0, 405.0, 619.0, 1089.0, 2266.0, 5677.0, 16593.0, 55103.0, 198683.0, 516397.0, 175851.0, 49693.0, 14992.0, 5167.0, 2164.0, 1034.0, 577.0, 413.0, 273.0, 164.0, 108.0, 97.0, 60.0, 45.0, 44.0, 25.0, 25.0, 13.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.3798828125, -11.986328125, -11.5927734375, -11.19921875, -10.8056640625, -10.412109375, -10.0185546875, -9.625, -9.2314453125, -8.837890625, -8.4443359375, -8.05078125, -7.6572265625, -7.263671875, -6.8701171875, -6.4765625, -6.0830078125, -5.689453125, -5.2958984375, -4.90234375, -4.5087890625, -4.115234375, -3.7216796875, -3.328125, -2.9345703125, -2.541015625, -2.1474609375, -1.75390625, -1.3603515625, -0.966796875, -0.5732421875, -0.1796875, 0.2138671875, 0.607421875, 1.0009765625, 1.39453125, 1.7880859375, 2.181640625, 2.5751953125, 2.96875, 3.3623046875, 3.755859375, 4.1494140625, 4.54296875, 4.9365234375, 5.330078125, 5.7236328125, 6.1171875, 6.5107421875, 6.904296875, 7.2978515625, 7.69140625, 8.0849609375, 8.478515625, 8.8720703125, 9.265625, 9.6591796875, 10.052734375, 10.4462890625, 10.83984375, 11.2333984375, 11.626953125, 12.0205078125, 12.4140625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 2.0, 6.0, 6.0, 10.0, 14.0, 10.0, 7.0, 15.0, 17.0, 27.0, 23.0, 14.0, 35.0, 30.0, 31.0, 41.0, 37.0, 45.0, 45.0, 32.0, 38.0, 39.0, 36.0, 49.0, 42.0, 34.0, 44.0, 35.0, 37.0, 29.0, 21.0, 20.0, 22.0, 19.0, 21.0, 14.0, 15.0, 14.0, 10.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5546875, -10.1959228515625, -9.837158203125, -9.4783935546875, -9.11962890625, -8.7608642578125, -8.402099609375, -8.0433349609375, -7.6845703125, -7.3258056640625, -6.967041015625, -6.6082763671875, -6.24951171875, -5.8907470703125, -5.531982421875, -5.1732177734375, -4.814453125, -4.4556884765625, -4.096923828125, -3.7381591796875, -3.37939453125, -3.0206298828125, -2.661865234375, -2.3031005859375, -1.9443359375, -1.5855712890625, -1.226806640625, -0.8680419921875, -0.50927734375, -0.1505126953125, 0.208251953125, 0.5670166015625, 0.92578125, 1.2845458984375, 1.643310546875, 2.0020751953125, 2.36083984375, 2.7196044921875, 3.078369140625, 3.4371337890625, 3.7958984375, 4.1546630859375, 4.513427734375, 4.8721923828125, 5.23095703125, 5.5897216796875, 5.948486328125, 6.3072509765625, 6.666015625, 7.0247802734375, 7.383544921875, 7.7423095703125, 8.10107421875, 8.4598388671875, 8.818603515625, 9.1773681640625, 9.5361328125, 9.8948974609375, 10.253662109375, 10.6124267578125, 10.97119140625, 11.3299560546875, 11.688720703125, 12.0474853515625, 12.40625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 12.0, 16.0, 14.0, 38.0, 61.0, 131.0, 260.0, 595.0, 1282.0, 3521.0, 11154.0, 43286.0, 203604.0, 604866.0, 136310.0, 30314.0, 8234.0, 2805.0, 1080.0, 464.0, 233.0, 124.0, 57.0, 35.0, 26.0, 14.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.5352783203125, -4.312744140625, -4.0902099609375, -3.86767578125, -3.6451416015625, -3.422607421875, -3.2000732421875, -2.9775390625, -2.7550048828125, -2.532470703125, -2.3099365234375, -2.08740234375, -1.8648681640625, -1.642333984375, -1.4197998046875, -1.197265625, -0.9747314453125, -0.752197265625, -0.5296630859375, -0.30712890625, -0.0845947265625, 0.137939453125, 0.3604736328125, 0.5830078125, 0.8055419921875, 1.028076171875, 1.2506103515625, 1.47314453125, 1.6956787109375, 1.918212890625, 2.1407470703125, 2.36328125, 2.5858154296875, 2.808349609375, 3.0308837890625, 3.25341796875, 3.4759521484375, 3.698486328125, 3.9210205078125, 4.1435546875, 4.3660888671875, 4.588623046875, 4.8111572265625, 5.03369140625, 5.2562255859375, 5.478759765625, 5.7012939453125, 5.923828125, 6.1463623046875, 6.368896484375, 6.5914306640625, 6.81396484375, 7.0364990234375, 7.259033203125, 7.4815673828125, 7.7041015625, 7.9266357421875, 8.149169921875, 8.3717041015625, 8.59423828125, 8.8167724609375, 9.039306640625, 9.2618408203125, 9.484375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 8.0, 5.0, 10.0, 11.0, 11.0, 14.0, 23.0, 34.0, 30.0, 50.0, 50.0, 91.0, 157.0, 180.0, 86.0, 48.0, 35.0, 41.0, 30.0, 22.0, 21.0, 12.0, 6.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012664794921875, -0.0012303143739700317, -0.0011941492557525635, -0.0011579841375350952, -0.001121819019317627, -0.0010856539011001587, -0.0010494887828826904, -0.0010133236646652222, -0.000977158546447754, -0.0009409934282302856, -0.0009048283100128174, -0.0008686631917953491, -0.0008324980735778809, -0.0007963329553604126, -0.0007601678371429443, -0.0007240027189254761, -0.0006878376007080078, -0.0006516724824905396, -0.0006155073642730713, -0.000579342246055603, -0.0005431771278381348, -0.0005070120096206665, -0.00047084689140319824, -0.00043468177318573, -0.0003985166549682617, -0.00036235153675079346, -0.0003261864185333252, -0.00029002130031585693, -0.00025385618209838867, -0.0002176910638809204, -0.00018152594566345215, -0.0001453608274459839, -0.00010919570922851562, -7.303059101104736e-05, -3.68654727935791e-05, -7.003545761108398e-07, 3.546476364135742e-05, 7.162988185882568e-05, 0.00010779500007629395, 0.0001439601182937622, 0.00018012523651123047, 0.00021629035472869873, 0.000252455472946167, 0.00028862059116363525, 0.0003247857093811035, 0.0003609508275985718, 0.00039711594581604004, 0.0004332810640335083, 0.00046944618225097656, 0.0005056113004684448, 0.0005417764186859131, 0.0005779415369033813, 0.0006141066551208496, 0.0006502717733383179, 0.0006864368915557861, 0.0007226020097732544, 0.0007587671279907227, 0.0007949322462081909, 0.0008310973644256592, 0.0008672624826431274, 0.0009034276008605957, 0.000939592719078064, 0.0009757578372955322, 0.0010119229555130005, 0.0010480880737304688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 12.0, 9.0, 28.0, 38.0, 55.0, 96.0, 207.0, 359.0, 763.0, 2211.0, 8590.0, 49787.0, 466550.0, 458577.0, 49237.0, 8375.0, 2080.0, 769.0, 350.0, 196.0, 86.0, 64.0, 41.0, 31.0, 19.0, 8.0, 2.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.44091796875, -8.1162109375, -7.79150390625, -7.466796875, -7.14208984375, -6.8173828125, -6.49267578125, -6.16796875, -5.84326171875, -5.5185546875, -5.19384765625, -4.869140625, -4.54443359375, -4.2197265625, -3.89501953125, -3.5703125, -3.24560546875, -2.9208984375, -2.59619140625, -2.271484375, -1.94677734375, -1.6220703125, -1.29736328125, -0.97265625, -0.64794921875, -0.3232421875, 0.00146484375, 0.326171875, 0.65087890625, 0.9755859375, 1.30029296875, 1.625, 1.94970703125, 2.2744140625, 2.59912109375, 2.923828125, 3.24853515625, 3.5732421875, 3.89794921875, 4.22265625, 4.54736328125, 4.8720703125, 5.19677734375, 5.521484375, 5.84619140625, 6.1708984375, 6.49560546875, 6.8203125, 7.14501953125, 7.4697265625, 7.79443359375, 8.119140625, 8.44384765625, 8.7685546875, 9.09326171875, 9.41796875, 9.74267578125, 10.0673828125, 10.39208984375, 10.716796875, 11.04150390625, 11.3662109375, 11.69091796875, 12.015625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 11.0, 6.0, 11.0, 19.0, 36.0, 64.0, 60.0, 105.0, 105.0, 134.0, 131.0, 102.0, 69.0, 44.0, 25.0, 24.0, 24.0, 15.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.421875, -9.17059326171875, -8.9193115234375, -8.66802978515625, -8.416748046875, -8.16546630859375, -7.9141845703125, -7.66290283203125, -7.41162109375, -7.16033935546875, -6.9090576171875, -6.65777587890625, -6.406494140625, -6.15521240234375, -5.9039306640625, -5.65264892578125, -5.4013671875, -5.15008544921875, -4.8988037109375, -4.64752197265625, -4.396240234375, -4.14495849609375, -3.8936767578125, -3.64239501953125, -3.39111328125, -3.13983154296875, -2.8885498046875, -2.63726806640625, -2.385986328125, -2.13470458984375, -1.8834228515625, -1.63214111328125, -1.380859375, -1.12957763671875, -0.8782958984375, -0.62701416015625, -0.375732421875, -0.12445068359375, 0.1268310546875, 0.37811279296875, 0.62939453125, 0.88067626953125, 1.1319580078125, 1.38323974609375, 1.634521484375, 1.88580322265625, 2.1370849609375, 2.38836669921875, 2.6396484375, 2.89093017578125, 3.1422119140625, 3.39349365234375, 3.644775390625, 3.89605712890625, 4.1473388671875, 4.39862060546875, 4.64990234375, 4.90118408203125, 5.1524658203125, 5.40374755859375, 5.655029296875, 5.90631103515625, 6.1575927734375, 6.40887451171875, 6.66015625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 15.0, 21.0, 26.0, 44.0, 72.0, 92.0, 131.0, 104.0, 137.0, 81.0, 79.0, 68.0, 43.0, 34.0, 21.0, 10.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.6036148071289, -63.78229904174805, -60.96098327636719, -58.13966751098633, -55.31835174560547, -52.49703598022461, -49.67572021484375, -46.85440444946289, -44.03308868408203, -41.21177291870117, -38.39045715332031, -35.56914138793945, -32.747825622558594, -29.926509857177734, -27.105194091796875, -24.283878326416016, -21.462562561035156, -18.641246795654297, -15.819931030273438, -12.998615264892578, -10.177299499511719, -7.355983734130859, -4.53466796875, -1.7133522033691406, 1.1079635620117188, 3.929279327392578, 6.7505950927734375, 9.571910858154297, 12.393226623535156, 15.214542388916016, 18.035858154296875, 20.857173919677734, 23.678497314453125, 26.499813079833984, 29.321128845214844, 32.1424446105957, 34.96376037597656, 37.78507614135742, 40.60639190673828, 43.42770767211914, 46.2490234375, 49.07033920288086, 51.89165496826172, 54.71297073364258, 57.53428649902344, 60.3556022644043, 63.176918029785156, 65.99822998046875, 68.81954956054688, 71.640869140625, 74.4621810913086, 77.28349304199219, 80.10481262207031, 82.92613220214844, 85.74744415283203, 88.56875610351562, 91.39007568359375, 94.21139526367188, 97.03270721435547, 99.85401916503906, 102.67533874511719, 105.49665832519531, 108.3179702758789, 111.1392822265625, 113.96060180664062]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 7.0, 4.0, 9.0, 6.0, 14.0, 16.0, 12.0, 11.0, 17.0, 10.0, 22.0, 31.0, 33.0, 24.0, 48.0, 28.0, 33.0, 44.0, 40.0, 43.0, 39.0, 41.0, 47.0, 41.0, 46.0, 37.0, 38.0, 29.0, 15.0, 30.0, 34.0, 23.0, 22.0, 20.0, 18.0, 20.0, 13.0, 9.0, 9.0, 5.0, 2.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.75072479248047, -56.954139709472656, -55.157554626464844, -53.36096954345703, -51.56438446044922, -49.767799377441406, -47.97121047973633, -46.174625396728516, -44.3780403137207, -42.58145523071289, -40.78487014770508, -38.988285064697266, -37.19169616699219, -35.395111083984375, -33.59852600097656, -31.80194091796875, -30.005355834960938, -28.208770751953125, -26.412185668945312, -24.615598678588867, -22.819013595581055, -21.022428512573242, -19.225841522216797, -17.429256439208984, -15.632671356201172, -13.83608627319336, -12.03950023651123, -10.242914199829102, -8.446329116821289, -6.649744033813477, -4.853157997131348, -3.0565719604492188, -1.2599906921386719, 0.5365948677062988, 2.3331804275512695, 4.12976598739624, 5.926351547241211, 7.722936630249023, 9.519522666931152, 11.316108703613281, 13.112693786621094, 14.909278869628906, 16.70586395263672, 18.502450942993164, 20.299036026000977, 22.09562110900879, 23.892208099365234, 25.688793182373047, 27.48537826538086, 29.281963348388672, 31.078548431396484, 32.8751335144043, 34.671722412109375, 36.46830749511719, 38.264892578125, 40.06147766113281, 41.858062744140625, 43.65464782714844, 45.45123291015625, 47.24781799316406, 49.044403076171875, 50.84098815917969, 52.637577056884766, 54.43416213989258, 56.23074722290039]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 7.0, 14.0, 17.0, 24.0, 33.0, 65.0, 98.0, 128.0, 201.0, 347.0, 582.0, 1048.0, 2467.0, 6951.0, 29375.0, 232201.0, 3663494.0, 218087.0, 27984.0, 6817.0, 2268.0, 872.0, 457.0, 239.0, 166.0, 110.0, 71.0, 36.0, 25.0, 24.0, 13.0, 10.0, 11.0, 11.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -37.474609375, -36.35546875, -35.236328125, -34.1171875, -32.998046875, -31.87890625, -30.759765625, -29.640625, -28.521484375, -27.40234375, -26.283203125, -25.1640625, -24.044921875, -22.92578125, -21.806640625, -20.6875, -19.568359375, -18.44921875, -17.330078125, -16.2109375, -15.091796875, -13.97265625, -12.853515625, -11.734375, -10.615234375, -9.49609375, -8.376953125, -7.2578125, -6.138671875, -5.01953125, -3.900390625, -2.78125, -1.662109375, -0.54296875, 0.576171875, 1.6953125, 2.814453125, 3.93359375, 5.052734375, 6.171875, 7.291015625, 8.41015625, 9.529296875, 10.6484375, 11.767578125, 12.88671875, 14.005859375, 15.125, 16.244140625, 17.36328125, 18.482421875, 19.6015625, 20.720703125, 21.83984375, 22.958984375, 24.078125, 25.197265625, 26.31640625, 27.435546875, 28.5546875, 29.673828125, 30.79296875, 31.912109375, 33.03125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 11.0, 15.0, 25.0, 30.0, 33.0, 48.0, 63.0, 73.0, 69.0, 94.0, 85.0, 72.0, 87.0, 73.0, 53.0, 44.0, 34.0, 30.0, 21.0, 11.0, 7.0, 9.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.91796875, -6.7374267578125, -6.556884765625, -6.3763427734375, -6.19580078125, -6.0152587890625, -5.834716796875, -5.6541748046875, -5.4736328125, -5.2930908203125, -5.112548828125, -4.9320068359375, -4.75146484375, -4.5709228515625, -4.390380859375, -4.2098388671875, -4.029296875, -3.8487548828125, -3.668212890625, -3.4876708984375, -3.30712890625, -3.1265869140625, -2.946044921875, -2.7655029296875, -2.5849609375, -2.4044189453125, -2.223876953125, -2.0433349609375, -1.86279296875, -1.6822509765625, -1.501708984375, -1.3211669921875, -1.140625, -0.9600830078125, -0.779541015625, -0.5989990234375, -0.41845703125, -0.2379150390625, -0.057373046875, 0.1231689453125, 0.3037109375, 0.4842529296875, 0.664794921875, 0.8453369140625, 1.02587890625, 1.2064208984375, 1.386962890625, 1.5675048828125, 1.748046875, 1.9285888671875, 2.109130859375, 2.2896728515625, 2.47021484375, 2.6507568359375, 2.831298828125, 3.0118408203125, 3.1923828125, 3.3729248046875, 3.553466796875, 3.7340087890625, 3.91455078125, 4.0950927734375, 4.275634765625, 4.4561767578125, 4.63671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 5.0, 26.0, 22.0, 16.0, 39.0, 47.0, 60.0, 73.0, 122.0, 169.0, 230.0, 391.0, 615.0, 1196.0, 2573.0, 6634.0, 20582.0, 82195.0, 474986.0, 3162980.0, 347180.0, 66353.0, 17027.0, 5720.0, 2250.0, 1059.0, 588.0, 352.0, 209.0, 172.0, 105.0, 86.0, 64.0, 36.0, 31.0, 25.0, 20.0, 11.0, 8.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.375, -17.790283203125, -17.20556640625, -16.620849609375, -16.0361328125, -15.451416015625, -14.86669921875, -14.281982421875, -13.697265625, -13.112548828125, -12.52783203125, -11.943115234375, -11.3583984375, -10.773681640625, -10.18896484375, -9.604248046875, -9.01953125, -8.434814453125, -7.85009765625, -7.265380859375, -6.6806640625, -6.095947265625, -5.51123046875, -4.926513671875, -4.341796875, -3.757080078125, -3.17236328125, -2.587646484375, -2.0029296875, -1.418212890625, -0.83349609375, -0.248779296875, 0.3359375, 0.920654296875, 1.50537109375, 2.090087890625, 2.6748046875, 3.259521484375, 3.84423828125, 4.428955078125, 5.013671875, 5.598388671875, 6.18310546875, 6.767822265625, 7.3525390625, 7.937255859375, 8.52197265625, 9.106689453125, 9.69140625, 10.276123046875, 10.86083984375, 11.445556640625, 12.0302734375, 12.614990234375, 13.19970703125, 13.784423828125, 14.369140625, 14.953857421875, 15.53857421875, 16.123291015625, 16.7080078125, 17.292724609375, 17.87744140625, 18.462158203125, 19.046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 7.0, 15.0, 28.0, 56.0, 72.0, 140.0, 329.0, 1038.0, 1578.0, 406.0, 197.0, 111.0, 35.0, 27.0, 21.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.15625, -17.7147216796875, -17.273193359375, -16.8316650390625, -16.39013671875, -15.9486083984375, -15.507080078125, -15.0655517578125, -14.6240234375, -14.1824951171875, -13.740966796875, -13.2994384765625, -12.85791015625, -12.4163818359375, -11.974853515625, -11.5333251953125, -11.091796875, -10.6502685546875, -10.208740234375, -9.7672119140625, -9.32568359375, -8.8841552734375, -8.442626953125, -8.0010986328125, -7.5595703125, -7.1180419921875, -6.676513671875, -6.2349853515625, -5.79345703125, -5.3519287109375, -4.910400390625, -4.4688720703125, -4.02734375, -3.5858154296875, -3.144287109375, -2.7027587890625, -2.26123046875, -1.8197021484375, -1.378173828125, -0.9366455078125, -0.4951171875, -0.0535888671875, 0.387939453125, 0.8294677734375, 1.27099609375, 1.7125244140625, 2.154052734375, 2.5955810546875, 3.037109375, 3.4786376953125, 3.920166015625, 4.3616943359375, 4.80322265625, 5.2447509765625, 5.686279296875, 6.1278076171875, 6.5693359375, 7.0108642578125, 7.452392578125, 7.8939208984375, 8.33544921875, 8.7769775390625, 9.218505859375, 9.6600341796875, 10.1015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 10.0, 13.0, 18.0, 35.0, 53.0, 59.0, 83.0, 96.0, 119.0, 120.0, 83.0, 103.0, 66.0, 40.0, 39.0, 20.0, 16.0, 4.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-75.74119567871094, -74.01606750488281, -72.29093933105469, -70.56581115722656, -68.84068298339844, -67.11555480957031, -65.39042663574219, -63.66529846191406, -61.94017028808594, -60.21504211425781, -58.48991394042969, -56.76478576660156, -55.03965759277344, -53.31452941894531, -51.58940124511719, -49.86427307128906, -48.13914489746094, -46.41401672363281, -44.68888854980469, -42.96376037597656, -41.23863220214844, -39.51350402832031, -37.78837585449219, -36.06324768066406, -34.3381233215332, -32.61299514770508, -30.887866973876953, -29.162738800048828, -27.437610626220703, -25.712482452392578, -23.987354278564453, -22.262226104736328, -20.537097930908203, -18.811969757080078, -17.086841583251953, -15.361713409423828, -13.636585235595703, -11.911458015441895, -10.18632984161377, -8.461201667785645, -6.7360734939575195, -5.0109453201293945, -3.2858173847198486, -1.5606894493103027, 0.16443872451782227, 1.889566421508789, 3.614694595336914, 5.339822769165039, 7.064950942993164, 8.790079116821289, 10.515207290649414, 12.240335464477539, 13.965463638305664, 15.690590858459473, 17.41571807861328, 19.140846252441406, 20.86597442626953, 22.591102600097656, 24.31623077392578, 26.041358947753906, 27.76648712158203, 29.491615295410156, 31.21674346923828, 32.941871643066406, 34.66699981689453]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 9.0, 9.0, 14.0, 23.0, 24.0, 26.0, 29.0, 30.0, 37.0, 55.0, 43.0, 45.0, 54.0, 53.0, 48.0, 68.0, 61.0, 55.0, 51.0, 46.0, 38.0, 41.0, 25.0, 25.0, 16.0, 22.0, 11.0, 11.0, 3.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.413959503173828, -30.300485610961914, -29.187009811401367, -28.073535919189453, -26.960060119628906, -25.846586227416992, -24.733112335205078, -23.61963653564453, -22.506160736083984, -21.39268684387207, -20.279211044311523, -19.16573715209961, -18.052261352539062, -16.93878746032715, -15.825312614440918, -14.711837768554688, -13.598363876342773, -12.484889030456543, -11.371414184570312, -10.257940292358398, -9.144464492797852, -8.030990600585938, -6.917515754699707, -5.804040908813477, -4.690566062927246, -3.5770912170410156, -2.4636166095733643, -1.350142002105713, -0.23666715621948242, 0.876807689666748, 1.9902820587158203, 3.103756904602051, 4.217231750488281, 5.330706596374512, 6.444181442260742, 7.5576558113098145, 8.671131134033203, 9.784605026245117, 10.898079872131348, 12.011554718017578, 13.125029563903809, 14.238504409790039, 15.35197925567627, 16.4654541015625, 17.578927993774414, 18.69240379333496, 19.805877685546875, 20.919353485107422, 22.032827377319336, 23.14630126953125, 24.259777069091797, 25.37325096130371, 26.486726760864258, 27.600200653076172, 28.71367645263672, 29.827150344848633, 30.940624237060547, 32.054100036621094, 33.167572021484375, 34.28104782104492, 35.39452362060547, 36.507999420166016, 37.6214714050293, 38.734947204589844, 39.84842300415039]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 9.0, 5.0, 10.0, 18.0, 35.0, 46.0, 78.0, 103.0, 191.0, 320.0, 650.0, 1337.0, 3273.0, 11879.0, 60260.0, 375295.0, 486341.0, 85341.0, 15908.0, 4209.0, 1593.0, 686.0, 375.0, 221.0, 123.0, 71.0, 50.0, 41.0, 28.0, 15.0, 9.0, 7.0, 4.0, 6.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.46875, -24.69921875, -23.9296875, -23.16015625, -22.390625, -21.62109375, -20.8515625, -20.08203125, -19.3125, -18.54296875, -17.7734375, -17.00390625, -16.234375, -15.46484375, -14.6953125, -13.92578125, -13.15625, -12.38671875, -11.6171875, -10.84765625, -10.078125, -9.30859375, -8.5390625, -7.76953125, -7.0, -6.23046875, -5.4609375, -4.69140625, -3.921875, -3.15234375, -2.3828125, -1.61328125, -0.84375, -0.07421875, 0.6953125, 1.46484375, 2.234375, 3.00390625, 3.7734375, 4.54296875, 5.3125, 6.08203125, 6.8515625, 7.62109375, 8.390625, 9.16015625, 9.9296875, 10.69921875, 11.46875, 12.23828125, 13.0078125, 13.77734375, 14.546875, 15.31640625, 16.0859375, 16.85546875, 17.625, 18.39453125, 19.1640625, 19.93359375, 20.703125, 21.47265625, 22.2421875, 23.01171875, 23.78125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 13.0, 19.0, 24.0, 37.0, 53.0, 55.0, 79.0, 77.0, 88.0, 98.0, 98.0, 85.0, 64.0, 52.0, 42.0, 27.0, 23.0, 27.0, 11.0, 11.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.32421875, -7.12286376953125, -6.9215087890625, -6.72015380859375, -6.518798828125, -6.31744384765625, -6.1160888671875, -5.91473388671875, -5.71337890625, -5.51202392578125, -5.3106689453125, -5.10931396484375, -4.907958984375, -4.70660400390625, -4.5052490234375, -4.30389404296875, -4.1025390625, -3.90118408203125, -3.6998291015625, -3.49847412109375, -3.297119140625, -3.09576416015625, -2.8944091796875, -2.69305419921875, -2.49169921875, -2.29034423828125, -2.0889892578125, -1.88763427734375, -1.686279296875, -1.48492431640625, -1.2835693359375, -1.08221435546875, -0.880859375, -0.67950439453125, -0.4781494140625, -0.27679443359375, -0.075439453125, 0.12591552734375, 0.3272705078125, 0.52862548828125, 0.72998046875, 0.93133544921875, 1.1326904296875, 1.33404541015625, 1.535400390625, 1.73675537109375, 1.9381103515625, 2.13946533203125, 2.3408203125, 2.54217529296875, 2.7435302734375, 2.94488525390625, 3.146240234375, 3.34759521484375, 3.5489501953125, 3.75030517578125, 3.95166015625, 4.15301513671875, 4.3543701171875, 4.55572509765625, 4.757080078125, 4.95843505859375, 5.1597900390625, 5.36114501953125, 5.5625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 12.0, 14.0, 25.0, 33.0, 45.0, 54.0, 63.0, 108.0, 136.0, 169.0, 234.0, 326.0, 429.0, 756.0, 1234.0, 2422.0, 5423.0, 12906.0, 36077.0, 122865.0, 419089.0, 315002.0, 84811.0, 26854.0, 9968.0, 4231.0, 2045.0, 1028.0, 669.0, 421.0, 305.0, 220.0, 158.0, 107.0, 72.0, 61.0, 45.0, 28.0, 29.0, 21.0, 13.0, 10.0, 8.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-12.1875, -11.804931640625, -11.42236328125, -11.039794921875, -10.6572265625, -10.274658203125, -9.89208984375, -9.509521484375, -9.126953125, -8.744384765625, -8.36181640625, -7.979248046875, -7.5966796875, -7.214111328125, -6.83154296875, -6.448974609375, -6.06640625, -5.683837890625, -5.30126953125, -4.918701171875, -4.5361328125, -4.153564453125, -3.77099609375, -3.388427734375, -3.005859375, -2.623291015625, -2.24072265625, -1.858154296875, -1.4755859375, -1.093017578125, -0.71044921875, -0.327880859375, 0.0546875, 0.437255859375, 0.81982421875, 1.202392578125, 1.5849609375, 1.967529296875, 2.35009765625, 2.732666015625, 3.115234375, 3.497802734375, 3.88037109375, 4.262939453125, 4.6455078125, 5.028076171875, 5.41064453125, 5.793212890625, 6.17578125, 6.558349609375, 6.94091796875, 7.323486328125, 7.7060546875, 8.088623046875, 8.47119140625, 8.853759765625, 9.236328125, 9.618896484375, 10.00146484375, 10.384033203125, 10.7666015625, 11.149169921875, 11.53173828125, 11.914306640625, 12.296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 8.0, 5.0, 4.0, 11.0, 15.0, 15.0, 11.0, 26.0, 25.0, 30.0, 34.0, 38.0, 34.0, 36.0, 42.0, 41.0, 49.0, 58.0, 46.0, 48.0, 45.0, 41.0, 43.0, 34.0, 41.0, 36.0, 23.0, 17.0, 23.0, 31.0, 13.0, 16.0, 7.0, 9.0, 6.0, 5.0, 2.0, 7.0, 1.0, 6.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.2421875, -13.8021240234375, -13.362060546875, -12.9219970703125, -12.48193359375, -12.0418701171875, -11.601806640625, -11.1617431640625, -10.7216796875, -10.2816162109375, -9.841552734375, -9.4014892578125, -8.96142578125, -8.5213623046875, -8.081298828125, -7.6412353515625, -7.201171875, -6.7611083984375, -6.321044921875, -5.8809814453125, -5.44091796875, -5.0008544921875, -4.560791015625, -4.1207275390625, -3.6806640625, -3.2406005859375, -2.800537109375, -2.3604736328125, -1.92041015625, -1.4803466796875, -1.040283203125, -0.6002197265625, -0.16015625, 0.2799072265625, 0.719970703125, 1.1600341796875, 1.60009765625, 2.0401611328125, 2.480224609375, 2.9202880859375, 3.3603515625, 3.8004150390625, 4.240478515625, 4.6805419921875, 5.12060546875, 5.5606689453125, 6.000732421875, 6.4407958984375, 6.880859375, 7.3209228515625, 7.760986328125, 8.2010498046875, 8.64111328125, 9.0811767578125, 9.521240234375, 9.9613037109375, 10.4013671875, 10.8414306640625, 11.281494140625, 11.7215576171875, 12.16162109375, 12.6016845703125, 13.041748046875, 13.4818115234375, 13.921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 4.0, 7.0, 8.0, 6.0, 16.0, 27.0, 28.0, 45.0, 74.0, 111.0, 142.0, 269.0, 477.0, 823.0, 1545.0, 3048.0, 7730.0, 22716.0, 85248.0, 321868.0, 422259.0, 130065.0, 33241.0, 10406.0, 4075.0, 1921.0, 1004.0, 536.0, 302.0, 178.0, 127.0, 66.0, 49.0, 30.0, 29.0, 14.0, 9.0, 6.0, 4.0, 14.0, 4.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-6.015625, -5.8394775390625, -5.663330078125, -5.4871826171875, -5.31103515625, -5.1348876953125, -4.958740234375, -4.7825927734375, -4.6064453125, -4.4302978515625, -4.254150390625, -4.0780029296875, -3.90185546875, -3.7257080078125, -3.549560546875, -3.3734130859375, -3.197265625, -3.0211181640625, -2.844970703125, -2.6688232421875, -2.49267578125, -2.3165283203125, -2.140380859375, -1.9642333984375, -1.7880859375, -1.6119384765625, -1.435791015625, -1.2596435546875, -1.08349609375, -0.9073486328125, -0.731201171875, -0.5550537109375, -0.37890625, -0.2027587890625, -0.026611328125, 0.1495361328125, 0.32568359375, 0.5018310546875, 0.677978515625, 0.8541259765625, 1.0302734375, 1.2064208984375, 1.382568359375, 1.5587158203125, 1.73486328125, 1.9110107421875, 2.087158203125, 2.2633056640625, 2.439453125, 2.6156005859375, 2.791748046875, 2.9678955078125, 3.14404296875, 3.3201904296875, 3.496337890625, 3.6724853515625, 3.8486328125, 4.0247802734375, 4.200927734375, 4.3770751953125, 4.55322265625, 4.7293701171875, 4.905517578125, 5.0816650390625, 5.2578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 10.0, 6.0, 9.0, 5.0, 12.0, 20.0, 26.0, 28.0, 35.0, 38.0, 48.0, 59.0, 63.0, 82.0, 81.0, 91.0, 66.0, 65.0, 63.0, 31.0, 41.0, 27.0, 17.0, 14.0, 12.0, 12.0, 6.0, 13.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0010042190551757812, -0.0009775981307029724, -0.0009509772062301636, -0.0009243562817573547, -0.0008977353572845459, -0.0008711144328117371, -0.0008444935083389282, -0.0008178725838661194, -0.0007912516593933105, -0.0007646307349205017, -0.0007380098104476929, -0.000711388885974884, -0.0006847679615020752, -0.0006581470370292664, -0.0006315261125564575, -0.0006049051880836487, -0.0005782842636108398, -0.000551663339138031, -0.0005250424146652222, -0.0004984214901924133, -0.0004718005657196045, -0.00044517964124679565, -0.0004185587167739868, -0.000391937792301178, -0.00036531686782836914, -0.0003386959433555603, -0.00031207501888275146, -0.0002854540944099426, -0.0002588331699371338, -0.00023221224546432495, -0.0002055913209915161, -0.00017897039651870728, -0.00015234947204589844, -0.0001257285475730896, -9.910762310028076e-05, -7.248669862747192e-05, -4.5865774154663086e-05, -1.9244849681854248e-05, 7.37607479095459e-06, 3.399699926376343e-05, 6.0617923736572266e-05, 8.72388482093811e-05, 0.00011385977268218994, 0.00014048069715499878, 0.00016710162162780762, 0.00019372254610061646, 0.0002203434705734253, 0.00024696439504623413, 0.00027358531951904297, 0.0003002062439918518, 0.00032682716846466064, 0.0003534480929374695, 0.0003800690174102783, 0.00040668994188308716, 0.000433310866355896, 0.00045993179082870483, 0.00048655271530151367, 0.0005131736397743225, 0.0005397945642471313, 0.0005664154887199402, 0.000593036413192749, 0.0006196573376655579, 0.0006462782621383667, 0.0006728991866111755, 0.0006995201110839844]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 6.0, 5.0, 4.0, 13.0, 18.0, 26.0, 43.0, 72.0, 140.0, 197.0, 389.0, 732.0, 1973.0, 5923.0, 26199.0, 227107.0, 655554.0, 107993.0, 15424.0, 4032.0, 1416.0, 598.0, 305.0, 162.0, 78.0, 46.0, 38.0, 25.0, 14.0, 9.0, 8.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.3697509765625, -8.052001953125, -7.7342529296875, -7.41650390625, -7.0987548828125, -6.781005859375, -6.4632568359375, -6.1455078125, -5.8277587890625, -5.510009765625, -5.1922607421875, -4.87451171875, -4.5567626953125, -4.239013671875, -3.9212646484375, -3.603515625, -3.2857666015625, -2.968017578125, -2.6502685546875, -2.33251953125, -2.0147705078125, -1.697021484375, -1.3792724609375, -1.0615234375, -0.7437744140625, -0.426025390625, -0.1082763671875, 0.20947265625, 0.5272216796875, 0.844970703125, 1.1627197265625, 1.48046875, 1.7982177734375, 2.115966796875, 2.4337158203125, 2.75146484375, 3.0692138671875, 3.386962890625, 3.7047119140625, 4.0224609375, 4.3402099609375, 4.657958984375, 4.9757080078125, 5.29345703125, 5.6112060546875, 5.928955078125, 6.2467041015625, 6.564453125, 6.8822021484375, 7.199951171875, 7.5177001953125, 7.83544921875, 8.1531982421875, 8.470947265625, 8.7886962890625, 9.1064453125, 9.4241943359375, 9.741943359375, 10.0596923828125, 10.37744140625, 10.6951904296875, 11.012939453125, 11.3306884765625, 11.6484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 9.0, 5.0, 10.0, 14.0, 13.0, 34.0, 38.0, 68.0, 95.0, 119.0, 144.0, 123.0, 93.0, 67.0, 58.0, 31.0, 24.0, 20.0, 13.0, 8.0, 4.0, 8.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0, -10.73095703125, -10.4619140625, -10.19287109375, -9.923828125, -9.65478515625, -9.3857421875, -9.11669921875, -8.84765625, -8.57861328125, -8.3095703125, -8.04052734375, -7.771484375, -7.50244140625, -7.2333984375, -6.96435546875, -6.6953125, -6.42626953125, -6.1572265625, -5.88818359375, -5.619140625, -5.35009765625, -5.0810546875, -4.81201171875, -4.54296875, -4.27392578125, -4.0048828125, -3.73583984375, -3.466796875, -3.19775390625, -2.9287109375, -2.65966796875, -2.390625, -2.12158203125, -1.8525390625, -1.58349609375, -1.314453125, -1.04541015625, -0.7763671875, -0.50732421875, -0.23828125, 0.03076171875, 0.2998046875, 0.56884765625, 0.837890625, 1.10693359375, 1.3759765625, 1.64501953125, 1.9140625, 2.18310546875, 2.4521484375, 2.72119140625, 2.990234375, 3.25927734375, 3.5283203125, 3.79736328125, 4.06640625, 4.33544921875, 4.6044921875, 4.87353515625, 5.142578125, 5.41162109375, 5.6806640625, 5.94970703125, 6.21875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 7.0, 16.0, 21.0, 34.0, 49.0, 87.0, 126.0, 128.0, 140.0, 134.0, 95.0, 71.0, 46.0, 20.0, 13.0, 8.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-140.7022705078125, -137.1635284423828, -133.62478637695312, -130.08604431152344, -126.54729461669922, -123.00855255126953, -119.46981048583984, -115.93106079101562, -112.39231872558594, -108.85357666015625, -105.31483459472656, -101.77608489990234, -98.23734283447266, -94.69860076904297, -91.15985870361328, -87.62110900878906, -84.08236694335938, -80.54362487792969, -77.0048828125, -73.46613311767578, -69.9273910522461, -66.3886489868164, -62.84990692138672, -59.311161041259766, -55.772422790527344, -52.233680725097656, -48.6949348449707, -45.156192779541016, -41.61744689941406, -38.078704833984375, -34.53996276855469, -31.001216888427734, -27.46247100830078, -23.92372703552246, -20.38498306274414, -16.846240997314453, -13.307496070861816, -9.768753051757812, -6.230009078979492, -2.691265106201172, 0.8474788665771484, 4.386222839355469, 7.924966335296631, 11.463709831237793, 15.002453804016113, 18.541196823120117, 22.079940795898438, 25.618684768676758, 29.157428741455078, 32.696170806884766, 36.23491668701172, 39.773658752441406, 43.31240463256836, 46.85114669799805, 50.389892578125, 53.92863464355469, 57.467376708984375, 61.00611877441406, 64.54486083984375, 68.08361053466797, 71.62235260009766, 75.16109466552734, 78.69983673095703, 82.23858642578125, 85.77732849121094]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 4.0, 5.0, 4.0, 8.0, 7.0, 7.0, 10.0, 18.0, 22.0, 26.0, 30.0, 34.0, 32.0, 34.0, 45.0, 30.0, 43.0, 37.0, 45.0, 58.0, 44.0, 52.0, 40.0, 43.0, 39.0, 41.0, 26.0, 32.0, 25.0, 23.0, 26.0, 30.0, 13.0, 15.0, 10.0, 11.0, 6.0, 6.0, 7.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.773948669433594, -59.61188888549805, -57.4498291015625, -55.28776931762695, -53.125709533691406, -50.963653564453125, -48.80159378051758, -46.63953399658203, -44.477474212646484, -42.31541442871094, -40.15335464477539, -37.991294860839844, -35.82923889160156, -33.66717529296875, -31.50511932373047, -29.343059539794922, -27.180999755859375, -25.018939971923828, -22.85688018798828, -20.694822311401367, -18.53276252746582, -16.370702743530273, -14.208643913269043, -12.046585083007812, -9.884525299072266, -7.722465991973877, -5.560406684875488, -3.3983473777770996, -1.236288070678711, 0.9257717132568359, 3.0878305435180664, 5.249889373779297, 7.4119415283203125, 9.57400131225586, 11.73606014251709, 13.89811897277832, 16.060178756713867, 18.222238540649414, 20.384296417236328, 22.546356201171875, 24.708415985107422, 26.87047576904297, 29.032535552978516, 31.19459342956543, 33.356651306152344, 35.518714904785156, 37.68077087402344, 39.842830657958984, 42.00489044189453, 44.16695022583008, 46.329010009765625, 48.49106979370117, 50.65312957763672, 52.815185546875, 54.97724533081055, 57.139305114746094, 59.30136489868164, 61.46342468261719, 63.625484466552734, 65.78754425048828, 67.94960021972656, 70.11166381835938, 72.27371978759766, 74.43577575683594, 76.59783935546875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 18.0, 21.0, 38.0, 55.0, 112.0, 184.0, 428.0, 1203.0, 3990.0, 23055.0, 4055822.0, 97079.0, 8831.0, 2135.0, 695.0, 295.0, 135.0, 72.0, 36.0, 22.0, 21.0, 6.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0, -68.0419921875, -66.083984375, -64.1259765625, -62.16796875, -60.2099609375, -58.251953125, -56.2939453125, -54.3359375, -52.3779296875, -50.419921875, -48.4619140625, -46.50390625, -44.5458984375, -42.587890625, -40.6298828125, -38.671875, -36.7138671875, -34.755859375, -32.7978515625, -30.83984375, -28.8818359375, -26.923828125, -24.9658203125, -23.0078125, -21.0498046875, -19.091796875, -17.1337890625, -15.17578125, -13.2177734375, -11.259765625, -9.3017578125, -7.34375, -5.3857421875, -3.427734375, -1.4697265625, 0.48828125, 2.4462890625, 4.404296875, 6.3623046875, 8.3203125, 10.2783203125, 12.236328125, 14.1943359375, 16.15234375, 18.1103515625, 20.068359375, 22.0263671875, 23.984375, 25.9423828125, 27.900390625, 29.8583984375, 31.81640625, 33.7744140625, 35.732421875, 37.6904296875, 39.6484375, 41.6064453125, 43.564453125, 45.5224609375, 47.48046875, 49.4384765625, 51.396484375, 53.3544921875, 55.3125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 4.0, 12.0, 14.0, 14.0, 26.0, 36.0, 45.0, 55.0, 62.0, 70.0, 69.0, 78.0, 83.0, 71.0, 81.0, 64.0, 55.0, 36.0, 37.0, 20.0, 17.0, 12.0, 7.0, 15.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.28515625, -7.082763671875, -6.88037109375, -6.677978515625, -6.4755859375, -6.273193359375, -6.07080078125, -5.868408203125, -5.666015625, -5.463623046875, -5.26123046875, -5.058837890625, -4.8564453125, -4.654052734375, -4.45166015625, -4.249267578125, -4.046875, -3.844482421875, -3.64208984375, -3.439697265625, -3.2373046875, -3.034912109375, -2.83251953125, -2.630126953125, -2.427734375, -2.225341796875, -2.02294921875, -1.820556640625, -1.6181640625, -1.415771484375, -1.21337890625, -1.010986328125, -0.80859375, -0.606201171875, -0.40380859375, -0.201416015625, 0.0009765625, 0.203369140625, 0.40576171875, 0.608154296875, 0.810546875, 1.012939453125, 1.21533203125, 1.417724609375, 1.6201171875, 1.822509765625, 2.02490234375, 2.227294921875, 2.4296875, 2.632080078125, 2.83447265625, 3.036865234375, 3.2392578125, 3.441650390625, 3.64404296875, 3.846435546875, 4.048828125, 4.251220703125, 4.45361328125, 4.656005859375, 4.8583984375, 5.060791015625, 5.26318359375, 5.465576171875, 5.66796875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 4.0, 10.0, 11.0, 15.0, 18.0, 28.0, 35.0, 52.0, 66.0, 78.0, 118.0, 219.0, 403.0, 1063.0, 2973.0, 11256.0, 100501.0, 4011900.0, 53581.0, 8011.0, 2161.0, 769.0, 368.0, 191.0, 124.0, 84.0, 66.0, 43.0, 25.0, 25.0, 18.0, 15.0, 10.0, 14.0, 4.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875, -31.82763671875, -30.7802734375, -29.73291015625, -28.685546875, -27.63818359375, -26.5908203125, -25.54345703125, -24.49609375, -23.44873046875, -22.4013671875, -21.35400390625, -20.306640625, -19.25927734375, -18.2119140625, -17.16455078125, -16.1171875, -15.06982421875, -14.0224609375, -12.97509765625, -11.927734375, -10.88037109375, -9.8330078125, -8.78564453125, -7.73828125, -6.69091796875, -5.6435546875, -4.59619140625, -3.548828125, -2.50146484375, -1.4541015625, -0.40673828125, 0.640625, 1.68798828125, 2.7353515625, 3.78271484375, 4.830078125, 5.87744140625, 6.9248046875, 7.97216796875, 9.01953125, 10.06689453125, 11.1142578125, 12.16162109375, 13.208984375, 14.25634765625, 15.3037109375, 16.35107421875, 17.3984375, 18.44580078125, 19.4931640625, 20.54052734375, 21.587890625, 22.63525390625, 23.6826171875, 24.72998046875, 25.77734375, 26.82470703125, 27.8720703125, 28.91943359375, 29.966796875, 31.01416015625, 32.0615234375, 33.10888671875, 34.15625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 7.0, 8.0, 9.0, 13.0, 18.0, 42.0, 100.0, 285.0, 3170.0, 251.0, 70.0, 39.0, 26.0, 18.0, 10.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2578125, -3.09844970703125, -2.9390869140625, -2.77972412109375, -2.620361328125, -2.46099853515625, -2.3016357421875, -2.14227294921875, -1.98291015625, -1.82354736328125, -1.6641845703125, -1.50482177734375, -1.345458984375, -1.18609619140625, -1.0267333984375, -0.86737060546875, -0.7080078125, -0.54864501953125, -0.3892822265625, -0.22991943359375, -0.070556640625, 0.08880615234375, 0.2481689453125, 0.40753173828125, 0.56689453125, 0.72625732421875, 0.8856201171875, 1.04498291015625, 1.204345703125, 1.36370849609375, 1.5230712890625, 1.68243408203125, 1.841796875, 2.00115966796875, 2.1605224609375, 2.31988525390625, 2.479248046875, 2.63861083984375, 2.7979736328125, 2.95733642578125, 3.11669921875, 3.27606201171875, 3.4354248046875, 3.59478759765625, 3.754150390625, 3.91351318359375, 4.0728759765625, 4.23223876953125, 4.3916015625, 4.55096435546875, 4.7103271484375, 4.86968994140625, 5.029052734375, 5.18841552734375, 5.3477783203125, 5.50714111328125, 5.66650390625, 5.82586669921875, 5.9852294921875, 6.14459228515625, 6.303955078125, 6.46331787109375, 6.6226806640625, 6.78204345703125, 6.94140625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 11.0, 22.0, 28.0, 26.0, 36.0, 75.0, 55.0, 84.0, 93.0, 83.0, 102.0, 83.0, 54.0, 60.0, 50.0, 39.0, 26.0, 20.0, 9.0, 11.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.421051025390625, -14.940620422363281, -14.460189819335938, -13.97976016998291, -13.499329566955566, -13.018898963928223, -12.538468360900879, -12.058038711547852, -11.577608108520508, -11.097177505493164, -10.61674690246582, -10.136317253112793, -9.65588665008545, -9.175456047058105, -8.695025444030762, -8.214595794677734, -7.734164714813232, -7.253734111785889, -6.773303985595703, -6.292873382568359, -5.812443256378174, -5.33201265335083, -4.8515825271606445, -4.371151924133301, -3.890721559524536, -3.4102911949157715, -2.929860830307007, -2.449430465698242, -1.968999981880188, -1.4885694980621338, -1.0081391334533691, -0.5277087688446045, -0.047278404235839844, 0.4331519901752472, 0.9135823845863342, 1.3940128087997437, 1.8744431734085083, 2.3548736572265625, 2.835304021835327, 3.315734386444092, 3.7961647510528564, 4.276595115661621, 4.757025718688965, 5.23745584487915, 5.717886447906494, 6.19831657409668, 6.678747177124023, 7.159177780151367, 7.639607906341553, 8.120038032531738, 8.600468635559082, 9.080899238586426, 9.56132984161377, 10.041759490966797, 10.52219009399414, 11.002620697021484, 11.483051300048828, 11.963481903076172, 12.443912506103516, 12.924342155456543, 13.404772758483887, 13.88520336151123, 14.365633964538574, 14.846063613891602, 15.326494216918945]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 6.0, 5.0, 11.0, 26.0, 19.0, 19.0, 25.0, 21.0, 21.0, 23.0, 38.0, 30.0, 43.0, 24.0, 28.0, 39.0, 50.0, 52.0, 55.0, 58.0, 47.0, 37.0, 36.0, 47.0, 34.0, 34.0, 31.0, 23.0, 18.0, 19.0, 21.0, 10.0, 9.0, 9.0, 4.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.898616790771484, -6.622825622558594, -6.347034454345703, -6.071243762969971, -5.79545259475708, -5.5196614265441895, -5.243870735168457, -4.968079566955566, -4.692288398742676, -4.416497230529785, -4.1407060623168945, -3.864915370941162, -3.5891242027282715, -3.313333034515381, -3.0375421047210693, -2.761751174926758, -2.485960006713867, -2.2101688385009766, -1.934377908706665, -1.658586859703064, -1.382795810699463, -1.1070047616958618, -0.8312137126922607, -0.5554226636886597, -0.2796316146850586, -0.0038405656814575195, 0.27195048332214355, 0.5477415323257446, 0.8235325813293457, 1.0993236303329468, 1.3751146793365479, 1.650905728340149, 1.92669677734375, 2.2024879455566406, 2.478278875350952, 2.7540698051452637, 3.0298609733581543, 3.305652141571045, 3.5814430713653564, 3.857234001159668, 4.133025169372559, 4.408816337585449, 4.68460750579834, 4.960398197174072, 5.236189365386963, 5.5119805335998535, 5.787771224975586, 6.063562393188477, 6.339353561401367, 6.615144729614258, 6.890935897827148, 7.166726589202881, 7.4425177574157715, 7.718308925628662, 7.9940996170043945, 8.269890785217285, 8.545681953430176, 8.821473121643066, 9.097264289855957, 9.373055458068848, 9.648845672607422, 9.924636840820312, 10.200428009033203, 10.476219177246094, 10.752010345458984]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 10.0, 15.0, 39.0, 37.0, 60.0, 112.0, 195.0, 319.0, 673.0, 1451.0, 3994.0, 15023.0, 67371.0, 318364.0, 478703.0, 124677.0, 27086.0, 6480.0, 2122.0, 866.0, 430.0, 227.0, 113.0, 84.0, 42.0, 22.0, 13.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.5625, -19.961181640625, -19.35986328125, -18.758544921875, -18.1572265625, -17.555908203125, -16.95458984375, -16.353271484375, -15.751953125, -15.150634765625, -14.54931640625, -13.947998046875, -13.3466796875, -12.745361328125, -12.14404296875, -11.542724609375, -10.94140625, -10.340087890625, -9.73876953125, -9.137451171875, -8.5361328125, -7.934814453125, -7.33349609375, -6.732177734375, -6.130859375, -5.529541015625, -4.92822265625, -4.326904296875, -3.7255859375, -3.124267578125, -2.52294921875, -1.921630859375, -1.3203125, -0.718994140625, -0.11767578125, 0.483642578125, 1.0849609375, 1.686279296875, 2.28759765625, 2.888916015625, 3.490234375, 4.091552734375, 4.69287109375, 5.294189453125, 5.8955078125, 6.496826171875, 7.09814453125, 7.699462890625, 8.30078125, 8.902099609375, 9.50341796875, 10.104736328125, 10.7060546875, 11.307373046875, 11.90869140625, 12.510009765625, 13.111328125, 13.712646484375, 14.31396484375, 14.915283203125, 15.5166015625, 16.117919921875, 16.71923828125, 17.320556640625, 17.921875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 8.0, 13.0, 9.0, 20.0, 24.0, 33.0, 51.0, 58.0, 51.0, 84.0, 71.0, 69.0, 87.0, 68.0, 59.0, 59.0, 56.0, 41.0, 31.0, 20.0, 20.0, 18.0, 14.0, 11.0, 9.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.0736083984375, -6.865966796875, -6.6583251953125, -6.45068359375, -6.2430419921875, -6.035400390625, -5.8277587890625, -5.6201171875, -5.4124755859375, -5.204833984375, -4.9971923828125, -4.78955078125, -4.5819091796875, -4.374267578125, -4.1666259765625, -3.958984375, -3.7513427734375, -3.543701171875, -3.3360595703125, -3.12841796875, -2.9207763671875, -2.713134765625, -2.5054931640625, -2.2978515625, -2.0902099609375, -1.882568359375, -1.6749267578125, -1.46728515625, -1.2596435546875, -1.052001953125, -0.8443603515625, -0.63671875, -0.4290771484375, -0.221435546875, -0.0137939453125, 0.19384765625, 0.4014892578125, 0.609130859375, 0.8167724609375, 1.0244140625, 1.2320556640625, 1.439697265625, 1.6473388671875, 1.85498046875, 2.0626220703125, 2.270263671875, 2.4779052734375, 2.685546875, 2.8931884765625, 3.100830078125, 3.3084716796875, 3.51611328125, 3.7237548828125, 3.931396484375, 4.1390380859375, 4.3466796875, 4.5543212890625, 4.761962890625, 4.9696044921875, 5.17724609375, 5.3848876953125, 5.592529296875, 5.8001708984375, 6.0078125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 14.0, 16.0, 20.0, 27.0, 46.0, 52.0, 71.0, 129.0, 158.0, 202.0, 311.0, 458.0, 652.0, 1021.0, 1936.0, 4950.0, 18908.0, 96823.0, 490233.0, 347973.0, 63130.0, 13241.0, 3816.0, 1583.0, 886.0, 567.0, 393.0, 290.0, 171.0, 126.0, 90.0, 64.0, 49.0, 32.0, 27.0, 24.0, 18.0, 9.0, 8.0, 8.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -12.9149169921875, -12.415771484375, -11.9166259765625, -11.41748046875, -10.9183349609375, -10.419189453125, -9.9200439453125, -9.4208984375, -8.9217529296875, -8.422607421875, -7.9234619140625, -7.42431640625, -6.9251708984375, -6.426025390625, -5.9268798828125, -5.427734375, -4.9285888671875, -4.429443359375, -3.9302978515625, -3.43115234375, -2.9320068359375, -2.432861328125, -1.9337158203125, -1.4345703125, -0.9354248046875, -0.436279296875, 0.0628662109375, 0.56201171875, 1.0611572265625, 1.560302734375, 2.0594482421875, 2.55859375, 3.0577392578125, 3.556884765625, 4.0560302734375, 4.55517578125, 5.0543212890625, 5.553466796875, 6.0526123046875, 6.5517578125, 7.0509033203125, 7.550048828125, 8.0491943359375, 8.54833984375, 9.0474853515625, 9.546630859375, 10.0457763671875, 10.544921875, 11.0440673828125, 11.543212890625, 12.0423583984375, 12.54150390625, 13.0406494140625, 13.539794921875, 14.0389404296875, 14.5380859375, 15.0372314453125, 15.536376953125, 16.0355224609375, 16.53466796875, 17.0338134765625, 17.532958984375, 18.0321044921875, 18.53125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 7.0, 10.0, 11.0, 15.0, 16.0, 18.0, 17.0, 29.0, 33.0, 38.0, 34.0, 42.0, 38.0, 37.0, 48.0, 41.0, 43.0, 54.0, 41.0, 48.0, 39.0, 42.0, 33.0, 43.0, 26.0, 29.0, 25.0, 25.0, 22.0, 18.0, 12.0, 11.0, 8.0, 10.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0], "bins": [-19.90625, -19.357666015625, -18.80908203125, -18.260498046875, -17.7119140625, -17.163330078125, -16.61474609375, -16.066162109375, -15.517578125, -14.968994140625, -14.42041015625, -13.871826171875, -13.3232421875, -12.774658203125, -12.22607421875, -11.677490234375, -11.12890625, -10.580322265625, -10.03173828125, -9.483154296875, -8.9345703125, -8.385986328125, -7.83740234375, -7.288818359375, -6.740234375, -6.191650390625, -5.64306640625, -5.094482421875, -4.5458984375, -3.997314453125, -3.44873046875, -2.900146484375, -2.3515625, -1.802978515625, -1.25439453125, -0.705810546875, -0.1572265625, 0.391357421875, 0.93994140625, 1.488525390625, 2.037109375, 2.585693359375, 3.13427734375, 3.682861328125, 4.2314453125, 4.780029296875, 5.32861328125, 5.877197265625, 6.42578125, 6.974365234375, 7.52294921875, 8.071533203125, 8.6201171875, 9.168701171875, 9.71728515625, 10.265869140625, 10.814453125, 11.363037109375, 11.91162109375, 12.460205078125, 13.0087890625, 13.557373046875, 14.10595703125, 14.654541015625, 15.203125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 13.0, 13.0, 24.0, 25.0, 43.0, 88.0, 88.0, 185.0, 318.0, 668.0, 1409.0, 3142.0, 8246.0, 23920.0, 89304.0, 392639.0, 399159.0, 90842.0, 24185.0, 8173.0, 3165.0, 1346.0, 626.0, 345.0, 201.0, 134.0, 79.0, 50.0, 38.0, 20.0, 14.0, 14.0, 7.0, 5.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.51171875, -6.30169677734375, -6.0916748046875, -5.88165283203125, -5.671630859375, -5.46160888671875, -5.2515869140625, -5.04156494140625, -4.83154296875, -4.62152099609375, -4.4114990234375, -4.20147705078125, -3.991455078125, -3.78143310546875, -3.5714111328125, -3.36138916015625, -3.1513671875, -2.94134521484375, -2.7313232421875, -2.52130126953125, -2.311279296875, -2.10125732421875, -1.8912353515625, -1.68121337890625, -1.47119140625, -1.26116943359375, -1.0511474609375, -0.84112548828125, -0.631103515625, -0.42108154296875, -0.2110595703125, -0.00103759765625, 0.208984375, 0.41900634765625, 0.6290283203125, 0.83905029296875, 1.049072265625, 1.25909423828125, 1.4691162109375, 1.67913818359375, 1.88916015625, 2.09918212890625, 2.3092041015625, 2.51922607421875, 2.729248046875, 2.93927001953125, 3.1492919921875, 3.35931396484375, 3.5693359375, 3.77935791015625, 3.9893798828125, 4.19940185546875, 4.409423828125, 4.61944580078125, 4.8294677734375, 5.03948974609375, 5.24951171875, 5.45953369140625, 5.6695556640625, 5.87957763671875, 6.089599609375, 6.29962158203125, 6.5096435546875, 6.71966552734375, 6.9296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 9.0, 13.0, 6.0, 18.0, 9.0, 23.0, 20.0, 39.0, 46.0, 41.0, 62.0, 83.0, 72.0, 80.0, 75.0, 71.0, 70.0, 41.0, 36.0, 40.0, 31.0, 20.0, 11.0, 14.0, 15.0, 8.0, 8.0, 9.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0007638931274414062, -0.0007372498512268066, -0.000710606575012207, -0.0006839632987976074, -0.0006573200225830078, -0.0006306767463684082, -0.0006040334701538086, -0.000577390193939209, -0.0005507469177246094, -0.0005241036415100098, -0.0004974603652954102, -0.00047081708908081055, -0.00044417381286621094, -0.00041753053665161133, -0.0003908872604370117, -0.0003642439842224121, -0.0003376007080078125, -0.0003109574317932129, -0.0002843141555786133, -0.00025767087936401367, -0.00023102760314941406, -0.00020438432693481445, -0.00017774105072021484, -0.00015109777450561523, -0.00012445449829101562, -9.781122207641602e-05, -7.11679458618164e-05, -4.45246696472168e-05, -1.7881393432617188e-05, 8.761882781982422e-06, 3.540515899658203e-05, 6.204843521118164e-05, 8.869171142578125e-05, 0.00011533498764038086, 0.00014197826385498047, 0.00016862154006958008, 0.0001952648162841797, 0.0002219080924987793, 0.0002485513687133789, 0.0002751946449279785, 0.0003018379211425781, 0.00032848119735717773, 0.00035512447357177734, 0.00038176774978637695, 0.00040841102600097656, 0.00043505430221557617, 0.0004616975784301758, 0.0004883408546447754, 0.000514984130859375, 0.0005416274070739746, 0.0005682706832885742, 0.0005949139595031738, 0.0006215572357177734, 0.000648200511932373, 0.0006748437881469727, 0.0007014870643615723, 0.0007281303405761719, 0.0007547736167907715, 0.0007814168930053711, 0.0008080601692199707, 0.0008347034454345703, 0.0008613467216491699, 0.0008879899978637695, 0.0009146332740783691, 0.0009412765502929688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 8.0, 1.0, 3.0, 9.0, 18.0, 15.0, 31.0, 27.0, 63.0, 116.0, 189.0, 288.0, 499.0, 1094.0, 2668.0, 9264.0, 50012.0, 459598.0, 460268.0, 50076.0, 9071.0, 2827.0, 1146.0, 546.0, 270.0, 144.0, 107.0, 74.0, 30.0, 26.0, 20.0, 16.0, 8.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.417236328125, -11.10009765625, -10.782958984375, -10.4658203125, -10.148681640625, -9.83154296875, -9.514404296875, -9.197265625, -8.880126953125, -8.56298828125, -8.245849609375, -7.9287109375, -7.611572265625, -7.29443359375, -6.977294921875, -6.66015625, -6.343017578125, -6.02587890625, -5.708740234375, -5.3916015625, -5.074462890625, -4.75732421875, -4.440185546875, -4.123046875, -3.805908203125, -3.48876953125, -3.171630859375, -2.8544921875, -2.537353515625, -2.22021484375, -1.903076171875, -1.5859375, -1.268798828125, -0.95166015625, -0.634521484375, -0.3173828125, -0.000244140625, 0.31689453125, 0.634033203125, 0.951171875, 1.268310546875, 1.58544921875, 1.902587890625, 2.2197265625, 2.536865234375, 2.85400390625, 3.171142578125, 3.48828125, 3.805419921875, 4.12255859375, 4.439697265625, 4.7568359375, 5.073974609375, 5.39111328125, 5.708251953125, 6.025390625, 6.342529296875, 6.65966796875, 6.976806640625, 7.2939453125, 7.611083984375, 7.92822265625, 8.245361328125, 8.5625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 10.0, 19.0, 34.0, 36.0, 67.0, 111.0, 147.0, 151.0, 128.0, 91.0, 75.0, 51.0, 35.0, 17.0, 13.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.03125, -11.6612548828125, -11.291259765625, -10.9212646484375, -10.55126953125, -10.1812744140625, -9.811279296875, -9.4412841796875, -9.0712890625, -8.7012939453125, -8.331298828125, -7.9613037109375, -7.59130859375, -7.2213134765625, -6.851318359375, -6.4813232421875, -6.111328125, -5.7413330078125, -5.371337890625, -5.0013427734375, -4.63134765625, -4.2613525390625, -3.891357421875, -3.5213623046875, -3.1513671875, -2.7813720703125, -2.411376953125, -2.0413818359375, -1.67138671875, -1.3013916015625, -0.931396484375, -0.5614013671875, -0.19140625, 0.1785888671875, 0.548583984375, 0.9185791015625, 1.28857421875, 1.6585693359375, 2.028564453125, 2.3985595703125, 2.7685546875, 3.1385498046875, 3.508544921875, 3.8785400390625, 4.24853515625, 4.6185302734375, 4.988525390625, 5.3585205078125, 5.728515625, 6.0985107421875, 6.468505859375, 6.8385009765625, 7.20849609375, 7.5784912109375, 7.948486328125, 8.3184814453125, 8.6884765625, 9.0584716796875, 9.428466796875, 9.7984619140625, 10.16845703125, 10.5384521484375, 10.908447265625, 11.2784423828125, 11.6484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 10.0, 18.0, 28.0, 44.0, 48.0, 75.0, 85.0, 111.0, 125.0, 104.0, 85.0, 62.0, 81.0, 43.0, 27.0, 20.0, 9.0, 14.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-140.40362548828125, -136.83731079101562, -133.27099609375, -129.7046661376953, -126.13835144042969, -122.57203674316406, -119.0057144165039, -115.43939208984375, -111.87307739257812, -108.3067626953125, -104.74044036865234, -101.17411804199219, -97.60780334472656, -94.04148864746094, -90.47516632080078, -86.90884399414062, -83.342529296875, -79.77621459960938, -76.20989227294922, -72.64356994628906, -69.07725524902344, -65.51094055175781, -61.944618225097656, -58.378299713134766, -54.811981201171875, -51.245662689208984, -47.679344177246094, -44.1130256652832, -40.54670715332031, -36.98038864135742, -33.41407012939453, -29.84775161743164, -26.28143310546875, -22.71511459350586, -19.14879608154297, -15.582477569580078, -12.016159057617188, -8.449840545654297, -4.883522033691406, -1.3172035217285156, 2.249114990234375, 5.815433502197266, 9.381752014160156, 12.948070526123047, 16.514389038085938, 20.080707550048828, 23.64702606201172, 27.21334457397461, 30.7796630859375, 34.34598159790039, 37.91230010986328, 41.47861862182617, 45.04493713378906, 48.61125564575195, 52.177574157714844, 55.743892669677734, 59.310211181640625, 62.876529693603516, 66.4428482055664, 70.00917053222656, 73.57548522949219, 77.14179992675781, 80.70812225341797, 84.27444458007812, 87.84075927734375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 2.0, 7.0, 11.0, 13.0, 15.0, 11.0, 14.0, 15.0, 24.0, 29.0, 25.0, 30.0, 34.0, 34.0, 33.0, 30.0, 35.0, 47.0, 51.0, 40.0, 39.0, 50.0, 37.0, 42.0, 27.0, 29.0, 33.0, 29.0, 26.0, 17.0, 18.0, 12.0, 20.0, 24.0, 9.0, 14.0, 9.0, 11.0, 8.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-75.84077453613281, -73.36387634277344, -70.88697814941406, -68.41007995605469, -65.93318939208984, -63.45629119873047, -60.979393005371094, -58.50249481201172, -56.025596618652344, -53.54869842529297, -51.07180404663086, -48.594905853271484, -46.11800765991211, -43.64111328125, -41.164215087890625, -38.68731689453125, -36.21042251586914, -33.733524322509766, -31.256628036499023, -28.77973175048828, -26.302833557128906, -23.825937271118164, -21.349040985107422, -18.872142791748047, -16.395246505737305, -13.918349266052246, -11.441452026367188, -8.964555740356445, -6.487658500671387, -4.010761260986328, -1.533864974975586, 0.9430332183837891, 3.4199295043945312, 5.89682674407959, 8.373723983764648, 10.85062026977539, 13.32751750946045, 15.804414749145508, 18.28131103515625, 20.758209228515625, 23.235105514526367, 25.71200180053711, 28.188899993896484, 30.665796279907227, 33.14269256591797, 35.619590759277344, 38.09648895263672, 40.573387145996094, 43.0502815246582, 45.52717971801758, 48.00407409667969, 50.48097229003906, 52.95787048339844, 55.43476867675781, 57.91166305541992, 60.3885612487793, 62.865455627441406, 65.34235382080078, 67.81925201416016, 70.296142578125, 72.77304077148438, 75.24993896484375, 77.72683715820312, 80.2037353515625, 82.68063354492188]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 2.0, 9.0, 4.0, 5.0, 12.0, 13.0, 19.0, 17.0, 35.0, 63.0, 117.0, 187.0, 419.0, 748.0, 1725.0, 4326.0, 13890.0, 83888.0, 3990459.0, 77439.0, 13426.0, 4328.0, 1627.0, 714.0, 361.0, 180.0, 91.0, 54.0, 29.0, 23.0, 19.0, 12.0, 4.0, 4.0, 7.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.28125, -34.2275390625, -33.173828125, -32.1201171875, -31.06640625, -30.0126953125, -28.958984375, -27.9052734375, -26.8515625, -25.7978515625, -24.744140625, -23.6904296875, -22.63671875, -21.5830078125, -20.529296875, -19.4755859375, -18.421875, -17.3681640625, -16.314453125, -15.2607421875, -14.20703125, -13.1533203125, -12.099609375, -11.0458984375, -9.9921875, -8.9384765625, -7.884765625, -6.8310546875, -5.77734375, -4.7236328125, -3.669921875, -2.6162109375, -1.5625, -0.5087890625, 0.544921875, 1.5986328125, 2.65234375, 3.7060546875, 4.759765625, 5.8134765625, 6.8671875, 7.9208984375, 8.974609375, 10.0283203125, 11.08203125, 12.1357421875, 13.189453125, 14.2431640625, 15.296875, 16.3505859375, 17.404296875, 18.4580078125, 19.51171875, 20.5654296875, 21.619140625, 22.6728515625, 23.7265625, 24.7802734375, 25.833984375, 26.8876953125, 27.94140625, 28.9951171875, 30.048828125, 31.1025390625, 32.15625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 7.0, 8.0, 14.0, 21.0, 27.0, 35.0, 52.0, 57.0, 58.0, 55.0, 71.0, 66.0, 82.0, 77.0, 70.0, 64.0, 42.0, 40.0, 42.0, 21.0, 26.0, 17.0, 16.0, 9.0, 8.0, 10.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.39453125, -7.18438720703125, -6.9742431640625, -6.76409912109375, -6.553955078125, -6.34381103515625, -6.1336669921875, -5.92352294921875, -5.71337890625, -5.50323486328125, -5.2930908203125, -5.08294677734375, -4.872802734375, -4.66265869140625, -4.4525146484375, -4.24237060546875, -4.0322265625, -3.82208251953125, -3.6119384765625, -3.40179443359375, -3.191650390625, -2.98150634765625, -2.7713623046875, -2.56121826171875, -2.35107421875, -2.14093017578125, -1.9307861328125, -1.72064208984375, -1.510498046875, -1.30035400390625, -1.0902099609375, -0.88006591796875, -0.669921875, -0.45977783203125, -0.2496337890625, -0.03948974609375, 0.170654296875, 0.38079833984375, 0.5909423828125, 0.80108642578125, 1.01123046875, 1.22137451171875, 1.4315185546875, 1.64166259765625, 1.851806640625, 2.06195068359375, 2.2720947265625, 2.48223876953125, 2.6923828125, 2.90252685546875, 3.1126708984375, 3.32281494140625, 3.532958984375, 3.74310302734375, 3.9532470703125, 4.16339111328125, 4.37353515625, 4.58367919921875, 4.7938232421875, 5.00396728515625, 5.214111328125, 5.42425537109375, 5.6343994140625, 5.84454345703125, 6.0546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 9.0, 11.0, 12.0, 22.0, 25.0, 39.0, 59.0, 63.0, 104.0, 103.0, 185.0, 209.0, 309.0, 407.0, 599.0, 888.0, 1505.0, 2581.0, 4841.0, 9973.0, 24216.0, 77829.0, 1086996.0, 2855891.0, 80504.0, 24639.0, 10224.0, 4854.0, 2615.0, 1444.0, 984.0, 594.0, 420.0, 324.0, 204.0, 151.0, 143.0, 93.0, 56.0, 46.0, 28.0, 26.0, 14.0, 11.0, 9.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0], "bins": [-15.953125, -15.5101318359375, -15.067138671875, -14.6241455078125, -14.18115234375, -13.7381591796875, -13.295166015625, -12.8521728515625, -12.4091796875, -11.9661865234375, -11.523193359375, -11.0802001953125, -10.63720703125, -10.1942138671875, -9.751220703125, -9.3082275390625, -8.865234375, -8.4222412109375, -7.979248046875, -7.5362548828125, -7.09326171875, -6.6502685546875, -6.207275390625, -5.7642822265625, -5.3212890625, -4.8782958984375, -4.435302734375, -3.9923095703125, -3.54931640625, -3.1063232421875, -2.663330078125, -2.2203369140625, -1.77734375, -1.3343505859375, -0.891357421875, -0.4483642578125, -0.00537109375, 0.4376220703125, 0.880615234375, 1.3236083984375, 1.7666015625, 2.2095947265625, 2.652587890625, 3.0955810546875, 3.53857421875, 3.9815673828125, 4.424560546875, 4.8675537109375, 5.310546875, 5.7535400390625, 6.196533203125, 6.6395263671875, 7.08251953125, 7.5255126953125, 7.968505859375, 8.4114990234375, 8.8544921875, 9.2974853515625, 9.740478515625, 10.1834716796875, 10.62646484375, 11.0694580078125, 11.512451171875, 11.9554443359375, 12.3984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 0.0, 12.0, 17.0, 28.0, 28.0, 38.0, 64.0, 100.0, 203.0, 1157.0, 1925.0, 191.0, 95.0, 53.0, 43.0, 31.0, 16.0, 18.0, 10.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.767578125, -2.656890869140625, -2.54620361328125, -2.435516357421875, -2.3248291015625, -2.214141845703125, -2.10345458984375, -1.992767333984375, -1.882080078125, -1.771392822265625, -1.66070556640625, -1.550018310546875, -1.4393310546875, -1.328643798828125, -1.21795654296875, -1.107269287109375, -0.99658203125, -0.885894775390625, -0.77520751953125, -0.664520263671875, -0.5538330078125, -0.443145751953125, -0.33245849609375, -0.221771240234375, -0.111083984375, -0.000396728515625, 0.11029052734375, 0.220977783203125, 0.3316650390625, 0.442352294921875, 0.55303955078125, 0.663726806640625, 0.7744140625, 0.885101318359375, 0.99578857421875, 1.106475830078125, 1.2171630859375, 1.327850341796875, 1.43853759765625, 1.549224853515625, 1.659912109375, 1.770599365234375, 1.88128662109375, 1.991973876953125, 2.1026611328125, 2.213348388671875, 2.32403564453125, 2.434722900390625, 2.54541015625, 2.656097412109375, 2.76678466796875, 2.877471923828125, 2.9881591796875, 3.098846435546875, 3.20953369140625, 3.320220947265625, 3.430908203125, 3.541595458984375, 3.65228271484375, 3.762969970703125, 3.8736572265625, 3.984344482421875, 4.09503173828125, 4.205718994140625, 4.31640625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 11.0, 10.0, 24.0, 19.0, 30.0, 52.0, 57.0, 66.0, 76.0, 98.0, 97.0, 83.0, 88.0, 76.0, 52.0, 36.0, 30.0, 26.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.667232513427734, -16.06989288330078, -15.472551345825195, -14.875210762023926, -14.277870178222656, -13.680529594421387, -13.083189010620117, -12.485848426818848, -11.888507843017578, -11.291167259216309, -10.693826675415039, -10.09648609161377, -9.4991455078125, -8.90180492401123, -8.304464340209961, -7.707123756408691, -7.109783172607422, -6.512442588806152, -5.915102005004883, -5.317761421203613, -4.720420837402344, -4.123080253601074, -3.5257396697998047, -2.928399085998535, -2.3310585021972656, -1.733717918395996, -1.1363773345947266, -0.539036750793457, 0.0583038330078125, 0.655644416809082, 1.2529850006103516, 1.850325584411621, 2.4476661682128906, 3.04500675201416, 3.6423473358154297, 4.239687919616699, 4.837028503417969, 5.434369087219238, 6.031709671020508, 6.629050254821777, 7.226390838623047, 7.823731422424316, 8.421072006225586, 9.018412590026855, 9.615753173828125, 10.213093757629395, 10.810434341430664, 11.407774925231934, 12.005115509033203, 12.602456092834473, 13.199796676635742, 13.797137260437012, 14.394477844238281, 14.99181842803955, 15.58915901184082, 16.186500549316406, 16.78384017944336, 17.381179809570312, 17.9785213470459, 18.575862884521484, 19.173202514648438, 19.77054214477539, 20.367883682250977, 20.965225219726562, 21.562564849853516]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 8.0, 9.0, 10.0, 7.0, 6.0, 12.0, 17.0, 10.0, 27.0, 24.0, 21.0, 32.0, 20.0, 46.0, 36.0, 36.0, 37.0, 46.0, 34.0, 41.0, 49.0, 39.0, 33.0, 45.0, 29.0, 29.0, 32.0, 26.0, 25.0, 25.0, 20.0, 24.0, 25.0, 22.0, 10.0, 9.0, 12.0, 15.0, 14.0, 9.0, 6.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-10.456367492675781, -10.142704963684082, -9.829042434692383, -9.515380859375, -9.2017183303833, -8.888055801391602, -8.574393272399902, -8.260730743408203, -7.947068691253662, -7.633406162261963, -7.319744110107422, -7.006081581115723, -6.692419052124023, -6.378756999969482, -6.065094470977783, -5.751432418823242, -5.437769889831543, -5.124107360839844, -4.810445308685303, -4.4967827796936035, -4.1831207275390625, -3.8694581985473633, -3.555795669555664, -3.242133378982544, -2.928471088409424, -2.6148087978363037, -2.3011465072631836, -1.9874839782714844, -1.6738216876983643, -1.3601593971252441, -1.0464969873428345, -0.7328345775604248, -0.4191722869873047, -0.1055099368095398, 0.2081524133682251, 0.52181476354599, 0.8354771137237549, 1.149139404296875, 1.4628018140792847, 1.7764642238616943, 2.0901265144348145, 2.4037888050079346, 2.7174510955810547, 3.031113624572754, 3.344775915145874, 3.658438205718994, 3.9721007347106934, 4.285762786865234, 4.599425315856934, 4.913087844848633, 5.226749897003174, 5.540412425994873, 5.854074478149414, 6.167737007141113, 6.4813995361328125, 6.795062065124512, 7.108724117279053, 7.422386646270752, 7.736048698425293, 8.049711227416992, 8.363373756408691, 8.67703628540039, 8.990697860717773, 9.304360389709473, 9.618022918701172]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 5.0, 11.0, 17.0, 17.0, 45.0, 41.0, 69.0, 116.0, 183.0, 267.0, 418.0, 701.0, 1180.0, 2438.0, 4757.0, 10344.0, 24010.0, 57940.0, 141890.0, 284757.0, 280506.0, 138443.0, 56743.0, 23469.0, 10182.0, 4682.0, 2262.0, 1155.0, 701.0, 432.0, 265.0, 169.0, 95.0, 73.0, 55.0, 36.0, 25.0, 14.0, 7.0, 9.0, 4.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.859375, -8.5823974609375, -8.305419921875, -8.0284423828125, -7.75146484375, -7.4744873046875, -7.197509765625, -6.9205322265625, -6.6435546875, -6.3665771484375, -6.089599609375, -5.8126220703125, -5.53564453125, -5.2586669921875, -4.981689453125, -4.7047119140625, -4.427734375, -4.1507568359375, -3.873779296875, -3.5968017578125, -3.31982421875, -3.0428466796875, -2.765869140625, -2.4888916015625, -2.2119140625, -1.9349365234375, -1.657958984375, -1.3809814453125, -1.10400390625, -0.8270263671875, -0.550048828125, -0.2730712890625, 0.00390625, 0.2808837890625, 0.557861328125, 0.8348388671875, 1.11181640625, 1.3887939453125, 1.665771484375, 1.9427490234375, 2.2197265625, 2.4967041015625, 2.773681640625, 3.0506591796875, 3.32763671875, 3.6046142578125, 3.881591796875, 4.1585693359375, 4.435546875, 4.7125244140625, 4.989501953125, 5.2664794921875, 5.54345703125, 5.8204345703125, 6.097412109375, 6.3743896484375, 6.6513671875, 6.9283447265625, 7.205322265625, 7.4822998046875, 7.75927734375, 8.0362548828125, 8.313232421875, 8.5902099609375, 8.8671875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 13.0, 11.0, 17.0, 26.0, 34.0, 36.0, 39.0, 60.0, 57.0, 73.0, 61.0, 74.0, 83.0, 68.0, 67.0, 52.0, 33.0, 42.0, 36.0, 30.0, 22.0, 16.0, 10.0, 16.0, 7.0, 9.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.330810546875, -7.11474609375, -6.898681640625, -6.6826171875, -6.466552734375, -6.25048828125, -6.034423828125, -5.818359375, -5.602294921875, -5.38623046875, -5.170166015625, -4.9541015625, -4.738037109375, -4.52197265625, -4.305908203125, -4.08984375, -3.873779296875, -3.65771484375, -3.441650390625, -3.2255859375, -3.009521484375, -2.79345703125, -2.577392578125, -2.361328125, -2.145263671875, -1.92919921875, -1.713134765625, -1.4970703125, -1.281005859375, -1.06494140625, -0.848876953125, -0.6328125, -0.416748046875, -0.20068359375, 0.015380859375, 0.2314453125, 0.447509765625, 0.66357421875, 0.879638671875, 1.095703125, 1.311767578125, 1.52783203125, 1.743896484375, 1.9599609375, 2.176025390625, 2.39208984375, 2.608154296875, 2.82421875, 3.040283203125, 3.25634765625, 3.472412109375, 3.6884765625, 3.904541015625, 4.12060546875, 4.336669921875, 4.552734375, 4.768798828125, 4.98486328125, 5.200927734375, 5.4169921875, 5.633056640625, 5.84912109375, 6.065185546875, 6.28125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 11.0, 14.0, 26.0, 47.0, 90.0, 133.0, 189.0, 360.0, 649.0, 1187.0, 3135.0, 17934.0, 389601.0, 601256.0, 27027.0, 3785.0, 1410.0, 740.0, 411.0, 233.0, 134.0, 89.0, 46.0, 19.0, 15.0, 10.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.44677734375, -32.6123046875, -31.77783203125, -30.943359375, -30.10888671875, -29.2744140625, -28.43994140625, -27.60546875, -26.77099609375, -25.9365234375, -25.10205078125, -24.267578125, -23.43310546875, -22.5986328125, -21.76416015625, -20.9296875, -20.09521484375, -19.2607421875, -18.42626953125, -17.591796875, -16.75732421875, -15.9228515625, -15.08837890625, -14.25390625, -13.41943359375, -12.5849609375, -11.75048828125, -10.916015625, -10.08154296875, -9.2470703125, -8.41259765625, -7.578125, -6.74365234375, -5.9091796875, -5.07470703125, -4.240234375, -3.40576171875, -2.5712890625, -1.73681640625, -0.90234375, -0.06787109375, 0.7666015625, 1.60107421875, 2.435546875, 3.27001953125, 4.1044921875, 4.93896484375, 5.7734375, 6.60791015625, 7.4423828125, 8.27685546875, 9.111328125, 9.94580078125, 10.7802734375, 11.61474609375, 12.44921875, 13.28369140625, 14.1181640625, 14.95263671875, 15.787109375, 16.62158203125, 17.4560546875, 18.29052734375, 19.125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 6.0, 10.0, 9.0, 11.0, 10.0, 14.0, 22.0, 36.0, 26.0, 35.0, 35.0, 35.0, 37.0, 47.0, 41.0, 34.0, 62.0, 41.0, 55.0, 57.0, 46.0, 42.0, 41.0, 39.0, 33.0, 35.0, 23.0, 24.0, 28.0, 20.0, 8.0, 11.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.96875, -22.3173828125, -21.666015625, -21.0146484375, -20.36328125, -19.7119140625, -19.060546875, -18.4091796875, -17.7578125, -17.1064453125, -16.455078125, -15.8037109375, -15.15234375, -14.5009765625, -13.849609375, -13.1982421875, -12.546875, -11.8955078125, -11.244140625, -10.5927734375, -9.94140625, -9.2900390625, -8.638671875, -7.9873046875, -7.3359375, -6.6845703125, -6.033203125, -5.3818359375, -4.73046875, -4.0791015625, -3.427734375, -2.7763671875, -2.125, -1.4736328125, -0.822265625, -0.1708984375, 0.48046875, 1.1318359375, 1.783203125, 2.4345703125, 3.0859375, 3.7373046875, 4.388671875, 5.0400390625, 5.69140625, 6.3427734375, 6.994140625, 7.6455078125, 8.296875, 8.9482421875, 9.599609375, 10.2509765625, 10.90234375, 11.5537109375, 12.205078125, 12.8564453125, 13.5078125, 14.1591796875, 14.810546875, 15.4619140625, 16.11328125, 16.7646484375, 17.416015625, 18.0673828125, 18.71875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 0.0, 4.0, 5.0, 8.0, 2.0, 9.0, 15.0, 24.0, 23.0, 33.0, 40.0, 94.0, 112.0, 148.0, 263.0, 386.0, 690.0, 1398.0, 3225.0, 8645.0, 30208.0, 135636.0, 562947.0, 235256.0, 48418.0, 12702.0, 4251.0, 1755.0, 881.0, 498.0, 278.0, 172.0, 108.0, 89.0, 63.0, 45.0, 31.0, 26.0, 15.0, 12.0, 15.0, 10.0, 7.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-6.265625, -6.0947265625, -5.923828125, -5.7529296875, -5.58203125, -5.4111328125, -5.240234375, -5.0693359375, -4.8984375, -4.7275390625, -4.556640625, -4.3857421875, -4.21484375, -4.0439453125, -3.873046875, -3.7021484375, -3.53125, -3.3603515625, -3.189453125, -3.0185546875, -2.84765625, -2.6767578125, -2.505859375, -2.3349609375, -2.1640625, -1.9931640625, -1.822265625, -1.6513671875, -1.48046875, -1.3095703125, -1.138671875, -0.9677734375, -0.796875, -0.6259765625, -0.455078125, -0.2841796875, -0.11328125, 0.0576171875, 0.228515625, 0.3994140625, 0.5703125, 0.7412109375, 0.912109375, 1.0830078125, 1.25390625, 1.4248046875, 1.595703125, 1.7666015625, 1.9375, 2.1083984375, 2.279296875, 2.4501953125, 2.62109375, 2.7919921875, 2.962890625, 3.1337890625, 3.3046875, 3.4755859375, 3.646484375, 3.8173828125, 3.98828125, 4.1591796875, 4.330078125, 4.5009765625, 4.671875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 10.0, 15.0, 15.0, 16.0, 31.0, 47.0, 60.0, 87.0, 110.0, 140.0, 140.0, 85.0, 67.0, 62.0, 31.0, 20.0, 15.0, 11.0, 10.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0016241073608398438, -0.0015850886702537537, -0.0015460699796676636, -0.0015070512890815735, -0.0014680325984954834, -0.0014290139079093933, -0.0013899952173233032, -0.0013509765267372131, -0.001311957836151123, -0.001272939145565033, -0.0012339204549789429, -0.0011949017643928528, -0.0011558830738067627, -0.0011168643832206726, -0.0010778456926345825, -0.0010388270020484924, -0.0009998083114624023, -0.0009607896208763123, -0.0009217709302902222, -0.0008827522397041321, -0.000843733549118042, -0.0008047148585319519, -0.0007656961679458618, -0.0007266774773597717, -0.0006876587867736816, -0.0006486400961875916, -0.0006096214056015015, -0.0005706027150154114, -0.0005315840244293213, -0.0004925653338432312, -0.0004535466432571411, -0.000414527952671051, -0.00037550926208496094, -0.00033649057149887085, -0.00029747188091278076, -0.0002584531903266907, -0.00021943449974060059, -0.0001804158091545105, -0.0001413971185684204, -0.00010237842798233032, -6.335973739624023e-05, -2.4341046810150146e-05, 1.4677643775939941e-05, 5.369633436203003e-05, 9.271502494812012e-05, 0.0001317337155342102, 0.0001707524061203003, 0.00020977109670639038, 0.00024878978729248047, 0.00028780847787857056, 0.00032682716846466064, 0.00036584585905075073, 0.0004048645496368408, 0.0004438832402229309, 0.000482901930809021, 0.0005219206213951111, 0.0005609393119812012, 0.0005999580025672913, 0.0006389766931533813, 0.0006779953837394714, 0.0007170140743255615, 0.0007560327649116516, 0.0007950514554977417, 0.0008340701460838318, 0.0008730888366699219]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 11.0, 8.0, 16.0, 27.0, 46.0, 77.0, 126.0, 261.0, 530.0, 1249.0, 3992.0, 23658.0, 350726.0, 619055.0, 40107.0, 5692.0, 1552.0, 696.0, 303.0, 181.0, 91.0, 51.0, 37.0, 19.0, 13.0, 9.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.3507080078125, -9.029541015625, -8.7083740234375, -8.38720703125, -8.0660400390625, -7.744873046875, -7.4237060546875, -7.1025390625, -6.7813720703125, -6.460205078125, -6.1390380859375, -5.81787109375, -5.4967041015625, -5.175537109375, -4.8543701171875, -4.533203125, -4.2120361328125, -3.890869140625, -3.5697021484375, -3.24853515625, -2.9273681640625, -2.606201171875, -2.2850341796875, -1.9638671875, -1.6427001953125, -1.321533203125, -1.0003662109375, -0.67919921875, -0.3580322265625, -0.036865234375, 0.2843017578125, 0.60546875, 0.9266357421875, 1.247802734375, 1.5689697265625, 1.89013671875, 2.2113037109375, 2.532470703125, 2.8536376953125, 3.1748046875, 3.4959716796875, 3.817138671875, 4.1383056640625, 4.45947265625, 4.7806396484375, 5.101806640625, 5.4229736328125, 5.744140625, 6.0653076171875, 6.386474609375, 6.7076416015625, 7.02880859375, 7.3499755859375, 7.671142578125, 7.9923095703125, 8.3134765625, 8.6346435546875, 8.955810546875, 9.2769775390625, 9.59814453125, 9.9193115234375, 10.240478515625, 10.5616455078125, 10.8828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 5.0, 6.0, 25.0, 31.0, 47.0, 69.0, 84.0, 99.0, 154.0, 146.0, 102.0, 76.0, 54.0, 38.0, 17.0, 12.0, 14.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7109375, -6.439453125, -6.16796875, -5.896484375, -5.625, -5.353515625, -5.08203125, -4.810546875, -4.5390625, -4.267578125, -3.99609375, -3.724609375, -3.453125, -3.181640625, -2.91015625, -2.638671875, -2.3671875, -2.095703125, -1.82421875, -1.552734375, -1.28125, -1.009765625, -0.73828125, -0.466796875, -0.1953125, 0.076171875, 0.34765625, 0.619140625, 0.890625, 1.162109375, 1.43359375, 1.705078125, 1.9765625, 2.248046875, 2.51953125, 2.791015625, 3.0625, 3.333984375, 3.60546875, 3.876953125, 4.1484375, 4.419921875, 4.69140625, 4.962890625, 5.234375, 5.505859375, 5.77734375, 6.048828125, 6.3203125, 6.591796875, 6.86328125, 7.134765625, 7.40625, 7.677734375, 7.94921875, 8.220703125, 8.4921875, 8.763671875, 9.03515625, 9.306640625, 9.578125, 9.849609375, 10.12109375, 10.392578125, 10.6640625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 8.0, 6.0, 12.0, 29.0, 33.0, 60.0, 73.0, 84.0, 132.0, 126.0, 125.0, 73.0, 78.0, 51.0, 46.0, 22.0, 10.0, 14.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.80582427978516, -117.44103240966797, -114.07623291015625, -110.71144104003906, -107.34664916992188, -103.98184967041016, -100.61705780029297, -97.25225830078125, -93.88746643066406, -90.52267456054688, -87.15787506103516, -83.79308319091797, -80.42828369140625, -77.06349182128906, -73.69869995117188, -70.33390808105469, -66.96910858154297, -63.604312896728516, -60.23951721191406, -56.874725341796875, -53.50992965698242, -50.14513397216797, -46.78034210205078, -43.41554641723633, -40.050750732421875, -36.68595504760742, -33.32115936279297, -29.95636749267578, -26.591571807861328, -23.226776123046875, -19.861982345581055, -16.497188568115234, -13.13238525390625, -9.767590522766113, -6.402795791625977, -3.03800106048584, 0.3267936706542969, 3.69158935546875, 7.05638313293457, 10.42117691040039, 13.785972595214844, 17.150768280029297, 20.515562057495117, 23.880355834960938, 27.24515151977539, 30.609947204589844, 33.97473907470703, 37.339534759521484, 40.70433044433594, 44.06912612915039, 47.433921813964844, 50.79871368408203, 54.163509368896484, 57.52830505371094, 60.893096923828125, 64.25788879394531, 67.62268829345703, 70.98748016357422, 74.35227966308594, 77.71707153320312, 81.08186340332031, 84.44666290283203, 87.81145477294922, 91.17625427246094, 94.54104614257812]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 13.0, 4.0, 8.0, 6.0, 11.0, 8.0, 18.0, 14.0, 21.0, 27.0, 18.0, 30.0, 39.0, 32.0, 45.0, 46.0, 41.0, 51.0, 53.0, 37.0, 48.0, 52.0, 46.0, 42.0, 31.0, 29.0, 39.0, 24.0, 27.0, 25.0, 18.0, 15.0, 17.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.33171081542969, -83.55594635009766, -80.78018951416016, -78.00442504882812, -75.2286605834961, -72.45289611816406, -69.67713928222656, -66.90137481689453, -64.1256103515625, -61.349849700927734, -58.5740852355957, -55.79832458496094, -53.022560119628906, -50.24679946899414, -47.471038818359375, -44.695274353027344, -41.919517517089844, -39.14375686645508, -36.36799240112305, -33.59223175048828, -30.816469192504883, -28.040706634521484, -25.26494598388672, -22.48918342590332, -19.713420867919922, -16.937658309936523, -14.161896705627441, -11.38613510131836, -8.610372543334961, -5.8346099853515625, -3.058849334716797, -0.28308677673339844, 2.49267578125, 5.26843786239624, 8.04419994354248, 10.819961547851562, 13.595724105834961, 16.37148666381836, 19.147247314453125, 21.923009872436523, 24.698772430419922, 27.47453498840332, 30.25029754638672, 33.026058197021484, 35.80181884765625, 38.57758331298828, 41.35334396362305, 44.12910461425781, 46.904869079589844, 49.68062973022461, 52.45639419555664, 55.232154846191406, 58.00791931152344, 60.7836799621582, 63.55944061279297, 66.335205078125, 69.1109619140625, 71.88672637939453, 74.66248321533203, 77.43824768066406, 80.2140121459961, 82.98977661132812, 85.76553344726562, 88.54129791259766, 91.31706237792969]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 3.0, 12.0, 20.0, 24.0, 40.0, 56.0, 95.0, 172.0, 307.0, 633.0, 1410.0, 3474.0, 11161.0, 77116.0, 4062617.0, 26438.0, 6407.0, 2262.0, 981.0, 483.0, 223.0, 133.0, 71.0, 45.0, 29.0, 17.0, 15.0, 7.0, 6.0, 3.0, 8.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.5, -34.49365234375, -33.4873046875, -32.48095703125, -31.474609375, -30.46826171875, -29.4619140625, -28.45556640625, -27.44921875, -26.44287109375, -25.4365234375, -24.43017578125, -23.423828125, -22.41748046875, -21.4111328125, -20.40478515625, -19.3984375, -18.39208984375, -17.3857421875, -16.37939453125, -15.373046875, -14.36669921875, -13.3603515625, -12.35400390625, -11.34765625, -10.34130859375, -9.3349609375, -8.32861328125, -7.322265625, -6.31591796875, -5.3095703125, -4.30322265625, -3.296875, -2.29052734375, -1.2841796875, -0.27783203125, 0.728515625, 1.73486328125, 2.7412109375, 3.74755859375, 4.75390625, 5.76025390625, 6.7666015625, 7.77294921875, 8.779296875, 9.78564453125, 10.7919921875, 11.79833984375, 12.8046875, 13.81103515625, 14.8173828125, 15.82373046875, 16.830078125, 17.83642578125, 18.8427734375, 19.84912109375, 20.85546875, 21.86181640625, 22.8681640625, 23.87451171875, 24.880859375, 25.88720703125, 26.8935546875, 27.89990234375, 28.90625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 14.0, 15.0, 16.0, 26.0, 36.0, 47.0, 56.0, 37.0, 68.0, 67.0, 74.0, 72.0, 72.0, 60.0, 71.0, 49.0, 36.0, 43.0, 37.0, 23.0, 12.0, 15.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2318115234375, -7.014404296875, -6.7969970703125, -6.57958984375, -6.3621826171875, -6.144775390625, -5.9273681640625, -5.7099609375, -5.4925537109375, -5.275146484375, -5.0577392578125, -4.84033203125, -4.6229248046875, -4.405517578125, -4.1881103515625, -3.970703125, -3.7532958984375, -3.535888671875, -3.3184814453125, -3.10107421875, -2.8836669921875, -2.666259765625, -2.4488525390625, -2.2314453125, -2.0140380859375, -1.796630859375, -1.5792236328125, -1.36181640625, -1.1444091796875, -0.927001953125, -0.7095947265625, -0.4921875, -0.2747802734375, -0.057373046875, 0.1600341796875, 0.37744140625, 0.5948486328125, 0.812255859375, 1.0296630859375, 1.2470703125, 1.4644775390625, 1.681884765625, 1.8992919921875, 2.11669921875, 2.3341064453125, 2.551513671875, 2.7689208984375, 2.986328125, 3.2037353515625, 3.421142578125, 3.6385498046875, 3.85595703125, 4.0733642578125, 4.290771484375, 4.5081787109375, 4.7255859375, 4.9429931640625, 5.160400390625, 5.3778076171875, 5.59521484375, 5.8126220703125, 6.030029296875, 6.2474365234375, 6.46484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 15.0, 21.0, 17.0, 34.0, 49.0, 59.0, 80.0, 96.0, 121.0, 145.0, 205.0, 311.0, 410.0, 674.0, 1069.0, 1710.0, 3423.0, 8449.0, 32443.0, 3918431.0, 193354.0, 19882.0, 6223.0, 2716.0, 1506.0, 868.0, 546.0, 378.0, 254.0, 186.0, 149.0, 118.0, 87.0, 57.0, 35.0, 39.0, 29.0, 21.0, 18.0, 10.0, 9.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.0126953125, -18.353515625, -17.6943359375, -17.03515625, -16.3759765625, -15.716796875, -15.0576171875, -14.3984375, -13.7392578125, -13.080078125, -12.4208984375, -11.76171875, -11.1025390625, -10.443359375, -9.7841796875, -9.125, -8.4658203125, -7.806640625, -7.1474609375, -6.48828125, -5.8291015625, -5.169921875, -4.5107421875, -3.8515625, -3.1923828125, -2.533203125, -1.8740234375, -1.21484375, -0.5556640625, 0.103515625, 0.7626953125, 1.421875, 2.0810546875, 2.740234375, 3.3994140625, 4.05859375, 4.7177734375, 5.376953125, 6.0361328125, 6.6953125, 7.3544921875, 8.013671875, 8.6728515625, 9.33203125, 9.9912109375, 10.650390625, 11.3095703125, 11.96875, 12.6279296875, 13.287109375, 13.9462890625, 14.60546875, 15.2646484375, 15.923828125, 16.5830078125, 17.2421875, 17.9013671875, 18.560546875, 19.2197265625, 19.87890625, 20.5380859375, 21.197265625, 21.8564453125, 22.515625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 6.0, 10.0, 17.0, 27.0, 66.0, 188.0, 3438.0, 162.0, 62.0, 33.0, 22.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53125, -5.37982177734375, -5.2283935546875, -5.07696533203125, -4.925537109375, -4.77410888671875, -4.6226806640625, -4.47125244140625, -4.31982421875, -4.16839599609375, -4.0169677734375, -3.86553955078125, -3.714111328125, -3.56268310546875, -3.4112548828125, -3.25982666015625, -3.1083984375, -2.95697021484375, -2.8055419921875, -2.65411376953125, -2.502685546875, -2.35125732421875, -2.1998291015625, -2.04840087890625, -1.89697265625, -1.74554443359375, -1.5941162109375, -1.44268798828125, -1.291259765625, -1.13983154296875, -0.9884033203125, -0.83697509765625, -0.685546875, -0.53411865234375, -0.3826904296875, -0.23126220703125, -0.079833984375, 0.07159423828125, 0.2230224609375, 0.37445068359375, 0.52587890625, 0.67730712890625, 0.8287353515625, 0.98016357421875, 1.131591796875, 1.28302001953125, 1.4344482421875, 1.58587646484375, 1.7373046875, 1.88873291015625, 2.0401611328125, 2.19158935546875, 2.343017578125, 2.49444580078125, 2.6458740234375, 2.79730224609375, 2.94873046875, 3.10015869140625, 3.2515869140625, 3.40301513671875, 3.554443359375, 3.70587158203125, 3.8572998046875, 4.00872802734375, 4.16015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 15.0, 23.0, 35.0, 45.0, 69.0, 78.0, 119.0, 119.0, 129.0, 111.0, 83.0, 60.0, 32.0, 16.0, 19.0, 9.0, 6.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.163795471191406, -18.525264739990234, -17.886735916137695, -17.248205184936523, -16.609676361083984, -15.971145629882812, -15.332615852355957, -14.694086074829102, -14.05555534362793, -13.417025566101074, -12.778495788574219, -12.139965057373047, -11.501435279846191, -10.862905502319336, -10.22437572479248, -9.585845947265625, -8.94731616973877, -8.308786392211914, -7.6702561378479, -7.031726360321045, -6.393196105957031, -5.754666328430176, -5.11613655090332, -4.477606296539307, -3.839076519012451, -3.2005465030670166, -2.562016487121582, -1.9234867095947266, -1.284956693649292, -0.6464266777038574, -0.007896900177001953, 0.6306333541870117, 1.2691631317138672, 1.9076931476593018, 2.5462231636047363, 3.184752941131592, 3.8232829570770264, 4.461812973022461, 5.100342750549316, 5.73887300491333, 6.3774027824401855, 7.015932559967041, 7.654462814331055, 8.29299259185791, 8.931522369384766, 9.570053100585938, 10.208581924438477, 10.847112655639648, 11.485642433166504, 12.12417221069336, 12.762701988220215, 13.40123176574707, 14.039762496948242, 14.678292274475098, 15.316822052001953, 15.955352783203125, 16.593881607055664, 17.232412338256836, 17.870941162109375, 18.509471893310547, 19.148000717163086, 19.786531448364258, 20.425060272216797, 21.06359100341797, 21.70212173461914]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 7.0, 5.0, 15.0, 10.0, 15.0, 25.0, 23.0, 17.0, 21.0, 36.0, 33.0, 34.0, 30.0, 45.0, 31.0, 49.0, 29.0, 43.0, 26.0, 34.0, 45.0, 49.0, 35.0, 36.0, 32.0, 39.0, 41.0, 27.0, 18.0, 23.0, 20.0, 18.0, 13.0, 12.0, 5.0, 14.0, 8.0, 1.0, 4.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-8.571041107177734, -8.310115814208984, -8.049189567565918, -7.78826379776001, -7.527338027954102, -7.266412258148193, -7.005486488342285, -6.744560718536377, -6.483634948730469, -6.2227091789245605, -5.961783409118652, -5.700857639312744, -5.439931869506836, -5.179006099700928, -4.9180803298950195, -4.657154560089111, -4.396228790283203, -4.135303020477295, -3.8743772506713867, -3.6134514808654785, -3.3525257110595703, -3.091599941253662, -2.830674171447754, -2.5697484016418457, -2.3088226318359375, -2.0478968620300293, -1.786971092224121, -1.526045322418213, -1.2651195526123047, -1.0041937828063965, -0.7432680130004883, -0.4823422431945801, -0.22141742706298828, 0.03950834274291992, 0.3004341125488281, 0.5613598823547363, 0.8222856521606445, 1.0832114219665527, 1.344137191772461, 1.6050629615783691, 1.8659887313842773, 2.1269145011901855, 2.3878402709960938, 2.648766040802002, 2.90969181060791, 3.1706175804138184, 3.4315433502197266, 3.6924691200256348, 3.953394889831543, 4.214320659637451, 4.475246429443359, 4.736172199249268, 4.997097969055176, 5.258023738861084, 5.518949508666992, 5.7798752784729, 6.040801048278809, 6.301726818084717, 6.562652587890625, 6.823578357696533, 7.084504127502441, 7.34542989730835, 7.606355667114258, 7.867281436920166, 8.128207206726074]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 10.0, 7.0, 17.0, 31.0, 24.0, 45.0, 56.0, 89.0, 126.0, 178.0, 275.0, 459.0, 730.0, 1185.0, 2123.0, 3960.0, 7828.0, 15815.0, 33060.0, 70314.0, 145065.0, 254923.0, 247177.0, 136625.0, 66593.0, 30867.0, 14962.0, 7121.0, 3621.0, 2056.0, 1216.0, 637.0, 479.0, 298.0, 186.0, 122.0, 89.0, 55.0, 32.0, 28.0, 22.0, 16.0, 6.0, 5.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 3.0], "bins": [-7.18359375, -6.9720458984375, -6.760498046875, -6.5489501953125, -6.33740234375, -6.1258544921875, -5.914306640625, -5.7027587890625, -5.4912109375, -5.2796630859375, -5.068115234375, -4.8565673828125, -4.64501953125, -4.4334716796875, -4.221923828125, -4.0103759765625, -3.798828125, -3.5872802734375, -3.375732421875, -3.1641845703125, -2.95263671875, -2.7410888671875, -2.529541015625, -2.3179931640625, -2.1064453125, -1.8948974609375, -1.683349609375, -1.4718017578125, -1.26025390625, -1.0487060546875, -0.837158203125, -0.6256103515625, -0.4140625, -0.2025146484375, 0.009033203125, 0.2205810546875, 0.43212890625, 0.6436767578125, 0.855224609375, 1.0667724609375, 1.2783203125, 1.4898681640625, 1.701416015625, 1.9129638671875, 2.12451171875, 2.3360595703125, 2.547607421875, 2.7591552734375, 2.970703125, 3.1822509765625, 3.393798828125, 3.6053466796875, 3.81689453125, 4.0284423828125, 4.239990234375, 4.4515380859375, 4.6630859375, 4.8746337890625, 5.086181640625, 5.2977294921875, 5.50927734375, 5.7208251953125, 5.932373046875, 6.1439208984375, 6.35546875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 14.0, 14.0, 12.0, 20.0, 29.0, 33.0, 48.0, 44.0, 36.0, 59.0, 66.0, 60.0, 59.0, 69.0, 80.0, 54.0, 52.0, 48.0, 36.0, 39.0, 35.0, 28.0, 14.0, 12.0, 10.0, 11.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.54296875, -7.32623291015625, -7.1094970703125, -6.89276123046875, -6.676025390625, -6.45928955078125, -6.2425537109375, -6.02581787109375, -5.80908203125, -5.59234619140625, -5.3756103515625, -5.15887451171875, -4.942138671875, -4.72540283203125, -4.5086669921875, -4.29193115234375, -4.0751953125, -3.85845947265625, -3.6417236328125, -3.42498779296875, -3.208251953125, -2.99151611328125, -2.7747802734375, -2.55804443359375, -2.34130859375, -2.12457275390625, -1.9078369140625, -1.69110107421875, -1.474365234375, -1.25762939453125, -1.0408935546875, -0.82415771484375, -0.607421875, -0.39068603515625, -0.1739501953125, 0.04278564453125, 0.259521484375, 0.47625732421875, 0.6929931640625, 0.90972900390625, 1.12646484375, 1.34320068359375, 1.5599365234375, 1.77667236328125, 1.993408203125, 2.21014404296875, 2.4268798828125, 2.64361572265625, 2.8603515625, 3.07708740234375, 3.2938232421875, 3.51055908203125, 3.727294921875, 3.94403076171875, 4.1607666015625, 4.37750244140625, 4.59423828125, 4.81097412109375, 5.0277099609375, 5.24444580078125, 5.461181640625, 5.67791748046875, 5.8946533203125, 6.11138916015625, 6.328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 1.0, 11.0, 15.0, 14.0, 25.0, 28.0, 45.0, 55.0, 82.0, 136.0, 208.0, 236.0, 395.0, 559.0, 937.0, 1643.0, 4575.0, 25469.0, 282682.0, 651439.0, 65675.0, 8704.0, 2457.0, 1123.0, 689.0, 385.0, 273.0, 224.0, 135.0, 99.0, 69.0, 36.0, 26.0, 29.0, 21.0, 8.0, 10.0, 11.0, 5.0, 5.0, 8.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.25, -16.697265625, -16.14453125, -15.591796875, -15.0390625, -14.486328125, -13.93359375, -13.380859375, -12.828125, -12.275390625, -11.72265625, -11.169921875, -10.6171875, -10.064453125, -9.51171875, -8.958984375, -8.40625, -7.853515625, -7.30078125, -6.748046875, -6.1953125, -5.642578125, -5.08984375, -4.537109375, -3.984375, -3.431640625, -2.87890625, -2.326171875, -1.7734375, -1.220703125, -0.66796875, -0.115234375, 0.4375, 0.990234375, 1.54296875, 2.095703125, 2.6484375, 3.201171875, 3.75390625, 4.306640625, 4.859375, 5.412109375, 5.96484375, 6.517578125, 7.0703125, 7.623046875, 8.17578125, 8.728515625, 9.28125, 9.833984375, 10.38671875, 10.939453125, 11.4921875, 12.044921875, 12.59765625, 13.150390625, 13.703125, 14.255859375, 14.80859375, 15.361328125, 15.9140625, 16.466796875, 17.01953125, 17.572265625, 18.125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 8.0, 12.0, 12.0, 10.0, 15.0, 29.0, 23.0, 20.0, 26.0, 26.0, 41.0, 31.0, 47.0, 52.0, 62.0, 48.0, 51.0, 41.0, 54.0, 39.0, 59.0, 40.0, 52.0, 34.0, 37.0, 22.0, 25.0, 22.0, 19.0, 10.0, 10.0, 7.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.125, -22.43505859375, -21.7451171875, -21.05517578125, -20.365234375, -19.67529296875, -18.9853515625, -18.29541015625, -17.60546875, -16.91552734375, -16.2255859375, -15.53564453125, -14.845703125, -14.15576171875, -13.4658203125, -12.77587890625, -12.0859375, -11.39599609375, -10.7060546875, -10.01611328125, -9.326171875, -8.63623046875, -7.9462890625, -7.25634765625, -6.56640625, -5.87646484375, -5.1865234375, -4.49658203125, -3.806640625, -3.11669921875, -2.4267578125, -1.73681640625, -1.046875, -0.35693359375, 0.3330078125, 1.02294921875, 1.712890625, 2.40283203125, 3.0927734375, 3.78271484375, 4.47265625, 5.16259765625, 5.8525390625, 6.54248046875, 7.232421875, 7.92236328125, 8.6123046875, 9.30224609375, 9.9921875, 10.68212890625, 11.3720703125, 12.06201171875, 12.751953125, 13.44189453125, 14.1318359375, 14.82177734375, 15.51171875, 16.20166015625, 16.8916015625, 17.58154296875, 18.271484375, 18.96142578125, 19.6513671875, 20.34130859375, 21.03125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 13.0, 14.0, 22.0, 36.0, 50.0, 84.0, 158.0, 219.0, 485.0, 1095.0, 3364.0, 14487.0, 126645.0, 772675.0, 110547.0, 13371.0, 3111.0, 1089.0, 464.0, 223.0, 126.0, 81.0, 59.0, 39.0, 22.0, 15.0, 14.0, 11.0, 10.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0390625, -7.79150390625, -7.5439453125, -7.29638671875, -7.048828125, -6.80126953125, -6.5537109375, -6.30615234375, -6.05859375, -5.81103515625, -5.5634765625, -5.31591796875, -5.068359375, -4.82080078125, -4.5732421875, -4.32568359375, -4.078125, -3.83056640625, -3.5830078125, -3.33544921875, -3.087890625, -2.84033203125, -2.5927734375, -2.34521484375, -2.09765625, -1.85009765625, -1.6025390625, -1.35498046875, -1.107421875, -0.85986328125, -0.6123046875, -0.36474609375, -0.1171875, 0.13037109375, 0.3779296875, 0.62548828125, 0.873046875, 1.12060546875, 1.3681640625, 1.61572265625, 1.86328125, 2.11083984375, 2.3583984375, 2.60595703125, 2.853515625, 3.10107421875, 3.3486328125, 3.59619140625, 3.84375, 4.09130859375, 4.3388671875, 4.58642578125, 4.833984375, 5.08154296875, 5.3291015625, 5.57666015625, 5.82421875, 6.07177734375, 6.3193359375, 6.56689453125, 6.814453125, 7.06201171875, 7.3095703125, 7.55712890625, 7.8046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 5.0, 3.0, 9.0, 3.0, 15.0, 15.0, 13.0, 14.0, 33.0, 50.0, 60.0, 60.0, 64.0, 101.0, 128.0, 82.0, 75.0, 69.0, 37.0, 40.0, 23.0, 22.0, 11.0, 12.0, 12.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0008478164672851562, -0.000820748507976532, -0.0007936805486679077, -0.0007666125893592834, -0.0007395446300506592, -0.0007124766707420349, -0.0006854087114334106, -0.0006583407521247864, -0.0006312727928161621, -0.0006042048335075378, -0.0005771368741989136, -0.0005500689148902893, -0.000523000955581665, -0.0004959329962730408, -0.0004688650369644165, -0.00044179707765579224, -0.00041472911834716797, -0.0003876611590385437, -0.00036059319972991943, -0.00033352524042129517, -0.0003064572811126709, -0.00027938932180404663, -0.00025232136249542236, -0.0002252534031867981, -0.00019818544387817383, -0.00017111748456954956, -0.0001440495252609253, -0.00011698156595230103, -8.991360664367676e-05, -6.284564733505249e-05, -3.577768802642822e-05, -8.709728717803955e-06, 1.8358230590820312e-05, 4.542618989944458e-05, 7.249414920806885e-05, 9.956210851669312e-05, 0.00012663006782531738, 0.00015369802713394165, 0.00018076598644256592, 0.00020783394575119019, 0.00023490190505981445, 0.0002619698643684387, 0.000289037823677063, 0.00031610578298568726, 0.0003431737422943115, 0.0003702417016029358, 0.00039730966091156006, 0.0004243776202201843, 0.0004514455795288086, 0.00047851353883743286, 0.0005055814981460571, 0.0005326494574546814, 0.0005597174167633057, 0.0005867853760719299, 0.0006138533353805542, 0.0006409212946891785, 0.0006679892539978027, 0.000695057213306427, 0.0007221251726150513, 0.0007491931319236755, 0.0007762610912322998, 0.0008033290505409241, 0.0008303970098495483, 0.0008574649691581726, 0.0008845329284667969]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 5.0, 6.0, 24.0, 28.0, 58.0, 91.0, 173.0, 428.0, 1266.0, 4988.0, 57650.0, 879033.0, 95882.0, 6529.0, 1420.0, 503.0, 210.0, 101.0, 71.0, 32.0, 18.0, 15.0, 7.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.484375, -14.098876953125, -13.71337890625, -13.327880859375, -12.9423828125, -12.556884765625, -12.17138671875, -11.785888671875, -11.400390625, -11.014892578125, -10.62939453125, -10.243896484375, -9.8583984375, -9.472900390625, -9.08740234375, -8.701904296875, -8.31640625, -7.930908203125, -7.54541015625, -7.159912109375, -6.7744140625, -6.388916015625, -6.00341796875, -5.617919921875, -5.232421875, -4.846923828125, -4.46142578125, -4.075927734375, -3.6904296875, -3.304931640625, -2.91943359375, -2.533935546875, -2.1484375, -1.762939453125, -1.37744140625, -0.991943359375, -0.6064453125, -0.220947265625, 0.16455078125, 0.550048828125, 0.935546875, 1.321044921875, 1.70654296875, 2.092041015625, 2.4775390625, 2.863037109375, 3.24853515625, 3.634033203125, 4.01953125, 4.405029296875, 4.79052734375, 5.176025390625, 5.5615234375, 5.947021484375, 6.33251953125, 6.718017578125, 7.103515625, 7.489013671875, 7.87451171875, 8.260009765625, 8.6455078125, 9.031005859375, 9.41650390625, 9.802001953125, 10.1875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 10.0, 15.0, 19.0, 34.0, 52.0, 60.0, 81.0, 90.0, 91.0, 113.0, 99.0, 84.0, 62.0, 47.0, 48.0, 25.0, 16.0, 14.0, 11.0, 6.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-9.2578125, -9.04412841796875, -8.8304443359375, -8.61676025390625, -8.403076171875, -8.18939208984375, -7.9757080078125, -7.76202392578125, -7.54833984375, -7.33465576171875, -7.1209716796875, -6.90728759765625, -6.693603515625, -6.47991943359375, -6.2662353515625, -6.05255126953125, -5.8388671875, -5.62518310546875, -5.4114990234375, -5.19781494140625, -4.984130859375, -4.77044677734375, -4.5567626953125, -4.34307861328125, -4.12939453125, -3.91571044921875, -3.7020263671875, -3.48834228515625, -3.274658203125, -3.06097412109375, -2.8472900390625, -2.63360595703125, -2.419921875, -2.20623779296875, -1.9925537109375, -1.77886962890625, -1.565185546875, -1.35150146484375, -1.1378173828125, -0.92413330078125, -0.71044921875, -0.49676513671875, -0.2830810546875, -0.06939697265625, 0.144287109375, 0.35797119140625, 0.5716552734375, 0.78533935546875, 0.9990234375, 1.21270751953125, 1.4263916015625, 1.64007568359375, 1.853759765625, 2.06744384765625, 2.2811279296875, 2.49481201171875, 2.70849609375, 2.92218017578125, 3.1358642578125, 3.34954833984375, 3.563232421875, 3.77691650390625, 3.9906005859375, 4.20428466796875, 4.41796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 11.0, 21.0, 47.0, 79.0, 163.0, 209.0, 206.0, 116.0, 72.0, 54.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-201.981689453125, -197.05015563964844, -192.11862182617188, -187.1870880126953, -182.25555419921875, -177.3240203857422, -172.39248657226562, -167.46095275878906, -162.5294189453125, -157.59788513183594, -152.66635131835938, -147.7348175048828, -142.80328369140625, -137.8717498779297, -132.94021606445312, -128.00868225097656, -123.07714080810547, -118.1456069946289, -113.21407318115234, -108.28253936767578, -103.35100555419922, -98.41947174072266, -93.48793029785156, -88.556396484375, -83.62486267089844, -78.69332885742188, -73.76179504394531, -68.83026123046875, -63.89872741699219, -58.967193603515625, -54.0356559753418, -49.104122161865234, -44.17259216308594, -39.241058349609375, -34.30952453613281, -29.377988815307617, -24.446455001831055, -19.514921188354492, -14.583385467529297, -9.651851654052734, -4.720317840576172, 0.21121644973754883, 5.1427507400512695, 10.074285507202148, 15.005819320678711, 19.937353134155273, 24.86888885498047, 29.80042266845703, 34.731956481933594, 39.663490295410156, 44.59502410888672, 49.52655792236328, 54.458091735839844, 59.389625549316406, 64.3211669921875, 69.25270080566406, 74.18423461914062, 79.11576843261719, 84.04730224609375, 88.97883605957031, 93.91036987304688, 98.84190368652344, 103.7734375, 108.70497131347656, 113.63650512695312]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 6.0, 5.0, 22.0, 15.0, 12.0, 21.0, 24.0, 24.0, 40.0, 36.0, 30.0, 34.0, 42.0, 51.0, 51.0, 50.0, 54.0, 52.0, 48.0, 32.0, 36.0, 32.0, 41.0, 43.0, 31.0, 31.0, 21.0, 14.0, 22.0, 11.0, 10.0, 12.0, 6.0, 9.0, 1.0, 3.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-92.803955078125, -90.09944152832031, -87.3949203491211, -84.6904067993164, -81.98589324951172, -79.2813720703125, -76.57685852050781, -73.87234497070312, -71.1678237915039, -68.46331024169922, -65.7587890625, -63.05427551269531, -60.34975814819336, -57.645240783691406, -54.94072723388672, -52.236209869384766, -49.53169631958008, -46.827178955078125, -44.12266540527344, -41.418148040771484, -38.71363067626953, -36.009117126464844, -33.30459976196289, -30.600082397460938, -27.895566940307617, -25.191051483154297, -22.486534118652344, -19.782018661499023, -17.077503204345703, -14.37298583984375, -11.66847038269043, -8.963953018188477, -6.259437561035156, -3.5549213886260986, -0.850405216217041, 1.8541107177734375, 4.558627128601074, 7.263143539428711, 9.967658996582031, 12.672176361083984, 15.376691818237305, 18.081207275390625, 20.785724639892578, 23.4902400970459, 26.19475555419922, 28.899272918701172, 31.603788375854492, 34.30830383300781, 37.012821197509766, 39.71733856201172, 42.421852111816406, 45.12636947631836, 47.83088684082031, 50.535400390625, 53.23991775512695, 55.944435119628906, 58.648948669433594, 61.35346603393555, 64.0579833984375, 66.76249694824219, 69.46701049804688, 72.1715316772461, 74.87604522705078, 77.58056640625, 80.28507995605469]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 7.0, 11.0, 12.0, 11.0, 36.0, 41.0, 68.0, 118.0, 200.0, 489.0, 1089.0, 3818.0, 20695.0, 3959876.0, 191658.0, 11932.0, 2550.0, 883.0, 357.0, 181.0, 89.0, 58.0, 37.0, 20.0, 15.0, 9.0, 10.0, 8.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.328125, -28.311767578125, -27.29541015625, -26.279052734375, -25.2626953125, -24.246337890625, -23.22998046875, -22.213623046875, -21.197265625, -20.180908203125, -19.16455078125, -18.148193359375, -17.1318359375, -16.115478515625, -15.09912109375, -14.082763671875, -13.06640625, -12.050048828125, -11.03369140625, -10.017333984375, -9.0009765625, -7.984619140625, -6.96826171875, -5.951904296875, -4.935546875, -3.919189453125, -2.90283203125, -1.886474609375, -0.8701171875, 0.146240234375, 1.16259765625, 2.178955078125, 3.1953125, 4.211669921875, 5.22802734375, 6.244384765625, 7.2607421875, 8.277099609375, 9.29345703125, 10.309814453125, 11.326171875, 12.342529296875, 13.35888671875, 14.375244140625, 15.3916015625, 16.407958984375, 17.42431640625, 18.440673828125, 19.45703125, 20.473388671875, 21.48974609375, 22.506103515625, 23.5224609375, 24.538818359375, 25.55517578125, 26.571533203125, 27.587890625, 28.604248046875, 29.62060546875, 30.636962890625, 31.6533203125, 32.669677734375, 33.68603515625, 34.702392578125, 35.71875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 4.0, 7.0, 12.0, 17.0, 18.0, 27.0, 42.0, 35.0, 59.0, 55.0, 66.0, 73.0, 69.0, 61.0, 85.0, 73.0, 49.0, 42.0, 44.0, 38.0, 23.0, 21.0, 18.0, 16.0, 8.0, 17.0, 8.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.546875, -7.32611083984375, -7.1053466796875, -6.88458251953125, -6.663818359375, -6.44305419921875, -6.2222900390625, -6.00152587890625, -5.78076171875, -5.55999755859375, -5.3392333984375, -5.11846923828125, -4.897705078125, -4.67694091796875, -4.4561767578125, -4.23541259765625, -4.0146484375, -3.79388427734375, -3.5731201171875, -3.35235595703125, -3.131591796875, -2.91082763671875, -2.6900634765625, -2.46929931640625, -2.24853515625, -2.02777099609375, -1.8070068359375, -1.58624267578125, -1.365478515625, -1.14471435546875, -0.9239501953125, -0.70318603515625, -0.482421875, -0.26165771484375, -0.0408935546875, 0.17987060546875, 0.400634765625, 0.62139892578125, 0.8421630859375, 1.06292724609375, 1.28369140625, 1.50445556640625, 1.7252197265625, 1.94598388671875, 2.166748046875, 2.38751220703125, 2.6082763671875, 2.82904052734375, 3.0498046875, 3.27056884765625, 3.4913330078125, 3.71209716796875, 3.932861328125, 4.15362548828125, 4.3743896484375, 4.59515380859375, 4.81591796875, 5.03668212890625, 5.2574462890625, 5.47821044921875, 5.698974609375, 5.91973876953125, 6.1405029296875, 6.36126708984375, 6.58203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 17.0, 27.0, 23.0, 35.0, 37.0, 51.0, 76.0, 132.0, 143.0, 234.0, 380.0, 674.0, 1225.0, 2625.0, 6684.0, 22562.0, 312253.0, 3794708.0, 36549.0, 8799.0, 3298.0, 1528.0, 739.0, 433.0, 297.0, 189.0, 119.0, 103.0, 79.0, 55.0, 35.0, 32.0, 30.0, 18.0, 20.0, 6.0, 8.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.671875, -21.05517578125, -20.4384765625, -19.82177734375, -19.205078125, -18.58837890625, -17.9716796875, -17.35498046875, -16.73828125, -16.12158203125, -15.5048828125, -14.88818359375, -14.271484375, -13.65478515625, -13.0380859375, -12.42138671875, -11.8046875, -11.18798828125, -10.5712890625, -9.95458984375, -9.337890625, -8.72119140625, -8.1044921875, -7.48779296875, -6.87109375, -6.25439453125, -5.6376953125, -5.02099609375, -4.404296875, -3.78759765625, -3.1708984375, -2.55419921875, -1.9375, -1.32080078125, -0.7041015625, -0.08740234375, 0.529296875, 1.14599609375, 1.7626953125, 2.37939453125, 2.99609375, 3.61279296875, 4.2294921875, 4.84619140625, 5.462890625, 6.07958984375, 6.6962890625, 7.31298828125, 7.9296875, 8.54638671875, 9.1630859375, 9.77978515625, 10.396484375, 11.01318359375, 11.6298828125, 12.24658203125, 12.86328125, 13.47998046875, 14.0966796875, 14.71337890625, 15.330078125, 15.94677734375, 16.5634765625, 17.18017578125, 17.796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 10.0, 10.0, 12.0, 31.0, 50.0, 216.0, 3172.0, 375.0, 94.0, 44.0, 19.0, 12.0, 8.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3011474609375, -8.000732421875, -7.7003173828125, -7.39990234375, -7.0994873046875, -6.799072265625, -6.4986572265625, -6.1982421875, -5.8978271484375, -5.597412109375, -5.2969970703125, -4.99658203125, -4.6961669921875, -4.395751953125, -4.0953369140625, -3.794921875, -3.4945068359375, -3.194091796875, -2.8936767578125, -2.59326171875, -2.2928466796875, -1.992431640625, -1.6920166015625, -1.3916015625, -1.0911865234375, -0.790771484375, -0.4903564453125, -0.18994140625, 0.1104736328125, 0.410888671875, 0.7113037109375, 1.01171875, 1.3121337890625, 1.612548828125, 1.9129638671875, 2.21337890625, 2.5137939453125, 2.814208984375, 3.1146240234375, 3.4150390625, 3.7154541015625, 4.015869140625, 4.3162841796875, 4.61669921875, 4.9171142578125, 5.217529296875, 5.5179443359375, 5.818359375, 6.1187744140625, 6.419189453125, 6.7196044921875, 7.02001953125, 7.3204345703125, 7.620849609375, 7.9212646484375, 8.2216796875, 8.5220947265625, 8.822509765625, 9.1229248046875, 9.42333984375, 9.7237548828125, 10.024169921875, 10.3245849609375, 10.625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 14.0, 26.0, 13.0, 35.0, 35.0, 51.0, 76.0, 107.0, 93.0, 106.0, 93.0, 78.0, 68.0, 44.0, 43.0, 24.0, 17.0, 10.0, 12.0, 9.0, 6.0, 7.0, 0.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.830476760864258, -25.04753303527832, -24.264591217041016, -23.481647491455078, -22.69870376586914, -21.915760040283203, -21.132816314697266, -20.34987449645996, -19.566930770874023, -18.783987045288086, -18.00104522705078, -17.218101501464844, -16.435157775878906, -15.652214050292969, -14.869271278381348, -14.086328506469727, -13.303384780883789, -12.520441055297852, -11.73749828338623, -10.95455551147461, -10.171611785888672, -9.388668060302734, -8.605725288391113, -7.822782039642334, -7.039838790893555, -6.256895542144775, -5.473952293395996, -4.691009044647217, -3.9080657958984375, -3.125122547149658, -2.342179298400879, -1.5592360496520996, -0.7762947082519531, 0.006648540496826172, 0.7895917892456055, 1.5725350379943848, 2.355478286743164, 3.1384215354919434, 3.9213647842407227, 4.704308032989502, 5.487251281738281, 6.2701945304870605, 7.05313777923584, 7.836081027984619, 8.619024276733398, 9.401968002319336, 10.184910774230957, 10.967853546142578, 11.750797271728516, 12.533740997314453, 13.316683769226074, 14.099626541137695, 14.882570266723633, 15.66551399230957, 16.448455810546875, 17.231399536132812, 18.01434326171875, 18.797286987304688, 19.580230712890625, 20.36317253112793, 21.146116256713867, 21.929059982299805, 22.71200180053711, 23.494945526123047, 24.277889251708984]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 8.0, 2.0, 4.0, 3.0, 6.0, 7.0, 10.0, 9.0, 14.0, 14.0, 21.0, 20.0, 37.0, 31.0, 37.0, 33.0, 30.0, 32.0, 43.0, 45.0, 39.0, 42.0, 45.0, 47.0, 50.0, 43.0, 42.0, 51.0, 23.0, 28.0, 40.0, 32.0, 19.0, 25.0, 15.0, 12.0, 11.0, 6.0, 10.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.05459976196289, -15.5525541305542, -15.050508499145508, -14.548463821411133, -14.046418190002441, -13.54437255859375, -13.042326927185059, -12.540281295776367, -12.038236618041992, -11.5361909866333, -11.03414535522461, -10.532100677490234, -10.030055046081543, -9.528009414672852, -9.02596378326416, -8.523918151855469, -8.021872520446777, -7.519826889038086, -7.017781734466553, -6.515736103057861, -6.013690948486328, -5.511645317077637, -5.009599685668945, -4.507554054260254, -4.005508899688721, -3.5034635066986084, -3.001418113708496, -2.4993724822998047, -1.9973270893096924, -1.49528169631958, -0.9932360649108887, -0.49119067192077637, 0.010854721069335938, 0.512900173664093, 1.01494562625885, 1.516991138458252, 2.0190365314483643, 2.5210819244384766, 3.023127555847168, 3.5251729488372803, 4.027218341827393, 4.529263973236084, 5.031309127807617, 5.533354759216309, 6.035400390625, 6.537445545196533, 7.039491176605225, 7.541536331176758, 8.04358196258545, 8.54562759399414, 9.047673225402832, 9.549718856811523, 10.051763534545898, 10.55380916595459, 11.055854797363281, 11.557900428771973, 12.059946060180664, 12.561991691589355, 13.064037322998047, 13.566082000732422, 14.068127632141113, 14.570173263549805, 15.072218894958496, 15.574264526367188, 16.076309204101562]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 10.0, 7.0, 18.0, 26.0, 23.0, 43.0, 73.0, 101.0, 172.0, 297.0, 484.0, 931.0, 1773.0, 3847.0, 9042.0, 22821.0, 60563.0, 160357.0, 373895.0, 254156.0, 97996.0, 36639.0, 14014.0, 5753.0, 2633.0, 1243.0, 635.0, 376.0, 209.0, 138.0, 81.0, 52.0, 41.0, 32.0, 23.0, 15.0, 7.0, 4.0, 5.0, 4.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.546875, -12.151611328125, -11.75634765625, -11.361083984375, -10.9658203125, -10.570556640625, -10.17529296875, -9.780029296875, -9.384765625, -8.989501953125, -8.59423828125, -8.198974609375, -7.8037109375, -7.408447265625, -7.01318359375, -6.617919921875, -6.22265625, -5.827392578125, -5.43212890625, -5.036865234375, -4.6416015625, -4.246337890625, -3.85107421875, -3.455810546875, -3.060546875, -2.665283203125, -2.27001953125, -1.874755859375, -1.4794921875, -1.084228515625, -0.68896484375, -0.293701171875, 0.1015625, 0.496826171875, 0.89208984375, 1.287353515625, 1.6826171875, 2.077880859375, 2.47314453125, 2.868408203125, 3.263671875, 3.658935546875, 4.05419921875, 4.449462890625, 4.8447265625, 5.239990234375, 5.63525390625, 6.030517578125, 6.42578125, 6.821044921875, 7.21630859375, 7.611572265625, 8.0068359375, 8.402099609375, 8.79736328125, 9.192626953125, 9.587890625, 9.983154296875, 10.37841796875, 10.773681640625, 11.1689453125, 11.564208984375, 11.95947265625, 12.354736328125, 12.75]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 5.0, 10.0, 14.0, 14.0, 22.0, 25.0, 43.0, 46.0, 42.0, 50.0, 62.0, 70.0, 80.0, 67.0, 67.0, 55.0, 69.0, 50.0, 40.0, 34.0, 26.0, 27.0, 15.0, 8.0, 13.0, 11.0, 9.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.578125, -7.356201171875, -7.13427734375, -6.912353515625, -6.6904296875, -6.468505859375, -6.24658203125, -6.024658203125, -5.802734375, -5.580810546875, -5.35888671875, -5.136962890625, -4.9150390625, -4.693115234375, -4.47119140625, -4.249267578125, -4.02734375, -3.805419921875, -3.58349609375, -3.361572265625, -3.1396484375, -2.917724609375, -2.69580078125, -2.473876953125, -2.251953125, -2.030029296875, -1.80810546875, -1.586181640625, -1.3642578125, -1.142333984375, -0.92041015625, -0.698486328125, -0.4765625, -0.254638671875, -0.03271484375, 0.189208984375, 0.4111328125, 0.633056640625, 0.85498046875, 1.076904296875, 1.298828125, 1.520751953125, 1.74267578125, 1.964599609375, 2.1865234375, 2.408447265625, 2.63037109375, 2.852294921875, 3.07421875, 3.296142578125, 3.51806640625, 3.739990234375, 3.9619140625, 4.183837890625, 4.40576171875, 4.627685546875, 4.849609375, 5.071533203125, 5.29345703125, 5.515380859375, 5.7373046875, 5.959228515625, 6.18115234375, 6.403076171875, 6.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 5.0, 14.0, 18.0, 24.0, 30.0, 36.0, 45.0, 72.0, 91.0, 129.0, 184.0, 303.0, 562.0, 963.0, 2424.0, 8647.0, 60738.0, 611007.0, 323041.0, 30764.0, 5486.0, 1748.0, 841.0, 440.0, 292.0, 181.0, 119.0, 96.0, 67.0, 45.0, 43.0, 16.0, 12.0, 14.0, 7.0, 12.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-22.625, -21.91455078125, -21.2041015625, -20.49365234375, -19.783203125, -19.07275390625, -18.3623046875, -17.65185546875, -16.94140625, -16.23095703125, -15.5205078125, -14.81005859375, -14.099609375, -13.38916015625, -12.6787109375, -11.96826171875, -11.2578125, -10.54736328125, -9.8369140625, -9.12646484375, -8.416015625, -7.70556640625, -6.9951171875, -6.28466796875, -5.57421875, -4.86376953125, -4.1533203125, -3.44287109375, -2.732421875, -2.02197265625, -1.3115234375, -0.60107421875, 0.109375, 0.81982421875, 1.5302734375, 2.24072265625, 2.951171875, 3.66162109375, 4.3720703125, 5.08251953125, 5.79296875, 6.50341796875, 7.2138671875, 7.92431640625, 8.634765625, 9.34521484375, 10.0556640625, 10.76611328125, 11.4765625, 12.18701171875, 12.8974609375, 13.60791015625, 14.318359375, 15.02880859375, 15.7392578125, 16.44970703125, 17.16015625, 17.87060546875, 18.5810546875, 19.29150390625, 20.001953125, 20.71240234375, 21.4228515625, 22.13330078125, 22.84375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 11.0, 8.0, 11.0, 9.0, 12.0, 9.0, 25.0, 24.0, 21.0, 23.0, 25.0, 30.0, 35.0, 49.0, 32.0, 53.0, 30.0, 47.0, 43.0, 41.0, 39.0, 56.0, 34.0, 45.0, 33.0, 44.0, 32.0, 43.0, 18.0, 16.0, 21.0, 18.0, 15.0, 10.0, 9.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -15.87451171875, -15.2802734375, -14.68603515625, -14.091796875, -13.49755859375, -12.9033203125, -12.30908203125, -11.71484375, -11.12060546875, -10.5263671875, -9.93212890625, -9.337890625, -8.74365234375, -8.1494140625, -7.55517578125, -6.9609375, -6.36669921875, -5.7724609375, -5.17822265625, -4.583984375, -3.98974609375, -3.3955078125, -2.80126953125, -2.20703125, -1.61279296875, -1.0185546875, -0.42431640625, 0.169921875, 0.76416015625, 1.3583984375, 1.95263671875, 2.546875, 3.14111328125, 3.7353515625, 4.32958984375, 4.923828125, 5.51806640625, 6.1123046875, 6.70654296875, 7.30078125, 7.89501953125, 8.4892578125, 9.08349609375, 9.677734375, 10.27197265625, 10.8662109375, 11.46044921875, 12.0546875, 12.64892578125, 13.2431640625, 13.83740234375, 14.431640625, 15.02587890625, 15.6201171875, 16.21435546875, 16.80859375, 17.40283203125, 17.9970703125, 18.59130859375, 19.185546875, 19.77978515625, 20.3740234375, 20.96826171875, 21.5625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 12.0, 19.0, 26.0, 51.0, 65.0, 125.0, 204.0, 440.0, 838.0, 2295.0, 8294.0, 41914.0, 357119.0, 558945.0, 62070.0, 11151.0, 2916.0, 1082.0, 407.0, 229.0, 112.0, 71.0, 42.0, 27.0, 23.0, 13.0, 16.0, 16.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.671875, -7.4468994140625, -7.221923828125, -6.9969482421875, -6.77197265625, -6.5469970703125, -6.322021484375, -6.0970458984375, -5.8720703125, -5.6470947265625, -5.422119140625, -5.1971435546875, -4.97216796875, -4.7471923828125, -4.522216796875, -4.2972412109375, -4.072265625, -3.8472900390625, -3.622314453125, -3.3973388671875, -3.17236328125, -2.9473876953125, -2.722412109375, -2.4974365234375, -2.2724609375, -2.0474853515625, -1.822509765625, -1.5975341796875, -1.37255859375, -1.1475830078125, -0.922607421875, -0.6976318359375, -0.47265625, -0.2476806640625, -0.022705078125, 0.2022705078125, 0.42724609375, 0.6522216796875, 0.877197265625, 1.1021728515625, 1.3271484375, 1.5521240234375, 1.777099609375, 2.0020751953125, 2.22705078125, 2.4520263671875, 2.677001953125, 2.9019775390625, 3.126953125, 3.3519287109375, 3.576904296875, 3.8018798828125, 4.02685546875, 4.2518310546875, 4.476806640625, 4.7017822265625, 4.9267578125, 5.1517333984375, 5.376708984375, 5.6016845703125, 5.82666015625, 6.0516357421875, 6.276611328125, 6.5015869140625, 6.7265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 6.0, 7.0, 7.0, 4.0, 5.0, 7.0, 8.0, 6.0, 13.0, 23.0, 19.0, 26.0, 34.0, 40.0, 44.0, 64.0, 102.0, 114.0, 131.0, 70.0, 67.0, 44.0, 22.0, 26.0, 26.0, 24.0, 17.0, 14.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011415481567382812, -0.0011044889688491821, -0.001067429780960083, -0.0010303705930709839, -0.0009933114051818848, -0.0009562522172927856, -0.0009191930294036865, -0.0008821338415145874, -0.0008450746536254883, -0.0008080154657363892, -0.00077095627784729, -0.0007338970899581909, -0.0006968379020690918, -0.0006597787141799927, -0.0006227195262908936, -0.0005856603384017944, -0.0005486011505126953, -0.0005115419626235962, -0.00047448277473449707, -0.00043742358684539795, -0.00040036439895629883, -0.0003633052110671997, -0.0003262460231781006, -0.00028918683528900146, -0.00025212764739990234, -0.00021506845951080322, -0.0001780092716217041, -0.00014095008373260498, -0.00010389089584350586, -6.683170795440674e-05, -2.9772520065307617e-05, 7.286667823791504e-06, 4.4345855712890625e-05, 8.140504360198975e-05, 0.00011846423149108887, 0.000155523419380188, 0.0001925826072692871, 0.00022964179515838623, 0.00026670098304748535, 0.00030376017093658447, 0.0003408193588256836, 0.0003778785467147827, 0.00041493773460388184, 0.00045199692249298096, 0.0004890561103820801, 0.0005261152982711792, 0.0005631744861602783, 0.0006002336740493774, 0.0006372928619384766, 0.0006743520498275757, 0.0007114112377166748, 0.0007484704256057739, 0.000785529613494873, 0.0008225888013839722, 0.0008596479892730713, 0.0008967071771621704, 0.0009337663650512695, 0.0009708255529403687, 0.0010078847408294678, 0.001044943928718567, 0.001082003116607666, 0.0011190623044967651, 0.0011561214923858643, 0.0011931806802749634, 0.0012302398681640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 6.0, 4.0, 10.0, 5.0, 11.0, 29.0, 30.0, 52.0, 73.0, 112.0, 185.0, 361.0, 826.0, 2132.0, 8425.0, 57454.0, 686545.0, 261516.0, 23533.0, 4593.0, 1403.0, 563.0, 261.0, 154.0, 94.0, 57.0, 26.0, 31.0, 15.0, 14.0, 13.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.8250732421875, -7.532958984375, -7.2408447265625, -6.94873046875, -6.6566162109375, -6.364501953125, -6.0723876953125, -5.7802734375, -5.4881591796875, -5.196044921875, -4.9039306640625, -4.61181640625, -4.3197021484375, -4.027587890625, -3.7354736328125, -3.443359375, -3.1512451171875, -2.859130859375, -2.5670166015625, -2.27490234375, -1.9827880859375, -1.690673828125, -1.3985595703125, -1.1064453125, -0.8143310546875, -0.522216796875, -0.2301025390625, 0.06201171875, 0.3541259765625, 0.646240234375, 0.9383544921875, 1.23046875, 1.5225830078125, 1.814697265625, 2.1068115234375, 2.39892578125, 2.6910400390625, 2.983154296875, 3.2752685546875, 3.5673828125, 3.8594970703125, 4.151611328125, 4.4437255859375, 4.73583984375, 5.0279541015625, 5.320068359375, 5.6121826171875, 5.904296875, 6.1964111328125, 6.488525390625, 6.7806396484375, 7.07275390625, 7.3648681640625, 7.656982421875, 7.9490966796875, 8.2412109375, 8.5333251953125, 8.825439453125, 9.1175537109375, 9.40966796875, 9.7017822265625, 9.993896484375, 10.2860107421875, 10.578125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 7.0, 10.0, 12.0, 23.0, 30.0, 32.0, 34.0, 41.0, 71.0, 73.0, 73.0, 112.0, 83.0, 113.0, 66.0, 43.0, 45.0, 33.0, 26.0, 12.0, 19.0, 5.0, 6.0, 6.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.394287109375, -6.17138671875, -5.948486328125, -5.7255859375, -5.502685546875, -5.27978515625, -5.056884765625, -4.833984375, -4.611083984375, -4.38818359375, -4.165283203125, -3.9423828125, -3.719482421875, -3.49658203125, -3.273681640625, -3.05078125, -2.827880859375, -2.60498046875, -2.382080078125, -2.1591796875, -1.936279296875, -1.71337890625, -1.490478515625, -1.267578125, -1.044677734375, -0.82177734375, -0.598876953125, -0.3759765625, -0.153076171875, 0.06982421875, 0.292724609375, 0.515625, 0.738525390625, 0.96142578125, 1.184326171875, 1.4072265625, 1.630126953125, 1.85302734375, 2.075927734375, 2.298828125, 2.521728515625, 2.74462890625, 2.967529296875, 3.1904296875, 3.413330078125, 3.63623046875, 3.859130859375, 4.08203125, 4.304931640625, 4.52783203125, 4.750732421875, 4.9736328125, 5.196533203125, 5.41943359375, 5.642333984375, 5.865234375, 6.088134765625, 6.31103515625, 6.533935546875, 6.7568359375, 6.979736328125, 7.20263671875, 7.425537109375, 7.6484375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 9.0, 3.0, 17.0, 29.0, 39.0, 96.0, 133.0, 160.0, 176.0, 122.0, 79.0, 56.0, 35.0, 23.0, 9.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.20683288574219, -55.46512222290039, -50.723411560058594, -45.98170471191406, -41.239994049072266, -36.49828338623047, -31.756574630737305, -27.01486587524414, -22.273155212402344, -17.531444549560547, -12.789735794067383, -8.048026084899902, -3.306316375732422, 1.435394287109375, 6.177103042602539, 10.918811798095703, 15.6605224609375, 20.402233123779297, 25.14394187927246, 29.885650634765625, 34.62736129760742, 39.36907196044922, 44.11077880859375, 48.85248947143555, 53.594200134277344, 58.33591079711914, 63.07762145996094, 67.81932830810547, 72.56103515625, 77.30274963378906, 82.0444564819336, 86.78616333007812, 91.52789306640625, 96.26959991455078, 101.01131439208984, 105.75302124023438, 110.49473571777344, 115.23644256591797, 119.9781494140625, 124.71986389160156, 129.46157836914062, 134.2032928466797, 138.9449920654297, 143.68670654296875, 148.4284210205078, 153.17013549804688, 157.91183471679688, 162.65354919433594, 167.39524841308594, 172.136962890625, 176.878662109375, 181.62037658691406, 186.36209106445312, 191.10379028320312, 195.8455047607422, 200.58721923828125, 205.32891845703125, 210.0706329345703, 214.8123321533203, 219.55404663085938, 224.29576110839844, 229.0374755859375, 233.7791748046875, 238.52088928222656, 243.26260375976562]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 9.0, 8.0, 6.0, 6.0, 15.0, 27.0, 19.0, 29.0, 24.0, 20.0, 36.0, 29.0, 45.0, 50.0, 50.0, 54.0, 56.0, 59.0, 57.0, 49.0, 55.0, 38.0, 37.0, 27.0, 40.0, 29.0, 26.0, 21.0, 15.0, 8.0, 14.0, 9.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-100.76631164550781, -97.7457275390625, -94.72514343261719, -91.70455932617188, -88.68397521972656, -85.66339111328125, -82.64280700683594, -79.62223052978516, -76.60164642333984, -73.58106231689453, -70.56047821044922, -67.5398941040039, -64.5193099975586, -61.49872970581055, -58.478145599365234, -55.45756530761719, -52.43697738647461, -49.4163932800293, -46.395809173583984, -43.37522888183594, -40.354644775390625, -37.33406066894531, -34.3134765625, -31.29289436340332, -28.272310256958008, -25.251726150512695, -22.231143951416016, -19.210559844970703, -16.18997573852539, -13.169393539428711, -10.148809432983398, -7.128227233886719, -4.107643127441406, -1.087059736251831, 1.9335236549377441, 4.954107284545898, 7.9746904373168945, 10.99527359008789, 14.015857696533203, 17.036439895629883, 20.057024002075195, 23.077608108520508, 26.098190307617188, 29.1187744140625, 32.13935852050781, 35.159942626953125, 38.18052673339844, 41.201107025146484, 44.2216911315918, 47.24227523803711, 50.26285934448242, 53.28343963623047, 56.30402374267578, 59.324607849121094, 62.345191955566406, 65.36577606201172, 68.38636016845703, 71.40694427490234, 74.42752838134766, 77.44811248779297, 80.46869659423828, 83.48927307128906, 86.50985717773438, 89.53044128417969, 92.551025390625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 6.0, 16.0, 19.0, 18.0, 25.0, 43.0, 56.0, 75.0, 119.0, 203.0, 302.0, 548.0, 853.0, 1594.0, 2996.0, 5981.0, 13459.0, 38907.0, 172678.0, 2533582.0, 1255370.0, 115735.0, 30229.0, 11113.0, 4865.0, 2483.0, 1289.0, 683.0, 392.0, 209.0, 135.0, 73.0, 69.0, 51.0, 28.0, 19.0, 22.0, 8.0, 9.0, 6.0, 5.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.4765625, -10.14794921875, -9.8193359375, -9.49072265625, -9.162109375, -8.83349609375, -8.5048828125, -8.17626953125, -7.84765625, -7.51904296875, -7.1904296875, -6.86181640625, -6.533203125, -6.20458984375, -5.8759765625, -5.54736328125, -5.21875, -4.89013671875, -4.5615234375, -4.23291015625, -3.904296875, -3.57568359375, -3.2470703125, -2.91845703125, -2.58984375, -2.26123046875, -1.9326171875, -1.60400390625, -1.275390625, -0.94677734375, -0.6181640625, -0.28955078125, 0.0390625, 0.36767578125, 0.6962890625, 1.02490234375, 1.353515625, 1.68212890625, 2.0107421875, 2.33935546875, 2.66796875, 2.99658203125, 3.3251953125, 3.65380859375, 3.982421875, 4.31103515625, 4.6396484375, 4.96826171875, 5.296875, 5.62548828125, 5.9541015625, 6.28271484375, 6.611328125, 6.93994140625, 7.2685546875, 7.59716796875, 7.92578125, 8.25439453125, 8.5830078125, 8.91162109375, 9.240234375, 9.56884765625, 9.8974609375, 10.22607421875, 10.5546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 8.0, 12.0, 21.0, 26.0, 28.0, 52.0, 54.0, 68.0, 66.0, 75.0, 81.0, 90.0, 78.0, 79.0, 67.0, 43.0, 50.0, 31.0, 19.0, 16.0, 17.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4140625, -7.157470703125, -6.90087890625, -6.644287109375, -6.3876953125, -6.131103515625, -5.87451171875, -5.617919921875, -5.361328125, -5.104736328125, -4.84814453125, -4.591552734375, -4.3349609375, -4.078369140625, -3.82177734375, -3.565185546875, -3.30859375, -3.052001953125, -2.79541015625, -2.538818359375, -2.2822265625, -2.025634765625, -1.76904296875, -1.512451171875, -1.255859375, -0.999267578125, -0.74267578125, -0.486083984375, -0.2294921875, 0.027099609375, 0.28369140625, 0.540283203125, 0.796875, 1.053466796875, 1.31005859375, 1.566650390625, 1.8232421875, 2.079833984375, 2.33642578125, 2.593017578125, 2.849609375, 3.106201171875, 3.36279296875, 3.619384765625, 3.8759765625, 4.132568359375, 4.38916015625, 4.645751953125, 4.90234375, 5.158935546875, 5.41552734375, 5.672119140625, 5.9287109375, 6.185302734375, 6.44189453125, 6.698486328125, 6.955078125, 7.211669921875, 7.46826171875, 7.724853515625, 7.9814453125, 8.238037109375, 8.49462890625, 8.751220703125, 9.0078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 9.0, 9.0, 15.0, 19.0, 24.0, 32.0, 51.0, 88.0, 122.0, 259.0, 411.0, 708.0, 1306.0, 2832.0, 6240.0, 16515.0, 56347.0, 415161.0, 3361170.0, 264134.0, 44633.0, 13663.0, 5352.0, 2335.0, 1155.0, 646.0, 385.0, 223.0, 129.0, 91.0, 56.0, 45.0, 30.0, 19.0, 6.0, 9.0, 10.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-12.375, -11.9681396484375, -11.561279296875, -11.1544189453125, -10.74755859375, -10.3406982421875, -9.933837890625, -9.5269775390625, -9.1201171875, -8.7132568359375, -8.306396484375, -7.8995361328125, -7.49267578125, -7.0858154296875, -6.678955078125, -6.2720947265625, -5.865234375, -5.4583740234375, -5.051513671875, -4.6446533203125, -4.23779296875, -3.8309326171875, -3.424072265625, -3.0172119140625, -2.6103515625, -2.2034912109375, -1.796630859375, -1.3897705078125, -0.98291015625, -0.5760498046875, -0.169189453125, 0.2376708984375, 0.64453125, 1.0513916015625, 1.458251953125, 1.8651123046875, 2.27197265625, 2.6788330078125, 3.085693359375, 3.4925537109375, 3.8994140625, 4.3062744140625, 4.713134765625, 5.1199951171875, 5.52685546875, 5.9337158203125, 6.340576171875, 6.7474365234375, 7.154296875, 7.5611572265625, 7.968017578125, 8.3748779296875, 8.78173828125, 9.1885986328125, 9.595458984375, 10.0023193359375, 10.4091796875, 10.8160400390625, 11.222900390625, 11.6297607421875, 12.03662109375, 12.4434814453125, 12.850341796875, 13.2572021484375, 13.6640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 5.0, 19.0, 23.0, 16.0, 30.0, 41.0, 72.0, 119.0, 244.0, 596.0, 1236.0, 865.0, 363.0, 176.0, 101.0, 63.0, 29.0, 20.0, 12.0, 3.0, 10.0, 6.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.5902099609375, -18.055419921875, -17.5206298828125, -16.98583984375, -16.4510498046875, -15.916259765625, -15.3814697265625, -14.8466796875, -14.3118896484375, -13.777099609375, -13.2423095703125, -12.70751953125, -12.1727294921875, -11.637939453125, -11.1031494140625, -10.568359375, -10.0335693359375, -9.498779296875, -8.9639892578125, -8.42919921875, -7.8944091796875, -7.359619140625, -6.8248291015625, -6.2900390625, -5.7552490234375, -5.220458984375, -4.6856689453125, -4.15087890625, -3.6160888671875, -3.081298828125, -2.5465087890625, -2.01171875, -1.4769287109375, -0.942138671875, -0.4073486328125, 0.12744140625, 0.6622314453125, 1.197021484375, 1.7318115234375, 2.2666015625, 2.8013916015625, 3.336181640625, 3.8709716796875, 4.40576171875, 4.9405517578125, 5.475341796875, 6.0101318359375, 6.544921875, 7.0797119140625, 7.614501953125, 8.1492919921875, 8.68408203125, 9.2188720703125, 9.753662109375, 10.2884521484375, 10.8232421875, 11.3580322265625, 11.892822265625, 12.4276123046875, 12.96240234375, 13.4971923828125, 14.031982421875, 14.5667724609375, 15.1015625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 1.0, 6.0, 4.0, 9.0, 13.0, 14.0, 25.0, 47.0, 71.0, 111.0, 112.0, 114.0, 123.0, 113.0, 80.0, 47.0, 35.0, 17.0, 15.0, 10.0, 6.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-121.56648254394531, -118.35519409179688, -115.14391326904297, -111.93262481689453, -108.72134399414062, -105.51005554199219, -102.29876708984375, -99.08748626708984, -95.8761978149414, -92.66490936279297, -89.45362854003906, -86.24234008789062, -83.03105926513672, -79.81977081298828, -76.60848999023438, -73.39720153808594, -70.1859130859375, -66.97462463378906, -63.763343811035156, -60.55205535888672, -57.34077072143555, -54.129486083984375, -50.9182014465332, -47.70691680908203, -44.495635986328125, -41.28435134887695, -38.07306671142578, -34.861778259277344, -31.650493621826172, -28.439208984375, -25.227924346923828, -22.016637802124023, -18.80535125732422, -15.59406566619873, -12.382780075073242, -9.17149543762207, -5.960209846496582, -2.7489242553710938, 0.4623603820800781, 3.673646926879883, 6.884931564331055, 10.096217155456543, 13.307502746582031, 16.518787384033203, 19.730072021484375, 22.94135856628418, 26.15264320373535, 29.363929748535156, 32.57521438598633, 35.7864990234375, 38.99778366088867, 42.209068298339844, 45.42035675048828, 48.63164138793945, 51.842926025390625, 55.05421447753906, 58.26549530029297, 61.47677993774414, 64.68806457519531, 67.89935302734375, 71.11063385009766, 74.3219223022461, 77.533203125, 80.74449157714844, 83.95578002929688]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 12.0, 9.0, 13.0, 23.0, 19.0, 35.0, 25.0, 44.0, 30.0, 40.0, 48.0, 46.0, 53.0, 45.0, 47.0, 53.0, 54.0, 42.0, 47.0, 54.0, 47.0, 36.0, 41.0, 22.0, 26.0, 13.0, 17.0, 13.0, 8.0, 7.0, 4.0, 10.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-73.15232849121094, -71.20829772949219, -69.2642593383789, -67.32022857666016, -65.37619018554688, -63.432159423828125, -61.48812484741211, -59.544090270996094, -57.600059509277344, -55.65602493286133, -53.71199035644531, -51.76795959472656, -49.82392501831055, -47.87989044189453, -45.935855865478516, -43.9918212890625, -42.047786712646484, -40.10375213623047, -38.15971755981445, -36.21568298339844, -34.27165222167969, -32.32761764526367, -30.383583068847656, -28.43954849243164, -26.495515823364258, -24.551481246948242, -22.60744857788086, -20.663414001464844, -18.719379425048828, -16.775346755981445, -14.83131217956543, -12.88727855682373, -10.943241119384766, -8.999207496643066, -7.055173397064209, -5.111139297485352, -3.1671056747436523, -1.2230720520019531, 0.7209625244140625, 2.6649961471557617, 4.609029769897461, 6.55306339263916, 8.49709701538086, 10.441131591796875, 12.385165214538574, 14.329198837280273, 16.27323341369629, 18.217266082763672, 20.161300659179688, 22.105335235595703, 24.049367904663086, 25.9934024810791, 27.937435150146484, 29.8814697265625, 31.825504302978516, 33.76953887939453, 35.71356964111328, 37.6576042175293, 39.60163879394531, 41.54566955566406, 43.48970413208008, 45.433738708496094, 47.37777328491211, 49.321807861328125, 51.26584243774414]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 9.0, 12.0, 25.0, 27.0, 46.0, 51.0, 94.0, 166.0, 259.0, 392.0, 770.0, 1385.0, 2495.0, 4990.0, 10841.0, 25466.0, 60662.0, 161050.0, 408964.0, 228693.0, 81239.0, 33327.0, 14182.0, 6338.0, 3160.0, 1644.0, 887.0, 522.0, 323.0, 196.0, 112.0, 76.0, 46.0, 38.0, 21.0, 8.0, 14.0, 6.0, 1.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.625, -10.2784423828125, -9.931884765625, -9.5853271484375, -9.23876953125, -8.8922119140625, -8.545654296875, -8.1990966796875, -7.8525390625, -7.5059814453125, -7.159423828125, -6.8128662109375, -6.46630859375, -6.1197509765625, -5.773193359375, -5.4266357421875, -5.080078125, -4.7335205078125, -4.386962890625, -4.0404052734375, -3.69384765625, -3.3472900390625, -3.000732421875, -2.6541748046875, -2.3076171875, -1.9610595703125, -1.614501953125, -1.2679443359375, -0.92138671875, -0.5748291015625, -0.228271484375, 0.1182861328125, 0.46484375, 0.8114013671875, 1.157958984375, 1.5045166015625, 1.85107421875, 2.1976318359375, 2.544189453125, 2.8907470703125, 3.2373046875, 3.5838623046875, 3.930419921875, 4.2769775390625, 4.62353515625, 4.9700927734375, 5.316650390625, 5.6632080078125, 6.009765625, 6.3563232421875, 6.702880859375, 7.0494384765625, 7.39599609375, 7.7425537109375, 8.089111328125, 8.4356689453125, 8.7822265625, 9.1287841796875, 9.475341796875, 9.8218994140625, 10.16845703125, 10.5150146484375, 10.861572265625, 11.2081298828125, 11.5546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 11.0, 10.0, 11.0, 29.0, 26.0, 45.0, 48.0, 60.0, 54.0, 60.0, 61.0, 72.0, 62.0, 76.0, 66.0, 58.0, 46.0, 50.0, 36.0, 35.0, 19.0, 17.0, 11.0, 12.0, 6.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.42578125, -7.20660400390625, -6.9874267578125, -6.76824951171875, -6.549072265625, -6.32989501953125, -6.1107177734375, -5.89154052734375, -5.67236328125, -5.45318603515625, -5.2340087890625, -5.01483154296875, -4.795654296875, -4.57647705078125, -4.3572998046875, -4.13812255859375, -3.9189453125, -3.69976806640625, -3.4805908203125, -3.26141357421875, -3.042236328125, -2.82305908203125, -2.6038818359375, -2.38470458984375, -2.16552734375, -1.94635009765625, -1.7271728515625, -1.50799560546875, -1.288818359375, -1.06964111328125, -0.8504638671875, -0.63128662109375, -0.412109375, -0.19293212890625, 0.0262451171875, 0.24542236328125, 0.464599609375, 0.68377685546875, 0.9029541015625, 1.12213134765625, 1.34130859375, 1.56048583984375, 1.7796630859375, 1.99884033203125, 2.218017578125, 2.43719482421875, 2.6563720703125, 2.87554931640625, 3.0947265625, 3.31390380859375, 3.5330810546875, 3.75225830078125, 3.971435546875, 4.19061279296875, 4.4097900390625, 4.62896728515625, 4.84814453125, 5.06732177734375, 5.2864990234375, 5.50567626953125, 5.724853515625, 5.94403076171875, 6.1632080078125, 6.38238525390625, 6.6015625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 4.0, 3.0, 14.0, 13.0, 9.0, 15.0, 26.0, 34.0, 51.0, 58.0, 104.0, 150.0, 202.0, 378.0, 713.0, 1806.0, 5720.0, 41660.0, 778177.0, 199075.0, 14638.0, 3127.0, 1158.0, 547.0, 330.0, 174.0, 104.0, 70.0, 56.0, 39.0, 25.0, 15.0, 18.0, 11.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5625, -28.712158203125, -27.86181640625, -27.011474609375, -26.1611328125, -25.310791015625, -24.46044921875, -23.610107421875, -22.759765625, -21.909423828125, -21.05908203125, -20.208740234375, -19.3583984375, -18.508056640625, -17.65771484375, -16.807373046875, -15.95703125, -15.106689453125, -14.25634765625, -13.406005859375, -12.5556640625, -11.705322265625, -10.85498046875, -10.004638671875, -9.154296875, -8.303955078125, -7.45361328125, -6.603271484375, -5.7529296875, -4.902587890625, -4.05224609375, -3.201904296875, -2.3515625, -1.501220703125, -0.65087890625, 0.199462890625, 1.0498046875, 1.900146484375, 2.75048828125, 3.600830078125, 4.451171875, 5.301513671875, 6.15185546875, 7.002197265625, 7.8525390625, 8.702880859375, 9.55322265625, 10.403564453125, 11.25390625, 12.104248046875, 12.95458984375, 13.804931640625, 14.6552734375, 15.505615234375, 16.35595703125, 17.206298828125, 18.056640625, 18.906982421875, 19.75732421875, 20.607666015625, 21.4580078125, 22.308349609375, 23.15869140625, 24.009033203125, 24.859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 7.0, 10.0, 18.0, 17.0, 15.0, 37.0, 26.0, 31.0, 25.0, 45.0, 44.0, 45.0, 38.0, 49.0, 53.0, 63.0, 49.0, 55.0, 51.0, 38.0, 35.0, 44.0, 29.0, 23.0, 19.0, 14.0, 25.0, 15.0, 10.0, 13.0, 8.0, 6.0, 6.0, 6.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.84375, -19.256591796875, -18.66943359375, -18.082275390625, -17.4951171875, -16.907958984375, -16.32080078125, -15.733642578125, -15.146484375, -14.559326171875, -13.97216796875, -13.385009765625, -12.7978515625, -12.210693359375, -11.62353515625, -11.036376953125, -10.44921875, -9.862060546875, -9.27490234375, -8.687744140625, -8.1005859375, -7.513427734375, -6.92626953125, -6.339111328125, -5.751953125, -5.164794921875, -4.57763671875, -3.990478515625, -3.4033203125, -2.816162109375, -2.22900390625, -1.641845703125, -1.0546875, -0.467529296875, 0.11962890625, 0.706787109375, 1.2939453125, 1.881103515625, 2.46826171875, 3.055419921875, 3.642578125, 4.229736328125, 4.81689453125, 5.404052734375, 5.9912109375, 6.578369140625, 7.16552734375, 7.752685546875, 8.33984375, 8.927001953125, 9.51416015625, 10.101318359375, 10.6884765625, 11.275634765625, 11.86279296875, 12.449951171875, 13.037109375, 13.624267578125, 14.21142578125, 14.798583984375, 15.3857421875, 15.972900390625, 16.56005859375, 17.147216796875, 17.734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 9.0, 7.0, 10.0, 23.0, 13.0, 24.0, 41.0, 43.0, 77.0, 132.0, 235.0, 452.0, 962.0, 2330.0, 7544.0, 32044.0, 221694.0, 684395.0, 76688.0, 14839.0, 4076.0, 1509.0, 579.0, 331.0, 177.0, 108.0, 56.0, 37.0, 25.0, 20.0, 21.0, 9.0, 11.0, 15.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66796875, -5.4599609375, -5.251953125, -5.0439453125, -4.8359375, -4.6279296875, -4.419921875, -4.2119140625, -4.00390625, -3.7958984375, -3.587890625, -3.3798828125, -3.171875, -2.9638671875, -2.755859375, -2.5478515625, -2.33984375, -2.1318359375, -1.923828125, -1.7158203125, -1.5078125, -1.2998046875, -1.091796875, -0.8837890625, -0.67578125, -0.4677734375, -0.259765625, -0.0517578125, 0.15625, 0.3642578125, 0.572265625, 0.7802734375, 0.98828125, 1.1962890625, 1.404296875, 1.6123046875, 1.8203125, 2.0283203125, 2.236328125, 2.4443359375, 2.65234375, 2.8603515625, 3.068359375, 3.2763671875, 3.484375, 3.6923828125, 3.900390625, 4.1083984375, 4.31640625, 4.5244140625, 4.732421875, 4.9404296875, 5.1484375, 5.3564453125, 5.564453125, 5.7724609375, 5.98046875, 6.1884765625, 6.396484375, 6.6044921875, 6.8125, 7.0205078125, 7.228515625, 7.4365234375, 7.64453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 12.0, 9.0, 10.0, 11.0, 14.0, 12.0, 33.0, 35.0, 59.0, 116.0, 167.0, 167.0, 117.0, 39.0, 31.0, 34.0, 19.0, 25.0, 13.0, 15.0, 13.0, 12.0, 11.0, 4.0, 4.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001697540283203125, -0.0016528666019439697, -0.0016081929206848145, -0.0015635192394256592, -0.001518845558166504, -0.0014741718769073486, -0.0014294981956481934, -0.001384824514389038, -0.0013401508331298828, -0.0012954771518707275, -0.0012508034706115723, -0.001206129789352417, -0.0011614561080932617, -0.0011167824268341064, -0.0010721087455749512, -0.001027435064315796, -0.0009827613830566406, -0.0009380877017974854, -0.0008934140205383301, -0.0008487403392791748, -0.0008040666580200195, -0.0007593929767608643, -0.000714719295501709, -0.0006700456142425537, -0.0006253719329833984, -0.0005806982517242432, -0.0005360245704650879, -0.0004913508892059326, -0.00044667720794677734, -0.00040200352668762207, -0.0003573298454284668, -0.0003126561641693115, -0.00026798248291015625, -0.00022330880165100098, -0.0001786351203918457, -0.00013396143913269043, -8.928775787353516e-05, -4.461407661437988e-05, 5.960464477539063e-08, 4.4733285903930664e-05, 8.940696716308594e-05, 0.0001340806484222412, 0.00017875432968139648, 0.00022342801094055176, 0.00026810169219970703, 0.0003127753734588623, 0.0003574490547180176, 0.00040212273597717285, 0.0004467964172363281, 0.0004914700984954834, 0.0005361437797546387, 0.0005808174610137939, 0.0006254911422729492, 0.0006701648235321045, 0.0007148385047912598, 0.000759512186050415, 0.0008041858673095703, 0.0008488595485687256, 0.0008935332298278809, 0.0009382069110870361, 0.0009828805923461914, 0.0010275542736053467, 0.001072227954864502, 0.0011169016361236572, 0.0011615753173828125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 10.0, 9.0, 21.0, 25.0, 27.0, 34.0, 52.0, 114.0, 149.0, 239.0, 404.0, 777.0, 1900.0, 5991.0, 32527.0, 376622.0, 575489.0, 42699.0, 7281.0, 2216.0, 868.0, 436.0, 254.0, 128.0, 98.0, 61.0, 36.0, 19.0, 21.0, 10.0, 5.0, 7.0, 8.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.890625, -8.64410400390625, -8.3975830078125, -8.15106201171875, -7.904541015625, -7.65802001953125, -7.4114990234375, -7.16497802734375, -6.91845703125, -6.67193603515625, -6.4254150390625, -6.17889404296875, -5.932373046875, -5.68585205078125, -5.4393310546875, -5.19281005859375, -4.9462890625, -4.69976806640625, -4.4532470703125, -4.20672607421875, -3.960205078125, -3.71368408203125, -3.4671630859375, -3.22064208984375, -2.97412109375, -2.72760009765625, -2.4810791015625, -2.23455810546875, -1.988037109375, -1.74151611328125, -1.4949951171875, -1.24847412109375, -1.001953125, -0.75543212890625, -0.5089111328125, -0.26239013671875, -0.015869140625, 0.23065185546875, 0.4771728515625, 0.72369384765625, 0.97021484375, 1.21673583984375, 1.4632568359375, 1.70977783203125, 1.956298828125, 2.20281982421875, 2.4493408203125, 2.69586181640625, 2.9423828125, 3.18890380859375, 3.4354248046875, 3.68194580078125, 3.928466796875, 4.17498779296875, 4.4215087890625, 4.66802978515625, 4.91455078125, 5.16107177734375, 5.4075927734375, 5.65411376953125, 5.900634765625, 6.14715576171875, 6.3936767578125, 6.64019775390625, 6.88671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 5.0, 17.0, 19.0, 16.0, 19.0, 29.0, 40.0, 38.0, 50.0, 48.0, 78.0, 96.0, 87.0, 86.0, 64.0, 65.0, 45.0, 40.0, 26.0, 30.0, 22.0, 17.0, 14.0, 7.0, 7.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33203125, -4.1676025390625, -4.003173828125, -3.8387451171875, -3.67431640625, -3.5098876953125, -3.345458984375, -3.1810302734375, -3.0166015625, -2.8521728515625, -2.687744140625, -2.5233154296875, -2.35888671875, -2.1944580078125, -2.030029296875, -1.8656005859375, -1.701171875, -1.5367431640625, -1.372314453125, -1.2078857421875, -1.04345703125, -0.8790283203125, -0.714599609375, -0.5501708984375, -0.3857421875, -0.2213134765625, -0.056884765625, 0.1075439453125, 0.27197265625, 0.4364013671875, 0.600830078125, 0.7652587890625, 0.9296875, 1.0941162109375, 1.258544921875, 1.4229736328125, 1.58740234375, 1.7518310546875, 1.916259765625, 2.0806884765625, 2.2451171875, 2.4095458984375, 2.573974609375, 2.7384033203125, 2.90283203125, 3.0672607421875, 3.231689453125, 3.3961181640625, 3.560546875, 3.7249755859375, 3.889404296875, 4.0538330078125, 4.21826171875, 4.3826904296875, 4.547119140625, 4.7115478515625, 4.8759765625, 5.0404052734375, 5.204833984375, 5.3692626953125, 5.53369140625, 5.6981201171875, 5.862548828125, 6.0269775390625, 6.19140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 12.0, 18.0, 34.0, 37.0, 74.0, 108.0, 153.0, 185.0, 138.0, 84.0, 67.0, 28.0, 21.0, 19.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.46044921875, -135.43824768066406, -131.41604614257812, -127.39384460449219, -123.37164306640625, -119.34944152832031, -115.32723999023438, -111.30503845214844, -107.2828369140625, -103.26063537597656, -99.23843383789062, -95.21623229980469, -91.19403076171875, -87.17182922363281, -83.14962768554688, -79.12742614746094, -75.105224609375, -71.08302307128906, -67.06082153320312, -63.03861999511719, -59.01641845703125, -54.99421691894531, -50.972015380859375, -46.94981384277344, -42.9276123046875, -38.90541076660156, -34.883209228515625, -30.861007690429688, -26.83880615234375, -22.816604614257812, -18.794403076171875, -14.772201538085938, -10.75, -6.7277984619140625, -2.705596923828125, 1.3166046142578125, 5.33880615234375, 9.361007690429688, 13.383209228515625, 17.405410766601562, 21.4276123046875, 25.449813842773438, 29.472015380859375, 33.49421691894531, 37.51641845703125, 41.53861999511719, 45.560821533203125, 49.58302307128906, 53.605224609375, 57.62742614746094, 61.649627685546875, 65.67182922363281, 69.69403076171875, 73.71623229980469, 77.73843383789062, 81.76063537597656, 85.7828369140625, 89.80503845214844, 93.82723999023438, 97.84944152832031, 101.87164306640625, 105.89384460449219, 109.91604614257812, 113.93824768066406, 117.96044921875]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 13.0, 7.0, 3.0, 12.0, 11.0, 6.0, 9.0, 21.0, 30.0, 26.0, 22.0, 39.0, 42.0, 36.0, 42.0, 50.0, 40.0, 51.0, 70.0, 62.0, 51.0, 40.0, 49.0, 23.0, 31.0, 29.0, 25.0, 24.0, 20.0, 18.0, 22.0, 22.0, 8.0, 7.0, 11.0, 7.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.69190979003906, -68.3661117553711, -66.04031372070312, -63.714515686035156, -61.38871383666992, -59.06291580200195, -56.737117767333984, -54.41131591796875, -52.08551788330078, -49.75971984863281, -47.433921813964844, -45.108123779296875, -42.78232192993164, -40.45652389526367, -38.1307258605957, -35.80492401123047, -33.479129791259766, -31.153331756591797, -28.827531814575195, -26.501733779907227, -24.175933837890625, -21.850135803222656, -19.524337768554688, -17.198537826538086, -14.872739791870117, -12.546940803527832, -10.221141815185547, -7.895343780517578, -5.569544792175293, -3.243745803833008, -0.9179477691650391, 1.4078521728515625, 3.7336502075195312, 6.059449195861816, 8.385248184204102, 10.71104621887207, 13.036845207214355, 15.36264419555664, 17.68844223022461, 20.01424217224121, 22.34004020690918, 24.66583824157715, 26.99163818359375, 29.31743621826172, 31.643234252929688, 33.969032287597656, 36.294830322265625, 38.62063217163086, 40.94643020629883, 43.2722282409668, 45.598026275634766, 47.923828125, 50.24962615966797, 52.57542419433594, 54.901222229003906, 57.227020263671875, 59.552818298339844, 61.87861633300781, 64.20441436767578, 66.53021240234375, 68.85601043701172, 71.18180847167969, 73.50761413574219, 75.83341217041016, 78.15921020507812]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 5.0, 10.0, 17.0, 11.0, 30.0, 43.0, 50.0, 77.0, 123.0, 213.0, 366.0, 752.0, 1580.0, 3951.0, 12280.0, 60932.0, 1497289.0, 2515295.0, 78798.0, 14644.0, 4432.0, 1668.0, 737.0, 379.0, 197.0, 144.0, 82.0, 48.0, 37.0, 29.0, 24.0, 13.0, 9.0, 9.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-13.875, -13.479248046875, -13.08349609375, -12.687744140625, -12.2919921875, -11.896240234375, -11.50048828125, -11.104736328125, -10.708984375, -10.313232421875, -9.91748046875, -9.521728515625, -9.1259765625, -8.730224609375, -8.33447265625, -7.938720703125, -7.54296875, -7.147216796875, -6.75146484375, -6.355712890625, -5.9599609375, -5.564208984375, -5.16845703125, -4.772705078125, -4.376953125, -3.981201171875, -3.58544921875, -3.189697265625, -2.7939453125, -2.398193359375, -2.00244140625, -1.606689453125, -1.2109375, -0.815185546875, -0.41943359375, -0.023681640625, 0.3720703125, 0.767822265625, 1.16357421875, 1.559326171875, 1.955078125, 2.350830078125, 2.74658203125, 3.142333984375, 3.5380859375, 3.933837890625, 4.32958984375, 4.725341796875, 5.12109375, 5.516845703125, 5.91259765625, 6.308349609375, 6.7041015625, 7.099853515625, 7.49560546875, 7.891357421875, 8.287109375, 8.682861328125, 9.07861328125, 9.474365234375, 9.8701171875, 10.265869140625, 10.66162109375, 11.057373046875, 11.453125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 4.0, 10.0, 12.0, 26.0, 27.0, 39.0, 51.0, 55.0, 62.0, 71.0, 84.0, 92.0, 73.0, 65.0, 75.0, 76.0, 49.0, 38.0, 28.0, 16.0, 18.0, 6.0, 10.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.52734375, -7.288818359375, -7.05029296875, -6.811767578125, -6.5732421875, -6.334716796875, -6.09619140625, -5.857666015625, -5.619140625, -5.380615234375, -5.14208984375, -4.903564453125, -4.6650390625, -4.426513671875, -4.18798828125, -3.949462890625, -3.7109375, -3.472412109375, -3.23388671875, -2.995361328125, -2.7568359375, -2.518310546875, -2.27978515625, -2.041259765625, -1.802734375, -1.564208984375, -1.32568359375, -1.087158203125, -0.8486328125, -0.610107421875, -0.37158203125, -0.133056640625, 0.10546875, 0.343994140625, 0.58251953125, 0.821044921875, 1.0595703125, 1.298095703125, 1.53662109375, 1.775146484375, 2.013671875, 2.252197265625, 2.49072265625, 2.729248046875, 2.9677734375, 3.206298828125, 3.44482421875, 3.683349609375, 3.921875, 4.160400390625, 4.39892578125, 4.637451171875, 4.8759765625, 5.114501953125, 5.35302734375, 5.591552734375, 5.830078125, 6.068603515625, 6.30712890625, 6.545654296875, 6.7841796875, 7.022705078125, 7.26123046875, 7.499755859375, 7.73828125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 5.0, 3.0, 4.0, 4.0, 13.0, 22.0, 23.0, 45.0, 66.0, 105.0, 199.0, 351.0, 641.0, 1188.0, 2403.0, 5044.0, 11512.0, 29691.0, 101269.0, 745376.0, 2899791.0, 300196.0, 59419.0, 20252.0, 8549.0, 3802.0, 1898.0, 978.0, 586.0, 314.0, 207.0, 110.0, 62.0, 53.0, 30.0, 21.0, 18.0, 15.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3515625, -8.0760498046875, -7.800537109375, -7.5250244140625, -7.24951171875, -6.9739990234375, -6.698486328125, -6.4229736328125, -6.1474609375, -5.8719482421875, -5.596435546875, -5.3209228515625, -5.04541015625, -4.7698974609375, -4.494384765625, -4.2188720703125, -3.943359375, -3.6678466796875, -3.392333984375, -3.1168212890625, -2.84130859375, -2.5657958984375, -2.290283203125, -2.0147705078125, -1.7392578125, -1.4637451171875, -1.188232421875, -0.9127197265625, -0.63720703125, -0.3616943359375, -0.086181640625, 0.1893310546875, 0.46484375, 0.7403564453125, 1.015869140625, 1.2913818359375, 1.56689453125, 1.8424072265625, 2.117919921875, 2.3934326171875, 2.6689453125, 2.9444580078125, 3.219970703125, 3.4954833984375, 3.77099609375, 4.0465087890625, 4.322021484375, 4.5975341796875, 4.873046875, 5.1485595703125, 5.424072265625, 5.6995849609375, 5.97509765625, 6.2506103515625, 6.526123046875, 6.8016357421875, 7.0771484375, 7.3526611328125, 7.628173828125, 7.9036865234375, 8.17919921875, 8.4547119140625, 8.730224609375, 9.0057373046875, 9.28125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 12.0, 11.0, 12.0, 10.0, 20.0, 39.0, 39.0, 63.0, 91.0, 117.0, 210.0, 319.0, 621.0, 803.0, 672.0, 387.0, 221.0, 127.0, 77.0, 63.0, 39.0, 21.0, 22.0, 14.0, 15.0, 7.0, 7.0, 3.0, 6.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.720947265625, -7.41845703125, -7.115966796875, -6.8134765625, -6.510986328125, -6.20849609375, -5.906005859375, -5.603515625, -5.301025390625, -4.99853515625, -4.696044921875, -4.3935546875, -4.091064453125, -3.78857421875, -3.486083984375, -3.18359375, -2.881103515625, -2.57861328125, -2.276123046875, -1.9736328125, -1.671142578125, -1.36865234375, -1.066162109375, -0.763671875, -0.461181640625, -0.15869140625, 0.143798828125, 0.4462890625, 0.748779296875, 1.05126953125, 1.353759765625, 1.65625, 1.958740234375, 2.26123046875, 2.563720703125, 2.8662109375, 3.168701171875, 3.47119140625, 3.773681640625, 4.076171875, 4.378662109375, 4.68115234375, 4.983642578125, 5.2861328125, 5.588623046875, 5.89111328125, 6.193603515625, 6.49609375, 6.798583984375, 7.10107421875, 7.403564453125, 7.7060546875, 8.008544921875, 8.31103515625, 8.613525390625, 8.916015625, 9.218505859375, 9.52099609375, 9.823486328125, 10.1259765625, 10.428466796875, 10.73095703125, 11.033447265625, 11.3359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 5.0, 9.0, 16.0, 56.0, 93.0, 185.0, 226.0, 199.0, 118.0, 49.0, 22.0, 9.0, 6.0, 8.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.13871765136719, -101.05137634277344, -96.96403503417969, -92.87670135498047, -88.78936004638672, -84.70201873779297, -80.61468505859375, -76.52734375, -72.44000244140625, -68.3526611328125, -64.26531982421875, -60.17798614501953, -56.09064483642578, -52.00330352783203, -47.91596603393555, -43.82862854003906, -39.74128723144531, -35.65394592285156, -31.566608428955078, -27.47926902770996, -23.391929626464844, -19.304590225219727, -15.21725082397461, -11.129911422729492, -7.042572021484375, -2.955232620239258, 1.1321067810058594, 5.219446182250977, 9.306785583496094, 13.394124984741211, 17.481464385986328, 21.568803787231445, 25.656158447265625, 29.743497848510742, 33.83083724975586, 37.918174743652344, 42.005516052246094, 46.092857360839844, 50.18019485473633, 54.26753234863281, 58.35487365722656, 62.44221496582031, 66.52955627441406, 70.61688995361328, 74.70423126220703, 78.79157257080078, 82.87890625, 86.96624755859375, 91.0535888671875, 95.14093017578125, 99.228271484375, 103.31560516357422, 107.40294647216797, 111.49028778076172, 115.57762145996094, 119.66496276855469, 123.75230407714844, 127.83964538574219, 131.92698669433594, 136.0143280029297, 140.10165405273438, 144.18899536132812, 148.27633666992188, 152.36367797851562, 156.45101928710938]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 4.0, 3.0, 10.0, 6.0, 11.0, 19.0, 16.0, 24.0, 13.0, 32.0, 33.0, 46.0, 42.0, 40.0, 40.0, 45.0, 47.0, 48.0, 54.0, 59.0, 49.0, 57.0, 46.0, 43.0, 43.0, 26.0, 35.0, 27.0, 25.0, 14.0, 14.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.13266372680664, -51.6064567565918, -50.08025360107422, -48.554046630859375, -47.02783966064453, -45.50163650512695, -43.97542953491211, -42.44922637939453, -40.92301940917969, -39.396812438964844, -37.870609283447266, -36.34440231323242, -34.818199157714844, -33.2919921875, -31.765785217285156, -30.239580154418945, -28.713375091552734, -27.187170028686523, -25.660964965820312, -24.13475799560547, -22.608552932739258, -21.082347869873047, -19.556140899658203, -18.029935836791992, -16.50373077392578, -14.97752571105957, -13.451319694519043, -11.925113677978516, -10.398908615112305, -8.872703552246094, -7.346497535705566, -5.820291519165039, -4.2940826416015625, -2.7678771018981934, -1.2416715621948242, 0.2845339775085449, 1.810739517211914, 3.336945056915283, 4.863150596618652, 6.38935661315918, 7.915561676025391, 9.441766738891602, 10.967972755432129, 12.494178771972656, 14.020383834838867, 15.546588897705078, 17.072795867919922, 18.599000930786133, 20.125205993652344, 21.651411056518555, 23.177616119384766, 24.70382308959961, 26.23002815246582, 27.75623321533203, 29.282440185546875, 30.808645248413086, 32.3348503112793, 33.86105728149414, 35.38726043701172, 36.91346740722656, 38.439674377441406, 39.965877532958984, 41.49208450317383, 43.018287658691406, 44.54449462890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 14.0, 17.0, 22.0, 36.0, 63.0, 112.0, 187.0, 311.0, 600.0, 1134.0, 2194.0, 4886.0, 11148.0, 27498.0, 78436.0, 286555.0, 437781.0, 128175.0, 40935.0, 15701.0, 6542.0, 3010.0, 1456.0, 751.0, 413.0, 236.0, 110.0, 79.0, 33.0, 38.0, 23.0, 8.0, 9.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.0078125, -11.6461181640625, -11.284423828125, -10.9227294921875, -10.56103515625, -10.1993408203125, -9.837646484375, -9.4759521484375, -9.1142578125, -8.7525634765625, -8.390869140625, -8.0291748046875, -7.66748046875, -7.3057861328125, -6.944091796875, -6.5823974609375, -6.220703125, -5.8590087890625, -5.497314453125, -5.1356201171875, -4.77392578125, -4.4122314453125, -4.050537109375, -3.6888427734375, -3.3271484375, -2.9654541015625, -2.603759765625, -2.2420654296875, -1.88037109375, -1.5186767578125, -1.156982421875, -0.7952880859375, -0.43359375, -0.0718994140625, 0.289794921875, 0.6514892578125, 1.01318359375, 1.3748779296875, 1.736572265625, 2.0982666015625, 2.4599609375, 2.8216552734375, 3.183349609375, 3.5450439453125, 3.90673828125, 4.2684326171875, 4.630126953125, 4.9918212890625, 5.353515625, 5.7152099609375, 6.076904296875, 6.4385986328125, 6.80029296875, 7.1619873046875, 7.523681640625, 7.8853759765625, 8.2470703125, 8.6087646484375, 8.970458984375, 9.3321533203125, 9.69384765625, 10.0555419921875, 10.417236328125, 10.7789306640625, 11.140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 5.0, 5.0, 13.0, 16.0, 18.0, 27.0, 27.0, 42.0, 31.0, 53.0, 53.0, 82.0, 67.0, 63.0, 63.0, 74.0, 70.0, 70.0, 50.0, 34.0, 38.0, 22.0, 25.0, 12.0, 13.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3671875, -7.1551513671875, -6.943115234375, -6.7310791015625, -6.51904296875, -6.3070068359375, -6.094970703125, -5.8829345703125, -5.6708984375, -5.4588623046875, -5.246826171875, -5.0347900390625, -4.82275390625, -4.6107177734375, -4.398681640625, -4.1866455078125, -3.974609375, -3.7625732421875, -3.550537109375, -3.3385009765625, -3.12646484375, -2.9144287109375, -2.702392578125, -2.4903564453125, -2.2783203125, -2.0662841796875, -1.854248046875, -1.6422119140625, -1.43017578125, -1.2181396484375, -1.006103515625, -0.7940673828125, -0.58203125, -0.3699951171875, -0.157958984375, 0.0540771484375, 0.26611328125, 0.4781494140625, 0.690185546875, 0.9022216796875, 1.1142578125, 1.3262939453125, 1.538330078125, 1.7503662109375, 1.96240234375, 2.1744384765625, 2.386474609375, 2.5985107421875, 2.810546875, 3.0225830078125, 3.234619140625, 3.4466552734375, 3.65869140625, 3.8707275390625, 4.082763671875, 4.2947998046875, 4.5068359375, 4.7188720703125, 4.930908203125, 5.1429443359375, 5.35498046875, 5.5670166015625, 5.779052734375, 5.9910888671875, 6.203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 7.0, 8.0, 19.0, 18.0, 13.0, 19.0, 32.0, 42.0, 58.0, 88.0, 120.0, 175.0, 263.0, 521.0, 958.0, 2016.0, 5114.0, 17660.0, 83806.0, 635069.0, 247080.0, 39322.0, 9709.0, 3193.0, 1378.0, 719.0, 414.0, 240.0, 147.0, 92.0, 54.0, 43.0, 39.0, 26.0, 21.0, 16.0, 18.0, 8.0, 9.0, 1.0, 7.0, 0.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.859375, -15.343994140625, -14.82861328125, -14.313232421875, -13.7978515625, -13.282470703125, -12.76708984375, -12.251708984375, -11.736328125, -11.220947265625, -10.70556640625, -10.190185546875, -9.6748046875, -9.159423828125, -8.64404296875, -8.128662109375, -7.61328125, -7.097900390625, -6.58251953125, -6.067138671875, -5.5517578125, -5.036376953125, -4.52099609375, -4.005615234375, -3.490234375, -2.974853515625, -2.45947265625, -1.944091796875, -1.4287109375, -0.913330078125, -0.39794921875, 0.117431640625, 0.6328125, 1.148193359375, 1.66357421875, 2.178955078125, 2.6943359375, 3.209716796875, 3.72509765625, 4.240478515625, 4.755859375, 5.271240234375, 5.78662109375, 6.302001953125, 6.8173828125, 7.332763671875, 7.84814453125, 8.363525390625, 8.87890625, 9.394287109375, 9.90966796875, 10.425048828125, 10.9404296875, 11.455810546875, 11.97119140625, 12.486572265625, 13.001953125, 13.517333984375, 14.03271484375, 14.548095703125, 15.0634765625, 15.578857421875, 16.09423828125, 16.609619140625, 17.125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 6.0, 7.0, 10.0, 12.0, 16.0, 16.0, 22.0, 27.0, 21.0, 27.0, 20.0, 45.0, 46.0, 39.0, 42.0, 44.0, 44.0, 44.0, 57.0, 53.0, 42.0, 46.0, 48.0, 39.0, 40.0, 32.0, 25.0, 14.0, 23.0, 14.0, 18.0, 13.0, 7.0, 10.0, 8.0, 2.0, 1.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.5625, -17.005126953125, -16.44775390625, -15.890380859375, -15.3330078125, -14.775634765625, -14.21826171875, -13.660888671875, -13.103515625, -12.546142578125, -11.98876953125, -11.431396484375, -10.8740234375, -10.316650390625, -9.75927734375, -9.201904296875, -8.64453125, -8.087158203125, -7.52978515625, -6.972412109375, -6.4150390625, -5.857666015625, -5.30029296875, -4.742919921875, -4.185546875, -3.628173828125, -3.07080078125, -2.513427734375, -1.9560546875, -1.398681640625, -0.84130859375, -0.283935546875, 0.2734375, 0.830810546875, 1.38818359375, 1.945556640625, 2.5029296875, 3.060302734375, 3.61767578125, 4.175048828125, 4.732421875, 5.289794921875, 5.84716796875, 6.404541015625, 6.9619140625, 7.519287109375, 8.07666015625, 8.634033203125, 9.19140625, 9.748779296875, 10.30615234375, 10.863525390625, 11.4208984375, 11.978271484375, 12.53564453125, 13.093017578125, 13.650390625, 14.207763671875, 14.76513671875, 15.322509765625, 15.8798828125, 16.437255859375, 16.99462890625, 17.552001953125, 18.109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 6.0, 15.0, 12.0, 34.0, 31.0, 79.0, 177.0, 407.0, 1329.0, 8691.0, 188222.0, 815532.0, 29944.0, 2884.0, 684.0, 223.0, 109.0, 61.0, 36.0, 30.0, 12.0, 12.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1875, -10.8607177734375, -10.533935546875, -10.2071533203125, -9.88037109375, -9.5535888671875, -9.226806640625, -8.9000244140625, -8.5732421875, -8.2464599609375, -7.919677734375, -7.5928955078125, -7.26611328125, -6.9393310546875, -6.612548828125, -6.2857666015625, -5.958984375, -5.6322021484375, -5.305419921875, -4.9786376953125, -4.65185546875, -4.3250732421875, -3.998291015625, -3.6715087890625, -3.3447265625, -3.0179443359375, -2.691162109375, -2.3643798828125, -2.03759765625, -1.7108154296875, -1.384033203125, -1.0572509765625, -0.73046875, -0.4036865234375, -0.076904296875, 0.2498779296875, 0.57666015625, 0.9034423828125, 1.230224609375, 1.5570068359375, 1.8837890625, 2.2105712890625, 2.537353515625, 2.8641357421875, 3.19091796875, 3.5177001953125, 3.844482421875, 4.1712646484375, 4.498046875, 4.8248291015625, 5.151611328125, 5.4783935546875, 5.80517578125, 6.1319580078125, 6.458740234375, 6.7855224609375, 7.1123046875, 7.4390869140625, 7.765869140625, 8.0926513671875, 8.41943359375, 8.7462158203125, 9.072998046875, 9.3997802734375, 9.7265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 8.0, 4.0, 7.0, 9.0, 12.0, 14.0, 23.0, 18.0, 30.0, 51.0, 69.0, 98.0, 126.0, 135.0, 104.0, 65.0, 62.0, 42.0, 36.0, 16.0, 16.0, 16.0, 7.0, 6.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008220672607421875, -0.0007881522178649902, -0.000754237174987793, -0.0007203221321105957, -0.0006864070892333984, -0.0006524920463562012, -0.0006185770034790039, -0.0005846619606018066, -0.0005507469177246094, -0.0005168318748474121, -0.00048291683197021484, -0.0004490017890930176, -0.0004150867462158203, -0.00038117170333862305, -0.0003472566604614258, -0.0003133416175842285, -0.00027942657470703125, -0.000245511531829834, -0.00021159648895263672, -0.00017768144607543945, -0.0001437664031982422, -0.00010985136032104492, -7.593631744384766e-05, -4.202127456665039e-05, -8.106231689453125e-06, 2.580881118774414e-05, 5.9723854064941406e-05, 9.363889694213867e-05, 0.00012755393981933594, 0.0001614689826965332, 0.00019538402557373047, 0.00022929906845092773, 0.000263214111328125, 0.00029712915420532227, 0.00033104419708251953, 0.0003649592399597168, 0.00039887428283691406, 0.00043278932571411133, 0.0004667043685913086, 0.0005006194114685059, 0.0005345344543457031, 0.0005684494972229004, 0.0006023645401000977, 0.0006362795829772949, 0.0006701946258544922, 0.0007041096687316895, 0.0007380247116088867, 0.000771939754486084, 0.0008058547973632812, 0.0008397698402404785, 0.0008736848831176758, 0.000907599925994873, 0.0009415149688720703, 0.0009754300117492676, 0.0010093450546264648, 0.0010432600975036621, 0.0010771751403808594, 0.0011110901832580566, 0.001145005226135254, 0.0011789202690124512, 0.0012128353118896484, 0.0012467503547668457, 0.001280665397644043, 0.0013145804405212402, 0.0013484954833984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 12.0, 16.0, 15.0, 22.0, 25.0, 36.0, 54.0, 103.0, 167.0, 261.0, 509.0, 1058.0, 2513.0, 7859.0, 34229.0, 248346.0, 638780.0, 91202.0, 15766.0, 4298.0, 1582.0, 737.0, 359.0, 217.0, 136.0, 83.0, 60.0, 24.0, 27.0, 15.0, 3.0, 12.0, 3.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.46875, -6.29034423828125, -6.1119384765625, -5.93353271484375, -5.755126953125, -5.57672119140625, -5.3983154296875, -5.21990966796875, -5.04150390625, -4.86309814453125, -4.6846923828125, -4.50628662109375, -4.327880859375, -4.14947509765625, -3.9710693359375, -3.79266357421875, -3.6142578125, -3.43585205078125, -3.2574462890625, -3.07904052734375, -2.900634765625, -2.72222900390625, -2.5438232421875, -2.36541748046875, -2.18701171875, -2.00860595703125, -1.8302001953125, -1.65179443359375, -1.473388671875, -1.29498291015625, -1.1165771484375, -0.93817138671875, -0.759765625, -0.58135986328125, -0.4029541015625, -0.22454833984375, -0.046142578125, 0.13226318359375, 0.3106689453125, 0.48907470703125, 0.66748046875, 0.84588623046875, 1.0242919921875, 1.20269775390625, 1.381103515625, 1.55950927734375, 1.7379150390625, 1.91632080078125, 2.0947265625, 2.27313232421875, 2.4515380859375, 2.62994384765625, 2.808349609375, 2.98675537109375, 3.1651611328125, 3.34356689453125, 3.52197265625, 3.70037841796875, 3.8787841796875, 4.05718994140625, 4.235595703125, 4.41400146484375, 4.5924072265625, 4.77081298828125, 4.94921875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 10.0, 5.0, 19.0, 16.0, 19.0, 31.0, 38.0, 45.0, 68.0, 70.0, 71.0, 79.0, 106.0, 73.0, 65.0, 61.0, 60.0, 34.0, 26.0, 20.0, 16.0, 8.0, 11.0, 5.0, 12.0, 8.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.43359375, -5.27349853515625, -5.1134033203125, -4.95330810546875, -4.793212890625, -4.63311767578125, -4.4730224609375, -4.31292724609375, -4.15283203125, -3.99273681640625, -3.8326416015625, -3.67254638671875, -3.512451171875, -3.35235595703125, -3.1922607421875, -3.03216552734375, -2.8720703125, -2.71197509765625, -2.5518798828125, -2.39178466796875, -2.231689453125, -2.07159423828125, -1.9114990234375, -1.75140380859375, -1.59130859375, -1.43121337890625, -1.2711181640625, -1.11102294921875, -0.950927734375, -0.79083251953125, -0.6307373046875, -0.47064208984375, -0.310546875, -0.15045166015625, 0.0096435546875, 0.16973876953125, 0.329833984375, 0.48992919921875, 0.6500244140625, 0.81011962890625, 0.97021484375, 1.13031005859375, 1.2904052734375, 1.45050048828125, 1.610595703125, 1.77069091796875, 1.9307861328125, 2.09088134765625, 2.2509765625, 2.41107177734375, 2.5711669921875, 2.73126220703125, 2.891357421875, 3.05145263671875, 3.2115478515625, 3.37164306640625, 3.53173828125, 3.69183349609375, 3.8519287109375, 4.01202392578125, 4.172119140625, 4.33221435546875, 4.4923095703125, 4.65240478515625, 4.8125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 9.0, 11.0, 33.0, 53.0, 104.0, 137.0, 219.0, 192.0, 121.0, 52.0, 38.0, 22.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.90288543701172, -100.81990051269531, -96.73692321777344, -92.65393829345703, -88.57095336914062, -84.48797607421875, -80.40499114990234, -76.32200622558594, -72.23902893066406, -68.15604400634766, -64.07306671142578, -59.990081787109375, -55.90709686279297, -51.82411575317383, -47.74113464355469, -43.65814971923828, -39.575164794921875, -35.492183685302734, -31.409198760986328, -27.326217651367188, -23.243234634399414, -19.16025161743164, -15.0772705078125, -10.994287490844727, -6.911304473876953, -2.828321933746338, 1.2546606063842773, 5.337642669677734, 9.420625686645508, 13.503608703613281, 17.586589813232422, 21.669572830200195, 25.7525634765625, 29.835546493530273, 33.91852951049805, 38.00151062011719, 42.084495544433594, 46.167476654052734, 50.250457763671875, 54.33344268798828, 58.41642379760742, 62.49940490722656, 66.58238983154297, 70.66537475585938, 74.74835205078125, 78.83133697509766, 82.91432189941406, 86.99729919433594, 91.08028411865234, 95.16326904296875, 99.24624633789062, 103.32923126220703, 107.41221618652344, 111.49519348144531, 115.57817840576172, 119.66116333007812, 123.744140625, 127.8271255493164, 131.9101104736328, 135.9930877685547, 140.07606506347656, 144.1590576171875, 148.24203491210938, 152.32501220703125, 156.4080047607422]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [5.0, 3.0, 0.0, 4.0, 6.0, 5.0, 7.0, 9.0, 9.0, 28.0, 23.0, 51.0, 52.0, 58.0, 57.0, 83.0, 102.0, 101.0, 77.0, 77.0, 50.0, 59.0, 32.0, 29.0, 31.0, 15.0, 14.0, 8.0, 9.0, 7.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.24456787109375, -59.54783248901367, -55.85109329223633, -52.15435791015625, -48.457618713378906, -44.76088333129883, -41.06414794921875, -37.367408752441406, -33.67066955566406, -29.97393226623535, -26.27719497680664, -22.580459594726562, -18.88372039794922, -15.18698501586914, -11.49024772644043, -7.793510437011719, -4.096775054931641, -0.4000380039215088, 3.296699047088623, 6.993435859680176, 10.690173149108887, 14.386909484863281, 18.083646774291992, 21.780384063720703, 25.477121353149414, 29.173858642578125, 32.8705940246582, 36.56733322143555, 40.264068603515625, 43.96080780029297, 47.65754318237305, 51.354278564453125, 55.05101776123047, 58.74775314331055, 62.44449234008789, 66.14122772216797, 69.83796691894531, 73.53469848632812, 77.23143768310547, 80.92817687988281, 84.62491607666016, 88.3216552734375, 92.01838684082031, 95.71512603759766, 99.411865234375, 103.10859680175781, 106.80533599853516, 110.5020751953125, 114.19880676269531, 117.89554595947266, 121.59227752685547, 125.28901672363281, 128.98574829101562, 132.6824951171875, 136.3792266845703, 140.07595825195312, 143.772705078125, 147.4694366455078, 151.1661834716797, 154.8629150390625, 158.5596466064453, 162.2563934326172, 165.953125, 169.64987182617188, 173.3466033935547]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 4.0, 11.0, 28.0, 29.0, 64.0, 88.0, 191.0, 388.0, 818.0, 2014.0, 5575.0, 20867.0, 117209.0, 1690110.0, 2173144.0, 151496.0, 23596.0, 5620.0, 1741.0, 579.0, 287.0, 121.0, 87.0, 53.0, 43.0, 35.0, 20.0, 8.0, 13.0, 14.0, 4.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.5335693359375, -6.207763671875, -5.8819580078125, -5.55615234375, -5.2303466796875, -4.904541015625, -4.5787353515625, -4.2529296875, -3.9271240234375, -3.601318359375, -3.2755126953125, -2.94970703125, -2.6239013671875, -2.298095703125, -1.9722900390625, -1.646484375, -1.3206787109375, -0.994873046875, -0.6690673828125, -0.34326171875, -0.0174560546875, 0.308349609375, 0.6341552734375, 0.9599609375, 1.2857666015625, 1.611572265625, 1.9373779296875, 2.26318359375, 2.5889892578125, 2.914794921875, 3.2406005859375, 3.56640625, 3.8922119140625, 4.218017578125, 4.5438232421875, 4.86962890625, 5.1954345703125, 5.521240234375, 5.8470458984375, 6.1728515625, 6.4986572265625, 6.824462890625, 7.1502685546875, 7.47607421875, 7.8018798828125, 8.127685546875, 8.4534912109375, 8.779296875, 9.1051025390625, 9.430908203125, 9.7567138671875, 10.08251953125, 10.4083251953125, 10.734130859375, 11.0599365234375, 11.3857421875, 11.7115478515625, 12.037353515625, 12.3631591796875, 12.68896484375, 13.0147705078125, 13.340576171875, 13.6663818359375, 13.9921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 7.0, 4.0, 11.0, 22.0, 66.0, 72.0, 132.0, 154.0, 149.0, 153.0, 126.0, 58.0, 34.0, 11.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -6.89111328125, -6.4384765625, -5.98583984375, -5.533203125, -5.08056640625, -4.6279296875, -4.17529296875, -3.72265625, -3.27001953125, -2.8173828125, -2.36474609375, -1.912109375, -1.45947265625, -1.0068359375, -0.55419921875, -0.1015625, 0.35107421875, 0.8037109375, 1.25634765625, 1.708984375, 2.16162109375, 2.6142578125, 3.06689453125, 3.51953125, 3.97216796875, 4.4248046875, 4.87744140625, 5.330078125, 5.78271484375, 6.2353515625, 6.68798828125, 7.140625, 7.59326171875, 8.0458984375, 8.49853515625, 8.951171875, 9.40380859375, 9.8564453125, 10.30908203125, 10.76171875, 11.21435546875, 11.6669921875, 12.11962890625, 12.572265625, 13.02490234375, 13.4775390625, 13.93017578125, 14.3828125, 14.83544921875, 15.2880859375, 15.74072265625, 16.193359375, 16.64599609375, 17.0986328125, 17.55126953125, 18.00390625, 18.45654296875, 18.9091796875, 19.36181640625, 19.814453125, 20.26708984375, 20.7197265625, 21.17236328125, 21.625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 11.0, 32.0, 23.0, 47.0, 96.0, 143.0, 306.0, 612.0, 1408.0, 3535.0, 10430.0, 38299.0, 229896.0, 2969649.0, 829110.0, 83812.0, 18110.0, 5230.0, 1887.0, 791.0, 384.0, 173.0, 113.0, 59.0, 41.0, 22.0, 13.0, 8.0, 10.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.8944091796875, -10.515380859375, -10.1363525390625, -9.75732421875, -9.3782958984375, -8.999267578125, -8.6202392578125, -8.2412109375, -7.8621826171875, -7.483154296875, -7.1041259765625, -6.72509765625, -6.3460693359375, -5.967041015625, -5.5880126953125, -5.208984375, -4.8299560546875, -4.450927734375, -4.0718994140625, -3.69287109375, -3.3138427734375, -2.934814453125, -2.5557861328125, -2.1767578125, -1.7977294921875, -1.418701171875, -1.0396728515625, -0.66064453125, -0.2816162109375, 0.097412109375, 0.4764404296875, 0.85546875, 1.2344970703125, 1.613525390625, 1.9925537109375, 2.37158203125, 2.7506103515625, 3.129638671875, 3.5086669921875, 3.8876953125, 4.2667236328125, 4.645751953125, 5.0247802734375, 5.40380859375, 5.7828369140625, 6.161865234375, 6.5408935546875, 6.919921875, 7.2989501953125, 7.677978515625, 8.0570068359375, 8.43603515625, 8.8150634765625, 9.194091796875, 9.5731201171875, 9.9521484375, 10.3311767578125, 10.710205078125, 11.0892333984375, 11.46826171875, 11.8472900390625, 12.226318359375, 12.6053466796875, 12.984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 8.0, 2.0, 10.0, 12.0, 21.0, 16.0, 22.0, 31.0, 47.0, 75.0, 109.0, 145.0, 271.0, 420.0, 683.0, 701.0, 510.0, 353.0, 198.0, 129.0, 87.0, 66.0, 38.0, 24.0, 26.0, 19.0, 7.0, 7.0, 8.0, 8.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6015625, -11.1912841796875, -10.781005859375, -10.3707275390625, -9.96044921875, -9.5501708984375, -9.139892578125, -8.7296142578125, -8.3193359375, -7.9090576171875, -7.498779296875, -7.0885009765625, -6.67822265625, -6.2679443359375, -5.857666015625, -5.4473876953125, -5.037109375, -4.6268310546875, -4.216552734375, -3.8062744140625, -3.39599609375, -2.9857177734375, -2.575439453125, -2.1651611328125, -1.7548828125, -1.3446044921875, -0.934326171875, -0.5240478515625, -0.11376953125, 0.2965087890625, 0.706787109375, 1.1170654296875, 1.52734375, 1.9376220703125, 2.347900390625, 2.7581787109375, 3.16845703125, 3.5787353515625, 3.989013671875, 4.3992919921875, 4.8095703125, 5.2198486328125, 5.630126953125, 6.0404052734375, 6.45068359375, 6.8609619140625, 7.271240234375, 7.6815185546875, 8.091796875, 8.5020751953125, 8.912353515625, 9.3226318359375, 9.73291015625, 10.1431884765625, 10.553466796875, 10.9637451171875, 11.3740234375, 11.7843017578125, 12.194580078125, 12.6048583984375, 13.01513671875, 13.4254150390625, 13.835693359375, 14.2459716796875, 14.65625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 11.0, 17.0, 28.0, 69.0, 101.0, 214.0, 222.0, 169.0, 92.0, 35.0, 18.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.29918670654297, -64.43740844726562, -59.57563400268555, -54.7138557434082, -49.852081298828125, -44.99030303955078, -40.12852478027344, -35.26675033569336, -30.404972076416016, -25.543195724487305, -20.681419372558594, -15.81964111328125, -10.957864761352539, -6.096088409423828, -1.2343101501464844, 3.6274642944335938, 8.489242553710938, 13.351018905639648, 18.21279525756836, 23.074573516845703, 27.936349868774414, 32.798126220703125, 37.65990447998047, 42.52167892456055, 47.38345718383789, 52.245235443115234, 57.10700988769531, 61.968788146972656, 66.83056640625, 71.69233703613281, 76.55412292480469, 81.4158935546875, 86.27766418457031, 91.13944244384766, 96.001220703125, 100.86299133300781, 105.72476959228516, 110.5865478515625, 115.44832611083984, 120.31010437011719, 125.171875, 130.0336456298828, 134.8954315185547, 139.7572021484375, 144.61898803710938, 149.4807586669922, 154.342529296875, 159.20431518554688, 164.06610107421875, 168.92787170410156, 173.78965759277344, 178.65142822265625, 183.51321411132812, 188.37498474121094, 193.23675537109375, 198.09854125976562, 202.96031188964844, 207.82208251953125, 212.68386840820312, 217.54563903808594, 222.4074249267578, 227.26919555664062, 232.1309814453125, 236.9927520751953, 241.85452270507812]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 12.0, 22.0, 36.0, 31.0, 32.0, 78.0, 82.0, 87.0, 95.0, 106.0, 74.0, 73.0, 79.0, 49.0, 40.0, 28.0, 35.0, 14.0, 8.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-171.31390380859375, -167.6932373046875, -164.0725555419922, -160.45188903808594, -156.83120727539062, -153.21054077148438, -149.58985900878906, -145.9691925048828, -142.3485107421875, -138.72784423828125, -135.10716247558594, -131.4864959716797, -127.86581420898438, -124.24514770507812, -120.62447357177734, -117.00379943847656, -113.38313293457031, -109.76245880126953, -106.14178466796875, -102.52111053466797, -98.90043640136719, -95.27976989746094, -91.65909576416016, -88.03842163085938, -84.4177474975586, -80.79707336425781, -77.17639923095703, -73.55572509765625, -69.93505859375, -66.31437683105469, -62.69371032714844, -59.073036193847656, -55.452369689941406, -51.831695556640625, -48.211021423339844, -44.59035110473633, -40.96967697143555, -37.349002838134766, -33.72833251953125, -30.10765838623047, -26.486984252929688, -22.866310119628906, -19.245637893676758, -15.624964714050293, -12.004291534423828, -8.383617401123047, -4.762945175170898, -1.14227294921875, 2.4784011840820312, 6.099074363708496, 9.719747543334961, 13.340420722961426, 16.96109390258789, 20.581768035888672, 24.20244026184082, 27.82311248779297, 31.44378662109375, 35.06446075439453, 38.68513488769531, 42.30580520629883, 45.92647933959961, 49.54715347290039, 53.167823791503906, 56.78849792480469, 60.40917205810547]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 6.0, 0.0, 4.0, 7.0, 7.0, 10.0, 17.0, 25.0, 40.0, 77.0, 107.0, 188.0, 329.0, 533.0, 916.0, 1924.0, 3579.0, 7362.0, 16461.0, 38483.0, 88969.0, 213883.0, 349972.0, 186375.0, 77969.0, 33153.0, 14471.0, 6793.0, 3195.0, 1638.0, 883.0, 472.0, 281.0, 154.0, 106.0, 56.0, 37.0, 31.0, 15.0, 16.0, 2.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.51953125, -7.24530029296875, -6.9710693359375, -6.69683837890625, -6.422607421875, -6.14837646484375, -5.8741455078125, -5.59991455078125, -5.32568359375, -5.05145263671875, -4.7772216796875, -4.50299072265625, -4.228759765625, -3.95452880859375, -3.6802978515625, -3.40606689453125, -3.1318359375, -2.85760498046875, -2.5833740234375, -2.30914306640625, -2.034912109375, -1.76068115234375, -1.4864501953125, -1.21221923828125, -0.93798828125, -0.66375732421875, -0.3895263671875, -0.11529541015625, 0.158935546875, 0.43316650390625, 0.7073974609375, 0.98162841796875, 1.255859375, 1.53009033203125, 1.8043212890625, 2.07855224609375, 2.352783203125, 2.62701416015625, 2.9012451171875, 3.17547607421875, 3.44970703125, 3.72393798828125, 3.9981689453125, 4.27239990234375, 4.546630859375, 4.82086181640625, 5.0950927734375, 5.36932373046875, 5.6435546875, 5.91778564453125, 6.1920166015625, 6.46624755859375, 6.740478515625, 7.01470947265625, 7.2889404296875, 7.56317138671875, 7.83740234375, 8.11163330078125, 8.3858642578125, 8.66009521484375, 8.934326171875, 9.20855712890625, 9.4827880859375, 9.75701904296875, 10.03125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 5.0, 5.0, 7.0, 9.0, 22.0, 22.0, 39.0, 36.0, 40.0, 56.0, 68.0, 60.0, 52.0, 63.0, 88.0, 73.0, 64.0, 70.0, 58.0, 43.0, 41.0, 22.0, 18.0, 18.0, 6.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.58203125, -7.3697509765625, -7.157470703125, -6.9451904296875, -6.73291015625, -6.5206298828125, -6.308349609375, -6.0960693359375, -5.8837890625, -5.6715087890625, -5.459228515625, -5.2469482421875, -5.03466796875, -4.8223876953125, -4.610107421875, -4.3978271484375, -4.185546875, -3.9732666015625, -3.760986328125, -3.5487060546875, -3.33642578125, -3.1241455078125, -2.911865234375, -2.6995849609375, -2.4873046875, -2.2750244140625, -2.062744140625, -1.8504638671875, -1.63818359375, -1.4259033203125, -1.213623046875, -1.0013427734375, -0.7890625, -0.5767822265625, -0.364501953125, -0.1522216796875, 0.06005859375, 0.2723388671875, 0.484619140625, 0.6968994140625, 0.9091796875, 1.1214599609375, 1.333740234375, 1.5460205078125, 1.75830078125, 1.9705810546875, 2.182861328125, 2.3951416015625, 2.607421875, 2.8197021484375, 3.031982421875, 3.2442626953125, 3.45654296875, 3.6688232421875, 3.881103515625, 4.0933837890625, 4.3056640625, 4.5179443359375, 4.730224609375, 4.9425048828125, 5.15478515625, 5.3670654296875, 5.579345703125, 5.7916259765625, 6.00390625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 11.0, 17.0, 19.0, 21.0, 25.0, 31.0, 51.0, 70.0, 105.0, 141.0, 196.0, 246.0, 386.0, 556.0, 996.0, 1624.0, 3376.0, 9166.0, 45509.0, 420244.0, 501363.0, 47182.0, 9165.0, 3357.0, 1753.0, 976.0, 624.0, 365.0, 272.0, 186.0, 139.0, 83.0, 72.0, 60.0, 41.0, 24.0, 25.0, 14.0, 9.0, 9.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0625, -16.474365234375, -15.88623046875, -15.298095703125, -14.7099609375, -14.121826171875, -13.53369140625, -12.945556640625, -12.357421875, -11.769287109375, -11.18115234375, -10.593017578125, -10.0048828125, -9.416748046875, -8.82861328125, -8.240478515625, -7.65234375, -7.064208984375, -6.47607421875, -5.887939453125, -5.2998046875, -4.711669921875, -4.12353515625, -3.535400390625, -2.947265625, -2.359130859375, -1.77099609375, -1.182861328125, -0.5947265625, -0.006591796875, 0.58154296875, 1.169677734375, 1.7578125, 2.345947265625, 2.93408203125, 3.522216796875, 4.1103515625, 4.698486328125, 5.28662109375, 5.874755859375, 6.462890625, 7.051025390625, 7.63916015625, 8.227294921875, 8.8154296875, 9.403564453125, 9.99169921875, 10.579833984375, 11.16796875, 11.756103515625, 12.34423828125, 12.932373046875, 13.5205078125, 14.108642578125, 14.69677734375, 15.284912109375, 15.873046875, 16.461181640625, 17.04931640625, 17.637451171875, 18.2255859375, 18.813720703125, 19.40185546875, 19.989990234375, 20.578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 6.0, 16.0, 18.0, 23.0, 22.0, 29.0, 35.0, 44.0, 55.0, 50.0, 42.0, 56.0, 59.0, 58.0, 62.0, 47.0, 52.0, 50.0, 41.0, 36.0, 32.0, 37.0, 33.0, 33.0, 14.0, 10.0, 5.0, 7.0, 6.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.390625, -21.6591796875, -20.927734375, -20.1962890625, -19.46484375, -18.7333984375, -18.001953125, -17.2705078125, -16.5390625, -15.8076171875, -15.076171875, -14.3447265625, -13.61328125, -12.8818359375, -12.150390625, -11.4189453125, -10.6875, -9.9560546875, -9.224609375, -8.4931640625, -7.76171875, -7.0302734375, -6.298828125, -5.5673828125, -4.8359375, -4.1044921875, -3.373046875, -2.6416015625, -1.91015625, -1.1787109375, -0.447265625, 0.2841796875, 1.015625, 1.7470703125, 2.478515625, 3.2099609375, 3.94140625, 4.6728515625, 5.404296875, 6.1357421875, 6.8671875, 7.5986328125, 8.330078125, 9.0615234375, 9.79296875, 10.5244140625, 11.255859375, 11.9873046875, 12.71875, 13.4501953125, 14.181640625, 14.9130859375, 15.64453125, 16.3759765625, 17.107421875, 17.8388671875, 18.5703125, 19.3017578125, 20.033203125, 20.7646484375, 21.49609375, 22.2275390625, 22.958984375, 23.6904296875, 24.421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 4.0, 7.0, 14.0, 18.0, 11.0, 15.0, 32.0, 52.0, 68.0, 143.0, 222.0, 428.0, 1040.0, 3260.0, 16361.0, 127745.0, 766746.0, 112755.0, 14533.0, 3059.0, 983.0, 423.0, 247.0, 129.0, 68.0, 42.0, 32.0, 23.0, 19.0, 7.0, 9.0, 12.0, 6.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-6.375, -6.1900634765625, -6.005126953125, -5.8201904296875, -5.63525390625, -5.4503173828125, -5.265380859375, -5.0804443359375, -4.8955078125, -4.7105712890625, -4.525634765625, -4.3406982421875, -4.15576171875, -3.9708251953125, -3.785888671875, -3.6009521484375, -3.416015625, -3.2310791015625, -3.046142578125, -2.8612060546875, -2.67626953125, -2.4913330078125, -2.306396484375, -2.1214599609375, -1.9365234375, -1.7515869140625, -1.566650390625, -1.3817138671875, -1.19677734375, -1.0118408203125, -0.826904296875, -0.6419677734375, -0.45703125, -0.2720947265625, -0.087158203125, 0.0977783203125, 0.28271484375, 0.4676513671875, 0.652587890625, 0.8375244140625, 1.0224609375, 1.2073974609375, 1.392333984375, 1.5772705078125, 1.76220703125, 1.9471435546875, 2.132080078125, 2.3170166015625, 2.501953125, 2.6868896484375, 2.871826171875, 3.0567626953125, 3.24169921875, 3.4266357421875, 3.611572265625, 3.7965087890625, 3.9814453125, 4.1663818359375, 4.351318359375, 4.5362548828125, 4.72119140625, 4.9061279296875, 5.091064453125, 5.2760009765625, 5.4609375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 3.0, 7.0, 6.0, 1.0, 6.0, 10.0, 13.0, 21.0, 23.0, 22.0, 32.0, 36.0, 39.0, 50.0, 61.0, 85.0, 130.0, 97.0, 78.0, 50.0, 42.0, 45.0, 30.0, 26.0, 15.0, 16.0, 15.0, 9.0, 8.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0], "bins": [-0.0014705657958984375, -0.001436866819858551, -0.0014031678438186646, -0.001369468867778778, -0.0013357698917388916, -0.0013020709156990051, -0.0012683719396591187, -0.0012346729636192322, -0.0012009739875793457, -0.0011672750115394592, -0.0011335760354995728, -0.0010998770594596863, -0.0010661780834197998, -0.0010324791073799133, -0.0009987801313400269, -0.0009650811553001404, -0.0009313821792602539, -0.0008976832032203674, -0.000863984227180481, -0.0008302852511405945, -0.000796586275100708, -0.0007628872990608215, -0.0007291883230209351, -0.0006954893469810486, -0.0006617903709411621, -0.0006280913949012756, -0.0005943924188613892, -0.0005606934428215027, -0.0005269944667816162, -0.0004932954907417297, -0.00045959651470184326, -0.0004258975386619568, -0.0003921985626220703, -0.00035849958658218384, -0.00032480061054229736, -0.0002911016345024109, -0.0002574026584625244, -0.00022370368242263794, -0.00019000470638275146, -0.000156305730342865, -0.00012260675430297852, -8.890777826309204e-05, -5.5208802223205566e-05, -2.1509826183319092e-05, 1.2189149856567383e-05, 4.588812589645386e-05, 7.958710193634033e-05, 0.0001132860779762268, 0.00014698505401611328, 0.00018068403005599976, 0.00021438300609588623, 0.0002480819821357727, 0.0002817809581756592, 0.00031547993421554565, 0.00034917891025543213, 0.0003828778862953186, 0.0004165768623352051, 0.00045027583837509155, 0.00048397481441497803, 0.0005176737904548645, 0.000551372766494751, 0.0005850717425346375, 0.0006187707185745239, 0.0006524696946144104, 0.0006861686706542969]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 16.0, 18.0, 22.0, 41.0, 81.0, 118.0, 206.0, 407.0, 785.0, 1757.0, 4787.0, 22567.0, 287662.0, 676480.0, 42479.0, 6868.0, 2169.0, 983.0, 483.0, 249.0, 153.0, 76.0, 46.0, 27.0, 17.0, 12.0, 13.0, 6.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1953125, -6.00836181640625, -5.8214111328125, -5.63446044921875, -5.447509765625, -5.26055908203125, -5.0736083984375, -4.88665771484375, -4.69970703125, -4.51275634765625, -4.3258056640625, -4.13885498046875, -3.951904296875, -3.76495361328125, -3.5780029296875, -3.39105224609375, -3.2041015625, -3.01715087890625, -2.8302001953125, -2.64324951171875, -2.456298828125, -2.26934814453125, -2.0823974609375, -1.89544677734375, -1.70849609375, -1.52154541015625, -1.3345947265625, -1.14764404296875, -0.960693359375, -0.77374267578125, -0.5867919921875, -0.39984130859375, -0.212890625, -0.02593994140625, 0.1610107421875, 0.34796142578125, 0.534912109375, 0.72186279296875, 0.9088134765625, 1.09576416015625, 1.28271484375, 1.46966552734375, 1.6566162109375, 1.84356689453125, 2.030517578125, 2.21746826171875, 2.4044189453125, 2.59136962890625, 2.7783203125, 2.96527099609375, 3.1522216796875, 3.33917236328125, 3.526123046875, 3.71307373046875, 3.9000244140625, 4.08697509765625, 4.27392578125, 4.46087646484375, 4.6478271484375, 4.83477783203125, 5.021728515625, 5.20867919921875, 5.3956298828125, 5.58258056640625, 5.76953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 3.0, 10.0, 9.0, 16.0, 24.0, 26.0, 40.0, 47.0, 54.0, 92.0, 100.0, 99.0, 104.0, 83.0, 72.0, 48.0, 40.0, 37.0, 31.0, 21.0, 16.0, 10.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5625, -5.4110107421875, -5.259521484375, -5.1080322265625, -4.95654296875, -4.8050537109375, -4.653564453125, -4.5020751953125, -4.3505859375, -4.1990966796875, -4.047607421875, -3.8961181640625, -3.74462890625, -3.5931396484375, -3.441650390625, -3.2901611328125, -3.138671875, -2.9871826171875, -2.835693359375, -2.6842041015625, -2.53271484375, -2.3812255859375, -2.229736328125, -2.0782470703125, -1.9267578125, -1.7752685546875, -1.623779296875, -1.4722900390625, -1.32080078125, -1.1693115234375, -1.017822265625, -0.8663330078125, -0.71484375, -0.5633544921875, -0.411865234375, -0.2603759765625, -0.10888671875, 0.0426025390625, 0.194091796875, 0.3455810546875, 0.4970703125, 0.6485595703125, 0.800048828125, 0.9515380859375, 1.10302734375, 1.2545166015625, 1.406005859375, 1.5574951171875, 1.708984375, 1.8604736328125, 2.011962890625, 2.1634521484375, 2.31494140625, 2.4664306640625, 2.617919921875, 2.7694091796875, 2.9208984375, 3.0723876953125, 3.223876953125, 3.3753662109375, 3.52685546875, 3.6783447265625, 3.829833984375, 3.9813232421875, 4.1328125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 8.0, 9.0, 18.0, 32.0, 72.0, 120.0, 161.0, 237.0, 139.0, 84.0, 56.0, 29.0, 12.0, 5.0, 9.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.37045288085938, -112.7570571899414, -109.14366912841797, -105.5302734375, -101.91688537597656, -98.3034896850586, -94.69009399414062, -91.07670593261719, -87.46331024169922, -83.84991455078125, -80.23652648925781, -76.62313079833984, -73.0097427368164, -69.39634704589844, -65.782958984375, -62.16956329345703, -58.55617141723633, -54.942779541015625, -51.32938766479492, -47.71599578857422, -44.10260009765625, -40.48920822143555, -36.875816345214844, -33.262420654296875, -29.649030685424805, -26.0356388092041, -22.422245025634766, -18.808853149414062, -15.195460319519043, -11.582067489624023, -7.96867561340332, -4.355281829833984, -0.7418899536132812, 2.871502637863159, 6.4848952293396, 10.098287582397461, 13.71168041229248, 17.3250732421875, 20.938465118408203, 24.55185890197754, 28.165250778198242, 31.778642654418945, 35.39203643798828, 39.005428314208984, 42.61882019042969, 46.232215881347656, 49.845603942871094, 53.45899963378906, 57.072391510009766, 60.68578338623047, 64.29917907714844, 67.91256713867188, 71.52596282958984, 75.13935852050781, 78.75274658203125, 82.36614227294922, 85.97953033447266, 89.59292602539062, 93.20631408691406, 96.81970977783203, 100.43309783935547, 104.04649353027344, 107.65988159179688, 111.27327728271484, 114.88667297363281]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 18.0, 11.0, 11.0, 15.0, 25.0, 20.0, 29.0, 24.0, 28.0, 37.0, 26.0, 39.0, 44.0, 61.0, 65.0, 79.0, 64.0, 45.0, 39.0, 29.0, 31.0, 38.0, 27.0, 31.0, 27.0, 21.0, 13.0, 14.0, 15.0, 9.0, 10.0, 9.0, 6.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-77.44097900390625, -75.11964416503906, -72.79830932617188, -70.47698211669922, -68.15564727783203, -65.83431243896484, -63.512977600097656, -61.19164276123047, -58.87031173706055, -56.54897689819336, -54.22764587402344, -51.90631103515625, -49.58497619628906, -47.26364517211914, -44.94231033325195, -42.62097930908203, -40.299644470214844, -37.978309631347656, -35.656978607177734, -33.33564376831055, -31.014310836791992, -28.692977905273438, -26.37164306640625, -24.050310134887695, -21.72897720336914, -19.407644271850586, -17.08631134033203, -14.764976501464844, -12.443643569946289, -10.122310638427734, -7.800976753234863, -5.479642868041992, -3.1583099365234375, -0.8369765281677246, 1.4843568801879883, 3.805690288543701, 6.127023696899414, 8.448356628417969, 10.76969051361084, 13.091024398803711, 15.412357330322266, 17.73369026184082, 20.055023193359375, 22.376358032226562, 24.697690963745117, 27.019023895263672, 29.34035873413086, 31.661691665649414, 33.98302459716797, 36.304359436035156, 38.62569046020508, 40.947025299072266, 43.26835632324219, 45.589691162109375, 47.91102600097656, 50.23236083984375, 52.55369186401367, 54.87502670288086, 57.19635772705078, 59.51769256591797, 61.839027404785156, 64.16035461425781, 66.481689453125, 68.80302429199219, 71.12435913085938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 8.0, 17.0, 27.0, 44.0, 72.0, 115.0, 222.0, 498.0, 1160.0, 3045.0, 9608.0, 40597.0, 316884.0, 3043267.0, 690043.0, 67332.0, 14578.0, 4206.0, 1461.0, 596.0, 240.0, 113.0, 55.0, 26.0, 21.0, 11.0, 11.0, 8.0, 5.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.70703125, -6.42327880859375, -6.1395263671875, -5.85577392578125, -5.572021484375, -5.28826904296875, -5.0045166015625, -4.72076416015625, -4.43701171875, -4.15325927734375, -3.8695068359375, -3.58575439453125, -3.302001953125, -3.01824951171875, -2.7344970703125, -2.45074462890625, -2.1669921875, -1.88323974609375, -1.5994873046875, -1.31573486328125, -1.031982421875, -0.74822998046875, -0.4644775390625, -0.18072509765625, 0.10302734375, 0.38677978515625, 0.6705322265625, 0.95428466796875, 1.238037109375, 1.52178955078125, 1.8055419921875, 2.08929443359375, 2.373046875, 2.65679931640625, 2.9405517578125, 3.22430419921875, 3.508056640625, 3.79180908203125, 4.0755615234375, 4.35931396484375, 4.64306640625, 4.92681884765625, 5.2105712890625, 5.49432373046875, 5.778076171875, 6.06182861328125, 6.3455810546875, 6.62933349609375, 6.9130859375, 7.19683837890625, 7.4805908203125, 7.76434326171875, 8.048095703125, 8.33184814453125, 8.6156005859375, 8.89935302734375, 9.18310546875, 9.46685791015625, 9.7506103515625, 10.03436279296875, 10.318115234375, 10.60186767578125, 10.8856201171875, 11.16937255859375, 11.453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 2.0, 6.0, 5.0, 8.0, 10.0, 11.0, 29.0, 21.0, 26.0, 45.0, 37.0, 54.0, 45.0, 61.0, 55.0, 65.0, 66.0, 59.0, 69.0, 61.0, 65.0, 44.0, 34.0, 34.0, 19.0, 23.0, 11.0, 10.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.5625, -7.367919921875, -7.17333984375, -6.978759765625, -6.7841796875, -6.589599609375, -6.39501953125, -6.200439453125, -6.005859375, -5.811279296875, -5.61669921875, -5.422119140625, -5.2275390625, -5.032958984375, -4.83837890625, -4.643798828125, -4.44921875, -4.254638671875, -4.06005859375, -3.865478515625, -3.6708984375, -3.476318359375, -3.28173828125, -3.087158203125, -2.892578125, -2.697998046875, -2.50341796875, -2.308837890625, -2.1142578125, -1.919677734375, -1.72509765625, -1.530517578125, -1.3359375, -1.141357421875, -0.94677734375, -0.752197265625, -0.5576171875, -0.363037109375, -0.16845703125, 0.026123046875, 0.220703125, 0.415283203125, 0.60986328125, 0.804443359375, 0.9990234375, 1.193603515625, 1.38818359375, 1.582763671875, 1.77734375, 1.971923828125, 2.16650390625, 2.361083984375, 2.5556640625, 2.750244140625, 2.94482421875, 3.139404296875, 3.333984375, 3.528564453125, 3.72314453125, 3.917724609375, 4.1123046875, 4.306884765625, 4.50146484375, 4.696044921875, 4.890625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 15.0, 13.0, 28.0, 31.0, 59.0, 130.0, 282.0, 621.0, 1408.0, 3993.0, 12010.0, 51521.0, 504615.0, 3334452.0, 237653.0, 34191.0, 8675.0, 2697.0, 1013.0, 406.0, 195.0, 99.0, 50.0, 35.0, 24.0, 22.0, 8.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.796875, -14.40087890625, -14.0048828125, -13.60888671875, -13.212890625, -12.81689453125, -12.4208984375, -12.02490234375, -11.62890625, -11.23291015625, -10.8369140625, -10.44091796875, -10.044921875, -9.64892578125, -9.2529296875, -8.85693359375, -8.4609375, -8.06494140625, -7.6689453125, -7.27294921875, -6.876953125, -6.48095703125, -6.0849609375, -5.68896484375, -5.29296875, -4.89697265625, -4.5009765625, -4.10498046875, -3.708984375, -3.31298828125, -2.9169921875, -2.52099609375, -2.125, -1.72900390625, -1.3330078125, -0.93701171875, -0.541015625, -0.14501953125, 0.2509765625, 0.64697265625, 1.04296875, 1.43896484375, 1.8349609375, 2.23095703125, 2.626953125, 3.02294921875, 3.4189453125, 3.81494140625, 4.2109375, 4.60693359375, 5.0029296875, 5.39892578125, 5.794921875, 6.19091796875, 6.5869140625, 6.98291015625, 7.37890625, 7.77490234375, 8.1708984375, 8.56689453125, 8.962890625, 9.35888671875, 9.7548828125, 10.15087890625, 10.546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 12.0, 9.0, 11.0, 12.0, 25.0, 31.0, 53.0, 72.0, 63.0, 142.0, 198.0, 316.0, 486.0, 667.0, 605.0, 446.0, 282.0, 188.0, 122.0, 78.0, 59.0, 45.0, 24.0, 24.0, 21.0, 12.0, 8.0, 5.0, 8.0, 4.0, 4.0, 8.0, 6.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-11.953125, -11.6197509765625, -11.286376953125, -10.9530029296875, -10.61962890625, -10.2862548828125, -9.952880859375, -9.6195068359375, -9.2861328125, -8.9527587890625, -8.619384765625, -8.2860107421875, -7.95263671875, -7.6192626953125, -7.285888671875, -6.9525146484375, -6.619140625, -6.2857666015625, -5.952392578125, -5.6190185546875, -5.28564453125, -4.9522705078125, -4.618896484375, -4.2855224609375, -3.9521484375, -3.6187744140625, -3.285400390625, -2.9520263671875, -2.61865234375, -2.2852783203125, -1.951904296875, -1.6185302734375, -1.28515625, -0.9517822265625, -0.618408203125, -0.2850341796875, 0.04833984375, 0.3817138671875, 0.715087890625, 1.0484619140625, 1.3818359375, 1.7152099609375, 2.048583984375, 2.3819580078125, 2.71533203125, 3.0487060546875, 3.382080078125, 3.7154541015625, 4.048828125, 4.3822021484375, 4.715576171875, 5.0489501953125, 5.38232421875, 5.7156982421875, 6.049072265625, 6.3824462890625, 6.7158203125, 7.0491943359375, 7.382568359375, 7.7159423828125, 8.04931640625, 8.3826904296875, 8.716064453125, 9.0494384765625, 9.3828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 16.0, 30.0, 78.0, 123.0, 222.0, 189.0, 161.0, 64.0, 40.0, 22.0, 12.0, 8.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.49143981933594, -100.48389434814453, -96.47634887695312, -92.46880340576172, -88.46125793457031, -84.45370483398438, -80.44615936279297, -76.43861389160156, -72.43106842041016, -68.42352294921875, -64.41597747802734, -60.40842819213867, -56.400882720947266, -52.39333724975586, -48.38578796386719, -44.37824249267578, -40.370697021484375, -36.36315155029297, -32.35560607910156, -28.34805679321289, -24.340511322021484, -20.332965850830078, -16.32541847229004, -12.31787109375, -8.310325622558594, -4.302779197692871, -0.29523277282714844, 3.712313652038574, 7.719860076904297, 11.727405548095703, 15.734952926635742, 19.74250030517578, 23.75006103515625, 27.757606506347656, 31.765153884887695, 35.772701263427734, 39.78024673461914, 43.78779220581055, 47.79534149169922, 51.802886962890625, 55.81043243408203, 59.81797790527344, 63.825523376464844, 67.83306884765625, 71.84062194824219, 75.84815979003906, 79.855712890625, 83.8632583618164, 87.87080383300781, 91.87834930419922, 95.88589477539062, 99.89344024658203, 103.90098571777344, 107.90853881835938, 111.91608428955078, 115.92362976074219, 119.9311752319336, 123.938720703125, 127.9462661743164, 131.9538116455078, 135.96136474609375, 139.96890258789062, 143.97645568847656, 147.9840087890625, 151.99154663085938]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 9.0, 9.0, 13.0, 12.0, 16.0, 20.0, 19.0, 24.0, 34.0, 25.0, 34.0, 34.0, 58.0, 65.0, 49.0, 40.0, 59.0, 62.0, 42.0, 45.0, 47.0, 33.0, 33.0, 30.0, 38.0, 24.0, 23.0, 24.0, 15.0, 9.0, 11.0, 7.0, 5.0, 7.0, 6.0, 3.0, 0.0, 6.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.781036376953125, -53.00529479980469, -51.22955322265625, -49.45381164550781, -47.678070068359375, -45.90232849121094, -44.1265869140625, -42.35084533691406, -40.575103759765625, -38.79936218261719, -37.02362060546875, -35.24787902832031, -33.472137451171875, -31.696395874023438, -29.920656204223633, -28.144914627075195, -26.36917495727539, -24.593433380126953, -22.817691802978516, -21.041950225830078, -19.26620864868164, -17.490467071533203, -15.714727401733398, -13.938985824584961, -12.163244247436523, -10.387502670288086, -8.611761093139648, -6.836020469665527, -5.06027889251709, -3.2845373153686523, -1.5087966918945312, 0.26694488525390625, 2.0426902770996094, 3.8184316158294678, 5.594172954559326, 7.3699140548706055, 9.145655632019043, 10.92139720916748, 12.697137832641602, 14.472879409790039, 16.248620986938477, 18.024362564086914, 19.80010414123535, 21.575843811035156, 23.351585388183594, 25.12732696533203, 26.90306854248047, 28.678810119628906, 30.454551696777344, 32.23029327392578, 34.00603485107422, 35.781776428222656, 37.557518005371094, 39.33325958251953, 41.10900115966797, 42.884742736816406, 44.660484313964844, 46.43622589111328, 48.21196746826172, 49.987709045410156, 51.763450622558594, 53.53919219970703, 55.31493377685547, 57.090675354003906, 58.86641311645508]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 15.0, 25.0, 44.0, 52.0, 93.0, 153.0, 301.0, 557.0, 1025.0, 2016.0, 4074.0, 8219.0, 18873.0, 44183.0, 118053.0, 349562.0, 322205.0, 105766.0, 40363.0, 17306.0, 7793.0, 3779.0, 1982.0, 983.0, 499.0, 308.0, 141.0, 64.0, 47.0, 27.0, 22.0, 12.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.1484375, -9.86614990234375, -9.5838623046875, -9.30157470703125, -9.019287109375, -8.73699951171875, -8.4547119140625, -8.17242431640625, -7.89013671875, -7.60784912109375, -7.3255615234375, -7.04327392578125, -6.760986328125, -6.47869873046875, -6.1964111328125, -5.91412353515625, -5.6318359375, -5.34954833984375, -5.0672607421875, -4.78497314453125, -4.502685546875, -4.22039794921875, -3.9381103515625, -3.65582275390625, -3.37353515625, -3.09124755859375, -2.8089599609375, -2.52667236328125, -2.244384765625, -1.96209716796875, -1.6798095703125, -1.39752197265625, -1.115234375, -0.83294677734375, -0.5506591796875, -0.26837158203125, 0.013916015625, 0.29620361328125, 0.5784912109375, 0.86077880859375, 1.14306640625, 1.42535400390625, 1.7076416015625, 1.98992919921875, 2.272216796875, 2.55450439453125, 2.8367919921875, 3.11907958984375, 3.4013671875, 3.68365478515625, 3.9659423828125, 4.24822998046875, 4.530517578125, 4.81280517578125, 5.0950927734375, 5.37738037109375, 5.65966796875, 5.94195556640625, 6.2242431640625, 6.50653076171875, 6.788818359375, 7.07110595703125, 7.3533935546875, 7.63568115234375, 7.91796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 12.0, 9.0, 17.0, 18.0, 22.0, 30.0, 32.0, 45.0, 55.0, 57.0, 67.0, 46.0, 60.0, 65.0, 77.0, 71.0, 54.0, 46.0, 47.0, 37.0, 27.0, 21.0, 21.0, 19.0, 11.0, 6.0, 5.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-7.55859375, -7.36444091796875, -7.1702880859375, -6.97613525390625, -6.781982421875, -6.58782958984375, -6.3936767578125, -6.19952392578125, -6.00537109375, -5.81121826171875, -5.6170654296875, -5.42291259765625, -5.228759765625, -5.03460693359375, -4.8404541015625, -4.64630126953125, -4.4521484375, -4.25799560546875, -4.0638427734375, -3.86968994140625, -3.675537109375, -3.48138427734375, -3.2872314453125, -3.09307861328125, -2.89892578125, -2.70477294921875, -2.5106201171875, -2.31646728515625, -2.122314453125, -1.92816162109375, -1.7340087890625, -1.53985595703125, -1.345703125, -1.15155029296875, -0.9573974609375, -0.76324462890625, -0.569091796875, -0.37493896484375, -0.1807861328125, 0.01336669921875, 0.20751953125, 0.40167236328125, 0.5958251953125, 0.78997802734375, 0.984130859375, 1.17828369140625, 1.3724365234375, 1.56658935546875, 1.7607421875, 1.95489501953125, 2.1490478515625, 2.34320068359375, 2.537353515625, 2.73150634765625, 2.9256591796875, 3.11981201171875, 3.31396484375, 3.50811767578125, 3.7022705078125, 3.89642333984375, 4.090576171875, 4.28472900390625, 4.4788818359375, 4.67303466796875, 4.8671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 6.0, 11.0, 14.0, 13.0, 33.0, 40.0, 68.0, 81.0, 114.0, 156.0, 228.0, 392.0, 554.0, 946.0, 1783.0, 4030.0, 14245.0, 94983.0, 769036.0, 134931.0, 17723.0, 4618.0, 1852.0, 971.0, 610.0, 384.0, 220.0, 173.0, 93.0, 70.0, 49.0, 42.0, 25.0, 21.0, 12.0, 10.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-23.109375, -22.494384765625, -21.87939453125, -21.264404296875, -20.6494140625, -20.034423828125, -19.41943359375, -18.804443359375, -18.189453125, -17.574462890625, -16.95947265625, -16.344482421875, -15.7294921875, -15.114501953125, -14.49951171875, -13.884521484375, -13.26953125, -12.654541015625, -12.03955078125, -11.424560546875, -10.8095703125, -10.194580078125, -9.57958984375, -8.964599609375, -8.349609375, -7.734619140625, -7.11962890625, -6.504638671875, -5.8896484375, -5.274658203125, -4.65966796875, -4.044677734375, -3.4296875, -2.814697265625, -2.19970703125, -1.584716796875, -0.9697265625, -0.354736328125, 0.26025390625, 0.875244140625, 1.490234375, 2.105224609375, 2.72021484375, 3.335205078125, 3.9501953125, 4.565185546875, 5.18017578125, 5.795166015625, 6.41015625, 7.025146484375, 7.64013671875, 8.255126953125, 8.8701171875, 9.485107421875, 10.10009765625, 10.715087890625, 11.330078125, 11.945068359375, 12.56005859375, 13.175048828125, 13.7900390625, 14.405029296875, 15.02001953125, 15.635009765625, 16.25]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 5.0, 2.0, 7.0, 7.0, 9.0, 14.0, 12.0, 17.0, 26.0, 16.0, 16.0, 35.0, 32.0, 40.0, 59.0, 41.0, 44.0, 48.0, 55.0, 48.0, 54.0, 54.0, 49.0, 46.0, 34.0, 34.0, 29.0, 25.0, 28.0, 19.0, 13.0, 9.0, 19.0, 14.0, 12.0, 9.0, 3.0, 5.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-20.953125, -20.35791015625, -19.7626953125, -19.16748046875, -18.572265625, -17.97705078125, -17.3818359375, -16.78662109375, -16.19140625, -15.59619140625, -15.0009765625, -14.40576171875, -13.810546875, -13.21533203125, -12.6201171875, -12.02490234375, -11.4296875, -10.83447265625, -10.2392578125, -9.64404296875, -9.048828125, -8.45361328125, -7.8583984375, -7.26318359375, -6.66796875, -6.07275390625, -5.4775390625, -4.88232421875, -4.287109375, -3.69189453125, -3.0966796875, -2.50146484375, -1.90625, -1.31103515625, -0.7158203125, -0.12060546875, 0.474609375, 1.06982421875, 1.6650390625, 2.26025390625, 2.85546875, 3.45068359375, 4.0458984375, 4.64111328125, 5.236328125, 5.83154296875, 6.4267578125, 7.02197265625, 7.6171875, 8.21240234375, 8.8076171875, 9.40283203125, 9.998046875, 10.59326171875, 11.1884765625, 11.78369140625, 12.37890625, 12.97412109375, 13.5693359375, 14.16455078125, 14.759765625, 15.35498046875, 15.9501953125, 16.54541015625, 17.140625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 6.0, 13.0, 15.0, 31.0, 47.0, 102.0, 157.0, 387.0, 1104.0, 4111.0, 25962.0, 577799.0, 408842.0, 24124.0, 4038.0, 1042.0, 345.0, 176.0, 94.0, 52.0, 30.0, 21.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.97265625, -7.7510986328125, -7.529541015625, -7.3079833984375, -7.08642578125, -6.8648681640625, -6.643310546875, -6.4217529296875, -6.2001953125, -5.9786376953125, -5.757080078125, -5.5355224609375, -5.31396484375, -5.0924072265625, -4.870849609375, -4.6492919921875, -4.427734375, -4.2061767578125, -3.984619140625, -3.7630615234375, -3.54150390625, -3.3199462890625, -3.098388671875, -2.8768310546875, -2.6552734375, -2.4337158203125, -2.212158203125, -1.9906005859375, -1.76904296875, -1.5474853515625, -1.325927734375, -1.1043701171875, -0.8828125, -0.6612548828125, -0.439697265625, -0.2181396484375, 0.00341796875, 0.2249755859375, 0.446533203125, 0.6680908203125, 0.8896484375, 1.1112060546875, 1.332763671875, 1.5543212890625, 1.77587890625, 1.9974365234375, 2.218994140625, 2.4405517578125, 2.662109375, 2.8836669921875, 3.105224609375, 3.3267822265625, 3.54833984375, 3.7698974609375, 3.991455078125, 4.2130126953125, 4.4345703125, 4.6561279296875, 4.877685546875, 5.0992431640625, 5.32080078125, 5.5423583984375, 5.763916015625, 5.9854736328125, 6.20703125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 8.0, 7.0, 8.0, 15.0, 12.0, 6.0, 25.0, 19.0, 49.0, 85.0, 148.0, 214.0, 131.0, 95.0, 52.0, 26.0, 16.0, 19.0, 11.0, 15.0, 13.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016422271728515625, -0.0015899091958999634, -0.0015375912189483643, -0.0014852732419967651, -0.001432955265045166, -0.001380637288093567, -0.0013283193111419678, -0.0012760013341903687, -0.0012236833572387695, -0.0011713653802871704, -0.0011190474033355713, -0.0010667294263839722, -0.001014411449432373, -0.0009620934724807739, -0.0009097754955291748, -0.0008574575185775757, -0.0008051395416259766, -0.0007528215646743774, -0.0007005035877227783, -0.0006481856107711792, -0.0005958676338195801, -0.000543549656867981, -0.0004912316799163818, -0.0004389137029647827, -0.0003865957260131836, -0.00033427774906158447, -0.00028195977210998535, -0.00022964179515838623, -0.0001773238182067871, -0.000125005841255188, -7.268786430358887e-05, -2.0369887351989746e-05, 3.1948089599609375e-05, 8.42660665512085e-05, 0.00013658404350280762, 0.00018890202045440674, 0.00024121999740600586, 0.000293537974357605, 0.0003458559513092041, 0.0003981739282608032, 0.00045049190521240234, 0.0005028098821640015, 0.0005551278591156006, 0.0006074458360671997, 0.0006597638130187988, 0.000712081789970398, 0.0007643997669219971, 0.0008167177438735962, 0.0008690357208251953, 0.0009213536977767944, 0.0009736716747283936, 0.0010259896516799927, 0.0010783076286315918, 0.001130625605583191, 0.00118294358253479, 0.0012352615594863892, 0.0012875795364379883, 0.0013398975133895874, 0.0013922154903411865, 0.0014445334672927856, 0.0014968514442443848, 0.0015491694211959839, 0.001601487398147583, 0.0016538053750991821, 0.0017061233520507812]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 11.0, 11.0, 17.0, 24.0, 25.0, 37.0, 74.0, 137.0, 219.0, 340.0, 565.0, 1133.0, 2255.0, 5780.0, 21787.0, 149220.0, 725526.0, 113568.0, 18087.0, 5254.0, 2130.0, 953.0, 526.0, 324.0, 177.0, 120.0, 89.0, 55.0, 22.0, 21.0, 20.0, 10.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.3359375, -4.206268310546875, -4.07659912109375, -3.946929931640625, -3.8172607421875, -3.687591552734375, -3.55792236328125, -3.428253173828125, -3.298583984375, -3.168914794921875, -3.03924560546875, -2.909576416015625, -2.7799072265625, -2.650238037109375, -2.52056884765625, -2.390899658203125, -2.26123046875, -2.131561279296875, -2.00189208984375, -1.872222900390625, -1.7425537109375, -1.612884521484375, -1.48321533203125, -1.353546142578125, -1.223876953125, -1.094207763671875, -0.96453857421875, -0.834869384765625, -0.7052001953125, -0.575531005859375, -0.44586181640625, -0.316192626953125, -0.1865234375, -0.056854248046875, 0.07281494140625, 0.202484130859375, 0.3321533203125, 0.461822509765625, 0.59149169921875, 0.721160888671875, 0.850830078125, 0.980499267578125, 1.11016845703125, 1.239837646484375, 1.3695068359375, 1.499176025390625, 1.62884521484375, 1.758514404296875, 1.88818359375, 2.017852783203125, 2.14752197265625, 2.277191162109375, 2.4068603515625, 2.536529541015625, 2.66619873046875, 2.795867919921875, 2.925537109375, 3.055206298828125, 3.18487548828125, 3.314544677734375, 3.4442138671875, 3.573883056640625, 3.70355224609375, 3.833221435546875, 3.962890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 20.0, 14.0, 19.0, 15.0, 26.0, 32.0, 39.0, 66.0, 75.0, 93.0, 99.0, 105.0, 101.0, 79.0, 49.0, 41.0, 44.0, 16.0, 25.0, 13.0, 9.0, 10.0, 4.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.30859375, -6.164459228515625, -6.02032470703125, -5.876190185546875, -5.7320556640625, -5.587921142578125, -5.44378662109375, -5.299652099609375, -5.155517578125, -5.011383056640625, -4.86724853515625, -4.723114013671875, -4.5789794921875, -4.434844970703125, -4.29071044921875, -4.146575927734375, -4.00244140625, -3.858306884765625, -3.71417236328125, -3.570037841796875, -3.4259033203125, -3.281768798828125, -3.13763427734375, -2.993499755859375, -2.849365234375, -2.705230712890625, -2.56109619140625, -2.416961669921875, -2.2728271484375, -2.128692626953125, -1.98455810546875, -1.840423583984375, -1.6962890625, -1.552154541015625, -1.40802001953125, -1.263885498046875, -1.1197509765625, -0.975616455078125, -0.83148193359375, -0.687347412109375, -0.543212890625, -0.399078369140625, -0.25494384765625, -0.110809326171875, 0.0333251953125, 0.177459716796875, 0.32159423828125, 0.465728759765625, 0.60986328125, 0.753997802734375, 0.89813232421875, 1.042266845703125, 1.1864013671875, 1.330535888671875, 1.47467041015625, 1.618804931640625, 1.762939453125, 1.907073974609375, 2.05120849609375, 2.195343017578125, 2.3394775390625, 2.483612060546875, 2.62774658203125, 2.771881103515625, 2.916015625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 8.0, 12.0, 33.0, 68.0, 112.0, 222.0, 189.0, 132.0, 97.0, 48.0, 25.0, 17.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-98.76103210449219, -95.45972442626953, -92.1584243774414, -88.85711669921875, -85.55581665039062, -82.25450897216797, -78.95320129394531, -75.65190124511719, -72.35059356689453, -69.04928588867188, -65.74798583984375, -62.446678161621094, -59.1453742980957, -55.84407043457031, -52.542762756347656, -49.241458892822266, -45.940155029296875, -42.638851165771484, -39.337547302246094, -36.03623962402344, -32.73493576049805, -29.433631896972656, -26.132326126098633, -22.83102035522461, -19.52971649169922, -16.228412628173828, -12.927106857299805, -9.625802040100098, -6.324497222900391, -3.023193359375, 0.27811241149902344, 3.579418182373047, 6.8807220458984375, 10.182026863098145, 13.483331680297852, 16.784637451171875, 20.085941314697266, 23.387245178222656, 26.68855094909668, 29.989856719970703, 33.291160583496094, 36.592464447021484, 39.893768310546875, 43.19507598876953, 46.49637985229492, 49.79768371582031, 53.09899139404297, 56.40029525756836, 59.70159912109375, 63.00290298461914, 66.30420684814453, 69.60551452636719, 72.90681457519531, 76.20812225341797, 79.50942993164062, 82.81072998046875, 86.1120376586914, 89.41334533691406, 92.71464538574219, 96.01595306396484, 99.3172607421875, 102.61856079101562, 105.91986846923828, 109.22117614746094, 112.52247619628906]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 1.0, 4.0, 5.0, 5.0, 6.0, 6.0, 6.0, 10.0, 8.0, 14.0, 16.0, 13.0, 16.0, 14.0, 15.0, 26.0, 26.0, 25.0, 25.0, 23.0, 35.0, 46.0, 58.0, 55.0, 51.0, 66.0, 56.0, 38.0, 26.0, 30.0, 29.0, 38.0, 29.0, 30.0, 25.0, 17.0, 22.0, 15.0, 15.0, 12.0, 6.0, 10.0, 5.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.51411437988281, -65.44088745117188, -63.36766052246094, -61.29443359375, -59.22120666503906, -57.147979736328125, -55.07475280761719, -53.00152587890625, -50.92829895019531, -48.855072021484375, -46.78184509277344, -44.7086181640625, -42.63539123535156, -40.562164306640625, -38.48893737792969, -36.41571044921875, -34.34248352050781, -32.269256591796875, -30.196029663085938, -28.122802734375, -26.049575805664062, -23.976348876953125, -21.903121948242188, -19.82989501953125, -17.756668090820312, -15.683441162109375, -13.610214233398438, -11.5369873046875, -9.463760375976562, -7.390533447265625, -5.3173065185546875, -3.24407958984375, -1.1708526611328125, 0.902374267578125, 2.9756011962890625, 5.048828125, 7.1220550537109375, 9.195281982421875, 11.268508911132812, 13.34173583984375, 15.414962768554688, 17.488189697265625, 19.561416625976562, 21.6346435546875, 23.707870483398438, 25.781097412109375, 27.854324340820312, 29.92755126953125, 32.00077819824219, 34.074005126953125, 36.14723205566406, 38.220458984375, 40.29368591308594, 42.366912841796875, 44.44013977050781, 46.51336669921875, 48.58659362792969, 50.659820556640625, 52.73304748535156, 54.8062744140625, 56.87950134277344, 58.952728271484375, 61.02595520019531, 63.09918212890625, 65.17240905761719]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 6.0, 8.0, 14.0, 27.0, 31.0, 40.0, 71.0, 106.0, 195.0, 358.0, 645.0, 1227.0, 2727.0, 6819.0, 23590.0, 138211.0, 1798961.0, 2024132.0, 157450.0, 26334.0, 7619.0, 2856.0, 1319.0, 637.0, 328.0, 205.0, 132.0, 63.0, 64.0, 26.0, 21.0, 20.0, 13.0, 7.0, 7.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.787353515625, -8.54345703125, -8.299560546875, -8.0556640625, -7.811767578125, -7.56787109375, -7.323974609375, -7.080078125, -6.836181640625, -6.59228515625, -6.348388671875, -6.1044921875, -5.860595703125, -5.61669921875, -5.372802734375, -5.12890625, -4.885009765625, -4.64111328125, -4.397216796875, -4.1533203125, -3.909423828125, -3.66552734375, -3.421630859375, -3.177734375, -2.933837890625, -2.68994140625, -2.446044921875, -2.2021484375, -1.958251953125, -1.71435546875, -1.470458984375, -1.2265625, -0.982666015625, -0.73876953125, -0.494873046875, -0.2509765625, -0.007080078125, 0.23681640625, 0.480712890625, 0.724609375, 0.968505859375, 1.21240234375, 1.456298828125, 1.7001953125, 1.944091796875, 2.18798828125, 2.431884765625, 2.67578125, 2.919677734375, 3.16357421875, 3.407470703125, 3.6513671875, 3.895263671875, 4.13916015625, 4.383056640625, 4.626953125, 4.870849609375, 5.11474609375, 5.358642578125, 5.6025390625, 5.846435546875, 6.09033203125, 6.334228515625, 6.578125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 4.0, 10.0, 20.0, 25.0, 22.0, 28.0, 34.0, 41.0, 53.0, 66.0, 68.0, 57.0, 51.0, 48.0, 70.0, 57.0, 53.0, 49.0, 48.0, 36.0, 29.0, 32.0, 20.0, 17.0, 11.0, 8.0, 2.0, 8.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.1953125, -7.01568603515625, -6.8360595703125, -6.65643310546875, -6.476806640625, -6.29718017578125, -6.1175537109375, -5.93792724609375, -5.75830078125, -5.57867431640625, -5.3990478515625, -5.21942138671875, -5.039794921875, -4.86016845703125, -4.6805419921875, -4.50091552734375, -4.3212890625, -4.14166259765625, -3.9620361328125, -3.78240966796875, -3.602783203125, -3.42315673828125, -3.2435302734375, -3.06390380859375, -2.88427734375, -2.70465087890625, -2.5250244140625, -2.34539794921875, -2.165771484375, -1.98614501953125, -1.8065185546875, -1.62689208984375, -1.447265625, -1.26763916015625, -1.0880126953125, -0.90838623046875, -0.728759765625, -0.54913330078125, -0.3695068359375, -0.18988037109375, -0.01025390625, 0.16937255859375, 0.3489990234375, 0.52862548828125, 0.708251953125, 0.88787841796875, 1.0675048828125, 1.24713134765625, 1.4267578125, 1.60638427734375, 1.7860107421875, 1.96563720703125, 2.145263671875, 2.32489013671875, 2.5045166015625, 2.68414306640625, 2.86376953125, 3.04339599609375, 3.2230224609375, 3.40264892578125, 3.582275390625, 3.76190185546875, 3.9415283203125, 4.12115478515625, 4.30078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 7.0, 7.0, 17.0, 19.0, 32.0, 43.0, 85.0, 126.0, 275.0, 503.0, 1130.0, 2900.0, 9126.0, 38600.0, 344807.0, 3455870.0, 290781.0, 36352.0, 8676.0, 2741.0, 1061.0, 486.0, 235.0, 136.0, 99.0, 46.0, 32.0, 32.0, 19.0, 12.0, 6.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.0546875, -10.7142333984375, -10.373779296875, -10.0333251953125, -9.69287109375, -9.3524169921875, -9.011962890625, -8.6715087890625, -8.3310546875, -7.9906005859375, -7.650146484375, -7.3096923828125, -6.96923828125, -6.6287841796875, -6.288330078125, -5.9478759765625, -5.607421875, -5.2669677734375, -4.926513671875, -4.5860595703125, -4.24560546875, -3.9051513671875, -3.564697265625, -3.2242431640625, -2.8837890625, -2.5433349609375, -2.202880859375, -1.8624267578125, -1.52197265625, -1.1815185546875, -0.841064453125, -0.5006103515625, -0.16015625, 0.1802978515625, 0.520751953125, 0.8612060546875, 1.20166015625, 1.5421142578125, 1.882568359375, 2.2230224609375, 2.5634765625, 2.9039306640625, 3.244384765625, 3.5848388671875, 3.92529296875, 4.2657470703125, 4.606201171875, 4.9466552734375, 5.287109375, 5.6275634765625, 5.968017578125, 6.3084716796875, 6.64892578125, 6.9893798828125, 7.329833984375, 7.6702880859375, 8.0107421875, 8.3511962890625, 8.691650390625, 9.0321044921875, 9.37255859375, 9.7130126953125, 10.053466796875, 10.3939208984375, 10.734375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 9.0, 9.0, 12.0, 16.0, 18.0, 29.0, 41.0, 58.0, 105.0, 146.0, 242.0, 396.0, 622.0, 718.0, 614.0, 379.0, 192.0, 136.0, 104.0, 49.0, 41.0, 32.0, 27.0, 12.0, 17.0, 10.0, 9.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.2027587890625, -8.889892578125, -8.5770263671875, -8.26416015625, -7.9512939453125, -7.638427734375, -7.3255615234375, -7.0126953125, -6.6998291015625, -6.386962890625, -6.0740966796875, -5.76123046875, -5.4483642578125, -5.135498046875, -4.8226318359375, -4.509765625, -4.1968994140625, -3.884033203125, -3.5711669921875, -3.25830078125, -2.9454345703125, -2.632568359375, -2.3197021484375, -2.0068359375, -1.6939697265625, -1.381103515625, -1.0682373046875, -0.75537109375, -0.4425048828125, -0.129638671875, 0.1832275390625, 0.49609375, 0.8089599609375, 1.121826171875, 1.4346923828125, 1.74755859375, 2.0604248046875, 2.373291015625, 2.6861572265625, 2.9990234375, 3.3118896484375, 3.624755859375, 3.9376220703125, 4.25048828125, 4.5633544921875, 4.876220703125, 5.1890869140625, 5.501953125, 5.8148193359375, 6.127685546875, 6.4405517578125, 6.75341796875, 7.0662841796875, 7.379150390625, 7.6920166015625, 8.0048828125, 8.3177490234375, 8.630615234375, 8.9434814453125, 9.25634765625, 9.5692138671875, 9.882080078125, 10.1949462890625, 10.5078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 9.0, 16.0, 60.0, 160.0, 261.0, 263.0, 130.0, 52.0, 22.0, 10.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-65.722900390625, -61.28992462158203, -56.85694885253906, -52.423973083496094, -47.990997314453125, -43.558021545410156, -39.12504577636719, -34.69207000732422, -30.25909423828125, -25.82611846923828, -21.393142700195312, -16.960166931152344, -12.527191162109375, -8.094215393066406, -3.6612396240234375, 0.7717361450195312, 5.2047119140625, 9.637687683105469, 14.070663452148438, 18.503639221191406, 22.936614990234375, 27.369590759277344, 31.802566528320312, 36.23554229736328, 40.66851806640625, 45.10149383544922, 49.53446960449219, 53.967445373535156, 58.400421142578125, 62.833396911621094, 67.26637268066406, 71.69934844970703, 76.13230895996094, 80.5652847290039, 84.99826049804688, 89.43123626708984, 93.86421203613281, 98.29718780517578, 102.73016357421875, 107.16313934326172, 111.59611511230469, 116.02909088134766, 120.46206665039062, 124.8950424194336, 129.32801818847656, 133.760986328125, 138.1939697265625, 142.626953125, 147.05992126464844, 151.49288940429688, 155.92587280273438, 160.35885620117188, 164.7918243408203, 169.22479248046875, 173.65777587890625, 178.09075927734375, 182.5237274169922, 186.95669555664062, 191.38967895507812, 195.82266235351562, 200.25563049316406, 204.6885986328125, 209.12158203125, 213.5545654296875, 217.98753356933594]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 5.0, 15.0, 15.0, 18.0, 20.0, 23.0, 37.0, 31.0, 34.0, 38.0, 39.0, 43.0, 65.0, 60.0, 57.0, 61.0, 42.0, 51.0, 46.0, 42.0, 43.0, 30.0, 41.0, 21.0, 23.0, 11.0, 17.0, 20.0, 7.0, 7.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.74586868286133, -44.099727630615234, -42.453590393066406, -40.80744934082031, -39.16130828857422, -37.515167236328125, -35.86902618408203, -34.2228889465332, -32.57674789428711, -30.930606842041016, -29.284467697143555, -27.638328552246094, -25.9921875, -24.346046447753906, -22.699907302856445, -21.053768157958984, -19.40762710571289, -17.761486053466797, -16.115346908569336, -14.469206809997559, -12.823066711425781, -11.176926612854004, -9.530786514282227, -7.884646415710449, -6.238506317138672, -4.5923662185668945, -2.946226119995117, -1.3000860214233398, 0.3460540771484375, 1.9921941757202148, 3.638334274291992, 5.2844743728637695, 6.930610656738281, 8.576750755310059, 10.222890853881836, 11.869030952453613, 13.51517105102539, 15.161311149597168, 16.807451248168945, 18.453590393066406, 20.0997314453125, 21.745872497558594, 23.392011642456055, 25.038150787353516, 26.68429183959961, 28.330432891845703, 29.976572036743164, 31.622711181640625, 33.26885223388672, 34.91499328613281, 36.561134338378906, 38.207271575927734, 39.85341262817383, 41.49955368041992, 43.14569091796875, 44.791831970214844, 46.43797302246094, 48.08411407470703, 49.730255126953125, 51.37639236450195, 53.02253341674805, 54.66867446899414, 56.31481170654297, 57.96095275878906, 59.607093811035156]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 11.0, 9.0, 8.0, 16.0, 24.0, 40.0, 63.0, 84.0, 150.0, 214.0, 327.0, 593.0, 954.0, 1688.0, 2953.0, 5645.0, 11645.0, 25221.0, 59222.0, 142403.0, 285404.0, 276035.0, 133666.0, 55431.0, 23564.0, 10886.0, 5419.0, 2860.0, 1609.0, 953.0, 544.0, 351.0, 209.0, 130.0, 77.0, 55.0, 33.0, 22.0, 19.0, 6.0, 9.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.95947265625, -4.7939453125, -4.62841796875, -4.462890625, -4.29736328125, -4.1318359375, -3.96630859375, -3.80078125, -3.63525390625, -3.4697265625, -3.30419921875, -3.138671875, -2.97314453125, -2.8076171875, -2.64208984375, -2.4765625, -2.31103515625, -2.1455078125, -1.97998046875, -1.814453125, -1.64892578125, -1.4833984375, -1.31787109375, -1.15234375, -0.98681640625, -0.8212890625, -0.65576171875, -0.490234375, -0.32470703125, -0.1591796875, 0.00634765625, 0.171875, 0.33740234375, 0.5029296875, 0.66845703125, 0.833984375, 0.99951171875, 1.1650390625, 1.33056640625, 1.49609375, 1.66162109375, 1.8271484375, 1.99267578125, 2.158203125, 2.32373046875, 2.4892578125, 2.65478515625, 2.8203125, 2.98583984375, 3.1513671875, 3.31689453125, 3.482421875, 3.64794921875, 3.8134765625, 3.97900390625, 4.14453125, 4.31005859375, 4.4755859375, 4.64111328125, 4.806640625, 4.97216796875, 5.1376953125, 5.30322265625, 5.46875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 8.0, 8.0, 9.0, 10.0, 16.0, 15.0, 25.0, 25.0, 32.0, 49.0, 40.0, 44.0, 63.0, 62.0, 48.0, 67.0, 55.0, 53.0, 53.0, 52.0, 58.0, 49.0, 28.0, 30.0, 29.0, 15.0, 15.0, 12.0, 11.0, 6.0, 6.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.10546875, -6.9261474609375, -6.746826171875, -6.5675048828125, -6.38818359375, -6.2088623046875, -6.029541015625, -5.8502197265625, -5.6708984375, -5.4915771484375, -5.312255859375, -5.1329345703125, -4.95361328125, -4.7742919921875, -4.594970703125, -4.4156494140625, -4.236328125, -4.0570068359375, -3.877685546875, -3.6983642578125, -3.51904296875, -3.3397216796875, -3.160400390625, -2.9810791015625, -2.8017578125, -2.6224365234375, -2.443115234375, -2.2637939453125, -2.08447265625, -1.9051513671875, -1.725830078125, -1.5465087890625, -1.3671875, -1.1878662109375, -1.008544921875, -0.8292236328125, -0.64990234375, -0.4705810546875, -0.291259765625, -0.1119384765625, 0.0673828125, 0.2467041015625, 0.426025390625, 0.6053466796875, 0.78466796875, 0.9639892578125, 1.143310546875, 1.3226318359375, 1.501953125, 1.6812744140625, 1.860595703125, 2.0399169921875, 2.21923828125, 2.3985595703125, 2.577880859375, 2.7572021484375, 2.9365234375, 3.1158447265625, 3.295166015625, 3.4744873046875, 3.65380859375, 3.8331298828125, 4.012451171875, 4.1917724609375, 4.37109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 6.0, 9.0, 6.0, 15.0, 20.0, 39.0, 41.0, 67.0, 106.0, 216.0, 440.0, 1173.0, 3589.0, 15378.0, 101135.0, 717294.0, 177574.0, 23611.0, 5104.0, 1500.0, 591.0, 253.0, 128.0, 74.0, 49.0, 40.0, 29.0, 24.0, 14.0, 9.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.7991943359375, -14.371826171875, -13.9444580078125, -13.51708984375, -13.0897216796875, -12.662353515625, -12.2349853515625, -11.8076171875, -11.3802490234375, -10.952880859375, -10.5255126953125, -10.09814453125, -9.6707763671875, -9.243408203125, -8.8160400390625, -8.388671875, -7.9613037109375, -7.533935546875, -7.1065673828125, -6.67919921875, -6.2518310546875, -5.824462890625, -5.3970947265625, -4.9697265625, -4.5423583984375, -4.114990234375, -3.6876220703125, -3.26025390625, -2.8328857421875, -2.405517578125, -1.9781494140625, -1.55078125, -1.1234130859375, -0.696044921875, -0.2686767578125, 0.15869140625, 0.5860595703125, 1.013427734375, 1.4407958984375, 1.8681640625, 2.2955322265625, 2.722900390625, 3.1502685546875, 3.57763671875, 4.0050048828125, 4.432373046875, 4.8597412109375, 5.287109375, 5.7144775390625, 6.141845703125, 6.5692138671875, 6.99658203125, 7.4239501953125, 7.851318359375, 8.2786865234375, 8.7060546875, 9.1334228515625, 9.560791015625, 9.9881591796875, 10.41552734375, 10.8428955078125, 11.270263671875, 11.6976318359375, 12.125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 11.0, 9.0, 16.0, 20.0, 13.0, 27.0, 32.0, 38.0, 35.0, 43.0, 69.0, 57.0, 60.0, 75.0, 63.0, 71.0, 56.0, 50.0, 41.0, 34.0, 47.0, 40.0, 28.0, 19.0, 10.0, 9.0, 4.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.03125, -22.3662109375, -21.701171875, -21.0361328125, -20.37109375, -19.7060546875, -19.041015625, -18.3759765625, -17.7109375, -17.0458984375, -16.380859375, -15.7158203125, -15.05078125, -14.3857421875, -13.720703125, -13.0556640625, -12.390625, -11.7255859375, -11.060546875, -10.3955078125, -9.73046875, -9.0654296875, -8.400390625, -7.7353515625, -7.0703125, -6.4052734375, -5.740234375, -5.0751953125, -4.41015625, -3.7451171875, -3.080078125, -2.4150390625, -1.75, -1.0849609375, -0.419921875, 0.2451171875, 0.91015625, 1.5751953125, 2.240234375, 2.9052734375, 3.5703125, 4.2353515625, 4.900390625, 5.5654296875, 6.23046875, 6.8955078125, 7.560546875, 8.2255859375, 8.890625, 9.5556640625, 10.220703125, 10.8857421875, 11.55078125, 12.2158203125, 12.880859375, 13.5458984375, 14.2109375, 14.8759765625, 15.541015625, 16.2060546875, 16.87109375, 17.5361328125, 18.201171875, 18.8662109375, 19.53125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 8.0, 7.0, 10.0, 5.0, 10.0, 29.0, 31.0, 30.0, 54.0, 63.0, 120.0, 229.0, 432.0, 938.0, 2620.0, 8991.0, 39418.0, 246164.0, 642108.0, 83605.0, 16438.0, 4337.0, 1499.0, 645.0, 292.0, 170.0, 107.0, 73.0, 37.0, 28.0, 11.0, 15.0, 8.0, 3.0, 5.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.154296875, -3.06719970703125, -2.9801025390625, -2.89300537109375, -2.805908203125, -2.71881103515625, -2.6317138671875, -2.54461669921875, -2.45751953125, -2.37042236328125, -2.2833251953125, -2.19622802734375, -2.109130859375, -2.02203369140625, -1.9349365234375, -1.84783935546875, -1.7607421875, -1.67364501953125, -1.5865478515625, -1.49945068359375, -1.412353515625, -1.32525634765625, -1.2381591796875, -1.15106201171875, -1.06396484375, -0.97686767578125, -0.8897705078125, -0.80267333984375, -0.715576171875, -0.62847900390625, -0.5413818359375, -0.45428466796875, -0.3671875, -0.28009033203125, -0.1929931640625, -0.10589599609375, -0.018798828125, 0.06829833984375, 0.1553955078125, 0.24249267578125, 0.32958984375, 0.41668701171875, 0.5037841796875, 0.59088134765625, 0.677978515625, 0.76507568359375, 0.8521728515625, 0.93927001953125, 1.0263671875, 1.11346435546875, 1.2005615234375, 1.28765869140625, 1.374755859375, 1.46185302734375, 1.5489501953125, 1.63604736328125, 1.72314453125, 1.81024169921875, 1.8973388671875, 1.98443603515625, 2.071533203125, 2.15863037109375, 2.2457275390625, 2.33282470703125, 2.419921875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 6.0, 6.0, 2.0, 13.0, 16.0, 20.0, 42.0, 85.0, 122.0, 173.0, 185.0, 128.0, 73.0, 41.0, 29.0, 15.0, 16.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001033782958984375, -0.001005902886390686, -0.000978022813796997, -0.0009501427412033081, -0.0009222626686096191, -0.0008943825960159302, -0.0008665025234222412, -0.0008386224508285522, -0.0008107423782348633, -0.0007828623056411743, -0.0007549822330474854, -0.0007271021604537964, -0.0006992220878601074, -0.0006713420152664185, -0.0006434619426727295, -0.0006155818700790405, -0.0005877017974853516, -0.0005598217248916626, -0.0005319416522979736, -0.0005040615797042847, -0.0004761815071105957, -0.00044830143451690674, -0.0004204213619232178, -0.0003925412893295288, -0.00036466121673583984, -0.0003367811441421509, -0.0003089010715484619, -0.00028102099895477295, -0.000253140926361084, -0.00022526085376739502, -0.00019738078117370605, -0.0001695007085800171, -0.00014162063598632812, -0.00011374056339263916, -8.58604907989502e-05, -5.798041820526123e-05, -3.0100345611572266e-05, -2.2202730178833008e-06, 2.5659799575805664e-05, 5.353987216949463e-05, 8.14199447631836e-05, 0.00010930001735687256, 0.00013718008995056152, 0.0001650601625442505, 0.00019294023513793945, 0.00022082030773162842, 0.0002487003803253174, 0.00027658045291900635, 0.0003044605255126953, 0.0003323405981063843, 0.00036022067070007324, 0.0003881007432937622, 0.00041598081588745117, 0.00044386088848114014, 0.0004717409610748291, 0.0004996210336685181, 0.000527501106262207, 0.000555381178855896, 0.000583261251449585, 0.0006111413240432739, 0.0006390213966369629, 0.0006669014692306519, 0.0006947815418243408, 0.0007226616144180298, 0.0007505416870117188]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 6.0, 3.0, 3.0, 8.0, 4.0, 8.0, 16.0, 24.0, 49.0, 55.0, 88.0, 148.0, 283.0, 481.0, 1064.0, 2813.0, 9446.0, 50285.0, 568875.0, 358563.0, 43094.0, 8525.0, 2622.0, 1048.0, 473.0, 222.0, 117.0, 74.0, 44.0, 33.0, 20.0, 18.0, 16.0, 10.0, 6.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41796875, -2.307861328125, -2.19775390625, -2.087646484375, -1.9775390625, -1.867431640625, -1.75732421875, -1.647216796875, -1.537109375, -1.427001953125, -1.31689453125, -1.206787109375, -1.0966796875, -0.986572265625, -0.87646484375, -0.766357421875, -0.65625, -0.546142578125, -0.43603515625, -0.325927734375, -0.2158203125, -0.105712890625, 0.00439453125, 0.114501953125, 0.224609375, 0.334716796875, 0.44482421875, 0.554931640625, 0.6650390625, 0.775146484375, 0.88525390625, 0.995361328125, 1.10546875, 1.215576171875, 1.32568359375, 1.435791015625, 1.5458984375, 1.656005859375, 1.76611328125, 1.876220703125, 1.986328125, 2.096435546875, 2.20654296875, 2.316650390625, 2.4267578125, 2.536865234375, 2.64697265625, 2.757080078125, 2.8671875, 2.977294921875, 3.08740234375, 3.197509765625, 3.3076171875, 3.417724609375, 3.52783203125, 3.637939453125, 3.748046875, 3.858154296875, 3.96826171875, 4.078369140625, 4.1884765625, 4.298583984375, 4.40869140625, 4.518798828125, 4.62890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 14.0, 22.0, 43.0, 43.0, 62.0, 87.0, 106.0, 105.0, 102.0, 106.0, 94.0, 67.0, 50.0, 22.0, 22.0, 14.0, 7.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.716796875, -3.60052490234375, -3.4842529296875, -3.36798095703125, -3.251708984375, -3.13543701171875, -3.0191650390625, -2.90289306640625, -2.78662109375, -2.67034912109375, -2.5540771484375, -2.43780517578125, -2.321533203125, -2.20526123046875, -2.0889892578125, -1.97271728515625, -1.8564453125, -1.74017333984375, -1.6239013671875, -1.50762939453125, -1.391357421875, -1.27508544921875, -1.1588134765625, -1.04254150390625, -0.92626953125, -0.80999755859375, -0.6937255859375, -0.57745361328125, -0.461181640625, -0.34490966796875, -0.2286376953125, -0.11236572265625, 0.00390625, 0.12017822265625, 0.2364501953125, 0.35272216796875, 0.468994140625, 0.58526611328125, 0.7015380859375, 0.81781005859375, 0.93408203125, 1.05035400390625, 1.1666259765625, 1.28289794921875, 1.399169921875, 1.51544189453125, 1.6317138671875, 1.74798583984375, 1.8642578125, 1.98052978515625, 2.0968017578125, 2.21307373046875, 2.329345703125, 2.44561767578125, 2.5618896484375, 2.67816162109375, 2.79443359375, 2.91070556640625, 3.0269775390625, 3.14324951171875, 3.259521484375, 3.37579345703125, 3.4920654296875, 3.60833740234375, 3.724609375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 15.0, 9.0, 26.0, 54.0, 93.0, 171.0, 279.0, 156.0, 87.0, 52.0, 19.0, 11.0, 6.0, 3.0, 4.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.44622039794922, -82.81043243408203, -80.17463684082031, -77.53884887695312, -74.90306091308594, -72.26727294921875, -69.63148498535156, -66.99568939208984, -64.35990142822266, -61.72411346435547, -59.088321685791016, -56.45252990722656, -53.816741943359375, -51.18095397949219, -48.545162200927734, -45.90937042236328, -43.273582458496094, -40.637794494628906, -38.00200271606445, -35.3662109375, -32.73042297363281, -30.094633102416992, -27.458843231201172, -24.82305335998535, -22.18726348876953, -19.55147361755371, -16.91568374633789, -14.27989387512207, -11.64410400390625, -9.00831413269043, -6.372524261474609, -3.736734390258789, -1.1009521484375, 1.5348377227783203, 4.170627593994141, 6.806417465209961, 9.442207336425781, 12.077997207641602, 14.713787078857422, 17.349576950073242, 19.985366821289062, 22.621156692504883, 25.256946563720703, 27.892736434936523, 30.528526306152344, 33.16431427001953, 35.800106048583984, 38.43589782714844, 41.071685791015625, 43.70747375488281, 46.343265533447266, 48.97905731201172, 51.614845275878906, 54.250633239746094, 56.88642501831055, 59.522216796875, 62.15800476074219, 64.79379272460938, 67.42958068847656, 70.06537628173828, 72.70116424560547, 75.33695220947266, 77.97274780273438, 80.60853576660156, 83.24432373046875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 2.0, 8.0, 9.0, 3.0, 8.0, 7.0, 12.0, 5.0, 11.0, 13.0, 4.0, 22.0, 13.0, 12.0, 24.0, 24.0, 22.0, 29.0, 23.0, 46.0, 44.0, 49.0, 60.0, 86.0, 72.0, 51.0, 34.0, 34.0, 31.0, 17.0, 16.0, 24.0, 25.0, 14.0, 20.0, 17.0, 15.0, 11.0, 12.0, 13.0, 8.0, 8.0, 8.0, 6.0, 4.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-48.299293518066406, -46.72604751586914, -45.15279769897461, -43.579551696777344, -42.00630569458008, -40.43305969238281, -38.85980987548828, -37.286563873291016, -35.71331787109375, -34.140071868896484, -32.56682205200195, -30.993576049804688, -29.420330047607422, -27.847082138061523, -26.273834228515625, -24.70058822631836, -23.127338409423828, -21.55409049987793, -19.980844497680664, -18.407596588134766, -16.8343505859375, -15.261102676391602, -13.687854766845703, -12.114607810974121, -10.541360855102539, -8.968113899230957, -7.394866466522217, -5.821619033813477, -4.2483720779418945, -2.6751251220703125, -1.101877212524414, 0.47136974334716797, 2.0446128845214844, 3.6178600788116455, 5.191107273101807, 6.764354705810547, 8.337601661682129, 9.910848617553711, 11.48409652709961, 13.057343482971191, 14.630590438842773, 16.203838348388672, 17.777084350585938, 19.350332260131836, 20.923580169677734, 22.496826171875, 24.0700740814209, 25.643321990966797, 27.216567993164062, 28.78981590270996, 30.363061904907227, 31.936309814453125, 33.50955581665039, 35.082801818847656, 36.65605163574219, 38.22929763793945, 39.80254364013672, 41.375789642333984, 42.949039459228516, 44.52228546142578, 46.09553146362305, 47.66877746582031, 49.242027282714844, 50.81527328491211, 52.38852310180664]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 5.0, 12.0, 6.0, 11.0, 17.0, 29.0, 34.0, 48.0, 77.0, 115.0, 168.0, 258.0, 457.0, 812.0, 1566.0, 3260.0, 7604.0, 21498.0, 76368.0, 352798.0, 1626213.0, 1629429.0, 359075.0, 76669.0, 22215.0, 8296.0, 3522.0, 1717.0, 813.0, 447.0, 260.0, 163.0, 92.0, 70.0, 50.0, 33.0, 28.0, 14.0, 13.0, 4.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.71484375, -4.583892822265625, -4.45294189453125, -4.321990966796875, -4.1910400390625, -4.060089111328125, -3.92913818359375, -3.798187255859375, -3.667236328125, -3.536285400390625, -3.40533447265625, -3.274383544921875, -3.1434326171875, -3.012481689453125, -2.88153076171875, -2.750579833984375, -2.61962890625, -2.488677978515625, -2.35772705078125, -2.226776123046875, -2.0958251953125, -1.964874267578125, -1.83392333984375, -1.702972412109375, -1.572021484375, -1.441070556640625, -1.31011962890625, -1.179168701171875, -1.0482177734375, -0.917266845703125, -0.78631591796875, -0.655364990234375, -0.5244140625, -0.393463134765625, -0.26251220703125, -0.131561279296875, -0.0006103515625, 0.130340576171875, 0.26129150390625, 0.392242431640625, 0.523193359375, 0.654144287109375, 0.78509521484375, 0.916046142578125, 1.0469970703125, 1.177947998046875, 1.30889892578125, 1.439849853515625, 1.57080078125, 1.701751708984375, 1.83270263671875, 1.963653564453125, 2.0946044921875, 2.225555419921875, 2.35650634765625, 2.487457275390625, 2.618408203125, 2.749359130859375, 2.88031005859375, 3.011260986328125, 3.1422119140625, 3.273162841796875, 3.40411376953125, 3.535064697265625, 3.666015625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 6.0, 12.0, 10.0, 18.0, 19.0, 21.0, 39.0, 35.0, 41.0, 47.0, 65.0, 54.0, 52.0, 67.0, 68.0, 62.0, 64.0, 53.0, 44.0, 56.0, 26.0, 23.0, 21.0, 25.0, 13.0, 13.0, 7.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.875, -6.697998046875, -6.52099609375, -6.343994140625, -6.1669921875, -5.989990234375, -5.81298828125, -5.635986328125, -5.458984375, -5.281982421875, -5.10498046875, -4.927978515625, -4.7509765625, -4.573974609375, -4.39697265625, -4.219970703125, -4.04296875, -3.865966796875, -3.68896484375, -3.511962890625, -3.3349609375, -3.157958984375, -2.98095703125, -2.803955078125, -2.626953125, -2.449951171875, -2.27294921875, -2.095947265625, -1.9189453125, -1.741943359375, -1.56494140625, -1.387939453125, -1.2109375, -1.033935546875, -0.85693359375, -0.679931640625, -0.5029296875, -0.325927734375, -0.14892578125, 0.028076171875, 0.205078125, 0.382080078125, 0.55908203125, 0.736083984375, 0.9130859375, 1.090087890625, 1.26708984375, 1.444091796875, 1.62109375, 1.798095703125, 1.97509765625, 2.152099609375, 2.3291015625, 2.506103515625, 2.68310546875, 2.860107421875, 3.037109375, 3.214111328125, 3.39111328125, 3.568115234375, 3.7451171875, 3.922119140625, 4.09912109375, 4.276123046875, 4.453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 6.0, 3.0, 6.0, 12.0, 13.0, 13.0, 8.0, 22.0, 38.0, 50.0, 80.0, 128.0, 267.0, 704.0, 2155.0, 8679.0, 55559.0, 1525105.0, 2508072.0, 77807.0, 11260.0, 2674.0, 885.0, 322.0, 151.0, 80.0, 48.0, 41.0, 29.0, 10.0, 17.0, 9.0, 8.0, 10.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.6015625, -10.2904052734375, -9.979248046875, -9.6680908203125, -9.35693359375, -9.0457763671875, -8.734619140625, -8.4234619140625, -8.1123046875, -7.8011474609375, -7.489990234375, -7.1788330078125, -6.86767578125, -6.5565185546875, -6.245361328125, -5.9342041015625, -5.623046875, -5.3118896484375, -5.000732421875, -4.6895751953125, -4.37841796875, -4.0672607421875, -3.756103515625, -3.4449462890625, -3.1337890625, -2.8226318359375, -2.511474609375, -2.2003173828125, -1.88916015625, -1.5780029296875, -1.266845703125, -0.9556884765625, -0.64453125, -0.3333740234375, -0.022216796875, 0.2889404296875, 0.60009765625, 0.9112548828125, 1.222412109375, 1.5335693359375, 1.8447265625, 2.1558837890625, 2.467041015625, 2.7781982421875, 3.08935546875, 3.4005126953125, 3.711669921875, 4.0228271484375, 4.333984375, 4.6451416015625, 4.956298828125, 5.2674560546875, 5.57861328125, 5.8897705078125, 6.200927734375, 6.5120849609375, 6.8232421875, 7.1343994140625, 7.445556640625, 7.7567138671875, 8.06787109375, 8.3790283203125, 8.690185546875, 9.0013427734375, 9.3125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 14.0, 3.0, 16.0, 27.0, 24.0, 36.0, 74.0, 103.0, 164.0, 259.0, 369.0, 539.0, 631.0, 541.0, 400.0, 267.0, 181.0, 120.0, 72.0, 52.0, 37.0, 38.0, 16.0, 15.0, 18.0, 3.0, 6.0, 10.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44921875, -6.2244873046875, -5.999755859375, -5.7750244140625, -5.55029296875, -5.3255615234375, -5.100830078125, -4.8760986328125, -4.6513671875, -4.4266357421875, -4.201904296875, -3.9771728515625, -3.75244140625, -3.5277099609375, -3.302978515625, -3.0782470703125, -2.853515625, -2.6287841796875, -2.404052734375, -2.1793212890625, -1.95458984375, -1.7298583984375, -1.505126953125, -1.2803955078125, -1.0556640625, -0.8309326171875, -0.606201171875, -0.3814697265625, -0.15673828125, 0.0679931640625, 0.292724609375, 0.5174560546875, 0.7421875, 0.9669189453125, 1.191650390625, 1.4163818359375, 1.64111328125, 1.8658447265625, 2.090576171875, 2.3153076171875, 2.5400390625, 2.7647705078125, 2.989501953125, 3.2142333984375, 3.43896484375, 3.6636962890625, 3.888427734375, 4.1131591796875, 4.337890625, 4.5626220703125, 4.787353515625, 5.0120849609375, 5.23681640625, 5.4615478515625, 5.686279296875, 5.9110107421875, 6.1357421875, 6.3604736328125, 6.585205078125, 6.8099365234375, 7.03466796875, 7.2593994140625, 7.484130859375, 7.7088623046875, 7.93359375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 8.0, 10.0, 50.0, 146.0, 270.0, 279.0, 156.0, 48.0, 22.0, 11.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.215763092041016, -32.5795783996582, -28.94339370727539, -25.307209014892578, -21.671024322509766, -18.034841537475586, -14.398656845092773, -10.762472152709961, -7.126287460327148, -3.490103006362915, 0.14608144760131836, 3.7822656631469727, 7.418450355529785, 11.054634094238281, 14.690818786621094, 18.327003479003906, 21.96318817138672, 25.59937286376953, 29.235557556152344, 32.871742248535156, 36.50792694091797, 40.14411163330078, 43.780296325683594, 47.416481018066406, 51.05266571044922, 54.68885040283203, 58.325035095214844, 61.961219787597656, 65.59740447998047, 69.23358917236328, 72.8697738647461, 76.5059585571289, 80.14214324951172, 83.77832794189453, 87.41451263427734, 91.05069732666016, 94.68688201904297, 98.32306671142578, 101.9592514038086, 105.5954360961914, 109.23162078857422, 112.86780548095703, 116.50399017333984, 120.14017486572266, 123.77635955810547, 127.41254425048828, 131.04872131347656, 134.68490600585938, 138.3210906982422, 141.957275390625, 145.5934600830078, 149.22964477539062, 152.86582946777344, 156.50201416015625, 160.13819885253906, 163.77438354492188, 167.4105682373047, 171.0467529296875, 174.6829376220703, 178.31912231445312, 181.95530700683594, 185.59149169921875, 189.22767639160156, 192.86386108398438, 196.5000457763672]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 4.0, 15.0, 7.0, 8.0, 7.0, 11.0, 22.0, 17.0, 25.0, 20.0, 24.0, 24.0, 26.0, 24.0, 34.0, 30.0, 53.0, 33.0, 52.0, 44.0, 48.0, 46.0, 48.0, 53.0, 39.0, 45.0, 38.0, 29.0, 30.0, 25.0, 20.0, 16.0, 18.0, 13.0, 11.0, 8.0, 6.0, 3.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.613895416259766, -28.661489486694336, -27.709083557128906, -26.75667953491211, -25.80427360534668, -24.85186767578125, -23.899463653564453, -22.947057723999023, -21.994651794433594, -21.042245864868164, -20.089839935302734, -19.137435913085938, -18.185029983520508, -17.232624053955078, -16.28022003173828, -15.327814102172852, -14.375408172607422, -13.423002243041992, -12.470597267150879, -11.518192291259766, -10.565786361694336, -9.613380432128906, -8.660975456237793, -7.7085700035095215, -6.75616455078125, -5.8037590980529785, -4.851353645324707, -3.8989481925964355, -2.946542739868164, -1.9941372871398926, -1.041731834411621, -0.08932638168334961, 0.8630809783935547, 1.8154864311218262, 2.7678918838500977, 3.720297336578369, 4.672702789306641, 5.625108242034912, 6.577513694763184, 7.529919147491455, 8.482324600219727, 9.434730529785156, 10.38713550567627, 11.339540481567383, 12.291946411132812, 13.244352340698242, 14.196757316589355, 15.149162292480469, 16.1015682220459, 17.053974151611328, 18.006378173828125, 18.958784103393555, 19.911190032958984, 20.863595962524414, 21.816001892089844, 22.76840591430664, 23.72081184387207, 24.6732177734375, 25.625621795654297, 26.578027725219727, 27.530433654785156, 28.482839584350586, 29.435245513916016, 30.387649536132812, 31.340055465698242]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 8.0, 10.0, 24.0, 20.0, 28.0, 54.0, 84.0, 142.0, 228.0, 341.0, 553.0, 861.0, 1557.0, 2780.0, 5367.0, 11109.0, 23423.0, 53292.0, 126176.0, 279616.0, 295314.0, 139037.0, 58182.0, 25618.0, 11644.0, 5863.0, 3100.0, 1696.0, 905.0, 556.0, 345.0, 203.0, 141.0, 87.0, 50.0, 38.0, 28.0, 20.0, 11.0, 9.0, 10.0, 5.0, 2.0, 1.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.7890625, -4.6396484375, -4.490234375, -4.3408203125, -4.19140625, -4.0419921875, -3.892578125, -3.7431640625, -3.59375, -3.4443359375, -3.294921875, -3.1455078125, -2.99609375, -2.8466796875, -2.697265625, -2.5478515625, -2.3984375, -2.2490234375, -2.099609375, -1.9501953125, -1.80078125, -1.6513671875, -1.501953125, -1.3525390625, -1.203125, -1.0537109375, -0.904296875, -0.7548828125, -0.60546875, -0.4560546875, -0.306640625, -0.1572265625, -0.0078125, 0.1416015625, 0.291015625, 0.4404296875, 0.58984375, 0.7392578125, 0.888671875, 1.0380859375, 1.1875, 1.3369140625, 1.486328125, 1.6357421875, 1.78515625, 1.9345703125, 2.083984375, 2.2333984375, 2.3828125, 2.5322265625, 2.681640625, 2.8310546875, 2.98046875, 3.1298828125, 3.279296875, 3.4287109375, 3.578125, 3.7275390625, 3.876953125, 4.0263671875, 4.17578125, 4.3251953125, 4.474609375, 4.6240234375, 4.7734375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 3.0, 2.0, 3.0, 9.0, 11.0, 16.0, 17.0, 30.0, 34.0, 37.0, 40.0, 37.0, 59.0, 45.0, 46.0, 65.0, 75.0, 59.0, 75.0, 63.0, 46.0, 35.0, 45.0, 33.0, 16.0, 17.0, 18.0, 21.0, 14.0, 11.0, 3.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.7734375, -6.5972900390625, -6.421142578125, -6.2449951171875, -6.06884765625, -5.8927001953125, -5.716552734375, -5.5404052734375, -5.3642578125, -5.1881103515625, -5.011962890625, -4.8358154296875, -4.65966796875, -4.4835205078125, -4.307373046875, -4.1312255859375, -3.955078125, -3.7789306640625, -3.602783203125, -3.4266357421875, -3.25048828125, -3.0743408203125, -2.898193359375, -2.7220458984375, -2.5458984375, -2.3697509765625, -2.193603515625, -2.0174560546875, -1.84130859375, -1.6651611328125, -1.489013671875, -1.3128662109375, -1.13671875, -0.9605712890625, -0.784423828125, -0.6082763671875, -0.43212890625, -0.2559814453125, -0.079833984375, 0.0963134765625, 0.2724609375, 0.4486083984375, 0.624755859375, 0.8009033203125, 0.97705078125, 1.1531982421875, 1.329345703125, 1.5054931640625, 1.681640625, 1.8577880859375, 2.033935546875, 2.2100830078125, 2.38623046875, 2.5623779296875, 2.738525390625, 2.9146728515625, 3.0908203125, 3.2669677734375, 3.443115234375, 3.6192626953125, 3.79541015625, 3.9715576171875, 4.147705078125, 4.3238525390625, 4.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 5.0, 10.0, 8.0, 9.0, 17.0, 28.0, 19.0, 34.0, 55.0, 78.0, 96.0, 130.0, 164.0, 233.0, 352.0, 624.0, 946.0, 1849.0, 4129.0, 11489.0, 41906.0, 209026.0, 640763.0, 100300.0, 22946.0, 7183.0, 2739.0, 1331.0, 721.0, 422.0, 279.0, 179.0, 115.0, 85.0, 66.0, 53.0, 39.0, 25.0, 26.0, 19.0, 9.0, 12.0, 10.0, 8.0, 5.0, 8.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.5703125, -9.2911376953125, -9.011962890625, -8.7327880859375, -8.45361328125, -8.1744384765625, -7.895263671875, -7.6160888671875, -7.3369140625, -7.0577392578125, -6.778564453125, -6.4993896484375, -6.22021484375, -5.9410400390625, -5.661865234375, -5.3826904296875, -5.103515625, -4.8243408203125, -4.545166015625, -4.2659912109375, -3.98681640625, -3.7076416015625, -3.428466796875, -3.1492919921875, -2.8701171875, -2.5909423828125, -2.311767578125, -2.0325927734375, -1.75341796875, -1.4742431640625, -1.195068359375, -0.9158935546875, -0.63671875, -0.3575439453125, -0.078369140625, 0.2008056640625, 0.47998046875, 0.7591552734375, 1.038330078125, 1.3175048828125, 1.5966796875, 1.8758544921875, 2.155029296875, 2.4342041015625, 2.71337890625, 2.9925537109375, 3.271728515625, 3.5509033203125, 3.830078125, 4.1092529296875, 4.388427734375, 4.6676025390625, 4.94677734375, 5.2259521484375, 5.505126953125, 5.7843017578125, 6.0634765625, 6.3426513671875, 6.621826171875, 6.9010009765625, 7.18017578125, 7.4593505859375, 7.738525390625, 8.0177001953125, 8.296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 9.0, 4.0, 8.0, 9.0, 12.0, 12.0, 12.0, 33.0, 32.0, 29.0, 47.0, 25.0, 48.0, 42.0, 51.0, 45.0, 52.0, 67.0, 54.0, 59.0, 48.0, 38.0, 43.0, 28.0, 31.0, 26.0, 27.0, 23.0, 11.0, 19.0, 8.0, 7.0, 6.0, 4.0, 6.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.1099853515625, -14.602783203125, -14.0955810546875, -13.58837890625, -13.0811767578125, -12.573974609375, -12.0667724609375, -11.5595703125, -11.0523681640625, -10.545166015625, -10.0379638671875, -9.53076171875, -9.0235595703125, -8.516357421875, -8.0091552734375, -7.501953125, -6.9947509765625, -6.487548828125, -5.9803466796875, -5.47314453125, -4.9659423828125, -4.458740234375, -3.9515380859375, -3.4443359375, -2.9371337890625, -2.429931640625, -1.9227294921875, -1.41552734375, -0.9083251953125, -0.401123046875, 0.1060791015625, 0.61328125, 1.1204833984375, 1.627685546875, 2.1348876953125, 2.64208984375, 3.1492919921875, 3.656494140625, 4.1636962890625, 4.6708984375, 5.1781005859375, 5.685302734375, 6.1925048828125, 6.69970703125, 7.2069091796875, 7.714111328125, 8.2213134765625, 8.728515625, 9.2357177734375, 9.742919921875, 10.2501220703125, 10.75732421875, 11.2645263671875, 11.771728515625, 12.2789306640625, 12.7861328125, 13.2933349609375, 13.800537109375, 14.3077392578125, 14.81494140625, 15.3221435546875, 15.829345703125, 16.3365478515625, 16.84375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 10.0, 9.0, 16.0, 10.0, 28.0, 34.0, 46.0, 70.0, 112.0, 164.0, 304.0, 554.0, 1153.0, 2745.0, 7111.0, 20483.0, 78984.0, 642381.0, 228119.0, 44368.0, 13182.0, 4670.0, 2038.0, 839.0, 432.0, 239.0, 160.0, 82.0, 60.0, 46.0, 28.0, 21.0, 8.0, 11.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.03515625, -1.973114013671875, -1.91107177734375, -1.849029541015625, -1.7869873046875, -1.724945068359375, -1.66290283203125, -1.600860595703125, -1.538818359375, -1.476776123046875, -1.41473388671875, -1.352691650390625, -1.2906494140625, -1.228607177734375, -1.16656494140625, -1.104522705078125, -1.04248046875, -0.980438232421875, -0.91839599609375, -0.856353759765625, -0.7943115234375, -0.732269287109375, -0.67022705078125, -0.608184814453125, -0.546142578125, -0.484100341796875, -0.42205810546875, -0.360015869140625, -0.2979736328125, -0.235931396484375, -0.17388916015625, -0.111846923828125, -0.0498046875, 0.012237548828125, 0.07427978515625, 0.136322021484375, 0.1983642578125, 0.260406494140625, 0.32244873046875, 0.384490966796875, 0.446533203125, 0.508575439453125, 0.57061767578125, 0.632659912109375, 0.6947021484375, 0.756744384765625, 0.81878662109375, 0.880828857421875, 0.94287109375, 1.004913330078125, 1.06695556640625, 1.128997802734375, 1.1910400390625, 1.253082275390625, 1.31512451171875, 1.377166748046875, 1.439208984375, 1.501251220703125, 1.56329345703125, 1.625335693359375, 1.6873779296875, 1.749420166015625, 1.81146240234375, 1.873504638671875, 1.935546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 15.0, 17.0, 25.0, 30.0, 51.0, 98.0, 142.0, 182.0, 129.0, 107.0, 61.0, 35.0, 24.0, 14.0, 9.0, 9.0, 7.0, 3.0, 5.0, 3.0, 5.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005769729614257812, -0.0005551576614379883, -0.0005333423614501953, -0.0005115270614624023, -0.0004897117614746094, -0.0004678964614868164, -0.00044608116149902344, -0.00042426586151123047, -0.0004024505615234375, -0.00038063526153564453, -0.00035881996154785156, -0.0003370046615600586, -0.0003151893615722656, -0.00029337406158447266, -0.0002715587615966797, -0.0002497434616088867, -0.00022792816162109375, -0.00020611286163330078, -0.0001842975616455078, -0.00016248226165771484, -0.00014066696166992188, -0.0001188516616821289, -9.703636169433594e-05, -7.522106170654297e-05, -5.340576171875e-05, -3.159046173095703e-05, -9.775161743164062e-06, 1.2040138244628906e-05, 3.3855438232421875e-05, 5.5670738220214844e-05, 7.748603820800781e-05, 9.930133819580078e-05, 0.00012111663818359375, 0.00014293193817138672, 0.0001647472381591797, 0.00018656253814697266, 0.00020837783813476562, 0.0002301931381225586, 0.00025200843811035156, 0.00027382373809814453, 0.0002956390380859375, 0.00031745433807373047, 0.00033926963806152344, 0.0003610849380493164, 0.0003829002380371094, 0.00040471553802490234, 0.0004265308380126953, 0.0004483461380004883, 0.00047016143798828125, 0.0004919767379760742, 0.0005137920379638672, 0.0005356073379516602, 0.0005574226379394531, 0.0005792379379272461, 0.0006010532379150391, 0.000622868537902832, 0.000644683837890625, 0.000666499137878418, 0.0006883144378662109, 0.0007101297378540039, 0.0007319450378417969, 0.0007537603378295898, 0.0007755756378173828, 0.0007973909378051758, 0.0008192062377929688]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 11.0, 12.0, 23.0, 47.0, 95.0, 268.0, 580.0, 1690.0, 7069.0, 52511.0, 816416.0, 150991.0, 14475.0, 2874.0, 854.0, 350.0, 124.0, 66.0, 32.0, 29.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.784912109375, -3.66162109375, -3.538330078125, -3.4150390625, -3.291748046875, -3.16845703125, -3.045166015625, -2.921875, -2.798583984375, -2.67529296875, -2.552001953125, -2.4287109375, -2.305419921875, -2.18212890625, -2.058837890625, -1.935546875, -1.812255859375, -1.68896484375, -1.565673828125, -1.4423828125, -1.319091796875, -1.19580078125, -1.072509765625, -0.94921875, -0.825927734375, -0.70263671875, -0.579345703125, -0.4560546875, -0.332763671875, -0.20947265625, -0.086181640625, 0.037109375, 0.160400390625, 0.28369140625, 0.406982421875, 0.5302734375, 0.653564453125, 0.77685546875, 0.900146484375, 1.0234375, 1.146728515625, 1.27001953125, 1.393310546875, 1.5166015625, 1.639892578125, 1.76318359375, 1.886474609375, 2.009765625, 2.133056640625, 2.25634765625, 2.379638671875, 2.5029296875, 2.626220703125, 2.74951171875, 2.872802734375, 2.99609375, 3.119384765625, 3.24267578125, 3.365966796875, 3.4892578125, 3.612548828125, 3.73583984375, 3.859130859375, 3.982421875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 8.0, 14.0, 19.0, 23.0, 28.0, 40.0, 47.0, 77.0, 95.0, 122.0, 107.0, 123.0, 83.0, 53.0, 42.0, 30.0, 29.0, 14.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.802520751953125, -2.71246337890625, -2.622406005859375, -2.5323486328125, -2.442291259765625, -2.35223388671875, -2.262176513671875, -2.172119140625, -2.082061767578125, -1.99200439453125, -1.901947021484375, -1.8118896484375, -1.721832275390625, -1.63177490234375, -1.541717529296875, -1.45166015625, -1.361602783203125, -1.27154541015625, -1.181488037109375, -1.0914306640625, -1.001373291015625, -0.91131591796875, -0.821258544921875, -0.731201171875, -0.641143798828125, -0.55108642578125, -0.461029052734375, -0.3709716796875, -0.280914306640625, -0.19085693359375, -0.100799560546875, -0.0107421875, 0.079315185546875, 0.16937255859375, 0.259429931640625, 0.3494873046875, 0.439544677734375, 0.52960205078125, 0.619659423828125, 0.709716796875, 0.799774169921875, 0.88983154296875, 0.979888916015625, 1.0699462890625, 1.160003662109375, 1.25006103515625, 1.340118408203125, 1.43017578125, 1.520233154296875, 1.61029052734375, 1.700347900390625, 1.7904052734375, 1.880462646484375, 1.97052001953125, 2.060577392578125, 2.150634765625, 2.240692138671875, 2.33074951171875, 2.420806884765625, 2.5108642578125, 2.600921630859375, 2.69097900390625, 2.781036376953125, 2.87109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 13.0, 9.0, 26.0, 57.0, 158.0, 356.0, 205.0, 84.0, 40.0, 14.0, 15.0, 14.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.64359283447266, -113.7037353515625, -110.76387023925781, -107.82400512695312, -104.88414764404297, -101.94429016113281, -99.00442504882812, -96.06455993652344, -93.12470245361328, -90.18484497070312, -87.24497985839844, -84.30511474609375, -81.3652572631836, -78.42539978027344, -75.48553466796875, -72.54566955566406, -69.6058120727539, -66.66595458984375, -63.72608947753906, -60.78622817993164, -57.84636688232422, -54.9065055847168, -51.966644287109375, -49.02678298950195, -46.08692169189453, -43.14706039428711, -40.20719909667969, -37.267337799072266, -34.327476501464844, -31.387615203857422, -28.44775390625, -25.507892608642578, -22.568031311035156, -19.628170013427734, -16.688308715820312, -13.74844741821289, -10.808586120605469, -7.868724822998047, -4.928863525390625, -1.9890022277832031, 0.9508590698242188, 3.8907203674316406, 6.8305816650390625, 9.770442962646484, 12.710304260253906, 15.650165557861328, 18.59002685546875, 21.529888153076172, 24.469749450683594, 27.409610748291016, 30.349472045898438, 33.28933334350586, 36.22919464111328, 39.1690559387207, 42.108917236328125, 45.04877853393555, 47.98863983154297, 50.92850112915039, 53.86836242675781, 56.808223724365234, 59.748085021972656, 62.68794631958008, 65.6278076171875, 68.56767272949219, 71.50753021240234]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 6.0, 6.0, 9.0, 6.0, 11.0, 14.0, 16.0, 14.0, 25.0, 18.0, 25.0, 26.0, 25.0, 36.0, 32.0, 38.0, 68.0, 89.0, 103.0, 84.0, 51.0, 44.0, 32.0, 31.0, 31.0, 26.0, 26.0, 12.0, 18.0, 19.0, 11.0, 10.0, 4.0, 7.0, 6.0, 5.0, 6.0, 3.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.973663330078125, -59.201786041259766, -57.429908752441406, -55.65803146362305, -53.88615417480469, -52.114280700683594, -50.342403411865234, -48.570526123046875, -46.798648834228516, -45.026771545410156, -43.2548942565918, -41.48301696777344, -39.711143493652344, -37.93926239013672, -36.167388916015625, -34.395511627197266, -32.623634338378906, -30.851757049560547, -29.079879760742188, -27.30800437927246, -25.5361270904541, -23.764249801635742, -21.992374420166016, -20.220497131347656, -18.448619842529297, -16.676742553710938, -14.904866218566895, -13.132989883422852, -11.361112594604492, -9.589235305786133, -7.81735897064209, -6.045482635498047, -4.273601531982422, -2.5017247200012207, -0.7298479080200195, 1.0420289039611816, 2.813905715942383, 4.585783004760742, 6.357659339904785, 8.129535675048828, 9.901412963867188, 11.673290252685547, 13.44516658782959, 15.217042922973633, 16.988920211791992, 18.76079750061035, 20.532672882080078, 22.304550170898438, 24.076427459716797, 25.848304748535156, 27.620182037353516, 29.392057418823242, 31.1639347076416, 32.935813903808594, 34.70768737792969, 36.47956466674805, 38.251441955566406, 40.023319244384766, 41.795196533203125, 43.567073822021484, 45.338951110839844, 47.11082458496094, 48.8827018737793, 50.654579162597656, 52.426456451416016]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 1.0, 8.0, 5.0, 15.0, 24.0, 30.0, 58.0, 104.0, 159.0, 273.0, 497.0, 1045.0, 2176.0, 4912.0, 12837.0, 41315.0, 172272.0, 849241.0, 2100030.0, 784583.0, 162300.0, 39908.0, 13003.0, 5044.0, 2210.0, 1024.0, 505.0, 303.0, 159.0, 89.0, 55.0, 33.0, 16.0, 15.0, 11.0, 6.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.734375, -4.59295654296875, -4.4515380859375, -4.31011962890625, -4.168701171875, -4.02728271484375, -3.8858642578125, -3.74444580078125, -3.60302734375, -3.46160888671875, -3.3201904296875, -3.17877197265625, -3.037353515625, -2.89593505859375, -2.7545166015625, -2.61309814453125, -2.4716796875, -2.33026123046875, -2.1888427734375, -2.04742431640625, -1.906005859375, -1.76458740234375, -1.6231689453125, -1.48175048828125, -1.34033203125, -1.19891357421875, -1.0574951171875, -0.91607666015625, -0.774658203125, -0.63323974609375, -0.4918212890625, -0.35040283203125, -0.208984375, -0.06756591796875, 0.0738525390625, 0.21527099609375, 0.356689453125, 0.49810791015625, 0.6395263671875, 0.78094482421875, 0.92236328125, 1.06378173828125, 1.2052001953125, 1.34661865234375, 1.488037109375, 1.62945556640625, 1.7708740234375, 1.91229248046875, 2.0537109375, 2.19512939453125, 2.3365478515625, 2.47796630859375, 2.619384765625, 2.76080322265625, 2.9022216796875, 3.04364013671875, 3.18505859375, 3.32647705078125, 3.4678955078125, 3.60931396484375, 3.750732421875, 3.89215087890625, 4.0335693359375, 4.17498779296875, 4.31640625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 4.0, 13.0, 13.0, 16.0, 25.0, 23.0, 30.0, 36.0, 41.0, 54.0, 55.0, 52.0, 54.0, 62.0, 69.0, 66.0, 57.0, 60.0, 48.0, 47.0, 39.0, 29.0, 20.0, 15.0, 13.0, 18.0, 8.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.4427490234375, -6.268310546875, -6.0938720703125, -5.91943359375, -5.7449951171875, -5.570556640625, -5.3961181640625, -5.2216796875, -5.0472412109375, -4.872802734375, -4.6983642578125, -4.52392578125, -4.3494873046875, -4.175048828125, -4.0006103515625, -3.826171875, -3.6517333984375, -3.477294921875, -3.3028564453125, -3.12841796875, -2.9539794921875, -2.779541015625, -2.6051025390625, -2.4306640625, -2.2562255859375, -2.081787109375, -1.9073486328125, -1.73291015625, -1.5584716796875, -1.384033203125, -1.2095947265625, -1.03515625, -0.8607177734375, -0.686279296875, -0.5118408203125, -0.33740234375, -0.1629638671875, 0.011474609375, 0.1859130859375, 0.3603515625, 0.5347900390625, 0.709228515625, 0.8836669921875, 1.05810546875, 1.2325439453125, 1.406982421875, 1.5814208984375, 1.755859375, 1.9302978515625, 2.104736328125, 2.2791748046875, 2.45361328125, 2.6280517578125, 2.802490234375, 2.9769287109375, 3.1513671875, 3.3258056640625, 3.500244140625, 3.6746826171875, 3.84912109375, 4.0235595703125, 4.197998046875, 4.3724365234375, 4.546875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 14.0, 9.0, 13.0, 17.0, 24.0, 22.0, 63.0, 76.0, 133.0, 241.0, 546.0, 1428.0, 5440.0, 33556.0, 609602.0, 3379779.0, 143728.0, 14681.0, 3098.0, 925.0, 363.0, 158.0, 102.0, 90.0, 41.0, 38.0, 18.0, 9.0, 16.0, 8.0, 6.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.7708740234375, -8.471435546875, -8.1719970703125, -7.87255859375, -7.5731201171875, -7.273681640625, -6.9742431640625, -6.6748046875, -6.3753662109375, -6.075927734375, -5.7764892578125, -5.47705078125, -5.1776123046875, -4.878173828125, -4.5787353515625, -4.279296875, -3.9798583984375, -3.680419921875, -3.3809814453125, -3.08154296875, -2.7821044921875, -2.482666015625, -2.1832275390625, -1.8837890625, -1.5843505859375, -1.284912109375, -0.9854736328125, -0.68603515625, -0.3865966796875, -0.087158203125, 0.2122802734375, 0.51171875, 0.8111572265625, 1.110595703125, 1.4100341796875, 1.70947265625, 2.0089111328125, 2.308349609375, 2.6077880859375, 2.9072265625, 3.2066650390625, 3.506103515625, 3.8055419921875, 4.10498046875, 4.4044189453125, 4.703857421875, 5.0032958984375, 5.302734375, 5.6021728515625, 5.901611328125, 6.2010498046875, 6.50048828125, 6.7999267578125, 7.099365234375, 7.3988037109375, 7.6982421875, 7.9976806640625, 8.297119140625, 8.5965576171875, 8.89599609375, 9.1954345703125, 9.494873046875, 9.7943115234375, 10.09375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 4.0, 2.0, 3.0, 8.0, 8.0, 9.0, 21.0, 14.0, 30.0, 25.0, 43.0, 74.0, 114.0, 142.0, 265.0, 350.0, 484.0, 572.0, 559.0, 429.0, 304.0, 191.0, 121.0, 75.0, 62.0, 50.0, 26.0, 23.0, 19.0, 12.0, 14.0, 7.0, 4.0, 5.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.23162841796875, -5.9984130859375, -5.76519775390625, -5.531982421875, -5.29876708984375, -5.0655517578125, -4.83233642578125, -4.59912109375, -4.36590576171875, -4.1326904296875, -3.89947509765625, -3.666259765625, -3.43304443359375, -3.1998291015625, -2.96661376953125, -2.7333984375, -2.50018310546875, -2.2669677734375, -2.03375244140625, -1.800537109375, -1.56732177734375, -1.3341064453125, -1.10089111328125, -0.86767578125, -0.63446044921875, -0.4012451171875, -0.16802978515625, 0.065185546875, 0.29840087890625, 0.5316162109375, 0.76483154296875, 0.998046875, 1.23126220703125, 1.4644775390625, 1.69769287109375, 1.930908203125, 2.16412353515625, 2.3973388671875, 2.63055419921875, 2.86376953125, 3.09698486328125, 3.3302001953125, 3.56341552734375, 3.796630859375, 4.02984619140625, 4.2630615234375, 4.49627685546875, 4.7294921875, 4.96270751953125, 5.1959228515625, 5.42913818359375, 5.662353515625, 5.89556884765625, 6.1287841796875, 6.36199951171875, 6.59521484375, 6.82843017578125, 7.0616455078125, 7.29486083984375, 7.528076171875, 7.76129150390625, 7.9945068359375, 8.22772216796875, 8.4609375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 4.0, 22.0, 38.0, 97.0, 162.0, 231.0, 212.0, 120.0, 53.0, 31.0, 11.0, 7.0, 3.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.22959899902344, -59.60778045654297, -56.9859619140625, -54.36414337158203, -51.74232482910156, -49.120506286621094, -46.498687744140625, -43.876869201660156, -41.25505065917969, -38.63323211669922, -36.01141357421875, -33.38959503173828, -30.767776489257812, -28.145957946777344, -25.524137496948242, -22.902318954467773, -20.280498504638672, -17.658679962158203, -15.036861419677734, -12.41504192352295, -9.79322338104248, -7.171404838562012, -4.549585342407227, -1.9277667999267578, 0.6940517425537109, 3.315870523452759, 5.937689304351807, 8.559508323669434, 11.181326866149902, 13.803145408630371, 16.424964904785156, 19.046783447265625, 21.668601989746094, 24.290420532226562, 26.91223907470703, 29.5340576171875, 32.15587615966797, 34.77769470214844, 37.399513244628906, 40.021331787109375, 42.643150329589844, 45.26496887207031, 47.88678741455078, 50.50860595703125, 53.13042449951172, 55.75224304199219, 58.374061584472656, 60.995880126953125, 63.61770248413086, 66.2395248413086, 68.86134338378906, 71.48316192626953, 74.10498046875, 76.72679901123047, 79.34861755371094, 81.9704360961914, 84.59225463867188, 87.21407318115234, 89.83589172363281, 92.45771026611328, 95.07952880859375, 97.70134735107422, 100.32316589355469, 102.94498443603516, 105.56680297851562]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 11.0, 13.0, 9.0, 12.0, 19.0, 21.0, 19.0, 22.0, 28.0, 28.0, 31.0, 31.0, 30.0, 35.0, 43.0, 48.0, 46.0, 35.0, 34.0, 47.0, 38.0, 35.0, 45.0, 37.0, 34.0, 18.0, 26.0, 25.0, 26.0, 22.0, 21.0, 14.0, 14.0, 6.0, 14.0, 8.0, 9.0, 6.0, 2.0, 6.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 5.0, 0.0, 1.0], "bins": [-28.26177406311035, -27.412242889404297, -26.562711715698242, -25.713180541992188, -24.863651275634766, -24.014118194580078, -23.164588928222656, -22.3150577545166, -21.465526580810547, -20.615995407104492, -19.766464233398438, -18.916933059692383, -18.067401885986328, -17.217872619628906, -16.36834144592285, -15.518810272216797, -14.669279098510742, -13.819747924804688, -12.970216751098633, -12.120686531066895, -11.27115535736084, -10.421624183654785, -9.572093963623047, -8.722562789916992, -7.8730316162109375, -7.023500442504883, -6.173969745635986, -5.32443904876709, -4.474907875061035, -3.6253767013549805, -2.775846004486084, -1.9263153076171875, -1.0767822265625, -0.22725129127502441, 0.6222796440124512, 1.4718105792999268, 2.3213415145874023, 3.170872688293457, 4.0204033851623535, 4.86993408203125, 5.719465255737305, 6.568996429443359, 7.418527126312256, 8.268057823181152, 9.117588996887207, 9.967120170593262, 10.816650390625, 11.666181564331055, 12.51571273803711, 13.365243911743164, 14.214775085449219, 15.064305305480957, 15.913836479187012, 16.76336669921875, 17.612897872924805, 18.46242904663086, 19.311960220336914, 20.16149139404297, 21.011022567749023, 21.860553741455078, 22.7100830078125, 23.559616088867188, 24.40914535522461, 25.258676528930664, 26.10820770263672]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 11.0, 12.0, 16.0, 31.0, 39.0, 80.0, 91.0, 141.0, 238.0, 390.0, 595.0, 1086.0, 1855.0, 3509.0, 7005.0, 14669.0, 32094.0, 78015.0, 197802.0, 363517.0, 203667.0, 80199.0, 33027.0, 14770.0, 7292.0, 3642.0, 2008.0, 1049.0, 653.0, 367.0, 232.0, 149.0, 109.0, 70.0, 41.0, 31.0, 13.0, 17.0, 8.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.69921875, -4.534423828125, -4.36962890625, -4.204833984375, -4.0400390625, -3.875244140625, -3.71044921875, -3.545654296875, -3.380859375, -3.216064453125, -3.05126953125, -2.886474609375, -2.7216796875, -2.556884765625, -2.39208984375, -2.227294921875, -2.0625, -1.897705078125, -1.73291015625, -1.568115234375, -1.4033203125, -1.238525390625, -1.07373046875, -0.908935546875, -0.744140625, -0.579345703125, -0.41455078125, -0.249755859375, -0.0849609375, 0.079833984375, 0.24462890625, 0.409423828125, 0.57421875, 0.739013671875, 0.90380859375, 1.068603515625, 1.2333984375, 1.398193359375, 1.56298828125, 1.727783203125, 1.892578125, 2.057373046875, 2.22216796875, 2.386962890625, 2.5517578125, 2.716552734375, 2.88134765625, 3.046142578125, 3.2109375, 3.375732421875, 3.54052734375, 3.705322265625, 3.8701171875, 4.034912109375, 4.19970703125, 4.364501953125, 4.529296875, 4.694091796875, 4.85888671875, 5.023681640625, 5.1884765625, 5.353271484375, 5.51806640625, 5.682861328125, 5.84765625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 2.0, 0.0, 7.0, 13.0, 8.0, 16.0, 12.0, 24.0, 27.0, 39.0, 43.0, 39.0, 51.0, 44.0, 74.0, 56.0, 58.0, 55.0, 57.0, 58.0, 55.0, 44.0, 43.0, 43.0, 33.0, 28.0, 15.0, 15.0, 16.0, 7.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.5390625, -6.3658447265625, -6.192626953125, -6.0194091796875, -5.84619140625, -5.6729736328125, -5.499755859375, -5.3265380859375, -5.1533203125, -4.9801025390625, -4.806884765625, -4.6336669921875, -4.46044921875, -4.2872314453125, -4.114013671875, -3.9407958984375, -3.767578125, -3.5943603515625, -3.421142578125, -3.2479248046875, -3.07470703125, -2.9014892578125, -2.728271484375, -2.5550537109375, -2.3818359375, -2.2086181640625, -2.035400390625, -1.8621826171875, -1.68896484375, -1.5157470703125, -1.342529296875, -1.1693115234375, -0.99609375, -0.8228759765625, -0.649658203125, -0.4764404296875, -0.30322265625, -0.1300048828125, 0.043212890625, 0.2164306640625, 0.3896484375, 0.5628662109375, 0.736083984375, 0.9093017578125, 1.08251953125, 1.2557373046875, 1.428955078125, 1.6021728515625, 1.775390625, 1.9486083984375, 2.121826171875, 2.2950439453125, 2.46826171875, 2.6414794921875, 2.814697265625, 2.9879150390625, 3.1611328125, 3.3343505859375, 3.507568359375, 3.6807861328125, 3.85400390625, 4.0272216796875, 4.200439453125, 4.3736572265625, 4.546875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 10.0, 9.0, 23.0, 28.0, 27.0, 49.0, 66.0, 107.0, 134.0, 221.0, 359.0, 494.0, 873.0, 1746.0, 4118.0, 15304.0, 123208.0, 816949.0, 67714.0, 10490.0, 3170.0, 1423.0, 739.0, 426.0, 277.0, 190.0, 123.0, 91.0, 60.0, 41.0, 27.0, 17.0, 13.0, 11.0, 5.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.375, -12.9619140625, -12.548828125, -12.1357421875, -11.72265625, -11.3095703125, -10.896484375, -10.4833984375, -10.0703125, -9.6572265625, -9.244140625, -8.8310546875, -8.41796875, -8.0048828125, -7.591796875, -7.1787109375, -6.765625, -6.3525390625, -5.939453125, -5.5263671875, -5.11328125, -4.7001953125, -4.287109375, -3.8740234375, -3.4609375, -3.0478515625, -2.634765625, -2.2216796875, -1.80859375, -1.3955078125, -0.982421875, -0.5693359375, -0.15625, 0.2568359375, 0.669921875, 1.0830078125, 1.49609375, 1.9091796875, 2.322265625, 2.7353515625, 3.1484375, 3.5615234375, 3.974609375, 4.3876953125, 4.80078125, 5.2138671875, 5.626953125, 6.0400390625, 6.453125, 6.8662109375, 7.279296875, 7.6923828125, 8.10546875, 8.5185546875, 8.931640625, 9.3447265625, 9.7578125, 10.1708984375, 10.583984375, 10.9970703125, 11.41015625, 11.8232421875, 12.236328125, 12.6494140625, 13.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 8.0, 6.0, 12.0, 10.0, 9.0, 16.0, 29.0, 27.0, 42.0, 25.0, 38.0, 52.0, 44.0, 51.0, 53.0, 48.0, 45.0, 56.0, 54.0, 46.0, 47.0, 45.0, 47.0, 31.0, 22.0, 24.0, 22.0, 10.0, 12.0, 10.0, 8.0, 10.0, 3.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.248291015625, -12.74658203125, -12.244873046875, -11.7431640625, -11.241455078125, -10.73974609375, -10.238037109375, -9.736328125, -9.234619140625, -8.73291015625, -8.231201171875, -7.7294921875, -7.227783203125, -6.72607421875, -6.224365234375, -5.72265625, -5.220947265625, -4.71923828125, -4.217529296875, -3.7158203125, -3.214111328125, -2.71240234375, -2.210693359375, -1.708984375, -1.207275390625, -0.70556640625, -0.203857421875, 0.2978515625, 0.799560546875, 1.30126953125, 1.802978515625, 2.3046875, 2.806396484375, 3.30810546875, 3.809814453125, 4.3115234375, 4.813232421875, 5.31494140625, 5.816650390625, 6.318359375, 6.820068359375, 7.32177734375, 7.823486328125, 8.3251953125, 8.826904296875, 9.32861328125, 9.830322265625, 10.33203125, 10.833740234375, 11.33544921875, 11.837158203125, 12.3388671875, 12.840576171875, 13.34228515625, 13.843994140625, 14.345703125, 14.847412109375, 15.34912109375, 15.850830078125, 16.3525390625, 16.854248046875, 17.35595703125, 17.857666015625, 18.359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 3.0, 3.0, 13.0, 9.0, 13.0, 11.0, 22.0, 22.0, 31.0, 43.0, 71.0, 146.0, 299.0, 631.0, 1770.0, 8101.0, 75396.0, 910137.0, 43393.0, 5890.0, 1420.0, 476.0, 228.0, 125.0, 81.0, 49.0, 48.0, 35.0, 18.0, 17.0, 13.0, 8.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.7421875, -2.642120361328125, -2.54205322265625, -2.441986083984375, -2.3419189453125, -2.241851806640625, -2.14178466796875, -2.041717529296875, -1.941650390625, -1.841583251953125, -1.74151611328125, -1.641448974609375, -1.5413818359375, -1.441314697265625, -1.34124755859375, -1.241180419921875, -1.14111328125, -1.041046142578125, -0.94097900390625, -0.840911865234375, -0.7408447265625, -0.640777587890625, -0.54071044921875, -0.440643310546875, -0.340576171875, -0.240509033203125, -0.14044189453125, -0.040374755859375, 0.0596923828125, 0.159759521484375, 0.25982666015625, 0.359893798828125, 0.4599609375, 0.560028076171875, 0.66009521484375, 0.760162353515625, 0.8602294921875, 0.960296630859375, 1.06036376953125, 1.160430908203125, 1.260498046875, 1.360565185546875, 1.46063232421875, 1.560699462890625, 1.6607666015625, 1.760833740234375, 1.86090087890625, 1.960968017578125, 2.06103515625, 2.161102294921875, 2.26116943359375, 2.361236572265625, 2.4613037109375, 2.561370849609375, 2.66143798828125, 2.761505126953125, 2.861572265625, 2.961639404296875, 3.06170654296875, 3.161773681640625, 3.2618408203125, 3.361907958984375, 3.46197509765625, 3.562042236328125, 3.662109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 8.0, 8.0, 8.0, 9.0, 9.0, 21.0, 24.0, 34.0, 85.0, 152.0, 237.0, 145.0, 86.0, 51.0, 28.0, 20.0, 16.0, 9.0, 8.0, 4.0, 4.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007147789001464844, -0.0006945878267288208, -0.0006743967533111572, -0.0006542056798934937, -0.0006340146064758301, -0.0006138235330581665, -0.0005936324596405029, -0.0005734413862228394, -0.0005532503128051758, -0.0005330592393875122, -0.0005128681659698486, -0.0004926770925521851, -0.0004724860191345215, -0.0004522949457168579, -0.00043210387229919434, -0.00041191279888153076, -0.0003917217254638672, -0.0003715306520462036, -0.00035133957862854004, -0.00033114850521087646, -0.0003109574317932129, -0.0002907663583755493, -0.00027057528495788574, -0.00025038421154022217, -0.0002301931381225586, -0.00021000206470489502, -0.00018981099128723145, -0.00016961991786956787, -0.0001494288444519043, -0.00012923777103424072, -0.00010904669761657715, -8.885562419891357e-05, -6.866455078125e-05, -4.8473477363586426e-05, -2.828240394592285e-05, -8.091330528259277e-06, 1.2099742889404297e-05, 3.229081630706787e-05, 5.2481889724731445e-05, 7.267296314239502e-05, 9.28640365600586e-05, 0.00011305510997772217, 0.00013324618339538574, 0.00015343725681304932, 0.0001736283302307129, 0.00019381940364837646, 0.00021401047706604004, 0.0002342015504837036, 0.0002543926239013672, 0.00027458369731903076, 0.00029477477073669434, 0.0003149658441543579, 0.0003351569175720215, 0.00035534799098968506, 0.00037553906440734863, 0.0003957301378250122, 0.0004159212112426758, 0.00043611228466033936, 0.00045630335807800293, 0.0004764944314956665, 0.0004966855049133301, 0.0005168765783309937, 0.0005370676517486572, 0.0005572587251663208, 0.0005774497985839844]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 9.0, 14.0, 12.0, 19.0, 35.0, 58.0, 99.0, 131.0, 224.0, 391.0, 748.0, 1595.0, 4284.0, 14881.0, 76739.0, 782679.0, 135022.0, 21518.0, 5781.0, 2168.0, 922.0, 506.0, 281.0, 161.0, 98.0, 58.0, 45.0, 18.0, 17.0, 10.0, 8.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.5682830810546875, -2.501800537109375, -2.4353179931640625, -2.36883544921875, -2.3023529052734375, -2.235870361328125, -2.1693878173828125, -2.1029052734375, -2.0364227294921875, -1.969940185546875, -1.9034576416015625, -1.83697509765625, -1.7704925537109375, -1.704010009765625, -1.6375274658203125, -1.571044921875, -1.5045623779296875, -1.438079833984375, -1.3715972900390625, -1.30511474609375, -1.2386322021484375, -1.172149658203125, -1.1056671142578125, -1.0391845703125, -0.9727020263671875, -0.906219482421875, -0.8397369384765625, -0.77325439453125, -0.7067718505859375, -0.640289306640625, -0.5738067626953125, -0.50732421875, -0.4408416748046875, -0.374359130859375, -0.3078765869140625, -0.24139404296875, -0.1749114990234375, -0.108428955078125, -0.0419464111328125, 0.0245361328125, 0.0910186767578125, 0.157501220703125, 0.2239837646484375, 0.29046630859375, 0.3569488525390625, 0.423431396484375, 0.4899139404296875, 0.556396484375, 0.6228790283203125, 0.689361572265625, 0.7558441162109375, 0.82232666015625, 0.8888092041015625, 0.955291748046875, 1.0217742919921875, 1.0882568359375, 1.1547393798828125, 1.221221923828125, 1.2877044677734375, 1.35418701171875, 1.4206695556640625, 1.487152099609375, 1.5536346435546875, 1.6201171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 9.0, 5.0, 13.0, 16.0, 19.0, 44.0, 40.0, 60.0, 82.0, 119.0, 127.0, 99.0, 90.0, 80.0, 57.0, 30.0, 14.0, 11.0, 17.0, 14.0, 12.0, 10.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.22265625, -3.1451568603515625, -3.067657470703125, -2.9901580810546875, -2.91265869140625, -2.8351593017578125, -2.757659912109375, -2.6801605224609375, -2.6026611328125, -2.5251617431640625, -2.447662353515625, -2.3701629638671875, -2.29266357421875, -2.2151641845703125, -2.137664794921875, -2.0601654052734375, -1.982666015625, -1.9051666259765625, -1.827667236328125, -1.7501678466796875, -1.67266845703125, -1.5951690673828125, -1.517669677734375, -1.4401702880859375, -1.3626708984375, -1.2851715087890625, -1.207672119140625, -1.1301727294921875, -1.05267333984375, -0.9751739501953125, -0.897674560546875, -0.8201751708984375, -0.74267578125, -0.6651763916015625, -0.587677001953125, -0.5101776123046875, -0.43267822265625, -0.3551788330078125, -0.277679443359375, -0.2001800537109375, -0.1226806640625, -0.0451812744140625, 0.032318115234375, 0.1098175048828125, 0.18731689453125, 0.2648162841796875, 0.342315673828125, 0.4198150634765625, 0.497314453125, 0.5748138427734375, 0.652313232421875, 0.7298126220703125, 0.80731201171875, 0.8848114013671875, 0.962310791015625, 1.0398101806640625, 1.1173095703125, 1.1948089599609375, 1.272308349609375, 1.3498077392578125, 1.42730712890625, 1.5048065185546875, 1.582305908203125, 1.6598052978515625, 1.7373046875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 36.0, 125.0, 469.0, 245.0, 60.0, 24.0, 11.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.29277801513672, -72.94034576416016, -68.58792114257812, -64.23548889160156, -59.883056640625, -55.53062438964844, -51.17819595336914, -46.825767517089844, -42.47333526611328, -38.12090301513672, -33.76847457885742, -29.416044235229492, -25.063613891601562, -20.711183547973633, -16.358753204345703, -12.006322860717773, -7.653892517089844, -3.301462173461914, 1.0509681701660156, 5.403398513793945, 9.755828857421875, 14.108259201049805, 18.460689544677734, 22.813119888305664, 27.165550231933594, 31.517980575561523, 35.87041091918945, 40.22283935546875, 44.57527160644531, 48.927703857421875, 53.28013229370117, 57.63256072998047, 61.98500061035156, 66.33743286132812, 70.68986511230469, 75.04228973388672, 79.39472198486328, 83.74715423583984, 88.09957885742188, 92.45201110839844, 96.804443359375, 101.15687561035156, 105.50930786132812, 109.86173248291016, 114.21416473388672, 118.56659698486328, 122.91902160644531, 127.27145385742188, 131.62388610839844, 135.976318359375, 140.32875061035156, 144.68118286132812, 149.03359985351562, 153.3860321044922, 157.73846435546875, 162.0908966064453, 166.44332885742188, 170.79576110839844, 175.148193359375, 179.50062561035156, 183.85305786132812, 188.20547485351562, 192.5579071044922, 196.91033935546875, 201.2627716064453]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 8.0, 5.0, 5.0, 16.0, 9.0, 12.0, 15.0, 15.0, 15.0, 21.0, 24.0, 28.0, 33.0, 26.0, 48.0, 57.0, 104.0, 133.0, 87.0, 61.0, 36.0, 22.0, 27.0, 21.0, 26.0, 16.0, 26.0, 14.0, 13.0, 11.0, 16.0, 9.0, 3.0, 10.0, 9.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.68390655517578, -53.799259185791016, -51.91461181640625, -50.029964447021484, -48.14531707763672, -46.26066589355469, -44.37602233886719, -42.491371154785156, -40.60672378540039, -38.722076416015625, -36.83742904663086, -34.952781677246094, -33.06813430786133, -31.18348503112793, -29.298837661743164, -27.414188385009766, -25.529542922973633, -23.644895553588867, -21.7602481842041, -19.875598907470703, -17.990951538085938, -16.106304168701172, -14.221656799316406, -12.337008476257324, -10.452361106872559, -8.567713737487793, -6.683065414428711, -4.798418045043945, -2.9137701988220215, -1.0291223526000977, 0.855525016784668, 2.74017333984375, 4.624820709228516, 6.5094685554504395, 8.394116401672363, 10.278763771057129, 12.163412094116211, 14.048059463500977, 15.932706832885742, 17.81735610961914, 19.702003479003906, 21.586650848388672, 23.471298217773438, 25.355945587158203, 27.2405948638916, 29.125242233276367, 31.009889602661133, 32.89453887939453, 34.77918243408203, 36.6638298034668, 38.54847717285156, 40.43312454223633, 42.317771911621094, 44.202423095703125, 46.087066650390625, 47.971717834472656, 49.85636520385742, 51.74101257324219, 53.62565994262695, 55.51030731201172, 57.394954681396484, 59.27960205078125, 61.16425323486328, 63.04890060424805, 64.93354797363281]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 4.0, 12.0, 13.0, 13.0, 32.0, 39.0, 93.0, 95.0, 121.0, 217.0, 386.0, 517.0, 1012.0, 1981.0, 4321.0, 12969.0, 48746.0, 255232.0, 1231205.0, 1949046.0, 552775.0, 98057.0, 22896.0, 7967.0, 3151.0, 1395.0, 781.0, 444.0, 288.0, 154.0, 98.0, 69.0, 58.0, 28.0, 17.0, 16.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.5625, -6.38134765625, -6.2001953125, -6.01904296875, -5.837890625, -5.65673828125, -5.4755859375, -5.29443359375, -5.11328125, -4.93212890625, -4.7509765625, -4.56982421875, -4.388671875, -4.20751953125, -4.0263671875, -3.84521484375, -3.6640625, -3.48291015625, -3.3017578125, -3.12060546875, -2.939453125, -2.75830078125, -2.5771484375, -2.39599609375, -2.21484375, -2.03369140625, -1.8525390625, -1.67138671875, -1.490234375, -1.30908203125, -1.1279296875, -0.94677734375, -0.765625, -0.58447265625, -0.4033203125, -0.22216796875, -0.041015625, 0.14013671875, 0.3212890625, 0.50244140625, 0.68359375, 0.86474609375, 1.0458984375, 1.22705078125, 1.408203125, 1.58935546875, 1.7705078125, 1.95166015625, 2.1328125, 2.31396484375, 2.4951171875, 2.67626953125, 2.857421875, 3.03857421875, 3.2197265625, 3.40087890625, 3.58203125, 3.76318359375, 3.9443359375, 4.12548828125, 4.306640625, 4.48779296875, 4.6689453125, 4.85009765625, 5.03125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 7.0, 10.0, 13.0, 21.0, 34.0, 30.0, 48.0, 44.0, 43.0, 54.0, 72.0, 57.0, 69.0, 70.0, 69.0, 54.0, 47.0, 44.0, 46.0, 32.0, 39.0, 27.0, 14.0, 15.0, 8.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.53125, -6.35821533203125, -6.1851806640625, -6.01214599609375, -5.839111328125, -5.66607666015625, -5.4930419921875, -5.32000732421875, -5.14697265625, -4.97393798828125, -4.8009033203125, -4.62786865234375, -4.454833984375, -4.28179931640625, -4.1087646484375, -3.93572998046875, -3.7626953125, -3.58966064453125, -3.4166259765625, -3.24359130859375, -3.070556640625, -2.89752197265625, -2.7244873046875, -2.55145263671875, -2.37841796875, -2.20538330078125, -2.0323486328125, -1.85931396484375, -1.686279296875, -1.51324462890625, -1.3402099609375, -1.16717529296875, -0.994140625, -0.82110595703125, -0.6480712890625, -0.47503662109375, -0.302001953125, -0.12896728515625, 0.0440673828125, 0.21710205078125, 0.39013671875, 0.56317138671875, 0.7362060546875, 0.90924072265625, 1.082275390625, 1.25531005859375, 1.4283447265625, 1.60137939453125, 1.7744140625, 1.94744873046875, 2.1204833984375, 2.29351806640625, 2.466552734375, 2.63958740234375, 2.8126220703125, 2.98565673828125, 3.15869140625, 3.33172607421875, 3.5047607421875, 3.67779541015625, 3.850830078125, 4.02386474609375, 4.1968994140625, 4.36993408203125, 4.54296875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 7.0, 10.0, 18.0, 19.0, 37.0, 53.0, 64.0, 112.0, 206.0, 359.0, 691.0, 1590.0, 5632.0, 42902.0, 3528528.0, 590139.0, 18103.0, 3358.0, 1106.0, 545.0, 296.0, 165.0, 98.0, 70.0, 49.0, 26.0, 32.0, 16.0, 16.0, 2.0, 4.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.527587890625, -16.00830078125, -15.489013671875, -14.9697265625, -14.450439453125, -13.93115234375, -13.411865234375, -12.892578125, -12.373291015625, -11.85400390625, -11.334716796875, -10.8154296875, -10.296142578125, -9.77685546875, -9.257568359375, -8.73828125, -8.218994140625, -7.69970703125, -7.180419921875, -6.6611328125, -6.141845703125, -5.62255859375, -5.103271484375, -4.583984375, -4.064697265625, -3.54541015625, -3.026123046875, -2.5068359375, -1.987548828125, -1.46826171875, -0.948974609375, -0.4296875, 0.089599609375, 0.60888671875, 1.128173828125, 1.6474609375, 2.166748046875, 2.68603515625, 3.205322265625, 3.724609375, 4.243896484375, 4.76318359375, 5.282470703125, 5.8017578125, 6.321044921875, 6.84033203125, 7.359619140625, 7.87890625, 8.398193359375, 8.91748046875, 9.436767578125, 9.9560546875, 10.475341796875, 10.99462890625, 11.513916015625, 12.033203125, 12.552490234375, 13.07177734375, 13.591064453125, 14.1103515625, 14.629638671875, 15.14892578125, 15.668212890625, 16.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 6.0, 5.0, 10.0, 13.0, 22.0, 18.0, 26.0, 46.0, 77.0, 83.0, 124.0, 179.0, 296.0, 442.0, 610.0, 624.0, 477.0, 338.0, 230.0, 134.0, 101.0, 61.0, 38.0, 29.0, 21.0, 18.0, 10.0, 8.0, 11.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.2398681640625, -8.885986328125, -8.5321044921875, -8.17822265625, -7.8243408203125, -7.470458984375, -7.1165771484375, -6.7626953125, -6.4088134765625, -6.054931640625, -5.7010498046875, -5.34716796875, -4.9932861328125, -4.639404296875, -4.2855224609375, -3.931640625, -3.5777587890625, -3.223876953125, -2.8699951171875, -2.51611328125, -2.1622314453125, -1.808349609375, -1.4544677734375, -1.1005859375, -0.7467041015625, -0.392822265625, -0.0389404296875, 0.31494140625, 0.6688232421875, 1.022705078125, 1.3765869140625, 1.73046875, 2.0843505859375, 2.438232421875, 2.7921142578125, 3.14599609375, 3.4998779296875, 3.853759765625, 4.2076416015625, 4.5615234375, 4.9154052734375, 5.269287109375, 5.6231689453125, 5.97705078125, 6.3309326171875, 6.684814453125, 7.0386962890625, 7.392578125, 7.7464599609375, 8.100341796875, 8.4542236328125, 8.80810546875, 9.1619873046875, 9.515869140625, 9.8697509765625, 10.2236328125, 10.5775146484375, 10.931396484375, 11.2852783203125, 11.63916015625, 11.9930419921875, 12.346923828125, 12.7008056640625, 13.0546875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 1.0, 6.0, 9.0, 8.0, 10.0, 25.0, 58.0, 101.0, 214.0, 263.0, 144.0, 66.0, 35.0, 20.0, 14.0, 14.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.87327575683594, -77.40188598632812, -72.93049621582031, -68.4591064453125, -63.98771286010742, -59.51632308959961, -55.04492950439453, -50.57353973388672, -46.102149963378906, -41.630760192871094, -37.15937042236328, -32.6879768371582, -28.21658706665039, -23.745197296142578, -19.273805618286133, -14.802413940429688, -10.331024169921875, -5.859633445739746, -1.3882427215576172, 3.0831480026245117, 7.554538726806641, 12.025928497314453, 16.4973201751709, 20.968711853027344, 25.440101623535156, 29.91149139404297, 34.38288116455078, 38.85427474975586, 43.32566452026367, 47.797054290771484, 52.26844787597656, 56.739837646484375, 61.211212158203125, 65.68260192871094, 70.15399169921875, 74.62538146972656, 79.09677124023438, 83.56816101074219, 88.03955841064453, 92.51094818115234, 96.98233795166016, 101.45372772216797, 105.92511749267578, 110.3965072631836, 114.86790466308594, 119.33929443359375, 123.81068420410156, 128.28207397460938, 132.7534637451172, 137.224853515625, 141.6962432861328, 146.16763305664062, 150.63902282714844, 155.11041259765625, 159.58180236816406, 164.05319213867188, 168.52459716796875, 172.99598693847656, 177.46737670898438, 181.9387664794922, 186.41015625, 190.8815460205078, 195.35293579101562, 199.8243408203125, 204.29571533203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 4.0, 12.0, 13.0, 17.0, 22.0, 20.0, 24.0, 21.0, 33.0, 51.0, 38.0, 68.0, 63.0, 70.0, 66.0, 58.0, 66.0, 53.0, 40.0, 42.0, 28.0, 35.0, 25.0, 26.0, 15.0, 21.0, 21.0, 9.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.707542419433594, -48.63362503051758, -46.55970764160156, -44.48579406738281, -42.4118766784668, -40.33795928955078, -38.264041900634766, -36.19012451171875, -34.1162109375, -32.042293548583984, -29.9683780670166, -27.894460678100586, -25.820545196533203, -23.746627807617188, -21.672710418701172, -19.598793029785156, -17.52487564086914, -15.450959205627441, -13.377042770385742, -11.303125381469727, -9.229208946228027, -7.155292510986328, -5.0813751220703125, -3.0074586868286133, -0.9335422515869141, 1.1403744220733643, 3.2142910957336426, 5.2882080078125, 7.362124443054199, 9.436040878295898, 11.509958267211914, 13.583874702453613, 15.657791137695312, 17.731708526611328, 19.80562400817871, 21.879541397094727, 23.95345687866211, 26.027374267578125, 28.10129165649414, 30.175209045410156, 32.249122619628906, 34.32304000854492, 36.39695739746094, 38.47087097167969, 40.5447883605957, 42.61870574951172, 44.692623138427734, 46.76654052734375, 48.840457916259766, 50.91437530517578, 52.9882926940918, 55.06221008300781, 57.13612365722656, 59.21004104614258, 61.283958435058594, 63.35787582397461, 65.43179321289062, 67.50570678710938, 69.57962799072266, 71.6535415649414, 73.72746276855469, 75.80137634277344, 77.87528991699219, 79.94921112060547, 82.02312469482422]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 10.0, 9.0, 19.0, 38.0, 26.0, 51.0, 97.0, 141.0, 226.0, 382.0, 690.0, 1433.0, 3233.0, 7912.0, 21474.0, 73093.0, 308158.0, 469842.0, 112240.0, 31102.0, 10295.0, 4153.0, 1807.0, 928.0, 470.0, 270.0, 142.0, 126.0, 59.0, 40.0, 24.0, 22.0, 15.0, 9.0, 3.0, 2.0, 5.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8359375, -5.628662109375, -5.42138671875, -5.214111328125, -5.0068359375, -4.799560546875, -4.59228515625, -4.385009765625, -4.177734375, -3.970458984375, -3.76318359375, -3.555908203125, -3.3486328125, -3.141357421875, -2.93408203125, -2.726806640625, -2.51953125, -2.312255859375, -2.10498046875, -1.897705078125, -1.6904296875, -1.483154296875, -1.27587890625, -1.068603515625, -0.861328125, -0.654052734375, -0.44677734375, -0.239501953125, -0.0322265625, 0.175048828125, 0.38232421875, 0.589599609375, 0.796875, 1.004150390625, 1.21142578125, 1.418701171875, 1.6259765625, 1.833251953125, 2.04052734375, 2.247802734375, 2.455078125, 2.662353515625, 2.86962890625, 3.076904296875, 3.2841796875, 3.491455078125, 3.69873046875, 3.906005859375, 4.11328125, 4.320556640625, 4.52783203125, 4.735107421875, 4.9423828125, 5.149658203125, 5.35693359375, 5.564208984375, 5.771484375, 5.978759765625, 6.18603515625, 6.393310546875, 6.6005859375, 6.807861328125, 7.01513671875, 7.222412109375, 7.4296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 8.0, 12.0, 13.0, 6.0, 14.0, 17.0, 22.0, 35.0, 43.0, 42.0, 44.0, 61.0, 63.0, 62.0, 63.0, 54.0, 64.0, 57.0, 57.0, 53.0, 45.0, 30.0, 29.0, 24.0, 13.0, 22.0, 12.0, 9.0, 9.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.5390625, -6.366455078125, -6.19384765625, -6.021240234375, -5.8486328125, -5.676025390625, -5.50341796875, -5.330810546875, -5.158203125, -4.985595703125, -4.81298828125, -4.640380859375, -4.4677734375, -4.295166015625, -4.12255859375, -3.949951171875, -3.77734375, -3.604736328125, -3.43212890625, -3.259521484375, -3.0869140625, -2.914306640625, -2.74169921875, -2.569091796875, -2.396484375, -2.223876953125, -2.05126953125, -1.878662109375, -1.7060546875, -1.533447265625, -1.36083984375, -1.188232421875, -1.015625, -0.843017578125, -0.67041015625, -0.497802734375, -0.3251953125, -0.152587890625, 0.02001953125, 0.192626953125, 0.365234375, 0.537841796875, 0.71044921875, 0.883056640625, 1.0556640625, 1.228271484375, 1.40087890625, 1.573486328125, 1.74609375, 1.918701171875, 2.09130859375, 2.263916015625, 2.4365234375, 2.609130859375, 2.78173828125, 2.954345703125, 3.126953125, 3.299560546875, 3.47216796875, 3.644775390625, 3.8173828125, 3.989990234375, 4.16259765625, 4.335205078125, 4.5078125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 14.0, 18.0, 30.0, 37.0, 45.0, 88.0, 142.0, 288.0, 582.0, 1455.0, 7431.0, 131253.0, 875461.0, 26665.0, 3224.0, 905.0, 388.0, 190.0, 118.0, 65.0, 40.0, 24.0, 25.0, 14.0, 13.0, 9.0, 5.0, 0.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4296875, -9.0565185546875, -8.683349609375, -8.3101806640625, -7.93701171875, -7.5638427734375, -7.190673828125, -6.8175048828125, -6.4443359375, -6.0711669921875, -5.697998046875, -5.3248291015625, -4.95166015625, -4.5784912109375, -4.205322265625, -3.8321533203125, -3.458984375, -3.0858154296875, -2.712646484375, -2.3394775390625, -1.96630859375, -1.5931396484375, -1.219970703125, -0.8468017578125, -0.4736328125, -0.1004638671875, 0.272705078125, 0.6458740234375, 1.01904296875, 1.3922119140625, 1.765380859375, 2.1385498046875, 2.51171875, 2.8848876953125, 3.258056640625, 3.6312255859375, 4.00439453125, 4.3775634765625, 4.750732421875, 5.1239013671875, 5.4970703125, 5.8702392578125, 6.243408203125, 6.6165771484375, 6.98974609375, 7.3629150390625, 7.736083984375, 8.1092529296875, 8.482421875, 8.8555908203125, 9.228759765625, 9.6019287109375, 9.97509765625, 10.3482666015625, 10.721435546875, 11.0946044921875, 11.4677734375, 11.8409423828125, 12.214111328125, 12.5872802734375, 12.96044921875, 13.3336181640625, 13.706787109375, 14.0799560546875, 14.453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 8.0, 5.0, 11.0, 12.0, 8.0, 10.0, 11.0, 23.0, 19.0, 19.0, 31.0, 41.0, 49.0, 52.0, 83.0, 83.0, 99.0, 76.0, 66.0, 55.0, 51.0, 36.0, 27.0, 18.0, 24.0, 18.0, 13.0, 8.0, 12.0, 7.0, 7.0, 2.0, 6.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.0625, -19.428466796875, -18.79443359375, -18.160400390625, -17.5263671875, -16.892333984375, -16.25830078125, -15.624267578125, -14.990234375, -14.356201171875, -13.72216796875, -13.088134765625, -12.4541015625, -11.820068359375, -11.18603515625, -10.552001953125, -9.91796875, -9.283935546875, -8.64990234375, -8.015869140625, -7.3818359375, -6.747802734375, -6.11376953125, -5.479736328125, -4.845703125, -4.211669921875, -3.57763671875, -2.943603515625, -2.3095703125, -1.675537109375, -1.04150390625, -0.407470703125, 0.2265625, 0.860595703125, 1.49462890625, 2.128662109375, 2.7626953125, 3.396728515625, 4.03076171875, 4.664794921875, 5.298828125, 5.932861328125, 6.56689453125, 7.200927734375, 7.8349609375, 8.468994140625, 9.10302734375, 9.737060546875, 10.37109375, 11.005126953125, 11.63916015625, 12.273193359375, 12.9072265625, 13.541259765625, 14.17529296875, 14.809326171875, 15.443359375, 16.077392578125, 16.71142578125, 17.345458984375, 17.9794921875, 18.613525390625, 19.24755859375, 19.881591796875, 20.515625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 8.0, 6.0, 0.0, 12.0, 14.0, 18.0, 34.0, 41.0, 75.0, 104.0, 226.0, 434.0, 1125.0, 3297.0, 15371.0, 198335.0, 800290.0, 22301.0, 4292.0, 1402.0, 536.0, 229.0, 148.0, 83.0, 56.0, 42.0, 30.0, 16.0, 10.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9609375, -0.9226531982421875, -0.884368896484375, -0.8460845947265625, -0.80780029296875, -0.7695159912109375, -0.731231689453125, -0.6929473876953125, -0.6546630859375, -0.6163787841796875, -0.578094482421875, -0.5398101806640625, -0.50152587890625, -0.4632415771484375, -0.424957275390625, -0.3866729736328125, -0.348388671875, -0.3101043701171875, -0.271820068359375, -0.2335357666015625, -0.19525146484375, -0.1569671630859375, -0.118682861328125, -0.0803985595703125, -0.0421142578125, -0.0038299560546875, 0.034454345703125, 0.0727386474609375, 0.11102294921875, 0.1493072509765625, 0.187591552734375, 0.2258758544921875, 0.26416015625, 0.3024444580078125, 0.340728759765625, 0.3790130615234375, 0.41729736328125, 0.4555816650390625, 0.493865966796875, 0.5321502685546875, 0.5704345703125, 0.6087188720703125, 0.647003173828125, 0.6852874755859375, 0.72357177734375, 0.7618560791015625, 0.800140380859375, 0.8384246826171875, 0.876708984375, 0.9149932861328125, 0.953277587890625, 0.9915618896484375, 1.02984619140625, 1.0681304931640625, 1.106414794921875, 1.1446990966796875, 1.1829833984375, 1.2212677001953125, 1.259552001953125, 1.2978363037109375, 1.33612060546875, 1.3744049072265625, 1.412689208984375, 1.4509735107421875, 1.4892578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 7.0, 6.0, 8.0, 12.0, 23.0, 16.0, 25.0, 25.0, 36.0, 37.0, 59.0, 67.0, 93.0, 95.0, 89.0, 75.0, 64.0, 42.0, 41.0, 38.0, 19.0, 25.0, 17.0, 14.0, 10.0, 15.0, 7.0, 9.0, 2.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015091896057128906, -0.000145668163895607, -0.00014041736721992493, -0.00013516657054424286, -0.0001299157738685608, -0.00012466497719287872, -0.00011941418051719666, -0.00011416338384151459, -0.00010891258716583252, -0.00010366179049015045, -9.841099381446838e-05, -9.316019713878632e-05, -8.790940046310425e-05, -8.265860378742218e-05, -7.740780711174011e-05, -7.215701043605804e-05, -6.690621376037598e-05, -6.165541708469391e-05, -5.640462040901184e-05, -5.115382373332977e-05, -4.5903027057647705e-05, -4.065223038196564e-05, -3.540143370628357e-05, -3.01506370306015e-05, -2.4899840354919434e-05, -1.9649043679237366e-05, -1.4398247003555298e-05, -9.14745032787323e-06, -3.896653652191162e-06, 1.3541430234909058e-06, 6.604939699172974e-06, 1.1855736374855042e-05, 1.710653305053711e-05, 2.2357329726219177e-05, 2.7608126401901245e-05, 3.285892307758331e-05, 3.810971975326538e-05, 4.336051642894745e-05, 4.8611313104629517e-05, 5.3862109780311584e-05, 5.911290645599365e-05, 6.436370313167572e-05, 6.961449980735779e-05, 7.486529648303986e-05, 8.011609315872192e-05, 8.536688983440399e-05, 9.061768651008606e-05, 9.586848318576813e-05, 0.0001011192798614502, 0.00010637007653713226, 0.00011162087321281433, 0.0001168716698884964, 0.00012212246656417847, 0.00012737326323986053, 0.0001326240599155426, 0.00013787485659122467, 0.00014312565326690674, 0.0001483764499425888, 0.00015362724661827087, 0.00015887804329395294, 0.000164128839969635, 0.00016937963664531708, 0.00017463043332099915, 0.0001798812299966812, 0.00018513202667236328]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 7.0, 12.0, 18.0, 23.0, 27.0, 47.0, 83.0, 129.0, 188.0, 296.0, 485.0, 900.0, 1706.0, 3572.0, 8343.0, 22690.0, 84459.0, 756279.0, 122521.0, 28040.0, 10084.0, 4143.0, 2016.0, 1010.0, 552.0, 318.0, 199.0, 147.0, 83.0, 50.0, 31.0, 27.0, 24.0, 10.0, 7.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7197265625, -0.6976470947265625, -0.675567626953125, -0.6534881591796875, -0.63140869140625, -0.6093292236328125, -0.587249755859375, -0.5651702880859375, -0.5430908203125, -0.5210113525390625, -0.498931884765625, -0.4768524169921875, -0.45477294921875, -0.4326934814453125, -0.410614013671875, -0.3885345458984375, -0.366455078125, -0.3443756103515625, -0.322296142578125, -0.3002166748046875, -0.27813720703125, -0.2560577392578125, -0.233978271484375, -0.2118988037109375, -0.1898193359375, -0.1677398681640625, -0.145660400390625, -0.1235809326171875, -0.10150146484375, -0.0794219970703125, -0.057342529296875, -0.0352630615234375, -0.01318359375, 0.0088958740234375, 0.030975341796875, 0.0530548095703125, 0.07513427734375, 0.0972137451171875, 0.119293212890625, 0.1413726806640625, 0.1634521484375, 0.1855316162109375, 0.207611083984375, 0.2296905517578125, 0.25177001953125, 0.2738494873046875, 0.295928955078125, 0.3180084228515625, 0.340087890625, 0.3621673583984375, 0.384246826171875, 0.4063262939453125, 0.42840576171875, 0.4504852294921875, 0.472564697265625, 0.4946441650390625, 0.5167236328125, 0.5388031005859375, 0.560882568359375, 0.5829620361328125, 0.60504150390625, 0.6271209716796875, 0.649200439453125, 0.6712799072265625, 0.693359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 1.0, 5.0, 5.0, 1.0, 5.0, 6.0, 11.0, 17.0, 9.0, 15.0, 26.0, 30.0, 57.0, 68.0, 75.0, 76.0, 117.0, 105.0, 100.0, 72.0, 44.0, 32.0, 20.0, 23.0, 17.0, 19.0, 8.0, 9.0, 8.0, 7.0, 5.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.07421875, -1.0433349609375, -1.012451171875, -0.9815673828125, -0.95068359375, -0.9197998046875, -0.888916015625, -0.8580322265625, -0.8271484375, -0.7962646484375, -0.765380859375, -0.7344970703125, -0.70361328125, -0.6727294921875, -0.641845703125, -0.6109619140625, -0.580078125, -0.5491943359375, -0.518310546875, -0.4874267578125, -0.45654296875, -0.4256591796875, -0.394775390625, -0.3638916015625, -0.3330078125, -0.3021240234375, -0.271240234375, -0.2403564453125, -0.20947265625, -0.1785888671875, -0.147705078125, -0.1168212890625, -0.0859375, -0.0550537109375, -0.024169921875, 0.0067138671875, 0.03759765625, 0.0684814453125, 0.099365234375, 0.1302490234375, 0.1611328125, 0.1920166015625, 0.222900390625, 0.2537841796875, 0.28466796875, 0.3155517578125, 0.346435546875, 0.3773193359375, 0.408203125, 0.4390869140625, 0.469970703125, 0.5008544921875, 0.53173828125, 0.5626220703125, 0.593505859375, 0.6243896484375, 0.6552734375, 0.6861572265625, 0.717041015625, 0.7479248046875, 0.77880859375, 0.8096923828125, 0.840576171875, 0.8714599609375, 0.90234375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 12.0, 11.0, 33.0, 59.0, 293.0, 413.0, 106.0, 37.0, 18.0, 10.0, 9.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.06237030029297, -95.34998321533203, -92.6375961303711, -89.92520141601562, -87.21281433105469, -84.50042724609375, -81.78804016113281, -79.07565307617188, -76.36326599121094, -73.65087890625, -70.93849182128906, -68.22610473632812, -65.51371002197266, -62.80132293701172, -60.08893585205078, -57.376548767089844, -54.664154052734375, -51.95176696777344, -49.239376068115234, -46.5269889831543, -43.814598083496094, -41.102210998535156, -38.38982391357422, -35.67743682861328, -32.96504592895508, -30.252656936645508, -27.540267944335938, -24.827880859375, -22.11549186706543, -19.40310287475586, -16.690715789794922, -13.978326797485352, -11.26593017578125, -8.55354118347168, -5.841153144836426, -3.128765106201172, -0.41637611389160156, 2.2960128784179688, 5.008399963378906, 7.720788955688477, 10.433177947998047, 13.145566940307617, 15.857954978942871, 18.570343017578125, 21.282732009887695, 23.995121002197266, 26.707508087158203, 29.419897079467773, 32.132286071777344, 34.84467315673828, 37.557064056396484, 40.26945114135742, 42.981842041015625, 45.69422912597656, 48.4066162109375, 51.11900329589844, 53.83139419555664, 56.54378128051758, 59.25617218017578, 61.96855926513672, 64.68094635009766, 67.39334106445312, 70.10572814941406, 72.818115234375, 75.53050231933594]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 3.0, 3.0, 8.0, 9.0, 14.0, 18.0, 14.0, 18.0, 31.0, 16.0, 35.0, 20.0, 34.0, 147.0, 123.0, 87.0, 150.0, 83.0, 28.0, 21.0, 16.0, 21.0, 14.0, 12.0, 17.0, 10.0, 2.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-55.161460876464844, -53.451499938964844, -51.741539001464844, -50.03157424926758, -48.32161331176758, -46.61165237426758, -44.90168762207031, -43.19172668457031, -41.48176574707031, -39.77180480957031, -38.06184387207031, -36.35187911987305, -34.64191818237305, -32.93195724487305, -31.221994400024414, -29.51203155517578, -27.80207061767578, -26.09210968017578, -24.38214683532715, -22.672183990478516, -20.962223052978516, -19.252262115478516, -17.542299270629883, -15.832337379455566, -14.12237548828125, -12.412413597106934, -10.702451705932617, -8.9924898147583, -7.282527923583984, -5.572566032409668, -3.8626041412353516, -2.152642250061035, -0.44268035888671875, 1.2672815322875977, 2.977243423461914, 4.6872053146362305, 6.397167205810547, 8.107129096984863, 9.81709098815918, 11.527052879333496, 13.237014770507812, 14.946976661682129, 16.656938552856445, 18.366901397705078, 20.076862335205078, 21.786823272705078, 23.49678611755371, 25.206748962402344, 26.916709899902344, 28.626670837402344, 30.336633682250977, 32.04659652709961, 33.75655746459961, 35.46651840209961, 37.176483154296875, 38.886444091796875, 40.596405029296875, 42.306365966796875, 44.016326904296875, 45.72629165649414, 47.43625259399414, 49.14621353149414, 50.856178283691406, 52.566139221191406, 54.276100158691406]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 2.0, 8.0, 5.0, 5.0, 18.0, 17.0, 20.0, 32.0, 28.0, 34.0, 49.0, 66.0, 246.0, 190.0, 59.0, 39.0, 30.0, 30.0, 29.0, 15.0, 26.0, 11.0, 2.0, 11.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.55078125, -6.363525390625, -6.17626953125, -5.989013671875, -5.8017578125, -5.614501953125, -5.42724609375, -5.239990234375, -5.052734375, -4.865478515625, -4.67822265625, -4.490966796875, -4.3037109375, -4.116455078125, -3.92919921875, -3.741943359375, -3.5546875, -3.367431640625, -3.18017578125, -2.992919921875, -2.8056640625, -2.618408203125, -2.43115234375, -2.243896484375, -2.056640625, -1.869384765625, -1.68212890625, -1.494873046875, -1.3076171875, -1.120361328125, -0.93310546875, -0.745849609375, -0.55859375, -0.371337890625, -0.18408203125, 0.003173828125, 0.1904296875, 0.377685546875, 0.56494140625, 0.752197265625, 0.939453125, 1.126708984375, 1.31396484375, 1.501220703125, 1.6884765625, 1.875732421875, 2.06298828125, 2.250244140625, 2.4375, 2.624755859375, 2.81201171875, 2.999267578125, 3.1865234375, 3.373779296875, 3.56103515625, 3.748291015625, 3.935546875, 4.122802734375, 4.31005859375, 4.497314453125, 4.6845703125, 4.871826171875, 5.05908203125, 5.246337890625, 5.43359375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 9.0, 8.0, 10.0, 11.0, 17.0, 31.0, 33.0, 56.0, 138.0, 208.0, 451.0, 1306.0, 5207.0, 108822.0, 8262138.0, 7220.0, 1708.0, 554.0, 259.0, 132.0, 87.0, 51.0, 28.0, 13.0, 8.0, 18.0, 9.0, 6.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0], "bins": [-40.63267517089844, -39.186492919921875, -37.74030685424805, -36.29412078857422, -34.847938537597656, -33.401756286621094, -31.955570220947266, -30.50938606262207, -29.063201904296875, -27.61701774597168, -26.170833587646484, -24.72464942932129, -23.278465270996094, -21.8322811126709, -20.386096954345703, -18.939912796020508, -17.493728637695312, -16.047544479370117, -14.601360321044922, -13.155176162719727, -11.708992004394531, -10.262807846069336, -8.81662368774414, -7.370439529418945, -5.92425537109375, -4.478071212768555, -3.0318870544433594, -1.585702896118164, -0.13951873779296875, 1.3066654205322266, 2.752849578857422, 4.199033737182617, 5.645214080810547, 7.091398239135742, 8.537582397460938, 9.983766555786133, 11.429950714111328, 12.876134872436523, 14.322319030761719, 15.768503189086914, 17.21468734741211, 18.660871505737305, 20.1070556640625, 21.553239822387695, 22.99942398071289, 24.445608139038086, 25.89179229736328, 27.337976455688477, 28.784160614013672, 30.230344772338867, 31.676528930664062, 33.122711181640625, 34.56889724731445, 36.01508331298828, 37.461265563964844, 38.907447814941406, 40.353633880615234, 41.79981994628906, 43.246002197265625, 44.69218444824219, 46.138370513916016, 47.584556579589844, 49.030738830566406, 50.47692108154297, 51.9231071472168]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 7.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.533843994140625, -57.82734298706055, -56.1208381652832, -54.414337158203125, -52.70783615112305, -51.00133514404297, -49.294830322265625, -47.58832931518555, -45.88182830810547, -44.17532730102539, -42.46882247924805, -40.76232147216797, -39.05582046508789, -37.34931945800781, -35.64281463623047, -33.93631362915039, -32.22980880737305, -30.523305892944336, -28.816804885864258, -27.110301971435547, -25.40380096435547, -23.697298049926758, -21.990795135498047, -20.28429412841797, -18.577791213989258, -16.871288299560547, -15.164787292480469, -13.458284378051758, -11.751782417297363, -10.045280456542969, -8.338777542114258, -6.632275581359863, -4.925773620605469, -3.219271421432495, -1.5127692222595215, 0.19373321533203125, 1.9002351760864258, 3.6067371368408203, 5.313240051269531, 7.019742012023926, 8.72624397277832, 10.432745933532715, 12.13924789428711, 13.84575080871582, 15.552252769470215, 17.25875473022461, 18.96525764465332, 20.67176055908203, 22.37826156616211, 24.08476448059082, 25.7912654876709, 27.49776840209961, 29.204269409179688, 30.9107723236084, 32.61727523803711, 34.32377624511719, 36.03028106689453, 37.73678207397461, 39.44328689575195, 41.14978790283203, 42.85628890991211, 44.56278991699219, 46.26929473876953, 47.97579574584961, 49.68229675292969]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 11.0, 12.0, 32.0, 42.0, 66.0, 85.0, 187.0, 362.0, 636.0, 1180.0, 2383.0, 4808.0, 10396.0, 21895.0, 47568.0, 100811.0, 149742.0, 97533.0, 46040.0, 20998.0, 9720.0, 4919.0, 2258.0, 1227.0, 582.0, 309.0, 151.0, 113.0, 58.0, 42.0, 25.0, 20.0, 15.0, 6.0, 8.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.875, -20.14208984375, -19.4091796875, -18.67626953125, -17.943359375, -17.21044921875, -16.4775390625, -15.74462890625, -15.01171875, -14.27880859375, -13.5458984375, -12.81298828125, -12.080078125, -11.34716796875, -10.6142578125, -9.88134765625, -9.1484375, -8.41552734375, -7.6826171875, -6.94970703125, -6.216796875, -5.48388671875, -4.7509765625, -4.01806640625, -3.28515625, -2.55224609375, -1.8193359375, -1.08642578125, -0.353515625, 0.37939453125, 1.1123046875, 1.84521484375, 2.578125, 3.31103515625, 4.0439453125, 4.77685546875, 5.509765625, 6.24267578125, 6.9755859375, 7.70849609375, 8.44140625, 9.17431640625, 9.9072265625, 10.64013671875, 11.373046875, 12.10595703125, 12.8388671875, 13.57177734375, 14.3046875, 15.03759765625, 15.7705078125, 16.50341796875, 17.236328125, 17.96923828125, 18.7021484375, 19.43505859375, 20.16796875, 20.90087890625, 21.6337890625, 22.36669921875, 23.099609375, 23.83251953125, 24.5654296875, 25.29833984375, 26.03125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 4.0, 12.0, 15.0, 11.0, 17.0, 17.0, 14.0, 23.0, 25.0, 43.0, 33.0, 53.0, 64.0, 53.0, 53.0, 62.0, 70.0, 56.0, 36.0, 64.0, 46.0, 38.0, 46.0, 18.0, 9.0, 22.0, 20.0, 15.0, 15.0, 11.0, 3.0, 3.0, 5.0, 0.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.10546875, -4.96246337890625, -4.8194580078125, -4.67645263671875, -4.533447265625, -4.39044189453125, -4.2474365234375, -4.10443115234375, -3.96142578125, -3.81842041015625, -3.6754150390625, -3.53240966796875, -3.389404296875, -3.24639892578125, -3.1033935546875, -2.96038818359375, -2.8173828125, -2.67437744140625, -2.5313720703125, -2.38836669921875, -2.245361328125, -2.10235595703125, -1.9593505859375, -1.81634521484375, -1.67333984375, -1.53033447265625, -1.3873291015625, -1.24432373046875, -1.101318359375, -0.95831298828125, -0.8153076171875, -0.67230224609375, -0.529296875, -0.38629150390625, -0.2432861328125, -0.10028076171875, 0.042724609375, 0.18572998046875, 0.3287353515625, 0.47174072265625, 0.61474609375, 0.75775146484375, 0.9007568359375, 1.04376220703125, 1.186767578125, 1.32977294921875, 1.4727783203125, 1.61578369140625, 1.7587890625, 1.90179443359375, 2.0447998046875, 2.18780517578125, 2.330810546875, 2.47381591796875, 2.6168212890625, 2.75982666015625, 2.90283203125, 3.04583740234375, 3.1888427734375, 3.33184814453125, 3.474853515625, 3.61785888671875, 3.7608642578125, 3.90386962890625, 4.046875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 9.0, 6.0, 20.0, 17.0, 29.0, 46.0, 82.0, 85.0, 85.0, 47.0, 25.0, 6.0, 7.0, 6.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.987567901611328, -23.861854553222656, -22.736141204833984, -21.610427856445312, -20.48471450805664, -19.35900115966797, -18.233287811279297, -17.107574462890625, -15.981861114501953, -14.856147766113281, -13.73043441772461, -12.604721069335938, -11.479007720947266, -10.353294372558594, -9.227581024169922, -8.10186767578125, -6.976154327392578, -5.850440979003906, -4.724727630615234, -3.5990142822265625, -2.4733009338378906, -1.3475875854492188, -0.22187423706054688, 0.903839111328125, 2.029552459716797, 3.1552658081054688, 4.280979156494141, 5.4066925048828125, 6.532405853271484, 7.658119201660156, 8.783832550048828, 9.9095458984375, 11.035259246826172, 12.160972595214844, 13.286685943603516, 14.412399291992188, 15.53811264038086, 16.66382598876953, 17.789539337158203, 18.915252685546875, 20.040966033935547, 21.16667938232422, 22.29239273071289, 23.418106079101562, 24.543819427490234, 25.669532775878906, 26.795246124267578, 27.92095947265625, 29.046672821044922, 30.172386169433594, 31.298099517822266, 32.42381286621094, 33.54952621459961, 34.67523956298828, 35.80095291137695, 36.926666259765625, 38.0523796081543, 39.17809295654297, 40.30380630493164, 41.42951965332031, 42.555233001708984, 43.680946350097656, 44.80665969848633, 45.932373046875, 47.05808639526367]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 4.0, 9.0, 15.0, 26.0, 38.0, 56.0, 69.0, 72.0, 62.0, 33.0, 23.0, 21.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.846797943115234, -27.125289916992188, -26.40378189086914, -25.68227195739746, -24.960763931274414, -24.239255905151367, -23.51774787902832, -22.79623794555664, -22.074729919433594, -21.353221893310547, -20.6317138671875, -19.91020393371582, -19.188695907592773, -18.467187881469727, -17.74567985534668, -17.024169921875, -16.302661895751953, -15.581153869628906, -14.859644889831543, -14.138136863708496, -13.416627883911133, -12.695119857788086, -11.973611831665039, -11.252102851867676, -10.530595779418945, -9.809087753295898, -9.087578773498535, -8.366070747375488, -7.644561767578125, -6.923053741455078, -6.201545238494873, -5.480036735534668, -4.758527755737305, -4.0370192527771, -3.3155107498168945, -2.5940024852752686, -1.8724939823150635, -1.1509854793548584, -0.4294772148132324, 0.29203128814697266, 1.0135397911071777, 1.7350482940673828, 2.456556797027588, 3.178065061569214, 3.899573564529419, 4.621082305908203, 5.34259033203125, 6.064098834991455, 6.78560733795166, 7.507115840911865, 8.22862434387207, 8.950132369995117, 9.67164134979248, 10.393149375915527, 11.11465835571289, 11.836166381835938, 12.557674407958984, 13.279182434082031, 14.000691413879395, 14.722199440002441, 15.443708419799805, 16.16521644592285, 16.8867244720459, 17.608234405517578, 18.329742431640625]}, "eval/loss": 1.0561981201171875, "eval/wer": 0.15931503859356708, "eval/runtime": 866.3742, "eval/samples_per_second": 3.049, "eval/steps_per_second": 0.382} \ No newline at end of file +{"train/loss": 0.5258, "train/learning_rate": 5.068289786223278e-06, "train/epoch": 16.82, "train/global_step": 15000, "_runtime": 98095, "_timestamp": 1646759334, "_step": 15009, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 16.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 12.0, 29.0, 30160.0, 218.0, 32.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-204.0, -200.2578125, -196.515625, -192.7734375, -189.03125, -185.2890625, -181.546875, -177.8046875, -174.0625, -170.3203125, -166.578125, -162.8359375, -159.09375, -155.3515625, -151.609375, -147.8671875, -144.125, -140.3828125, -136.640625, -132.8984375, -129.15625, -125.4140625, -121.671875, -117.9296875, -114.1875, -110.4453125, -106.703125, -102.9609375, -99.21875, -95.4765625, -91.734375, -87.9921875, -84.25, -80.5078125, -76.765625, -73.0234375, -69.28125, -65.5390625, -61.796875, -58.0546875, -54.3125, -50.5703125, -46.828125, -43.0859375, -39.34375, -35.6015625, -31.859375, -28.1171875, -24.375, -20.6328125, -16.890625, -13.1484375, -9.40625, -5.6640625, -1.921875, 1.8203125, 5.5625, 9.3046875, 13.046875, 16.7890625, 20.53125, 24.2734375, 28.015625, 31.7578125, 35.5]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 5.0, 2.0, 4.0, 4.0, 8.0, 10.0, 12.0, 7.0, 8.0, 18.0, 15.0, 10.0, 11.0, 15.0, 16.0, 24.0, 21.0, 27.0, 27.0, 22.0, 39.0, 34.0, 47.0, 43.0, 44.0, 41.0, 33.0, 47.0, 33.0, 55.0, 32.0, 37.0, 31.0, 20.0, 19.0, 34.0, 27.0, 18.0, 12.0, 16.0, 15.0, 9.0, 12.0, 12.0, 13.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-58.242820739746094, -56.97196960449219, -55.70111846923828, -54.430267333984375, -53.15941619873047, -51.88856506347656, -50.617713928222656, -49.346866607666016, -48.07601547241211, -46.8051643371582, -45.5343132019043, -44.26346206665039, -42.992610931396484, -41.721763610839844, -40.45091247558594, -39.18006134033203, -37.909210205078125, -36.63835906982422, -35.36750793457031, -34.096656799316406, -32.8258056640625, -31.554956436157227, -30.28410530090332, -29.013256072998047, -27.742401123046875, -26.47154998779297, -25.200698852539062, -23.929847717285156, -22.658998489379883, -21.388147354125977, -20.11729621887207, -18.846446990966797, -17.575593948364258, -16.30474281311035, -15.033892631530762, -13.763041496276855, -12.492191314697266, -11.22134017944336, -9.950489044189453, -8.679638862609863, -7.408787727355957, -6.137937068939209, -4.867086410522461, -3.5962352752685547, -2.3253846168518066, -1.0545339584350586, 0.21631717681884766, 1.4871673583984375, 2.7580184936523438, 4.028869152069092, 5.29971981048584, 6.570570945739746, 7.841421604156494, 9.112272262573242, 10.383123397827148, 11.653973579406738, 12.924824714660645, 14.19567584991455, 15.46652603149414, 16.737377166748047, 18.008228302001953, 19.27907943725586, 20.549930572509766, 21.82077980041504, 23.091630935668945]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 10.0, 9.0, 11.0, 10.0, 15.0, 9.0, 24.0, 16.0, 25.0, 21.0, 31.0, 25.0, 35.0, 31.0, 27.0, 39.0, 39.0, 35.0, 41.0, 40.0, 42.0, 47.0, 37.0, 38.0, 31.0, 36.0, 35.0, 36.0, 43.0, 30.0, 19.0, 14.0, 23.0, 12.0, 14.0, 14.0, 12.0, 8.0, 7.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.22478103637695, -37.84811019897461, -36.471435546875, -35.094764709472656, -33.71809387207031, -32.3414192199707, -30.96474838256836, -29.588075637817383, -28.211402893066406, -26.83473014831543, -25.458059310913086, -24.08138656616211, -22.704713821411133, -21.328041076660156, -19.951370239257812, -18.574697494506836, -17.198026657104492, -15.821354866027832, -14.444682121276855, -13.068010330200195, -11.691337585449219, -10.314665794372559, -8.937994003295898, -7.561321258544922, -6.184649467468262, -4.807977199554443, -3.431305170059204, -2.054633140563965, -0.6779608726501465, 0.6987113952636719, 2.075383186340332, 3.4520559310913086, 4.828727722167969, 6.205399990081787, 7.5820722579956055, 8.958744049072266, 10.335416793823242, 11.712088584899902, 13.088760375976562, 14.465433120727539, 15.8421049118042, 17.21877670288086, 18.595449447631836, 19.972122192382812, 21.348793029785156, 22.725465774536133, 24.10213851928711, 25.478809356689453, 26.85548210144043, 28.232154846191406, 29.60882568359375, 30.985498428344727, 32.3621711730957, 33.73884201049805, 35.115516662597656, 36.4921875, 37.868858337402344, 39.24552917480469, 40.6222038269043, 41.99887466430664, 43.375545501708984, 44.752220153808594, 46.12889099121094, 47.50556182861328, 48.88223648071289]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 8.0, 25.0, 25.0, 35.0, 59.0, 69.0, 131.0, 198.0, 339.0, 505.0, 848.0, 1367.0, 2121.0, 3390.0, 5243.0, 7777.0, 11615.0, 17170.0, 24596.0, 34286.0, 46270.0, 60108.0, 75241.0, 89448.0, 101241.0, 126627.0, 95908.0, 84113.0, 69515.0, 55165.0, 40889.0, 30012.0, 21089.0, 14654.0, 9856.0, 6604.0, 4347.0, 2808.0, 1772.0, 1187.0, 738.0, 422.0, 270.0, 170.0, 120.0, 62.0, 46.0, 27.0, 17.0, 12.0, 7.0, 3.0, 3.0, 2.0, 2.0], "bins": [-161.375, -156.669921875, -151.96484375, -147.259765625, -142.5546875, -137.849609375, -133.14453125, -128.439453125, -123.734375, -119.029296875, -114.32421875, -109.619140625, -104.9140625, -100.208984375, -95.50390625, -90.798828125, -86.09375, -81.388671875, -76.68359375, -71.978515625, -67.2734375, -62.568359375, -57.86328125, -53.158203125, -48.453125, -43.748046875, -39.04296875, -34.337890625, -29.6328125, -24.927734375, -20.22265625, -15.517578125, -10.8125, -6.107421875, -1.40234375, 3.302734375, 8.0078125, 12.712890625, 17.41796875, 22.123046875, 26.828125, 31.533203125, 36.23828125, 40.943359375, 45.6484375, 50.353515625, 55.05859375, 59.763671875, 64.46875, 69.173828125, 73.87890625, 78.583984375, 83.2890625, 87.994140625, 92.69921875, 97.404296875, 102.109375, 106.814453125, 111.51953125, 116.224609375, 120.9296875, 125.634765625, 130.33984375, 135.044921875, 139.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 1.0, 5.0, 1.0, 7.0, 5.0, 10.0, 7.0, 8.0, 10.0, 10.0, 9.0, 10.0, 14.0, 22.0, 22.0, 18.0, 25.0, 21.0, 29.0, 35.0, 39.0, 37.0, 29.0, 45.0, 36.0, 50.0, 50.0, 35.0, 32.0, 34.0, 31.0, 35.0, 33.0, 25.0, 17.0, 30.0, 17.0, 23.0, 20.0, 11.0, 15.0, 17.0, 17.0, 7.0, 8.0, 10.0, 10.0, 9.0, 6.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.90625, -57.91845703125, -55.9306640625, -53.94287109375, -51.955078125, -49.96728515625, -47.9794921875, -45.99169921875, -44.00390625, -42.01611328125, -40.0283203125, -38.04052734375, -36.052734375, -34.06494140625, -32.0771484375, -30.08935546875, -28.1015625, -26.11376953125, -24.1259765625, -22.13818359375, -20.150390625, -18.16259765625, -16.1748046875, -14.18701171875, -12.19921875, -10.21142578125, -8.2236328125, -6.23583984375, -4.248046875, -2.26025390625, -0.2724609375, 1.71533203125, 3.703125, 5.69091796875, 7.6787109375, 9.66650390625, 11.654296875, 13.64208984375, 15.6298828125, 17.61767578125, 19.60546875, 21.59326171875, 23.5810546875, 25.56884765625, 27.556640625, 29.54443359375, 31.5322265625, 33.52001953125, 35.5078125, 37.49560546875, 39.4833984375, 41.47119140625, 43.458984375, 45.44677734375, 47.4345703125, 49.42236328125, 51.41015625, 53.39794921875, 55.3857421875, 57.37353515625, 59.361328125, 61.34912109375, 63.3369140625, 65.32470703125, 67.3125]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 3.0, 5.0, 4.0, 5.0, 6.0, 11.0, 14.0, 11.0, 15.0, 20.0, 17.0, 31.0, 35.0, 35.0, 27.0, 38.0, 44.0, 47.0, 39.0, 56.0, 42.0, 45.0, 54.0, 44.0, 46.0, 37.0, 43.0, 35.0, 25.0, 19.0, 25.0, 17.0, 22.0, 11.0, 17.0, 11.0, 13.0, 7.0, 7.0, 2.0, 5.0, 7.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.55672836303711, -47.03756332397461, -45.518394470214844, -43.999229431152344, -42.48006057739258, -40.96089553833008, -39.44172668457031, -37.92256164550781, -36.40339660644531, -34.88423156738281, -33.36506271362305, -31.845897674560547, -30.32672882080078, -28.80756378173828, -27.28839683532715, -25.769229888916016, -24.25006103515625, -22.730894088745117, -21.211727142333984, -19.692562103271484, -18.17339324951172, -16.65422821044922, -15.135061264038086, -13.615894317626953, -12.09672737121582, -10.577560424804688, -9.058393478393555, -7.539227485656738, -6.0200605392456055, -4.500893592834473, -2.9817276000976562, -1.4625606536865234, 0.056610107421875, 1.5757768154144287, 3.0949435234069824, 4.614109992980957, 6.13327693939209, 7.652443885803223, 9.171609878540039, 10.690776824951172, 12.209943771362305, 13.729110717773438, 15.24827766418457, 16.767444610595703, 18.286609649658203, 19.80577850341797, 21.32494354248047, 22.8441104888916, 24.363277435302734, 25.882444381713867, 27.401611328125, 28.9207763671875, 30.439945220947266, 31.959110260009766, 33.47827911376953, 34.99744415283203, 36.51660919189453, 38.03577423095703, 39.5549430847168, 41.0741081237793, 42.59327697753906, 44.11244201660156, 45.63160705566406, 47.15077590942383, 48.669944763183594]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 8.0, 12.0, 14.0, 18.0, 14.0, 13.0, 24.0, 18.0, 23.0, 21.0, 28.0, 24.0, 30.0, 36.0, 44.0, 46.0, 50.0, 29.0, 44.0, 48.0, 42.0, 36.0, 18.0, 49.0, 35.0, 31.0, 46.0, 18.0, 16.0, 26.0, 21.0, 16.0, 24.0, 9.0, 11.0, 7.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0], "bins": [-51.44761657714844, -49.96538162231445, -48.4831428527832, -47.00090789794922, -45.51866912841797, -44.036434173583984, -42.55419921875, -41.07196044921875, -39.589725494384766, -38.10749053955078, -36.62525177001953, -35.14301681518555, -33.66078186035156, -32.17854309082031, -30.696308135986328, -29.21407127380371, -27.731834411621094, -26.249597549438477, -24.76736068725586, -23.285125732421875, -21.802888870239258, -20.32065200805664, -18.838417053222656, -17.35618019104004, -15.873943328857422, -14.391706466674805, -12.909470558166504, -11.427234649658203, -9.944997787475586, -8.462760925292969, -6.980525016784668, -5.498289108276367, -4.01605224609375, -2.533815860748291, -1.051579475402832, 0.43065690994262695, 1.912893295288086, 3.395129680633545, 4.877366065979004, 6.359601974487305, 7.841838836669922, 9.324075698852539, 10.80631160736084, 12.28854751586914, 13.770784378051758, 15.253021240234375, 16.73525619506836, 18.217493057250977, 19.699729919433594, 21.18196678161621, 22.664203643798828, 24.146438598632812, 25.62867546081543, 27.110912322998047, 28.59314727783203, 30.07538414001465, 31.557621002197266, 33.03985595703125, 34.5220947265625, 36.004329681396484, 37.48656463623047, 38.96880340576172, 40.4510383605957, 41.93327331542969, 43.41551208496094]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 20.0, 25.0, 37.0, 52.0, 93.0, 149.0, 275.0, 339.0, 609.0, 943.0, 1510.0, 2436.0, 3865.0, 6211.0, 9995.0, 16294.0, 26501.0, 43423.0, 70672.0, 117489.0, 193413.0, 320495.0, 528809.0, 787279.0, 772325.0, 512200.0, 309424.0, 186214.0, 111785.0, 67434.0, 40454.0, 24690.0, 14972.0, 9217.0, 5618.0, 3455.0, 2140.0, 1253.0, 834.0, 513.0, 289.0, 214.0, 128.0, 72.0, 38.0, 39.0, 15.0, 10.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -76.2255859375, -73.763671875, -71.3017578125, -68.83984375, -66.3779296875, -63.916015625, -61.4541015625, -58.9921875, -56.5302734375, -54.068359375, -51.6064453125, -49.14453125, -46.6826171875, -44.220703125, -41.7587890625, -39.296875, -36.8349609375, -34.373046875, -31.9111328125, -29.44921875, -26.9873046875, -24.525390625, -22.0634765625, -19.6015625, -17.1396484375, -14.677734375, -12.2158203125, -9.75390625, -7.2919921875, -4.830078125, -2.3681640625, 0.09375, 2.5556640625, 5.017578125, 7.4794921875, 9.94140625, 12.4033203125, 14.865234375, 17.3271484375, 19.7890625, 22.2509765625, 24.712890625, 27.1748046875, 29.63671875, 32.0986328125, 34.560546875, 37.0224609375, 39.484375, 41.9462890625, 44.408203125, 46.8701171875, 49.33203125, 51.7939453125, 54.255859375, 56.7177734375, 59.1796875, 61.6416015625, 64.103515625, 66.5654296875, 69.02734375, 71.4892578125, 73.951171875, 76.4130859375, 78.875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 7.0, 5.0, 10.0, 11.0, 6.0, 7.0, 13.0, 17.0, 25.0, 12.0, 16.0, 19.0, 25.0, 30.0, 26.0, 25.0, 27.0, 45.0, 42.0, 31.0, 40.0, 39.0, 38.0, 41.0, 48.0, 41.0, 38.0, 26.0, 29.0, 27.0, 37.0, 17.0, 27.0, 26.0, 21.0, 22.0, 19.0, 8.0, 8.0, 8.0, 14.0, 5.0, 7.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-41.8125, -40.55517578125, -39.2978515625, -38.04052734375, -36.783203125, -35.52587890625, -34.2685546875, -33.01123046875, -31.75390625, -30.49658203125, -29.2392578125, -27.98193359375, -26.724609375, -25.46728515625, -24.2099609375, -22.95263671875, -21.6953125, -20.43798828125, -19.1806640625, -17.92333984375, -16.666015625, -15.40869140625, -14.1513671875, -12.89404296875, -11.63671875, -10.37939453125, -9.1220703125, -7.86474609375, -6.607421875, -5.35009765625, -4.0927734375, -2.83544921875, -1.578125, -0.32080078125, 0.9365234375, 2.19384765625, 3.451171875, 4.70849609375, 5.9658203125, 7.22314453125, 8.48046875, 9.73779296875, 10.9951171875, 12.25244140625, 13.509765625, 14.76708984375, 16.0244140625, 17.28173828125, 18.5390625, 19.79638671875, 21.0537109375, 22.31103515625, 23.568359375, 24.82568359375, 26.0830078125, 27.34033203125, 28.59765625, 29.85498046875, 31.1123046875, 32.36962890625, 33.626953125, 34.88427734375, 36.1416015625, 37.39892578125, 38.65625]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 17.0, 27.0, 41.0, 68.0, 79.0, 139.0, 221.0, 366.0, 567.0, 937.0, 1559.0, 2673.0, 4364.0, 7335.0, 11855.0, 20233.0, 33330.0, 55258.0, 91577.0, 147523.0, 235897.0, 361487.0, 516783.0, 649434.0, 637974.0, 494972.0, 341776.0, 222490.0, 139409.0, 85942.0, 51698.0, 31423.0, 18455.0, 11160.0, 6912.0, 4024.0, 2446.0, 1461.0, 918.0, 539.0, 314.0, 223.0, 123.0, 78.0, 48.0, 32.0, 21.0, 20.0, 14.0, 7.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-48.0625, -46.5087890625, -44.955078125, -43.4013671875, -41.84765625, -40.2939453125, -38.740234375, -37.1865234375, -35.6328125, -34.0791015625, -32.525390625, -30.9716796875, -29.41796875, -27.8642578125, -26.310546875, -24.7568359375, -23.203125, -21.6494140625, -20.095703125, -18.5419921875, -16.98828125, -15.4345703125, -13.880859375, -12.3271484375, -10.7734375, -9.2197265625, -7.666015625, -6.1123046875, -4.55859375, -3.0048828125, -1.451171875, 0.1025390625, 1.65625, 3.2099609375, 4.763671875, 6.3173828125, 7.87109375, 9.4248046875, 10.978515625, 12.5322265625, 14.0859375, 15.6396484375, 17.193359375, 18.7470703125, 20.30078125, 21.8544921875, 23.408203125, 24.9619140625, 26.515625, 28.0693359375, 29.623046875, 31.1767578125, 32.73046875, 34.2841796875, 35.837890625, 37.3916015625, 38.9453125, 40.4990234375, 42.052734375, 43.6064453125, 45.16015625, 46.7138671875, 48.267578125, 49.8212890625, 51.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 11.0, 13.0, 3.0, 15.0, 15.0, 17.0, 24.0, 31.0, 34.0, 52.0, 39.0, 77.0, 81.0, 94.0, 125.0, 129.0, 154.0, 186.0, 207.0, 186.0, 213.0, 244.0, 224.0, 216.0, 231.0, 205.0, 219.0, 165.0, 147.0, 140.0, 117.0, 83.0, 84.0, 63.0, 50.0, 44.0, 31.0, 18.0, 15.0, 17.0, 7.0, 14.0, 11.0, 8.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -20.01171875, -19.3671875, -18.72265625, -18.078125, -17.43359375, -16.7890625, -16.14453125, -15.5, -14.85546875, -14.2109375, -13.56640625, -12.921875, -12.27734375, -11.6328125, -10.98828125, -10.34375, -9.69921875, -9.0546875, -8.41015625, -7.765625, -7.12109375, -6.4765625, -5.83203125, -5.1875, -4.54296875, -3.8984375, -3.25390625, -2.609375, -1.96484375, -1.3203125, -0.67578125, -0.03125, 0.61328125, 1.2578125, 1.90234375, 2.546875, 3.19140625, 3.8359375, 4.48046875, 5.125, 5.76953125, 6.4140625, 7.05859375, 7.703125, 8.34765625, 8.9921875, 9.63671875, 10.28125, 10.92578125, 11.5703125, 12.21484375, 12.859375, 13.50390625, 14.1484375, 14.79296875, 15.4375, 16.08203125, 16.7265625, 17.37109375, 18.015625, 18.66015625, 19.3046875, 19.94921875, 20.59375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 11.0, 13.0, 15.0, 19.0, 20.0, 24.0, 25.0, 41.0, 44.0, 46.0, 58.0, 58.0, 45.0, 44.0, 54.0, 68.0, 39.0, 49.0, 40.0, 40.0, 31.0, 39.0, 21.0, 26.0, 21.0, 15.0, 22.0, 18.0, 18.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.5589714050293, -50.855369567871094, -49.15176773071289, -47.44816589355469, -45.744564056396484, -44.04096221923828, -42.33735656738281, -40.633758544921875, -38.930152893066406, -37.2265510559082, -35.52294921875, -33.8193473815918, -32.115745544433594, -30.41214370727539, -28.708539962768555, -27.00493812561035, -25.30133819580078, -23.597736358642578, -21.894134521484375, -20.190532684326172, -18.48693084716797, -16.783329010009766, -15.07972526550293, -13.376123428344727, -11.672521591186523, -9.96891975402832, -8.265317916870117, -6.561715126037598, -4.8581132888793945, -3.1545114517211914, -1.4509086608886719, 0.25269317626953125, 1.9562950134277344, 3.6598970890045166, 5.363499164581299, 7.06710147857666, 8.770703315734863, 10.474305152893066, 12.177907943725586, 13.881509780883789, 15.585111618041992, 17.288713455200195, 18.9923152923584, 20.695919036865234, 22.399520874023438, 24.10312271118164, 25.806724548339844, 27.510326385498047, 29.21392822265625, 30.917530059814453, 32.621131896972656, 34.32473373413086, 36.02833557128906, 37.731937408447266, 39.43553924560547, 41.13914489746094, 42.842742919921875, 44.54634475708008, 46.24994659423828, 47.953548431396484, 49.65715026855469, 51.36075210571289, 53.064353942871094, 54.76795959472656, 56.471561431884766]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 4.0, 8.0, 8.0, 5.0, 15.0, 12.0, 10.0, 14.0, 11.0, 20.0, 12.0, 21.0, 19.0, 31.0, 36.0, 33.0, 47.0, 32.0, 42.0, 51.0, 30.0, 32.0, 31.0, 46.0, 37.0, 40.0, 42.0, 37.0, 33.0, 29.0, 29.0, 25.0, 21.0, 20.0, 17.0, 27.0, 14.0, 13.0, 7.0, 9.0, 9.0, 3.0, 4.0, 2.0, 0.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-47.955162048339844, -46.58327102661133, -45.21137619018555, -43.83948516845703, -42.46759033203125, -41.095699310302734, -39.72380828857422, -38.35191345214844, -36.980018615722656, -35.60812759399414, -34.23623275756836, -32.864341735839844, -31.492446899414062, -30.120555877685547, -28.7486629486084, -27.37677001953125, -26.004878997802734, -24.632986068725586, -23.261093139648438, -21.889202117919922, -20.51730728149414, -19.145416259765625, -17.773523330688477, -16.401630401611328, -15.02973747253418, -13.657844543457031, -12.285951614379883, -10.91405963897705, -9.542166709899902, -8.170273780822754, -6.798381805419922, -5.426488876342773, -4.054599761962891, -2.6827070713043213, -1.310814380645752, 0.06107807159423828, 1.4329710006713867, 2.804863929748535, 4.176755905151367, 5.548648834228516, 6.920541763305664, 8.292434692382812, 9.664327621459961, 11.036219596862793, 12.408112525939941, 13.78000545501709, 15.151897430419922, 16.52379035949707, 17.89568328857422, 19.267576217651367, 20.639469146728516, 22.01136016845703, 23.383255004882812, 24.755146026611328, 26.127038955688477, 27.498931884765625, 28.870824813842773, 30.242717742919922, 31.61461067199707, 32.98650360107422, 34.358394622802734, 35.730289459228516, 37.10218048095703, 38.47407531738281, 39.84596633911133]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 14.0, 21.0, 39.0, 44.0, 71.0, 107.0, 163.0, 238.0, 397.0, 611.0, 930.0, 1363.0, 2189.0, 3275.0, 5170.0, 7678.0, 12117.0, 18816.0, 29531.0, 47621.0, 78676.0, 127177.0, 179032.0, 182505.0, 132928.0, 81872.0, 50047.0, 30402.0, 19418.0, 12609.0, 8209.0, 5391.0, 3501.0, 2268.0, 1447.0, 926.0, 615.0, 402.0, 251.0, 169.0, 123.0, 61.0, 46.0, 30.0, 14.0, 18.0, 4.0, 7.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-72.0625, -69.8818359375, -67.701171875, -65.5205078125, -63.33984375, -61.1591796875, -58.978515625, -56.7978515625, -54.6171875, -52.4365234375, -50.255859375, -48.0751953125, -45.89453125, -43.7138671875, -41.533203125, -39.3525390625, -37.171875, -34.9912109375, -32.810546875, -30.6298828125, -28.44921875, -26.2685546875, -24.087890625, -21.9072265625, -19.7265625, -17.5458984375, -15.365234375, -13.1845703125, -11.00390625, -8.8232421875, -6.642578125, -4.4619140625, -2.28125, -0.1005859375, 2.080078125, 4.2607421875, 6.44140625, 8.6220703125, 10.802734375, 12.9833984375, 15.1640625, 17.3447265625, 19.525390625, 21.7060546875, 23.88671875, 26.0673828125, 28.248046875, 30.4287109375, 32.609375, 34.7900390625, 36.970703125, 39.1513671875, 41.33203125, 43.5126953125, 45.693359375, 47.8740234375, 50.0546875, 52.2353515625, 54.416015625, 56.5966796875, 58.77734375, 60.9580078125, 63.138671875, 65.3193359375, 67.5]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 7.0, 11.0, 4.0, 6.0, 7.0, 12.0, 10.0, 10.0, 20.0, 19.0, 20.0, 29.0, 29.0, 41.0, 40.0, 26.0, 42.0, 37.0, 34.0, 32.0, 41.0, 45.0, 39.0, 50.0, 45.0, 37.0, 38.0, 31.0, 34.0, 23.0, 28.0, 28.0, 24.0, 14.0, 11.0, 17.0, 13.0, 10.0, 6.0, 7.0, 1.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 5.0], "bins": [-45.78125, -44.54638671875, -43.3115234375, -42.07666015625, -40.841796875, -39.60693359375, -38.3720703125, -37.13720703125, -35.90234375, -34.66748046875, -33.4326171875, -32.19775390625, -30.962890625, -29.72802734375, -28.4931640625, -27.25830078125, -26.0234375, -24.78857421875, -23.5537109375, -22.31884765625, -21.083984375, -19.84912109375, -18.6142578125, -17.37939453125, -16.14453125, -14.90966796875, -13.6748046875, -12.43994140625, -11.205078125, -9.97021484375, -8.7353515625, -7.50048828125, -6.265625, -5.03076171875, -3.7958984375, -2.56103515625, -1.326171875, -0.09130859375, 1.1435546875, 2.37841796875, 3.61328125, 4.84814453125, 6.0830078125, 7.31787109375, 8.552734375, 9.78759765625, 11.0224609375, 12.25732421875, 13.4921875, 14.72705078125, 15.9619140625, 17.19677734375, 18.431640625, 19.66650390625, 20.9013671875, 22.13623046875, 23.37109375, 24.60595703125, 25.8408203125, 27.07568359375, 28.310546875, 29.54541015625, 30.7802734375, 32.01513671875, 33.25]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 4.0, 9.0, 13.0, 18.0, 30.0, 36.0, 61.0, 70.0, 109.0, 173.0, 196.0, 380.0, 531.0, 751.0, 1086.0, 1657.0, 2575.0, 3910.0, 6251.0, 9744.0, 15968.0, 26566.0, 45571.0, 85470.0, 164166.0, 255535.0, 192641.0, 101553.0, 53644.0, 30438.0, 18055.0, 11160.0, 7198.0, 4483.0, 2869.0, 1873.0, 1134.0, 858.0, 536.0, 392.0, 251.0, 198.0, 118.0, 76.0, 60.0, 37.0, 26.0, 17.0, 20.0, 11.0, 9.0, 8.0, 6.0, 2.0, 0.0, 1.0, 5.0], "bins": [-93.625, -90.755859375, -87.88671875, -85.017578125, -82.1484375, -79.279296875, -76.41015625, -73.541015625, -70.671875, -67.802734375, -64.93359375, -62.064453125, -59.1953125, -56.326171875, -53.45703125, -50.587890625, -47.71875, -44.849609375, -41.98046875, -39.111328125, -36.2421875, -33.373046875, -30.50390625, -27.634765625, -24.765625, -21.896484375, -19.02734375, -16.158203125, -13.2890625, -10.419921875, -7.55078125, -4.681640625, -1.8125, 1.056640625, 3.92578125, 6.794921875, 9.6640625, 12.533203125, 15.40234375, 18.271484375, 21.140625, 24.009765625, 26.87890625, 29.748046875, 32.6171875, 35.486328125, 38.35546875, 41.224609375, 44.09375, 46.962890625, 49.83203125, 52.701171875, 55.5703125, 58.439453125, 61.30859375, 64.177734375, 67.046875, 69.916015625, 72.78515625, 75.654296875, 78.5234375, 81.392578125, 84.26171875, 87.130859375, 90.0]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 8.0, 13.0, 15.0, 22.0, 18.0, 17.0, 23.0, 19.0, 24.0, 36.0, 35.0, 34.0, 25.0, 32.0, 29.0, 36.0, 38.0, 37.0, 40.0, 35.0, 47.0, 51.0, 40.0, 36.0, 36.0, 31.0, 36.0, 27.0, 23.0, 30.0, 9.0, 18.0, 14.0, 14.0, 2.0, 15.0, 4.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.609375, -26.753662109375, -25.89794921875, -25.042236328125, -24.1865234375, -23.330810546875, -22.47509765625, -21.619384765625, -20.763671875, -19.907958984375, -19.05224609375, -18.196533203125, -17.3408203125, -16.485107421875, -15.62939453125, -14.773681640625, -13.91796875, -13.062255859375, -12.20654296875, -11.350830078125, -10.4951171875, -9.639404296875, -8.78369140625, -7.927978515625, -7.072265625, -6.216552734375, -5.36083984375, -4.505126953125, -3.6494140625, -2.793701171875, -1.93798828125, -1.082275390625, -0.2265625, 0.629150390625, 1.48486328125, 2.340576171875, 3.1962890625, 4.052001953125, 4.90771484375, 5.763427734375, 6.619140625, 7.474853515625, 8.33056640625, 9.186279296875, 10.0419921875, 10.897705078125, 11.75341796875, 12.609130859375, 13.46484375, 14.320556640625, 15.17626953125, 16.031982421875, 16.8876953125, 17.743408203125, 18.59912109375, 19.454833984375, 20.310546875, 21.166259765625, 22.02197265625, 22.877685546875, 23.7333984375, 24.589111328125, 25.44482421875, 26.300537109375, 27.15625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 14.0, 15.0, 25.0, 33.0, 52.0, 52.0, 92.0, 152.0, 236.0, 300.0, 564.0, 918.0, 1525.0, 2820.0, 5294.0, 10068.0, 20319.0, 43603.0, 97125.0, 206720.0, 294559.0, 193679.0, 89912.0, 40455.0, 19289.0, 9192.0, 4980.0, 2683.0, 1510.0, 887.0, 537.0, 324.0, 212.0, 118.0, 92.0, 68.0, 34.0, 31.0, 20.0, 14.0, 13.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.625, -41.3115234375, -39.998046875, -38.6845703125, -37.37109375, -36.0576171875, -34.744140625, -33.4306640625, -32.1171875, -30.8037109375, -29.490234375, -28.1767578125, -26.86328125, -25.5498046875, -24.236328125, -22.9228515625, -21.609375, -20.2958984375, -18.982421875, -17.6689453125, -16.35546875, -15.0419921875, -13.728515625, -12.4150390625, -11.1015625, -9.7880859375, -8.474609375, -7.1611328125, -5.84765625, -4.5341796875, -3.220703125, -1.9072265625, -0.59375, 0.7197265625, 2.033203125, 3.3466796875, 4.66015625, 5.9736328125, 7.287109375, 8.6005859375, 9.9140625, 11.2275390625, 12.541015625, 13.8544921875, 15.16796875, 16.4814453125, 17.794921875, 19.1083984375, 20.421875, 21.7353515625, 23.048828125, 24.3623046875, 25.67578125, 26.9892578125, 28.302734375, 29.6162109375, 30.9296875, 32.2431640625, 33.556640625, 34.8701171875, 36.18359375, 37.4970703125, 38.810546875, 40.1240234375, 41.4375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 4.0, 5.0, 12.0, 11.0, 28.0, 34.0, 104.0, 156.0, 203.0, 176.0, 99.0, 62.0, 28.0, 28.0, 8.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007694244384765625, -0.007504522800445557, -0.007314801216125488, -0.00712507963180542, -0.0069353580474853516, -0.006745636463165283, -0.006555914878845215, -0.0063661932945251465, -0.006176471710205078, -0.00598675012588501, -0.005797028541564941, -0.005607306957244873, -0.005417585372924805, -0.005227863788604736, -0.005038142204284668, -0.0048484206199646, -0.004658699035644531, -0.004468977451324463, -0.0042792558670043945, -0.004089534282684326, -0.003899812698364258, -0.0037100911140441895, -0.003520369529724121, -0.0033306479454040527, -0.0031409263610839844, -0.002951204776763916, -0.0027614831924438477, -0.0025717616081237793, -0.002382040023803711, -0.0021923184394836426, -0.0020025968551635742, -0.0018128752708435059, -0.0016231536865234375, -0.0014334321022033691, -0.0012437105178833008, -0.0010539889335632324, -0.0008642673492431641, -0.0006745457649230957, -0.00048482418060302734, -0.000295102596282959, -0.00010538101196289062, 8.434057235717773e-05, 0.0002740621566772461, 0.00046378374099731445, 0.0006535053253173828, 0.0008432269096374512, 0.0010329484939575195, 0.0012226700782775879, 0.0014123916625976562, 0.0016021132469177246, 0.001791834831237793, 0.0019815564155578613, 0.0021712779998779297, 0.002360999584197998, 0.0025507211685180664, 0.0027404427528381348, 0.002930164337158203, 0.0031198859214782715, 0.00330960750579834, 0.003499329090118408, 0.0036890506744384766, 0.003878772258758545, 0.004068493843078613, 0.004258215427398682, 0.00444793701171875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 12.0, 13.0, 6.0, 21.0, 22.0, 33.0, 43.0, 71.0, 98.0, 144.0, 263.0, 384.0, 583.0, 1032.0, 1878.0, 3133.0, 5843.0, 10738.0, 19964.0, 37650.0, 68236.0, 115371.0, 169329.0, 195367.0, 164929.0, 111178.0, 65043.0, 35332.0, 18950.0, 10007.0, 5457.0, 3028.0, 1742.0, 979.0, 592.0, 399.0, 218.0, 153.0, 98.0, 73.0, 45.0, 28.0, 18.0, 13.0, 9.0, 15.0, 6.0, 6.0, 8.0, 1.0, 2.0, 0.0, 2.0], "bins": [-40.125, -38.96044921875, -37.7958984375, -36.63134765625, -35.466796875, -34.30224609375, -33.1376953125, -31.97314453125, -30.80859375, -29.64404296875, -28.4794921875, -27.31494140625, -26.150390625, -24.98583984375, -23.8212890625, -22.65673828125, -21.4921875, -20.32763671875, -19.1630859375, -17.99853515625, -16.833984375, -15.66943359375, -14.5048828125, -13.34033203125, -12.17578125, -11.01123046875, -9.8466796875, -8.68212890625, -7.517578125, -6.35302734375, -5.1884765625, -4.02392578125, -2.859375, -1.69482421875, -0.5302734375, 0.63427734375, 1.798828125, 2.96337890625, 4.1279296875, 5.29248046875, 6.45703125, 7.62158203125, 8.7861328125, 9.95068359375, 11.115234375, 12.27978515625, 13.4443359375, 14.60888671875, 15.7734375, 16.93798828125, 18.1025390625, 19.26708984375, 20.431640625, 21.59619140625, 22.7607421875, 23.92529296875, 25.08984375, 26.25439453125, 27.4189453125, 28.58349609375, 29.748046875, 30.91259765625, 32.0771484375, 33.24169921875, 34.40625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 8.0, 2.0, 1.0, 2.0, 11.0, 6.0, 14.0, 14.0, 20.0, 16.0, 34.0, 28.0, 21.0, 33.0, 48.0, 52.0, 58.0, 38.0, 54.0, 59.0, 69.0, 54.0, 44.0, 49.0, 49.0, 44.0, 31.0, 31.0, 20.0, 19.0, 17.0, 16.0, 7.0, 6.0, 9.0, 7.0, 0.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.3704833984375, -11.967529296875, -11.5645751953125, -11.16162109375, -10.7586669921875, -10.355712890625, -9.9527587890625, -9.5498046875, -9.1468505859375, -8.743896484375, -8.3409423828125, -7.93798828125, -7.5350341796875, -7.132080078125, -6.7291259765625, -6.326171875, -5.9232177734375, -5.520263671875, -5.1173095703125, -4.71435546875, -4.3114013671875, -3.908447265625, -3.5054931640625, -3.1025390625, -2.6995849609375, -2.296630859375, -1.8936767578125, -1.49072265625, -1.0877685546875, -0.684814453125, -0.2818603515625, 0.12109375, 0.5240478515625, 0.927001953125, 1.3299560546875, 1.73291015625, 2.1358642578125, 2.538818359375, 2.9417724609375, 3.3447265625, 3.7476806640625, 4.150634765625, 4.5535888671875, 4.95654296875, 5.3594970703125, 5.762451171875, 6.1654052734375, 6.568359375, 6.9713134765625, 7.374267578125, 7.7772216796875, 8.18017578125, 8.5831298828125, 8.986083984375, 9.3890380859375, 9.7919921875, 10.1949462890625, 10.597900390625, 11.0008544921875, 11.40380859375, 11.8067626953125, 12.209716796875, 12.6126708984375, 13.015625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 10.0, 11.0, 9.0, 12.0, 19.0, 15.0, 33.0, 25.0, 33.0, 45.0, 38.0, 52.0, 52.0, 55.0, 59.0, 46.0, 58.0, 75.0, 33.0, 49.0, 50.0, 31.0, 34.0, 20.0, 25.0, 21.0, 16.0, 18.0, 10.0, 10.0, 9.0, 13.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-49.54157257080078, -48.033504486083984, -46.52544021606445, -45.017372131347656, -43.509307861328125, -42.00123977661133, -40.49317169189453, -38.985107421875, -37.47704315185547, -35.96897506713867, -34.46091079711914, -32.952842712402344, -31.444778442382812, -29.936710357666016, -28.42864418029785, -26.920578002929688, -25.41250991821289, -23.904443740844727, -22.396377563476562, -20.888309478759766, -19.380245208740234, -17.872177124023438, -16.364110946655273, -14.85604476928711, -13.347978591918945, -11.839912414550781, -10.331846237182617, -8.823779106140137, -7.315712928771973, -5.807646751403809, -4.299579620361328, -2.791513442993164, -1.2834510803222656, 0.22461533546447754, 1.7326817512512207, 3.240748405456543, 4.748814582824707, 6.256880760192871, 7.764947891235352, 9.273014068603516, 10.78108024597168, 12.289146423339844, 13.797212600708008, 15.305279731750488, 16.81334686279297, 18.3214111328125, 19.829479217529297, 21.33754539489746, 22.845611572265625, 24.35367774963379, 25.861743927001953, 27.36981201171875, 28.87787628173828, 30.385944366455078, 31.894010543823242, 33.402076721191406, 34.91014099121094, 36.418209075927734, 37.926273345947266, 39.43434143066406, 40.942405700683594, 42.45047378540039, 43.95854187011719, 45.46660614013672, 46.974674224853516]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 10.0, 8.0, 10.0, 23.0, 9.0, 9.0, 8.0, 19.0, 19.0, 19.0, 26.0, 22.0, 18.0, 33.0, 47.0, 34.0, 52.0, 40.0, 36.0, 35.0, 31.0, 39.0, 45.0, 40.0, 35.0, 37.0, 56.0, 31.0, 18.0, 21.0, 23.0, 19.0, 21.0, 17.0, 13.0, 16.0, 14.0, 7.0, 7.0, 6.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0], "bins": [-40.58488082885742, -39.42475128173828, -38.26462173461914, -37.1044921875, -35.94436264038086, -34.78423309326172, -33.62410354614258, -32.46397399902344, -31.303844451904297, -30.143714904785156, -28.983585357666016, -27.823455810546875, -26.663326263427734, -25.503196716308594, -24.343067169189453, -23.182937622070312, -22.02280616760254, -20.8626766204834, -19.702547073364258, -18.542417526245117, -17.382287979125977, -16.222158432006836, -15.062027931213379, -13.901898384094238, -12.741768836975098, -11.581639289855957, -10.421509742736816, -9.26137924194336, -8.101249694824219, -6.941120624542236, -5.7809906005859375, -4.620861053466797, -3.4607315063476562, -2.3006019592285156, -1.140472173690796, 0.019657611846923828, 1.1797871589660645, 2.339916706085205, 3.500046730041504, 4.6601762771606445, 5.820305824279785, 6.980435371398926, 8.140564918518066, 9.300695419311523, 10.460824966430664, 11.620954513549805, 12.781084060668945, 13.941213607788086, 15.101343154907227, 16.261472702026367, 17.421602249145508, 18.58173179626465, 19.74186134338379, 20.90199089050293, 22.062122344970703, 23.222251892089844, 24.382381439208984, 25.542510986328125, 26.702640533447266, 27.862770080566406, 29.022899627685547, 30.183029174804688, 31.343158721923828, 32.50328826904297, 33.66341781616211]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 7.0, 12.0, 15.0, 33.0, 34.0, 50.0, 78.0, 163.0, 201.0, 305.0, 528.0, 795.0, 1191.0, 1896.0, 3124.0, 4759.0, 7258.0, 11451.0, 17487.0, 26634.0, 39100.0, 55328.0, 75192.0, 94269.0, 110395.0, 117948.0, 113353.0, 99236.0, 79780.0, 60058.0, 42763.0, 29409.0, 19882.0, 12851.0, 8228.0, 5421.0, 3368.0, 2159.0, 1419.0, 806.0, 573.0, 352.0, 220.0, 169.0, 88.0, 52.0, 46.0, 18.0, 16.0, 19.0, 8.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0], "bins": [-47.8125, -46.34716796875, -44.8818359375, -43.41650390625, -41.951171875, -40.48583984375, -39.0205078125, -37.55517578125, -36.08984375, -34.62451171875, -33.1591796875, -31.69384765625, -30.228515625, -28.76318359375, -27.2978515625, -25.83251953125, -24.3671875, -22.90185546875, -21.4365234375, -19.97119140625, -18.505859375, -17.04052734375, -15.5751953125, -14.10986328125, -12.64453125, -11.17919921875, -9.7138671875, -8.24853515625, -6.783203125, -5.31787109375, -3.8525390625, -2.38720703125, -0.921875, 0.54345703125, 2.0087890625, 3.47412109375, 4.939453125, 6.40478515625, 7.8701171875, 9.33544921875, 10.80078125, 12.26611328125, 13.7314453125, 15.19677734375, 16.662109375, 18.12744140625, 19.5927734375, 21.05810546875, 22.5234375, 23.98876953125, 25.4541015625, 26.91943359375, 28.384765625, 29.85009765625, 31.3154296875, 32.78076171875, 34.24609375, 35.71142578125, 37.1767578125, 38.64208984375, 40.107421875, 41.57275390625, 43.0380859375, 44.50341796875, 45.96875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 5.0, 6.0, 9.0, 11.0, 14.0, 9.0, 9.0, 15.0, 19.0, 20.0, 15.0, 23.0, 31.0, 26.0, 30.0, 29.0, 31.0, 35.0, 41.0, 51.0, 43.0, 29.0, 34.0, 49.0, 33.0, 48.0, 40.0, 37.0, 28.0, 25.0, 32.0, 24.0, 17.0, 16.0, 10.0, 21.0, 16.0, 14.0, 12.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 3.0], "bins": [-37.03125, -35.975341796875, -34.91943359375, -33.863525390625, -32.8076171875, -31.751708984375, -30.69580078125, -29.639892578125, -28.583984375, -27.528076171875, -26.47216796875, -25.416259765625, -24.3603515625, -23.304443359375, -22.24853515625, -21.192626953125, -20.13671875, -19.080810546875, -18.02490234375, -16.968994140625, -15.9130859375, -14.857177734375, -13.80126953125, -12.745361328125, -11.689453125, -10.633544921875, -9.57763671875, -8.521728515625, -7.4658203125, -6.409912109375, -5.35400390625, -4.298095703125, -3.2421875, -2.186279296875, -1.13037109375, -0.074462890625, 0.9814453125, 2.037353515625, 3.09326171875, 4.149169921875, 5.205078125, 6.260986328125, 7.31689453125, 8.372802734375, 9.4287109375, 10.484619140625, 11.54052734375, 12.596435546875, 13.65234375, 14.708251953125, 15.76416015625, 16.820068359375, 17.8759765625, 18.931884765625, 19.98779296875, 21.043701171875, 22.099609375, 23.155517578125, 24.21142578125, 25.267333984375, 26.3232421875, 27.379150390625, 28.43505859375, 29.490966796875, 30.546875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 9.0, 6.0, 24.0, 31.0, 37.0, 78.0, 138.0, 233.0, 386.0, 658.0, 1146.0, 1985.0, 3439.0, 6278.0, 10776.0, 18044.0, 29903.0, 47372.0, 70692.0, 97786.0, 122984.0, 136800.0, 133736.0, 115352.0, 88330.0, 61432.0, 40073.0, 25012.0, 14879.0, 8915.0, 5167.0, 2893.0, 1622.0, 959.0, 562.0, 314.0, 223.0, 111.0, 56.0, 47.0, 27.0, 22.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.0, -48.4287109375, -46.857421875, -45.2861328125, -43.71484375, -42.1435546875, -40.572265625, -39.0009765625, -37.4296875, -35.8583984375, -34.287109375, -32.7158203125, -31.14453125, -29.5732421875, -28.001953125, -26.4306640625, -24.859375, -23.2880859375, -21.716796875, -20.1455078125, -18.57421875, -17.0029296875, -15.431640625, -13.8603515625, -12.2890625, -10.7177734375, -9.146484375, -7.5751953125, -6.00390625, -4.4326171875, -2.861328125, -1.2900390625, 0.28125, 1.8525390625, 3.423828125, 4.9951171875, 6.56640625, 8.1376953125, 9.708984375, 11.2802734375, 12.8515625, 14.4228515625, 15.994140625, 17.5654296875, 19.13671875, 20.7080078125, 22.279296875, 23.8505859375, 25.421875, 26.9931640625, 28.564453125, 30.1357421875, 31.70703125, 33.2783203125, 34.849609375, 36.4208984375, 37.9921875, 39.5634765625, 41.134765625, 42.7060546875, 44.27734375, 45.8486328125, 47.419921875, 48.9912109375, 50.5625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 6.0, 9.0, 9.0, 10.0, 14.0, 16.0, 17.0, 22.0, 26.0, 29.0, 25.0, 23.0, 32.0, 46.0, 37.0, 46.0, 49.0, 41.0, 49.0, 42.0, 41.0, 28.0, 31.0, 30.0, 24.0, 32.0, 28.0, 34.0, 27.0, 35.0, 19.0, 26.0, 9.0, 15.0, 10.0, 14.0, 17.0, 4.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.59619140625, -22.8642578125, -22.13232421875, -21.400390625, -20.66845703125, -19.9365234375, -19.20458984375, -18.47265625, -17.74072265625, -17.0087890625, -16.27685546875, -15.544921875, -14.81298828125, -14.0810546875, -13.34912109375, -12.6171875, -11.88525390625, -11.1533203125, -10.42138671875, -9.689453125, -8.95751953125, -8.2255859375, -7.49365234375, -6.76171875, -6.02978515625, -5.2978515625, -4.56591796875, -3.833984375, -3.10205078125, -2.3701171875, -1.63818359375, -0.90625, -0.17431640625, 0.5576171875, 1.28955078125, 2.021484375, 2.75341796875, 3.4853515625, 4.21728515625, 4.94921875, 5.68115234375, 6.4130859375, 7.14501953125, 7.876953125, 8.60888671875, 9.3408203125, 10.07275390625, 10.8046875, 11.53662109375, 12.2685546875, 13.00048828125, 13.732421875, 14.46435546875, 15.1962890625, 15.92822265625, 16.66015625, 17.39208984375, 18.1240234375, 18.85595703125, 19.587890625, 20.31982421875, 21.0517578125, 21.78369140625, 22.515625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 9.0, 7.0, 15.0, 28.0, 33.0, 53.0, 75.0, 80.0, 128.0, 157.0, 231.0, 370.0, 516.0, 769.0, 1313.0, 2150.0, 3949.0, 7366.0, 14507.0, 30301.0, 62441.0, 122172.0, 200716.0, 231380.0, 174566.0, 97784.0, 48611.0, 23334.0, 11333.0, 5837.0, 3185.0, 1899.0, 1078.0, 648.0, 465.0, 292.0, 238.0, 121.0, 95.0, 83.0, 63.0, 37.0, 31.0, 28.0, 20.0, 9.0, 11.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-28.296875, -27.3935546875, -26.490234375, -25.5869140625, -24.68359375, -23.7802734375, -22.876953125, -21.9736328125, -21.0703125, -20.1669921875, -19.263671875, -18.3603515625, -17.45703125, -16.5537109375, -15.650390625, -14.7470703125, -13.84375, -12.9404296875, -12.037109375, -11.1337890625, -10.23046875, -9.3271484375, -8.423828125, -7.5205078125, -6.6171875, -5.7138671875, -4.810546875, -3.9072265625, -3.00390625, -2.1005859375, -1.197265625, -0.2939453125, 0.609375, 1.5126953125, 2.416015625, 3.3193359375, 4.22265625, 5.1259765625, 6.029296875, 6.9326171875, 7.8359375, 8.7392578125, 9.642578125, 10.5458984375, 11.44921875, 12.3525390625, 13.255859375, 14.1591796875, 15.0625, 15.9658203125, 16.869140625, 17.7724609375, 18.67578125, 19.5791015625, 20.482421875, 21.3857421875, 22.2890625, 23.1923828125, 24.095703125, 24.9990234375, 25.90234375, 26.8056640625, 27.708984375, 28.6123046875, 29.515625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 13.0, 6.0, 18.0, 18.0, 26.0, 35.0, 45.0, 51.0, 61.0, 86.0, 82.0, 91.0, 92.0, 83.0, 60.0, 57.0, 35.0, 34.0, 21.0, 15.0, 15.0, 9.0, 6.0, 1.0, 10.0, 5.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029392242431640625, -0.0028423964977264404, -0.0027455687522888184, -0.0026487410068511963, -0.0025519132614135742, -0.002455085515975952, -0.00235825777053833, -0.002261430025100708, -0.002164602279663086, -0.002067774534225464, -0.001970946788787842, -0.0018741190433502197, -0.0017772912979125977, -0.0016804635524749756, -0.0015836358070373535, -0.0014868080615997314, -0.0013899803161621094, -0.0012931525707244873, -0.0011963248252868652, -0.0010994970798492432, -0.001002669334411621, -0.000905841588973999, -0.000809013843536377, -0.0007121860980987549, -0.0006153583526611328, -0.0005185306072235107, -0.00042170286178588867, -0.0003248751163482666, -0.00022804737091064453, -0.00013121962547302246, -3.439188003540039e-05, 6.243586540222168e-05, 0.00015926361083984375, 0.0002560913562774658, 0.0003529191017150879, 0.00044974684715270996, 0.000546574592590332, 0.0006434023380279541, 0.0007402300834655762, 0.0008370578289031982, 0.0009338855743408203, 0.0010307133197784424, 0.0011275410652160645, 0.0012243688106536865, 0.0013211965560913086, 0.0014180243015289307, 0.0015148520469665527, 0.0016116797924041748, 0.0017085075378417969, 0.001805335283279419, 0.001902163028717041, 0.001998990774154663, 0.002095818519592285, 0.0021926462650299072, 0.0022894740104675293, 0.0023863017559051514, 0.0024831295013427734, 0.0025799572467803955, 0.0026767849922180176, 0.0027736127376556396, 0.0028704404830932617, 0.002967268228530884, 0.003064095973968506, 0.003160923719406128, 0.00325775146484375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 13.0, 18.0, 34.0, 44.0, 75.0, 92.0, 145.0, 200.0, 331.0, 457.0, 721.0, 1118.0, 1830.0, 2879.0, 4767.0, 8029.0, 13350.0, 22974.0, 38804.0, 64802.0, 103760.0, 146971.0, 172121.0, 157665.0, 117788.0, 76332.0, 45982.0, 27282.0, 15967.0, 9280.0, 5486.0, 3359.0, 2041.0, 1309.0, 878.0, 573.0, 354.0, 243.0, 144.0, 105.0, 64.0, 45.0, 35.0, 27.0, 19.0, 9.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0], "bins": [-20.140625, -19.52392578125, -18.9072265625, -18.29052734375, -17.673828125, -17.05712890625, -16.4404296875, -15.82373046875, -15.20703125, -14.59033203125, -13.9736328125, -13.35693359375, -12.740234375, -12.12353515625, -11.5068359375, -10.89013671875, -10.2734375, -9.65673828125, -9.0400390625, -8.42333984375, -7.806640625, -7.18994140625, -6.5732421875, -5.95654296875, -5.33984375, -4.72314453125, -4.1064453125, -3.48974609375, -2.873046875, -2.25634765625, -1.6396484375, -1.02294921875, -0.40625, 0.21044921875, 0.8271484375, 1.44384765625, 2.060546875, 2.67724609375, 3.2939453125, 3.91064453125, 4.52734375, 5.14404296875, 5.7607421875, 6.37744140625, 6.994140625, 7.61083984375, 8.2275390625, 8.84423828125, 9.4609375, 10.07763671875, 10.6943359375, 11.31103515625, 11.927734375, 12.54443359375, 13.1611328125, 13.77783203125, 14.39453125, 15.01123046875, 15.6279296875, 16.24462890625, 16.861328125, 17.47802734375, 18.0947265625, 18.71142578125, 19.328125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 4.0, 3.0, 13.0, 18.0, 15.0, 15.0, 20.0, 23.0, 14.0, 37.0, 38.0, 43.0, 48.0, 48.0, 52.0, 45.0, 47.0, 53.0, 45.0, 54.0, 34.0, 42.0, 35.0, 32.0, 34.0, 35.0, 24.0, 24.0, 18.0, 15.0, 10.0, 12.0, 6.0, 6.0, 3.0, 1.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91015625, -6.686279296875, -6.46240234375, -6.238525390625, -6.0146484375, -5.790771484375, -5.56689453125, -5.343017578125, -5.119140625, -4.895263671875, -4.67138671875, -4.447509765625, -4.2236328125, -3.999755859375, -3.77587890625, -3.552001953125, -3.328125, -3.104248046875, -2.88037109375, -2.656494140625, -2.4326171875, -2.208740234375, -1.98486328125, -1.760986328125, -1.537109375, -1.313232421875, -1.08935546875, -0.865478515625, -0.6416015625, -0.417724609375, -0.19384765625, 0.030029296875, 0.25390625, 0.477783203125, 0.70166015625, 0.925537109375, 1.1494140625, 1.373291015625, 1.59716796875, 1.821044921875, 2.044921875, 2.268798828125, 2.49267578125, 2.716552734375, 2.9404296875, 3.164306640625, 3.38818359375, 3.612060546875, 3.8359375, 4.059814453125, 4.28369140625, 4.507568359375, 4.7314453125, 4.955322265625, 5.17919921875, 5.403076171875, 5.626953125, 5.850830078125, 6.07470703125, 6.298583984375, 6.5224609375, 6.746337890625, 6.97021484375, 7.194091796875, 7.41796875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 5.0, 7.0, 4.0, 9.0, 22.0, 17.0, 29.0, 24.0, 39.0, 32.0, 35.0, 45.0, 54.0, 58.0, 57.0, 56.0, 51.0, 50.0, 46.0, 56.0, 43.0, 43.0, 30.0, 26.0, 23.0, 27.0, 24.0, 17.0, 13.0, 13.0, 9.0, 10.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.233482360839844, -38.822452545166016, -37.41141891479492, -36.000389099121094, -34.58935546875, -33.17832565307617, -31.76729393005371, -30.35626220703125, -28.94523048400879, -27.534198760986328, -26.123167037963867, -24.712135314941406, -23.301105499267578, -21.890071868896484, -20.479042053222656, -19.068010330200195, -17.656978607177734, -16.245946884155273, -14.834915161132812, -13.423884391784668, -12.012852668762207, -10.601820945739746, -9.190790176391602, -7.779758453369141, -6.36872673034668, -4.957695007324219, -3.546663761138916, -2.1356325149536133, -0.7246007919311523, 0.6864309310913086, 2.097461700439453, 3.508493423461914, 4.919521331787109, 6.33055305480957, 7.741584300994873, 9.152615547180176, 10.563647270202637, 11.974678993225098, 13.385709762573242, 14.796741485595703, 16.207773208618164, 17.618804931640625, 19.029836654663086, 20.440868377685547, 21.851898193359375, 23.26293182373047, 24.673961639404297, 26.084993362426758, 27.49602508544922, 28.90705680847168, 30.31808853149414, 31.72911834716797, 33.14015197753906, 34.55118179321289, 35.96221160888672, 37.37324523925781, 38.784278869628906, 40.195308685302734, 41.60634231567383, 43.017372131347656, 44.42840576171875, 45.83943557739258, 47.250465393066406, 48.6614990234375, 50.07252883911133]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 2.0, 7.0, 9.0, 5.0, 6.0, 7.0, 10.0, 8.0, 10.0, 16.0, 6.0, 11.0, 17.0, 18.0, 19.0, 25.0, 38.0, 39.0, 19.0, 41.0, 36.0, 47.0, 36.0, 37.0, 42.0, 44.0, 49.0, 41.0, 45.0, 32.0, 24.0, 31.0, 36.0, 23.0, 25.0, 15.0, 23.0, 21.0, 17.0, 22.0, 14.0, 6.0, 9.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-40.91275405883789, -39.78478240966797, -38.65681076049805, -37.528839111328125, -36.4008674621582, -35.27289581298828, -34.14492416381836, -33.01695251464844, -31.888978958129883, -30.76100730895996, -29.63303565979004, -28.505064010620117, -27.377090454101562, -26.24911880493164, -25.12114715576172, -23.993175506591797, -22.865203857421875, -21.737232208251953, -20.60926055908203, -19.48128890991211, -18.353317260742188, -17.225345611572266, -16.09737205505371, -14.969400405883789, -13.841428756713867, -12.713457107543945, -11.585485458374023, -10.457512855529785, -9.329541206359863, -8.201569557189941, -7.073597431182861, -5.945625305175781, -4.817649841308594, -3.6896779537200928, -2.561706066131592, -1.4337341785430908, -0.30576229095458984, 0.822209358215332, 1.950181484222412, 3.078153610229492, 4.206125259399414, 5.334096908569336, 6.462069034576416, 7.590041160583496, 8.718012809753418, 9.84598445892334, 10.973957061767578, 12.1019287109375, 13.229900360107422, 14.357872009277344, 15.485843658447266, 16.613815307617188, 17.74178695678711, 18.86975860595703, 19.997732162475586, 21.125703811645508, 22.25367546081543, 23.38164710998535, 24.509618759155273, 25.637590408325195, 26.76556396484375, 27.893535614013672, 29.021507263183594, 30.149478912353516, 31.277450561523438]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 11.0, 8.0, 18.0, 34.0, 43.0, 60.0, 88.0, 144.0, 215.0, 316.0, 471.0, 722.0, 1197.0, 1820.0, 2963.0, 4814.0, 7859.0, 12766.0, 21281.0, 35084.0, 58698.0, 99158.0, 168897.0, 292391.0, 493190.0, 748890.0, 804589.0, 580676.0, 352488.0, 207352.0, 121112.0, 71273.0, 42173.0, 25336.0, 15114.0, 9113.0, 5374.0, 3261.0, 1954.0, 1260.0, 752.0, 488.0, 277.0, 190.0, 118.0, 86.0, 52.0, 38.0, 21.0, 19.0, 10.0, 10.0, 2.0, 2.0, 2.0], "bins": [-54.0625, -52.52490234375, -50.9873046875, -49.44970703125, -47.912109375, -46.37451171875, -44.8369140625, -43.29931640625, -41.76171875, -40.22412109375, -38.6865234375, -37.14892578125, -35.611328125, -34.07373046875, -32.5361328125, -30.99853515625, -29.4609375, -27.92333984375, -26.3857421875, -24.84814453125, -23.310546875, -21.77294921875, -20.2353515625, -18.69775390625, -17.16015625, -15.62255859375, -14.0849609375, -12.54736328125, -11.009765625, -9.47216796875, -7.9345703125, -6.39697265625, -4.859375, -3.32177734375, -1.7841796875, -0.24658203125, 1.291015625, 2.82861328125, 4.3662109375, 5.90380859375, 7.44140625, 8.97900390625, 10.5166015625, 12.05419921875, 13.591796875, 15.12939453125, 16.6669921875, 18.20458984375, 19.7421875, 21.27978515625, 22.8173828125, 24.35498046875, 25.892578125, 27.43017578125, 28.9677734375, 30.50537109375, 32.04296875, 33.58056640625, 35.1181640625, 36.65576171875, 38.193359375, 39.73095703125, 41.2685546875, 42.80615234375, 44.34375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 1.0, 4.0, 6.0, 7.0, 13.0, 10.0, 3.0, 12.0, 11.0, 16.0, 14.0, 13.0, 20.0, 28.0, 26.0, 29.0, 41.0, 36.0, 36.0, 47.0, 36.0, 39.0, 39.0, 50.0, 47.0, 52.0, 34.0, 31.0, 32.0, 23.0, 36.0, 30.0, 24.0, 25.0, 14.0, 22.0, 19.0, 10.0, 14.0, 14.0, 8.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-29.4375, -28.629150390625, -27.82080078125, -27.012451171875, -26.2041015625, -25.395751953125, -24.58740234375, -23.779052734375, -22.970703125, -22.162353515625, -21.35400390625, -20.545654296875, -19.7373046875, -18.928955078125, -18.12060546875, -17.312255859375, -16.50390625, -15.695556640625, -14.88720703125, -14.078857421875, -13.2705078125, -12.462158203125, -11.65380859375, -10.845458984375, -10.037109375, -9.228759765625, -8.42041015625, -7.612060546875, -6.8037109375, -5.995361328125, -5.18701171875, -4.378662109375, -3.5703125, -2.761962890625, -1.95361328125, -1.145263671875, -0.3369140625, 0.471435546875, 1.27978515625, 2.088134765625, 2.896484375, 3.704833984375, 4.51318359375, 5.321533203125, 6.1298828125, 6.938232421875, 7.74658203125, 8.554931640625, 9.36328125, 10.171630859375, 10.97998046875, 11.788330078125, 12.5966796875, 13.405029296875, 14.21337890625, 15.021728515625, 15.830078125, 16.638427734375, 17.44677734375, 18.255126953125, 19.0634765625, 19.871826171875, 20.68017578125, 21.488525390625, 22.296875]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 10.0, 18.0, 22.0, 21.0, 48.0, 87.0, 125.0, 180.0, 308.0, 606.0, 1008.0, 1826.0, 3350.0, 5958.0, 11064.0, 20526.0, 38176.0, 72667.0, 135413.0, 248043.0, 431045.0, 670883.0, 820532.0, 696986.0, 456845.0, 265053.0, 145910.0, 77410.0, 41512.0, 22055.0, 11951.0, 6351.0, 3620.0, 1989.0, 1111.0, 621.0, 398.0, 208.0, 140.0, 81.0, 36.0, 25.0, 21.0, 16.0, 13.0, 10.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.03125, -39.77099609375, -38.5107421875, -37.25048828125, -35.990234375, -34.72998046875, -33.4697265625, -32.20947265625, -30.94921875, -29.68896484375, -28.4287109375, -27.16845703125, -25.908203125, -24.64794921875, -23.3876953125, -22.12744140625, -20.8671875, -19.60693359375, -18.3466796875, -17.08642578125, -15.826171875, -14.56591796875, -13.3056640625, -12.04541015625, -10.78515625, -9.52490234375, -8.2646484375, -7.00439453125, -5.744140625, -4.48388671875, -3.2236328125, -1.96337890625, -0.703125, 0.55712890625, 1.8173828125, 3.07763671875, 4.337890625, 5.59814453125, 6.8583984375, 8.11865234375, 9.37890625, 10.63916015625, 11.8994140625, 13.15966796875, 14.419921875, 15.68017578125, 16.9404296875, 18.20068359375, 19.4609375, 20.72119140625, 21.9814453125, 23.24169921875, 24.501953125, 25.76220703125, 27.0224609375, 28.28271484375, 29.54296875, 30.80322265625, 32.0634765625, 33.32373046875, 34.583984375, 35.84423828125, 37.1044921875, 38.36474609375, 39.625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 11.0, 14.0, 30.0, 24.0, 41.0, 46.0, 67.0, 69.0, 94.0, 98.0, 130.0, 148.0, 180.0, 180.0, 200.0, 235.0, 270.0, 288.0, 227.0, 258.0, 236.0, 216.0, 202.0, 167.0, 124.0, 95.0, 84.0, 67.0, 60.0, 57.0, 41.0, 25.0, 21.0, 17.0, 17.0, 4.0, 9.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.688232421875, -14.22021484375, -13.752197265625, -13.2841796875, -12.816162109375, -12.34814453125, -11.880126953125, -11.412109375, -10.944091796875, -10.47607421875, -10.008056640625, -9.5400390625, -9.072021484375, -8.60400390625, -8.135986328125, -7.66796875, -7.199951171875, -6.73193359375, -6.263916015625, -5.7958984375, -5.327880859375, -4.85986328125, -4.391845703125, -3.923828125, -3.455810546875, -2.98779296875, -2.519775390625, -2.0517578125, -1.583740234375, -1.11572265625, -0.647705078125, -0.1796875, 0.288330078125, 0.75634765625, 1.224365234375, 1.6923828125, 2.160400390625, 2.62841796875, 3.096435546875, 3.564453125, 4.032470703125, 4.50048828125, 4.968505859375, 5.4365234375, 5.904541015625, 6.37255859375, 6.840576171875, 7.30859375, 7.776611328125, 8.24462890625, 8.712646484375, 9.1806640625, 9.648681640625, 10.11669921875, 10.584716796875, 11.052734375, 11.520751953125, 11.98876953125, 12.456787109375, 12.9248046875, 13.392822265625, 13.86083984375, 14.328857421875, 14.796875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 5.0, 2.0, 14.0, 3.0, 11.0, 12.0, 15.0, 24.0, 24.0, 32.0, 42.0, 41.0, 42.0, 35.0, 40.0, 52.0, 66.0, 54.0, 64.0, 48.0, 54.0, 47.0, 39.0, 39.0, 32.0, 25.0, 31.0, 15.0, 22.0, 16.0, 10.0, 8.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.40579605102539, -28.250099182128906, -27.094402313232422, -25.938703536987305, -24.78300666809082, -23.627309799194336, -22.47161102294922, -21.315914154052734, -20.16021728515625, -19.004520416259766, -17.84882354736328, -16.693124771118164, -15.53742790222168, -14.381731033325195, -13.226033210754395, -12.070335388183594, -10.91463851928711, -9.758941650390625, -8.603243827819824, -7.447546482086182, -6.291849136352539, -5.1361517906188965, -3.980454444885254, -2.824756622314453, -1.6690597534179688, -0.5133624076843262, 0.6423349380493164, 1.798032283782959, 2.9537296295166016, 4.109426975250244, 5.265124320983887, 6.4208221435546875, 7.576515197753906, 8.73221206665039, 9.887909889221191, 11.043607711791992, 12.199304580688477, 13.355001449584961, 14.510699272155762, 15.666397094726562, 16.822093963623047, 17.97779083251953, 19.133487701416016, 20.289186477661133, 21.444883346557617, 22.6005802154541, 23.75627899169922, 24.911975860595703, 26.067672729492188, 27.223369598388672, 28.379066467285156, 29.534765243530273, 30.690462112426758, 31.846158981323242, 33.00185775756836, 34.157554626464844, 35.31325149536133, 36.46894836425781, 37.6246452331543, 38.78034210205078, 39.93604278564453, 41.091739654541016, 42.2474365234375, 43.403133392333984, 44.55883026123047]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 10.0, 7.0, 6.0, 9.0, 6.0, 18.0, 21.0, 26.0, 26.0, 26.0, 25.0, 21.0, 39.0, 39.0, 35.0, 43.0, 38.0, 35.0, 52.0, 45.0, 28.0, 37.0, 44.0, 44.0, 42.0, 33.0, 29.0, 26.0, 29.0, 24.0, 25.0, 16.0, 17.0, 14.0, 8.0, 9.0, 11.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-31.140579223632812, -30.188535690307617, -29.236492156982422, -28.28445053100586, -27.332406997680664, -26.38036346435547, -25.428321838378906, -24.47627830505371, -23.524234771728516, -22.57219123840332, -21.620147705078125, -20.668106079101562, -19.716062545776367, -18.764019012451172, -17.81197738647461, -16.859933853149414, -15.907890319824219, -14.955846786499023, -14.003804206848145, -13.051761627197266, -12.09971809387207, -11.147674560546875, -10.195631980895996, -9.243589401245117, -8.291545867919922, -7.339502811431885, -6.387459754943848, -5.4354166984558105, -4.483373641967773, -3.5313305854797363, -2.579287528991699, -1.627244472503662, -0.6751995086669922, 0.2768435478210449, 1.228886604309082, 2.180929660797119, 3.1329727172851562, 4.085015773773193, 5.0370588302612305, 5.989101886749268, 6.941144943237305, 7.893187999725342, 8.845231056213379, 9.797273635864258, 10.749317169189453, 11.701360702514648, 12.653403282165527, 13.605445861816406, 14.557489395141602, 15.509532928466797, 16.46157455444336, 17.413618087768555, 18.36566162109375, 19.317705154418945, 20.26974868774414, 21.221790313720703, 22.1738338470459, 23.125877380371094, 24.077919006347656, 25.02996253967285, 25.982006072998047, 26.934049606323242, 27.886093139648438, 28.838134765625, 29.790178298950195]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 6.0, 5.0, 14.0, 20.0, 29.0, 31.0, 69.0, 109.0, 152.0, 271.0, 441.0, 735.0, 1230.0, 2119.0, 3577.0, 6233.0, 11135.0, 18571.0, 30696.0, 50133.0, 77452.0, 111214.0, 140879.0, 152386.0, 138337.0, 107848.0, 74506.0, 47997.0, 29425.0, 17821.0, 10457.0, 6167.0, 3487.0, 1969.0, 1192.0, 739.0, 444.0, 233.0, 153.0, 95.0, 73.0, 35.0, 26.0, 13.0, 10.0, 14.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.9375, -64.875, -62.8125, -60.75, -58.6875, -56.625, -54.5625, -52.5, -50.4375, -48.375, -46.3125, -44.25, -42.1875, -40.125, -38.0625, -36.0, -33.9375, -31.875, -29.8125, -27.75, -25.6875, -23.625, -21.5625, -19.5, -17.4375, -15.375, -13.3125, -11.25, -9.1875, -7.125, -5.0625, -3.0, -0.9375, 1.125, 3.1875, 5.25, 7.3125, 9.375, 11.4375, 13.5, 15.5625, 17.625, 19.6875, 21.75, 23.8125, 25.875, 27.9375, 30.0, 32.0625, 34.125, 36.1875, 38.25, 40.3125, 42.375, 44.4375, 46.5, 48.5625, 50.625, 52.6875, 54.75, 56.8125, 58.875, 60.9375, 63.0, 65.0625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 10.0, 4.0, 5.0, 2.0, 3.0, 9.0, 6.0, 5.0, 18.0, 14.0, 19.0, 21.0, 15.0, 19.0, 25.0, 24.0, 34.0, 32.0, 35.0, 33.0, 30.0, 40.0, 45.0, 40.0, 43.0, 39.0, 43.0, 41.0, 42.0, 26.0, 37.0, 25.0, 32.0, 22.0, 22.0, 17.0, 27.0, 14.0, 19.0, 11.0, 10.0, 5.0, 9.0, 4.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-20.5625, -19.95654296875, -19.3505859375, -18.74462890625, -18.138671875, -17.53271484375, -16.9267578125, -16.32080078125, -15.71484375, -15.10888671875, -14.5029296875, -13.89697265625, -13.291015625, -12.68505859375, -12.0791015625, -11.47314453125, -10.8671875, -10.26123046875, -9.6552734375, -9.04931640625, -8.443359375, -7.83740234375, -7.2314453125, -6.62548828125, -6.01953125, -5.41357421875, -4.8076171875, -4.20166015625, -3.595703125, -2.98974609375, -2.3837890625, -1.77783203125, -1.171875, -0.56591796875, 0.0400390625, 0.64599609375, 1.251953125, 1.85791015625, 2.4638671875, 3.06982421875, 3.67578125, 4.28173828125, 4.8876953125, 5.49365234375, 6.099609375, 6.70556640625, 7.3115234375, 7.91748046875, 8.5234375, 9.12939453125, 9.7353515625, 10.34130859375, 10.947265625, 11.55322265625, 12.1591796875, 12.76513671875, 13.37109375, 13.97705078125, 14.5830078125, 15.18896484375, 15.794921875, 16.40087890625, 17.0068359375, 17.61279296875, 18.21875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 15.0, 14.0, 17.0, 22.0, 47.0, 96.0, 101.0, 198.0, 330.0, 484.0, 755.0, 1230.0, 1897.0, 2997.0, 4809.0, 7669.0, 12967.0, 21192.0, 34601.0, 57754.0, 94939.0, 146880.0, 188409.0, 169864.0, 116935.0, 72346.0, 43341.0, 26557.0, 15799.0, 9887.0, 6033.0, 3812.0, 2434.0, 1508.0, 995.0, 577.0, 383.0, 238.0, 157.0, 101.0, 60.0, 34.0, 20.0, 20.0, 14.0, 9.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.8125, -69.6181640625, -67.423828125, -65.2294921875, -63.03515625, -60.8408203125, -58.646484375, -56.4521484375, -54.2578125, -52.0634765625, -49.869140625, -47.6748046875, -45.48046875, -43.2861328125, -41.091796875, -38.8974609375, -36.703125, -34.5087890625, -32.314453125, -30.1201171875, -27.92578125, -25.7314453125, -23.537109375, -21.3427734375, -19.1484375, -16.9541015625, -14.759765625, -12.5654296875, -10.37109375, -8.1767578125, -5.982421875, -3.7880859375, -1.59375, 0.6005859375, 2.794921875, 4.9892578125, 7.18359375, 9.3779296875, 11.572265625, 13.7666015625, 15.9609375, 18.1552734375, 20.349609375, 22.5439453125, 24.73828125, 26.9326171875, 29.126953125, 31.3212890625, 33.515625, 35.7099609375, 37.904296875, 40.0986328125, 42.29296875, 44.4873046875, 46.681640625, 48.8759765625, 51.0703125, 53.2646484375, 55.458984375, 57.6533203125, 59.84765625, 62.0419921875, 64.236328125, 66.4306640625, 68.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 4.0, 15.0, 7.0, 10.0, 16.0, 18.0, 23.0, 24.0, 31.0, 24.0, 25.0, 33.0, 37.0, 31.0, 38.0, 45.0, 44.0, 35.0, 32.0, 41.0, 36.0, 41.0, 33.0, 35.0, 26.0, 47.0, 37.0, 30.0, 28.0, 26.0, 25.0, 21.0, 15.0, 13.0, 8.0, 11.0, 2.0, 2.0, 8.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8515625, -14.3096923828125, -13.767822265625, -13.2259521484375, -12.68408203125, -12.1422119140625, -11.600341796875, -11.0584716796875, -10.5166015625, -9.9747314453125, -9.432861328125, -8.8909912109375, -8.34912109375, -7.8072509765625, -7.265380859375, -6.7235107421875, -6.181640625, -5.6397705078125, -5.097900390625, -4.5560302734375, -4.01416015625, -3.4722900390625, -2.930419921875, -2.3885498046875, -1.8466796875, -1.3048095703125, -0.762939453125, -0.2210693359375, 0.32080078125, 0.8626708984375, 1.404541015625, 1.9464111328125, 2.48828125, 3.0301513671875, 3.572021484375, 4.1138916015625, 4.65576171875, 5.1976318359375, 5.739501953125, 6.2813720703125, 6.8232421875, 7.3651123046875, 7.906982421875, 8.4488525390625, 8.99072265625, 9.5325927734375, 10.074462890625, 10.6163330078125, 11.158203125, 11.7000732421875, 12.241943359375, 12.7838134765625, 13.32568359375, 13.8675537109375, 14.409423828125, 14.9512939453125, 15.4931640625, 16.0350341796875, 16.576904296875, 17.1187744140625, 17.66064453125, 18.2025146484375, 18.744384765625, 19.2862548828125, 19.828125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 4.0, 9.0, 17.0, 14.0, 21.0, 37.0, 50.0, 70.0, 89.0, 155.0, 168.0, 267.0, 393.0, 609.0, 852.0, 1307.0, 2097.0, 3635.0, 6763.0, 13749.0, 32039.0, 92044.0, 324319.0, 383908.0, 113928.0, 37795.0, 15916.0, 7673.0, 4089.0, 2351.0, 1320.0, 871.0, 562.0, 423.0, 284.0, 181.0, 136.0, 128.0, 68.0, 62.0, 51.0, 21.0, 25.0, 17.0, 15.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-62.46875, -60.52197265625, -58.5751953125, -56.62841796875, -54.681640625, -52.73486328125, -50.7880859375, -48.84130859375, -46.89453125, -44.94775390625, -43.0009765625, -41.05419921875, -39.107421875, -37.16064453125, -35.2138671875, -33.26708984375, -31.3203125, -29.37353515625, -27.4267578125, -25.47998046875, -23.533203125, -21.58642578125, -19.6396484375, -17.69287109375, -15.74609375, -13.79931640625, -11.8525390625, -9.90576171875, -7.958984375, -6.01220703125, -4.0654296875, -2.11865234375, -0.171875, 1.77490234375, 3.7216796875, 5.66845703125, 7.615234375, 9.56201171875, 11.5087890625, 13.45556640625, 15.40234375, 17.34912109375, 19.2958984375, 21.24267578125, 23.189453125, 25.13623046875, 27.0830078125, 29.02978515625, 30.9765625, 32.92333984375, 34.8701171875, 36.81689453125, 38.763671875, 40.71044921875, 42.6572265625, 44.60400390625, 46.55078125, 48.49755859375, 50.4443359375, 52.39111328125, 54.337890625, 56.28466796875, 58.2314453125, 60.17822265625, 62.125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 3.0, 8.0, 13.0, 13.0, 20.0, 21.0, 25.0, 36.0, 69.0, 84.0, 109.0, 129.0, 123.0, 102.0, 77.0, 51.0, 30.0, 22.0, 10.0, 18.0, 7.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.005649566650390625, -0.0054724812507629395, -0.005295395851135254, -0.005118310451507568, -0.004941225051879883, -0.004764139652252197, -0.004587054252624512, -0.004409968852996826, -0.004232883453369141, -0.004055798053741455, -0.0038787126541137695, -0.003701627254486084, -0.0035245418548583984, -0.003347456455230713, -0.0031703710556030273, -0.002993285655975342, -0.0028162002563476562, -0.0026391148567199707, -0.002462029457092285, -0.0022849440574645996, -0.002107858657836914, -0.0019307732582092285, -0.001753687858581543, -0.0015766024589538574, -0.0013995170593261719, -0.0012224316596984863, -0.0010453462600708008, -0.0008682608604431152, -0.0006911754608154297, -0.0005140900611877441, -0.0003370046615600586, -0.00015991926193237305, 1.71661376953125e-05, 0.00019425153732299805, 0.0003713369369506836, 0.0005484223365783691, 0.0007255077362060547, 0.0009025931358337402, 0.0010796785354614258, 0.0012567639350891113, 0.0014338493347167969, 0.0016109347343444824, 0.001788020133972168, 0.0019651055335998535, 0.002142190933227539, 0.0023192763328552246, 0.00249636173248291, 0.0026734471321105957, 0.0028505325317382812, 0.003027617931365967, 0.0032047033309936523, 0.003381788730621338, 0.0035588741302490234, 0.003735959529876709, 0.0039130449295043945, 0.00409013032913208, 0.004267215728759766, 0.004444301128387451, 0.004621386528015137, 0.004798471927642822, 0.004975557327270508, 0.005152642726898193, 0.005329728126525879, 0.0055068135261535645, 0.00568389892578125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 10.0, 16.0, 10.0, 23.0, 29.0, 45.0, 60.0, 84.0, 90.0, 122.0, 156.0, 212.0, 301.0, 425.0, 578.0, 841.0, 1114.0, 1771.0, 2765.0, 4595.0, 8464.0, 17606.0, 42407.0, 111086.0, 257671.0, 314130.0, 166599.0, 64011.0, 25612.0, 11467.0, 5897.0, 3378.0, 2175.0, 1382.0, 939.0, 689.0, 478.0, 355.0, 251.0, 198.0, 135.0, 99.0, 80.0, 54.0, 35.0, 40.0, 21.0, 20.0, 15.0, 2.0, 9.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-32.40625, -31.3681640625, -30.330078125, -29.2919921875, -28.25390625, -27.2158203125, -26.177734375, -25.1396484375, -24.1015625, -23.0634765625, -22.025390625, -20.9873046875, -19.94921875, -18.9111328125, -17.873046875, -16.8349609375, -15.796875, -14.7587890625, -13.720703125, -12.6826171875, -11.64453125, -10.6064453125, -9.568359375, -8.5302734375, -7.4921875, -6.4541015625, -5.416015625, -4.3779296875, -3.33984375, -2.3017578125, -1.263671875, -0.2255859375, 0.8125, 1.8505859375, 2.888671875, 3.9267578125, 4.96484375, 6.0029296875, 7.041015625, 8.0791015625, 9.1171875, 10.1552734375, 11.193359375, 12.2314453125, 13.26953125, 14.3076171875, 15.345703125, 16.3837890625, 17.421875, 18.4599609375, 19.498046875, 20.5361328125, 21.57421875, 22.6123046875, 23.650390625, 24.6884765625, 25.7265625, 26.7646484375, 27.802734375, 28.8408203125, 29.87890625, 30.9169921875, 31.955078125, 32.9931640625, 34.03125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 9.0, 12.0, 12.0, 21.0, 27.0, 39.0, 67.0, 87.0, 118.0, 124.0, 110.0, 90.0, 66.0, 49.0, 43.0, 30.0, 21.0, 13.0, 8.0, 7.0, 3.0, 5.0, 5.0, 7.0, 7.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.6365966796875, -12.249755859375, -11.8629150390625, -11.47607421875, -11.0892333984375, -10.702392578125, -10.3155517578125, -9.9287109375, -9.5418701171875, -9.155029296875, -8.7681884765625, -8.38134765625, -7.9945068359375, -7.607666015625, -7.2208251953125, -6.833984375, -6.4471435546875, -6.060302734375, -5.6734619140625, -5.28662109375, -4.8997802734375, -4.512939453125, -4.1260986328125, -3.7392578125, -3.3524169921875, -2.965576171875, -2.5787353515625, -2.19189453125, -1.8050537109375, -1.418212890625, -1.0313720703125, -0.64453125, -0.2576904296875, 0.129150390625, 0.5159912109375, 0.90283203125, 1.2896728515625, 1.676513671875, 2.0633544921875, 2.4501953125, 2.8370361328125, 3.223876953125, 3.6107177734375, 3.99755859375, 4.3843994140625, 4.771240234375, 5.1580810546875, 5.544921875, 5.9317626953125, 6.318603515625, 6.7054443359375, 7.09228515625, 7.4791259765625, 7.865966796875, 8.2528076171875, 8.6396484375, 9.0264892578125, 9.413330078125, 9.8001708984375, 10.18701171875, 10.5738525390625, 10.960693359375, 11.3475341796875, 11.734375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 7.0, 5.0, 7.0, 4.0, 9.0, 14.0, 9.0, 8.0, 23.0, 15.0, 20.0, 20.0, 39.0, 44.0, 40.0, 38.0, 45.0, 43.0, 48.0, 59.0, 52.0, 52.0, 61.0, 55.0, 39.0, 33.0, 34.0, 31.0, 32.0, 25.0, 19.0, 13.0, 11.0, 11.0, 10.0, 6.0, 8.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.93026351928711, -20.15152359008789, -19.372785568237305, -18.59404754638672, -17.8153076171875, -17.03656768798828, -16.257829666137695, -15.479090690612793, -14.70035171508789, -13.921612739562988, -13.142873764038086, -12.364134788513184, -11.585395812988281, -10.806656837463379, -10.027917861938477, -9.249178886413574, -8.470439910888672, -7.6917009353637695, -6.912961959838867, -6.134222984313965, -5.3554840087890625, -4.57674503326416, -3.798006057739258, -3.0192670822143555, -2.240528106689453, -1.4617891311645508, -0.6830501556396484, 0.0956888198852539, 0.8744277954101562, 1.6531667709350586, 2.431905746459961, 3.2106447219848633, 3.9893856048583984, 4.768124580383301, 5.546863555908203, 6.3256025314331055, 7.104341506958008, 7.88308048248291, 8.661819458007812, 9.440558433532715, 10.219297409057617, 10.99803638458252, 11.776775360107422, 12.555514335632324, 13.334253311157227, 14.112992286682129, 14.891731262207031, 15.670470237731934, 16.449209213256836, 17.227947235107422, 18.00668716430664, 18.78542709350586, 19.564165115356445, 20.34290313720703, 21.12164306640625, 21.90038299560547, 22.679121017456055, 23.45785903930664, 24.23659896850586, 25.015338897705078, 25.794076919555664, 26.57281494140625, 27.35155487060547, 28.130294799804688, 28.909032821655273]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 7.0, 2.0, 8.0, 4.0, 9.0, 7.0, 11.0, 17.0, 20.0, 16.0, 17.0, 13.0, 18.0, 26.0, 21.0, 34.0, 33.0, 34.0, 34.0, 36.0, 37.0, 54.0, 45.0, 34.0, 27.0, 35.0, 41.0, 24.0, 42.0, 35.0, 35.0, 25.0, 26.0, 37.0, 19.0, 21.0, 11.0, 15.0, 14.0, 5.0, 8.0, 6.0, 8.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-18.94991683959961, -18.35383415222168, -17.757753372192383, -17.161670684814453, -16.565587997436523, -15.96950626373291, -15.373424530029297, -14.777341842651367, -14.181260108947754, -13.58517837524414, -12.989095687866211, -12.393013954162598, -11.796932220458984, -11.200849533081055, -10.604767799377441, -10.008686065673828, -9.412603378295898, -8.816521644592285, -8.220438957214355, -7.624357223510742, -7.028275012969971, -6.432192802429199, -5.836111068725586, -5.2400288581848145, -4.643946647644043, -4.0478644371032715, -3.451782464981079, -2.8557004928588867, -2.2596182823181152, -1.6635360717773438, -1.0674540996551514, -0.471372127532959, 0.12471199035644531, 0.7207940816879272, 1.3168761730194092, 1.9129582643508911, 2.509040355682373, 3.1051225662231445, 3.701204538345337, 4.297286510467529, 4.893368721008301, 5.489450931549072, 6.085533142089844, 6.681614875793457, 7.2776970863342285, 7.873779296875, 8.469861030578613, 9.065942764282227, 9.662025451660156, 10.25810718536377, 10.8541898727417, 11.450271606445312, 12.046354293823242, 12.642436027526855, 13.238517761230469, 13.834600448608398, 14.430682182312012, 15.026763916015625, 15.622846603393555, 16.218929290771484, 16.81501007080078, 17.41109275817871, 18.00717544555664, 18.603256225585938, 19.199338912963867]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 11.0, 10.0, 17.0, 14.0, 23.0, 31.0, 65.0, 99.0, 124.0, 185.0, 303.0, 400.0, 687.0, 987.0, 1536.0, 2315.0, 3568.0, 5245.0, 8097.0, 12217.0, 18713.0, 27616.0, 39665.0, 56286.0, 75608.0, 96796.0, 113196.0, 119923.0, 113718.0, 96491.0, 75889.0, 56172.0, 39708.0, 27481.0, 18799.0, 12576.0, 8121.0, 5455.0, 3556.0, 2344.0, 1591.0, 987.0, 677.0, 422.0, 278.0, 174.0, 135.0, 100.0, 48.0, 46.0, 20.0, 16.0, 10.0, 4.0, 4.0, 1.0, 3.0], "bins": [-18.65625, -18.1156005859375, -17.574951171875, -17.0343017578125, -16.49365234375, -15.9530029296875, -15.412353515625, -14.8717041015625, -14.3310546875, -13.7904052734375, -13.249755859375, -12.7091064453125, -12.16845703125, -11.6278076171875, -11.087158203125, -10.5465087890625, -10.005859375, -9.4652099609375, -8.924560546875, -8.3839111328125, -7.84326171875, -7.3026123046875, -6.761962890625, -6.2213134765625, -5.6806640625, -5.1400146484375, -4.599365234375, -4.0587158203125, -3.51806640625, -2.9774169921875, -2.436767578125, -1.8961181640625, -1.35546875, -0.8148193359375, -0.274169921875, 0.2664794921875, 0.80712890625, 1.3477783203125, 1.888427734375, 2.4290771484375, 2.9697265625, 3.5103759765625, 4.051025390625, 4.5916748046875, 5.13232421875, 5.6729736328125, 6.213623046875, 6.7542724609375, 7.294921875, 7.8355712890625, 8.376220703125, 8.9168701171875, 9.45751953125, 9.9981689453125, 10.538818359375, 11.0794677734375, 11.6201171875, 12.1607666015625, 12.701416015625, 13.2420654296875, 13.78271484375, 14.3233642578125, 14.864013671875, 15.4046630859375, 15.9453125]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 10.0, 4.0, 7.0, 12.0, 11.0, 16.0, 13.0, 13.0, 16.0, 17.0, 21.0, 22.0, 24.0, 25.0, 25.0, 41.0, 30.0, 38.0, 45.0, 37.0, 44.0, 38.0, 29.0, 35.0, 36.0, 28.0, 31.0, 44.0, 40.0, 31.0, 32.0, 24.0, 28.0, 16.0, 17.0, 19.0, 15.0, 13.0, 12.0, 7.0, 6.0, 8.0, 2.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.0625, -16.50830078125, -15.9541015625, -15.39990234375, -14.845703125, -14.29150390625, -13.7373046875, -13.18310546875, -12.62890625, -12.07470703125, -11.5205078125, -10.96630859375, -10.412109375, -9.85791015625, -9.3037109375, -8.74951171875, -8.1953125, -7.64111328125, -7.0869140625, -6.53271484375, -5.978515625, -5.42431640625, -4.8701171875, -4.31591796875, -3.76171875, -3.20751953125, -2.6533203125, -2.09912109375, -1.544921875, -0.99072265625, -0.4365234375, 0.11767578125, 0.671875, 1.22607421875, 1.7802734375, 2.33447265625, 2.888671875, 3.44287109375, 3.9970703125, 4.55126953125, 5.10546875, 5.65966796875, 6.2138671875, 6.76806640625, 7.322265625, 7.87646484375, 8.4306640625, 8.98486328125, 9.5390625, 10.09326171875, 10.6474609375, 11.20166015625, 11.755859375, 12.31005859375, 12.8642578125, 13.41845703125, 13.97265625, 14.52685546875, 15.0810546875, 15.63525390625, 16.189453125, 16.74365234375, 17.2978515625, 17.85205078125, 18.40625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 11.0, 17.0, 35.0, 28.0, 58.0, 74.0, 145.0, 241.0, 350.0, 582.0, 963.0, 1604.0, 2644.0, 4558.0, 7877.0, 14256.0, 25127.0, 44033.0, 75277.0, 119143.0, 164357.0, 180092.0, 151866.0, 104894.0, 64333.0, 37105.0, 20903.0, 11626.0, 6774.0, 3809.0, 2389.0, 1340.0, 783.0, 442.0, 324.0, 191.0, 115.0, 73.0, 36.0, 33.0, 17.0, 12.0, 6.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.46875, -25.650390625, -24.83203125, -24.013671875, -23.1953125, -22.376953125, -21.55859375, -20.740234375, -19.921875, -19.103515625, -18.28515625, -17.466796875, -16.6484375, -15.830078125, -15.01171875, -14.193359375, -13.375, -12.556640625, -11.73828125, -10.919921875, -10.1015625, -9.283203125, -8.46484375, -7.646484375, -6.828125, -6.009765625, -5.19140625, -4.373046875, -3.5546875, -2.736328125, -1.91796875, -1.099609375, -0.28125, 0.537109375, 1.35546875, 2.173828125, 2.9921875, 3.810546875, 4.62890625, 5.447265625, 6.265625, 7.083984375, 7.90234375, 8.720703125, 9.5390625, 10.357421875, 11.17578125, 11.994140625, 12.8125, 13.630859375, 14.44921875, 15.267578125, 16.0859375, 16.904296875, 17.72265625, 18.541015625, 19.359375, 20.177734375, 20.99609375, 21.814453125, 22.6328125, 23.451171875, 24.26953125, 25.087890625, 25.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 3.0, 0.0, 4.0, 6.0, 7.0, 8.0, 6.0, 8.0, 10.0, 11.0, 24.0, 23.0, 28.0, 20.0, 23.0, 24.0, 40.0, 39.0, 35.0, 37.0, 43.0, 50.0, 39.0, 51.0, 42.0, 33.0, 43.0, 34.0, 37.0, 34.0, 35.0, 34.0, 27.0, 24.0, 22.0, 15.0, 10.0, 15.0, 9.0, 8.0, 7.0, 9.0, 11.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.28125, -11.8624267578125, -11.443603515625, -11.0247802734375, -10.60595703125, -10.1871337890625, -9.768310546875, -9.3494873046875, -8.9306640625, -8.5118408203125, -8.093017578125, -7.6741943359375, -7.25537109375, -6.8365478515625, -6.417724609375, -5.9989013671875, -5.580078125, -5.1612548828125, -4.742431640625, -4.3236083984375, -3.90478515625, -3.4859619140625, -3.067138671875, -2.6483154296875, -2.2294921875, -1.8106689453125, -1.391845703125, -0.9730224609375, -0.55419921875, -0.1353759765625, 0.283447265625, 0.7022705078125, 1.12109375, 1.5399169921875, 1.958740234375, 2.3775634765625, 2.79638671875, 3.2152099609375, 3.634033203125, 4.0528564453125, 4.4716796875, 4.8905029296875, 5.309326171875, 5.7281494140625, 6.14697265625, 6.5657958984375, 6.984619140625, 7.4034423828125, 7.822265625, 8.2410888671875, 8.659912109375, 9.0787353515625, 9.49755859375, 9.9163818359375, 10.335205078125, 10.7540283203125, 11.1728515625, 11.5916748046875, 12.010498046875, 12.4293212890625, 12.84814453125, 13.2669677734375, 13.685791015625, 14.1046142578125, 14.5234375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 9.0, 13.0, 20.0, 25.0, 38.0, 60.0, 93.0, 113.0, 155.0, 242.0, 349.0, 580.0, 830.0, 1265.0, 2088.0, 3493.0, 6147.0, 10677.0, 18756.0, 35132.0, 65036.0, 115011.0, 182545.0, 212501.0, 166419.0, 101228.0, 55814.0, 30455.0, 16500.0, 9117.0, 5374.0, 3127.0, 1917.0, 1181.0, 720.0, 502.0, 311.0, 215.0, 149.0, 108.0, 68.0, 50.0, 38.0, 26.0, 19.0, 13.0, 7.0, 4.0, 0.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-16.703125, -16.1533203125, -15.603515625, -15.0537109375, -14.50390625, -13.9541015625, -13.404296875, -12.8544921875, -12.3046875, -11.7548828125, -11.205078125, -10.6552734375, -10.10546875, -9.5556640625, -9.005859375, -8.4560546875, -7.90625, -7.3564453125, -6.806640625, -6.2568359375, -5.70703125, -5.1572265625, -4.607421875, -4.0576171875, -3.5078125, -2.9580078125, -2.408203125, -1.8583984375, -1.30859375, -0.7587890625, -0.208984375, 0.3408203125, 0.890625, 1.4404296875, 1.990234375, 2.5400390625, 3.08984375, 3.6396484375, 4.189453125, 4.7392578125, 5.2890625, 5.8388671875, 6.388671875, 6.9384765625, 7.48828125, 8.0380859375, 8.587890625, 9.1376953125, 9.6875, 10.2373046875, 10.787109375, 11.3369140625, 11.88671875, 12.4365234375, 12.986328125, 13.5361328125, 14.0859375, 14.6357421875, 15.185546875, 15.7353515625, 16.28515625, 16.8349609375, 17.384765625, 17.9345703125, 18.484375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 2.0, 12.0, 20.0, 28.0, 28.0, 33.0, 47.0, 57.0, 59.0, 72.0, 68.0, 83.0, 86.0, 67.0, 54.0, 62.0, 50.0, 31.0, 40.0, 21.0, 12.0, 9.0, 8.0, 13.0, 11.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00156402587890625, -0.0015097260475158691, -0.0014554262161254883, -0.0014011263847351074, -0.0013468265533447266, -0.0012925267219543457, -0.0012382268905639648, -0.001183927059173584, -0.0011296272277832031, -0.0010753273963928223, -0.0010210275650024414, -0.0009667277336120605, -0.0009124279022216797, -0.0008581280708312988, -0.000803828239440918, -0.0007495284080505371, -0.0006952285766601562, -0.0006409287452697754, -0.0005866289138793945, -0.0005323290824890137, -0.0004780292510986328, -0.00042372941970825195, -0.0003694295883178711, -0.00031512975692749023, -0.0002608299255371094, -0.00020653009414672852, -0.00015223026275634766, -9.79304313659668e-05, -4.363059997558594e-05, 1.0669231414794922e-05, 6.496906280517578e-05, 0.00011926889419555664, 0.0001735687255859375, 0.00022786855697631836, 0.0002821683883666992, 0.0003364682197570801, 0.00039076805114746094, 0.0004450678825378418, 0.0004993677139282227, 0.0005536675453186035, 0.0006079673767089844, 0.0006622672080993652, 0.0007165670394897461, 0.000770866870880127, 0.0008251667022705078, 0.0008794665336608887, 0.0009337663650512695, 0.0009880661964416504, 0.0010423660278320312, 0.0010966658592224121, 0.001150965690612793, 0.0012052655220031738, 0.0012595653533935547, 0.0013138651847839355, 0.0013681650161743164, 0.0014224648475646973, 0.0014767646789550781, 0.001531064510345459, 0.0015853643417358398, 0.0016396641731262207, 0.0016939640045166016, 0.0017482638359069824, 0.0018025636672973633, 0.0018568634986877441, 0.001911163330078125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 22.0, 21.0, 42.0, 56.0, 81.0, 118.0, 172.0, 239.0, 417.0, 544.0, 847.0, 1200.0, 1898.0, 2775.0, 4056.0, 6241.0, 9315.0, 14092.0, 21533.0, 32821.0, 49374.0, 72942.0, 102212.0, 130032.0, 141953.0, 130610.0, 102833.0, 74225.0, 50517.0, 33132.0, 21663.0, 14257.0, 9361.0, 6267.0, 4104.0, 2726.0, 1915.0, 1283.0, 855.0, 584.0, 405.0, 267.0, 179.0, 120.0, 75.0, 59.0, 40.0, 30.0, 20.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.32568359375, -9.9873046875, -9.64892578125, -9.310546875, -8.97216796875, -8.6337890625, -8.29541015625, -7.95703125, -7.61865234375, -7.2802734375, -6.94189453125, -6.603515625, -6.26513671875, -5.9267578125, -5.58837890625, -5.25, -4.91162109375, -4.5732421875, -4.23486328125, -3.896484375, -3.55810546875, -3.2197265625, -2.88134765625, -2.54296875, -2.20458984375, -1.8662109375, -1.52783203125, -1.189453125, -0.85107421875, -0.5126953125, -0.17431640625, 0.1640625, 0.50244140625, 0.8408203125, 1.17919921875, 1.517578125, 1.85595703125, 2.1943359375, 2.53271484375, 2.87109375, 3.20947265625, 3.5478515625, 3.88623046875, 4.224609375, 4.56298828125, 4.9013671875, 5.23974609375, 5.578125, 5.91650390625, 6.2548828125, 6.59326171875, 6.931640625, 7.27001953125, 7.6083984375, 7.94677734375, 8.28515625, 8.62353515625, 8.9619140625, 9.30029296875, 9.638671875, 9.97705078125, 10.3154296875, 10.65380859375, 10.9921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 8.0, 7.0, 16.0, 10.0, 12.0, 16.0, 25.0, 29.0, 30.0, 36.0, 26.0, 43.0, 44.0, 46.0, 50.0, 70.0, 61.0, 72.0, 55.0, 58.0, 58.0, 43.0, 28.0, 44.0, 23.0, 13.0, 14.0, 12.0, 16.0, 7.0, 4.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.03515625, -5.8533935546875, -5.671630859375, -5.4898681640625, -5.30810546875, -5.1263427734375, -4.944580078125, -4.7628173828125, -4.5810546875, -4.3992919921875, -4.217529296875, -4.0357666015625, -3.85400390625, -3.6722412109375, -3.490478515625, -3.3087158203125, -3.126953125, -2.9451904296875, -2.763427734375, -2.5816650390625, -2.39990234375, -2.2181396484375, -2.036376953125, -1.8546142578125, -1.6728515625, -1.4910888671875, -1.309326171875, -1.1275634765625, -0.94580078125, -0.7640380859375, -0.582275390625, -0.4005126953125, -0.21875, -0.0369873046875, 0.144775390625, 0.3265380859375, 0.50830078125, 0.6900634765625, 0.871826171875, 1.0535888671875, 1.2353515625, 1.4171142578125, 1.598876953125, 1.7806396484375, 1.96240234375, 2.1441650390625, 2.325927734375, 2.5076904296875, 2.689453125, 2.8712158203125, 3.052978515625, 3.2347412109375, 3.41650390625, 3.5982666015625, 3.780029296875, 3.9617919921875, 4.1435546875, 4.3253173828125, 4.507080078125, 4.6888427734375, 4.87060546875, 5.0523681640625, 5.234130859375, 5.4158935546875, 5.59765625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 4.0, 3.0, 8.0, 15.0, 11.0, 20.0, 21.0, 23.0, 18.0, 27.0, 35.0, 33.0, 39.0, 59.0, 52.0, 49.0, 52.0, 71.0, 64.0, 51.0, 52.0, 41.0, 40.0, 28.0, 28.0, 20.0, 28.0, 16.0, 20.0, 17.0, 15.0, 8.0, 5.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.777170181274414, -20.99321937561035, -20.209270477294922, -19.42531967163086, -18.641368865966797, -17.857418060302734, -17.073467254638672, -16.289518356323242, -15.50556755065918, -14.721616744995117, -13.937666893005371, -13.153717041015625, -12.369766235351562, -11.5858154296875, -10.801865577697754, -10.017915725708008, -9.233964920043945, -8.450014114379883, -7.666064262390137, -6.882113933563232, -6.098163604736328, -5.314213275909424, -4.5302629470825195, -3.7463126182556152, -2.962362289428711, -2.1784119606018066, -1.3944616317749023, -0.610511302947998, 0.17343902587890625, 0.9573893547058105, 1.7413396835327148, 2.525290012359619, 3.3092403411865234, 4.093190670013428, 4.877140998840332, 5.661091327667236, 6.445041656494141, 7.228991985321045, 8.01294231414795, 8.796892166137695, 9.580842971801758, 10.36479377746582, 11.148743629455566, 11.932693481445312, 12.716644287109375, 13.500595092773438, 14.284544944763184, 15.06849479675293, 15.852445602416992, 16.636396408081055, 17.420345306396484, 18.204296112060547, 18.98824691772461, 19.772197723388672, 20.556148529052734, 21.340097427368164, 22.124048233032227, 22.90799903869629, 23.69194793701172, 24.47589874267578, 25.259849548339844, 26.043800354003906, 26.82775115966797, 27.6117000579834, 28.39565086364746]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 4.0, 7.0, 5.0, 5.0, 6.0, 16.0, 9.0, 12.0, 14.0, 14.0, 20.0, 23.0, 20.0, 23.0, 23.0, 38.0, 37.0, 22.0, 37.0, 31.0, 43.0, 36.0, 39.0, 42.0, 39.0, 40.0, 40.0, 32.0, 31.0, 31.0, 33.0, 30.0, 23.0, 20.0, 26.0, 20.0, 14.0, 20.0, 15.0, 11.0, 9.0, 7.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-18.282730102539062, -17.698646545410156, -17.11456298828125, -16.530481338500977, -15.94639778137207, -15.362314224243164, -14.778231620788574, -14.194149017333984, -13.610065460205078, -13.025981903076172, -12.441899299621582, -11.857816696166992, -11.273733139038086, -10.68964958190918, -10.10556697845459, -9.521484375, -8.937400817871094, -8.353317260742188, -7.769234657287598, -7.18515157699585, -6.601068496704102, -6.0169854164123535, -5.4329023361206055, -4.848819255828857, -4.264736175537109, -3.6806530952453613, -3.0965700149536133, -2.5124869346618652, -1.9284038543701172, -1.3443207740783691, -0.7602376937866211, -0.17615461349487305, 0.4079265594482422, 0.9920096397399902, 1.5760927200317383, 2.1601758003234863, 2.7442588806152344, 3.3283419609069824, 3.9124250411987305, 4.4965081214904785, 5.080591201782227, 5.664674282073975, 6.248757362365723, 6.832840442657471, 7.416923522949219, 8.001007080078125, 8.585089683532715, 9.169172286987305, 9.753255844116211, 10.337339401245117, 10.921422004699707, 11.505504608154297, 12.089588165283203, 12.67367172241211, 13.2577543258667, 13.841836929321289, 14.425920486450195, 15.010004043579102, 15.594086647033691, 16.17816925048828, 16.762252807617188, 17.346336364746094, 17.930419921875, 18.514501571655273, 19.09858512878418]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 8.0, 9.0, 13.0, 22.0, 33.0, 39.0, 58.0, 104.0, 141.0, 251.0, 349.0, 522.0, 842.0, 1383.0, 2239.0, 3751.0, 6390.0, 10906.0, 19303.0, 34865.0, 65121.0, 126112.0, 251957.0, 498013.0, 840633.0, 944350.0, 661286.0, 352082.0, 175014.0, 89538.0, 47293.0, 25764.0, 14798.0, 8389.0, 4886.0, 2889.0, 1837.0, 1134.0, 678.0, 458.0, 240.0, 197.0, 134.0, 85.0, 55.0, 36.0, 24.0, 23.0, 7.0, 8.0, 9.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-21.46875, -20.781494140625, -20.09423828125, -19.406982421875, -18.7197265625, -18.032470703125, -17.34521484375, -16.657958984375, -15.970703125, -15.283447265625, -14.59619140625, -13.908935546875, -13.2216796875, -12.534423828125, -11.84716796875, -11.159912109375, -10.47265625, -9.785400390625, -9.09814453125, -8.410888671875, -7.7236328125, -7.036376953125, -6.34912109375, -5.661865234375, -4.974609375, -4.287353515625, -3.60009765625, -2.912841796875, -2.2255859375, -1.538330078125, -0.85107421875, -0.163818359375, 0.5234375, 1.210693359375, 1.89794921875, 2.585205078125, 3.2724609375, 3.959716796875, 4.64697265625, 5.334228515625, 6.021484375, 6.708740234375, 7.39599609375, 8.083251953125, 8.7705078125, 9.457763671875, 10.14501953125, 10.832275390625, 11.51953125, 12.206787109375, 12.89404296875, 13.581298828125, 14.2685546875, 14.955810546875, 15.64306640625, 16.330322265625, 17.017578125, 17.704833984375, 18.39208984375, 19.079345703125, 19.7666015625, 20.453857421875, 21.14111328125, 21.828369140625, 22.515625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 5.0, 13.0, 8.0, 7.0, 9.0, 21.0, 13.0, 22.0, 18.0, 23.0, 27.0, 20.0, 31.0, 26.0, 34.0, 40.0, 33.0, 41.0, 39.0, 44.0, 45.0, 54.0, 42.0, 37.0, 36.0, 24.0, 33.0, 39.0, 29.0, 21.0, 35.0, 12.0, 17.0, 16.0, 19.0, 11.0, 9.0, 9.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.125, -13.6710205078125, -13.217041015625, -12.7630615234375, -12.30908203125, -11.8551025390625, -11.401123046875, -10.9471435546875, -10.4931640625, -10.0391845703125, -9.585205078125, -9.1312255859375, -8.67724609375, -8.2232666015625, -7.769287109375, -7.3153076171875, -6.861328125, -6.4073486328125, -5.953369140625, -5.4993896484375, -5.04541015625, -4.5914306640625, -4.137451171875, -3.6834716796875, -3.2294921875, -2.7755126953125, -2.321533203125, -1.8675537109375, -1.41357421875, -0.9595947265625, -0.505615234375, -0.0516357421875, 0.40234375, 0.8563232421875, 1.310302734375, 1.7642822265625, 2.21826171875, 2.6722412109375, 3.126220703125, 3.5802001953125, 4.0341796875, 4.4881591796875, 4.942138671875, 5.3961181640625, 5.85009765625, 6.3040771484375, 6.758056640625, 7.2120361328125, 7.666015625, 8.1199951171875, 8.573974609375, 9.0279541015625, 9.48193359375, 9.9359130859375, 10.389892578125, 10.8438720703125, 11.2978515625, 11.7518310546875, 12.205810546875, 12.6597900390625, 13.11376953125, 13.5677490234375, 14.021728515625, 14.4757080078125, 14.9296875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 12.0, 11.0, 23.0, 25.0, 44.0, 74.0, 131.0, 197.0, 270.0, 476.0, 726.0, 1137.0, 1881.0, 3106.0, 5307.0, 8765.0, 14902.0, 25829.0, 45126.0, 77991.0, 136778.0, 232662.0, 385400.0, 585130.0, 738348.0, 686736.0, 493560.0, 310828.0, 184725.0, 106539.0, 61912.0, 35458.0, 20369.0, 11808.0, 6877.0, 4359.0, 2604.0, 1551.0, 938.0, 598.0, 375.0, 262.0, 164.0, 108.0, 63.0, 32.0, 27.0, 18.0, 7.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.0625, -17.494140625, -16.92578125, -16.357421875, -15.7890625, -15.220703125, -14.65234375, -14.083984375, -13.515625, -12.947265625, -12.37890625, -11.810546875, -11.2421875, -10.673828125, -10.10546875, -9.537109375, -8.96875, -8.400390625, -7.83203125, -7.263671875, -6.6953125, -6.126953125, -5.55859375, -4.990234375, -4.421875, -3.853515625, -3.28515625, -2.716796875, -2.1484375, -1.580078125, -1.01171875, -0.443359375, 0.125, 0.693359375, 1.26171875, 1.830078125, 2.3984375, 2.966796875, 3.53515625, 4.103515625, 4.671875, 5.240234375, 5.80859375, 6.376953125, 6.9453125, 7.513671875, 8.08203125, 8.650390625, 9.21875, 9.787109375, 10.35546875, 10.923828125, 11.4921875, 12.060546875, 12.62890625, 13.197265625, 13.765625, 14.333984375, 14.90234375, 15.470703125, 16.0390625, 16.607421875, 17.17578125, 17.744140625, 18.3125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 4.0, 12.0, 7.0, 11.0, 18.0, 27.0, 31.0, 36.0, 45.0, 53.0, 80.0, 112.0, 133.0, 142.0, 154.0, 196.0, 191.0, 227.0, 263.0, 268.0, 263.0, 258.0, 244.0, 207.0, 175.0, 152.0, 155.0, 102.0, 103.0, 99.0, 76.0, 56.0, 36.0, 33.0, 28.0, 20.0, 19.0, 11.0, 7.0, 4.0, 4.0, 5.0, 4.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.15234375, -6.91156005859375, -6.6707763671875, -6.42999267578125, -6.189208984375, -5.94842529296875, -5.7076416015625, -5.46685791015625, -5.22607421875, -4.98529052734375, -4.7445068359375, -4.50372314453125, -4.262939453125, -4.02215576171875, -3.7813720703125, -3.54058837890625, -3.2998046875, -3.05902099609375, -2.8182373046875, -2.57745361328125, -2.336669921875, -2.09588623046875, -1.8551025390625, -1.61431884765625, -1.37353515625, -1.13275146484375, -0.8919677734375, -0.65118408203125, -0.410400390625, -0.16961669921875, 0.0711669921875, 0.31195068359375, 0.552734375, 0.79351806640625, 1.0343017578125, 1.27508544921875, 1.515869140625, 1.75665283203125, 1.9974365234375, 2.23822021484375, 2.47900390625, 2.71978759765625, 2.9605712890625, 3.20135498046875, 3.442138671875, 3.68292236328125, 3.9237060546875, 4.16448974609375, 4.4052734375, 4.64605712890625, 4.8868408203125, 5.12762451171875, 5.368408203125, 5.60919189453125, 5.8499755859375, 6.09075927734375, 6.33154296875, 6.57232666015625, 6.8131103515625, 7.05389404296875, 7.294677734375, 7.53546142578125, 7.7762451171875, 8.01702880859375, 8.2578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 11.0, 10.0, 9.0, 11.0, 17.0, 18.0, 17.0, 25.0, 33.0, 31.0, 33.0, 43.0, 58.0, 66.0, 57.0, 72.0, 54.0, 57.0, 61.0, 64.0, 43.0, 35.0, 35.0, 40.0, 21.0, 17.0, 17.0, 10.0, 5.0, 5.0, 7.0, 6.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.756803512573242, -16.042152404785156, -15.327502250671387, -14.6128511428833, -13.898200988769531, -13.183549880981445, -12.46889877319336, -11.754247665405273, -11.039597511291504, -10.324946403503418, -9.610296249389648, -8.895645141601562, -8.180994033813477, -7.466343879699707, -6.751692771911621, -6.037042140960693, -5.322391510009766, -4.607740879058838, -3.893090009689331, -3.178439140319824, -2.4637885093688965, -1.7491378784179688, -1.0344867706298828, -0.3198361396789551, 0.39481449127197266, 1.10946524143219, 1.8241159915924072, 2.538766860961914, 3.253417491912842, 3.9680681228637695, 4.6827192306518555, 5.397369861602783, 6.112022399902344, 6.8266730308532715, 7.541323661804199, 8.255974769592285, 8.970624923706055, 9.68527603149414, 10.399927139282227, 11.114578247070312, 11.829228401184082, 12.543879508972168, 13.258529663085938, 13.973180770874023, 14.68783187866211, 15.402482032775879, 16.11713409423828, 16.831783294677734, 17.54643440246582, 18.261085510253906, 18.975736618041992, 19.690387725830078, 20.40503692626953, 21.119688034057617, 21.834339141845703, 22.54899024963379, 23.263641357421875, 23.97829246520996, 24.692943572998047, 25.4075927734375, 26.122243881225586, 26.836894989013672, 27.551546096801758, 28.266197204589844, 28.980846405029297]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 7.0, 12.0, 6.0, 10.0, 7.0, 8.0, 15.0, 9.0, 20.0, 20.0, 18.0, 20.0, 24.0, 30.0, 26.0, 37.0, 21.0, 31.0, 40.0, 35.0, 43.0, 33.0, 46.0, 31.0, 39.0, 52.0, 43.0, 30.0, 27.0, 26.0, 27.0, 35.0, 22.0, 15.0, 24.0, 15.0, 10.0, 21.0, 12.0, 14.0, 10.0, 8.0, 8.0, 2.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.44165802001953, -15.951186180114746, -15.460715293884277, -14.970243453979492, -14.479771614074707, -13.989299774169922, -13.498828887939453, -13.008357048034668, -12.517885208129883, -12.027413368225098, -11.536942481994629, -11.046470642089844, -10.555998802185059, -10.065526962280273, -9.575056076049805, -9.08458423614502, -8.59411334991455, -8.103641510009766, -7.613170146942139, -7.122698783874512, -6.632226943969727, -6.1417555809021, -5.651284217834473, -5.1608123779296875, -4.6703410148620605, -4.179869651794434, -3.6893978118896484, -3.1989264488220215, -2.7084548473358154, -2.2179832458496094, -1.7275118827819824, -1.2370402812957764, -0.7465677261352539, -0.2560961842536926, 0.23437535762786865, 0.7248468399047852, 1.2153184413909912, 1.7057900428771973, 2.196261405944824, 2.6867330074310303, 3.1772046089172363, 3.6676762104034424, 4.158147811889648, 4.648619174957275, 5.139090538024902, 5.6295623779296875, 6.1200337409973145, 6.610505104064941, 7.100976943969727, 7.5914483070373535, 8.08191967010498, 8.572391510009766, 9.06286334991455, 9.553335189819336, 10.043806076049805, 10.53427791595459, 11.024749755859375, 11.51522159576416, 12.005692481994629, 12.496164321899414, 12.9866361618042, 13.477108001708984, 13.967578887939453, 14.458050727844238, 14.948521614074707]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 17.0, 23.0, 29.0, 45.0, 58.0, 102.0, 153.0, 230.0, 324.0, 502.0, 737.0, 1156.0, 1718.0, 2676.0, 4212.0, 6861.0, 10942.0, 17867.0, 29504.0, 49723.0, 83332.0, 135872.0, 192615.0, 186923.0, 127350.0, 77428.0, 45942.0, 27489.0, 16899.0, 10314.0, 6211.0, 3981.0, 2553.0, 1669.0, 1043.0, 666.0, 462.0, 299.0, 202.0, 128.0, 84.0, 69.0, 38.0, 30.0, 22.0, 18.0, 7.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0], "bins": [-53.875, -52.287109375, -50.69921875, -49.111328125, -47.5234375, -45.935546875, -44.34765625, -42.759765625, -41.171875, -39.583984375, -37.99609375, -36.408203125, -34.8203125, -33.232421875, -31.64453125, -30.056640625, -28.46875, -26.880859375, -25.29296875, -23.705078125, -22.1171875, -20.529296875, -18.94140625, -17.353515625, -15.765625, -14.177734375, -12.58984375, -11.001953125, -9.4140625, -7.826171875, -6.23828125, -4.650390625, -3.0625, -1.474609375, 0.11328125, 1.701171875, 3.2890625, 4.876953125, 6.46484375, 8.052734375, 9.640625, 11.228515625, 12.81640625, 14.404296875, 15.9921875, 17.580078125, 19.16796875, 20.755859375, 22.34375, 23.931640625, 25.51953125, 27.107421875, 28.6953125, 30.283203125, 31.87109375, 33.458984375, 35.046875, 36.634765625, 38.22265625, 39.810546875, 41.3984375, 42.986328125, 44.57421875, 46.162109375, 47.75]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 6.0, 11.0, 14.0, 10.0, 12.0, 15.0, 10.0, 11.0, 18.0, 25.0, 25.0, 35.0, 29.0, 40.0, 30.0, 29.0, 46.0, 41.0, 44.0, 46.0, 28.0, 32.0, 47.0, 28.0, 39.0, 52.0, 32.0, 29.0, 32.0, 24.0, 22.0, 17.0, 20.0, 15.0, 11.0, 13.0, 15.0, 10.0, 6.0, 4.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.984375, -12.567138671875, -12.14990234375, -11.732666015625, -11.3154296875, -10.898193359375, -10.48095703125, -10.063720703125, -9.646484375, -9.229248046875, -8.81201171875, -8.394775390625, -7.9775390625, -7.560302734375, -7.14306640625, -6.725830078125, -6.30859375, -5.891357421875, -5.47412109375, -5.056884765625, -4.6396484375, -4.222412109375, -3.80517578125, -3.387939453125, -2.970703125, -2.553466796875, -2.13623046875, -1.718994140625, -1.3017578125, -0.884521484375, -0.46728515625, -0.050048828125, 0.3671875, 0.784423828125, 1.20166015625, 1.618896484375, 2.0361328125, 2.453369140625, 2.87060546875, 3.287841796875, 3.705078125, 4.122314453125, 4.53955078125, 4.956787109375, 5.3740234375, 5.791259765625, 6.20849609375, 6.625732421875, 7.04296875, 7.460205078125, 7.87744140625, 8.294677734375, 8.7119140625, 9.129150390625, 9.54638671875, 9.963623046875, 10.380859375, 10.798095703125, 11.21533203125, 11.632568359375, 12.0498046875, 12.467041015625, 12.88427734375, 13.301513671875, 13.71875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 7.0, 18.0, 23.0, 30.0, 47.0, 65.0, 98.0, 141.0, 205.0, 341.0, 530.0, 819.0, 1257.0, 1917.0, 3119.0, 5194.0, 8650.0, 15001.0, 26320.0, 48678.0, 91981.0, 177534.0, 261423.0, 188151.0, 98045.0, 51674.0, 28061.0, 15794.0, 9039.0, 5421.0, 3307.0, 2016.0, 1304.0, 784.0, 524.0, 342.0, 223.0, 156.0, 86.0, 78.0, 47.0, 33.0, 27.0, 16.0, 10.0, 5.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-50.1875, -48.54443359375, -46.9013671875, -45.25830078125, -43.615234375, -41.97216796875, -40.3291015625, -38.68603515625, -37.04296875, -35.39990234375, -33.7568359375, -32.11376953125, -30.470703125, -28.82763671875, -27.1845703125, -25.54150390625, -23.8984375, -22.25537109375, -20.6123046875, -18.96923828125, -17.326171875, -15.68310546875, -14.0400390625, -12.39697265625, -10.75390625, -9.11083984375, -7.4677734375, -5.82470703125, -4.181640625, -2.53857421875, -0.8955078125, 0.74755859375, 2.390625, 4.03369140625, 5.6767578125, 7.31982421875, 8.962890625, 10.60595703125, 12.2490234375, 13.89208984375, 15.53515625, 17.17822265625, 18.8212890625, 20.46435546875, 22.107421875, 23.75048828125, 25.3935546875, 27.03662109375, 28.6796875, 30.32275390625, 31.9658203125, 33.60888671875, 35.251953125, 36.89501953125, 38.5380859375, 40.18115234375, 41.82421875, 43.46728515625, 45.1103515625, 46.75341796875, 48.396484375, 50.03955078125, 51.6826171875, 53.32568359375, 54.96875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 11.0, 6.0, 3.0, 7.0, 11.0, 13.0, 18.0, 19.0, 18.0, 27.0, 27.0, 34.0, 45.0, 40.0, 46.0, 43.0, 43.0, 48.0, 43.0, 62.0, 39.0, 43.0, 55.0, 37.0, 27.0, 36.0, 33.0, 37.0, 30.0, 18.0, 17.0, 20.0, 13.0, 15.0, 6.0, 7.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -10.0281982421875, -9.665771484375, -9.3033447265625, -8.94091796875, -8.5784912109375, -8.216064453125, -7.8536376953125, -7.4912109375, -7.1287841796875, -6.766357421875, -6.4039306640625, -6.04150390625, -5.6790771484375, -5.316650390625, -4.9542236328125, -4.591796875, -4.2293701171875, -3.866943359375, -3.5045166015625, -3.14208984375, -2.7796630859375, -2.417236328125, -2.0548095703125, -1.6923828125, -1.3299560546875, -0.967529296875, -0.6051025390625, -0.24267578125, 0.1197509765625, 0.482177734375, 0.8446044921875, 1.20703125, 1.5694580078125, 1.931884765625, 2.2943115234375, 2.65673828125, 3.0191650390625, 3.381591796875, 3.7440185546875, 4.1064453125, 4.4688720703125, 4.831298828125, 5.1937255859375, 5.55615234375, 5.9185791015625, 6.281005859375, 6.6434326171875, 7.005859375, 7.3682861328125, 7.730712890625, 8.0931396484375, 8.45556640625, 8.8179931640625, 9.180419921875, 9.5428466796875, 9.9052734375, 10.2677001953125, 10.630126953125, 10.9925537109375, 11.35498046875, 11.7174072265625, 12.079833984375, 12.4422607421875, 12.8046875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 15.0, 12.0, 41.0, 60.0, 77.0, 110.0, 148.0, 231.0, 346.0, 531.0, 757.0, 1231.0, 1917.0, 3209.0, 5513.0, 9689.0, 19914.0, 52765.0, 225760.0, 530416.0, 125548.0, 35235.0, 15135.0, 7856.0, 4540.0, 2717.0, 1664.0, 1077.0, 723.0, 431.0, 293.0, 195.0, 94.0, 91.0, 60.0, 62.0, 25.0, 17.0, 10.0, 13.0, 8.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.375, -66.3828125, -64.390625, -62.3984375, -60.40625, -58.4140625, -56.421875, -54.4296875, -52.4375, -50.4453125, -48.453125, -46.4609375, -44.46875, -42.4765625, -40.484375, -38.4921875, -36.5, -34.5078125, -32.515625, -30.5234375, -28.53125, -26.5390625, -24.546875, -22.5546875, -20.5625, -18.5703125, -16.578125, -14.5859375, -12.59375, -10.6015625, -8.609375, -6.6171875, -4.625, -2.6328125, -0.640625, 1.3515625, 3.34375, 5.3359375, 7.328125, 9.3203125, 11.3125, 13.3046875, 15.296875, 17.2890625, 19.28125, 21.2734375, 23.265625, 25.2578125, 27.25, 29.2421875, 31.234375, 33.2265625, 35.21875, 37.2109375, 39.203125, 41.1953125, 43.1875, 45.1796875, 47.171875, 49.1640625, 51.15625, 53.1484375, 55.140625, 57.1328125, 59.125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 1.0, 2.0, 5.0, 9.0, 7.0, 11.0, 8.0, 16.0, 25.0, 22.0, 45.0, 56.0, 126.0, 201.0, 204.0, 95.0, 53.0, 25.0, 18.0, 15.0, 11.0, 7.0, 9.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.005359649658203125, -0.005191922187805176, -0.0050241947174072266, -0.004856467247009277, -0.004688739776611328, -0.004521012306213379, -0.00435328483581543, -0.0041855573654174805, -0.004017829895019531, -0.003850102424621582, -0.003682374954223633, -0.0035146474838256836, -0.0033469200134277344, -0.003179192543029785, -0.003011465072631836, -0.0028437376022338867, -0.0026760101318359375, -0.0025082826614379883, -0.002340555191040039, -0.00217282772064209, -0.0020051002502441406, -0.0018373727798461914, -0.0016696453094482422, -0.001501917839050293, -0.0013341903686523438, -0.0011664628982543945, -0.0009987354278564453, -0.0008310079574584961, -0.0006632804870605469, -0.0004955530166625977, -0.00032782554626464844, -0.00016009807586669922, 7.62939453125e-06, 0.00017535686492919922, 0.00034308433532714844, 0.0005108118057250977, 0.0006785392761230469, 0.0008462667465209961, 0.0010139942169189453, 0.0011817216873168945, 0.0013494491577148438, 0.001517176628112793, 0.0016849040985107422, 0.0018526315689086914, 0.0020203590393066406, 0.00218808650970459, 0.002355813980102539, 0.0025235414505004883, 0.0026912689208984375, 0.0028589963912963867, 0.003026723861694336, 0.003194451332092285, 0.0033621788024902344, 0.0035299062728881836, 0.003697633743286133, 0.003865361213684082, 0.004033088684082031, 0.0042008161544799805, 0.00436854362487793, 0.004536271095275879, 0.004703998565673828, 0.004871726036071777, 0.0050394535064697266, 0.005207180976867676, 0.005374908447265625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 4.0, 5.0, 6.0, 14.0, 9.0, 16.0, 23.0, 27.0, 58.0, 65.0, 126.0, 201.0, 256.0, 435.0, 692.0, 1118.0, 1775.0, 2922.0, 5036.0, 8551.0, 15089.0, 27969.0, 54827.0, 113401.0, 213150.0, 256957.0, 170330.0, 83515.0, 40932.0, 21552.0, 11986.0, 6979.0, 4055.0, 2421.0, 1511.0, 932.0, 555.0, 328.0, 254.0, 156.0, 111.0, 63.0, 50.0, 29.0, 27.0, 18.0, 9.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.46875, -19.745361328125, -19.02197265625, -18.298583984375, -17.5751953125, -16.851806640625, -16.12841796875, -15.405029296875, -14.681640625, -13.958251953125, -13.23486328125, -12.511474609375, -11.7880859375, -11.064697265625, -10.34130859375, -9.617919921875, -8.89453125, -8.171142578125, -7.44775390625, -6.724365234375, -6.0009765625, -5.277587890625, -4.55419921875, -3.830810546875, -3.107421875, -2.384033203125, -1.66064453125, -0.937255859375, -0.2138671875, 0.509521484375, 1.23291015625, 1.956298828125, 2.6796875, 3.403076171875, 4.12646484375, 4.849853515625, 5.5732421875, 6.296630859375, 7.02001953125, 7.743408203125, 8.466796875, 9.190185546875, 9.91357421875, 10.636962890625, 11.3603515625, 12.083740234375, 12.80712890625, 13.530517578125, 14.25390625, 14.977294921875, 15.70068359375, 16.424072265625, 17.1474609375, 17.870849609375, 18.59423828125, 19.317626953125, 20.041015625, 20.764404296875, 21.48779296875, 22.211181640625, 22.9345703125, 23.657958984375, 24.38134765625, 25.104736328125, 25.828125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 11.0, 3.0, 13.0, 7.0, 4.0, 13.0, 14.0, 16.0, 20.0, 33.0, 38.0, 45.0, 33.0, 62.0, 64.0, 66.0, 62.0, 70.0, 75.0, 51.0, 51.0, 52.0, 26.0, 28.0, 20.0, 23.0, 21.0, 9.0, 13.0, 16.0, 8.0, 5.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.296875, -7.0692138671875, -6.841552734375, -6.6138916015625, -6.38623046875, -6.1585693359375, -5.930908203125, -5.7032470703125, -5.4755859375, -5.2479248046875, -5.020263671875, -4.7926025390625, -4.56494140625, -4.3372802734375, -4.109619140625, -3.8819580078125, -3.654296875, -3.4266357421875, -3.198974609375, -2.9713134765625, -2.74365234375, -2.5159912109375, -2.288330078125, -2.0606689453125, -1.8330078125, -1.6053466796875, -1.377685546875, -1.1500244140625, -0.92236328125, -0.6947021484375, -0.467041015625, -0.2393798828125, -0.01171875, 0.2159423828125, 0.443603515625, 0.6712646484375, 0.89892578125, 1.1265869140625, 1.354248046875, 1.5819091796875, 1.8095703125, 2.0372314453125, 2.264892578125, 2.4925537109375, 2.72021484375, 2.9478759765625, 3.175537109375, 3.4031982421875, 3.630859375, 3.8585205078125, 4.086181640625, 4.3138427734375, 4.54150390625, 4.7691650390625, 4.996826171875, 5.2244873046875, 5.4521484375, 5.6798095703125, 5.907470703125, 6.1351318359375, 6.36279296875, 6.5904541015625, 6.818115234375, 7.0457763671875, 7.2734375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 7.0, 6.0, 13.0, 15.0, 16.0, 26.0, 32.0, 33.0, 24.0, 34.0, 40.0, 41.0, 62.0, 50.0, 68.0, 67.0, 63.0, 63.0, 40.0, 53.0, 43.0, 44.0, 26.0, 21.0, 21.0, 14.0, 12.0, 12.0, 16.0, 17.0, 4.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.731992721557617, -17.144939422607422, -16.557886123657227, -15.970832824707031, -15.383779525756836, -14.79672622680664, -14.209672927856445, -13.62261962890625, -13.035566329956055, -12.44851303100586, -11.861459732055664, -11.274406433105469, -10.687353134155273, -10.100299835205078, -9.513246536254883, -8.926193237304688, -8.339139938354492, -7.752086639404297, -7.165033340454102, -6.577980041503906, -5.990926742553711, -5.403873443603516, -4.81682014465332, -4.229766845703125, -3.6427135467529297, -3.0556602478027344, -2.468606948852539, -1.8815536499023438, -1.2945003509521484, -0.7074470520019531, -0.12039375305175781, 0.4666595458984375, 1.0537109375, 1.6407642364501953, 2.2278175354003906, 2.814870834350586, 3.4019241333007812, 3.9889774322509766, 4.576030731201172, 5.163084030151367, 5.7501373291015625, 6.337190628051758, 6.924243927001953, 7.511297225952148, 8.098350524902344, 8.685403823852539, 9.272457122802734, 9.85951042175293, 10.446563720703125, 11.03361701965332, 11.620670318603516, 12.207723617553711, 12.794776916503906, 13.381830215454102, 13.968883514404297, 14.555936813354492, 15.142990112304688, 15.730043411254883, 16.317096710205078, 16.904150009155273, 17.49120330810547, 18.078256607055664, 18.66530990600586, 19.252363204956055, 19.83941650390625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 10.0, 9.0, 3.0, 11.0, 8.0, 12.0, 15.0, 20.0, 21.0, 21.0, 24.0, 43.0, 25.0, 26.0, 27.0, 39.0, 35.0, 35.0, 43.0, 32.0, 36.0, 42.0, 40.0, 35.0, 37.0, 29.0, 46.0, 30.0, 29.0, 28.0, 31.0, 21.0, 12.0, 18.0, 18.0, 8.0, 13.0, 14.0, 13.0, 6.0, 6.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.537544250488281, -13.119582176208496, -12.701620101928711, -12.283658027648926, -11.86569595336914, -11.447732925415039, -11.029770851135254, -10.611808776855469, -10.193846702575684, -9.775884628295898, -9.357922554016113, -8.939960479736328, -8.521997451782227, -8.104036331176758, -7.686073303222656, -7.268111228942871, -6.850149154663086, -6.432187080383301, -6.014225006103516, -5.596262454986572, -5.178300380706787, -4.760338306427002, -4.342375755310059, -3.9244136810302734, -3.5064516067504883, -3.088489532470703, -2.670527219772339, -2.2525649070739746, -1.8346028327941895, -1.4166407585144043, -0.99867844581604, -0.5807161331176758, -0.16275405883789062, 0.2552081346511841, 0.6731703281402588, 1.0911325216293335, 1.5090947151184082, 1.9270567893981934, 2.3450191020965576, 2.762981414794922, 3.180943489074707, 3.598905563354492, 4.016867637634277, 4.434830188751221, 4.852792263031006, 5.270754337310791, 5.688716888427734, 6.1066789627075195, 6.524641036987305, 6.94260311126709, 7.360565185546875, 7.778527736663818, 8.196489334106445, 8.614452362060547, 9.032414436340332, 9.450376510620117, 9.868338584899902, 10.286300659179688, 10.704262733459473, 11.122224807739258, 11.54018783569336, 11.958148956298828, 12.37611198425293, 12.794074058532715, 13.2120361328125]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 9.0, 15.0, 17.0, 35.0, 43.0, 43.0, 68.0, 117.0, 188.0, 263.0, 420.0, 584.0, 966.0, 1453.0, 2194.0, 3312.0, 5101.0, 7665.0, 11510.0, 17013.0, 25047.0, 36329.0, 51203.0, 69625.0, 89380.0, 106633.0, 116517.0, 114517.0, 101045.0, 81939.0, 62711.0, 45189.0, 31718.0, 21828.0, 14578.0, 10102.0, 6569.0, 4261.0, 2892.0, 1855.0, 1244.0, 809.0, 539.0, 328.0, 239.0, 147.0, 99.0, 64.0, 53.0, 21.0, 20.0, 18.0, 15.0, 7.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.84375, -10.5133056640625, -10.182861328125, -9.8524169921875, -9.52197265625, -9.1915283203125, -8.861083984375, -8.5306396484375, -8.2001953125, -7.8697509765625, -7.539306640625, -7.2088623046875, -6.87841796875, -6.5479736328125, -6.217529296875, -5.8870849609375, -5.556640625, -5.2261962890625, -4.895751953125, -4.5653076171875, -4.23486328125, -3.9044189453125, -3.573974609375, -3.2435302734375, -2.9130859375, -2.5826416015625, -2.252197265625, -1.9217529296875, -1.59130859375, -1.2608642578125, -0.930419921875, -0.5999755859375, -0.26953125, 0.0609130859375, 0.391357421875, 0.7218017578125, 1.05224609375, 1.3826904296875, 1.713134765625, 2.0435791015625, 2.3740234375, 2.7044677734375, 3.034912109375, 3.3653564453125, 3.69580078125, 4.0262451171875, 4.356689453125, 4.6871337890625, 5.017578125, 5.3480224609375, 5.678466796875, 6.0089111328125, 6.33935546875, 6.6697998046875, 7.000244140625, 7.3306884765625, 7.6611328125, 7.9915771484375, 8.322021484375, 8.6524658203125, 8.98291015625, 9.3133544921875, 9.643798828125, 9.9742431640625, 10.3046875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 6.0, 7.0, 12.0, 7.0, 7.0, 15.0, 11.0, 17.0, 32.0, 25.0, 20.0, 22.0, 23.0, 39.0, 43.0, 41.0, 33.0, 31.0, 32.0, 41.0, 50.0, 39.0, 38.0, 34.0, 38.0, 24.0, 33.0, 41.0, 41.0, 20.0, 34.0, 26.0, 22.0, 16.0, 14.0, 7.0, 6.0, 9.0, 6.0, 10.0, 4.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.0703125, -12.662353515625, -12.25439453125, -11.846435546875, -11.4384765625, -11.030517578125, -10.62255859375, -10.214599609375, -9.806640625, -9.398681640625, -8.99072265625, -8.582763671875, -8.1748046875, -7.766845703125, -7.35888671875, -6.950927734375, -6.54296875, -6.135009765625, -5.72705078125, -5.319091796875, -4.9111328125, -4.503173828125, -4.09521484375, -3.687255859375, -3.279296875, -2.871337890625, -2.46337890625, -2.055419921875, -1.6474609375, -1.239501953125, -0.83154296875, -0.423583984375, -0.015625, 0.392333984375, 0.80029296875, 1.208251953125, 1.6162109375, 2.024169921875, 2.43212890625, 2.840087890625, 3.248046875, 3.656005859375, 4.06396484375, 4.471923828125, 4.8798828125, 5.287841796875, 5.69580078125, 6.103759765625, 6.51171875, 6.919677734375, 7.32763671875, 7.735595703125, 8.1435546875, 8.551513671875, 8.95947265625, 9.367431640625, 9.775390625, 10.183349609375, 10.59130859375, 10.999267578125, 11.4072265625, 11.815185546875, 12.22314453125, 12.631103515625, 13.0390625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 7.0, 9.0, 10.0, 17.0, 35.0, 43.0, 61.0, 125.0, 170.0, 234.0, 377.0, 561.0, 797.0, 1199.0, 1813.0, 2798.0, 4238.0, 6656.0, 10348.0, 16055.0, 25578.0, 38449.0, 57980.0, 82791.0, 109264.0, 130881.0, 136108.0, 121355.0, 96107.0, 69374.0, 46867.0, 31312.0, 20035.0, 12936.0, 8303.0, 5302.0, 3459.0, 2277.0, 1502.0, 1035.0, 660.0, 470.0, 321.0, 193.0, 143.0, 103.0, 73.0, 43.0, 29.0, 17.0, 17.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-11.234375, -10.885986328125, -10.53759765625, -10.189208984375, -9.8408203125, -9.492431640625, -9.14404296875, -8.795654296875, -8.447265625, -8.098876953125, -7.75048828125, -7.402099609375, -7.0537109375, -6.705322265625, -6.35693359375, -6.008544921875, -5.66015625, -5.311767578125, -4.96337890625, -4.614990234375, -4.2666015625, -3.918212890625, -3.56982421875, -3.221435546875, -2.873046875, -2.524658203125, -2.17626953125, -1.827880859375, -1.4794921875, -1.131103515625, -0.78271484375, -0.434326171875, -0.0859375, 0.262451171875, 0.61083984375, 0.959228515625, 1.3076171875, 1.656005859375, 2.00439453125, 2.352783203125, 2.701171875, 3.049560546875, 3.39794921875, 3.746337890625, 4.0947265625, 4.443115234375, 4.79150390625, 5.139892578125, 5.48828125, 5.836669921875, 6.18505859375, 6.533447265625, 6.8818359375, 7.230224609375, 7.57861328125, 7.927001953125, 8.275390625, 8.623779296875, 8.97216796875, 9.320556640625, 9.6689453125, 10.017333984375, 10.36572265625, 10.714111328125, 11.0625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 9.0, 6.0, 10.0, 17.0, 9.0, 12.0, 13.0, 14.0, 21.0, 19.0, 22.0, 34.0, 34.0, 27.0, 30.0, 39.0, 36.0, 33.0, 45.0, 34.0, 48.0, 45.0, 33.0, 33.0, 26.0, 34.0, 35.0, 30.0, 27.0, 33.0, 31.0, 21.0, 22.0, 24.0, 15.0, 7.0, 9.0, 14.0, 7.0, 10.0, 3.0, 6.0, 11.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-9.0390625, -8.7698974609375, -8.500732421875, -8.2315673828125, -7.96240234375, -7.6932373046875, -7.424072265625, -7.1549072265625, -6.8857421875, -6.6165771484375, -6.347412109375, -6.0782470703125, -5.80908203125, -5.5399169921875, -5.270751953125, -5.0015869140625, -4.732421875, -4.4632568359375, -4.194091796875, -3.9249267578125, -3.65576171875, -3.3865966796875, -3.117431640625, -2.8482666015625, -2.5791015625, -2.3099365234375, -2.040771484375, -1.7716064453125, -1.50244140625, -1.2332763671875, -0.964111328125, -0.6949462890625, -0.42578125, -0.1566162109375, 0.112548828125, 0.3817138671875, 0.65087890625, 0.9200439453125, 1.189208984375, 1.4583740234375, 1.7275390625, 1.9967041015625, 2.265869140625, 2.5350341796875, 2.80419921875, 3.0733642578125, 3.342529296875, 3.6116943359375, 3.880859375, 4.1500244140625, 4.419189453125, 4.6883544921875, 4.95751953125, 5.2266845703125, 5.495849609375, 5.7650146484375, 6.0341796875, 6.3033447265625, 6.572509765625, 6.8416748046875, 7.11083984375, 7.3800048828125, 7.649169921875, 7.9183349609375, 8.1875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 4.0, 0.0, 9.0, 2.0, 7.0, 9.0, 24.0, 22.0, 37.0, 52.0, 81.0, 127.0, 198.0, 293.0, 499.0, 781.0, 1201.0, 2093.0, 3707.0, 6459.0, 11743.0, 21699.0, 41113.0, 79188.0, 144675.0, 215558.0, 213364.0, 141148.0, 77006.0, 40080.0, 21103.0, 11237.0, 6240.0, 3561.0, 2063.0, 1165.0, 728.0, 454.0, 267.0, 201.0, 128.0, 85.0, 43.0, 41.0, 20.0, 18.0, 6.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.4609375, -12.0308837890625, -11.600830078125, -11.1707763671875, -10.74072265625, -10.3106689453125, -9.880615234375, -9.4505615234375, -9.0205078125, -8.5904541015625, -8.160400390625, -7.7303466796875, -7.30029296875, -6.8702392578125, -6.440185546875, -6.0101318359375, -5.580078125, -5.1500244140625, -4.719970703125, -4.2899169921875, -3.85986328125, -3.4298095703125, -2.999755859375, -2.5697021484375, -2.1396484375, -1.7095947265625, -1.279541015625, -0.8494873046875, -0.41943359375, 0.0106201171875, 0.440673828125, 0.8707275390625, 1.30078125, 1.7308349609375, 2.160888671875, 2.5909423828125, 3.02099609375, 3.4510498046875, 3.881103515625, 4.3111572265625, 4.7412109375, 5.1712646484375, 5.601318359375, 6.0313720703125, 6.46142578125, 6.8914794921875, 7.321533203125, 7.7515869140625, 8.181640625, 8.6116943359375, 9.041748046875, 9.4718017578125, 9.90185546875, 10.3319091796875, 10.761962890625, 11.1920166015625, 11.6220703125, 12.0521240234375, 12.482177734375, 12.9122314453125, 13.34228515625, 13.7723388671875, 14.202392578125, 14.6324462890625, 15.0625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 7.0, 11.0, 14.0, 18.0, 30.0, 35.0, 42.0, 56.0, 60.0, 77.0, 91.0, 93.0, 84.0, 70.0, 66.0, 58.0, 45.0, 37.0, 25.0, 25.0, 19.0, 16.0, 6.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010709762573242188, -0.0010169297456741333, -0.0009628832340240479, -0.0009088367223739624, -0.000854790210723877, -0.0008007436990737915, -0.0007466971874237061, -0.0006926506757736206, -0.0006386041641235352, -0.0005845576524734497, -0.0005305111408233643, -0.0004764646291732788, -0.00042241811752319336, -0.0003683716058731079, -0.00031432509422302246, -0.000260278582572937, -0.00020623207092285156, -0.0001521855592727661, -9.813904762268066e-05, -4.4092535972595215e-05, 9.953975677490234e-06, 6.400048732757568e-05, 0.00011804699897766113, 0.00017209351062774658, 0.00022614002227783203, 0.0002801865339279175, 0.00033423304557800293, 0.0003882795572280884, 0.00044232606887817383, 0.0004963725805282593, 0.0005504190921783447, 0.0006044656038284302, 0.0006585121154785156, 0.0007125586271286011, 0.0007666051387786865, 0.000820651650428772, 0.0008746981620788574, 0.0009287446737289429, 0.0009827911853790283, 0.0010368376970291138, 0.0010908842086791992, 0.0011449307203292847, 0.0011989772319793701, 0.0012530237436294556, 0.001307070255279541, 0.0013611167669296265, 0.001415163278579712, 0.0014692097902297974, 0.0015232563018798828, 0.0015773028135299683, 0.0016313493251800537, 0.0016853958368301392, 0.0017394423484802246, 0.00179348886013031, 0.0018475353717803955, 0.001901581883430481, 0.0019556283950805664, 0.002009674906730652, 0.0020637214183807373, 0.0021177679300308228, 0.002171814441680908, 0.0022258609533309937, 0.002279907464981079, 0.0023339539766311646, 0.00238800048828125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 7.0, 16.0, 11.0, 22.0, 31.0, 48.0, 71.0, 115.0, 160.0, 224.0, 421.0, 674.0, 1202.0, 2137.0, 4205.0, 8099.0, 16358.0, 33959.0, 70540.0, 141798.0, 229378.0, 235063.0, 152643.0, 77791.0, 37156.0, 17665.0, 8761.0, 4519.0, 2301.0, 1263.0, 702.0, 429.0, 255.0, 180.0, 115.0, 73.0, 47.0, 31.0, 22.0, 12.0, 17.0, 5.0, 7.0, 5.0, 6.0, 7.0, 0.0, 3.0, 0.0, 1.0], "bins": [-16.203125, -15.740966796875, -15.27880859375, -14.816650390625, -14.3544921875, -13.892333984375, -13.43017578125, -12.968017578125, -12.505859375, -12.043701171875, -11.58154296875, -11.119384765625, -10.6572265625, -10.195068359375, -9.73291015625, -9.270751953125, -8.80859375, -8.346435546875, -7.88427734375, -7.422119140625, -6.9599609375, -6.497802734375, -6.03564453125, -5.573486328125, -5.111328125, -4.649169921875, -4.18701171875, -3.724853515625, -3.2626953125, -2.800537109375, -2.33837890625, -1.876220703125, -1.4140625, -0.951904296875, -0.48974609375, -0.027587890625, 0.4345703125, 0.896728515625, 1.35888671875, 1.821044921875, 2.283203125, 2.745361328125, 3.20751953125, 3.669677734375, 4.1318359375, 4.593994140625, 5.05615234375, 5.518310546875, 5.98046875, 6.442626953125, 6.90478515625, 7.366943359375, 7.8291015625, 8.291259765625, 8.75341796875, 9.215576171875, 9.677734375, 10.139892578125, 10.60205078125, 11.064208984375, 11.5263671875, 11.988525390625, 12.45068359375, 12.912841796875, 13.375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 7.0, 12.0, 5.0, 14.0, 15.0, 15.0, 15.0, 21.0, 19.0, 26.0, 20.0, 36.0, 36.0, 35.0, 37.0, 58.0, 58.0, 55.0, 69.0, 50.0, 52.0, 53.0, 66.0, 35.0, 29.0, 35.0, 28.0, 16.0, 13.0, 16.0, 16.0, 7.0, 13.0, 3.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.275390625, -3.1685791015625, -3.061767578125, -2.9549560546875, -2.84814453125, -2.7413330078125, -2.634521484375, -2.5277099609375, -2.4208984375, -2.3140869140625, -2.207275390625, -2.1004638671875, -1.99365234375, -1.8868408203125, -1.780029296875, -1.6732177734375, -1.56640625, -1.4595947265625, -1.352783203125, -1.2459716796875, -1.13916015625, -1.0323486328125, -0.925537109375, -0.8187255859375, -0.7119140625, -0.6051025390625, -0.498291015625, -0.3914794921875, -0.28466796875, -0.1778564453125, -0.071044921875, 0.0357666015625, 0.142578125, 0.2493896484375, 0.356201171875, 0.4630126953125, 0.56982421875, 0.6766357421875, 0.783447265625, 0.8902587890625, 0.9970703125, 1.1038818359375, 1.210693359375, 1.3175048828125, 1.42431640625, 1.5311279296875, 1.637939453125, 1.7447509765625, 1.8515625, 1.9583740234375, 2.065185546875, 2.1719970703125, 2.27880859375, 2.3856201171875, 2.492431640625, 2.5992431640625, 2.7060546875, 2.8128662109375, 2.919677734375, 3.0264892578125, 3.13330078125, 3.2401123046875, 3.346923828125, 3.4537353515625, 3.560546875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 6.0, 10.0, 7.0, 8.0, 16.0, 20.0, 19.0, 35.0, 30.0, 30.0, 49.0, 38.0, 63.0, 66.0, 64.0, 56.0, 73.0, 66.0, 57.0, 51.0, 49.0, 33.0, 24.0, 28.0, 22.0, 16.0, 10.0, 15.0, 12.0, 9.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.925884246826172, -18.344158172607422, -17.762432098388672, -17.180706024169922, -16.598979949951172, -16.017255783081055, -15.435529708862305, -14.853803634643555, -14.272077560424805, -13.690351486206055, -13.108625411987305, -12.526900291442871, -11.945174217224121, -11.363448143005371, -10.781723022460938, -10.199996948242188, -9.618270874023438, -9.036544799804688, -8.454818725585938, -7.873093605041504, -7.291367530822754, -6.709641456604004, -6.127915859222412, -5.54619026184082, -4.96446418762207, -4.38273811340332, -3.8010125160217285, -3.2192866802215576, -2.6375608444213867, -2.055835008621216, -1.474109172821045, -0.8923835754394531, -0.3106575012207031, 0.2710683345794678, 0.8527941703796387, 1.4345200061798096, 2.0162458419799805, 2.5979716777801514, 3.1796975135803223, 3.761423110961914, 4.343149185180664, 4.924875259399414, 5.506600856781006, 6.088326454162598, 6.670052528381348, 7.251778602600098, 7.8335041999816895, 8.415229797363281, 8.996955871582031, 9.578681945800781, 10.160408020019531, 10.742133140563965, 11.323859214782715, 11.905585289001465, 12.487310409545898, 13.069036483764648, 13.650762557983398, 14.232488632202148, 14.814214706420898, 15.395939826965332, 15.977665901184082, 16.559391021728516, 17.141117095947266, 17.722843170166016, 18.304569244384766]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 6.0, 6.0, 11.0, 12.0, 12.0, 11.0, 14.0, 14.0, 17.0, 16.0, 27.0, 18.0, 21.0, 24.0, 28.0, 35.0, 27.0, 36.0, 36.0, 33.0, 34.0, 39.0, 48.0, 33.0, 38.0, 35.0, 28.0, 39.0, 29.0, 20.0, 25.0, 16.0, 30.0, 27.0, 20.0, 14.0, 20.0, 14.0, 12.0, 11.0, 5.0, 13.0, 5.0, 9.0, 10.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-11.267414093017578, -10.8882417678833, -10.509069442749023, -10.129897117614746, -9.750724792480469, -9.371553421020508, -8.99238109588623, -8.613208770751953, -8.234036445617676, -7.854864120483398, -7.475691795349121, -7.096519947052002, -6.717347621917725, -6.338175296783447, -5.959003448486328, -5.579831123352051, -5.200658798217773, -4.821486473083496, -4.442314147949219, -4.0631422996521, -3.6839699745178223, -3.304797649383545, -2.9256255626678467, -2.5464534759521484, -2.167281150817871, -1.7881089448928833, -1.4089367389678955, -1.0297645330429077, -0.6505923271179199, -0.27142012119293213, 0.10775208473205566, 0.4869241714477539, 0.8660955429077148, 1.2452677488327026, 1.6244399547576904, 2.0036120414733887, 2.382784366607666, 2.7619566917419434, 3.1411287784576416, 3.52030086517334, 3.899473190307617, 4.2786455154418945, 4.657817840576172, 5.036989688873291, 5.416162014007568, 5.795334339141846, 6.174506187438965, 6.553678512573242, 6.9328508377075195, 7.312023162841797, 7.691195487976074, 8.070367813110352, 8.449539184570312, 8.82871150970459, 9.207883834838867, 9.587056159973145, 9.966228485107422, 10.3454008102417, 10.724573135375977, 11.103745460510254, 11.482917785644531, 11.862089157104492, 12.24126148223877, 12.620433807373047, 12.999606132507324]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 23.0, 34.0, 47.0, 63.0, 112.0, 147.0, 261.0, 425.0, 646.0, 1032.0, 1734.0, 2861.0, 4728.0, 7842.0, 12972.0, 22349.0, 37767.0, 66672.0, 119785.0, 221210.0, 407467.0, 672667.0, 842449.0, 730747.0, 466408.0, 255253.0, 137538.0, 75797.0, 43165.0, 24901.0, 14655.0, 8839.0, 5226.0, 3237.0, 1966.0, 1171.0, 760.0, 500.0, 311.0, 168.0, 133.0, 80.0, 44.0, 22.0, 16.0, 11.0, 7.0, 9.0, 2.0, 3.0, 2.0, 2.0], "bins": [-12.875, -12.5030517578125, -12.131103515625, -11.7591552734375, -11.38720703125, -11.0152587890625, -10.643310546875, -10.2713623046875, -9.8994140625, -9.5274658203125, -9.155517578125, -8.7835693359375, -8.41162109375, -8.0396728515625, -7.667724609375, -7.2957763671875, -6.923828125, -6.5518798828125, -6.179931640625, -5.8079833984375, -5.43603515625, -5.0640869140625, -4.692138671875, -4.3201904296875, -3.9482421875, -3.5762939453125, -3.204345703125, -2.8323974609375, -2.46044921875, -2.0885009765625, -1.716552734375, -1.3446044921875, -0.97265625, -0.6007080078125, -0.228759765625, 0.1431884765625, 0.51513671875, 0.8870849609375, 1.259033203125, 1.6309814453125, 2.0029296875, 2.3748779296875, 2.746826171875, 3.1187744140625, 3.49072265625, 3.8626708984375, 4.234619140625, 4.6065673828125, 4.978515625, 5.3504638671875, 5.722412109375, 6.0943603515625, 6.46630859375, 6.8382568359375, 7.210205078125, 7.5821533203125, 7.9541015625, 8.3260498046875, 8.697998046875, 9.0699462890625, 9.44189453125, 9.8138427734375, 10.185791015625, 10.5577392578125, 10.9296875]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 9.0, 3.0, 7.0, 8.0, 9.0, 9.0, 10.0, 14.0, 15.0, 18.0, 12.0, 16.0, 32.0, 23.0, 25.0, 29.0, 28.0, 31.0, 39.0, 36.0, 33.0, 30.0, 33.0, 37.0, 40.0, 44.0, 32.0, 39.0, 41.0, 24.0, 25.0, 29.0, 27.0, 32.0, 22.0, 22.0, 19.0, 16.0, 12.0, 12.0, 11.0, 13.0, 9.0, 7.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-9.390625, -9.1121826171875, -8.833740234375, -8.5552978515625, -8.27685546875, -7.9984130859375, -7.719970703125, -7.4415283203125, -7.1630859375, -6.8846435546875, -6.606201171875, -6.3277587890625, -6.04931640625, -5.7708740234375, -5.492431640625, -5.2139892578125, -4.935546875, -4.6571044921875, -4.378662109375, -4.1002197265625, -3.82177734375, -3.5433349609375, -3.264892578125, -2.9864501953125, -2.7080078125, -2.4295654296875, -2.151123046875, -1.8726806640625, -1.59423828125, -1.3157958984375, -1.037353515625, -0.7589111328125, -0.48046875, -0.2020263671875, 0.076416015625, 0.3548583984375, 0.63330078125, 0.9117431640625, 1.190185546875, 1.4686279296875, 1.7470703125, 2.0255126953125, 2.303955078125, 2.5823974609375, 2.86083984375, 3.1392822265625, 3.417724609375, 3.6961669921875, 3.974609375, 4.2530517578125, 4.531494140625, 4.8099365234375, 5.08837890625, 5.3668212890625, 5.645263671875, 5.9237060546875, 6.2021484375, 6.4805908203125, 6.759033203125, 7.0374755859375, 7.31591796875, 7.5943603515625, 7.872802734375, 8.1512451171875, 8.4296875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 15.0, 6.0, 9.0, 13.0, 34.0, 32.0, 80.0, 114.0, 195.0, 317.0, 583.0, 980.0, 1920.0, 3210.0, 6255.0, 11884.0, 22534.0, 44803.0, 90057.0, 184016.0, 365729.0, 673924.0, 955697.0, 831436.0, 494061.0, 253448.0, 125490.0, 62254.0, 31148.0, 15625.0, 8379.0, 4444.0, 2360.0, 1394.0, 781.0, 407.0, 260.0, 166.0, 81.0, 54.0, 35.0, 27.0, 15.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.30029296875, -13.8349609375, -13.36962890625, -12.904296875, -12.43896484375, -11.9736328125, -11.50830078125, -11.04296875, -10.57763671875, -10.1123046875, -9.64697265625, -9.181640625, -8.71630859375, -8.2509765625, -7.78564453125, -7.3203125, -6.85498046875, -6.3896484375, -5.92431640625, -5.458984375, -4.99365234375, -4.5283203125, -4.06298828125, -3.59765625, -3.13232421875, -2.6669921875, -2.20166015625, -1.736328125, -1.27099609375, -0.8056640625, -0.34033203125, 0.125, 0.59033203125, 1.0556640625, 1.52099609375, 1.986328125, 2.45166015625, 2.9169921875, 3.38232421875, 3.84765625, 4.31298828125, 4.7783203125, 5.24365234375, 5.708984375, 6.17431640625, 6.6396484375, 7.10498046875, 7.5703125, 8.03564453125, 8.5009765625, 8.96630859375, 9.431640625, 9.89697265625, 10.3623046875, 10.82763671875, 11.29296875, 11.75830078125, 12.2236328125, 12.68896484375, 13.154296875, 13.61962890625, 14.0849609375, 14.55029296875, 15.015625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 6.0, 18.0, 25.0, 33.0, 34.0, 56.0, 93.0, 89.0, 140.0, 161.0, 184.0, 234.0, 258.0, 302.0, 320.0, 285.0, 323.0, 306.0, 210.0, 206.0, 166.0, 135.0, 115.0, 80.0, 75.0, 55.0, 42.0, 24.0, 21.0, 18.0, 18.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.6717529296875, -4.491943359375, -4.3121337890625, -4.13232421875, -3.9525146484375, -3.772705078125, -3.5928955078125, -3.4130859375, -3.2332763671875, -3.053466796875, -2.8736572265625, -2.69384765625, -2.5140380859375, -2.334228515625, -2.1544189453125, -1.974609375, -1.7947998046875, -1.614990234375, -1.4351806640625, -1.25537109375, -1.0755615234375, -0.895751953125, -0.7159423828125, -0.5361328125, -0.3563232421875, -0.176513671875, 0.0032958984375, 0.18310546875, 0.3629150390625, 0.542724609375, 0.7225341796875, 0.90234375, 1.0821533203125, 1.261962890625, 1.4417724609375, 1.62158203125, 1.8013916015625, 1.981201171875, 2.1610107421875, 2.3408203125, 2.5206298828125, 2.700439453125, 2.8802490234375, 3.06005859375, 3.2398681640625, 3.419677734375, 3.5994873046875, 3.779296875, 3.9591064453125, 4.138916015625, 4.3187255859375, 4.49853515625, 4.6783447265625, 4.858154296875, 5.0379638671875, 5.2177734375, 5.3975830078125, 5.577392578125, 5.7572021484375, 5.93701171875, 6.1168212890625, 6.296630859375, 6.4764404296875, 6.65625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 4.0, 3.0, 13.0, 12.0, 22.0, 27.0, 22.0, 34.0, 37.0, 47.0, 48.0, 56.0, 77.0, 67.0, 66.0, 68.0, 60.0, 47.0, 42.0, 42.0, 38.0, 35.0, 30.0, 21.0, 21.0, 12.0, 10.0, 10.0, 7.0, 6.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.35306739807129, -15.859697341918945, -15.366327285766602, -14.872958183288574, -14.37958812713623, -13.886218070983887, -13.392848014831543, -12.899478912353516, -12.406108856201172, -11.912738800048828, -11.419368743896484, -10.925999641418457, -10.432629585266113, -9.93925952911377, -9.445889472961426, -8.952520370483398, -8.459150314331055, -7.965780258178711, -7.472410678863525, -6.979040622711182, -6.485671043395996, -5.992300987243652, -5.498930931091309, -5.005561351776123, -4.512190818786621, -4.018820762634277, -3.525451183319092, -3.032081127166748, -2.5387115478515625, -2.0453414916992188, -1.551971673965454, -1.0586018562316895, -0.5652322769165039, -0.07186242938041687, 0.42150741815567017, 0.9148772954940796, 1.4082471132278442, 1.9016170501708984, 2.394986867904663, 2.8883566856384277, 3.3817265033721924, 3.875096321105957, 4.368466377258301, 4.861835956573486, 5.35520601272583, 5.848575592041016, 6.341945648193359, 6.835315704345703, 7.328685283660889, 7.822055339813232, 8.315424919128418, 8.808794975280762, 9.302165031433105, 9.795534133911133, 10.288904190063477, 10.78227424621582, 11.275644302368164, 11.769014358520508, 12.262384414672852, 12.755753517150879, 13.249123573303223, 13.742493629455566, 14.23586368560791, 14.729232788085938, 15.222602844238281]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 9.0, 7.0, 11.0, 5.0, 12.0, 13.0, 20.0, 28.0, 30.0, 24.0, 25.0, 32.0, 33.0, 36.0, 45.0, 38.0, 41.0, 41.0, 42.0, 45.0, 34.0, 35.0, 40.0, 36.0, 36.0, 34.0, 28.0, 30.0, 28.0, 20.0, 25.0, 19.0, 18.0, 11.0, 11.0, 14.0, 11.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.916070938110352, -10.57299518585205, -10.22991943359375, -9.88684368133545, -9.543767929077148, -9.200692176818848, -8.857616424560547, -8.514540672302246, -8.171464920043945, -7.8283891677856445, -7.485313415527344, -7.142237663269043, -6.799161911010742, -6.456086158752441, -6.113010406494141, -5.76993465423584, -5.426858901977539, -5.083783149719238, -4.7407073974609375, -4.397631645202637, -4.054555892944336, -3.711480140686035, -3.3684043884277344, -3.0253286361694336, -2.682252883911133, -2.339177131652832, -1.9961013793945312, -1.6530256271362305, -1.3099498748779297, -0.9668741226196289, -0.6237983703613281, -0.28072261810302734, 0.062354087829589844, 0.4054298400878906, 0.7485055923461914, 1.0915813446044922, 1.434657096862793, 1.7777328491210938, 2.1208086013793945, 2.4638843536376953, 2.806960105895996, 3.150035858154297, 3.4931116104125977, 3.8361873626708984, 4.179263114929199, 4.5223388671875, 4.865414619445801, 5.208490371704102, 5.551566123962402, 5.894641876220703, 6.237717628479004, 6.580793380737305, 6.9238691329956055, 7.266944885253906, 7.610020637512207, 7.953096389770508, 8.296172142028809, 8.63924789428711, 8.98232364654541, 9.325399398803711, 9.668475151062012, 10.011550903320312, 10.354626655578613, 10.697702407836914, 11.040778160095215]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 10.0, 7.0, 21.0, 15.0, 30.0, 42.0, 66.0, 88.0, 128.0, 169.0, 242.0, 348.0, 440.0, 606.0, 930.0, 1328.0, 2095.0, 3140.0, 4886.0, 8178.0, 14342.0, 29209.0, 71116.0, 198042.0, 357410.0, 210879.0, 75655.0, 30505.0, 15035.0, 8460.0, 5157.0, 3281.0, 2184.0, 1368.0, 904.0, 642.0, 471.0, 341.0, 240.0, 175.0, 112.0, 85.0, 42.0, 43.0, 26.0, 21.0, 16.0, 11.0, 3.0, 7.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-33.78125, -32.6748046875, -31.568359375, -30.4619140625, -29.35546875, -28.2490234375, -27.142578125, -26.0361328125, -24.9296875, -23.8232421875, -22.716796875, -21.6103515625, -20.50390625, -19.3974609375, -18.291015625, -17.1845703125, -16.078125, -14.9716796875, -13.865234375, -12.7587890625, -11.65234375, -10.5458984375, -9.439453125, -8.3330078125, -7.2265625, -6.1201171875, -5.013671875, -3.9072265625, -2.80078125, -1.6943359375, -0.587890625, 0.5185546875, 1.625, 2.7314453125, 3.837890625, 4.9443359375, 6.05078125, 7.1572265625, 8.263671875, 9.3701171875, 10.4765625, 11.5830078125, 12.689453125, 13.7958984375, 14.90234375, 16.0087890625, 17.115234375, 18.2216796875, 19.328125, 20.4345703125, 21.541015625, 22.6474609375, 23.75390625, 24.8603515625, 25.966796875, 27.0732421875, 28.1796875, 29.2861328125, 30.392578125, 31.4990234375, 32.60546875, 33.7119140625, 34.818359375, 35.9248046875, 37.03125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 1.0, 7.0, 3.0, 8.0, 6.0, 6.0, 6.0, 16.0, 14.0, 18.0, 21.0, 18.0, 33.0, 31.0, 30.0, 34.0, 31.0, 37.0, 43.0, 46.0, 34.0, 35.0, 34.0, 38.0, 35.0, 42.0, 45.0, 44.0, 41.0, 25.0, 26.0, 28.0, 22.0, 25.0, 18.0, 22.0, 15.0, 13.0, 14.0, 8.0, 6.0, 7.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.09375, -9.7830810546875, -9.472412109375, -9.1617431640625, -8.85107421875, -8.5404052734375, -8.229736328125, -7.9190673828125, -7.6083984375, -7.2977294921875, -6.987060546875, -6.6763916015625, -6.36572265625, -6.0550537109375, -5.744384765625, -5.4337158203125, -5.123046875, -4.8123779296875, -4.501708984375, -4.1910400390625, -3.88037109375, -3.5697021484375, -3.259033203125, -2.9483642578125, -2.6376953125, -2.3270263671875, -2.016357421875, -1.7056884765625, -1.39501953125, -1.0843505859375, -0.773681640625, -0.4630126953125, -0.15234375, 0.1583251953125, 0.468994140625, 0.7796630859375, 1.09033203125, 1.4010009765625, 1.711669921875, 2.0223388671875, 2.3330078125, 2.6436767578125, 2.954345703125, 3.2650146484375, 3.57568359375, 3.8863525390625, 4.197021484375, 4.5076904296875, 4.818359375, 5.1290283203125, 5.439697265625, 5.7503662109375, 6.06103515625, 6.3717041015625, 6.682373046875, 6.9930419921875, 7.3037109375, 7.6143798828125, 7.925048828125, 8.2357177734375, 8.54638671875, 8.8570556640625, 9.167724609375, 9.4783935546875, 9.7890625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 21.0, 14.0, 27.0, 55.0, 69.0, 119.0, 199.0, 354.0, 500.0, 771.0, 1372.0, 2199.0, 3706.0, 6576.0, 11647.0, 22201.0, 46851.0, 115482.0, 302284.0, 311853.0, 121886.0, 49024.0, 22885.0, 12069.0, 6735.0, 3749.0, 2281.0, 1365.0, 842.0, 544.0, 325.0, 204.0, 124.0, 82.0, 44.0, 24.0, 15.0, 8.0, 9.0, 9.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-34.90625, -33.88037109375, -32.8544921875, -31.82861328125, -30.802734375, -29.77685546875, -28.7509765625, -27.72509765625, -26.69921875, -25.67333984375, -24.6474609375, -23.62158203125, -22.595703125, -21.56982421875, -20.5439453125, -19.51806640625, -18.4921875, -17.46630859375, -16.4404296875, -15.41455078125, -14.388671875, -13.36279296875, -12.3369140625, -11.31103515625, -10.28515625, -9.25927734375, -8.2333984375, -7.20751953125, -6.181640625, -5.15576171875, -4.1298828125, -3.10400390625, -2.078125, -1.05224609375, -0.0263671875, 0.99951171875, 2.025390625, 3.05126953125, 4.0771484375, 5.10302734375, 6.12890625, 7.15478515625, 8.1806640625, 9.20654296875, 10.232421875, 11.25830078125, 12.2841796875, 13.31005859375, 14.3359375, 15.36181640625, 16.3876953125, 17.41357421875, 18.439453125, 19.46533203125, 20.4912109375, 21.51708984375, 22.54296875, 23.56884765625, 24.5947265625, 25.62060546875, 26.646484375, 27.67236328125, 28.6982421875, 29.72412109375, 30.75]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 7.0, 6.0, 9.0, 12.0, 14.0, 23.0, 15.0, 29.0, 24.0, 27.0, 38.0, 38.0, 56.0, 35.0, 48.0, 44.0, 52.0, 57.0, 46.0, 39.0, 61.0, 37.0, 43.0, 37.0, 32.0, 31.0, 27.0, 20.0, 20.0, 15.0, 16.0, 12.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.93505859375, -8.6826171875, -8.43017578125, -8.177734375, -7.92529296875, -7.6728515625, -7.42041015625, -7.16796875, -6.91552734375, -6.6630859375, -6.41064453125, -6.158203125, -5.90576171875, -5.6533203125, -5.40087890625, -5.1484375, -4.89599609375, -4.6435546875, -4.39111328125, -4.138671875, -3.88623046875, -3.6337890625, -3.38134765625, -3.12890625, -2.87646484375, -2.6240234375, -2.37158203125, -2.119140625, -1.86669921875, -1.6142578125, -1.36181640625, -1.109375, -0.85693359375, -0.6044921875, -0.35205078125, -0.099609375, 0.15283203125, 0.4052734375, 0.65771484375, 0.91015625, 1.16259765625, 1.4150390625, 1.66748046875, 1.919921875, 2.17236328125, 2.4248046875, 2.67724609375, 2.9296875, 3.18212890625, 3.4345703125, 3.68701171875, 3.939453125, 4.19189453125, 4.4443359375, 4.69677734375, 4.94921875, 5.20166015625, 5.4541015625, 5.70654296875, 5.958984375, 6.21142578125, 6.4638671875, 6.71630859375, 6.96875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 11.0, 25.0, 25.0, 33.0, 54.0, 83.0, 130.0, 169.0, 281.0, 380.0, 620.0, 955.0, 1488.0, 2471.0, 3965.0, 6912.0, 13229.0, 28187.0, 75232.0, 239899.0, 409027.0, 164285.0, 53671.0, 21813.0, 10506.0, 5873.0, 3480.0, 2012.0, 1246.0, 853.0, 579.0, 348.0, 234.0, 152.0, 100.0, 79.0, 37.0, 36.0, 19.0, 18.0, 12.0, 7.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.73291015625, -17.1845703125, -16.63623046875, -16.087890625, -15.53955078125, -14.9912109375, -14.44287109375, -13.89453125, -13.34619140625, -12.7978515625, -12.24951171875, -11.701171875, -11.15283203125, -10.6044921875, -10.05615234375, -9.5078125, -8.95947265625, -8.4111328125, -7.86279296875, -7.314453125, -6.76611328125, -6.2177734375, -5.66943359375, -5.12109375, -4.57275390625, -4.0244140625, -3.47607421875, -2.927734375, -2.37939453125, -1.8310546875, -1.28271484375, -0.734375, -0.18603515625, 0.3623046875, 0.91064453125, 1.458984375, 2.00732421875, 2.5556640625, 3.10400390625, 3.65234375, 4.20068359375, 4.7490234375, 5.29736328125, 5.845703125, 6.39404296875, 6.9423828125, 7.49072265625, 8.0390625, 8.58740234375, 9.1357421875, 9.68408203125, 10.232421875, 10.78076171875, 11.3291015625, 11.87744140625, 12.42578125, 12.97412109375, 13.5224609375, 14.07080078125, 14.619140625, 15.16748046875, 15.7158203125, 16.26416015625, 16.8125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 7.0, 5.0, 13.0, 15.0, 32.0, 54.0, 113.0, 208.0, 239.0, 133.0, 69.0, 24.0, 19.0, 12.0, 10.0, 6.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001354217529296875, -0.0013023614883422852, -0.0012505054473876953, -0.0011986494064331055, -0.0011467933654785156, -0.0010949373245239258, -0.001043081283569336, -0.000991225242614746, -0.0009393692016601562, -0.0008875131607055664, -0.0008356571197509766, -0.0007838010787963867, -0.0007319450378417969, -0.000680088996887207, -0.0006282329559326172, -0.0005763769149780273, -0.0005245208740234375, -0.00047266483306884766, -0.0004208087921142578, -0.00036895275115966797, -0.0003170967102050781, -0.0002652406692504883, -0.00021338462829589844, -0.0001615285873413086, -0.00010967254638671875, -5.7816505432128906e-05, -5.9604644775390625e-06, 4.589557647705078e-05, 9.775161743164062e-05, 0.00014960765838623047, 0.0002014636993408203, 0.00025331974029541016, 0.00030517578125, 0.00035703182220458984, 0.0004088878631591797, 0.00046074390411376953, 0.0005125999450683594, 0.0005644559860229492, 0.0006163120269775391, 0.0006681680679321289, 0.0007200241088867188, 0.0007718801498413086, 0.0008237361907958984, 0.0008755922317504883, 0.0009274482727050781, 0.000979304313659668, 0.0010311603546142578, 0.0010830163955688477, 0.0011348724365234375, 0.0011867284774780273, 0.0012385845184326172, 0.001290440559387207, 0.0013422966003417969, 0.0013941526412963867, 0.0014460086822509766, 0.0014978647232055664, 0.0015497207641601562, 0.001601576805114746, 0.001653432846069336, 0.0017052888870239258, 0.0017571449279785156, 0.0018090009689331055, 0.0018608570098876953, 0.0019127130508422852, 0.001964569091796875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 5.0, 4.0, 5.0, 21.0, 25.0, 27.0, 42.0, 49.0, 92.0, 129.0, 189.0, 282.0, 383.0, 512.0, 775.0, 1145.0, 1684.0, 2394.0, 3477.0, 5543.0, 8707.0, 14192.0, 24289.0, 43735.0, 81277.0, 148599.0, 220437.0, 204474.0, 125885.0, 67957.0, 36777.0, 20851.0, 12106.0, 7511.0, 4847.0, 3155.0, 2081.0, 1532.0, 1052.0, 706.0, 464.0, 346.0, 253.0, 167.0, 119.0, 77.0, 54.0, 54.0, 15.0, 21.0, 13.0, 7.0, 8.0, 5.0, 4.0, 1.0, 1.0], "bins": [-10.6953125, -10.37939453125, -10.0634765625, -9.74755859375, -9.431640625, -9.11572265625, -8.7998046875, -8.48388671875, -8.16796875, -7.85205078125, -7.5361328125, -7.22021484375, -6.904296875, -6.58837890625, -6.2724609375, -5.95654296875, -5.640625, -5.32470703125, -5.0087890625, -4.69287109375, -4.376953125, -4.06103515625, -3.7451171875, -3.42919921875, -3.11328125, -2.79736328125, -2.4814453125, -2.16552734375, -1.849609375, -1.53369140625, -1.2177734375, -0.90185546875, -0.5859375, -0.27001953125, 0.0458984375, 0.36181640625, 0.677734375, 0.99365234375, 1.3095703125, 1.62548828125, 1.94140625, 2.25732421875, 2.5732421875, 2.88916015625, 3.205078125, 3.52099609375, 3.8369140625, 4.15283203125, 4.46875, 4.78466796875, 5.1005859375, 5.41650390625, 5.732421875, 6.04833984375, 6.3642578125, 6.68017578125, 6.99609375, 7.31201171875, 7.6279296875, 7.94384765625, 8.259765625, 8.57568359375, 8.8916015625, 9.20751953125, 9.5234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 5.0, 4.0, 6.0, 7.0, 10.0, 14.0, 12.0, 12.0, 24.0, 25.0, 27.0, 46.0, 46.0, 47.0, 56.0, 65.0, 63.0, 65.0, 73.0, 58.0, 48.0, 46.0, 29.0, 35.0, 34.0, 20.0, 20.0, 20.0, 10.0, 10.0, 15.0, 9.0, 5.0, 7.0, 4.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.77734375, -3.6678466796875, -3.558349609375, -3.4488525390625, -3.33935546875, -3.2298583984375, -3.120361328125, -3.0108642578125, -2.9013671875, -2.7918701171875, -2.682373046875, -2.5728759765625, -2.46337890625, -2.3538818359375, -2.244384765625, -2.1348876953125, -2.025390625, -1.9158935546875, -1.806396484375, -1.6968994140625, -1.58740234375, -1.4779052734375, -1.368408203125, -1.2589111328125, -1.1494140625, -1.0399169921875, -0.930419921875, -0.8209228515625, -0.71142578125, -0.6019287109375, -0.492431640625, -0.3829345703125, -0.2734375, -0.1639404296875, -0.054443359375, 0.0550537109375, 0.16455078125, 0.2740478515625, 0.383544921875, 0.4930419921875, 0.6025390625, 0.7120361328125, 0.821533203125, 0.9310302734375, 1.04052734375, 1.1500244140625, 1.259521484375, 1.3690185546875, 1.478515625, 1.5880126953125, 1.697509765625, 1.8070068359375, 1.91650390625, 2.0260009765625, 2.135498046875, 2.2449951171875, 2.3544921875, 2.4639892578125, 2.573486328125, 2.6829833984375, 2.79248046875, 2.9019775390625, 3.011474609375, 3.1209716796875, 3.23046875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 5.0, 10.0, 15.0, 18.0, 30.0, 27.0, 41.0, 33.0, 33.0, 56.0, 43.0, 58.0, 56.0, 67.0, 59.0, 46.0, 45.0, 57.0, 44.0, 36.0, 36.0, 29.0, 36.0, 22.0, 15.0, 15.0, 11.0, 11.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.397262573242188, -11.993739128112793, -11.590215682983398, -11.18669319152832, -10.783169746398926, -10.379646301269531, -9.976123809814453, -9.572600364685059, -9.169076919555664, -8.76555347442627, -8.362030029296875, -7.958507537841797, -7.554984092712402, -7.151460647583008, -6.7479376792907715, -6.344414710998535, -5.940891265869141, -5.537367820739746, -5.13384485244751, -4.730321884155273, -4.326798439025879, -3.9232752323150635, -3.519752025604248, -3.1162288188934326, -2.712705612182617, -2.3091824054718018, -1.9056591987609863, -1.502135992050171, -1.0986127853393555, -0.69508957862854, -0.2915663719177246, 0.11195683479309082, 0.5154809951782227, 0.9190042018890381, 1.3225274085998535, 1.726050615310669, 2.1295738220214844, 2.5330970287323, 2.9366202354431152, 3.3401434421539307, 3.743666648864746, 4.147190093994141, 4.550713062286377, 4.954236030578613, 5.357759475708008, 5.761282920837402, 6.164805889129639, 6.568328857421875, 6.9718523025512695, 7.375375747680664, 7.7788987159729, 8.182421684265137, 8.585945129394531, 8.989468574523926, 9.39299201965332, 9.796514511108398, 10.200037956237793, 10.603561401367188, 11.007083892822266, 11.41060733795166, 11.814130783081055, 12.21765422821045, 12.621177673339844, 13.024700164794922, 13.428223609924316]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 9.0, 6.0, 9.0, 6.0, 24.0, 20.0, 15.0, 12.0, 25.0, 30.0, 23.0, 34.0, 47.0, 31.0, 40.0, 42.0, 42.0, 33.0, 29.0, 41.0, 41.0, 44.0, 38.0, 24.0, 42.0, 27.0, 34.0, 30.0, 23.0, 18.0, 15.0, 34.0, 16.0, 13.0, 18.0, 8.0, 10.0, 3.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.400344848632812, -9.10395622253418, -8.807567596435547, -8.511178970336914, -8.214790344238281, -7.918401718139648, -7.622012615203857, -7.325623989105225, -7.029235363006592, -6.732846736907959, -6.436458110809326, -6.140069484710693, -5.843680381774902, -5.5472917556762695, -5.250903129577637, -4.954514503479004, -4.658125877380371, -4.361737251281738, -4.0653486251831055, -3.7689597606658936, -3.4725711345672607, -3.176182508468628, -2.879793643951416, -2.583405017852783, -2.2870163917541504, -1.9906277656555176, -1.6942390203475952, -1.3978502750396729, -1.10146164894104, -0.8050730228424072, -0.5086842775344849, -0.2122955322265625, 0.08409404754638672, 0.3804827332496643, 0.6768714189529419, 0.9732601046562195, 1.269648790359497, 1.5660374164581299, 1.8624261617660522, 2.1588149070739746, 2.4552035331726074, 2.7515921592712402, 3.047980785369873, 3.344369649887085, 3.6407582759857178, 3.9371469020843506, 4.2335357666015625, 4.529924392700195, 4.826313018798828, 5.122701644897461, 5.419090270996094, 5.715478897094727, 6.011867523193359, 6.308256149291992, 6.604645252227783, 6.901033878326416, 7.197422504425049, 7.493811130523682, 7.7901997566223145, 8.086588859558105, 8.382977485656738, 8.679366111755371, 8.975754737854004, 9.272143363952637, 9.56853199005127]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 7.0, 14.0, 16.0, 33.0, 50.0, 75.0, 117.0, 153.0, 242.0, 360.0, 596.0, 888.0, 1447.0, 2242.0, 3461.0, 5398.0, 8505.0, 13307.0, 21045.0, 32578.0, 48962.0, 70915.0, 98560.0, 124216.0, 136167.0, 130083.0, 107818.0, 80482.0, 56051.0, 37048.0, 24173.0, 15801.0, 10124.0, 6410.0, 4009.0, 2570.0, 1594.0, 1081.0, 667.0, 437.0, 293.0, 200.0, 118.0, 102.0, 59.0, 29.0, 22.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-9.2890625, -9.01318359375, -8.7373046875, -8.46142578125, -8.185546875, -7.90966796875, -7.6337890625, -7.35791015625, -7.08203125, -6.80615234375, -6.5302734375, -6.25439453125, -5.978515625, -5.70263671875, -5.4267578125, -5.15087890625, -4.875, -4.59912109375, -4.3232421875, -4.04736328125, -3.771484375, -3.49560546875, -3.2197265625, -2.94384765625, -2.66796875, -2.39208984375, -2.1162109375, -1.84033203125, -1.564453125, -1.28857421875, -1.0126953125, -0.73681640625, -0.4609375, -0.18505859375, 0.0908203125, 0.36669921875, 0.642578125, 0.91845703125, 1.1943359375, 1.47021484375, 1.74609375, 2.02197265625, 2.2978515625, 2.57373046875, 2.849609375, 3.12548828125, 3.4013671875, 3.67724609375, 3.953125, 4.22900390625, 4.5048828125, 4.78076171875, 5.056640625, 5.33251953125, 5.6083984375, 5.88427734375, 6.16015625, 6.43603515625, 6.7119140625, 6.98779296875, 7.263671875, 7.53955078125, 7.8154296875, 8.09130859375, 8.3671875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 6.0, 4.0, 4.0, 3.0, 9.0, 7.0, 15.0, 11.0, 24.0, 16.0, 25.0, 24.0, 25.0, 27.0, 32.0, 45.0, 33.0, 38.0, 33.0, 42.0, 43.0, 38.0, 42.0, 31.0, 37.0, 40.0, 29.0, 30.0, 32.0, 25.0, 27.0, 23.0, 29.0, 22.0, 17.0, 18.0, 20.0, 12.0, 14.0, 7.0, 9.0, 8.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.71875, -9.438232421875, -9.15771484375, -8.877197265625, -8.5966796875, -8.316162109375, -8.03564453125, -7.755126953125, -7.474609375, -7.194091796875, -6.91357421875, -6.633056640625, -6.3525390625, -6.072021484375, -5.79150390625, -5.510986328125, -5.23046875, -4.949951171875, -4.66943359375, -4.388916015625, -4.1083984375, -3.827880859375, -3.54736328125, -3.266845703125, -2.986328125, -2.705810546875, -2.42529296875, -2.144775390625, -1.8642578125, -1.583740234375, -1.30322265625, -1.022705078125, -0.7421875, -0.461669921875, -0.18115234375, 0.099365234375, 0.3798828125, 0.660400390625, 0.94091796875, 1.221435546875, 1.501953125, 1.782470703125, 2.06298828125, 2.343505859375, 2.6240234375, 2.904541015625, 3.18505859375, 3.465576171875, 3.74609375, 4.026611328125, 4.30712890625, 4.587646484375, 4.8681640625, 5.148681640625, 5.42919921875, 5.709716796875, 5.990234375, 6.270751953125, 6.55126953125, 6.831787109375, 7.1123046875, 7.392822265625, 7.67333984375, 7.953857421875, 8.234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 12.0, 21.0, 26.0, 52.0, 58.0, 111.0, 186.0, 268.0, 404.0, 678.0, 1112.0, 1969.0, 3129.0, 5303.0, 8832.0, 15104.0, 25813.0, 42076.0, 68583.0, 102174.0, 138942.0, 159001.0, 148712.0, 117667.0, 80353.0, 51055.0, 31179.0, 18562.0, 11075.0, 6389.0, 3845.0, 2258.0, 1357.0, 833.0, 532.0, 324.0, 219.0, 134.0, 78.0, 57.0, 26.0, 16.0, 14.0, 5.0, 6.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.44775390625, -8.1533203125, -7.85888671875, -7.564453125, -7.27001953125, -6.9755859375, -6.68115234375, -6.38671875, -6.09228515625, -5.7978515625, -5.50341796875, -5.208984375, -4.91455078125, -4.6201171875, -4.32568359375, -4.03125, -3.73681640625, -3.4423828125, -3.14794921875, -2.853515625, -2.55908203125, -2.2646484375, -1.97021484375, -1.67578125, -1.38134765625, -1.0869140625, -0.79248046875, -0.498046875, -0.20361328125, 0.0908203125, 0.38525390625, 0.6796875, 0.97412109375, 1.2685546875, 1.56298828125, 1.857421875, 2.15185546875, 2.4462890625, 2.74072265625, 3.03515625, 3.32958984375, 3.6240234375, 3.91845703125, 4.212890625, 4.50732421875, 4.8017578125, 5.09619140625, 5.390625, 5.68505859375, 5.9794921875, 6.27392578125, 6.568359375, 6.86279296875, 7.1572265625, 7.45166015625, 7.74609375, 8.04052734375, 8.3349609375, 8.62939453125, 8.923828125, 9.21826171875, 9.5126953125, 9.80712890625, 10.1015625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 8.0, 8.0, 19.0, 19.0, 16.0, 14.0, 19.0, 28.0, 32.0, 30.0, 37.0, 41.0, 27.0, 38.0, 34.0, 37.0, 57.0, 52.0, 41.0, 32.0, 39.0, 34.0, 38.0, 32.0, 38.0, 39.0, 28.0, 23.0, 17.0, 24.0, 12.0, 18.0, 15.0, 9.0, 6.0, 6.0, 11.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-7.07421875, -6.8753662109375, -6.676513671875, -6.4776611328125, -6.27880859375, -6.0799560546875, -5.881103515625, -5.6822509765625, -5.4833984375, -5.2845458984375, -5.085693359375, -4.8868408203125, -4.68798828125, -4.4891357421875, -4.290283203125, -4.0914306640625, -3.892578125, -3.6937255859375, -3.494873046875, -3.2960205078125, -3.09716796875, -2.8983154296875, -2.699462890625, -2.5006103515625, -2.3017578125, -2.1029052734375, -1.904052734375, -1.7052001953125, -1.50634765625, -1.3074951171875, -1.108642578125, -0.9097900390625, -0.7109375, -0.5120849609375, -0.313232421875, -0.1143798828125, 0.08447265625, 0.2833251953125, 0.482177734375, 0.6810302734375, 0.8798828125, 1.0787353515625, 1.277587890625, 1.4764404296875, 1.67529296875, 1.8741455078125, 2.072998046875, 2.2718505859375, 2.470703125, 2.6695556640625, 2.868408203125, 3.0672607421875, 3.26611328125, 3.4649658203125, 3.663818359375, 3.8626708984375, 4.0615234375, 4.2603759765625, 4.459228515625, 4.6580810546875, 4.85693359375, 5.0557861328125, 5.254638671875, 5.4534912109375, 5.65234375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 7.0, 20.0, 17.0, 27.0, 37.0, 45.0, 71.0, 138.0, 156.0, 234.0, 373.0, 590.0, 909.0, 1360.0, 2501.0, 4270.0, 7608.0, 14135.0, 27343.0, 57002.0, 121707.0, 225898.0, 259061.0, 165541.0, 79884.0, 37500.0, 18634.0, 9844.0, 5453.0, 3174.0, 1875.0, 1128.0, 702.0, 414.0, 295.0, 204.0, 131.0, 77.0, 59.0, 34.0, 22.0, 21.0, 17.0, 11.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.880615234375, -8.60498046875, -8.329345703125, -8.0537109375, -7.778076171875, -7.50244140625, -7.226806640625, -6.951171875, -6.675537109375, -6.39990234375, -6.124267578125, -5.8486328125, -5.572998046875, -5.29736328125, -5.021728515625, -4.74609375, -4.470458984375, -4.19482421875, -3.919189453125, -3.6435546875, -3.367919921875, -3.09228515625, -2.816650390625, -2.541015625, -2.265380859375, -1.98974609375, -1.714111328125, -1.4384765625, -1.162841796875, -0.88720703125, -0.611572265625, -0.3359375, -0.060302734375, 0.21533203125, 0.490966796875, 0.7666015625, 1.042236328125, 1.31787109375, 1.593505859375, 1.869140625, 2.144775390625, 2.42041015625, 2.696044921875, 2.9716796875, 3.247314453125, 3.52294921875, 3.798583984375, 4.07421875, 4.349853515625, 4.62548828125, 4.901123046875, 5.1767578125, 5.452392578125, 5.72802734375, 6.003662109375, 6.279296875, 6.554931640625, 6.83056640625, 7.106201171875, 7.3818359375, 7.657470703125, 7.93310546875, 8.208740234375, 8.484375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 8.0, 6.0, 14.0, 13.0, 12.0, 17.0, 29.0, 31.0, 32.0, 49.0, 68.0, 68.0, 79.0, 70.0, 69.0, 65.0, 67.0, 63.0, 53.0, 34.0, 27.0, 23.0, 19.0, 13.0, 15.0, 9.0, 10.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0009379386901855469, -0.0009131729602813721, -0.0008884072303771973, -0.0008636415004730225, -0.0008388757705688477, -0.0008141100406646729, -0.000789344310760498, -0.0007645785808563232, -0.0007398128509521484, -0.0007150471210479736, -0.0006902813911437988, -0.000665515661239624, -0.0006407499313354492, -0.0006159842014312744, -0.0005912184715270996, -0.0005664527416229248, -0.00054168701171875, -0.0005169212818145752, -0.0004921555519104004, -0.0004673898220062256, -0.0004426240921020508, -0.000417858362197876, -0.00039309263229370117, -0.00036832690238952637, -0.00034356117248535156, -0.00031879544258117676, -0.00029402971267700195, -0.00026926398277282715, -0.00024449825286865234, -0.00021973252296447754, -0.00019496679306030273, -0.00017020106315612793, -0.00014543533325195312, -0.00012066960334777832, -9.590387344360352e-05, -7.113814353942871e-05, -4.6372413635253906e-05, -2.16066837310791e-05, 3.159046173095703e-06, 2.7924776077270508e-05, 5.269050598144531e-05, 7.745623588562012e-05, 0.00010222196578979492, 0.00012698769569396973, 0.00015175342559814453, 0.00017651915550231934, 0.00020128488540649414, 0.00022605061531066895, 0.00025081634521484375, 0.00027558207511901855, 0.00030034780502319336, 0.00032511353492736816, 0.00034987926483154297, 0.0003746449947357178, 0.0003994107246398926, 0.0004241764545440674, 0.0004489421844482422, 0.000473707914352417, 0.0004984736442565918, 0.0005232393741607666, 0.0005480051040649414, 0.0005727708339691162, 0.000597536563873291, 0.0006223022937774658, 0.0006470680236816406]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 26.0, 31.0, 61.0, 75.0, 150.0, 258.0, 379.0, 699.0, 1232.0, 2080.0, 3736.0, 6542.0, 12153.0, 22525.0, 42240.0, 79699.0, 141819.0, 205604.0, 207591.0, 145187.0, 81722.0, 43383.0, 23300.0, 12351.0, 6795.0, 3671.0, 2225.0, 1228.0, 711.0, 415.0, 285.0, 134.0, 74.0, 68.0, 34.0, 17.0, 22.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4609375, -7.24163818359375, -7.0223388671875, -6.80303955078125, -6.583740234375, -6.36444091796875, -6.1451416015625, -5.92584228515625, -5.70654296875, -5.48724365234375, -5.2679443359375, -5.04864501953125, -4.829345703125, -4.61004638671875, -4.3907470703125, -4.17144775390625, -3.9521484375, -3.73284912109375, -3.5135498046875, -3.29425048828125, -3.074951171875, -2.85565185546875, -2.6363525390625, -2.41705322265625, -2.19775390625, -1.97845458984375, -1.7591552734375, -1.53985595703125, -1.320556640625, -1.10125732421875, -0.8819580078125, -0.66265869140625, -0.443359375, -0.22406005859375, -0.0047607421875, 0.21453857421875, 0.433837890625, 0.65313720703125, 0.8724365234375, 1.09173583984375, 1.31103515625, 1.53033447265625, 1.7496337890625, 1.96893310546875, 2.188232421875, 2.40753173828125, 2.6268310546875, 2.84613037109375, 3.0654296875, 3.28472900390625, 3.5040283203125, 3.72332763671875, 3.942626953125, 4.16192626953125, 4.3812255859375, 4.60052490234375, 4.81982421875, 5.03912353515625, 5.2584228515625, 5.47772216796875, 5.697021484375, 5.91632080078125, 6.1356201171875, 6.35491943359375, 6.57421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 8.0, 4.0, 10.0, 10.0, 12.0, 14.0, 12.0, 29.0, 28.0, 33.0, 52.0, 35.0, 80.0, 68.0, 74.0, 74.0, 62.0, 64.0, 65.0, 62.0, 35.0, 45.0, 31.0, 18.0, 19.0, 6.0, 15.0, 2.0, 4.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.705078125, -2.62939453125, -2.5537109375, -2.47802734375, -2.40234375, -2.32666015625, -2.2509765625, -2.17529296875, -2.099609375, -2.02392578125, -1.9482421875, -1.87255859375, -1.796875, -1.72119140625, -1.6455078125, -1.56982421875, -1.494140625, -1.41845703125, -1.3427734375, -1.26708984375, -1.19140625, -1.11572265625, -1.0400390625, -0.96435546875, -0.888671875, -0.81298828125, -0.7373046875, -0.66162109375, -0.5859375, -0.51025390625, -0.4345703125, -0.35888671875, -0.283203125, -0.20751953125, -0.1318359375, -0.05615234375, 0.01953125, 0.09521484375, 0.1708984375, 0.24658203125, 0.322265625, 0.39794921875, 0.4736328125, 0.54931640625, 0.625, 0.70068359375, 0.7763671875, 0.85205078125, 0.927734375, 1.00341796875, 1.0791015625, 1.15478515625, 1.23046875, 1.30615234375, 1.3818359375, 1.45751953125, 1.533203125, 1.60888671875, 1.6845703125, 1.76025390625, 1.8359375, 1.91162109375, 1.9873046875, 2.06298828125, 2.138671875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 6.0, 6.0, 9.0, 11.0, 16.0, 9.0, 30.0, 23.0, 33.0, 34.0, 38.0, 39.0, 50.0, 44.0, 58.0, 57.0, 48.0, 53.0, 48.0, 43.0, 47.0, 46.0, 35.0, 40.0, 46.0, 15.0, 22.0, 17.0, 15.0, 15.0, 7.0, 8.0, 11.0, 7.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.908158302307129, -11.533546447753906, -11.158933639526367, -10.784321784973145, -10.409708976745605, -10.035097122192383, -9.660484313964844, -9.285872459411621, -8.911260604858398, -8.536648750305176, -8.162035942077637, -7.787424087524414, -7.412811279296875, -7.038199424743652, -6.6635870933532715, -6.288974761962891, -5.914361953735352, -5.539749622344971, -5.16513729095459, -4.790525436401367, -4.415912628173828, -4.0413007736206055, -3.6666884422302246, -3.2920761108398438, -2.917463779449463, -2.542851448059082, -2.168239116668701, -1.7936270236968994, -1.4190146923065186, -1.0444023609161377, -0.6697902679443359, -0.2951779365539551, 0.07943439483642578, 0.45404666662216187, 0.828658938407898, 1.2032711505889893, 1.5778834819793701, 1.952495813369751, 2.3271079063415527, 2.7017202377319336, 3.0763325691223145, 3.4509449005126953, 3.825557231903076, 4.200169563293457, 4.57478141784668, 4.949394226074219, 5.324006080627441, 5.698618412017822, 6.073230743408203, 6.447843074798584, 6.822455406188965, 7.1970672607421875, 7.571680068969727, 7.946291923522949, 8.320903778076172, 8.695516586303711, 9.07012939453125, 9.444741249084473, 9.819354057312012, 10.193965911865234, 10.568578720092773, 10.943190574645996, 11.317802429199219, 11.692415237426758, 12.06702709197998]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 9.0, 8.0, 13.0, 7.0, 14.0, 12.0, 15.0, 32.0, 18.0, 19.0, 33.0, 27.0, 35.0, 40.0, 43.0, 37.0, 43.0, 37.0, 41.0, 38.0, 45.0, 41.0, 39.0, 29.0, 31.0, 44.0, 37.0, 27.0, 31.0, 31.0, 24.0, 14.0, 18.0, 18.0, 9.0, 12.0, 3.0, 3.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.542945861816406, -10.234869003295898, -9.926793098449707, -9.6187162399292, -9.310640335083008, -9.0025634765625, -8.694487571716309, -8.3864107131958, -8.07833480834961, -7.77025842666626, -7.46218204498291, -7.1541056632995605, -6.846029281616211, -6.537952423095703, -6.2298760414123535, -5.921799659729004, -5.613722801208496, -5.3056464195251465, -4.997570037841797, -4.689493656158447, -4.381417274475098, -4.07334041595459, -3.7652640342712402, -3.4571876525878906, -3.149111270904541, -2.8410348892211914, -2.532958507537842, -2.224881887435913, -1.9168055057525635, -1.6087291240692139, -1.3006526231765747, -0.9925761222839355, -0.6845006942749023, -0.37642425298690796, -0.06834781169891357, 0.2397286295890808, 0.5478050708770752, 0.8558814525604248, 1.163957953453064, 1.4720344543457031, 1.7801108360290527, 2.0881872177124023, 2.396263599395752, 2.7043402194976807, 3.0124166011810303, 3.32049298286438, 3.6285696029663086, 3.936645984649658, 4.244722366333008, 4.552798748016357, 4.860875129699707, 5.168951511383057, 5.477027893066406, 5.785104751586914, 6.093181133270264, 6.401257514953613, 6.709333896636963, 7.0174102783203125, 7.325486660003662, 7.633563041687012, 7.9416399002075195, 8.249715805053711, 8.557792663574219, 8.865869522094727, 9.173945426940918]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 11.0, 10.0, 14.0, 20.0, 39.0, 52.0, 80.0, 107.0, 155.0, 266.0, 436.0, 634.0, 1033.0, 1647.0, 2600.0, 4257.0, 7141.0, 12318.0, 21712.0, 39254.0, 75224.0, 148606.0, 312483.0, 625358.0, 957229.0, 898150.0, 541000.0, 266716.0, 130012.0, 65902.0, 35453.0, 19619.0, 11044.0, 6498.0, 3596.0, 2274.0, 1245.0, 776.0, 494.0, 310.0, 180.0, 115.0, 81.0, 56.0, 31.0, 23.0, 15.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-11.0, -10.6846923828125, -10.369384765625, -10.0540771484375, -9.73876953125, -9.4234619140625, -9.108154296875, -8.7928466796875, -8.4775390625, -8.1622314453125, -7.846923828125, -7.5316162109375, -7.21630859375, -6.9010009765625, -6.585693359375, -6.2703857421875, -5.955078125, -5.6397705078125, -5.324462890625, -5.0091552734375, -4.69384765625, -4.3785400390625, -4.063232421875, -3.7479248046875, -3.4326171875, -3.1173095703125, -2.802001953125, -2.4866943359375, -2.17138671875, -1.8560791015625, -1.540771484375, -1.2254638671875, -0.91015625, -0.5948486328125, -0.279541015625, 0.0357666015625, 0.35107421875, 0.6663818359375, 0.981689453125, 1.2969970703125, 1.6123046875, 1.9276123046875, 2.242919921875, 2.5582275390625, 2.87353515625, 3.1888427734375, 3.504150390625, 3.8194580078125, 4.134765625, 4.4500732421875, 4.765380859375, 5.0806884765625, 5.39599609375, 5.7113037109375, 6.026611328125, 6.3419189453125, 6.6572265625, 6.9725341796875, 7.287841796875, 7.6031494140625, 7.91845703125, 8.2337646484375, 8.549072265625, 8.8643798828125, 9.1796875]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 6.0, 7.0, 9.0, 9.0, 18.0, 14.0, 11.0, 14.0, 29.0, 28.0, 28.0, 36.0, 27.0, 30.0, 51.0, 39.0, 41.0, 35.0, 46.0, 33.0, 34.0, 31.0, 47.0, 35.0, 24.0, 47.0, 38.0, 39.0, 37.0, 24.0, 12.0, 18.0, 22.0, 11.0, 14.0, 14.0, 5.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-7.49609375, -7.2891845703125, -7.082275390625, -6.8753662109375, -6.66845703125, -6.4615478515625, -6.254638671875, -6.0477294921875, -5.8408203125, -5.6339111328125, -5.427001953125, -5.2200927734375, -5.01318359375, -4.8062744140625, -4.599365234375, -4.3924560546875, -4.185546875, -3.9786376953125, -3.771728515625, -3.5648193359375, -3.35791015625, -3.1510009765625, -2.944091796875, -2.7371826171875, -2.5302734375, -2.3233642578125, -2.116455078125, -1.9095458984375, -1.70263671875, -1.4957275390625, -1.288818359375, -1.0819091796875, -0.875, -0.6680908203125, -0.461181640625, -0.2542724609375, -0.04736328125, 0.1595458984375, 0.366455078125, 0.5733642578125, 0.7802734375, 0.9871826171875, 1.194091796875, 1.4010009765625, 1.60791015625, 1.8148193359375, 2.021728515625, 2.2286376953125, 2.435546875, 2.6424560546875, 2.849365234375, 3.0562744140625, 3.26318359375, 3.4700927734375, 3.677001953125, 3.8839111328125, 4.0908203125, 4.2977294921875, 4.504638671875, 4.7115478515625, 4.91845703125, 5.1253662109375, 5.332275390625, 5.5391845703125, 5.74609375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 13.0, 17.0, 27.0, 37.0, 50.0, 84.0, 115.0, 178.0, 277.0, 423.0, 681.0, 1060.0, 1630.0, 2460.0, 3817.0, 6146.0, 9833.0, 16267.0, 26855.0, 45287.0, 76466.0, 130528.0, 221630.0, 369830.0, 571713.0, 743872.0, 700965.0, 498807.0, 311026.0, 185055.0, 108320.0, 63728.0, 37812.0, 22693.0, 13421.0, 8604.0, 5257.0, 3337.0, 2054.0, 1352.0, 905.0, 614.0, 357.0, 228.0, 153.0, 108.0, 63.0, 44.0, 29.0, 24.0, 17.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-8.2890625, -8.03656005859375, -7.7840576171875, -7.53155517578125, -7.279052734375, -7.02655029296875, -6.7740478515625, -6.52154541015625, -6.26904296875, -6.01654052734375, -5.7640380859375, -5.51153564453125, -5.259033203125, -5.00653076171875, -4.7540283203125, -4.50152587890625, -4.2490234375, -3.99652099609375, -3.7440185546875, -3.49151611328125, -3.239013671875, -2.98651123046875, -2.7340087890625, -2.48150634765625, -2.22900390625, -1.97650146484375, -1.7239990234375, -1.47149658203125, -1.218994140625, -0.96649169921875, -0.7139892578125, -0.46148681640625, -0.208984375, 0.04351806640625, 0.2960205078125, 0.54852294921875, 0.801025390625, 1.05352783203125, 1.3060302734375, 1.55853271484375, 1.81103515625, 2.06353759765625, 2.3160400390625, 2.56854248046875, 2.821044921875, 3.07354736328125, 3.3260498046875, 3.57855224609375, 3.8310546875, 4.08355712890625, 4.3360595703125, 4.58856201171875, 4.841064453125, 5.09356689453125, 5.3460693359375, 5.59857177734375, 5.85107421875, 6.10357666015625, 6.3560791015625, 6.60858154296875, 6.861083984375, 7.11358642578125, 7.3660888671875, 7.61859130859375, 7.87109375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 6.0, 8.0, 7.0, 11.0, 14.0, 23.0, 34.0, 48.0, 43.0, 51.0, 93.0, 119.0, 136.0, 155.0, 192.0, 232.0, 262.0, 285.0, 315.0, 288.0, 245.0, 247.0, 226.0, 206.0, 154.0, 147.0, 108.0, 86.0, 81.0, 63.0, 52.0, 30.0, 31.0, 16.0, 13.0, 19.0, 6.0, 6.0, 7.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.1524658203125, -3.039306640625, -2.9261474609375, -2.81298828125, -2.6998291015625, -2.586669921875, -2.4735107421875, -2.3603515625, -2.2471923828125, -2.134033203125, -2.0208740234375, -1.90771484375, -1.7945556640625, -1.681396484375, -1.5682373046875, -1.455078125, -1.3419189453125, -1.228759765625, -1.1156005859375, -1.00244140625, -0.8892822265625, -0.776123046875, -0.6629638671875, -0.5498046875, -0.4366455078125, -0.323486328125, -0.2103271484375, -0.09716796875, 0.0159912109375, 0.129150390625, 0.2423095703125, 0.35546875, 0.4686279296875, 0.581787109375, 0.6949462890625, 0.80810546875, 0.9212646484375, 1.034423828125, 1.1475830078125, 1.2607421875, 1.3739013671875, 1.487060546875, 1.6002197265625, 1.71337890625, 1.8265380859375, 1.939697265625, 2.0528564453125, 2.166015625, 2.2791748046875, 2.392333984375, 2.5054931640625, 2.61865234375, 2.7318115234375, 2.844970703125, 2.9581298828125, 3.0712890625, 3.1844482421875, 3.297607421875, 3.4107666015625, 3.52392578125, 3.6370849609375, 3.750244140625, 3.8634033203125, 3.9765625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 10.0, 6.0, 14.0, 16.0, 9.0, 12.0, 21.0, 27.0, 22.0, 41.0, 36.0, 34.0, 45.0, 53.0, 50.0, 53.0, 46.0, 58.0, 50.0, 50.0, 55.0, 35.0, 36.0, 38.0, 24.0, 32.0, 16.0, 22.0, 25.0, 9.0, 9.0, 9.0, 11.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.457452774047852, -8.151654243469238, -7.845856189727783, -7.540058135986328, -7.234259605407715, -6.92846155166626, -6.622663497924805, -6.316864967346191, -6.011066913604736, -5.705268859863281, -5.399470329284668, -5.093672275543213, -4.787874221801758, -4.4820756912231445, -4.1762776374816895, -3.8704793453216553, -3.564681053161621, -3.258882761001587, -2.9530844688415527, -2.6472864151000977, -2.3414881229400635, -2.0356898307800293, -1.7298916578292847, -1.42409348487854, -1.1182951927185059, -0.8124969601631165, -0.506698727607727, -0.20090049505233765, 0.10489773750305176, 0.41069602966308594, 0.7164942026138306, 1.0222923755645752, 1.3280916213989258, 1.63388991355896, 1.9396880865097046, 2.245486259460449, 2.5512845516204834, 2.8570828437805176, 3.1628808975219727, 3.468679189682007, 3.774477481842041, 4.080275535583496, 4.386074066162109, 4.6918721199035645, 4.9976701736450195, 5.303468704223633, 5.609266757965088, 5.915064811706543, 6.220863342285156, 6.526661396026611, 6.832459926605225, 7.13825798034668, 7.444056510925293, 7.749854564666748, 8.055652618408203, 8.361451148986816, 8.66724967956543, 8.973048210144043, 9.27884578704834, 9.584644317626953, 9.890442848205566, 10.19624137878418, 10.502038955688477, 10.80783748626709, 11.113635063171387]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 4.0, 5.0, 6.0, 17.0, 16.0, 19.0, 16.0, 21.0, 27.0, 39.0, 28.0, 33.0, 42.0, 40.0, 43.0, 45.0, 42.0, 47.0, 44.0, 38.0, 35.0, 48.0, 52.0, 33.0, 31.0, 39.0, 26.0, 30.0, 16.0, 22.0, 27.0, 14.0, 6.0, 9.0, 8.0, 6.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.835714340209961, -8.575971603393555, -8.316227912902832, -8.056485176086426, -7.7967424392700195, -7.536999225616455, -7.277256011962891, -7.017513275146484, -6.75777006149292, -6.4980268478393555, -6.238284111022949, -5.978540897369385, -5.71879768371582, -5.459054946899414, -5.19931173324585, -4.939568519592285, -4.679825782775879, -4.4200825691223145, -4.160339832305908, -3.9005966186523438, -3.6408536434173584, -3.381110668182373, -3.1213674545288086, -2.8616244792938232, -2.601881504058838, -2.3421385288238525, -2.082395553588867, -1.8226523399353027, -1.5629093647003174, -1.303166389465332, -1.0434232950210571, -0.7836802005767822, -0.5239377021789551, -0.26419466733932495, -0.004451632499694824, 0.2552914023399353, 0.5150344371795654, 0.7747774124145508, 1.0345205068588257, 1.2942636013031006, 1.554006576538086, 1.8137495517730713, 2.0734925270080566, 2.333235740661621, 2.5929787158966064, 2.852721691131592, 3.1124649047851562, 3.3722078800201416, 3.631950855255127, 3.8916938304901123, 4.151436805725098, 4.411180019378662, 4.670923233032227, 4.930665969848633, 5.190409183502197, 5.450152397155762, 5.709895133972168, 5.969638347625732, 6.229381084442139, 6.489124298095703, 6.748867034912109, 7.008610248565674, 7.268353462219238, 7.5280961990356445, 7.787839412689209]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 6.0, 9.0, 15.0, 17.0, 35.0, 47.0, 65.0, 104.0, 136.0, 175.0, 263.0, 359.0, 556.0, 856.0, 1196.0, 1871.0, 2950.0, 4450.0, 7020.0, 11354.0, 18270.0, 30919.0, 52407.0, 89371.0, 142906.0, 188940.0, 178475.0, 125435.0, 76238.0, 44589.0, 26520.0, 15865.0, 9553.0, 6074.0, 3892.0, 2469.0, 1622.0, 1116.0, 760.0, 551.0, 333.0, 206.0, 185.0, 121.0, 74.0, 47.0, 35.0, 24.0, 28.0, 15.0, 11.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0], "bins": [-9.859375, -9.5592041015625, -9.259033203125, -8.9588623046875, -8.65869140625, -8.3585205078125, -8.058349609375, -7.7581787109375, -7.4580078125, -7.1578369140625, -6.857666015625, -6.5574951171875, -6.25732421875, -5.9571533203125, -5.656982421875, -5.3568115234375, -5.056640625, -4.7564697265625, -4.456298828125, -4.1561279296875, -3.85595703125, -3.5557861328125, -3.255615234375, -2.9554443359375, -2.6552734375, -2.3551025390625, -2.054931640625, -1.7547607421875, -1.45458984375, -1.1544189453125, -0.854248046875, -0.5540771484375, -0.25390625, 0.0462646484375, 0.346435546875, 0.6466064453125, 0.94677734375, 1.2469482421875, 1.547119140625, 1.8472900390625, 2.1474609375, 2.4476318359375, 2.747802734375, 3.0479736328125, 3.34814453125, 3.6483154296875, 3.948486328125, 4.2486572265625, 4.548828125, 4.8489990234375, 5.149169921875, 5.4493408203125, 5.74951171875, 6.0496826171875, 6.349853515625, 6.6500244140625, 6.9501953125, 7.2503662109375, 7.550537109375, 7.8507080078125, 8.15087890625, 8.4510498046875, 8.751220703125, 9.0513916015625, 9.3515625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 6.0, 9.0, 10.0, 3.0, 10.0, 15.0, 16.0, 17.0, 25.0, 28.0, 30.0, 29.0, 31.0, 27.0, 39.0, 46.0, 46.0, 45.0, 38.0, 44.0, 40.0, 35.0, 28.0, 51.0, 46.0, 35.0, 41.0, 26.0, 26.0, 24.0, 33.0, 16.0, 12.0, 17.0, 11.0, 6.0, 12.0, 7.0, 9.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.703125, -8.4530029296875, -8.202880859375, -7.9527587890625, -7.70263671875, -7.4525146484375, -7.202392578125, -6.9522705078125, -6.7021484375, -6.4520263671875, -6.201904296875, -5.9517822265625, -5.70166015625, -5.4515380859375, -5.201416015625, -4.9512939453125, -4.701171875, -4.4510498046875, -4.200927734375, -3.9508056640625, -3.70068359375, -3.4505615234375, -3.200439453125, -2.9503173828125, -2.7001953125, -2.4500732421875, -2.199951171875, -1.9498291015625, -1.69970703125, -1.4495849609375, -1.199462890625, -0.9493408203125, -0.69921875, -0.4490966796875, -0.198974609375, 0.0511474609375, 0.30126953125, 0.5513916015625, 0.801513671875, 1.0516357421875, 1.3017578125, 1.5518798828125, 1.802001953125, 2.0521240234375, 2.30224609375, 2.5523681640625, 2.802490234375, 3.0526123046875, 3.302734375, 3.5528564453125, 3.802978515625, 4.0531005859375, 4.30322265625, 4.5533447265625, 4.803466796875, 5.0535888671875, 5.3037109375, 5.5538330078125, 5.803955078125, 6.0540771484375, 6.30419921875, 6.5543212890625, 6.804443359375, 7.0545654296875, 7.3046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 7.0, 10.0, 19.0, 13.0, 36.0, 46.0, 54.0, 83.0, 117.0, 152.0, 216.0, 341.0, 445.0, 647.0, 982.0, 1554.0, 2463.0, 4107.0, 7201.0, 13918.0, 30807.0, 79507.0, 233532.0, 384624.0, 174930.0, 60673.0, 24441.0, 11559.0, 6148.0, 3579.0, 2161.0, 1347.0, 885.0, 579.0, 412.0, 271.0, 194.0, 145.0, 111.0, 66.0, 50.0, 31.0, 26.0, 18.0, 8.0, 9.0, 5.0, 7.0, 6.0, 0.0, 3.0, 3.0, 0.0, 2.0], "bins": [-22.5625, -21.88623046875, -21.2099609375, -20.53369140625, -19.857421875, -19.18115234375, -18.5048828125, -17.82861328125, -17.15234375, -16.47607421875, -15.7998046875, -15.12353515625, -14.447265625, -13.77099609375, -13.0947265625, -12.41845703125, -11.7421875, -11.06591796875, -10.3896484375, -9.71337890625, -9.037109375, -8.36083984375, -7.6845703125, -7.00830078125, -6.33203125, -5.65576171875, -4.9794921875, -4.30322265625, -3.626953125, -2.95068359375, -2.2744140625, -1.59814453125, -0.921875, -0.24560546875, 0.4306640625, 1.10693359375, 1.783203125, 2.45947265625, 3.1357421875, 3.81201171875, 4.48828125, 5.16455078125, 5.8408203125, 6.51708984375, 7.193359375, 7.86962890625, 8.5458984375, 9.22216796875, 9.8984375, 10.57470703125, 11.2509765625, 11.92724609375, 12.603515625, 13.27978515625, 13.9560546875, 14.63232421875, 15.30859375, 15.98486328125, 16.6611328125, 17.33740234375, 18.013671875, 18.68994140625, 19.3662109375, 20.04248046875, 20.71875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 4.0, 8.0, 4.0, 5.0, 10.0, 11.0, 14.0, 8.0, 8.0, 13.0, 25.0, 22.0, 22.0, 29.0, 20.0, 35.0, 34.0, 37.0, 35.0, 36.0, 29.0, 41.0, 46.0, 44.0, 40.0, 39.0, 44.0, 31.0, 39.0, 33.0, 25.0, 28.0, 31.0, 24.0, 12.0, 31.0, 21.0, 12.0, 13.0, 7.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.42578125, -4.28167724609375, -4.1375732421875, -3.99346923828125, -3.849365234375, -3.70526123046875, -3.5611572265625, -3.41705322265625, -3.27294921875, -3.12884521484375, -2.9847412109375, -2.84063720703125, -2.696533203125, -2.55242919921875, -2.4083251953125, -2.26422119140625, -2.1201171875, -1.97601318359375, -1.8319091796875, -1.68780517578125, -1.543701171875, -1.39959716796875, -1.2554931640625, -1.11138916015625, -0.96728515625, -0.82318115234375, -0.6790771484375, -0.53497314453125, -0.390869140625, -0.24676513671875, -0.1026611328125, 0.04144287109375, 0.185546875, 0.32965087890625, 0.4737548828125, 0.61785888671875, 0.761962890625, 0.90606689453125, 1.0501708984375, 1.19427490234375, 1.33837890625, 1.48248291015625, 1.6265869140625, 1.77069091796875, 1.914794921875, 2.05889892578125, 2.2030029296875, 2.34710693359375, 2.4912109375, 2.63531494140625, 2.7794189453125, 2.92352294921875, 3.067626953125, 3.21173095703125, 3.3558349609375, 3.49993896484375, 3.64404296875, 3.78814697265625, 3.9322509765625, 4.07635498046875, 4.220458984375, 4.36456298828125, 4.5086669921875, 4.65277099609375, 4.796875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 1.0, 1.0, 8.0, 10.0, 11.0, 9.0, 18.0, 20.0, 34.0, 34.0, 59.0, 65.0, 109.0, 165.0, 207.0, 380.0, 502.0, 765.0, 1251.0, 1998.0, 3303.0, 5551.0, 9671.0, 17433.0, 33012.0, 65791.0, 132513.0, 237549.0, 245900.0, 141436.0, 71050.0, 35715.0, 18537.0, 10165.0, 5771.0, 3554.0, 2162.0, 1314.0, 846.0, 549.0, 328.0, 225.0, 149.0, 93.0, 94.0, 56.0, 35.0, 37.0, 20.0, 18.0, 11.0, 4.0, 8.0, 2.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.44921875, -6.24151611328125, -6.0338134765625, -5.82611083984375, -5.618408203125, -5.41070556640625, -5.2030029296875, -4.99530029296875, -4.78759765625, -4.57989501953125, -4.3721923828125, -4.16448974609375, -3.956787109375, -3.74908447265625, -3.5413818359375, -3.33367919921875, -3.1259765625, -2.91827392578125, -2.7105712890625, -2.50286865234375, -2.295166015625, -2.08746337890625, -1.8797607421875, -1.67205810546875, -1.46435546875, -1.25665283203125, -1.0489501953125, -0.84124755859375, -0.633544921875, -0.42584228515625, -0.2181396484375, -0.01043701171875, 0.197265625, 0.40496826171875, 0.6126708984375, 0.82037353515625, 1.028076171875, 1.23577880859375, 1.4434814453125, 1.65118408203125, 1.85888671875, 2.06658935546875, 2.2742919921875, 2.48199462890625, 2.689697265625, 2.89739990234375, 3.1051025390625, 3.31280517578125, 3.5205078125, 3.72821044921875, 3.9359130859375, 4.14361572265625, 4.351318359375, 4.55902099609375, 4.7667236328125, 4.97442626953125, 5.18212890625, 5.38983154296875, 5.5975341796875, 5.80523681640625, 6.012939453125, 6.22064208984375, 6.4283447265625, 6.63604736328125, 6.84375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 8.0, 4.0, 8.0, 8.0, 13.0, 14.0, 18.0, 23.0, 26.0, 35.0, 42.0, 57.0, 63.0, 81.0, 78.0, 77.0, 56.0, 64.0, 58.0, 59.0, 37.0, 18.0, 24.0, 30.0, 24.0, 11.0, 4.0, 10.0, 7.0, 7.0, 4.0, 1.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.0003516674041748047, -0.0003422833979129791, -0.00033289939165115356, -0.000323515385389328, -0.00031413137912750244, -0.0003047473728656769, -0.0002953633666038513, -0.00028597936034202576, -0.0002765953540802002, -0.00026721134781837463, -0.00025782734155654907, -0.0002484433352947235, -0.00023905932903289795, -0.0002296753227710724, -0.00022029131650924683, -0.00021090731024742126, -0.0002015233039855957, -0.00019213929772377014, -0.00018275529146194458, -0.00017337128520011902, -0.00016398727893829346, -0.0001546032726764679, -0.00014521926641464233, -0.00013583526015281677, -0.0001264512538909912, -0.00011706724762916565, -0.00010768324136734009, -9.829923510551453e-05, -8.891522884368896e-05, -7.95312225818634e-05, -7.014721632003784e-05, -6.076321005821228e-05, -5.137920379638672e-05, -4.199519753456116e-05, -3.2611191272735596e-05, -2.3227185010910034e-05, -1.3843178749084473e-05, -4.459172487258911e-06, 4.92483377456665e-06, 1.4308840036392212e-05, 2.3692846298217773e-05, 3.3076852560043335e-05, 4.2460858821868896e-05, 5.184486508369446e-05, 6.122887134552002e-05, 7.061287760734558e-05, 7.999688386917114e-05, 8.93808901309967e-05, 9.876489639282227e-05, 0.00010814890265464783, 0.00011753290891647339, 0.00012691691517829895, 0.0001363009214401245, 0.00014568492770195007, 0.00015506893396377563, 0.0001644529402256012, 0.00017383694648742676, 0.00018322095274925232, 0.00019260495901107788, 0.00020198896527290344, 0.000211372971534729, 0.00022075697779655457, 0.00023014098405838013, 0.0002395249903202057, 0.00024890899658203125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 9.0, 12.0, 19.0, 21.0, 32.0, 42.0, 70.0, 101.0, 182.0, 278.0, 406.0, 683.0, 1079.0, 1686.0, 2721.0, 4462.0, 6977.0, 11382.0, 18356.0, 29858.0, 47993.0, 75527.0, 113762.0, 151221.0, 165016.0, 140515.0, 100970.0, 66131.0, 41566.0, 25449.0, 15920.0, 9996.0, 6075.0, 3602.0, 2405.0, 1458.0, 927.0, 585.0, 364.0, 259.0, 159.0, 93.0, 59.0, 45.0, 30.0, 21.0, 16.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-4.578125, -4.43658447265625, -4.2950439453125, -4.15350341796875, -4.011962890625, -3.87042236328125, -3.7288818359375, -3.58734130859375, -3.44580078125, -3.30426025390625, -3.1627197265625, -3.02117919921875, -2.879638671875, -2.73809814453125, -2.5965576171875, -2.45501708984375, -2.3134765625, -2.17193603515625, -2.0303955078125, -1.88885498046875, -1.747314453125, -1.60577392578125, -1.4642333984375, -1.32269287109375, -1.18115234375, -1.03961181640625, -0.8980712890625, -0.75653076171875, -0.614990234375, -0.47344970703125, -0.3319091796875, -0.19036865234375, -0.048828125, 0.09271240234375, 0.2342529296875, 0.37579345703125, 0.517333984375, 0.65887451171875, 0.8004150390625, 0.94195556640625, 1.08349609375, 1.22503662109375, 1.3665771484375, 1.50811767578125, 1.649658203125, 1.79119873046875, 1.9327392578125, 2.07427978515625, 2.2158203125, 2.35736083984375, 2.4989013671875, 2.64044189453125, 2.781982421875, 2.92352294921875, 3.0650634765625, 3.20660400390625, 3.34814453125, 3.48968505859375, 3.6312255859375, 3.77276611328125, 3.914306640625, 4.05584716796875, 4.1973876953125, 4.33892822265625, 4.48046875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 6.0, 5.0, 9.0, 13.0, 8.0, 18.0, 26.0, 24.0, 24.0, 28.0, 41.0, 37.0, 58.0, 39.0, 57.0, 75.0, 70.0, 58.0, 61.0, 48.0, 72.0, 41.0, 33.0, 26.0, 16.0, 28.0, 15.0, 17.0, 9.0, 8.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.11328125, -2.0491790771484375, -1.985076904296875, -1.9209747314453125, -1.85687255859375, -1.7927703857421875, -1.728668212890625, -1.6645660400390625, -1.6004638671875, -1.5363616943359375, -1.472259521484375, -1.4081573486328125, -1.34405517578125, -1.2799530029296875, -1.215850830078125, -1.1517486572265625, -1.087646484375, -1.0235443115234375, -0.959442138671875, -0.8953399658203125, -0.83123779296875, -0.7671356201171875, -0.703033447265625, -0.6389312744140625, -0.5748291015625, -0.5107269287109375, -0.446624755859375, -0.3825225830078125, -0.31842041015625, -0.2543182373046875, -0.190216064453125, -0.1261138916015625, -0.06201171875, 0.0020904541015625, 0.066192626953125, 0.1302947998046875, 0.19439697265625, 0.2584991455078125, 0.322601318359375, 0.3867034912109375, 0.4508056640625, 0.5149078369140625, 0.579010009765625, 0.6431121826171875, 0.70721435546875, 0.7713165283203125, 0.835418701171875, 0.8995208740234375, 0.963623046875, 1.0277252197265625, 1.091827392578125, 1.1559295654296875, 1.22003173828125, 1.2841339111328125, 1.348236083984375, 1.4123382568359375, 1.4764404296875, 1.5405426025390625, 1.604644775390625, 1.6687469482421875, 1.73284912109375, 1.7969512939453125, 1.861053466796875, 1.9251556396484375, 1.9892578125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 16.0, 5.0, 22.0, 14.0, 22.0, 17.0, 17.0, 33.0, 34.0, 35.0, 46.0, 52.0, 49.0, 59.0, 63.0, 65.0, 59.0, 44.0, 47.0, 36.0, 35.0, 30.0, 32.0, 23.0, 21.0, 24.0, 7.0, 17.0, 19.0, 7.0, 9.0, 5.0, 0.0, 6.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.889204978942871, -8.589778900146484, -8.290352821350098, -7.990926742553711, -7.691500663757324, -7.3920745849609375, -7.092648506164551, -6.793222427368164, -6.493796348571777, -6.194370269775391, -5.894944190979004, -5.595518112182617, -5.2960920333862305, -4.996665954589844, -4.697239875793457, -4.39781379699707, -4.098387718200684, -3.798961639404297, -3.49953556060791, -3.2001094818115234, -2.9006834030151367, -2.60125732421875, -2.3018312454223633, -2.0024051666259766, -1.7029790878295898, -1.4035530090332031, -1.1041269302368164, -0.8047008514404297, -0.505274772644043, -0.20584869384765625, 0.09357738494873047, 0.3930034637451172, 0.6924304962158203, 0.991856575012207, 1.2912826538085938, 1.5907087326049805, 1.8901348114013672, 2.189560890197754, 2.4889869689941406, 2.7884130477905273, 3.087839126586914, 3.387265205383301, 3.6866912841796875, 3.986117362976074, 4.285543441772461, 4.584969520568848, 4.884395599365234, 5.183821678161621, 5.483247756958008, 5.7826738357543945, 6.082099914550781, 6.381525993347168, 6.680952072143555, 6.980378150939941, 7.279804229736328, 7.579230308532715, 7.878656387329102, 8.178082466125488, 8.477508544921875, 8.776934623718262, 9.076360702514648, 9.375786781311035, 9.675212860107422, 9.974638938903809, 10.274065017700195]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 8.0, 0.0, 4.0, 10.0, 8.0, 8.0, 7.0, 16.0, 18.0, 16.0, 26.0, 16.0, 31.0, 26.0, 37.0, 44.0, 41.0, 44.0, 39.0, 44.0, 37.0, 50.0, 40.0, 48.0, 35.0, 39.0, 43.0, 36.0, 29.0, 36.0, 21.0, 21.0, 30.0, 20.0, 18.0, 16.0, 10.0, 8.0, 5.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.668281555175781, -8.42397689819336, -8.179671287536621, -7.935366153717041, -7.691061019897461, -7.446756362915039, -7.202450752258301, -6.958146095275879, -6.713840961456299, -6.469535827636719, -6.225230693817139, -5.980925559997559, -5.7366204261779785, -5.492315292358398, -5.248010635375977, -5.0037055015563965, -4.759400367736816, -4.515095233917236, -4.270790100097656, -4.026484966278076, -3.782180070877075, -3.537874937057495, -3.293569803237915, -3.049264907836914, -2.804959297180176, -2.5606541633605957, -2.3163490295410156, -2.0720438957214355, -1.8277390003204346, -1.5834338665008545, -1.3391287326812744, -1.0948237180709839, -0.8505187034606934, -0.6062136292457581, -0.36190852522850037, -0.11760342121124268, 0.12670165300369263, 0.37100672721862793, 0.615311861038208, 0.8596168756484985, 1.1039220094680786, 1.3482271432876587, 1.5925321578979492, 1.8368372917175293, 2.0811424255371094, 2.3254475593566895, 2.5697526931762695, 2.8140575885772705, 3.0583627223968506, 3.3026678562164307, 3.5469729900360107, 3.7912778854370117, 4.035583019256592, 4.279888153076172, 4.524193286895752, 4.768498420715332, 5.012803554534912, 5.257108688354492, 5.501413822174072, 5.745718955993652, 5.990024089813232, 6.2343292236328125, 6.478633880615234, 6.7229390144348145, 6.9672441482543945]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 36.0, 56.0, 64.0, 101.0, 163.0, 262.0, 414.0, 649.0, 965.0, 1583.0, 2530.0, 4125.0, 6536.0, 10390.0, 16963.0, 26827.0, 42168.0, 62632.0, 89097.0, 116241.0, 135075.0, 135068.0, 118535.0, 92305.0, 65640.0, 43770.0, 28471.0, 18025.0, 11403.0, 6823.0, 4275.0, 2696.0, 1703.0, 1097.0, 665.0, 429.0, 270.0, 145.0, 116.0, 77.0, 47.0, 32.0, 21.0, 11.0, 7.0, 9.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.63873291015625, -6.4102783203125, -6.18182373046875, -5.953369140625, -5.72491455078125, -5.4964599609375, -5.26800537109375, -5.03955078125, -4.81109619140625, -4.5826416015625, -4.35418701171875, -4.125732421875, -3.89727783203125, -3.6688232421875, -3.44036865234375, -3.2119140625, -2.98345947265625, -2.7550048828125, -2.52655029296875, -2.298095703125, -2.06964111328125, -1.8411865234375, -1.61273193359375, -1.38427734375, -1.15582275390625, -0.9273681640625, -0.69891357421875, -0.470458984375, -0.24200439453125, -0.0135498046875, 0.21490478515625, 0.443359375, 0.67181396484375, 0.9002685546875, 1.12872314453125, 1.357177734375, 1.58563232421875, 1.8140869140625, 2.04254150390625, 2.27099609375, 2.49945068359375, 2.7279052734375, 2.95635986328125, 3.184814453125, 3.41326904296875, 3.6417236328125, 3.87017822265625, 4.0986328125, 4.32708740234375, 4.5555419921875, 4.78399658203125, 5.012451171875, 5.24090576171875, 5.4693603515625, 5.69781494140625, 5.92626953125, 6.15472412109375, 6.3831787109375, 6.61163330078125, 6.840087890625, 7.06854248046875, 7.2969970703125, 7.52545166015625, 7.75390625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 9.0, 6.0, 5.0, 10.0, 11.0, 11.0, 14.0, 13.0, 20.0, 25.0, 18.0, 32.0, 30.0, 30.0, 37.0, 42.0, 34.0, 46.0, 43.0, 44.0, 31.0, 36.0, 39.0, 46.0, 41.0, 28.0, 38.0, 37.0, 34.0, 32.0, 24.0, 27.0, 15.0, 16.0, 18.0, 18.0, 9.0, 8.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0], "bins": [-8.5234375, -8.291259765625, -8.05908203125, -7.826904296875, -7.5947265625, -7.362548828125, -7.13037109375, -6.898193359375, -6.666015625, -6.433837890625, -6.20166015625, -5.969482421875, -5.7373046875, -5.505126953125, -5.27294921875, -5.040771484375, -4.80859375, -4.576416015625, -4.34423828125, -4.112060546875, -3.8798828125, -3.647705078125, -3.41552734375, -3.183349609375, -2.951171875, -2.718994140625, -2.48681640625, -2.254638671875, -2.0224609375, -1.790283203125, -1.55810546875, -1.325927734375, -1.09375, -0.861572265625, -0.62939453125, -0.397216796875, -0.1650390625, 0.067138671875, 0.29931640625, 0.531494140625, 0.763671875, 0.995849609375, 1.22802734375, 1.460205078125, 1.6923828125, 1.924560546875, 2.15673828125, 2.388916015625, 2.62109375, 2.853271484375, 3.08544921875, 3.317626953125, 3.5498046875, 3.781982421875, 4.01416015625, 4.246337890625, 4.478515625, 4.710693359375, 4.94287109375, 5.175048828125, 5.4072265625, 5.639404296875, 5.87158203125, 6.103759765625, 6.3359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 13.0, 11.0, 31.0, 46.0, 76.0, 96.0, 143.0, 258.0, 363.0, 537.0, 888.0, 1351.0, 2044.0, 3236.0, 4952.0, 7789.0, 12119.0, 18802.0, 28281.0, 41852.0, 58742.0, 80644.0, 101811.0, 117892.0, 123052.0, 114030.0, 95674.0, 73538.0, 53164.0, 36824.0, 24572.0, 16306.0, 10503.0, 6741.0, 4286.0, 2722.0, 1842.0, 1132.0, 802.0, 455.0, 311.0, 205.0, 124.0, 101.0, 68.0, 42.0, 31.0, 17.0, 14.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.41314697265625, -5.2286376953125, -5.04412841796875, -4.859619140625, -4.67510986328125, -4.4906005859375, -4.30609130859375, -4.12158203125, -3.93707275390625, -3.7525634765625, -3.56805419921875, -3.383544921875, -3.19903564453125, -3.0145263671875, -2.83001708984375, -2.6455078125, -2.46099853515625, -2.2764892578125, -2.09197998046875, -1.907470703125, -1.72296142578125, -1.5384521484375, -1.35394287109375, -1.16943359375, -0.98492431640625, -0.8004150390625, -0.61590576171875, -0.431396484375, -0.24688720703125, -0.0623779296875, 0.12213134765625, 0.306640625, 0.49114990234375, 0.6756591796875, 0.86016845703125, 1.044677734375, 1.22918701171875, 1.4136962890625, 1.59820556640625, 1.78271484375, 1.96722412109375, 2.1517333984375, 2.33624267578125, 2.520751953125, 2.70526123046875, 2.8897705078125, 3.07427978515625, 3.2587890625, 3.44329833984375, 3.6278076171875, 3.81231689453125, 3.996826171875, 4.18133544921875, 4.3658447265625, 4.55035400390625, 4.73486328125, 4.91937255859375, 5.1038818359375, 5.28839111328125, 5.472900390625, 5.65740966796875, 5.8419189453125, 6.02642822265625, 6.2109375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 9.0, 5.0, 9.0, 8.0, 14.0, 15.0, 14.0, 17.0, 17.0, 19.0, 23.0, 31.0, 30.0, 30.0, 29.0, 25.0, 41.0, 35.0, 38.0, 34.0, 28.0, 40.0, 39.0, 46.0, 38.0, 21.0, 42.0, 35.0, 32.0, 25.0, 28.0, 19.0, 22.0, 23.0, 11.0, 21.0, 18.0, 14.0, 12.0, 6.0, 8.0, 6.0, 10.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.57421875, -4.43548583984375, -4.2967529296875, -4.15802001953125, -4.019287109375, -3.88055419921875, -3.7418212890625, -3.60308837890625, -3.46435546875, -3.32562255859375, -3.1868896484375, -3.04815673828125, -2.909423828125, -2.77069091796875, -2.6319580078125, -2.49322509765625, -2.3544921875, -2.21575927734375, -2.0770263671875, -1.93829345703125, -1.799560546875, -1.66082763671875, -1.5220947265625, -1.38336181640625, -1.24462890625, -1.10589599609375, -0.9671630859375, -0.82843017578125, -0.689697265625, -0.55096435546875, -0.4122314453125, -0.27349853515625, -0.134765625, 0.00396728515625, 0.1427001953125, 0.28143310546875, 0.420166015625, 0.55889892578125, 0.6976318359375, 0.83636474609375, 0.97509765625, 1.11383056640625, 1.2525634765625, 1.39129638671875, 1.530029296875, 1.66876220703125, 1.8074951171875, 1.94622802734375, 2.0849609375, 2.22369384765625, 2.3624267578125, 2.50115966796875, 2.639892578125, 2.77862548828125, 2.9173583984375, 3.05609130859375, 3.19482421875, 3.33355712890625, 3.4722900390625, 3.61102294921875, 3.749755859375, 3.88848876953125, 4.0272216796875, 4.16595458984375, 4.3046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 9.0, 20.0, 22.0, 32.0, 47.0, 80.0, 104.0, 152.0, 227.0, 332.0, 531.0, 863.0, 1339.0, 2326.0, 3933.0, 6799.0, 12679.0, 23401.0, 43207.0, 79074.0, 133019.0, 189633.0, 198024.0, 149508.0, 90853.0, 50519.0, 27390.0, 14877.0, 8203.0, 4600.0, 2472.0, 1598.0, 960.0, 576.0, 371.0, 255.0, 173.0, 123.0, 74.0, 51.0, 29.0, 25.0, 13.0, 8.0, 6.0, 7.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.13671875, -5.9395751953125, -5.742431640625, -5.5452880859375, -5.34814453125, -5.1510009765625, -4.953857421875, -4.7567138671875, -4.5595703125, -4.3624267578125, -4.165283203125, -3.9681396484375, -3.77099609375, -3.5738525390625, -3.376708984375, -3.1795654296875, -2.982421875, -2.7852783203125, -2.588134765625, -2.3909912109375, -2.19384765625, -1.9967041015625, -1.799560546875, -1.6024169921875, -1.4052734375, -1.2081298828125, -1.010986328125, -0.8138427734375, -0.61669921875, -0.4195556640625, -0.222412109375, -0.0252685546875, 0.171875, 0.3690185546875, 0.566162109375, 0.7633056640625, 0.96044921875, 1.1575927734375, 1.354736328125, 1.5518798828125, 1.7490234375, 1.9461669921875, 2.143310546875, 2.3404541015625, 2.53759765625, 2.7347412109375, 2.931884765625, 3.1290283203125, 3.326171875, 3.5233154296875, 3.720458984375, 3.9176025390625, 4.11474609375, 4.3118896484375, 4.509033203125, 4.7061767578125, 4.9033203125, 5.1004638671875, 5.297607421875, 5.4947509765625, 5.69189453125, 5.8890380859375, 6.086181640625, 6.2833251953125, 6.48046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 8.0, 14.0, 14.0, 19.0, 18.0, 22.0, 35.0, 43.0, 59.0, 80.0, 123.0, 88.0, 102.0, 83.0, 78.0, 62.0, 44.0, 29.0, 18.0, 18.0, 10.0, 8.0, 10.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005640983581542969, -0.0005357041954994202, -0.0005073100328445435, -0.00047891587018966675, -0.00045052170753479004, -0.00042212754487991333, -0.0003937333822250366, -0.0003653392195701599, -0.0003369450569152832, -0.0003085508942604065, -0.0002801567316055298, -0.0002517625689506531, -0.00022336840629577637, -0.00019497424364089966, -0.00016658008098602295, -0.00013818591833114624, -0.00010979175567626953, -8.139759302139282e-05, -5.300343036651611e-05, -2.4609267711639404e-05, 3.7848949432373047e-06, 3.2179057598114014e-05, 6.057322025299072e-05, 8.896738290786743e-05, 0.00011736154556274414, 0.00014575570821762085, 0.00017414987087249756, 0.00020254403352737427, 0.00023093819618225098, 0.0002593323588371277, 0.0002877265214920044, 0.0003161206841468811, 0.0003445148468017578, 0.0003729090094566345, 0.00040130317211151123, 0.00042969733476638794, 0.00045809149742126465, 0.00048648566007614136, 0.0005148798227310181, 0.0005432739853858948, 0.0005716681480407715, 0.0006000623106956482, 0.0006284564733505249, 0.0006568506360054016, 0.0006852447986602783, 0.000713638961315155, 0.0007420331239700317, 0.0007704272866249084, 0.0007988214492797852, 0.0008272156119346619, 0.0008556097745895386, 0.0008840039372444153, 0.000912398099899292, 0.0009407922625541687, 0.0009691864252090454, 0.0009975805878639221, 0.0010259747505187988, 0.0010543689131736755, 0.0010827630758285522, 0.001111157238483429, 0.0011395514011383057, 0.0011679455637931824, 0.001196339726448059, 0.0012247338891029358, 0.0012531280517578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 10.0, 29.0, 28.0, 35.0, 69.0, 99.0, 212.0, 261.0, 483.0, 788.0, 1345.0, 2278.0, 4018.0, 6462.0, 11441.0, 19519.0, 33347.0, 56324.0, 90044.0, 131396.0, 163485.0, 163990.0, 133061.0, 91188.0, 57117.0, 33925.0, 19729.0, 11468.0, 6637.0, 3925.0, 2332.0, 1403.0, 835.0, 478.0, 310.0, 163.0, 118.0, 65.0, 38.0, 31.0, 23.0, 14.0, 5.0, 9.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.85546875, -4.69891357421875, -4.5423583984375, -4.38580322265625, -4.229248046875, -4.07269287109375, -3.9161376953125, -3.75958251953125, -3.60302734375, -3.44647216796875, -3.2899169921875, -3.13336181640625, -2.976806640625, -2.82025146484375, -2.6636962890625, -2.50714111328125, -2.3505859375, -2.19403076171875, -2.0374755859375, -1.88092041015625, -1.724365234375, -1.56781005859375, -1.4112548828125, -1.25469970703125, -1.09814453125, -0.94158935546875, -0.7850341796875, -0.62847900390625, -0.471923828125, -0.31536865234375, -0.1588134765625, -0.00225830078125, 0.154296875, 0.31085205078125, 0.4674072265625, 0.62396240234375, 0.780517578125, 0.93707275390625, 1.0936279296875, 1.25018310546875, 1.40673828125, 1.56329345703125, 1.7198486328125, 1.87640380859375, 2.032958984375, 2.18951416015625, 2.3460693359375, 2.50262451171875, 2.6591796875, 2.81573486328125, 2.9722900390625, 3.12884521484375, 3.285400390625, 3.44195556640625, 3.5985107421875, 3.75506591796875, 3.91162109375, 4.06817626953125, 4.2247314453125, 4.38128662109375, 4.537841796875, 4.69439697265625, 4.8509521484375, 5.00750732421875, 5.1640625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 7.0, 4.0, 4.0, 9.0, 3.0, 11.0, 20.0, 20.0, 29.0, 25.0, 29.0, 39.0, 37.0, 49.0, 44.0, 58.0, 55.0, 63.0, 72.0, 54.0, 50.0, 53.0, 40.0, 34.0, 31.0, 32.0, 24.0, 22.0, 27.0, 16.0, 11.0, 3.0, 6.0, 3.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.81689453125, -1.7548828125, -1.69287109375, -1.630859375, -1.56884765625, -1.5068359375, -1.44482421875, -1.3828125, -1.32080078125, -1.2587890625, -1.19677734375, -1.134765625, -1.07275390625, -1.0107421875, -0.94873046875, -0.88671875, -0.82470703125, -0.7626953125, -0.70068359375, -0.638671875, -0.57666015625, -0.5146484375, -0.45263671875, -0.390625, -0.32861328125, -0.2666015625, -0.20458984375, -0.142578125, -0.08056640625, -0.0185546875, 0.04345703125, 0.10546875, 0.16748046875, 0.2294921875, 0.29150390625, 0.353515625, 0.41552734375, 0.4775390625, 0.53955078125, 0.6015625, 0.66357421875, 0.7255859375, 0.78759765625, 0.849609375, 0.91162109375, 0.9736328125, 1.03564453125, 1.09765625, 1.15966796875, 1.2216796875, 1.28369140625, 1.345703125, 1.40771484375, 1.4697265625, 1.53173828125, 1.59375, 1.65576171875, 1.7177734375, 1.77978515625, 1.841796875, 1.90380859375, 1.9658203125, 2.02783203125, 2.08984375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 7.0, 7.0, 10.0, 4.0, 9.0, 9.0, 20.0, 11.0, 11.0, 20.0, 29.0, 29.0, 27.0, 35.0, 40.0, 58.0, 47.0, 51.0, 55.0, 56.0, 47.0, 47.0, 54.0, 38.0, 33.0, 46.0, 37.0, 21.0, 28.0, 19.0, 15.0, 16.0, 14.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.72874927520752, -8.447918891906738, -8.167088508605957, -7.886258602142334, -7.605428218841553, -7.3245978355407715, -7.043767929077148, -6.762937545776367, -6.482107162475586, -6.201276779174805, -5.920446395874023, -5.6396164894104, -5.358786106109619, -5.077955722808838, -4.797125816345215, -4.516295433044434, -4.235465049743652, -3.954634666442871, -3.673804521560669, -3.392974376678467, -3.1121439933776855, -2.8313136100769043, -2.550483465194702, -2.2696533203125, -1.9888229370117188, -1.707992672920227, -1.4271624088287354, -1.1463321447372437, -0.865501880645752, -0.5846716165542603, -0.30384135246276855, -0.023011088371276855, 0.25781917572021484, 0.5386494398117065, 0.8194797039031982, 1.10030996799469, 1.3811402320861816, 1.6619704961776733, 1.942800760269165, 2.223630905151367, 2.5044612884521484, 2.7852916717529297, 3.066121816635132, 3.346951961517334, 3.6277823448181152, 3.9086127281188965, 4.1894426345825195, 4.470273017883301, 4.751103401184082, 5.031933784484863, 5.3127641677856445, 5.593594074249268, 5.874424457550049, 6.15525484085083, 6.436084747314453, 6.716915130615234, 6.997745513916016, 7.278575897216797, 7.559406280517578, 7.840236186981201, 8.12106704711914, 8.401896476745605, 8.682726860046387, 8.963557243347168, 9.24438762664795]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 4.0, 5.0, 3.0, 7.0, 8.0, 5.0, 8.0, 6.0, 18.0, 16.0, 13.0, 17.0, 20.0, 21.0, 29.0, 20.0, 25.0, 37.0, 26.0, 36.0, 41.0, 36.0, 39.0, 42.0, 36.0, 43.0, 36.0, 36.0, 33.0, 30.0, 38.0, 33.0, 53.0, 21.0, 22.0, 29.0, 14.0, 18.0, 16.0, 12.0, 10.0, 10.0, 3.0, 10.0, 6.0, 2.0, 5.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-7.567232608795166, -7.347975730895996, -7.128719329833984, -6.9094624519348145, -6.690206050872803, -6.470949172973633, -6.251692771911621, -6.032435894012451, -5.8131794929504395, -5.5939226150512695, -5.374666213989258, -5.155409336090088, -4.936152935028076, -4.716896057128906, -4.4976396560668945, -4.278382778167725, -4.059125900268555, -3.839869260787964, -3.620612621307373, -3.4013559818267822, -3.1820993423461914, -2.9628424644470215, -2.7435860633850098, -2.52432918548584, -2.305072784423828, -2.0858161449432373, -1.8665595054626465, -1.6473028659820557, -1.4280462265014648, -1.2087894678115845, -0.9895328283309937, -0.7702761888504028, -0.5510196685791016, -0.33176302909851074, -0.11250635981559753, 0.10675030946731567, 0.3260069489479065, 0.5452636480331421, 0.7645202875137329, 0.9837769269943237, 1.2030335664749146, 1.4222902059555054, 1.6415468454360962, 1.8608036041259766, 2.0800602436065674, 2.299316883087158, 2.518573522567749, 2.73783016204834, 2.9570868015289307, 3.1763434410095215, 3.3956000804901123, 3.614856719970703, 3.834113359451294, 4.053369998931885, 4.272626876831055, 4.491883277893066, 4.711140155792236, 4.930397033691406, 5.149653434753418, 5.368910312652588, 5.5881667137146, 5.8074235916137695, 6.026679992675781, 6.245936870574951, 6.465193271636963]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 14.0, 23.0, 25.0, 44.0, 54.0, 107.0, 164.0, 228.0, 368.0, 584.0, 997.0, 1617.0, 2695.0, 4408.0, 7576.0, 13339.0, 24039.0, 46071.0, 91898.0, 194552.0, 423329.0, 825026.0, 1055337.0, 765403.0, 382508.0, 175601.0, 83415.0, 42030.0, 22697.0, 12466.0, 6974.0, 4157.0, 2491.0, 1560.0, 963.0, 564.0, 342.0, 223.0, 128.0, 88.0, 60.0, 40.0, 21.0, 16.0, 13.0, 14.0, 4.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.781005859375, -7.50732421875, -7.233642578125, -6.9599609375, -6.686279296875, -6.41259765625, -6.138916015625, -5.865234375, -5.591552734375, -5.31787109375, -5.044189453125, -4.7705078125, -4.496826171875, -4.22314453125, -3.949462890625, -3.67578125, -3.402099609375, -3.12841796875, -2.854736328125, -2.5810546875, -2.307373046875, -2.03369140625, -1.760009765625, -1.486328125, -1.212646484375, -0.93896484375, -0.665283203125, -0.3916015625, -0.117919921875, 0.15576171875, 0.429443359375, 0.703125, 0.976806640625, 1.25048828125, 1.524169921875, 1.7978515625, 2.071533203125, 2.34521484375, 2.618896484375, 2.892578125, 3.166259765625, 3.43994140625, 3.713623046875, 3.9873046875, 4.260986328125, 4.53466796875, 4.808349609375, 5.08203125, 5.355712890625, 5.62939453125, 5.903076171875, 6.1767578125, 6.450439453125, 6.72412109375, 6.997802734375, 7.271484375, 7.545166015625, 7.81884765625, 8.092529296875, 8.3662109375, 8.639892578125, 8.91357421875, 9.187255859375, 9.4609375]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 7.0, 8.0, 3.0, 8.0, 10.0, 12.0, 12.0, 15.0, 20.0, 26.0, 16.0, 19.0, 21.0, 21.0, 36.0, 34.0, 30.0, 35.0, 46.0, 39.0, 50.0, 37.0, 30.0, 42.0, 34.0, 51.0, 35.0, 34.0, 39.0, 39.0, 37.0, 27.0, 17.0, 12.0, 16.0, 16.0, 21.0, 12.0, 8.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.19921875, -5.0399169921875, -4.880615234375, -4.7213134765625, -4.56201171875, -4.4027099609375, -4.243408203125, -4.0841064453125, -3.9248046875, -3.7655029296875, -3.606201171875, -3.4468994140625, -3.28759765625, -3.1282958984375, -2.968994140625, -2.8096923828125, -2.650390625, -2.4910888671875, -2.331787109375, -2.1724853515625, -2.01318359375, -1.8538818359375, -1.694580078125, -1.5352783203125, -1.3759765625, -1.2166748046875, -1.057373046875, -0.8980712890625, -0.73876953125, -0.5794677734375, -0.420166015625, -0.2608642578125, -0.1015625, 0.0577392578125, 0.217041015625, 0.3763427734375, 0.53564453125, 0.6949462890625, 0.854248046875, 1.0135498046875, 1.1728515625, 1.3321533203125, 1.491455078125, 1.6507568359375, 1.81005859375, 1.9693603515625, 2.128662109375, 2.2879638671875, 2.447265625, 2.6065673828125, 2.765869140625, 2.9251708984375, 3.08447265625, 3.2437744140625, 3.403076171875, 3.5623779296875, 3.7216796875, 3.8809814453125, 4.040283203125, 4.1995849609375, 4.35888671875, 4.5181884765625, 4.677490234375, 4.8367919921875, 4.99609375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 10.0, 12.0, 17.0, 26.0, 36.0, 48.0, 70.0, 100.0, 165.0, 267.0, 383.0, 586.0, 893.0, 1353.0, 2171.0, 3624.0, 5987.0, 9772.0, 16627.0, 28222.0, 50388.0, 91728.0, 171235.0, 317893.0, 567945.0, 841816.0, 835389.0, 557480.0, 313184.0, 167994.0, 90580.0, 49265.0, 28195.0, 16075.0, 9459.0, 5711.0, 3434.0, 2248.0, 1355.0, 893.0, 564.0, 346.0, 247.0, 172.0, 110.0, 66.0, 41.0, 37.0, 26.0, 19.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-7.8984375, -7.6514892578125, -7.404541015625, -7.1575927734375, -6.91064453125, -6.6636962890625, -6.416748046875, -6.1697998046875, -5.9228515625, -5.6759033203125, -5.428955078125, -5.1820068359375, -4.93505859375, -4.6881103515625, -4.441162109375, -4.1942138671875, -3.947265625, -3.7003173828125, -3.453369140625, -3.2064208984375, -2.95947265625, -2.7125244140625, -2.465576171875, -2.2186279296875, -1.9716796875, -1.7247314453125, -1.477783203125, -1.2308349609375, -0.98388671875, -0.7369384765625, -0.489990234375, -0.2430419921875, 0.00390625, 0.2508544921875, 0.497802734375, 0.7447509765625, 0.99169921875, 1.2386474609375, 1.485595703125, 1.7325439453125, 1.9794921875, 2.2264404296875, 2.473388671875, 2.7203369140625, 2.96728515625, 3.2142333984375, 3.461181640625, 3.7081298828125, 3.955078125, 4.2020263671875, 4.448974609375, 4.6959228515625, 4.94287109375, 5.1898193359375, 5.436767578125, 5.6837158203125, 5.9306640625, 6.1776123046875, 6.424560546875, 6.6715087890625, 6.91845703125, 7.1654052734375, 7.412353515625, 7.6593017578125, 7.90625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 11.0, 20.0, 17.0, 31.0, 40.0, 38.0, 54.0, 77.0, 94.0, 117.0, 146.0, 143.0, 197.0, 242.0, 279.0, 294.0, 298.0, 273.0, 291.0, 204.0, 209.0, 185.0, 152.0, 131.0, 105.0, 72.0, 80.0, 49.0, 37.0, 34.0, 32.0, 23.0, 21.0, 15.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.666015625, -2.57318115234375, -2.4803466796875, -2.38751220703125, -2.294677734375, -2.20184326171875, -2.1090087890625, -2.01617431640625, -1.92333984375, -1.83050537109375, -1.7376708984375, -1.64483642578125, -1.552001953125, -1.45916748046875, -1.3663330078125, -1.27349853515625, -1.1806640625, -1.08782958984375, -0.9949951171875, -0.90216064453125, -0.809326171875, -0.71649169921875, -0.6236572265625, -0.53082275390625, -0.43798828125, -0.34515380859375, -0.2523193359375, -0.15948486328125, -0.066650390625, 0.02618408203125, 0.1190185546875, 0.21185302734375, 0.3046875, 0.39752197265625, 0.4903564453125, 0.58319091796875, 0.676025390625, 0.76885986328125, 0.8616943359375, 0.95452880859375, 1.04736328125, 1.14019775390625, 1.2330322265625, 1.32586669921875, 1.418701171875, 1.51153564453125, 1.6043701171875, 1.69720458984375, 1.7900390625, 1.88287353515625, 1.9757080078125, 2.06854248046875, 2.161376953125, 2.25421142578125, 2.3470458984375, 2.43988037109375, 2.53271484375, 2.62554931640625, 2.7183837890625, 2.81121826171875, 2.904052734375, 2.99688720703125, 3.0897216796875, 3.18255615234375, 3.275390625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 6.0, 15.0, 12.0, 11.0, 14.0, 19.0, 28.0, 27.0, 32.0, 32.0, 39.0, 38.0, 40.0, 56.0, 67.0, 67.0, 56.0, 51.0, 66.0, 43.0, 52.0, 41.0, 35.0, 26.0, 20.0, 25.0, 18.0, 10.0, 10.0, 7.0, 7.0, 10.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.182652473449707, -9.896796226501465, -9.610940933227539, -9.325084686279297, -9.039228439331055, -8.753372192382812, -8.467516899108887, -8.181660652160645, -7.895804405212402, -7.609948635101318, -7.324092388153076, -7.038236618041992, -6.75238037109375, -6.466524600982666, -6.180668830871582, -5.89481258392334, -5.608956813812256, -5.323101043701172, -5.03724479675293, -4.751389026641846, -4.4655327796936035, -4.1796770095825195, -3.8938210010528564, -3.6079649925231934, -3.3221089839935303, -3.036252975463867, -2.750396966934204, -2.464540958404541, -2.178685188293457, -1.8928290605545044, -1.6069731712341309, -1.3211171627044678, -1.0352611541748047, -0.7494051456451416, -0.4635491967201233, -0.17769324779510498, 0.1081627607345581, 0.3940187692642212, 0.6798746585845947, 0.9657306671142578, 1.251586675643921, 1.537442684173584, 1.823298692703247, 2.10915470123291, 2.395010471343994, 2.6808667182922363, 2.9667224884033203, 3.2525784969329834, 3.5384345054626465, 3.8242905139923096, 4.110146522521973, 4.396002292633057, 4.681858539581299, 4.967714309692383, 5.253570556640625, 5.539426326751709, 5.825282096862793, 6.111137866973877, 6.396994113922119, 6.682849884033203, 6.968706130981445, 7.254561901092529, 7.540417671203613, 7.8262739181518555, 8.112130165100098]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 11.0, 8.0, 10.0, 13.0, 18.0, 16.0, 30.0, 24.0, 25.0, 23.0, 42.0, 34.0, 37.0, 34.0, 38.0, 46.0, 47.0, 47.0, 27.0, 37.0, 40.0, 34.0, 32.0, 43.0, 33.0, 34.0, 31.0, 28.0, 24.0, 15.0, 26.0, 16.0, 14.0, 9.0, 6.0, 5.0, 5.0, 4.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.041364669799805, -5.8413872718811035, -5.641409873962402, -5.441432952880859, -5.241455554962158, -5.041478157043457, -4.841501235961914, -4.641523838043213, -4.441546440124512, -4.2415690422058105, -4.041591644287109, -3.8416147232055664, -3.6416373252868652, -3.441659927368164, -3.241682767868042, -3.04170560836792, -2.8417282104492188, -2.6417508125305176, -2.4417736530303955, -2.2417964935302734, -2.0418190956115723, -1.8418418169021606, -1.641864538192749, -1.4418872594833374, -1.2419099807739258, -1.0419327020645142, -0.8419554233551025, -0.6419781446456909, -0.4420008659362793, -0.24202358722686768, -0.042046308517456055, 0.15793097019195557, 0.357907772064209, 0.5578850507736206, 0.7578623294830322, 0.9578396081924438, 1.1578168869018555, 1.357794165611267, 1.5577714443206787, 1.7577487230300903, 1.957726001739502, 2.157703399658203, 2.357680559158325, 2.5576577186584473, 2.7576351165771484, 2.9576125144958496, 3.1575896739959717, 3.3575668334960938, 3.557544231414795, 3.757521629333496, 3.957498788833618, 4.15747594833374, 4.357453346252441, 4.557430744171143, 4.757408142089844, 4.957385063171387, 5.157362461090088, 5.357339859008789, 5.557316780090332, 5.757294178009033, 5.957271575927734, 6.1572489738464355, 6.357226371765137, 6.55720329284668, 6.757180690765381]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 2.0, 7.0, 11.0, 12.0, 22.0, 22.0, 21.0, 31.0, 49.0, 58.0, 102.0, 107.0, 166.0, 214.0, 325.0, 497.0, 687.0, 967.0, 1475.0, 2250.0, 3623.0, 6228.0, 11967.0, 26220.0, 62385.0, 155953.0, 295129.0, 262569.0, 122678.0, 49334.0, 20683.0, 9864.0, 5415.0, 3184.0, 1988.0, 1275.0, 946.0, 628.0, 402.0, 328.0, 193.0, 143.0, 89.0, 78.0, 59.0, 44.0, 37.0, 25.0, 23.0, 13.0, 9.0, 7.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.921875, -10.55615234375, -10.1904296875, -9.82470703125, -9.458984375, -9.09326171875, -8.7275390625, -8.36181640625, -7.99609375, -7.63037109375, -7.2646484375, -6.89892578125, -6.533203125, -6.16748046875, -5.8017578125, -5.43603515625, -5.0703125, -4.70458984375, -4.3388671875, -3.97314453125, -3.607421875, -3.24169921875, -2.8759765625, -2.51025390625, -2.14453125, -1.77880859375, -1.4130859375, -1.04736328125, -0.681640625, -0.31591796875, 0.0498046875, 0.41552734375, 0.78125, 1.14697265625, 1.5126953125, 1.87841796875, 2.244140625, 2.60986328125, 2.9755859375, 3.34130859375, 3.70703125, 4.07275390625, 4.4384765625, 4.80419921875, 5.169921875, 5.53564453125, 5.9013671875, 6.26708984375, 6.6328125, 6.99853515625, 7.3642578125, 7.72998046875, 8.095703125, 8.46142578125, 8.8271484375, 9.19287109375, 9.55859375, 9.92431640625, 10.2900390625, 10.65576171875, 11.021484375, 11.38720703125, 11.7529296875, 12.11865234375, 12.484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 13.0, 12.0, 12.0, 17.0, 18.0, 19.0, 21.0, 26.0, 32.0, 24.0, 24.0, 37.0, 33.0, 51.0, 36.0, 43.0, 34.0, 31.0, 37.0, 39.0, 50.0, 36.0, 36.0, 27.0, 42.0, 25.0, 32.0, 28.0, 20.0, 18.0, 24.0, 15.0, 20.0, 14.0, 11.0, 8.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.96630859375, -5.7724609375, -5.57861328125, -5.384765625, -5.19091796875, -4.9970703125, -4.80322265625, -4.609375, -4.41552734375, -4.2216796875, -4.02783203125, -3.833984375, -3.64013671875, -3.4462890625, -3.25244140625, -3.05859375, -2.86474609375, -2.6708984375, -2.47705078125, -2.283203125, -2.08935546875, -1.8955078125, -1.70166015625, -1.5078125, -1.31396484375, -1.1201171875, -0.92626953125, -0.732421875, -0.53857421875, -0.3447265625, -0.15087890625, 0.04296875, 0.23681640625, 0.4306640625, 0.62451171875, 0.818359375, 1.01220703125, 1.2060546875, 1.39990234375, 1.59375, 1.78759765625, 1.9814453125, 2.17529296875, 2.369140625, 2.56298828125, 2.7568359375, 2.95068359375, 3.14453125, 3.33837890625, 3.5322265625, 3.72607421875, 3.919921875, 4.11376953125, 4.3076171875, 4.50146484375, 4.6953125, 4.88916015625, 5.0830078125, 5.27685546875, 5.470703125, 5.66455078125, 5.8583984375, 6.05224609375, 6.24609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 8.0, 5.0, 7.0, 11.0, 23.0, 18.0, 33.0, 31.0, 61.0, 69.0, 96.0, 111.0, 175.0, 230.0, 346.0, 534.0, 897.0, 1352.0, 2181.0, 3926.0, 7516.0, 17012.0, 50680.0, 190612.0, 462122.0, 216227.0, 56908.0, 18663.0, 8046.0, 4127.0, 2318.0, 1396.0, 881.0, 541.0, 434.0, 288.0, 186.0, 133.0, 75.0, 72.0, 59.0, 40.0, 39.0, 22.0, 11.0, 12.0, 6.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-17.90625, -17.320068359375, -16.73388671875, -16.147705078125, -15.5615234375, -14.975341796875, -14.38916015625, -13.802978515625, -13.216796875, -12.630615234375, -12.04443359375, -11.458251953125, -10.8720703125, -10.285888671875, -9.69970703125, -9.113525390625, -8.52734375, -7.941162109375, -7.35498046875, -6.768798828125, -6.1826171875, -5.596435546875, -5.01025390625, -4.424072265625, -3.837890625, -3.251708984375, -2.66552734375, -2.079345703125, -1.4931640625, -0.906982421875, -0.32080078125, 0.265380859375, 0.8515625, 1.437744140625, 2.02392578125, 2.610107421875, 3.1962890625, 3.782470703125, 4.36865234375, 4.954833984375, 5.541015625, 6.127197265625, 6.71337890625, 7.299560546875, 7.8857421875, 8.471923828125, 9.05810546875, 9.644287109375, 10.23046875, 10.816650390625, 11.40283203125, 11.989013671875, 12.5751953125, 13.161376953125, 13.74755859375, 14.333740234375, 14.919921875, 15.506103515625, 16.09228515625, 16.678466796875, 17.2646484375, 17.850830078125, 18.43701171875, 19.023193359375, 19.609375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 6.0, 12.0, 18.0, 11.0, 17.0, 16.0, 15.0, 26.0, 28.0, 25.0, 24.0, 25.0, 33.0, 28.0, 41.0, 48.0, 32.0, 41.0, 49.0, 31.0, 43.0, 44.0, 42.0, 35.0, 31.0, 43.0, 32.0, 26.0, 36.0, 20.0, 18.0, 12.0, 14.0, 12.0, 10.0, 5.0, 7.0, 11.0, 4.0, 6.0, 3.0, 5.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.9210205078125, -3.799072265625, -3.6771240234375, -3.55517578125, -3.4332275390625, -3.311279296875, -3.1893310546875, -3.0673828125, -2.9454345703125, -2.823486328125, -2.7015380859375, -2.57958984375, -2.4576416015625, -2.335693359375, -2.2137451171875, -2.091796875, -1.9698486328125, -1.847900390625, -1.7259521484375, -1.60400390625, -1.4820556640625, -1.360107421875, -1.2381591796875, -1.1162109375, -0.9942626953125, -0.872314453125, -0.7503662109375, -0.62841796875, -0.5064697265625, -0.384521484375, -0.2625732421875, -0.140625, -0.0186767578125, 0.103271484375, 0.2252197265625, 0.34716796875, 0.4691162109375, 0.591064453125, 0.7130126953125, 0.8349609375, 0.9569091796875, 1.078857421875, 1.2008056640625, 1.32275390625, 1.4447021484375, 1.566650390625, 1.6885986328125, 1.810546875, 1.9324951171875, 2.054443359375, 2.1763916015625, 2.29833984375, 2.4202880859375, 2.542236328125, 2.6641845703125, 2.7861328125, 2.9080810546875, 3.030029296875, 3.1519775390625, 3.27392578125, 3.3958740234375, 3.517822265625, 3.6397705078125, 3.76171875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 7.0, 4.0, 4.0, 8.0, 16.0, 22.0, 14.0, 41.0, 50.0, 53.0, 113.0, 128.0, 217.0, 303.0, 455.0, 705.0, 1115.0, 1805.0, 3185.0, 6411.0, 14657.0, 46160.0, 202113.0, 512033.0, 187342.0, 43492.0, 14159.0, 6070.0, 3016.0, 1731.0, 1129.0, 652.0, 427.0, 287.0, 187.0, 127.0, 88.0, 63.0, 62.0, 37.0, 18.0, 16.0, 15.0, 5.0, 5.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.265625, -10.9388427734375, -10.612060546875, -10.2852783203125, -9.95849609375, -9.6317138671875, -9.304931640625, -8.9781494140625, -8.6513671875, -8.3245849609375, -7.997802734375, -7.6710205078125, -7.34423828125, -7.0174560546875, -6.690673828125, -6.3638916015625, -6.037109375, -5.7103271484375, -5.383544921875, -5.0567626953125, -4.72998046875, -4.4031982421875, -4.076416015625, -3.7496337890625, -3.4228515625, -3.0960693359375, -2.769287109375, -2.4425048828125, -2.11572265625, -1.7889404296875, -1.462158203125, -1.1353759765625, -0.80859375, -0.4818115234375, -0.155029296875, 0.1717529296875, 0.49853515625, 0.8253173828125, 1.152099609375, 1.4788818359375, 1.8056640625, 2.1324462890625, 2.459228515625, 2.7860107421875, 3.11279296875, 3.4395751953125, 3.766357421875, 4.0931396484375, 4.419921875, 4.7467041015625, 5.073486328125, 5.4002685546875, 5.72705078125, 6.0538330078125, 6.380615234375, 6.7073974609375, 7.0341796875, 7.3609619140625, 7.687744140625, 8.0145263671875, 8.34130859375, 8.6680908203125, 8.994873046875, 9.3216552734375, 9.6484375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 10.0, 26.0, 32.0, 88.0, 143.0, 239.0, 223.0, 122.0, 44.0, 28.0, 12.0, 6.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.0008563995361328125, -0.0008358955383300781, -0.0008153915405273438, -0.0007948875427246094, -0.000774383544921875, -0.0007538795471191406, -0.0007333755493164062, -0.0007128715515136719, -0.0006923675537109375, -0.0006718635559082031, -0.0006513595581054688, -0.0006308555603027344, -0.0006103515625, -0.0005898475646972656, -0.0005693435668945312, -0.0005488395690917969, -0.0005283355712890625, -0.0005078315734863281, -0.00048732757568359375, -0.0004668235778808594, -0.000446319580078125, -0.0004258155822753906, -0.00040531158447265625, -0.0003848075866699219, -0.0003643035888671875, -0.0003437995910644531, -0.00032329559326171875, -0.0003027915954589844, -0.00028228759765625, -0.0002617835998535156, -0.00024127960205078125, -0.00022077560424804688, -0.0002002716064453125, -0.00017976760864257812, -0.00015926361083984375, -0.00013875961303710938, -0.000118255615234375, -9.775161743164062e-05, -7.724761962890625e-05, -5.6743621826171875e-05, -3.62396240234375e-05, -1.5735626220703125e-05, 4.76837158203125e-06, 2.5272369384765625e-05, 4.57763671875e-05, 6.628036499023438e-05, 8.678436279296875e-05, 0.00010728836059570312, 0.0001277923583984375, 0.00014829635620117188, 0.00016880035400390625, 0.00018930435180664062, 0.000209808349609375, 0.00023031234741210938, 0.00025081634521484375, 0.0002713203430175781, 0.0002918243408203125, 0.0003123283386230469, 0.00033283233642578125, 0.0003533363342285156, 0.00037384033203125, 0.0003943443298339844, 0.00041484832763671875, 0.0004353523254394531, 0.0004558563232421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 15.0, 15.0, 14.0, 19.0, 47.0, 53.0, 84.0, 105.0, 134.0, 206.0, 297.0, 427.0, 593.0, 873.0, 1240.0, 1823.0, 2855.0, 5383.0, 12513.0, 39146.0, 145940.0, 397497.0, 304171.0, 89602.0, 24777.0, 8921.0, 4211.0, 2380.0, 1603.0, 1067.0, 715.0, 535.0, 384.0, 249.0, 191.0, 136.0, 93.0, 66.0, 42.0, 31.0, 25.0, 20.0, 13.0, 13.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.53125, -8.25439453125, -7.9775390625, -7.70068359375, -7.423828125, -7.14697265625, -6.8701171875, -6.59326171875, -6.31640625, -6.03955078125, -5.7626953125, -5.48583984375, -5.208984375, -4.93212890625, -4.6552734375, -4.37841796875, -4.1015625, -3.82470703125, -3.5478515625, -3.27099609375, -2.994140625, -2.71728515625, -2.4404296875, -2.16357421875, -1.88671875, -1.60986328125, -1.3330078125, -1.05615234375, -0.779296875, -0.50244140625, -0.2255859375, 0.05126953125, 0.328125, 0.60498046875, 0.8818359375, 1.15869140625, 1.435546875, 1.71240234375, 1.9892578125, 2.26611328125, 2.54296875, 2.81982421875, 3.0966796875, 3.37353515625, 3.650390625, 3.92724609375, 4.2041015625, 4.48095703125, 4.7578125, 5.03466796875, 5.3115234375, 5.58837890625, 5.865234375, 6.14208984375, 6.4189453125, 6.69580078125, 6.97265625, 7.24951171875, 7.5263671875, 7.80322265625, 8.080078125, 8.35693359375, 8.6337890625, 8.91064453125, 9.1875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 6.0, 17.0, 22.0, 45.0, 46.0, 62.0, 117.0, 150.0, 128.0, 116.0, 105.0, 62.0, 45.0, 21.0, 16.0, 11.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.953125, -3.8524169921875, -3.751708984375, -3.6510009765625, -3.55029296875, -3.4495849609375, -3.348876953125, -3.2481689453125, -3.1474609375, -3.0467529296875, -2.946044921875, -2.8453369140625, -2.74462890625, -2.6439208984375, -2.543212890625, -2.4425048828125, -2.341796875, -2.2410888671875, -2.140380859375, -2.0396728515625, -1.93896484375, -1.8382568359375, -1.737548828125, -1.6368408203125, -1.5361328125, -1.4354248046875, -1.334716796875, -1.2340087890625, -1.13330078125, -1.0325927734375, -0.931884765625, -0.8311767578125, -0.73046875, -0.6297607421875, -0.529052734375, -0.4283447265625, -0.32763671875, -0.2269287109375, -0.126220703125, -0.0255126953125, 0.0751953125, 0.1759033203125, 0.276611328125, 0.3773193359375, 0.47802734375, 0.5787353515625, 0.679443359375, 0.7801513671875, 0.880859375, 0.9815673828125, 1.082275390625, 1.1829833984375, 1.28369140625, 1.3843994140625, 1.485107421875, 1.5858154296875, 1.6865234375, 1.7872314453125, 1.887939453125, 1.9886474609375, 2.08935546875, 2.1900634765625, 2.290771484375, 2.3914794921875, 2.4921875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 5.0, 10.0, 9.0, 7.0, 13.0, 17.0, 25.0, 24.0, 35.0, 37.0, 28.0, 37.0, 37.0, 61.0, 43.0, 52.0, 57.0, 45.0, 64.0, 60.0, 46.0, 55.0, 30.0, 32.0, 28.0, 26.0, 22.0, 15.0, 13.0, 12.0, 10.0, 18.0, 7.0, 6.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.566675186157227, -9.304231643676758, -9.041787147521973, -8.779343605041504, -8.516899108886719, -8.25445556640625, -7.992011547088623, -7.729567527770996, -7.467123508453369, -7.204679489135742, -6.942235469818115, -6.679791450500488, -6.4173479080200195, -6.154903411865234, -5.892459869384766, -5.630015850067139, -5.367571830749512, -5.105127811431885, -4.842683792114258, -4.580239772796631, -4.317795753479004, -4.055352210998535, -3.792908191680908, -3.5304641723632812, -3.2680201530456543, -3.0055761337280273, -2.7431321144104004, -2.4806883335113525, -2.2182443141937256, -1.9558002948760986, -1.6933563947677612, -1.4309124946594238, -1.1684694290161133, -0.9060254693031311, -0.6435815095901489, -0.38113754987716675, -0.11869359016418457, 0.14375042915344238, 0.4061943292617798, 0.6686382293701172, 0.9310822486877441, 1.193526268005371, 1.4559701681137085, 1.718414068222046, 1.9808580875396729, 2.2433021068573, 2.5057458877563477, 2.7681899070739746, 3.0306339263916016, 3.2930779457092285, 3.5555219650268555, 3.8179657459259033, 4.080410003662109, 4.342853546142578, 4.605297565460205, 4.867741584777832, 5.130185604095459, 5.392629623413086, 5.655073642730713, 5.91751766204834, 6.179961204528809, 6.442405700683594, 6.7048492431640625, 6.9672932624816895, 7.229737281799316]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 9.0, 11.0, 6.0, 7.0, 6.0, 10.0, 9.0, 24.0, 19.0, 30.0, 20.0, 25.0, 31.0, 25.0, 36.0, 34.0, 39.0, 30.0, 53.0, 41.0, 38.0, 44.0, 46.0, 33.0, 34.0, 31.0, 41.0, 32.0, 36.0, 24.0, 29.0, 35.0, 25.0, 15.0, 13.0, 13.0, 5.0, 11.0, 6.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39036226272583, -5.20006799697876, -5.0097737312316895, -4.819479465484619, -4.629185199737549, -4.4388909339904785, -4.24859619140625, -4.05830192565918, -3.8680078983306885, -3.677713632583618, -3.487419366836548, -3.2971248626708984, -3.106830596923828, -2.916536331176758, -2.7262420654296875, -2.535947799682617, -2.345653533935547, -2.1553592681884766, -1.9650650024414062, -1.7747706174850464, -1.584476351737976, -1.3941820859909058, -1.203887701034546, -1.0135934352874756, -0.8232991695404053, -0.633004903793335, -0.4427105784416199, -0.2524162530899048, -0.06212198734283447, 0.12817227840423584, 0.3184666633605957, 0.508760929107666, 0.6990556716918945, 0.8893499374389648, 1.0796442031860352, 1.269938588142395, 1.4602328538894653, 1.6505271196365356, 1.8408215045928955, 2.031115770339966, 2.221410036087036, 2.4117043018341064, 2.6019985675811768, 2.792293071746826, 2.9825873374938965, 3.172881603240967, 3.363175868988037, 3.5534701347351074, 3.7437644004821777, 3.934058666229248, 4.124352931976318, 4.314647197723389, 4.504941463470459, 4.695235729217529, 4.885530471801758, 5.075824737548828, 5.266119003295898, 5.456413269042969, 5.646707534790039, 5.837001800537109, 6.02729606628418, 6.21759033203125, 6.40788459777832, 6.598178863525391, 6.788473129272461]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 11.0, 31.0, 43.0, 51.0, 84.0, 137.0, 189.0, 297.0, 427.0, 647.0, 962.0, 1390.0, 2251.0, 3602.0, 5561.0, 8837.0, 13770.0, 21888.0, 33952.0, 52084.0, 76169.0, 104075.0, 128284.0, 138219.0, 128039.0, 104106.0, 76889.0, 52283.0, 34102.0, 21942.0, 13783.0, 8595.0, 5617.0, 3486.0, 2323.0, 1461.0, 997.0, 703.0, 453.0, 270.0, 182.0, 135.0, 79.0, 55.0, 37.0, 25.0, 11.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.66796875, -6.46893310546875, -6.2698974609375, -6.07086181640625, -5.871826171875, -5.67279052734375, -5.4737548828125, -5.27471923828125, -5.07568359375, -4.87664794921875, -4.6776123046875, -4.47857666015625, -4.279541015625, -4.08050537109375, -3.8814697265625, -3.68243408203125, -3.4833984375, -3.28436279296875, -3.0853271484375, -2.88629150390625, -2.687255859375, -2.48822021484375, -2.2891845703125, -2.09014892578125, -1.89111328125, -1.69207763671875, -1.4930419921875, -1.29400634765625, -1.094970703125, -0.89593505859375, -0.6968994140625, -0.49786376953125, -0.298828125, -0.09979248046875, 0.0992431640625, 0.29827880859375, 0.497314453125, 0.69635009765625, 0.8953857421875, 1.09442138671875, 1.29345703125, 1.49249267578125, 1.6915283203125, 1.89056396484375, 2.089599609375, 2.28863525390625, 2.4876708984375, 2.68670654296875, 2.8857421875, 3.08477783203125, 3.2838134765625, 3.48284912109375, 3.681884765625, 3.88092041015625, 4.0799560546875, 4.27899169921875, 4.47802734375, 4.67706298828125, 4.8760986328125, 5.07513427734375, 5.274169921875, 5.47320556640625, 5.6722412109375, 5.87127685546875, 6.0703125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 10.0, 8.0, 6.0, 6.0, 15.0, 19.0, 20.0, 25.0, 21.0, 24.0, 30.0, 32.0, 32.0, 32.0, 54.0, 43.0, 41.0, 55.0, 52.0, 33.0, 44.0, 41.0, 42.0, 44.0, 38.0, 30.0, 33.0, 32.0, 25.0, 27.0, 23.0, 9.0, 12.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.765625, -5.5518798828125, -5.338134765625, -5.1243896484375, -4.91064453125, -4.6968994140625, -4.483154296875, -4.2694091796875, -4.0556640625, -3.8419189453125, -3.628173828125, -3.4144287109375, -3.20068359375, -2.9869384765625, -2.773193359375, -2.5594482421875, -2.345703125, -2.1319580078125, -1.918212890625, -1.7044677734375, -1.49072265625, -1.2769775390625, -1.063232421875, -0.8494873046875, -0.6357421875, -0.4219970703125, -0.208251953125, 0.0054931640625, 0.21923828125, 0.4329833984375, 0.646728515625, 0.8604736328125, 1.07421875, 1.2879638671875, 1.501708984375, 1.7154541015625, 1.92919921875, 2.1429443359375, 2.356689453125, 2.5704345703125, 2.7841796875, 2.9979248046875, 3.211669921875, 3.4254150390625, 3.63916015625, 3.8529052734375, 4.066650390625, 4.2803955078125, 4.494140625, 4.7078857421875, 4.921630859375, 5.1353759765625, 5.34912109375, 5.5628662109375, 5.776611328125, 5.9903564453125, 6.2041015625, 6.4178466796875, 6.631591796875, 6.8453369140625, 7.05908203125, 7.2728271484375, 7.486572265625, 7.7003173828125, 7.9140625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 21.0, 32.0, 50.0, 49.0, 78.0, 148.0, 212.0, 316.0, 469.0, 737.0, 1105.0, 1646.0, 2463.0, 3812.0, 5770.0, 8536.0, 13126.0, 19310.0, 28227.0, 41317.0, 58517.0, 79131.0, 99490.0, 114942.0, 120704.0, 111722.0, 94094.0, 73080.0, 53982.0, 37682.0, 26040.0, 17283.0, 11631.0, 7720.0, 5123.0, 3399.0, 2263.0, 1472.0, 932.0, 677.0, 401.0, 299.0, 184.0, 119.0, 89.0, 55.0, 36.0, 26.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0], "bins": [-5.46875, -5.30963134765625, -5.1505126953125, -4.99139404296875, -4.832275390625, -4.67315673828125, -4.5140380859375, -4.35491943359375, -4.19580078125, -4.03668212890625, -3.8775634765625, -3.71844482421875, -3.559326171875, -3.40020751953125, -3.2410888671875, -3.08197021484375, -2.9228515625, -2.76373291015625, -2.6046142578125, -2.44549560546875, -2.286376953125, -2.12725830078125, -1.9681396484375, -1.80902099609375, -1.64990234375, -1.49078369140625, -1.3316650390625, -1.17254638671875, -1.013427734375, -0.85430908203125, -0.6951904296875, -0.53607177734375, -0.376953125, -0.21783447265625, -0.0587158203125, 0.10040283203125, 0.259521484375, 0.41864013671875, 0.5777587890625, 0.73687744140625, 0.89599609375, 1.05511474609375, 1.2142333984375, 1.37335205078125, 1.532470703125, 1.69158935546875, 1.8507080078125, 2.00982666015625, 2.1689453125, 2.32806396484375, 2.4871826171875, 2.64630126953125, 2.805419921875, 2.96453857421875, 3.1236572265625, 3.28277587890625, 3.44189453125, 3.60101318359375, 3.7601318359375, 3.91925048828125, 4.078369140625, 4.23748779296875, 4.3966064453125, 4.55572509765625, 4.71484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 2.0, 3.0, 3.0, 17.0, 8.0, 9.0, 13.0, 16.0, 24.0, 10.0, 22.0, 15.0, 27.0, 28.0, 25.0, 36.0, 34.0, 31.0, 41.0, 42.0, 31.0, 45.0, 36.0, 53.0, 42.0, 48.0, 42.0, 32.0, 35.0, 31.0, 16.0, 23.0, 33.0, 26.0, 16.0, 22.0, 13.0, 9.0, 7.0, 6.0, 8.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.203125, -4.0819091796875, -3.960693359375, -3.8394775390625, -3.71826171875, -3.5970458984375, -3.475830078125, -3.3546142578125, -3.2333984375, -3.1121826171875, -2.990966796875, -2.8697509765625, -2.74853515625, -2.6273193359375, -2.506103515625, -2.3848876953125, -2.263671875, -2.1424560546875, -2.021240234375, -1.9000244140625, -1.77880859375, -1.6575927734375, -1.536376953125, -1.4151611328125, -1.2939453125, -1.1727294921875, -1.051513671875, -0.9302978515625, -0.80908203125, -0.6878662109375, -0.566650390625, -0.4454345703125, -0.32421875, -0.2030029296875, -0.081787109375, 0.0394287109375, 0.16064453125, 0.2818603515625, 0.403076171875, 0.5242919921875, 0.6455078125, 0.7667236328125, 0.887939453125, 1.0091552734375, 1.13037109375, 1.2515869140625, 1.372802734375, 1.4940185546875, 1.615234375, 1.7364501953125, 1.857666015625, 1.9788818359375, 2.10009765625, 2.2213134765625, 2.342529296875, 2.4637451171875, 2.5849609375, 2.7061767578125, 2.827392578125, 2.9486083984375, 3.06982421875, 3.1910400390625, 3.312255859375, 3.4334716796875, 3.5546875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 13.0, 26.0, 24.0, 39.0, 69.0, 80.0, 141.0, 217.0, 345.0, 488.0, 778.0, 1242.0, 1963.0, 3248.0, 5271.0, 8884.0, 15127.0, 25896.0, 45427.0, 76952.0, 124855.0, 173985.0, 186140.0, 146174.0, 95021.0, 56435.0, 32839.0, 18793.0, 11129.0, 6425.0, 3980.0, 2429.0, 1521.0, 919.0, 599.0, 358.0, 245.0, 169.0, 101.0, 66.0, 58.0, 24.0, 24.0, 13.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.2274169921875, -4.072021484375, -3.9166259765625, -3.76123046875, -3.6058349609375, -3.450439453125, -3.2950439453125, -3.1396484375, -2.9842529296875, -2.828857421875, -2.6734619140625, -2.51806640625, -2.3626708984375, -2.207275390625, -2.0518798828125, -1.896484375, -1.7410888671875, -1.585693359375, -1.4302978515625, -1.27490234375, -1.1195068359375, -0.964111328125, -0.8087158203125, -0.6533203125, -0.4979248046875, -0.342529296875, -0.1871337890625, -0.03173828125, 0.1236572265625, 0.279052734375, 0.4344482421875, 0.58984375, 0.7452392578125, 0.900634765625, 1.0560302734375, 1.21142578125, 1.3668212890625, 1.522216796875, 1.6776123046875, 1.8330078125, 1.9884033203125, 2.143798828125, 2.2991943359375, 2.45458984375, 2.6099853515625, 2.765380859375, 2.9207763671875, 3.076171875, 3.2315673828125, 3.386962890625, 3.5423583984375, 3.69775390625, 3.8531494140625, 4.008544921875, 4.1639404296875, 4.3193359375, 4.4747314453125, 4.630126953125, 4.7855224609375, 4.94091796875, 5.0963134765625, 5.251708984375, 5.4071044921875, 5.5625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 7.0, 4.0, 8.0, 8.0, 12.0, 22.0, 24.0, 37.0, 35.0, 45.0, 66.0, 62.0, 56.0, 73.0, 66.0, 84.0, 62.0, 56.0, 46.0, 44.0, 35.0, 30.0, 29.0, 19.0, 11.0, 16.0, 16.0, 4.0, 9.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.0006461143493652344, -0.0006294958293437958, -0.0006128773093223572, -0.0005962587893009186, -0.00057964026927948, -0.0005630217492580414, -0.0005464032292366028, -0.0005297847092151642, -0.0005131661891937256, -0.000496547669172287, -0.0004799291491508484, -0.0004633106291294098, -0.0004466921091079712, -0.0004300735890865326, -0.000413455069065094, -0.0003968365490436554, -0.0003802180290222168, -0.0003635995090007782, -0.0003469809889793396, -0.000330362468957901, -0.0003137439489364624, -0.0002971254289150238, -0.0002805069088935852, -0.0002638883888721466, -0.000247269868850708, -0.0002306513488292694, -0.0002140328288078308, -0.0001974143087863922, -0.0001807957887649536, -0.00016417726874351501, -0.00014755874872207642, -0.00013094022870063782, -0.00011432170867919922, -9.770318865776062e-05, -8.108466863632202e-05, -6.446614861488342e-05, -4.7847628593444824e-05, -3.1229108572006226e-05, -1.4610588550567627e-05, 2.0079314708709717e-06, 1.862645149230957e-05, 3.524497151374817e-05, 5.186349153518677e-05, 6.848201155662537e-05, 8.510053157806396e-05, 0.00010171905159950256, 0.00011833757162094116, 0.00013495609164237976, 0.00015157461166381836, 0.00016819313168525696, 0.00018481165170669556, 0.00020143017172813416, 0.00021804869174957275, 0.00023466721177101135, 0.00025128573179244995, 0.00026790425181388855, 0.00028452277183532715, 0.00030114129185676575, 0.00031775981187820435, 0.00033437833189964294, 0.00035099685192108154, 0.00036761537194252014, 0.00038423389196395874, 0.00040085241198539734, 0.00041747093200683594]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 13.0, 13.0, 19.0, 37.0, 45.0, 84.0, 139.0, 185.0, 275.0, 455.0, 653.0, 1017.0, 1679.0, 2560.0, 4248.0, 7225.0, 12082.0, 20518.0, 34969.0, 58138.0, 92729.0, 133142.0, 162509.0, 161527.0, 128924.0, 88339.0, 54974.0, 33274.0, 19612.0, 11500.0, 6692.0, 4127.0, 2542.0, 1546.0, 990.0, 568.0, 379.0, 289.0, 172.0, 128.0, 74.0, 39.0, 36.0, 32.0, 21.0, 11.0, 11.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.74560546875, -3.6162109375, -3.48681640625, -3.357421875, -3.22802734375, -3.0986328125, -2.96923828125, -2.83984375, -2.71044921875, -2.5810546875, -2.45166015625, -2.322265625, -2.19287109375, -2.0634765625, -1.93408203125, -1.8046875, -1.67529296875, -1.5458984375, -1.41650390625, -1.287109375, -1.15771484375, -1.0283203125, -0.89892578125, -0.76953125, -0.64013671875, -0.5107421875, -0.38134765625, -0.251953125, -0.12255859375, 0.0068359375, 0.13623046875, 0.265625, 0.39501953125, 0.5244140625, 0.65380859375, 0.783203125, 0.91259765625, 1.0419921875, 1.17138671875, 1.30078125, 1.43017578125, 1.5595703125, 1.68896484375, 1.818359375, 1.94775390625, 2.0771484375, 2.20654296875, 2.3359375, 2.46533203125, 2.5947265625, 2.72412109375, 2.853515625, 2.98291015625, 3.1123046875, 3.24169921875, 3.37109375, 3.50048828125, 3.6298828125, 3.75927734375, 3.888671875, 4.01806640625, 4.1474609375, 4.27685546875, 4.40625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 15.0, 6.0, 10.0, 17.0, 17.0, 24.0, 37.0, 33.0, 39.0, 35.0, 43.0, 48.0, 51.0, 51.0, 45.0, 53.0, 41.0, 38.0, 42.0, 34.0, 50.0, 41.0, 30.0, 35.0, 22.0, 20.0, 19.0, 18.0, 18.0, 12.0, 5.0, 3.0, 7.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.2044219970703125, -1.161773681640625, -1.1191253662109375, -1.07647705078125, -1.0338287353515625, -0.991180419921875, -0.9485321044921875, -0.9058837890625, -0.8632354736328125, -0.820587158203125, -0.7779388427734375, -0.73529052734375, -0.6926422119140625, -0.649993896484375, -0.6073455810546875, -0.564697265625, -0.5220489501953125, -0.479400634765625, -0.4367523193359375, -0.39410400390625, -0.3514556884765625, -0.308807373046875, -0.2661590576171875, -0.2235107421875, -0.1808624267578125, -0.138214111328125, -0.0955657958984375, -0.05291748046875, -0.0102691650390625, 0.032379150390625, 0.0750274658203125, 0.11767578125, 0.1603240966796875, 0.202972412109375, 0.2456207275390625, 0.28826904296875, 0.3309173583984375, 0.373565673828125, 0.4162139892578125, 0.4588623046875, 0.5015106201171875, 0.544158935546875, 0.5868072509765625, 0.62945556640625, 0.6721038818359375, 0.714752197265625, 0.7574005126953125, 0.800048828125, 0.8426971435546875, 0.885345458984375, 0.9279937744140625, 0.97064208984375, 1.0132904052734375, 1.055938720703125, 1.0985870361328125, 1.1412353515625, 1.1838836669921875, 1.226531982421875, 1.2691802978515625, 1.31182861328125, 1.3544769287109375, 1.397125244140625, 1.4397735595703125, 1.482421875]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 9.0, 6.0, 9.0, 7.0, 16.0, 21.0, 23.0, 30.0, 44.0, 39.0, 43.0, 49.0, 43.0, 54.0, 60.0, 47.0, 68.0, 59.0, 47.0, 48.0, 48.0, 46.0, 30.0, 25.0, 23.0, 16.0, 24.0, 6.0, 11.0, 16.0, 7.0, 8.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.07490348815918, -8.797059059143066, -8.519214630126953, -8.24137020111084, -7.963525772094727, -7.685681343078613, -7.407836437225342, -7.1299920082092285, -6.852147579193115, -6.574303150177002, -6.296458721160889, -6.018614292144775, -5.740769386291504, -5.462924957275391, -5.185080528259277, -4.907236099243164, -4.629391670227051, -4.3515472412109375, -4.073702812194824, -3.795858144760132, -3.5180137157440186, -3.2401692867279053, -2.962324619293213, -2.6844801902770996, -2.4066357612609863, -2.128791332244873, -1.8509467840194702, -1.5731022357940674, -1.295257806777954, -1.0174133777618408, -0.739568829536438, -0.46172428131103516, -0.18388080596923828, 0.09396368265151978, 0.37180817127227783, 0.6496526598930359, 0.927497148513794, 1.2053415775299072, 1.48318612575531, 1.761030673980713, 2.038875102996826, 2.3167195320129395, 2.5945639610290527, 2.872408628463745, 3.1502530574798584, 3.4280974864959717, 3.705942153930664, 3.9837865829467773, 4.261631011962891, 4.539475440979004, 4.817319869995117, 5.0951642990112305, 5.373008728027344, 5.650853157043457, 5.9286980628967285, 6.206542491912842, 6.484386920928955, 6.762231349945068, 7.040075778961182, 7.317920207977295, 7.595765113830566, 7.87360954284668, 8.151453971862793, 8.429298400878906, 8.70714282989502]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 10.0, 7.0, 9.0, 14.0, 16.0, 9.0, 20.0, 21.0, 17.0, 21.0, 29.0, 24.0, 25.0, 28.0, 35.0, 34.0, 37.0, 31.0, 33.0, 44.0, 43.0, 45.0, 40.0, 37.0, 40.0, 31.0, 22.0, 35.0, 27.0, 38.0, 32.0, 22.0, 18.0, 21.0, 16.0, 14.0, 12.0, 8.0, 7.0, 9.0, 3.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.588812828063965, -6.406785011291504, -6.224756717681885, -6.042728900909424, -5.860701084136963, -5.678673267364502, -5.496644973754883, -5.314617156982422, -5.132589340209961, -4.9505615234375, -4.768533229827881, -4.58650541305542, -4.404477596282959, -4.222449779510498, -4.040421485900879, -3.858393669128418, -3.676365613937378, -3.494337558746338, -3.312309741973877, -3.130281686782837, -2.948253870010376, -2.766225814819336, -2.584197998046875, -2.402169942855835, -2.220141887664795, -2.038113832473755, -1.856086015701294, -1.674057960510254, -1.492030143737793, -1.310002088546753, -1.1279741525650024, -0.945946216583252, -0.763918399810791, -0.5818904638290405, -0.39986249804496765, -0.21783453226089478, -0.03580659627914429, 0.1462213397026062, 0.32824933528900146, 0.510277271270752, 0.6923052072525024, 0.8743331432342529, 1.0563610792160034, 1.238389015197754, 1.420417070388794, 1.6024448871612549, 1.784472942352295, 1.9665008783340454, 2.148528814315796, 2.330556869506836, 2.512584686279297, 2.694612741470337, 2.876640558242798, 3.058668613433838, 3.240696430206299, 3.422724485397339, 3.604752540588379, 3.786780595779419, 3.96880841255188, 4.15083646774292, 4.332864284515381, 4.514892101287842, 4.696920394897461, 4.878948211669922, 5.060976028442383]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 11.0, 10.0, 28.0, 28.0, 44.0, 58.0, 88.0, 131.0, 199.0, 327.0, 475.0, 759.0, 1116.0, 1873.0, 3093.0, 5478.0, 9362.0, 16935.0, 32273.0, 64017.0, 134403.0, 302214.0, 670881.0, 1087862.0, 948878.0, 491293.0, 217082.0, 99008.0, 48071.0, 25054.0, 13826.0, 7592.0, 4525.0, 2606.0, 1732.0, 958.0, 703.0, 411.0, 281.0, 199.0, 113.0, 74.0, 60.0, 44.0, 37.0, 23.0, 9.0, 14.0, 6.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.0859375, -6.84814453125, -6.6103515625, -6.37255859375, -6.134765625, -5.89697265625, -5.6591796875, -5.42138671875, -5.18359375, -4.94580078125, -4.7080078125, -4.47021484375, -4.232421875, -3.99462890625, -3.7568359375, -3.51904296875, -3.28125, -3.04345703125, -2.8056640625, -2.56787109375, -2.330078125, -2.09228515625, -1.8544921875, -1.61669921875, -1.37890625, -1.14111328125, -0.9033203125, -0.66552734375, -0.427734375, -0.18994140625, 0.0478515625, 0.28564453125, 0.5234375, 0.76123046875, 0.9990234375, 1.23681640625, 1.474609375, 1.71240234375, 1.9501953125, 2.18798828125, 2.42578125, 2.66357421875, 2.9013671875, 3.13916015625, 3.376953125, 3.61474609375, 3.8525390625, 4.09033203125, 4.328125, 4.56591796875, 4.8037109375, 5.04150390625, 5.279296875, 5.51708984375, 5.7548828125, 5.99267578125, 6.23046875, 6.46826171875, 6.7060546875, 6.94384765625, 7.181640625, 7.41943359375, 7.6572265625, 7.89501953125, 8.1328125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 7.0, 10.0, 13.0, 22.0, 21.0, 18.0, 18.0, 29.0, 35.0, 28.0, 27.0, 29.0, 28.0, 30.0, 42.0, 36.0, 41.0, 45.0, 52.0, 44.0, 49.0, 42.0, 35.0, 37.0, 29.0, 37.0, 24.0, 25.0, 26.0, 18.0, 20.0, 18.0, 13.0, 11.0, 10.0, 6.0, 7.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.25, -5.1103515625, -4.970703125, -4.8310546875, -4.69140625, -4.5517578125, -4.412109375, -4.2724609375, -4.1328125, -3.9931640625, -3.853515625, -3.7138671875, -3.57421875, -3.4345703125, -3.294921875, -3.1552734375, -3.015625, -2.8759765625, -2.736328125, -2.5966796875, -2.45703125, -2.3173828125, -2.177734375, -2.0380859375, -1.8984375, -1.7587890625, -1.619140625, -1.4794921875, -1.33984375, -1.2001953125, -1.060546875, -0.9208984375, -0.78125, -0.6416015625, -0.501953125, -0.3623046875, -0.22265625, -0.0830078125, 0.056640625, 0.1962890625, 0.3359375, 0.4755859375, 0.615234375, 0.7548828125, 0.89453125, 1.0341796875, 1.173828125, 1.3134765625, 1.453125, 1.5927734375, 1.732421875, 1.8720703125, 2.01171875, 2.1513671875, 2.291015625, 2.4306640625, 2.5703125, 2.7099609375, 2.849609375, 2.9892578125, 3.12890625, 3.2685546875, 3.408203125, 3.5478515625, 3.6875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 9.0, 9.0, 11.0, 17.0, 29.0, 51.0, 74.0, 95.0, 152.0, 245.0, 389.0, 510.0, 863.0, 1312.0, 1935.0, 3159.0, 5055.0, 8305.0, 14021.0, 24441.0, 42661.0, 77885.0, 148480.0, 283034.0, 532400.0, 872063.0, 912395.0, 586691.0, 313271.0, 163557.0, 87140.0, 47479.0, 26838.0, 15453.0, 9264.0, 5648.0, 3334.0, 2195.0, 1335.0, 888.0, 509.0, 350.0, 246.0, 164.0, 92.0, 83.0, 44.0, 33.0, 21.0, 17.0, 9.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0], "bins": [-7.2265625, -7.00811767578125, -6.7896728515625, -6.57122802734375, -6.352783203125, -6.13433837890625, -5.9158935546875, -5.69744873046875, -5.47900390625, -5.26055908203125, -5.0421142578125, -4.82366943359375, -4.605224609375, -4.38677978515625, -4.1683349609375, -3.94989013671875, -3.7314453125, -3.51300048828125, -3.2945556640625, -3.07611083984375, -2.857666015625, -2.63922119140625, -2.4207763671875, -2.20233154296875, -1.98388671875, -1.76544189453125, -1.5469970703125, -1.32855224609375, -1.110107421875, -0.89166259765625, -0.6732177734375, -0.45477294921875, -0.236328125, -0.01788330078125, 0.2005615234375, 0.41900634765625, 0.637451171875, 0.85589599609375, 1.0743408203125, 1.29278564453125, 1.51123046875, 1.72967529296875, 1.9481201171875, 2.16656494140625, 2.385009765625, 2.60345458984375, 2.8218994140625, 3.04034423828125, 3.2587890625, 3.47723388671875, 3.6956787109375, 3.91412353515625, 4.132568359375, 4.35101318359375, 4.5694580078125, 4.78790283203125, 5.00634765625, 5.22479248046875, 5.4432373046875, 5.66168212890625, 5.880126953125, 6.09857177734375, 6.3170166015625, 6.53546142578125, 6.75390625]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 10.0, 6.0, 3.0, 15.0, 23.0, 23.0, 24.0, 36.0, 48.0, 55.0, 63.0, 89.0, 112.0, 131.0, 166.0, 174.0, 203.0, 245.0, 284.0, 258.0, 290.0, 269.0, 253.0, 198.0, 186.0, 145.0, 142.0, 118.0, 74.0, 92.0, 68.0, 60.0, 41.0, 31.0, 27.0, 30.0, 15.0, 16.0, 6.0, 11.0, 11.0, 3.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.076171875, -2.004486083984375, -1.93280029296875, -1.861114501953125, -1.7894287109375, -1.717742919921875, -1.64605712890625, -1.574371337890625, -1.502685546875, -1.430999755859375, -1.35931396484375, -1.287628173828125, -1.2159423828125, -1.144256591796875, -1.07257080078125, -1.000885009765625, -0.92919921875, -0.857513427734375, -0.78582763671875, -0.714141845703125, -0.6424560546875, -0.570770263671875, -0.49908447265625, -0.427398681640625, -0.355712890625, -0.284027099609375, -0.21234130859375, -0.140655517578125, -0.0689697265625, 0.002716064453125, 0.07440185546875, 0.146087646484375, 0.2177734375, 0.289459228515625, 0.36114501953125, 0.432830810546875, 0.5045166015625, 0.576202392578125, 0.64788818359375, 0.719573974609375, 0.791259765625, 0.862945556640625, 0.93463134765625, 1.006317138671875, 1.0780029296875, 1.149688720703125, 1.22137451171875, 1.293060302734375, 1.36474609375, 1.436431884765625, 1.50811767578125, 1.579803466796875, 1.6514892578125, 1.723175048828125, 1.79486083984375, 1.866546630859375, 1.938232421875, 2.009918212890625, 2.08160400390625, 2.153289794921875, 2.2249755859375, 2.296661376953125, 2.36834716796875, 2.440032958984375, 2.51171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 8.0, 10.0, 13.0, 14.0, 26.0, 28.0, 22.0, 37.0, 39.0, 36.0, 46.0, 58.0, 60.0, 62.0, 77.0, 56.0, 52.0, 51.0, 54.0, 59.0, 32.0, 29.0, 26.0, 18.0, 17.0, 7.0, 12.0, 7.0, 11.0, 3.0, 1.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.877823829650879, -8.616966247558594, -8.356109619140625, -8.09525203704834, -7.834394454956055, -7.573537349700928, -7.312680244445801, -7.051822662353516, -6.790965557098389, -6.530108451843262, -6.269250869750977, -6.00839376449585, -5.747536659240723, -5.4866790771484375, -5.2258219718933105, -4.964964866638184, -4.704107284545898, -4.4432501792907715, -4.182392597198486, -3.9215354919433594, -3.6606781482696533, -3.3998208045959473, -3.1389636993408203, -2.8781063556671143, -2.617249011993408, -2.356391668319702, -2.095534324645996, -1.8346772193908691, -1.573819875717163, -1.312962532043457, -1.0521053075790405, -0.791248083114624, -0.5303916931152344, -0.2695344090461731, -0.008677124977111816, 0.25218015909194946, 0.5130374431610107, 0.7738947868347168, 1.0347520112991333, 1.2956092357635498, 1.5564665794372559, 1.817323923110962, 2.078181266784668, 2.339038372039795, 2.599895715713501, 2.860753059387207, 3.121610164642334, 3.38246750831604, 3.643324851989746, 3.904182195663452, 4.165039539337158, 4.425896644592285, 4.68675422668457, 4.947611331939697, 5.208468437194824, 5.469326019287109, 5.730183124542236, 5.991040229797363, 6.251897811889648, 6.512754917144775, 6.773612022399902, 7.0344696044921875, 7.2953267097473145, 7.556183815002441, 7.817041397094727]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 4.0, 16.0, 23.0, 15.0, 27.0, 18.0, 34.0, 25.0, 24.0, 28.0, 52.0, 43.0, 27.0, 39.0, 48.0, 49.0, 45.0, 47.0, 41.0, 50.0, 34.0, 25.0, 36.0, 43.0, 33.0, 26.0, 25.0, 23.0, 21.0, 20.0, 18.0, 6.0, 9.0, 4.0, 6.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0543532371521, -5.8705925941467285, -5.686831951141357, -5.503071308135986, -5.319310665130615, -5.135549545288086, -4.951788902282715, -4.768028259277344, -4.584267616271973, -4.400506973266602, -4.2167463302612305, -4.032985687255859, -3.849224805831909, -3.665464162826538, -3.481703519821167, -3.297942638397217, -3.114182233810425, -2.9304215908050537, -2.7466609477996826, -2.5629000663757324, -2.3791394233703613, -2.1953787803649902, -2.011618137359619, -1.8278573751449585, -1.6440967321395874, -1.4603360891342163, -1.2765753269195557, -1.0928146839141846, -0.9090539813041687, -0.7252932786941528, -0.5415326356887817, -0.3577718734741211, -0.17401123046875, 0.009749457240104675, 0.19351014494895935, 0.37727081775665283, 0.5610315203666687, 0.7447922229766846, 0.9285528659820557, 1.1123136281967163, 1.2960742712020874, 1.4798349142074585, 1.6635956764221191, 1.8473563194274902, 2.0311169624328613, 2.2148776054382324, 2.3986382484436035, 2.5823991298675537, 2.766159772872925, 2.949920415878296, 3.133681058883667, 3.317441940307617, 3.5012025833129883, 3.6849632263183594, 3.8687238693237305, 4.052484512329102, 4.236245155334473, 4.420005798339844, 4.603766441345215, 4.787527084350586, 4.971287727355957, 5.155048370361328, 5.338809013366699, 5.5225701332092285, 5.7063307762146]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 20.0, 33.0, 49.0, 64.0, 125.0, 181.0, 265.0, 397.0, 711.0, 1108.0, 1772.0, 2823.0, 4639.0, 7949.0, 13946.0, 25404.0, 45720.0, 82470.0, 139336.0, 196834.0, 198004.0, 138956.0, 82526.0, 45506.0, 25271.0, 14100.0, 8101.0, 4631.0, 2867.0, 1748.0, 1106.0, 694.0, 404.0, 298.0, 187.0, 103.0, 54.0, 45.0, 37.0, 18.0, 11.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.46771240234375, -5.2791748046875, -5.09063720703125, -4.902099609375, -4.71356201171875, -4.5250244140625, -4.33648681640625, -4.14794921875, -3.95941162109375, -3.7708740234375, -3.58233642578125, -3.393798828125, -3.20526123046875, -3.0167236328125, -2.82818603515625, -2.6396484375, -2.45111083984375, -2.2625732421875, -2.07403564453125, -1.885498046875, -1.69696044921875, -1.5084228515625, -1.31988525390625, -1.13134765625, -0.94281005859375, -0.7542724609375, -0.56573486328125, -0.377197265625, -0.18865966796875, -0.0001220703125, 0.18841552734375, 0.376953125, 0.56549072265625, 0.7540283203125, 0.94256591796875, 1.131103515625, 1.31964111328125, 1.5081787109375, 1.69671630859375, 1.88525390625, 2.07379150390625, 2.2623291015625, 2.45086669921875, 2.639404296875, 2.82794189453125, 3.0164794921875, 3.20501708984375, 3.3935546875, 3.58209228515625, 3.7706298828125, 3.95916748046875, 4.147705078125, 4.33624267578125, 4.5247802734375, 4.71331787109375, 4.90185546875, 5.09039306640625, 5.2789306640625, 5.46746826171875, 5.656005859375, 5.84454345703125, 6.0330810546875, 6.22161865234375, 6.41015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 6.0, 19.0, 15.0, 13.0, 21.0, 20.0, 27.0, 22.0, 30.0, 39.0, 33.0, 41.0, 48.0, 31.0, 40.0, 38.0, 55.0, 57.0, 45.0, 49.0, 31.0, 33.0, 43.0, 35.0, 39.0, 26.0, 29.0, 30.0, 13.0, 15.0, 9.0, 11.0, 8.0, 3.0, 5.0, 4.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.57421875, -6.383544921875, -6.19287109375, -6.002197265625, -5.8115234375, -5.620849609375, -5.43017578125, -5.239501953125, -5.048828125, -4.858154296875, -4.66748046875, -4.476806640625, -4.2861328125, -4.095458984375, -3.90478515625, -3.714111328125, -3.5234375, -3.332763671875, -3.14208984375, -2.951416015625, -2.7607421875, -2.570068359375, -2.37939453125, -2.188720703125, -1.998046875, -1.807373046875, -1.61669921875, -1.426025390625, -1.2353515625, -1.044677734375, -0.85400390625, -0.663330078125, -0.47265625, -0.281982421875, -0.09130859375, 0.099365234375, 0.2900390625, 0.480712890625, 0.67138671875, 0.862060546875, 1.052734375, 1.243408203125, 1.43408203125, 1.624755859375, 1.8154296875, 2.006103515625, 2.19677734375, 2.387451171875, 2.578125, 2.768798828125, 2.95947265625, 3.150146484375, 3.3408203125, 3.531494140625, 3.72216796875, 3.912841796875, 4.103515625, 4.294189453125, 4.48486328125, 4.675537109375, 4.8662109375, 5.056884765625, 5.24755859375, 5.438232421875, 5.62890625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 9.0, 5.0, 10.0, 8.0, 6.0, 20.0, 25.0, 39.0, 75.0, 119.0, 166.0, 216.0, 304.0, 439.0, 690.0, 1248.0, 2101.0, 3735.0, 7246.0, 16155.0, 40665.0, 117668.0, 321090.0, 334313.0, 125415.0, 42990.0, 16925.0, 7448.0, 3802.0, 2140.0, 1287.0, 742.0, 475.0, 334.0, 197.0, 139.0, 110.0, 54.0, 53.0, 29.0, 25.0, 10.0, 10.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 6.0], "bins": [-14.671875, -14.275634765625, -13.87939453125, -13.483154296875, -13.0869140625, -12.690673828125, -12.29443359375, -11.898193359375, -11.501953125, -11.105712890625, -10.70947265625, -10.313232421875, -9.9169921875, -9.520751953125, -9.12451171875, -8.728271484375, -8.33203125, -7.935791015625, -7.53955078125, -7.143310546875, -6.7470703125, -6.350830078125, -5.95458984375, -5.558349609375, -5.162109375, -4.765869140625, -4.36962890625, -3.973388671875, -3.5771484375, -3.180908203125, -2.78466796875, -2.388427734375, -1.9921875, -1.595947265625, -1.19970703125, -0.803466796875, -0.4072265625, -0.010986328125, 0.38525390625, 0.781494140625, 1.177734375, 1.573974609375, 1.97021484375, 2.366455078125, 2.7626953125, 3.158935546875, 3.55517578125, 3.951416015625, 4.34765625, 4.743896484375, 5.14013671875, 5.536376953125, 5.9326171875, 6.328857421875, 6.72509765625, 7.121337890625, 7.517578125, 7.913818359375, 8.31005859375, 8.706298828125, 9.1025390625, 9.498779296875, 9.89501953125, 10.291259765625, 10.6875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 7.0, 8.0, 5.0, 1.0, 10.0, 11.0, 8.0, 14.0, 17.0, 14.0, 24.0, 24.0, 18.0, 20.0, 30.0, 36.0, 26.0, 23.0, 49.0, 43.0, 39.0, 40.0, 49.0, 44.0, 33.0, 34.0, 39.0, 34.0, 29.0, 33.0, 29.0, 36.0, 19.0, 20.0, 33.0, 16.0, 11.0, 12.0, 16.0, 14.0, 3.0, 14.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.078125, -2.975860595703125, -2.87359619140625, -2.771331787109375, -2.6690673828125, -2.566802978515625, -2.46453857421875, -2.362274169921875, -2.260009765625, -2.157745361328125, -2.05548095703125, -1.953216552734375, -1.8509521484375, -1.748687744140625, -1.64642333984375, -1.544158935546875, -1.44189453125, -1.339630126953125, -1.23736572265625, -1.135101318359375, -1.0328369140625, -0.930572509765625, -0.82830810546875, -0.726043701171875, -0.623779296875, -0.521514892578125, -0.41925048828125, -0.316986083984375, -0.2147216796875, -0.112457275390625, -0.01019287109375, 0.092071533203125, 0.1943359375, 0.296600341796875, 0.39886474609375, 0.501129150390625, 0.6033935546875, 0.705657958984375, 0.80792236328125, 0.910186767578125, 1.012451171875, 1.114715576171875, 1.21697998046875, 1.319244384765625, 1.4215087890625, 1.523773193359375, 1.62603759765625, 1.728302001953125, 1.83056640625, 1.932830810546875, 2.03509521484375, 2.137359619140625, 2.2396240234375, 2.341888427734375, 2.44415283203125, 2.546417236328125, 2.648681640625, 2.750946044921875, 2.85321044921875, 2.955474853515625, 3.0577392578125, 3.160003662109375, 3.26226806640625, 3.364532470703125, 3.466796875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 9.0, 12.0, 22.0, 18.0, 31.0, 39.0, 52.0, 83.0, 120.0, 166.0, 243.0, 353.0, 550.0, 778.0, 1214.0, 1832.0, 3088.0, 5477.0, 10249.0, 20416.0, 44948.0, 108145.0, 251242.0, 314920.0, 159045.0, 65327.0, 28787.0, 13607.0, 7023.0, 3898.0, 2321.0, 1486.0, 964.0, 652.0, 446.0, 301.0, 175.0, 162.0, 109.0, 71.0, 46.0, 38.0, 24.0, 21.0, 19.0, 8.0, 4.0, 8.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.40234375, -4.25164794921875, -4.1009521484375, -3.95025634765625, -3.799560546875, -3.64886474609375, -3.4981689453125, -3.34747314453125, -3.19677734375, -3.04608154296875, -2.8953857421875, -2.74468994140625, -2.593994140625, -2.44329833984375, -2.2926025390625, -2.14190673828125, -1.9912109375, -1.84051513671875, -1.6898193359375, -1.53912353515625, -1.388427734375, -1.23773193359375, -1.0870361328125, -0.93634033203125, -0.78564453125, -0.63494873046875, -0.4842529296875, -0.33355712890625, -0.182861328125, -0.03216552734375, 0.1185302734375, 0.26922607421875, 0.419921875, 0.57061767578125, 0.7213134765625, 0.87200927734375, 1.022705078125, 1.17340087890625, 1.3240966796875, 1.47479248046875, 1.62548828125, 1.77618408203125, 1.9268798828125, 2.07757568359375, 2.228271484375, 2.37896728515625, 2.5296630859375, 2.68035888671875, 2.8310546875, 2.98175048828125, 3.1324462890625, 3.28314208984375, 3.433837890625, 3.58453369140625, 3.7352294921875, 3.88592529296875, 4.03662109375, 4.18731689453125, 4.3380126953125, 4.48870849609375, 4.639404296875, 4.79010009765625, 4.9407958984375, 5.09149169921875, 5.2421875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 3.0, 6.0, 5.0, 4.0, 3.0, 9.0, 12.0, 15.0, 21.0, 27.0, 31.0, 52.0, 52.0, 76.0, 107.0, 108.0, 82.0, 79.0, 85.0, 50.0, 37.0, 26.0, 20.0, 20.0, 12.0, 17.0, 7.0, 5.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00021123886108398438, -0.00020439550280570984, -0.0001975521445274353, -0.00019070878624916077, -0.00018386542797088623, -0.0001770220696926117, -0.00017017871141433716, -0.00016333535313606262, -0.00015649199485778809, -0.00014964863657951355, -0.00014280527830123901, -0.00013596192002296448, -0.00012911856174468994, -0.0001222752034664154, -0.00011543184518814087, -0.00010858848690986633, -0.0001017451286315918, -9.490177035331726e-05, -8.805841207504272e-05, -8.121505379676819e-05, -7.437169551849365e-05, -6.752833724021912e-05, -6.068497896194458e-05, -5.3841620683670044e-05, -4.699826240539551e-05, -4.015490412712097e-05, -3.3311545848846436e-05, -2.64681875705719e-05, -1.9624829292297363e-05, -1.2781471014022827e-05, -5.938112735748291e-06, 9.052455425262451e-07, 7.748603820800781e-06, 1.4591962099075317e-05, 2.1435320377349854e-05, 2.827867865562439e-05, 3.5122036933898926e-05, 4.196539521217346e-05, 4.8808753490448e-05, 5.5652111768722534e-05, 6.249547004699707e-05, 6.93388283252716e-05, 7.618218660354614e-05, 8.302554488182068e-05, 8.986890316009521e-05, 9.671226143836975e-05, 0.00010355561971664429, 0.00011039897799491882, 0.00011724233627319336, 0.0001240856945514679, 0.00013092905282974243, 0.00013777241110801697, 0.0001446157693862915, 0.00015145912766456604, 0.00015830248594284058, 0.0001651458442211151, 0.00017198920249938965, 0.00017883256077766418, 0.00018567591905593872, 0.00019251927733421326, 0.0001993626356124878, 0.00020620599389076233, 0.00021304935216903687, 0.0002198927104473114, 0.00022673606872558594]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 8.0, 14.0, 16.0, 26.0, 39.0, 55.0, 77.0, 121.0, 137.0, 189.0, 273.0, 381.0, 510.0, 791.0, 1154.0, 1839.0, 3002.0, 5303.0, 9803.0, 19258.0, 39282.0, 80546.0, 157793.0, 239988.0, 222065.0, 131941.0, 65472.0, 32300.0, 15906.0, 8113.0, 4497.0, 2675.0, 1555.0, 1059.0, 672.0, 513.0, 350.0, 214.0, 159.0, 125.0, 94.0, 66.0, 58.0, 38.0, 24.0, 23.0, 10.0, 4.0, 2.0, 6.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.716796875, -3.600128173828125, -3.48345947265625, -3.366790771484375, -3.2501220703125, -3.133453369140625, -3.01678466796875, -2.900115966796875, -2.783447265625, -2.666778564453125, -2.55010986328125, -2.433441162109375, -2.3167724609375, -2.200103759765625, -2.08343505859375, -1.966766357421875, -1.85009765625, -1.733428955078125, -1.61676025390625, -1.500091552734375, -1.3834228515625, -1.266754150390625, -1.15008544921875, -1.033416748046875, -0.916748046875, -0.800079345703125, -0.68341064453125, -0.566741943359375, -0.4500732421875, -0.333404541015625, -0.21673583984375, -0.100067138671875, 0.0166015625, 0.133270263671875, 0.24993896484375, 0.366607666015625, 0.4832763671875, 0.599945068359375, 0.71661376953125, 0.833282470703125, 0.949951171875, 1.066619873046875, 1.18328857421875, 1.299957275390625, 1.4166259765625, 1.533294677734375, 1.64996337890625, 1.766632080078125, 1.88330078125, 1.999969482421875, 2.11663818359375, 2.233306884765625, 2.3499755859375, 2.466644287109375, 2.58331298828125, 2.699981689453125, 2.816650390625, 2.933319091796875, 3.04998779296875, 3.166656494140625, 3.2833251953125, 3.399993896484375, 3.51666259765625, 3.633331298828125, 3.75]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 15.0, 28.0, 28.0, 34.0, 57.0, 68.0, 89.0, 79.0, 96.0, 89.0, 91.0, 78.0, 65.0, 49.0, 24.0, 20.0, 16.0, 17.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.273468017578125, -1.22760009765625, -1.181732177734375, -1.1358642578125, -1.089996337890625, -1.04412841796875, -0.998260498046875, -0.952392578125, -0.906524658203125, -0.86065673828125, -0.814788818359375, -0.7689208984375, -0.723052978515625, -0.67718505859375, -0.631317138671875, -0.58544921875, -0.539581298828125, -0.49371337890625, -0.447845458984375, -0.4019775390625, -0.356109619140625, -0.31024169921875, -0.264373779296875, -0.218505859375, -0.172637939453125, -0.12677001953125, -0.080902099609375, -0.0350341796875, 0.010833740234375, 0.05670166015625, 0.102569580078125, 0.1484375, 0.194305419921875, 0.24017333984375, 0.286041259765625, 0.3319091796875, 0.377777099609375, 0.42364501953125, 0.469512939453125, 0.515380859375, 0.561248779296875, 0.60711669921875, 0.652984619140625, 0.6988525390625, 0.744720458984375, 0.79058837890625, 0.836456298828125, 0.88232421875, 0.928192138671875, 0.97406005859375, 1.019927978515625, 1.0657958984375, 1.111663818359375, 1.15753173828125, 1.203399658203125, 1.249267578125, 1.295135498046875, 1.34100341796875, 1.386871337890625, 1.4327392578125, 1.478607177734375, 1.52447509765625, 1.570343017578125, 1.6162109375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 2.0, 4.0, 6.0, 9.0, 9.0, 11.0, 18.0, 27.0, 23.0, 31.0, 36.0, 33.0, 44.0, 36.0, 48.0, 64.0, 50.0, 57.0, 59.0, 58.0, 55.0, 54.0, 55.0, 39.0, 35.0, 19.0, 25.0, 17.0, 20.0, 9.0, 4.0, 7.0, 6.0, 3.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.542803764343262, -8.300796508789062, -8.058789253234863, -7.816781997680664, -7.574775218963623, -7.332767963409424, -7.090760707855225, -6.848753452301025, -6.606746673583984, -6.364739418029785, -6.122732162475586, -5.880724906921387, -5.638718128204346, -5.3967108726501465, -5.154703617095947, -4.912696361541748, -4.670689105987549, -4.42868185043335, -4.18667459487915, -3.9446675777435303, -3.70266056060791, -3.460653305053711, -3.2186460494995117, -2.9766387939453125, -2.7346317768096924, -2.492624521255493, -2.250617504119873, -2.008610248565674, -1.7666031122207642, -1.5245959758758545, -1.2825887203216553, -1.0405815839767456, -0.7985744476318359, -0.5565673112869263, -0.3145601153373718, -0.07255291938781738, 0.16945421695709229, 0.41146135330200195, 0.6534686088562012, 0.8954757452011108, 1.1374828815460205, 1.3794900178909302, 1.6214971542358398, 1.863504409790039, 2.1055116653442383, 2.3475186824798584, 2.5895259380340576, 2.8315329551696777, 3.073540210723877, 3.315547466278076, 3.5575544834136963, 3.7995617389678955, 4.041568756103516, 4.283576011657715, 4.525583267211914, 4.767590522766113, 5.0095977783203125, 5.251605033874512, 5.493612289428711, 5.73561954498291, 5.977626323699951, 6.21963357925415, 6.46164083480835, 6.703648090362549, 6.94565486907959]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 6.0, 2.0, 12.0, 14.0, 13.0, 23.0, 24.0, 15.0, 21.0, 27.0, 35.0, 36.0, 48.0, 46.0, 30.0, 46.0, 40.0, 44.0, 51.0, 42.0, 42.0, 50.0, 40.0, 33.0, 33.0, 34.0, 42.0, 27.0, 25.0, 21.0, 21.0, 19.0, 10.0, 13.0, 4.0, 10.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.362408638000488, -6.176389694213867, -5.990370750427246, -5.804351329803467, -5.618332386016846, -5.432313442230225, -5.246294021606445, -5.060275077819824, -4.874256134033203, -4.688237190246582, -4.502218246459961, -4.316198825836182, -4.1301798820495605, -3.9441609382629395, -3.7581417560577393, -3.572122573852539, -3.386103630065918, -3.200084686279297, -3.0140655040740967, -2.8280463218688965, -2.6420273780822754, -2.4560084342956543, -2.269989252090454, -2.083970069885254, -1.8979511260986328, -1.7119320631027222, -1.5259130001068115, -1.3398939371109009, -1.1538748741149902, -0.9678558111190796, -0.781836748123169, -0.5958176851272583, -0.40979814529418945, -0.2237790822982788, -0.037760019302368164, 0.14825904369354248, 0.3342781066894531, 0.5202971696853638, 0.7063162326812744, 0.8923352956771851, 1.0783543586730957, 1.2643734216690063, 1.450392484664917, 1.6364115476608276, 1.8224306106567383, 2.0084495544433594, 2.1944687366485596, 2.3804879188537598, 2.566506862640381, 2.752525806427002, 2.938544988632202, 3.1245641708374023, 3.3105831146240234, 3.4966020584106445, 3.6826212406158447, 3.868640422821045, 4.054659366607666, 4.240678310394287, 4.426697731018066, 4.6127166748046875, 4.798735618591309, 4.98475456237793, 5.170773506164551, 5.35679292678833, 5.542811870574951]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 33.0, 23.0, 52.0, 63.0, 108.0, 171.0, 240.0, 351.0, 504.0, 773.0, 1137.0, 1739.0, 2636.0, 3811.0, 5749.0, 8495.0, 12951.0, 19145.0, 28693.0, 41784.0, 61204.0, 85475.0, 111089.0, 129060.0, 130268.0, 113878.0, 89052.0, 64185.0, 44784.0, 30051.0, 20370.0, 13386.0, 8973.0, 6032.0, 3997.0, 2783.0, 1815.0, 1185.0, 778.0, 587.0, 392.0, 252.0, 154.0, 87.0, 81.0, 51.0, 36.0, 24.0, 18.0, 10.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.70703125, -4.56024169921875, -4.4134521484375, -4.26666259765625, -4.119873046875, -3.97308349609375, -3.8262939453125, -3.67950439453125, -3.53271484375, -3.38592529296875, -3.2391357421875, -3.09234619140625, -2.945556640625, -2.79876708984375, -2.6519775390625, -2.50518798828125, -2.3583984375, -2.21160888671875, -2.0648193359375, -1.91802978515625, -1.771240234375, -1.62445068359375, -1.4776611328125, -1.33087158203125, -1.18408203125, -1.03729248046875, -0.8905029296875, -0.74371337890625, -0.596923828125, -0.45013427734375, -0.3033447265625, -0.15655517578125, -0.009765625, 0.13702392578125, 0.2838134765625, 0.43060302734375, 0.577392578125, 0.72418212890625, 0.8709716796875, 1.01776123046875, 1.16455078125, 1.31134033203125, 1.4581298828125, 1.60491943359375, 1.751708984375, 1.89849853515625, 2.0452880859375, 2.19207763671875, 2.3388671875, 2.48565673828125, 2.6324462890625, 2.77923583984375, 2.926025390625, 3.07281494140625, 3.2196044921875, 3.36639404296875, 3.51318359375, 3.65997314453125, 3.8067626953125, 3.95355224609375, 4.100341796875, 4.24713134765625, 4.3939208984375, 4.54071044921875, 4.6875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 5.0, 9.0, 6.0, 13.0, 18.0, 16.0, 19.0, 21.0, 23.0, 24.0, 37.0, 37.0, 31.0, 32.0, 29.0, 43.0, 36.0, 38.0, 29.0, 48.0, 46.0, 38.0, 42.0, 32.0, 37.0, 33.0, 27.0, 36.0, 30.0, 21.0, 23.0, 22.0, 20.0, 22.0, 15.0, 8.0, 8.0, 3.0, 4.0, 2.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.246337890625, -5.08251953125, -4.918701171875, -4.7548828125, -4.591064453125, -4.42724609375, -4.263427734375, -4.099609375, -3.935791015625, -3.77197265625, -3.608154296875, -3.4443359375, -3.280517578125, -3.11669921875, -2.952880859375, -2.7890625, -2.625244140625, -2.46142578125, -2.297607421875, -2.1337890625, -1.969970703125, -1.80615234375, -1.642333984375, -1.478515625, -1.314697265625, -1.15087890625, -0.987060546875, -0.8232421875, -0.659423828125, -0.49560546875, -0.331787109375, -0.16796875, -0.004150390625, 0.15966796875, 0.323486328125, 0.4873046875, 0.651123046875, 0.81494140625, 0.978759765625, 1.142578125, 1.306396484375, 1.47021484375, 1.634033203125, 1.7978515625, 1.961669921875, 2.12548828125, 2.289306640625, 2.453125, 2.616943359375, 2.78076171875, 2.944580078125, 3.1083984375, 3.272216796875, 3.43603515625, 3.599853515625, 3.763671875, 3.927490234375, 4.09130859375, 4.255126953125, 4.4189453125, 4.582763671875, 4.74658203125, 4.910400390625, 5.07421875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 10.0, 24.0, 23.0, 34.0, 56.0, 79.0, 112.0, 231.0, 323.0, 541.0, 774.0, 1275.0, 1922.0, 3071.0, 4830.0, 7625.0, 12061.0, 19416.0, 30418.0, 47458.0, 71044.0, 101230.0, 130792.0, 146831.0, 136164.0, 108627.0, 78080.0, 52448.0, 34441.0, 21511.0, 13474.0, 8681.0, 5512.0, 3350.0, 2238.0, 1410.0, 886.0, 565.0, 354.0, 213.0, 149.0, 103.0, 73.0, 32.0, 24.0, 12.0, 14.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.578125, -4.433349609375, -4.28857421875, -4.143798828125, -3.9990234375, -3.854248046875, -3.70947265625, -3.564697265625, -3.419921875, -3.275146484375, -3.13037109375, -2.985595703125, -2.8408203125, -2.696044921875, -2.55126953125, -2.406494140625, -2.26171875, -2.116943359375, -1.97216796875, -1.827392578125, -1.6826171875, -1.537841796875, -1.39306640625, -1.248291015625, -1.103515625, -0.958740234375, -0.81396484375, -0.669189453125, -0.5244140625, -0.379638671875, -0.23486328125, -0.090087890625, 0.0546875, 0.199462890625, 0.34423828125, 0.489013671875, 0.6337890625, 0.778564453125, 0.92333984375, 1.068115234375, 1.212890625, 1.357666015625, 1.50244140625, 1.647216796875, 1.7919921875, 1.936767578125, 2.08154296875, 2.226318359375, 2.37109375, 2.515869140625, 2.66064453125, 2.805419921875, 2.9501953125, 3.094970703125, 3.23974609375, 3.384521484375, 3.529296875, 3.674072265625, 3.81884765625, 3.963623046875, 4.1083984375, 4.253173828125, 4.39794921875, 4.542724609375, 4.6875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 8.0, 10.0, 12.0, 8.0, 15.0, 18.0, 18.0, 28.0, 18.0, 27.0, 33.0, 42.0, 37.0, 36.0, 61.0, 45.0, 48.0, 35.0, 43.0, 55.0, 33.0, 45.0, 28.0, 32.0, 39.0, 37.0, 18.0, 27.0, 21.0, 14.0, 17.0, 14.0, 13.0, 14.0, 9.0, 8.0, 7.0, 2.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.703125, -3.591094970703125, -3.47906494140625, -3.367034912109375, -3.2550048828125, -3.142974853515625, -3.03094482421875, -2.918914794921875, -2.806884765625, -2.694854736328125, -2.58282470703125, -2.470794677734375, -2.3587646484375, -2.246734619140625, -2.13470458984375, -2.022674560546875, -1.91064453125, -1.798614501953125, -1.68658447265625, -1.574554443359375, -1.4625244140625, -1.350494384765625, -1.23846435546875, -1.126434326171875, -1.014404296875, -0.902374267578125, -0.79034423828125, -0.678314208984375, -0.5662841796875, -0.454254150390625, -0.34222412109375, -0.230194091796875, -0.1181640625, -0.006134033203125, 0.10589599609375, 0.217926025390625, 0.3299560546875, 0.441986083984375, 0.55401611328125, 0.666046142578125, 0.778076171875, 0.890106201171875, 1.00213623046875, 1.114166259765625, 1.2261962890625, 1.338226318359375, 1.45025634765625, 1.562286376953125, 1.67431640625, 1.786346435546875, 1.89837646484375, 2.010406494140625, 2.1224365234375, 2.234466552734375, 2.34649658203125, 2.458526611328125, 2.570556640625, 2.682586669921875, 2.79461669921875, 2.906646728515625, 3.0186767578125, 3.130706787109375, 3.24273681640625, 3.354766845703125, 3.466796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 12.0, 5.0, 15.0, 22.0, 30.0, 41.0, 71.0, 93.0, 156.0, 220.0, 349.0, 522.0, 774.0, 1151.0, 1841.0, 2964.0, 4625.0, 7250.0, 11855.0, 19702.0, 32705.0, 54525.0, 89850.0, 138453.0, 179353.0, 172468.0, 126329.0, 79808.0, 48280.0, 28726.0, 17599.0, 10553.0, 6614.0, 4142.0, 2609.0, 1674.0, 1091.0, 683.0, 484.0, 321.0, 208.0, 116.0, 102.0, 58.0, 41.0, 36.0, 12.0, 8.0, 9.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.0078125, -3.88592529296875, -3.7640380859375, -3.64215087890625, -3.520263671875, -3.39837646484375, -3.2764892578125, -3.15460205078125, -3.03271484375, -2.91082763671875, -2.7889404296875, -2.66705322265625, -2.545166015625, -2.42327880859375, -2.3013916015625, -2.17950439453125, -2.0576171875, -1.93572998046875, -1.8138427734375, -1.69195556640625, -1.570068359375, -1.44818115234375, -1.3262939453125, -1.20440673828125, -1.08251953125, -0.96063232421875, -0.8387451171875, -0.71685791015625, -0.594970703125, -0.47308349609375, -0.3511962890625, -0.22930908203125, -0.107421875, 0.01446533203125, 0.1363525390625, 0.25823974609375, 0.380126953125, 0.50201416015625, 0.6239013671875, 0.74578857421875, 0.86767578125, 0.98956298828125, 1.1114501953125, 1.23333740234375, 1.355224609375, 1.47711181640625, 1.5989990234375, 1.72088623046875, 1.8427734375, 1.96466064453125, 2.0865478515625, 2.20843505859375, 2.330322265625, 2.45220947265625, 2.5740966796875, 2.69598388671875, 2.81787109375, 2.93975830078125, 3.0616455078125, 3.18353271484375, 3.305419921875, 3.42730712890625, 3.5491943359375, 3.67108154296875, 3.79296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 13.0, 27.0, 21.0, 33.0, 47.0, 57.0, 70.0, 79.0, 109.0, 87.0, 94.0, 84.0, 69.0, 37.0, 41.0, 26.0, 21.0, 14.0, 7.0, 6.0, 5.0, 8.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006833076477050781, -0.0006649717688560486, -0.000646635890007019, -0.0006283000111579895, -0.00060996413230896, -0.0005916282534599304, -0.0005732923746109009, -0.0005549564957618713, -0.0005366206169128418, -0.0005182847380638123, -0.0004999488592147827, -0.0004816129803657532, -0.00046327710151672363, -0.0004449412226676941, -0.00042660534381866455, -0.000408269464969635, -0.00038993358612060547, -0.00037159770727157593, -0.0003532618284225464, -0.00033492594957351685, -0.0003165900707244873, -0.00029825419187545776, -0.0002799183130264282, -0.0002615824341773987, -0.00024324655532836914, -0.0002249106764793396, -0.00020657479763031006, -0.00018823891878128052, -0.00016990303993225098, -0.00015156716108322144, -0.0001332312822341919, -0.00011489540338516235, -9.655952453613281e-05, -7.822364568710327e-05, -5.988776683807373e-05, -4.155188798904419e-05, -2.321600914001465e-05, -4.880130290985107e-06, 1.3455748558044434e-05, 3.1791627407073975e-05, 5.0127506256103516e-05, 6.846338510513306e-05, 8.67992639541626e-05, 0.00010513514280319214, 0.00012347102165222168, 0.00014180690050125122, 0.00016014277935028076, 0.0001784786581993103, 0.00019681453704833984, 0.00021515041589736938, 0.00023348629474639893, 0.00025182217359542847, 0.000270158052444458, 0.00028849393129348755, 0.0003068298101425171, 0.00032516568899154663, 0.00034350156784057617, 0.0003618374466896057, 0.00038017332553863525, 0.0003985092043876648, 0.00041684508323669434, 0.0004351809620857239, 0.0004535168409347534, 0.00047185271978378296, 0.0004901885986328125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 12.0, 14.0, 35.0, 40.0, 53.0, 82.0, 97.0, 195.0, 285.0, 411.0, 639.0, 1087.0, 1724.0, 2804.0, 4533.0, 7647.0, 12563.0, 21371.0, 35591.0, 58260.0, 91549.0, 133517.0, 164338.0, 162358.0, 127138.0, 85669.0, 54132.0, 32758.0, 19666.0, 11736.0, 6997.0, 4314.0, 2570.0, 1588.0, 927.0, 647.0, 385.0, 293.0, 188.0, 114.0, 68.0, 47.0, 37.0, 19.0, 19.0, 5.0, 3.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.228515625, -3.12738037109375, -3.0262451171875, -2.92510986328125, -2.823974609375, -2.72283935546875, -2.6217041015625, -2.52056884765625, -2.41943359375, -2.31829833984375, -2.2171630859375, -2.11602783203125, -2.014892578125, -1.91375732421875, -1.8126220703125, -1.71148681640625, -1.6103515625, -1.50921630859375, -1.4080810546875, -1.30694580078125, -1.205810546875, -1.10467529296875, -1.0035400390625, -0.90240478515625, -0.80126953125, -0.70013427734375, -0.5989990234375, -0.49786376953125, -0.396728515625, -0.29559326171875, -0.1944580078125, -0.09332275390625, 0.0078125, 0.10894775390625, 0.2100830078125, 0.31121826171875, 0.412353515625, 0.51348876953125, 0.6146240234375, 0.71575927734375, 0.81689453125, 0.91802978515625, 1.0191650390625, 1.12030029296875, 1.221435546875, 1.32257080078125, 1.4237060546875, 1.52484130859375, 1.6259765625, 1.72711181640625, 1.8282470703125, 1.92938232421875, 2.030517578125, 2.13165283203125, 2.2327880859375, 2.33392333984375, 2.43505859375, 2.53619384765625, 2.6373291015625, 2.73846435546875, 2.839599609375, 2.94073486328125, 3.0418701171875, 3.14300537109375, 3.244140625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 10.0, 10.0, 10.0, 19.0, 26.0, 31.0, 35.0, 35.0, 56.0, 60.0, 77.0, 60.0, 82.0, 68.0, 74.0, 67.0, 56.0, 47.0, 34.0, 19.0, 35.0, 21.0, 10.0, 13.0, 11.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341796875, -1.487457275390625, -1.44073486328125, -1.394012451171875, -1.3472900390625, -1.300567626953125, -1.25384521484375, -1.207122802734375, -1.160400390625, -1.113677978515625, -1.06695556640625, -1.020233154296875, -0.9735107421875, -0.926788330078125, -0.88006591796875, -0.833343505859375, -0.78662109375, -0.739898681640625, -0.69317626953125, -0.646453857421875, -0.5997314453125, -0.553009033203125, -0.50628662109375, -0.459564208984375, -0.412841796875, -0.366119384765625, -0.31939697265625, -0.272674560546875, -0.2259521484375, -0.179229736328125, -0.13250732421875, -0.085784912109375, -0.0390625, 0.007659912109375, 0.05438232421875, 0.101104736328125, 0.1478271484375, 0.194549560546875, 0.24127197265625, 0.287994384765625, 0.334716796875, 0.381439208984375, 0.42816162109375, 0.474884033203125, 0.5216064453125, 0.568328857421875, 0.61505126953125, 0.661773681640625, 0.70849609375, 0.755218505859375, 0.80194091796875, 0.848663330078125, 0.8953857421875, 0.942108154296875, 0.98883056640625, 1.035552978515625, 1.082275390625, 1.128997802734375, 1.17572021484375, 1.222442626953125, 1.2691650390625, 1.315887451171875, 1.36260986328125, 1.409332275390625, 1.4560546875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 10.0, 12.0, 20.0, 14.0, 31.0, 37.0, 27.0, 39.0, 39.0, 45.0, 39.0, 59.0, 58.0, 58.0, 61.0, 55.0, 52.0, 46.0, 57.0, 37.0, 41.0, 31.0, 20.0, 15.0, 14.0, 12.0, 14.0, 7.0, 5.0, 4.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.444511890411377, -7.208479881286621, -6.972447872161865, -6.736415863037109, -6.500383377075195, -6.2643513679504395, -6.028319358825684, -5.792287349700928, -5.556255340576172, -5.320223331451416, -5.08419132232666, -4.848158836364746, -4.61212682723999, -4.376094818115234, -4.1400628089904785, -3.9040307998657227, -3.6679983139038086, -3.4319663047790527, -3.1959340572357178, -2.959902048110962, -2.723869800567627, -2.487837791442871, -2.2518057823181152, -2.0157737731933594, -1.7797415256500244, -1.543709397315979, -1.3076772689819336, -1.0716452598571777, -0.8356131315231323, -0.5995810031890869, -0.36354899406433105, -0.12751686573028564, 0.10851573944091797, 0.344547837972641, 0.580579936504364, 0.8166120052337646, 1.05264413356781, 1.2886762619018555, 1.5247082710266113, 1.7607403993606567, 1.9967725276947021, 2.232804536819458, 2.468836784362793, 2.704868793487549, 2.9409008026123047, 3.1769330501556396, 3.4129650592803955, 3.6489973068237305, 3.8850293159484863, 4.121061325073242, 4.357093334197998, 4.593125343322754, 4.829157829284668, 5.065189838409424, 5.30122184753418, 5.5372538566589355, 5.773285865783691, 6.009317874908447, 6.245349884033203, 6.481382369995117, 6.717414379119873, 6.953446388244629, 7.189478397369385, 7.425510406494141, 7.661542892456055]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 5.0, 9.0, 7.0, 14.0, 15.0, 22.0, 14.0, 32.0, 22.0, 29.0, 28.0, 31.0, 43.0, 47.0, 45.0, 52.0, 49.0, 49.0, 36.0, 35.0, 38.0, 49.0, 35.0, 31.0, 35.0, 33.0, 24.0, 31.0, 23.0, 19.0, 18.0, 22.0, 8.0, 9.0, 11.0, 5.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.484739303588867, -5.311461925506592, -5.138184547424316, -4.964907169342041, -4.791629791259766, -4.61835241317749, -4.445075035095215, -4.271798133850098, -4.098520278930664, -3.9252429008483887, -3.7519655227661133, -3.578688144683838, -3.4054107666015625, -3.232133388519287, -3.058856248855591, -2.8855788707733154, -2.712301731109619, -2.5390243530273438, -2.3657469749450684, -2.192469596862793, -2.0191922187805176, -1.8459149599075317, -1.672637701034546, -1.4993603229522705, -1.3260829448699951, -1.1528055667877197, -0.9795282483100891, -0.8062509298324585, -0.6329735517501831, -0.4596961736679077, -0.2864189147949219, -0.11314153671264648, 0.060135841369628906, 0.2334131896495819, 0.4066905379295349, 0.5799678564071655, 0.7532452344894409, 0.9265226125717163, 1.0997998714447021, 1.2730772495269775, 1.446354627609253, 1.6196320056915283, 1.7929093837738037, 1.9661866426467896, 2.1394639015197754, 2.312741279602051, 2.486018657684326, 2.6592960357666016, 2.832573413848877, 3.0058507919311523, 3.1791281700134277, 3.352405548095703, 3.5256829261779785, 3.698960304260254, 3.87223744392395, 4.045515060424805, 4.218791961669922, 4.392069339752197, 4.565346717834473, 4.738624095916748, 4.911901473999023, 5.085178852081299, 5.258456230163574, 5.431733131408691, 5.605010986328125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 10.0, 5.0, 14.0, 14.0, 18.0, 27.0, 45.0, 71.0, 115.0, 150.0, 231.0, 367.0, 580.0, 994.0, 1600.0, 2743.0, 4808.0, 8474.0, 16056.0, 30858.0, 64057.0, 142632.0, 338818.0, 789305.0, 1214894.0, 881126.0, 389482.0, 160953.0, 71130.0, 34508.0, 17520.0, 9647.0, 5332.0, 3070.0, 1837.0, 1081.0, 673.0, 388.0, 226.0, 150.0, 95.0, 63.0, 44.0, 27.0, 20.0, 13.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.2265625, -7.995361328125, -7.76416015625, -7.532958984375, -7.3017578125, -7.070556640625, -6.83935546875, -6.608154296875, -6.376953125, -6.145751953125, -5.91455078125, -5.683349609375, -5.4521484375, -5.220947265625, -4.98974609375, -4.758544921875, -4.52734375, -4.296142578125, -4.06494140625, -3.833740234375, -3.6025390625, -3.371337890625, -3.14013671875, -2.908935546875, -2.677734375, -2.446533203125, -2.21533203125, -1.984130859375, -1.7529296875, -1.521728515625, -1.29052734375, -1.059326171875, -0.828125, -0.596923828125, -0.36572265625, -0.134521484375, 0.0966796875, 0.327880859375, 0.55908203125, 0.790283203125, 1.021484375, 1.252685546875, 1.48388671875, 1.715087890625, 1.9462890625, 2.177490234375, 2.40869140625, 2.639892578125, 2.87109375, 3.102294921875, 3.33349609375, 3.564697265625, 3.7958984375, 4.027099609375, 4.25830078125, 4.489501953125, 4.720703125, 4.951904296875, 5.18310546875, 5.414306640625, 5.6455078125, 5.876708984375, 6.10791015625, 6.339111328125, 6.5703125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 5.0, 5.0, 9.0, 14.0, 15.0, 14.0, 17.0, 23.0, 22.0, 27.0, 28.0, 39.0, 31.0, 39.0, 42.0, 40.0, 41.0, 38.0, 55.0, 37.0, 56.0, 31.0, 46.0, 44.0, 40.0, 44.0, 23.0, 31.0, 12.0, 30.0, 24.0, 14.0, 15.0, 11.0, 10.0, 7.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.06719970703125, -3.9468994140625, -3.82659912109375, -3.706298828125, -3.58599853515625, -3.4656982421875, -3.34539794921875, -3.22509765625, -3.10479736328125, -2.9844970703125, -2.86419677734375, -2.743896484375, -2.62359619140625, -2.5032958984375, -2.38299560546875, -2.2626953125, -2.14239501953125, -2.0220947265625, -1.90179443359375, -1.781494140625, -1.66119384765625, -1.5408935546875, -1.42059326171875, -1.30029296875, -1.17999267578125, -1.0596923828125, -0.93939208984375, -0.819091796875, -0.69879150390625, -0.5784912109375, -0.45819091796875, -0.337890625, -0.21759033203125, -0.0972900390625, 0.02301025390625, 0.143310546875, 0.26361083984375, 0.3839111328125, 0.50421142578125, 0.62451171875, 0.74481201171875, 0.8651123046875, 0.98541259765625, 1.105712890625, 1.22601318359375, 1.3463134765625, 1.46661376953125, 1.5869140625, 1.70721435546875, 1.8275146484375, 1.94781494140625, 2.068115234375, 2.18841552734375, 2.3087158203125, 2.42901611328125, 2.54931640625, 2.66961669921875, 2.7899169921875, 2.91021728515625, 3.030517578125, 3.15081787109375, 3.2711181640625, 3.39141845703125, 3.51171875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 12.0, 8.0, 9.0, 13.0, 28.0, 36.0, 52.0, 73.0, 104.0, 165.0, 266.0, 356.0, 555.0, 877.0, 1265.0, 2165.0, 3343.0, 5259.0, 8765.0, 14676.0, 25211.0, 44471.0, 81970.0, 155681.0, 302485.0, 582754.0, 934039.0, 896556.0, 538227.0, 276696.0, 142224.0, 75223.0, 41588.0, 23417.0, 13608.0, 8255.0, 5022.0, 3214.0, 1923.0, 1306.0, 811.0, 542.0, 378.0, 222.0, 151.0, 101.0, 57.0, 49.0, 30.0, 22.0, 14.0, 6.0, 10.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.57012939453125, -5.3707275390625, -5.17132568359375, -4.971923828125, -4.77252197265625, -4.5731201171875, -4.37371826171875, -4.17431640625, -3.97491455078125, -3.7755126953125, -3.57611083984375, -3.376708984375, -3.17730712890625, -2.9779052734375, -2.77850341796875, -2.5791015625, -2.37969970703125, -2.1802978515625, -1.98089599609375, -1.781494140625, -1.58209228515625, -1.3826904296875, -1.18328857421875, -0.98388671875, -0.78448486328125, -0.5850830078125, -0.38568115234375, -0.186279296875, 0.01312255859375, 0.2125244140625, 0.41192626953125, 0.611328125, 0.81072998046875, 1.0101318359375, 1.20953369140625, 1.408935546875, 1.60833740234375, 1.8077392578125, 2.00714111328125, 2.20654296875, 2.40594482421875, 2.6053466796875, 2.80474853515625, 3.004150390625, 3.20355224609375, 3.4029541015625, 3.60235595703125, 3.8017578125, 4.00115966796875, 4.2005615234375, 4.39996337890625, 4.599365234375, 4.79876708984375, 4.9981689453125, 5.19757080078125, 5.39697265625, 5.59637451171875, 5.7957763671875, 5.99517822265625, 6.194580078125, 6.39398193359375, 6.5933837890625, 6.79278564453125, 6.9921875]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 12.0, 8.0, 12.0, 17.0, 25.0, 30.0, 39.0, 56.0, 68.0, 83.0, 112.0, 123.0, 164.0, 203.0, 213.0, 247.0, 298.0, 291.0, 273.0, 256.0, 268.0, 224.0, 192.0, 163.0, 148.0, 105.0, 87.0, 68.0, 57.0, 47.0, 42.0, 34.0, 28.0, 15.0, 13.0, 16.0, 13.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.94921875, -1.87994384765625, -1.8106689453125, -1.74139404296875, -1.672119140625, -1.60284423828125, -1.5335693359375, -1.46429443359375, -1.39501953125, -1.32574462890625, -1.2564697265625, -1.18719482421875, -1.117919921875, -1.04864501953125, -0.9793701171875, -0.91009521484375, -0.8408203125, -0.77154541015625, -0.7022705078125, -0.63299560546875, -0.563720703125, -0.49444580078125, -0.4251708984375, -0.35589599609375, -0.28662109375, -0.21734619140625, -0.1480712890625, -0.07879638671875, -0.009521484375, 0.05975341796875, 0.1290283203125, 0.19830322265625, 0.267578125, 0.33685302734375, 0.4061279296875, 0.47540283203125, 0.544677734375, 0.61395263671875, 0.6832275390625, 0.75250244140625, 0.82177734375, 0.89105224609375, 0.9603271484375, 1.02960205078125, 1.098876953125, 1.16815185546875, 1.2374267578125, 1.30670166015625, 1.3759765625, 1.44525146484375, 1.5145263671875, 1.58380126953125, 1.653076171875, 1.72235107421875, 1.7916259765625, 1.86090087890625, 1.93017578125, 1.99945068359375, 2.0687255859375, 2.13800048828125, 2.207275390625, 2.27655029296875, 2.3458251953125, 2.41510009765625, 2.484375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 17.0, 6.0, 12.0, 10.0, 22.0, 15.0, 34.0, 33.0, 29.0, 39.0, 57.0, 67.0, 69.0, 77.0, 47.0, 64.0, 59.0, 60.0, 42.0, 36.0, 29.0, 23.0, 33.0, 25.0, 20.0, 16.0, 9.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.895099639892578, -6.658045291900635, -6.420990943908691, -6.18393611907959, -5.9468817710876465, -5.709827423095703, -5.472772598266602, -5.235718250274658, -4.998663902282715, -4.7616095542907715, -4.524555206298828, -4.287500381469727, -4.050446033477783, -3.81339168548584, -3.5763370990753174, -3.339282512664795, -3.1022281646728516, -2.865173816680908, -2.6281192302703857, -2.3910646438598633, -2.15401029586792, -1.916955828666687, -1.679901361465454, -1.4428468942642212, -1.2057924270629883, -0.9687379598617554, -0.7316834926605225, -0.49462902545928955, -0.25757455825805664, -0.02052009105682373, 0.21653437614440918, 0.4535888433456421, 0.690643310546875, 0.9276977777481079, 1.1647522449493408, 1.4018067121505737, 1.6388611793518066, 1.8759156465530396, 2.1129701137542725, 2.350024700164795, 2.5870790481567383, 2.8241333961486816, 3.061187982559204, 3.2982425689697266, 3.53529691696167, 3.7723512649536133, 4.009406089782715, 4.246460437774658, 4.483514785766602, 4.720569133758545, 4.957623481750488, 5.19467830657959, 5.431732654571533, 5.668787002563477, 5.905841827392578, 6.1428961753845215, 6.379950523376465, 6.617004871368408, 6.854059219360352, 7.091114044189453, 7.3281683921813965, 7.56522274017334, 7.802277565002441, 8.039331436157227, 8.276386260986328]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 7.0, 8.0, 7.0, 10.0, 8.0, 14.0, 19.0, 12.0, 24.0, 28.0, 19.0, 35.0, 33.0, 34.0, 25.0, 36.0, 26.0, 36.0, 42.0, 29.0, 56.0, 47.0, 32.0, 29.0, 41.0, 38.0, 43.0, 29.0, 18.0, 27.0, 17.0, 24.0, 22.0, 20.0, 11.0, 20.0, 11.0, 15.0, 9.0, 7.0, 10.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-4.4756879806518555, -4.342403888702393, -4.209120273590088, -4.075836181640625, -3.942552328109741, -3.8092684745788574, -3.6759843826293945, -3.5427005290985107, -3.409416675567627, -3.276132822036743, -3.1428487300872803, -3.0095648765563965, -2.8762810230255127, -2.742997169494629, -2.609713077545166, -2.4764292240142822, -2.3431451320648193, -2.2098612785339355, -2.0765771865844727, -1.9432933330535889, -1.810009479522705, -1.6767255067825317, -1.5434415340423584, -1.4101576805114746, -1.2768737077713013, -1.143589735031128, -1.0103058815002441, -0.8770219087600708, -0.7437379956245422, -0.6104540824890137, -0.47717010974884033, -0.34388619661331177, -0.2106022834777832, -0.07731835544109344, 0.055965572595596313, 0.18924951553344727, 0.32253342866897583, 0.4558173418045044, 0.5891013145446777, 0.7223852276802063, 0.8556691408157349, 0.9889530539512634, 1.122236967086792, 1.2555209398269653, 1.3888049125671387, 1.5220887660980225, 1.6553727388381958, 1.7886567115783691, 1.921940565109253, 2.0552244186401367, 2.1885085105895996, 2.3217923641204834, 2.455076217651367, 2.58836030960083, 2.721644163131714, 2.8549280166625977, 2.9882121086120605, 3.1214959621429443, 3.2547800540924072, 3.388063907623291, 3.521347761154175, 3.6546316146850586, 3.7879157066345215, 3.9211995601654053, 4.054483413696289]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 12.0, 13.0, 23.0, 27.0, 45.0, 54.0, 99.0, 130.0, 203.0, 319.0, 531.0, 805.0, 1325.0, 2214.0, 3665.0, 6329.0, 10756.0, 19059.0, 33731.0, 59185.0, 98471.0, 149276.0, 183709.0, 170659.0, 124368.0, 78221.0, 45305.0, 25113.0, 14297.0, 8383.0, 4749.0, 2737.0, 1776.0, 1087.0, 643.0, 432.0, 244.0, 186.0, 129.0, 80.0, 47.0, 38.0, 25.0, 22.0, 8.0, 10.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.88671875, -3.771575927734375, -3.65643310546875, -3.541290283203125, -3.4261474609375, -3.311004638671875, -3.19586181640625, -3.080718994140625, -2.965576171875, -2.850433349609375, -2.73529052734375, -2.620147705078125, -2.5050048828125, -2.389862060546875, -2.27471923828125, -2.159576416015625, -2.04443359375, -1.929290771484375, -1.81414794921875, -1.699005126953125, -1.5838623046875, -1.468719482421875, -1.35357666015625, -1.238433837890625, -1.123291015625, -1.008148193359375, -0.89300537109375, -0.777862548828125, -0.6627197265625, -0.547576904296875, -0.43243408203125, -0.317291259765625, -0.2021484375, -0.087005615234375, 0.02813720703125, 0.143280029296875, 0.2584228515625, 0.373565673828125, 0.48870849609375, 0.603851318359375, 0.718994140625, 0.834136962890625, 0.94927978515625, 1.064422607421875, 1.1795654296875, 1.294708251953125, 1.40985107421875, 1.524993896484375, 1.64013671875, 1.755279541015625, 1.87042236328125, 1.985565185546875, 2.1007080078125, 2.215850830078125, 2.33099365234375, 2.446136474609375, 2.561279296875, 2.676422119140625, 2.79156494140625, 2.906707763671875, 3.0218505859375, 3.136993408203125, 3.25213623046875, 3.367279052734375, 3.482421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 8.0, 5.0, 2.0, 6.0, 9.0, 12.0, 12.0, 9.0, 14.0, 23.0, 19.0, 26.0, 35.0, 28.0, 27.0, 30.0, 27.0, 30.0, 34.0, 43.0, 60.0, 42.0, 40.0, 41.0, 45.0, 39.0, 26.0, 39.0, 32.0, 24.0, 32.0, 20.0, 26.0, 15.0, 27.0, 18.0, 14.0, 10.0, 10.0, 6.0, 7.0, 4.0, 10.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.06640625, -4.92034912109375, -4.7742919921875, -4.62823486328125, -4.482177734375, -4.33612060546875, -4.1900634765625, -4.04400634765625, -3.89794921875, -3.75189208984375, -3.6058349609375, -3.45977783203125, -3.313720703125, -3.16766357421875, -3.0216064453125, -2.87554931640625, -2.7294921875, -2.58343505859375, -2.4373779296875, -2.29132080078125, -2.145263671875, -1.99920654296875, -1.8531494140625, -1.70709228515625, -1.56103515625, -1.41497802734375, -1.2689208984375, -1.12286376953125, -0.976806640625, -0.83074951171875, -0.6846923828125, -0.53863525390625, -0.392578125, -0.24652099609375, -0.1004638671875, 0.04559326171875, 0.191650390625, 0.33770751953125, 0.4837646484375, 0.62982177734375, 0.77587890625, 0.92193603515625, 1.0679931640625, 1.21405029296875, 1.360107421875, 1.50616455078125, 1.6522216796875, 1.79827880859375, 1.9443359375, 2.09039306640625, 2.2364501953125, 2.38250732421875, 2.528564453125, 2.67462158203125, 2.8206787109375, 2.96673583984375, 3.11279296875, 3.25885009765625, 3.4049072265625, 3.55096435546875, 3.697021484375, 3.84307861328125, 3.9891357421875, 4.13519287109375, 4.28125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 5.0, 16.0, 18.0, 19.0, 22.0, 41.0, 60.0, 88.0, 142.0, 202.0, 296.0, 405.0, 718.0, 995.0, 1688.0, 2804.0, 4685.0, 7808.0, 13534.0, 24145.0, 42485.0, 77732.0, 131885.0, 198771.0, 205036.0, 142055.0, 83174.0, 46972.0, 26493.0, 14950.0, 8370.0, 4890.0, 3039.0, 1753.0, 1067.0, 737.0, 471.0, 340.0, 228.0, 139.0, 94.0, 59.0, 43.0, 26.0, 15.0, 20.0, 10.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.2578125, -4.1162109375, -3.974609375, -3.8330078125, -3.69140625, -3.5498046875, -3.408203125, -3.2666015625, -3.125, -2.9833984375, -2.841796875, -2.7001953125, -2.55859375, -2.4169921875, -2.275390625, -2.1337890625, -1.9921875, -1.8505859375, -1.708984375, -1.5673828125, -1.42578125, -1.2841796875, -1.142578125, -1.0009765625, -0.859375, -0.7177734375, -0.576171875, -0.4345703125, -0.29296875, -0.1513671875, -0.009765625, 0.1318359375, 0.2734375, 0.4150390625, 0.556640625, 0.6982421875, 0.83984375, 0.9814453125, 1.123046875, 1.2646484375, 1.40625, 1.5478515625, 1.689453125, 1.8310546875, 1.97265625, 2.1142578125, 2.255859375, 2.3974609375, 2.5390625, 2.6806640625, 2.822265625, 2.9638671875, 3.10546875, 3.2470703125, 3.388671875, 3.5302734375, 3.671875, 3.8134765625, 3.955078125, 4.0966796875, 4.23828125, 4.3798828125, 4.521484375, 4.6630859375, 4.8046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 7.0, 1.0, 4.0, 13.0, 14.0, 7.0, 10.0, 17.0, 26.0, 21.0, 26.0, 28.0, 40.0, 45.0, 54.0, 42.0, 36.0, 40.0, 39.0, 50.0, 52.0, 53.0, 32.0, 36.0, 36.0, 36.0, 21.0, 26.0, 28.0, 24.0, 30.0, 14.0, 12.0, 15.0, 19.0, 10.0, 6.0, 5.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.427581787109375, -2.32977294921875, -2.231964111328125, -2.1341552734375, -2.036346435546875, -1.93853759765625, -1.840728759765625, -1.742919921875, -1.645111083984375, -1.54730224609375, -1.449493408203125, -1.3516845703125, -1.253875732421875, -1.15606689453125, -1.058258056640625, -0.96044921875, -0.862640380859375, -0.76483154296875, -0.667022705078125, -0.5692138671875, -0.471405029296875, -0.37359619140625, -0.275787353515625, -0.177978515625, -0.080169677734375, 0.01763916015625, 0.115447998046875, 0.2132568359375, 0.311065673828125, 0.40887451171875, 0.506683349609375, 0.6044921875, 0.702301025390625, 0.80010986328125, 0.897918701171875, 0.9957275390625, 1.093536376953125, 1.19134521484375, 1.289154052734375, 1.386962890625, 1.484771728515625, 1.58258056640625, 1.680389404296875, 1.7781982421875, 1.876007080078125, 1.97381591796875, 2.071624755859375, 2.16943359375, 2.267242431640625, 2.36505126953125, 2.462860107421875, 2.5606689453125, 2.658477783203125, 2.75628662109375, 2.854095458984375, 2.951904296875, 3.049713134765625, 3.14752197265625, 3.245330810546875, 3.3431396484375, 3.440948486328125, 3.53875732421875, 3.636566162109375, 3.734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 8.0, 10.0, 9.0, 14.0, 21.0, 24.0, 21.0, 37.0, 48.0, 71.0, 85.0, 111.0, 155.0, 161.0, 236.0, 325.0, 432.0, 675.0, 957.0, 1543.0, 2801.0, 5892.0, 13767.0, 39002.0, 128879.0, 385418.0, 318343.0, 96399.0, 30216.0, 11202.0, 4881.0, 2519.0, 1362.0, 834.0, 551.0, 357.0, 275.0, 222.0, 148.0, 131.0, 72.0, 76.0, 61.0, 47.0, 30.0, 35.0, 27.0, 23.0, 17.0, 10.0, 3.0, 6.0, 5.0, 5.0, 4.0], "bins": [-5.1953125, -5.04638671875, -4.8974609375, -4.74853515625, -4.599609375, -4.45068359375, -4.3017578125, -4.15283203125, -4.00390625, -3.85498046875, -3.7060546875, -3.55712890625, -3.408203125, -3.25927734375, -3.1103515625, -2.96142578125, -2.8125, -2.66357421875, -2.5146484375, -2.36572265625, -2.216796875, -2.06787109375, -1.9189453125, -1.77001953125, -1.62109375, -1.47216796875, -1.3232421875, -1.17431640625, -1.025390625, -0.87646484375, -0.7275390625, -0.57861328125, -0.4296875, -0.28076171875, -0.1318359375, 0.01708984375, 0.166015625, 0.31494140625, 0.4638671875, 0.61279296875, 0.76171875, 0.91064453125, 1.0595703125, 1.20849609375, 1.357421875, 1.50634765625, 1.6552734375, 1.80419921875, 1.953125, 2.10205078125, 2.2509765625, 2.39990234375, 2.548828125, 2.69775390625, 2.8466796875, 2.99560546875, 3.14453125, 3.29345703125, 3.4423828125, 3.59130859375, 3.740234375, 3.88916015625, 4.0380859375, 4.18701171875, 4.3359375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 5.0, 9.0, 5.0, 13.0, 15.0, 17.0, 20.0, 31.0, 36.0, 42.0, 48.0, 56.0, 87.0, 106.0, 67.0, 71.0, 74.0, 76.0, 47.0, 32.0, 31.0, 32.0, 18.0, 11.0, 11.0, 11.0, 6.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012421607971191406, -0.00012039672583341599, -0.00011657737195491791, -0.00011275801807641983, -0.00010893866419792175, -0.00010511931031942368, -0.0001012999564409256, -9.748060256242752e-05, -9.366124868392944e-05, -8.984189480543137e-05, -8.602254092693329e-05, -8.220318704843521e-05, -7.838383316993713e-05, -7.456447929143906e-05, -7.074512541294098e-05, -6.69257715344429e-05, -6.310641765594482e-05, -5.928706377744675e-05, -5.546770989894867e-05, -5.164835602045059e-05, -4.7829002141952515e-05, -4.400964826345444e-05, -4.019029438495636e-05, -3.637094050645828e-05, -3.2551586627960205e-05, -2.8732232749462128e-05, -2.491287887096405e-05, -2.1093524992465973e-05, -1.7274171113967896e-05, -1.3454817235469818e-05, -9.63546335697174e-06, -5.816109478473663e-06, -1.996755599975586e-06, 1.8225982785224915e-06, 5.641952157020569e-06, 9.461306035518646e-06, 1.3280659914016724e-05, 1.71000137925148e-05, 2.091936767101288e-05, 2.4738721549510956e-05, 2.8558075428009033e-05, 3.237742930650711e-05, 3.619678318500519e-05, 4.0016137063503265e-05, 4.383549094200134e-05, 4.765484482049942e-05, 5.14741986989975e-05, 5.5293552577495575e-05, 5.911290645599365e-05, 6.293226033449173e-05, 6.675161421298981e-05, 7.057096809148788e-05, 7.439032196998596e-05, 7.820967584848404e-05, 8.202902972698212e-05, 8.58483836054802e-05, 8.966773748397827e-05, 9.348709136247635e-05, 9.730644524097443e-05, 0.0001011257991194725, 0.00010494515299797058, 0.00010876450687646866, 0.00011258386075496674, 0.00011640321463346481, 0.00012022256851196289]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 5.0, 11.0, 18.0, 29.0, 27.0, 51.0, 64.0, 81.0, 125.0, 166.0, 256.0, 355.0, 568.0, 884.0, 1394.0, 2582.0, 4734.0, 9539.0, 21286.0, 51463.0, 125017.0, 249112.0, 283611.0, 167871.0, 72660.0, 29706.0, 12859.0, 6065.0, 3140.0, 1802.0, 1070.0, 603.0, 428.0, 272.0, 188.0, 135.0, 111.0, 70.0, 60.0, 45.0, 23.0, 26.0, 14.0, 6.0, 5.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.017578125, -2.923828125, -2.830078125, -2.736328125, -2.642578125, -2.548828125, -2.455078125, -2.361328125, -2.267578125, -2.173828125, -2.080078125, -1.986328125, -1.892578125, -1.798828125, -1.705078125, -1.611328125, -1.517578125, -1.423828125, -1.330078125, -1.236328125, -1.142578125, -1.048828125, -0.955078125, -0.861328125, -0.767578125, -0.673828125, -0.580078125, -0.486328125, -0.392578125, -0.298828125, -0.205078125, -0.111328125, -0.017578125, 0.076171875, 0.169921875, 0.263671875, 0.357421875, 0.451171875, 0.544921875, 0.638671875, 0.732421875, 0.826171875, 0.919921875, 1.013671875, 1.107421875, 1.201171875, 1.294921875, 1.388671875, 1.482421875, 1.576171875, 1.669921875, 1.763671875, 1.857421875, 1.951171875, 2.044921875, 2.138671875, 2.232421875, 2.326171875, 2.419921875, 2.513671875, 2.607421875, 2.701171875, 2.794921875, 2.888671875, 2.982421875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 10.0, 2.0, 6.0, 6.0, 8.0, 11.0, 15.0, 24.0, 21.0, 36.0, 41.0, 40.0, 49.0, 44.0, 58.0, 51.0, 70.0, 73.0, 65.0, 81.0, 60.0, 47.0, 36.0, 34.0, 27.0, 20.0, 12.0, 17.0, 10.0, 11.0, 3.0, 5.0, 1.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73095703125, -0.7072067260742188, -0.6834564208984375, -0.6597061157226562, -0.635955810546875, -0.6122055053710938, -0.5884552001953125, -0.5647048950195312, -0.54095458984375, -0.5172042846679688, -0.4934539794921875, -0.46970367431640625, -0.445953369140625, -0.42220306396484375, -0.3984527587890625, -0.37470245361328125, -0.3509521484375, -0.32720184326171875, -0.3034515380859375, -0.27970123291015625, -0.255950927734375, -0.23220062255859375, -0.2084503173828125, -0.18470001220703125, -0.16094970703125, -0.13719940185546875, -0.1134490966796875, -0.08969879150390625, -0.065948486328125, -0.04219818115234375, -0.0184478759765625, 0.00530242919921875, 0.029052734375, 0.05280303955078125, 0.0765533447265625, 0.10030364990234375, 0.124053955078125, 0.14780426025390625, 0.1715545654296875, 0.19530487060546875, 0.21905517578125, 0.24280548095703125, 0.2665557861328125, 0.29030609130859375, 0.314056396484375, 0.33780670166015625, 0.3615570068359375, 0.38530731201171875, 0.4090576171875, 0.43280792236328125, 0.4565582275390625, 0.48030853271484375, 0.504058837890625, 0.5278091430664062, 0.5515594482421875, 0.5753097534179688, 0.59906005859375, 0.6228103637695312, 0.6465606689453125, 0.6703109741210938, 0.694061279296875, 0.7178115844726562, 0.7415618896484375, 0.7653121948242188, 0.7890625]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 7.0, 12.0, 13.0, 12.0, 12.0, 29.0, 22.0, 32.0, 33.0, 35.0, 51.0, 65.0, 81.0, 62.0, 57.0, 71.0, 68.0, 55.0, 45.0, 45.0, 24.0, 35.0, 28.0, 21.0, 18.0, 14.0, 16.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.946721076965332, -6.700906276702881, -6.45509147644043, -6.2092766761779785, -5.963461875915527, -5.717647075653076, -5.471832275390625, -5.226017951965332, -4.980202674865723, -4.7343878746032715, -4.48857307434082, -4.242758274078369, -3.996943473815918, -3.751128673553467, -3.5053141117095947, -3.2594993114471436, -3.0136847496032715, -2.7678699493408203, -2.522055149078369, -2.276240348815918, -2.030425548553467, -1.7846108675003052, -1.5387961864471436, -1.2929813861846924, -1.0471665859222412, -0.80135178565979, -0.5555370450019836, -0.30972230434417725, -0.06390750408172607, 0.1819072961807251, 0.4277219772338867, 0.6735367774963379, 0.9193515777587891, 1.1651663780212402, 1.4109811782836914, 1.656795859336853, 1.9026106595993042, 2.148425579071045, 2.394240140914917, 2.640054941177368, 2.8858697414398193, 3.1316845417022705, 3.3774993419647217, 3.6233139038085938, 3.869128704071045, 4.114943504333496, 4.360758304595947, 4.606573104858398, 4.85238790512085, 5.098202705383301, 5.344017505645752, 5.589832305908203, 5.835647106170654, 6.0814619064331055, 6.327276229858398, 6.573091506958008, 6.818905830383301, 7.064720630645752, 7.310535430908203, 7.556350231170654, 7.8021650314331055, 8.047979354858398, 8.293794631958008, 8.5396089553833, 8.78542423248291]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 3.0, 3.0, 13.0, 9.0, 6.0, 9.0, 21.0, 16.0, 23.0, 26.0, 32.0, 25.0, 29.0, 31.0, 33.0, 31.0, 26.0, 38.0, 33.0, 50.0, 46.0, 38.0, 35.0, 41.0, 35.0, 32.0, 45.0, 27.0, 27.0, 21.0, 19.0, 23.0, 25.0, 16.0, 18.0, 12.0, 15.0, 6.0, 13.0, 9.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.334875106811523, -4.202536582946777, -4.070198059082031, -3.9378597736358643, -3.805521249771118, -3.673182725906372, -3.540844440460205, -3.408505916595459, -3.276167392730713, -3.143828868865967, -3.0114903450012207, -2.8791520595550537, -2.7468135356903076, -2.6144750118255615, -2.4821367263793945, -2.3497982025146484, -2.2174596786499023, -2.0851211547851562, -1.9527827501296997, -1.8204443454742432, -1.688105821609497, -1.555767297744751, -1.4234288930892944, -1.291090488433838, -1.1587519645690918, -1.0264134407043457, -0.8940750360488892, -0.7617365717887878, -0.6293981075286865, -0.4970596432685852, -0.3647211790084839, -0.23238271474838257, -0.10004377365112305, 0.03229469060897827, 0.1646331548690796, 0.2969716191291809, 0.4293100833892822, 0.5616485476493835, 0.6939870119094849, 0.8263254761695862, 0.9586639404296875, 1.0910024642944336, 1.2233408689498901, 1.3556792736053467, 1.4880177974700928, 1.6203563213348389, 1.7526947259902954, 1.885033130645752, 2.017371654510498, 2.149710178375244, 2.2820487022399902, 2.4143869876861572, 2.5467255115509033, 2.6790640354156494, 2.8114023208618164, 2.9437408447265625, 3.0760793685913086, 3.2084178924560547, 3.340756416320801, 3.4730947017669678, 3.605433225631714, 3.73777174949646, 3.870110034942627, 4.002448558807373, 4.134787082672119]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 8.0, 17.0, 41.0, 47.0, 62.0, 99.0, 146.0, 255.0, 369.0, 634.0, 979.0, 1593.0, 2405.0, 3961.0, 6251.0, 10430.0, 17000.0, 27843.0, 43573.0, 67312.0, 98482.0, 130243.0, 148541.0, 141621.0, 115425.0, 83227.0, 55409.0, 34979.0, 21884.0, 13669.0, 8302.0, 5214.0, 3156.0, 2000.0, 1283.0, 751.0, 479.0, 343.0, 179.0, 121.0, 81.0, 56.0, 32.0, 15.0, 11.0, 9.0, 9.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.74481201171875, -3.6146240234375, -3.48443603515625, -3.354248046875, -3.22406005859375, -3.0938720703125, -2.96368408203125, -2.83349609375, -2.70330810546875, -2.5731201171875, -2.44293212890625, -2.312744140625, -2.18255615234375, -2.0523681640625, -1.92218017578125, -1.7919921875, -1.66180419921875, -1.5316162109375, -1.40142822265625, -1.271240234375, -1.14105224609375, -1.0108642578125, -0.88067626953125, -0.75048828125, -0.62030029296875, -0.4901123046875, -0.35992431640625, -0.229736328125, -0.09954833984375, 0.0306396484375, 0.16082763671875, 0.291015625, 0.42120361328125, 0.5513916015625, 0.68157958984375, 0.811767578125, 0.94195556640625, 1.0721435546875, 1.20233154296875, 1.33251953125, 1.46270751953125, 1.5928955078125, 1.72308349609375, 1.853271484375, 1.98345947265625, 2.1136474609375, 2.24383544921875, 2.3740234375, 2.50421142578125, 2.6343994140625, 2.76458740234375, 2.894775390625, 3.02496337890625, 3.1551513671875, 3.28533935546875, 3.41552734375, 3.54571533203125, 3.6759033203125, 3.80609130859375, 3.936279296875, 4.06646728515625, 4.1966552734375, 4.32684326171875, 4.45703125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 9.0, 7.0, 7.0, 19.0, 10.0, 12.0, 12.0, 21.0, 28.0, 28.0, 41.0, 33.0, 35.0, 29.0, 46.0, 49.0, 47.0, 48.0, 34.0, 37.0, 46.0, 39.0, 37.0, 33.0, 39.0, 26.0, 31.0, 23.0, 26.0, 21.0, 20.0, 18.0, 17.0, 16.0, 13.0, 8.0, 6.0, 13.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.732421875, -4.58203125, -4.431640625, -4.28125, -4.130859375, -3.98046875, -3.830078125, -3.6796875, -3.529296875, -3.37890625, -3.228515625, -3.078125, -2.927734375, -2.77734375, -2.626953125, -2.4765625, -2.326171875, -2.17578125, -2.025390625, -1.875, -1.724609375, -1.57421875, -1.423828125, -1.2734375, -1.123046875, -0.97265625, -0.822265625, -0.671875, -0.521484375, -0.37109375, -0.220703125, -0.0703125, 0.080078125, 0.23046875, 0.380859375, 0.53125, 0.681640625, 0.83203125, 0.982421875, 1.1328125, 1.283203125, 1.43359375, 1.583984375, 1.734375, 1.884765625, 2.03515625, 2.185546875, 2.3359375, 2.486328125, 2.63671875, 2.787109375, 2.9375, 3.087890625, 3.23828125, 3.388671875, 3.5390625, 3.689453125, 3.83984375, 3.990234375, 4.140625, 4.291015625, 4.44140625, 4.591796875, 4.7421875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 12.0, 14.0, 18.0, 34.0, 44.0, 59.0, 88.0, 137.0, 223.0, 283.0, 464.0, 711.0, 1062.0, 1640.0, 2541.0, 3964.0, 5866.0, 9282.0, 14340.0, 22221.0, 34133.0, 51154.0, 74495.0, 101226.0, 126048.0, 136800.0, 127594.0, 103872.0, 76430.0, 53360.0, 35173.0, 22857.0, 14834.0, 9786.0, 6201.0, 4005.0, 2591.0, 1709.0, 1140.0, 698.0, 518.0, 352.0, 195.0, 128.0, 84.0, 62.0, 39.0, 17.0, 19.0, 12.0, 10.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.322845458984375, -3.21405029296875, -3.105255126953125, -2.9964599609375, -2.887664794921875, -2.77886962890625, -2.670074462890625, -2.561279296875, -2.452484130859375, -2.34368896484375, -2.234893798828125, -2.1260986328125, -2.017303466796875, -1.90850830078125, -1.799713134765625, -1.69091796875, -1.582122802734375, -1.47332763671875, -1.364532470703125, -1.2557373046875, -1.146942138671875, -1.03814697265625, -0.929351806640625, -0.820556640625, -0.711761474609375, -0.60296630859375, -0.494171142578125, -0.3853759765625, -0.276580810546875, -0.16778564453125, -0.058990478515625, 0.0498046875, 0.158599853515625, 0.26739501953125, 0.376190185546875, 0.4849853515625, 0.593780517578125, 0.70257568359375, 0.811370849609375, 0.920166015625, 1.028961181640625, 1.13775634765625, 1.246551513671875, 1.3553466796875, 1.464141845703125, 1.57293701171875, 1.681732177734375, 1.79052734375, 1.899322509765625, 2.00811767578125, 2.116912841796875, 2.2257080078125, 2.334503173828125, 2.44329833984375, 2.552093505859375, 2.660888671875, 2.769683837890625, 2.87847900390625, 2.987274169921875, 3.0960693359375, 3.204864501953125, 3.31365966796875, 3.422454833984375, 3.53125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 2.0, 12.0, 4.0, 8.0, 13.0, 20.0, 12.0, 24.0, 19.0, 32.0, 26.0, 28.0, 30.0, 50.0, 35.0, 45.0, 27.0, 46.0, 47.0, 50.0, 50.0, 37.0, 36.0, 37.0, 36.0, 33.0, 38.0, 27.0, 18.0, 27.0, 23.0, 21.0, 16.0, 8.0, 11.0, 14.0, 5.0, 4.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0], "bins": [-3.494140625, -3.397308349609375, -3.30047607421875, -3.203643798828125, -3.1068115234375, -3.009979248046875, -2.91314697265625, -2.816314697265625, -2.719482421875, -2.622650146484375, -2.52581787109375, -2.428985595703125, -2.3321533203125, -2.235321044921875, -2.13848876953125, -2.041656494140625, -1.94482421875, -1.847991943359375, -1.75115966796875, -1.654327392578125, -1.5574951171875, -1.460662841796875, -1.36383056640625, -1.266998291015625, -1.170166015625, -1.073333740234375, -0.97650146484375, -0.879669189453125, -0.7828369140625, -0.686004638671875, -0.58917236328125, -0.492340087890625, -0.3955078125, -0.298675537109375, -0.20184326171875, -0.105010986328125, -0.0081787109375, 0.088653564453125, 0.18548583984375, 0.282318115234375, 0.379150390625, 0.475982666015625, 0.57281494140625, 0.669647216796875, 0.7664794921875, 0.863311767578125, 0.96014404296875, 1.056976318359375, 1.15380859375, 1.250640869140625, 1.34747314453125, 1.444305419921875, 1.5411376953125, 1.637969970703125, 1.73480224609375, 1.831634521484375, 1.928466796875, 2.025299072265625, 2.12213134765625, 2.218963623046875, 2.3157958984375, 2.412628173828125, 2.50946044921875, 2.606292724609375, 2.703125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 11.0, 10.0, 12.0, 19.0, 48.0, 74.0, 95.0, 119.0, 231.0, 357.0, 623.0, 1070.0, 1842.0, 3090.0, 5617.0, 10415.0, 19125.0, 36554.0, 66929.0, 116073.0, 173721.0, 201441.0, 167081.0, 108458.0, 62029.0, 33832.0, 17896.0, 9559.0, 5290.0, 2911.0, 1596.0, 915.0, 596.0, 340.0, 200.0, 138.0, 83.0, 48.0, 31.0, 25.0, 17.0, 13.0, 6.0, 4.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.17578125, -3.08355712890625, -2.9913330078125, -2.89910888671875, -2.806884765625, -2.71466064453125, -2.6224365234375, -2.53021240234375, -2.43798828125, -2.34576416015625, -2.2535400390625, -2.16131591796875, -2.069091796875, -1.97686767578125, -1.8846435546875, -1.79241943359375, -1.7001953125, -1.60797119140625, -1.5157470703125, -1.42352294921875, -1.331298828125, -1.23907470703125, -1.1468505859375, -1.05462646484375, -0.96240234375, -0.87017822265625, -0.7779541015625, -0.68572998046875, -0.593505859375, -0.50128173828125, -0.4090576171875, -0.31683349609375, -0.224609375, -0.13238525390625, -0.0401611328125, 0.05206298828125, 0.144287109375, 0.23651123046875, 0.3287353515625, 0.42095947265625, 0.51318359375, 0.60540771484375, 0.6976318359375, 0.78985595703125, 0.882080078125, 0.97430419921875, 1.0665283203125, 1.15875244140625, 1.2509765625, 1.34320068359375, 1.4354248046875, 1.52764892578125, 1.619873046875, 1.71209716796875, 1.8043212890625, 1.89654541015625, 1.98876953125, 2.08099365234375, 2.1732177734375, 2.26544189453125, 2.357666015625, 2.44989013671875, 2.5421142578125, 2.63433837890625, 2.7265625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 7.0, 17.0, 18.0, 21.0, 22.0, 38.0, 51.0, 53.0, 81.0, 60.0, 70.0, 75.0, 62.0, 57.0, 64.0, 58.0, 45.0, 36.0, 40.0, 29.0, 27.0, 13.0, 10.0, 10.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029468536376953125, -0.00028483569622039795, -0.00027498602867126465, -0.00026513636112213135, -0.00025528669357299805, -0.00024543702602386475, -0.00023558735847473145, -0.00022573769092559814, -0.00021588802337646484, -0.00020603835582733154, -0.00019618868827819824, -0.00018633902072906494, -0.00017648935317993164, -0.00016663968563079834, -0.00015679001808166504, -0.00014694035053253174, -0.00013709068298339844, -0.00012724101543426514, -0.00011739134788513184, -0.00010754168033599854, -9.769201278686523e-05, -8.784234523773193e-05, -7.799267768859863e-05, -6.814301013946533e-05, -5.829334259033203e-05, -4.844367504119873e-05, -3.859400749206543e-05, -2.874433994293213e-05, -1.8894672393798828e-05, -9.045004844665527e-06, 8.046627044677734e-07, 1.0654330253601074e-05, 2.0503997802734375e-05, 3.0353665351867676e-05, 4.0203332901000977e-05, 5.005300045013428e-05, 5.990266799926758e-05, 6.975233554840088e-05, 7.960200309753418e-05, 8.945167064666748e-05, 9.930133819580078e-05, 0.00010915100574493408, 0.00011900067329406738, 0.00012885034084320068, 0.00013870000839233398, 0.00014854967594146729, 0.00015839934349060059, 0.0001682490110397339, 0.0001780986785888672, 0.0001879483461380005, 0.0001977980136871338, 0.0002076476812362671, 0.0002174973487854004, 0.0002273470163345337, 0.000237196683883667, 0.0002470463514328003, 0.0002568960189819336, 0.0002667456865310669, 0.0002765953540802002, 0.0002864450216293335, 0.0002962946891784668, 0.0003061443567276001, 0.0003159940242767334, 0.0003258436918258667, 0.000335693359375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 8.0, 7.0, 11.0, 13.0, 26.0, 44.0, 57.0, 77.0, 98.0, 151.0, 255.0, 356.0, 544.0, 856.0, 1327.0, 2157.0, 3420.0, 5691.0, 9428.0, 15817.0, 26063.0, 43444.0, 69710.0, 105108.0, 140381.0, 158396.0, 147279.0, 114396.0, 77895.0, 49458.0, 30129.0, 18168.0, 10800.0, 6574.0, 3841.0, 2344.0, 1507.0, 930.0, 587.0, 375.0, 267.0, 173.0, 113.0, 91.0, 57.0, 41.0, 33.0, 17.0, 12.0, 5.0, 7.0, 2.0, 8.0, 3.0, 2.0, 1.0, 2.0], "bins": [-2.328125, -2.25677490234375, -2.1854248046875, -2.11407470703125, -2.042724609375, -1.97137451171875, -1.9000244140625, -1.82867431640625, -1.75732421875, -1.68597412109375, -1.6146240234375, -1.54327392578125, -1.471923828125, -1.40057373046875, -1.3292236328125, -1.25787353515625, -1.1865234375, -1.11517333984375, -1.0438232421875, -0.97247314453125, -0.901123046875, -0.82977294921875, -0.7584228515625, -0.68707275390625, -0.61572265625, -0.54437255859375, -0.4730224609375, -0.40167236328125, -0.330322265625, -0.25897216796875, -0.1876220703125, -0.11627197265625, -0.044921875, 0.02642822265625, 0.0977783203125, 0.16912841796875, 0.240478515625, 0.31182861328125, 0.3831787109375, 0.45452880859375, 0.52587890625, 0.59722900390625, 0.6685791015625, 0.73992919921875, 0.811279296875, 0.88262939453125, 0.9539794921875, 1.02532958984375, 1.0966796875, 1.16802978515625, 1.2393798828125, 1.31072998046875, 1.382080078125, 1.45343017578125, 1.5247802734375, 1.59613037109375, 1.66748046875, 1.73883056640625, 1.8101806640625, 1.88153076171875, 1.952880859375, 2.02423095703125, 2.0955810546875, 2.16693115234375, 2.23828125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 9.0, 3.0, 6.0, 9.0, 13.0, 17.0, 25.0, 25.0, 32.0, 30.0, 37.0, 46.0, 54.0, 47.0, 63.0, 53.0, 67.0, 48.0, 47.0, 49.0, 56.0, 37.0, 47.0, 28.0, 28.0, 25.0, 21.0, 15.0, 10.0, 12.0, 5.0, 10.0, 3.0, 3.0, 5.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.833984375, -0.8075103759765625, -0.781036376953125, -0.7545623779296875, -0.72808837890625, -0.7016143798828125, -0.675140380859375, -0.6486663818359375, -0.6221923828125, -0.5957183837890625, -0.569244384765625, -0.5427703857421875, -0.51629638671875, -0.4898223876953125, -0.463348388671875, -0.4368743896484375, -0.410400390625, -0.3839263916015625, -0.357452392578125, -0.3309783935546875, -0.30450439453125, -0.2780303955078125, -0.251556396484375, -0.2250823974609375, -0.1986083984375, -0.1721343994140625, -0.145660400390625, -0.1191864013671875, -0.09271240234375, -0.0662384033203125, -0.039764404296875, -0.0132904052734375, 0.01318359375, 0.0396575927734375, 0.066131591796875, 0.0926055908203125, 0.11907958984375, 0.1455535888671875, 0.172027587890625, 0.1985015869140625, 0.2249755859375, 0.2514495849609375, 0.277923583984375, 0.3043975830078125, 0.33087158203125, 0.3573455810546875, 0.383819580078125, 0.4102935791015625, 0.436767578125, 0.4632415771484375, 0.489715576171875, 0.5161895751953125, 0.54266357421875, 0.5691375732421875, 0.595611572265625, 0.6220855712890625, 0.6485595703125, 0.6750335693359375, 0.701507568359375, 0.7279815673828125, 0.75445556640625, 0.7809295654296875, 0.807403564453125, 0.8338775634765625, 0.8603515625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 5.0, 5.0, 6.0, 7.0, 7.0, 9.0, 14.0, 11.0, 17.0, 28.0, 31.0, 29.0, 25.0, 38.0, 48.0, 57.0, 57.0, 48.0, 55.0, 66.0, 69.0, 50.0, 45.0, 39.0, 36.0, 40.0, 21.0, 18.0, 30.0, 14.0, 8.0, 13.0, 10.0, 9.0, 9.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.236756324768066, -7.029432773590088, -6.822109699249268, -6.614786148071289, -6.407463073730469, -6.20013952255249, -5.992815971374512, -5.785492897033691, -5.578169822692871, -5.370846271514893, -5.163523197174072, -4.956199645996094, -4.748876571655273, -4.541553020477295, -4.334229469299316, -4.126906394958496, -3.9195828437805176, -3.712259531021118, -3.5049362182617188, -3.2976126670837402, -3.09028959274292, -2.8829660415649414, -2.675642728805542, -2.4683194160461426, -2.260996103286743, -2.0536727905273438, -1.8463494777679443, -1.6390260457992554, -1.431702733039856, -1.2243794202804565, -1.0170559883117676, -0.8097326755523682, -0.602409839630127, -0.39508649706840515, -0.18776315450668335, 0.01956021785736084, 0.22688353061676025, 0.43420684337615967, 0.6415302753448486, 0.848853588104248, 1.0561769008636475, 1.2635002136230469, 1.4708235263824463, 1.6781469583511353, 1.8854702711105347, 2.0927934646606445, 2.300117015838623, 2.5074403285980225, 2.714763641357422, 2.9220869541168213, 3.1294102668762207, 3.336733818054199, 3.5440568923950195, 3.751380443572998, 3.9587037563323975, 4.166027069091797, 4.373350143432617, 4.580673694610596, 4.787996768951416, 4.9953203201293945, 5.202643394470215, 5.409966945648193, 5.617290496826172, 5.824613571166992, 6.031937122344971]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 11.0, 20.0, 15.0, 19.0, 22.0, 31.0, 24.0, 28.0, 18.0, 33.0, 29.0, 40.0, 24.0, 40.0, 36.0, 45.0, 42.0, 33.0, 31.0, 41.0, 45.0, 27.0, 34.0, 33.0, 30.0, 40.0, 28.0, 27.0, 22.0, 26.0, 13.0, 14.0, 8.0, 2.0, 12.0, 10.0, 6.0, 5.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.626706600189209, -4.494546890258789, -4.362387657165527, -4.230227947235107, -4.0980682373046875, -3.9659087657928467, -3.833749294281006, -3.701589584350586, -3.569430112838745, -3.4372706413269043, -3.3051109313964844, -3.1729514598846436, -3.0407919883728027, -2.908632278442383, -2.776472806930542, -2.644313335418701, -2.5121536254882812, -2.3799941539764404, -2.2478344440460205, -2.1156749725341797, -1.9835153818130493, -1.851355791091919, -1.7191963195800781, -1.5870367288589478, -1.4548771381378174, -1.322717547416687, -1.1905579566955566, -1.0583984851837158, -0.9262388944625854, -0.7940793037414551, -0.6619197726249695, -0.5297602415084839, -0.3976008892059326, -0.26544132828712463, -0.13328176736831665, -0.001122206449508667, 0.13103735446929932, 0.2631969451904297, 0.3953564763069153, 0.5275160074234009, 0.6596755981445312, 0.7918351888656616, 0.9239947199821472, 1.0561542510986328, 1.1883138418197632, 1.3204734325408936, 1.4526329040527344, 1.5847924947738647, 1.7169520854949951, 1.8491116762161255, 1.9812712669372559, 2.1134307384490967, 2.2455902099609375, 2.3777499198913574, 2.5099093914031982, 2.642068862915039, 2.774228572845459, 2.9063880443573, 3.0385477542877197, 3.1707072257995605, 3.3028669357299805, 3.4350264072418213, 3.567185878753662, 3.699345588684082, 3.831505060195923]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [4.0, 4.0, 4.0, 11.0, 9.0, 13.0, 18.0, 26.0, 31.0, 43.0, 64.0, 101.0, 120.0, 184.0, 233.0, 341.0, 459.0, 729.0, 1041.0, 1559.0, 2314.0, 3691.0, 5992.0, 9715.0, 16304.0, 29938.0, 56523.0, 116635.0, 260214.0, 602316.0, 1091987.0, 1026853.0, 522785.0, 224801.0, 101313.0, 50034.0, 26780.0, 15258.0, 8953.0, 5745.0, 3697.0, 2425.0, 1585.0, 1076.0, 743.0, 512.0, 363.0, 235.0, 170.0, 132.0, 75.0, 47.0, 28.0, 22.0, 19.0, 11.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-5.9609375, -5.76812744140625, -5.5753173828125, -5.38250732421875, -5.189697265625, -4.99688720703125, -4.8040771484375, -4.61126708984375, -4.41845703125, -4.22564697265625, -4.0328369140625, -3.84002685546875, -3.647216796875, -3.45440673828125, -3.2615966796875, -3.06878662109375, -2.8759765625, -2.68316650390625, -2.4903564453125, -2.29754638671875, -2.104736328125, -1.91192626953125, -1.7191162109375, -1.52630615234375, -1.33349609375, -1.14068603515625, -0.9478759765625, -0.75506591796875, -0.562255859375, -0.36944580078125, -0.1766357421875, 0.01617431640625, 0.208984375, 0.40179443359375, 0.5946044921875, 0.78741455078125, 0.980224609375, 1.17303466796875, 1.3658447265625, 1.55865478515625, 1.75146484375, 1.94427490234375, 2.1370849609375, 2.32989501953125, 2.522705078125, 2.71551513671875, 2.9083251953125, 3.10113525390625, 3.2939453125, 3.48675537109375, 3.6795654296875, 3.87237548828125, 4.065185546875, 4.25799560546875, 4.4508056640625, 4.64361572265625, 4.83642578125, 5.02923583984375, 5.2220458984375, 5.41485595703125, 5.607666015625, 5.80047607421875, 5.9932861328125, 6.18609619140625, 6.37890625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 11.0, 3.0, 15.0, 20.0, 13.0, 18.0, 14.0, 18.0, 27.0, 22.0, 31.0, 30.0, 35.0, 35.0, 35.0, 42.0, 36.0, 38.0, 35.0, 37.0, 40.0, 30.0, 41.0, 46.0, 32.0, 28.0, 35.0, 30.0, 27.0, 26.0, 26.0, 19.0, 24.0, 9.0, 13.0, 8.0, 7.0, 3.0, 9.0, 10.0, 2.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.208984375, -3.1156005859375, -3.022216796875, -2.9288330078125, -2.83544921875, -2.7420654296875, -2.648681640625, -2.5552978515625, -2.4619140625, -2.3685302734375, -2.275146484375, -2.1817626953125, -2.08837890625, -1.9949951171875, -1.901611328125, -1.8082275390625, -1.71484375, -1.6214599609375, -1.528076171875, -1.4346923828125, -1.34130859375, -1.2479248046875, -1.154541015625, -1.0611572265625, -0.9677734375, -0.8743896484375, -0.781005859375, -0.6876220703125, -0.59423828125, -0.5008544921875, -0.407470703125, -0.3140869140625, -0.220703125, -0.1273193359375, -0.033935546875, 0.0594482421875, 0.15283203125, 0.2462158203125, 0.339599609375, 0.4329833984375, 0.5263671875, 0.6197509765625, 0.713134765625, 0.8065185546875, 0.89990234375, 0.9932861328125, 1.086669921875, 1.1800537109375, 1.2734375, 1.3668212890625, 1.460205078125, 1.5535888671875, 1.64697265625, 1.7403564453125, 1.833740234375, 1.9271240234375, 2.0205078125, 2.1138916015625, 2.207275390625, 2.3006591796875, 2.39404296875, 2.4874267578125, 2.580810546875, 2.6741943359375, 2.767578125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 8.0, 14.0, 15.0, 17.0, 36.0, 45.0, 82.0, 106.0, 139.0, 197.0, 298.0, 525.0, 698.0, 1092.0, 1686.0, 2596.0, 4258.0, 7014.0, 12012.0, 21160.0, 38590.0, 73354.0, 146840.0, 306561.0, 649361.0, 1115431.0, 914014.0, 456359.0, 213921.0, 104749.0, 54034.0, 28682.0, 16049.0, 9339.0, 5481.0, 3427.0, 2086.0, 1373.0, 829.0, 577.0, 375.0, 274.0, 176.0, 129.0, 97.0, 56.0, 44.0, 31.0, 18.0, 14.0, 11.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.64453125, -6.44171142578125, -6.2388916015625, -6.03607177734375, -5.833251953125, -5.63043212890625, -5.4276123046875, -5.22479248046875, -5.02197265625, -4.81915283203125, -4.6163330078125, -4.41351318359375, -4.210693359375, -4.00787353515625, -3.8050537109375, -3.60223388671875, -3.3994140625, -3.19659423828125, -2.9937744140625, -2.79095458984375, -2.588134765625, -2.38531494140625, -2.1824951171875, -1.97967529296875, -1.77685546875, -1.57403564453125, -1.3712158203125, -1.16839599609375, -0.965576171875, -0.76275634765625, -0.5599365234375, -0.35711669921875, -0.154296875, 0.04852294921875, 0.2513427734375, 0.45416259765625, 0.656982421875, 0.85980224609375, 1.0626220703125, 1.26544189453125, 1.46826171875, 1.67108154296875, 1.8739013671875, 2.07672119140625, 2.279541015625, 2.48236083984375, 2.6851806640625, 2.88800048828125, 3.0908203125, 3.29364013671875, 3.4964599609375, 3.69927978515625, 3.902099609375, 4.10491943359375, 4.3077392578125, 4.51055908203125, 4.71337890625, 4.91619873046875, 5.1190185546875, 5.32183837890625, 5.524658203125, 5.72747802734375, 5.9302978515625, 6.13311767578125, 6.3359375]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 8.0, 15.0, 16.0, 23.0, 26.0, 27.0, 44.0, 60.0, 61.0, 93.0, 107.0, 163.0, 200.0, 246.0, 239.0, 284.0, 316.0, 328.0, 317.0, 266.0, 224.0, 179.0, 156.0, 133.0, 113.0, 86.0, 67.0, 60.0, 34.0, 38.0, 19.0, 22.0, 20.0, 16.0, 14.0, 11.0, 8.0, 0.0, 5.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.1015625, -2.038299560546875, -1.97503662109375, -1.911773681640625, -1.8485107421875, -1.785247802734375, -1.72198486328125, -1.658721923828125, -1.595458984375, -1.532196044921875, -1.46893310546875, -1.405670166015625, -1.3424072265625, -1.279144287109375, -1.21588134765625, -1.152618408203125, -1.08935546875, -1.026092529296875, -0.96282958984375, -0.899566650390625, -0.8363037109375, -0.773040771484375, -0.70977783203125, -0.646514892578125, -0.583251953125, -0.519989013671875, -0.45672607421875, -0.393463134765625, -0.3302001953125, -0.266937255859375, -0.20367431640625, -0.140411376953125, -0.0771484375, -0.013885498046875, 0.04937744140625, 0.112640380859375, 0.1759033203125, 0.239166259765625, 0.30242919921875, 0.365692138671875, 0.428955078125, 0.492218017578125, 0.55548095703125, 0.618743896484375, 0.6820068359375, 0.745269775390625, 0.80853271484375, 0.871795654296875, 0.93505859375, 0.998321533203125, 1.06158447265625, 1.124847412109375, 1.1881103515625, 1.251373291015625, 1.31463623046875, 1.377899169921875, 1.441162109375, 1.504425048828125, 1.56768798828125, 1.630950927734375, 1.6942138671875, 1.757476806640625, 1.82073974609375, 1.884002685546875, 1.947265625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 7.0, 12.0, 8.0, 6.0, 14.0, 12.0, 29.0, 27.0, 27.0, 30.0, 38.0, 41.0, 58.0, 67.0, 59.0, 78.0, 69.0, 64.0, 58.0, 43.0, 46.0, 52.0, 34.0, 22.0, 15.0, 18.0, 16.0, 8.0, 9.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.33729362487793, -7.110114097595215, -6.8829345703125, -6.655755043029785, -6.42857551574707, -6.2013959884643555, -5.974216461181641, -5.747036457061768, -5.519856929779053, -5.292677402496338, -5.065497875213623, -4.838318347930908, -4.611138820648193, -4.38395881652832, -4.1567792892456055, -3.9295997619628906, -3.702420473098755, -3.47524094581604, -3.248061418533325, -3.0208816528320312, -2.7937021255493164, -2.5665225982666016, -2.3393430709838867, -2.112163543701172, -1.8849838972091675, -1.6578043699264526, -1.4306247234344482, -1.2034451961517334, -0.9762656092643738, -0.7490860223770142, -0.5219064950942993, -0.2947268486022949, -0.06754732131958008, 0.15963225066661835, 0.3868118226528168, 0.613991379737854, 0.8411709666252136, 1.0683505535125732, 1.295530080795288, 1.5227097272872925, 1.7498892545700073, 1.9770687818527222, 2.2042484283447266, 2.4314279556274414, 2.6586074829101562, 2.885787010192871, 3.112966537475586, 3.34014630317688, 3.5673258304595947, 3.7945053577423096, 4.0216851234436035, 4.248864650726318, 4.476044178009033, 4.703223705291748, 4.930403232574463, 5.157582759857178, 5.384762287139893, 5.611941814422607, 5.839121341705322, 6.066300868988037, 6.293480396270752, 6.520660400390625, 6.74783992767334, 6.975019454956055, 7.2021989822387695]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 5.0, 7.0, 10.0, 14.0, 13.0, 17.0, 13.0, 16.0, 17.0, 24.0, 25.0, 30.0, 29.0, 36.0, 23.0, 28.0, 35.0, 46.0, 41.0, 39.0, 41.0, 30.0, 26.0, 33.0, 35.0, 42.0, 33.0, 39.0, 24.0, 27.0, 30.0, 19.0, 17.0, 19.0, 13.0, 12.0, 12.0, 15.0, 11.0, 12.0, 7.0, 3.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4900124073028564, -3.37502384185791, -3.2600350379943848, -3.1450464725494385, -3.030057668685913, -2.915069103240967, -2.8000802993774414, -2.685091733932495, -2.570103168487549, -2.4551146030426025, -2.340125799179077, -2.225137233734131, -2.1101484298706055, -1.9951598644256592, -1.8801711797714233, -1.7651824951171875, -1.650193691253662, -1.5352050065994263, -1.4202163219451904, -1.3052277565002441, -1.1902389526367188, -1.0752503871917725, -0.9602617025375366, -0.8452730178833008, -0.7302843332290649, -0.6152956485748291, -0.5003069639205933, -0.3853183388710022, -0.27032965421676636, -0.15534096956253052, -0.04035234451293945, 0.07463634014129639, 0.18962502479553223, 0.30461370944976807, 0.4196023643016815, 0.534591019153595, 0.6495797038078308, 0.7645683884620667, 0.8795570135116577, 0.9945456981658936, 1.1095343828201294, 1.2245230674743652, 1.339511752128601, 1.454500436782837, 1.5694890022277832, 1.6844778060913086, 1.7994663715362549, 1.9144550561904907, 2.0294437408447266, 2.144432306289673, 2.2594211101531982, 2.3744096755981445, 2.48939847946167, 2.604387044906616, 2.7193756103515625, 2.834364414215088, 2.9493532180786133, 3.0643417835235596, 3.179330587387085, 3.2943191528320312, 3.4093079566955566, 3.524296522140503, 3.639285087585449, 3.7542738914489746, 3.869262456893921]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 10.0, 8.0, 12.0, 22.0, 17.0, 45.0, 41.0, 66.0, 101.0, 181.0, 227.0, 371.0, 567.0, 918.0, 1568.0, 2902.0, 5948.0, 12240.0, 27831.0, 65342.0, 146070.0, 256771.0, 258499.0, 148325.0, 66591.0, 28422.0, 12339.0, 5801.0, 2977.0, 1627.0, 933.0, 605.0, 348.0, 255.0, 184.0, 118.0, 84.0, 49.0, 38.0, 34.0, 19.0, 6.0, 5.0, 10.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-5.046875, -4.88922119140625, -4.7315673828125, -4.57391357421875, -4.416259765625, -4.25860595703125, -4.1009521484375, -3.94329833984375, -3.78564453125, -3.62799072265625, -3.4703369140625, -3.31268310546875, -3.155029296875, -2.99737548828125, -2.8397216796875, -2.68206787109375, -2.5244140625, -2.36676025390625, -2.2091064453125, -2.05145263671875, -1.893798828125, -1.73614501953125, -1.5784912109375, -1.42083740234375, -1.26318359375, -1.10552978515625, -0.9478759765625, -0.79022216796875, -0.632568359375, -0.47491455078125, -0.3172607421875, -0.15960693359375, -0.001953125, 0.15570068359375, 0.3133544921875, 0.47100830078125, 0.628662109375, 0.78631591796875, 0.9439697265625, 1.10162353515625, 1.25927734375, 1.41693115234375, 1.5745849609375, 1.73223876953125, 1.889892578125, 2.04754638671875, 2.2052001953125, 2.36285400390625, 2.5205078125, 2.67816162109375, 2.8358154296875, 2.99346923828125, 3.151123046875, 3.30877685546875, 3.4664306640625, 3.62408447265625, 3.78173828125, 3.93939208984375, 4.0970458984375, 4.25469970703125, 4.412353515625, 4.57000732421875, 4.7276611328125, 4.88531494140625, 5.04296875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 2.0, 10.0, 14.0, 16.0, 9.0, 13.0, 21.0, 18.0, 21.0, 24.0, 19.0, 41.0, 30.0, 28.0, 41.0, 36.0, 37.0, 39.0, 45.0, 39.0, 36.0, 39.0, 37.0, 39.0, 35.0, 32.0, 31.0, 25.0, 29.0, 29.0, 22.0, 20.0, 16.0, 16.0, 9.0, 15.0, 13.0, 10.0, 8.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.818359375, -3.690521240234375, -3.56268310546875, -3.434844970703125, -3.3070068359375, -3.179168701171875, -3.05133056640625, -2.923492431640625, -2.795654296875, -2.667816162109375, -2.53997802734375, -2.412139892578125, -2.2843017578125, -2.156463623046875, -2.02862548828125, -1.900787353515625, -1.77294921875, -1.645111083984375, -1.51727294921875, -1.389434814453125, -1.2615966796875, -1.133758544921875, -1.00592041015625, -0.878082275390625, -0.750244140625, -0.622406005859375, -0.49456787109375, -0.366729736328125, -0.2388916015625, -0.111053466796875, 0.01678466796875, 0.144622802734375, 0.2724609375, 0.400299072265625, 0.52813720703125, 0.655975341796875, 0.7838134765625, 0.911651611328125, 1.03948974609375, 1.167327880859375, 1.295166015625, 1.423004150390625, 1.55084228515625, 1.678680419921875, 1.8065185546875, 1.934356689453125, 2.06219482421875, 2.190032958984375, 2.31787109375, 2.445709228515625, 2.57354736328125, 2.701385498046875, 2.8292236328125, 2.957061767578125, 3.08489990234375, 3.212738037109375, 3.340576171875, 3.468414306640625, 3.59625244140625, 3.724090576171875, 3.8519287109375, 3.979766845703125, 4.10760498046875, 4.235443115234375, 4.36328125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 6.0, 11.0, 7.0, 11.0, 24.0, 32.0, 38.0, 44.0, 93.0, 113.0, 172.0, 280.0, 370.0, 594.0, 1073.0, 1751.0, 3026.0, 5976.0, 11974.0, 25643.0, 59425.0, 137638.0, 271998.0, 275554.0, 140478.0, 60043.0, 26306.0, 11978.0, 6074.0, 3128.0, 1796.0, 1047.0, 622.0, 388.0, 258.0, 186.0, 123.0, 71.0, 61.0, 36.0, 39.0, 25.0, 16.0, 7.0, 6.0, 12.0, 5.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.84765625, -5.66497802734375, -5.4822998046875, -5.29962158203125, -5.116943359375, -4.93426513671875, -4.7515869140625, -4.56890869140625, -4.38623046875, -4.20355224609375, -4.0208740234375, -3.83819580078125, -3.655517578125, -3.47283935546875, -3.2901611328125, -3.10748291015625, -2.9248046875, -2.74212646484375, -2.5594482421875, -2.37677001953125, -2.194091796875, -2.01141357421875, -1.8287353515625, -1.64605712890625, -1.46337890625, -1.28070068359375, -1.0980224609375, -0.91534423828125, -0.732666015625, -0.54998779296875, -0.3673095703125, -0.18463134765625, -0.001953125, 0.18072509765625, 0.3634033203125, 0.54608154296875, 0.728759765625, 0.91143798828125, 1.0941162109375, 1.27679443359375, 1.45947265625, 1.64215087890625, 1.8248291015625, 2.00750732421875, 2.190185546875, 2.37286376953125, 2.5555419921875, 2.73822021484375, 2.9208984375, 3.10357666015625, 3.2862548828125, 3.46893310546875, 3.651611328125, 3.83428955078125, 4.0169677734375, 4.19964599609375, 4.38232421875, 4.56500244140625, 4.7476806640625, 4.93035888671875, 5.113037109375, 5.29571533203125, 5.4783935546875, 5.66107177734375, 5.84375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 6.0, 1.0, 5.0, 7.0, 10.0, 11.0, 12.0, 13.0, 9.0, 15.0, 18.0, 32.0, 24.0, 32.0, 28.0, 26.0, 53.0, 35.0, 38.0, 51.0, 46.0, 33.0, 39.0, 31.0, 39.0, 49.0, 42.0, 37.0, 34.0, 29.0, 32.0, 21.0, 27.0, 15.0, 19.0, 16.0, 7.0, 18.0, 6.0, 10.0, 5.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.693359375, -2.61199951171875, -2.5306396484375, -2.44927978515625, -2.367919921875, -2.28656005859375, -2.2052001953125, -2.12384033203125, -2.04248046875, -1.96112060546875, -1.8797607421875, -1.79840087890625, -1.717041015625, -1.63568115234375, -1.5543212890625, -1.47296142578125, -1.3916015625, -1.31024169921875, -1.2288818359375, -1.14752197265625, -1.066162109375, -0.98480224609375, -0.9034423828125, -0.82208251953125, -0.74072265625, -0.65936279296875, -0.5780029296875, -0.49664306640625, -0.415283203125, -0.33392333984375, -0.2525634765625, -0.17120361328125, -0.08984375, -0.00848388671875, 0.0728759765625, 0.15423583984375, 0.235595703125, 0.31695556640625, 0.3983154296875, 0.47967529296875, 0.56103515625, 0.64239501953125, 0.7237548828125, 0.80511474609375, 0.886474609375, 0.96783447265625, 1.0491943359375, 1.13055419921875, 1.2119140625, 1.29327392578125, 1.3746337890625, 1.45599365234375, 1.537353515625, 1.61871337890625, 1.7000732421875, 1.78143310546875, 1.86279296875, 1.94415283203125, 2.0255126953125, 2.10687255859375, 2.188232421875, 2.26959228515625, 2.3509521484375, 2.43231201171875, 2.513671875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 11.0, 10.0, 11.0, 11.0, 17.0, 21.0, 35.0, 58.0, 81.0, 116.0, 152.0, 214.0, 355.0, 581.0, 1013.0, 1610.0, 2937.0, 5401.0, 10601.0, 22353.0, 48793.0, 111684.0, 236408.0, 296435.0, 168395.0, 75114.0, 33306.0, 15526.0, 7697.0, 4071.0, 2200.0, 1237.0, 730.0, 433.0, 319.0, 195.0, 135.0, 99.0, 53.0, 44.0, 28.0, 21.0, 14.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.509765625, -2.429473876953125, -2.34918212890625, -2.268890380859375, -2.1885986328125, -2.108306884765625, -2.02801513671875, -1.947723388671875, -1.867431640625, -1.787139892578125, -1.70684814453125, -1.626556396484375, -1.5462646484375, -1.465972900390625, -1.38568115234375, -1.305389404296875, -1.22509765625, -1.144805908203125, -1.06451416015625, -0.984222412109375, -0.9039306640625, -0.823638916015625, -0.74334716796875, -0.663055419921875, -0.582763671875, -0.502471923828125, -0.42218017578125, -0.341888427734375, -0.2615966796875, -0.181304931640625, -0.10101318359375, -0.020721435546875, 0.0595703125, 0.139862060546875, 0.22015380859375, 0.300445556640625, 0.3807373046875, 0.461029052734375, 0.54132080078125, 0.621612548828125, 0.701904296875, 0.782196044921875, 0.86248779296875, 0.942779541015625, 1.0230712890625, 1.103363037109375, 1.18365478515625, 1.263946533203125, 1.34423828125, 1.424530029296875, 1.50482177734375, 1.585113525390625, 1.6654052734375, 1.745697021484375, 1.82598876953125, 1.906280517578125, 1.986572265625, 2.066864013671875, 2.14715576171875, 2.227447509765625, 2.3077392578125, 2.388031005859375, 2.46832275390625, 2.548614501953125, 2.62890625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 1.0, 1.0, 7.0, 5.0, 5.0, 5.0, 10.0, 9.0, 14.0, 13.0, 9.0, 21.0, 27.0, 26.0, 27.0, 30.0, 54.0, 42.0, 65.0, 53.0, 48.0, 57.0, 53.0, 54.0, 52.0, 59.0, 43.0, 31.0, 21.0, 38.0, 22.0, 19.0, 14.0, 17.0, 12.0, 11.0, 0.0, 6.0, 7.0, 12.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.98377799987793e-05, -9.724870324134827e-05, -9.465962648391724e-05, -9.20705497264862e-05, -8.948147296905518e-05, -8.689239621162415e-05, -8.430331945419312e-05, -8.171424269676208e-05, -7.912516593933105e-05, -7.653608918190002e-05, -7.3947012424469e-05, -7.135793566703796e-05, -6.876885890960693e-05, -6.61797821521759e-05, -6.359070539474487e-05, -6.100162863731384e-05, -5.841255187988281e-05, -5.582347512245178e-05, -5.323439836502075e-05, -5.064532160758972e-05, -4.805624485015869e-05, -4.546716809272766e-05, -4.287809133529663e-05, -4.02890145778656e-05, -3.769993782043457e-05, -3.511086106300354e-05, -3.252178430557251e-05, -2.993270754814148e-05, -2.734363079071045e-05, -2.475455403327942e-05, -2.216547727584839e-05, -1.957640051841736e-05, -1.6987323760986328e-05, -1.4398247003555298e-05, -1.1809170246124268e-05, -9.220093488693237e-06, -6.631016731262207e-06, -4.041939973831177e-06, -1.4528632164001465e-06, 1.1362135410308838e-06, 3.725290298461914e-06, 6.314367055892944e-06, 8.903443813323975e-06, 1.1492520570755005e-05, 1.4081597328186035e-05, 1.6670674085617065e-05, 1.9259750843048096e-05, 2.1848827600479126e-05, 2.4437904357910156e-05, 2.7026981115341187e-05, 2.9616057872772217e-05, 3.220513463020325e-05, 3.479421138763428e-05, 3.738328814506531e-05, 3.997236490249634e-05, 4.256144165992737e-05, 4.51505184173584e-05, 4.773959517478943e-05, 5.032867193222046e-05, 5.291774868965149e-05, 5.550682544708252e-05, 5.809590220451355e-05, 6.068497896194458e-05, 6.327405571937561e-05, 6.586313247680664e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 11.0, 22.0, 22.0, 53.0, 69.0, 143.0, 258.0, 391.0, 698.0, 1248.0, 2268.0, 4146.0, 7844.0, 15136.0, 28895.0, 55253.0, 102177.0, 167691.0, 213372.0, 186004.0, 121175.0, 67031.0, 35747.0, 18298.0, 9503.0, 4932.0, 2644.0, 1508.0, 850.0, 481.0, 260.0, 142.0, 105.0, 67.0, 42.0, 18.0, 13.0, 9.0, 9.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8828125, -1.8251495361328125, -1.767486572265625, -1.7098236083984375, -1.65216064453125, -1.5944976806640625, -1.536834716796875, -1.4791717529296875, -1.4215087890625, -1.3638458251953125, -1.306182861328125, -1.2485198974609375, -1.19085693359375, -1.1331939697265625, -1.075531005859375, -1.0178680419921875, -0.960205078125, -0.9025421142578125, -0.844879150390625, -0.7872161865234375, -0.72955322265625, -0.6718902587890625, -0.614227294921875, -0.5565643310546875, -0.4989013671875, -0.4412384033203125, -0.383575439453125, -0.3259124755859375, -0.26824951171875, -0.2105865478515625, -0.152923583984375, -0.0952606201171875, -0.03759765625, 0.0200653076171875, 0.077728271484375, 0.1353912353515625, 0.19305419921875, 0.2507171630859375, 0.308380126953125, 0.3660430908203125, 0.4237060546875, 0.4813690185546875, 0.539031982421875, 0.5966949462890625, 0.65435791015625, 0.7120208740234375, 0.769683837890625, 0.8273468017578125, 0.885009765625, 0.9426727294921875, 1.000335693359375, 1.0579986572265625, 1.11566162109375, 1.1733245849609375, 1.230987548828125, 1.2886505126953125, 1.3463134765625, 1.4039764404296875, 1.461639404296875, 1.5193023681640625, 1.57696533203125, 1.6346282958984375, 1.692291259765625, 1.7499542236328125, 1.8076171875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 12.0, 19.0, 14.0, 12.0, 10.0, 26.0, 28.0, 28.0, 30.0, 32.0, 43.0, 39.0, 41.0, 46.0, 48.0, 57.0, 42.0, 55.0, 47.0, 42.0, 38.0, 40.0, 42.0, 23.0, 30.0, 26.0, 30.0, 20.0, 17.0, 15.0, 5.0, 7.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.447509765625, -0.4327201843261719, -0.41793060302734375, -0.4031410217285156, -0.3883514404296875, -0.3735618591308594, -0.35877227783203125, -0.3439826965332031, -0.329193115234375, -0.3144035339355469, -0.29961395263671875, -0.2848243713378906, -0.2700347900390625, -0.2552452087402344, -0.24045562744140625, -0.22566604614257812, -0.21087646484375, -0.19608688354492188, -0.18129730224609375, -0.16650772094726562, -0.1517181396484375, -0.13692855834960938, -0.12213897705078125, -0.10734939575195312, -0.092559814453125, -0.07777023315429688, -0.06298065185546875, -0.048191070556640625, -0.0334014892578125, -0.018611907958984375, -0.00382232666015625, 0.010967254638671875, 0.0257568359375, 0.040546417236328125, 0.05533599853515625, 0.07012557983398438, 0.0849151611328125, 0.09970474243164062, 0.11449432373046875, 0.12928390502929688, 0.144073486328125, 0.15886306762695312, 0.17365264892578125, 0.18844223022460938, 0.2032318115234375, 0.21802139282226562, 0.23281097412109375, 0.24760055541992188, 0.26239013671875, 0.2771797180175781, 0.29196929931640625, 0.3067588806152344, 0.3215484619140625, 0.3363380432128906, 0.35112762451171875, 0.3659172058105469, 0.380706787109375, 0.3954963684082031, 0.41028594970703125, 0.4250755310058594, 0.4398651123046875, 0.4546546936035156, 0.46944427490234375, 0.4842338562011719, 0.4990234375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 6.0, 7.0, 9.0, 8.0, 12.0, 11.0, 13.0, 22.0, 28.0, 20.0, 34.0, 32.0, 39.0, 55.0, 64.0, 59.0, 71.0, 72.0, 59.0, 55.0, 61.0, 44.0, 44.0, 40.0, 30.0, 19.0, 14.0, 16.0, 17.0, 3.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.729515075683594, -6.509955883026123, -6.2903971672058105, -6.07083797454834, -5.851278781890869, -5.631719589233398, -5.412160873413086, -5.192601680755615, -4.9730424880981445, -4.753483295440674, -4.533924579620361, -4.314365386962891, -4.09480619430542, -3.8752472400665283, -3.6556882858276367, -3.436129093170166, -3.2165703773498535, -2.997011423110962, -2.777452230453491, -2.5578932762145996, -2.338334083557129, -2.1187751293182373, -1.8992161750793457, -1.6796571016311646, -1.4600980281829834, -1.2405389547348022, -1.020979881286621, -0.8014209270477295, -0.5818618535995483, -0.3623027801513672, -0.14274382591247559, 0.07681524753570557, 0.2963738441467285, 0.5159329175949097, 0.735491931438446, 0.9550509452819824, 1.1746100187301636, 1.3941690921783447, 1.6137280464172363, 1.8332871198654175, 2.0528461933135986, 2.2724051475524902, 2.491964340209961, 2.7115232944488525, 2.931082248687744, 3.150641441345215, 3.3702003955841064, 3.589759349822998, 3.8093185424804688, 4.0288777351379395, 4.248436450958252, 4.467995643615723, 4.687554836273193, 4.907114028930664, 5.126672744750977, 5.346231937408447, 5.565791130065918, 5.785350322723389, 6.004909038543701, 6.224468231201172, 6.444027423858643, 6.663586616516113, 6.883145332336426, 7.1027045249938965, 7.322263240814209]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 6.0, 3.0, 4.0, 7.0, 7.0, 5.0, 16.0, 12.0, 11.0, 17.0, 9.0, 23.0, 17.0, 24.0, 30.0, 29.0, 24.0, 32.0, 34.0, 24.0, 34.0, 40.0, 38.0, 34.0, 48.0, 29.0, 43.0, 27.0, 29.0, 40.0, 32.0, 38.0, 33.0, 19.0, 30.0, 21.0, 19.0, 21.0, 9.0, 15.0, 11.0, 13.0, 11.0, 11.0, 8.0, 4.0, 4.0, 7.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4440343379974365, -3.3310611248016357, -3.218087911605835, -3.105114459991455, -2.9921412467956543, -2.8791680335998535, -2.7661948204040527, -2.653221607208252, -2.540248394012451, -2.4272751808166504, -2.3143019676208496, -2.201328754425049, -2.088355302810669, -1.9753820896148682, -1.8624088764190674, -1.7494356632232666, -1.6364622116088867, -1.523488998413086, -1.4105156660079956, -1.2975424528121948, -1.1845691204071045, -1.0715959072113037, -0.9586226940155029, -0.8456494212150574, -0.7326761484146118, -0.6197028756141663, -0.5067296028137207, -0.3937563896179199, -0.28078311681747437, -0.1678098440170288, -0.05483663082122803, 0.05813664197921753, 0.1711101531982422, 0.28408342599868774, 0.3970566689968109, 0.5100299119949341, 0.6230031847953796, 0.7359764575958252, 0.848949670791626, 0.9619229435920715, 1.074896216392517, 1.1878694295883179, 1.3008427619934082, 1.413815975189209, 1.5267891883850098, 1.6397625207901, 1.7527357339859009, 1.8657090663909912, 1.978682279586792, 2.0916554927825928, 2.2046287059783936, 2.3176021575927734, 2.430575370788574, 2.543548583984375, 2.656521797180176, 2.7694950103759766, 2.8824682235717773, 2.995441436767578, 3.108414649963379, 3.2213878631591797, 3.3343613147735596, 3.4473345279693604, 3.560307741165161, 3.673280954360962, 3.786254405975342]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 12.0, 13.0, 11.0, 26.0, 27.0, 56.0, 60.0, 105.0, 153.0, 225.0, 371.0, 577.0, 899.0, 1388.0, 2164.0, 3361.0, 5372.0, 8214.0, 12873.0, 19885.0, 29992.0, 44816.0, 65159.0, 89238.0, 114590.0, 131124.0, 130046.0, 112706.0, 87003.0, 62815.0, 42979.0, 29180.0, 18715.0, 12200.0, 7953.0, 5178.0, 3236.0, 2119.0, 1311.0, 836.0, 519.0, 343.0, 238.0, 155.0, 100.0, 67.0, 40.0, 37.0, 26.0, 21.0, 4.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0], "bins": [-3.3515625, -3.249847412109375, -3.14813232421875, -3.046417236328125, -2.9447021484375, -2.842987060546875, -2.74127197265625, -2.639556884765625, -2.537841796875, -2.436126708984375, -2.33441162109375, -2.232696533203125, -2.1309814453125, -2.029266357421875, -1.92755126953125, -1.825836181640625, -1.72412109375, -1.622406005859375, -1.52069091796875, -1.418975830078125, -1.3172607421875, -1.215545654296875, -1.11383056640625, -1.012115478515625, -0.910400390625, -0.808685302734375, -0.70697021484375, -0.605255126953125, -0.5035400390625, -0.401824951171875, -0.30010986328125, -0.198394775390625, -0.0966796875, 0.005035400390625, 0.10675048828125, 0.208465576171875, 0.3101806640625, 0.411895751953125, 0.51361083984375, 0.615325927734375, 0.717041015625, 0.818756103515625, 0.92047119140625, 1.022186279296875, 1.1239013671875, 1.225616455078125, 1.32733154296875, 1.429046630859375, 1.53076171875, 1.632476806640625, 1.73419189453125, 1.835906982421875, 1.9376220703125, 2.039337158203125, 2.14105224609375, 2.242767333984375, 2.344482421875, 2.446197509765625, 2.54791259765625, 2.649627685546875, 2.7513427734375, 2.853057861328125, 2.95477294921875, 3.056488037109375, 3.158203125]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 10.0, 13.0, 10.0, 19.0, 14.0, 16.0, 25.0, 22.0, 32.0, 30.0, 33.0, 35.0, 48.0, 39.0, 38.0, 48.0, 38.0, 58.0, 48.0, 37.0, 42.0, 41.0, 42.0, 34.0, 38.0, 35.0, 21.0, 16.0, 29.0, 12.0, 13.0, 16.0, 13.0, 11.0, 3.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.67578125, -4.53057861328125, -4.3853759765625, -4.24017333984375, -4.094970703125, -3.94976806640625, -3.8045654296875, -3.65936279296875, -3.51416015625, -3.36895751953125, -3.2237548828125, -3.07855224609375, -2.933349609375, -2.78814697265625, -2.6429443359375, -2.49774169921875, -2.3525390625, -2.20733642578125, -2.0621337890625, -1.91693115234375, -1.771728515625, -1.62652587890625, -1.4813232421875, -1.33612060546875, -1.19091796875, -1.04571533203125, -0.9005126953125, -0.75531005859375, -0.610107421875, -0.46490478515625, -0.3197021484375, -0.17449951171875, -0.029296875, 0.11590576171875, 0.2611083984375, 0.40631103515625, 0.551513671875, 0.69671630859375, 0.8419189453125, 0.98712158203125, 1.13232421875, 1.27752685546875, 1.4227294921875, 1.56793212890625, 1.713134765625, 1.85833740234375, 2.0035400390625, 2.14874267578125, 2.2939453125, 2.43914794921875, 2.5843505859375, 2.72955322265625, 2.874755859375, 3.01995849609375, 3.1651611328125, 3.31036376953125, 3.45556640625, 3.60076904296875, 3.7459716796875, 3.89117431640625, 4.036376953125, 4.18157958984375, 4.3267822265625, 4.47198486328125, 4.6171875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 9.0, 10.0, 11.0, 11.0, 30.0, 52.0, 75.0, 125.0, 175.0, 303.0, 450.0, 797.0, 1284.0, 2201.0, 3728.0, 6344.0, 10927.0, 18444.0, 31120.0, 50887.0, 80251.0, 117382.0, 150397.0, 160290.0, 139068.0, 102209.0, 67888.0, 42342.0, 25199.0, 15186.0, 8742.0, 5049.0, 3032.0, 1801.0, 1082.0, 646.0, 380.0, 255.0, 122.0, 106.0, 47.0, 39.0, 22.0, 14.0, 9.0, 12.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.47265625, -3.358062744140625, -3.24346923828125, -3.128875732421875, -3.0142822265625, -2.899688720703125, -2.78509521484375, -2.670501708984375, -2.555908203125, -2.441314697265625, -2.32672119140625, -2.212127685546875, -2.0975341796875, -1.982940673828125, -1.86834716796875, -1.753753662109375, -1.63916015625, -1.524566650390625, -1.40997314453125, -1.295379638671875, -1.1807861328125, -1.066192626953125, -0.95159912109375, -0.837005615234375, -0.722412109375, -0.607818603515625, -0.49322509765625, -0.378631591796875, -0.2640380859375, -0.149444580078125, -0.03485107421875, 0.079742431640625, 0.1943359375, 0.308929443359375, 0.42352294921875, 0.538116455078125, 0.6527099609375, 0.767303466796875, 0.88189697265625, 0.996490478515625, 1.111083984375, 1.225677490234375, 1.34027099609375, 1.454864501953125, 1.5694580078125, 1.684051513671875, 1.79864501953125, 1.913238525390625, 2.02783203125, 2.142425537109375, 2.25701904296875, 2.371612548828125, 2.4862060546875, 2.600799560546875, 2.71539306640625, 2.829986572265625, 2.944580078125, 3.059173583984375, 3.17376708984375, 3.288360595703125, 3.4029541015625, 3.517547607421875, 3.63214111328125, 3.746734619140625, 3.861328125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 6.0, 3.0, 3.0, 10.0, 14.0, 6.0, 17.0, 14.0, 10.0, 14.0, 18.0, 15.0, 16.0, 30.0, 35.0, 22.0, 36.0, 37.0, 38.0, 36.0, 39.0, 48.0, 29.0, 43.0, 42.0, 33.0, 48.0, 39.0, 42.0, 43.0, 32.0, 28.0, 23.0, 27.0, 15.0, 17.0, 14.0, 9.0, 11.0, 9.0, 6.0, 4.0, 7.0, 0.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0], "bins": [-2.705078125, -2.62603759765625, -2.5469970703125, -2.46795654296875, -2.388916015625, -2.30987548828125, -2.2308349609375, -2.15179443359375, -2.07275390625, -1.99371337890625, -1.9146728515625, -1.83563232421875, -1.756591796875, -1.67755126953125, -1.5985107421875, -1.51947021484375, -1.4404296875, -1.36138916015625, -1.2823486328125, -1.20330810546875, -1.124267578125, -1.04522705078125, -0.9661865234375, -0.88714599609375, -0.80810546875, -0.72906494140625, -0.6500244140625, -0.57098388671875, -0.491943359375, -0.41290283203125, -0.3338623046875, -0.25482177734375, -0.17578125, -0.09674072265625, -0.0177001953125, 0.06134033203125, 0.140380859375, 0.21942138671875, 0.2984619140625, 0.37750244140625, 0.45654296875, 0.53558349609375, 0.6146240234375, 0.69366455078125, 0.772705078125, 0.85174560546875, 0.9307861328125, 1.00982666015625, 1.0888671875, 1.16790771484375, 1.2469482421875, 1.32598876953125, 1.405029296875, 1.48406982421875, 1.5631103515625, 1.64215087890625, 1.72119140625, 1.80023193359375, 1.8792724609375, 1.95831298828125, 2.037353515625, 2.11639404296875, 2.1954345703125, 2.27447509765625, 2.353515625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 7.0, 8.0, 15.0, 18.0, 27.0, 48.0, 59.0, 77.0, 132.0, 163.0, 282.0, 398.0, 650.0, 937.0, 1494.0, 2463.0, 3846.0, 6478.0, 10698.0, 18872.0, 33004.0, 58539.0, 101316.0, 156439.0, 192381.0, 173292.0, 119685.0, 71013.0, 40150.0, 22858.0, 13097.0, 7589.0, 4695.0, 2768.0, 1799.0, 1095.0, 687.0, 499.0, 330.0, 215.0, 144.0, 96.0, 69.0, 41.0, 30.0, 24.0, 13.0, 9.0, 8.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.458984375, -2.385955810546875, -2.31292724609375, -2.239898681640625, -2.1668701171875, -2.093841552734375, -2.02081298828125, -1.947784423828125, -1.874755859375, -1.801727294921875, -1.72869873046875, -1.655670166015625, -1.5826416015625, -1.509613037109375, -1.43658447265625, -1.363555908203125, -1.29052734375, -1.217498779296875, -1.14447021484375, -1.071441650390625, -0.9984130859375, -0.925384521484375, -0.85235595703125, -0.779327392578125, -0.706298828125, -0.633270263671875, -0.56024169921875, -0.487213134765625, -0.4141845703125, -0.341156005859375, -0.26812744140625, -0.195098876953125, -0.1220703125, -0.049041748046875, 0.02398681640625, 0.097015380859375, 0.1700439453125, 0.243072509765625, 0.31610107421875, 0.389129638671875, 0.462158203125, 0.535186767578125, 0.60821533203125, 0.681243896484375, 0.7542724609375, 0.827301025390625, 0.90032958984375, 0.973358154296875, 1.04638671875, 1.119415283203125, 1.19244384765625, 1.265472412109375, 1.3385009765625, 1.411529541015625, 1.48455810546875, 1.557586669921875, 1.630615234375, 1.703643798828125, 1.77667236328125, 1.849700927734375, 1.9227294921875, 1.995758056640625, 2.06878662109375, 2.141815185546875, 2.21484375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 3.0, 5.0, 8.0, 8.0, 6.0, 14.0, 10.0, 12.0, 28.0, 27.0, 23.0, 31.0, 27.0, 40.0, 44.0, 55.0, 57.0, 50.0, 61.0, 61.0, 48.0, 49.0, 46.0, 39.0, 32.0, 31.0, 35.0, 17.0, 25.0, 19.0, 16.0, 12.0, 9.0, 9.0, 10.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00018680095672607422, -0.0001807641237974167, -0.00017472729086875916, -0.00016869045794010162, -0.0001626536250114441, -0.00015661679208278656, -0.00015057995915412903, -0.0001445431262254715, -0.00013850629329681396, -0.00013246946036815643, -0.0001264326274394989, -0.00012039579451084137, -0.00011435896158218384, -0.0001083221286535263, -0.00010228529572486877, -9.624846279621124e-05, -9.021162986755371e-05, -8.417479693889618e-05, -7.813796401023865e-05, -7.210113108158112e-05, -6.606429815292358e-05, -6.002746522426605e-05, -5.399063229560852e-05, -4.795379936695099e-05, -4.191696643829346e-05, -3.5880133509635925e-05, -2.9843300580978394e-05, -2.3806467652320862e-05, -1.776963472366333e-05, -1.1732801795005798e-05, -5.695968866348267e-06, 3.4086406230926514e-07, 6.377696990966797e-06, 1.2414529919624329e-05, 1.845136284828186e-05, 2.4488195776939392e-05, 3.0525028705596924e-05, 3.6561861634254456e-05, 4.259869456291199e-05, 4.863552749156952e-05, 5.467236042022705e-05, 6.070919334888458e-05, 6.674602627754211e-05, 7.278285920619965e-05, 7.881969213485718e-05, 8.485652506351471e-05, 9.089335799217224e-05, 9.693019092082977e-05, 0.0001029670238494873, 0.00010900385677814484, 0.00011504068970680237, 0.0001210775226354599, 0.00012711435556411743, 0.00013315118849277496, 0.0001391880214214325, 0.00014522485435009003, 0.00015126168727874756, 0.0001572985202074051, 0.00016333535313606262, 0.00016937218606472015, 0.00017540901899337769, 0.00018144585192203522, 0.00018748268485069275, 0.00019351951777935028, 0.0001995563507080078]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 9.0, 4.0, 8.0, 13.0, 16.0, 8.0, 28.0, 39.0, 55.0, 77.0, 132.0, 172.0, 265.0, 402.0, 704.0, 1140.0, 2052.0, 3677.0, 6756.0, 12743.0, 24554.0, 49130.0, 94680.0, 163197.0, 216364.0, 198193.0, 128896.0, 70131.0, 35612.0, 18247.0, 9427.0, 5082.0, 2785.0, 1541.0, 914.0, 544.0, 307.0, 208.0, 149.0, 81.0, 58.0, 34.0, 26.0, 14.0, 12.0, 15.0, 12.0, 10.0, 9.0, 8.0, 4.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-2.6484375, -2.5650634765625, -2.481689453125, -2.3983154296875, -2.31494140625, -2.2315673828125, -2.148193359375, -2.0648193359375, -1.9814453125, -1.8980712890625, -1.814697265625, -1.7313232421875, -1.64794921875, -1.5645751953125, -1.481201171875, -1.3978271484375, -1.314453125, -1.2310791015625, -1.147705078125, -1.0643310546875, -0.98095703125, -0.8975830078125, -0.814208984375, -0.7308349609375, -0.6474609375, -0.5640869140625, -0.480712890625, -0.3973388671875, -0.31396484375, -0.2305908203125, -0.147216796875, -0.0638427734375, 0.01953125, 0.1029052734375, 0.186279296875, 0.2696533203125, 0.35302734375, 0.4364013671875, 0.519775390625, 0.6031494140625, 0.6865234375, 0.7698974609375, 0.853271484375, 0.9366455078125, 1.02001953125, 1.1033935546875, 1.186767578125, 1.2701416015625, 1.353515625, 1.4368896484375, 1.520263671875, 1.6036376953125, 1.68701171875, 1.7703857421875, 1.853759765625, 1.9371337890625, 2.0205078125, 2.1038818359375, 2.187255859375, 2.2706298828125, 2.35400390625, 2.4373779296875, 2.520751953125, 2.6041259765625, 2.6875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 8.0, 12.0, 16.0, 20.0, 28.0, 30.0, 42.0, 47.0, 44.0, 42.0, 51.0, 56.0, 60.0, 64.0, 60.0, 63.0, 44.0, 48.0, 40.0, 43.0, 37.0, 28.0, 26.0, 16.0, 19.0, 8.0, 5.0, 6.0, 10.0, 9.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8317031860351562, -0.8045196533203125, -0.7773361206054688, -0.750152587890625, -0.7229690551757812, -0.6957855224609375, -0.6686019897460938, -0.64141845703125, -0.6142349243164062, -0.5870513916015625, -0.5598678588867188, -0.532684326171875, -0.5055007934570312, -0.4783172607421875, -0.45113372802734375, -0.4239501953125, -0.39676666259765625, -0.3695831298828125, -0.34239959716796875, -0.315216064453125, -0.28803253173828125, -0.2608489990234375, -0.23366546630859375, -0.20648193359375, -0.17929840087890625, -0.1521148681640625, -0.12493133544921875, -0.097747802734375, -0.07056427001953125, -0.0433807373046875, -0.01619720458984375, 0.010986328125, 0.03816986083984375, 0.0653533935546875, 0.09253692626953125, 0.119720458984375, 0.14690399169921875, 0.1740875244140625, 0.20127105712890625, 0.22845458984375, 0.25563812255859375, 0.2828216552734375, 0.31000518798828125, 0.337188720703125, 0.36437225341796875, 0.3915557861328125, 0.41873931884765625, 0.4459228515625, 0.47310638427734375, 0.5002899169921875, 0.5274734497070312, 0.554656982421875, 0.5818405151367188, 0.6090240478515625, 0.6362075805664062, 0.66339111328125, 0.6905746459960938, 0.7177581787109375, 0.7449417114257812, 0.772125244140625, 0.7993087768554688, 0.8264923095703125, 0.8536758422851562, 0.880859375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 1.0, 10.0, 6.0, 4.0, 5.0, 8.0, 13.0, 12.0, 22.0, 15.0, 19.0, 29.0, 31.0, 49.0, 42.0, 58.0, 54.0, 57.0, 55.0, 66.0, 54.0, 61.0, 56.0, 49.0, 40.0, 42.0, 31.0, 16.0, 26.0, 11.0, 8.0, 11.0, 11.0, 8.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.5597333908081055, -6.353708267211914, -6.1476826667785645, -5.941657543182373, -5.735631942749023, -5.529606819152832, -5.323581695556641, -5.117556571960449, -4.9115309715271, -4.705505847930908, -4.499480247497559, -4.293455123901367, -4.087430000305176, -3.881404399871826, -3.6753792762756348, -3.4693539142608643, -3.2633285522460938, -3.0573031902313232, -2.8512778282165527, -2.6452527046203613, -2.439227342605591, -2.2332019805908203, -2.027176856994629, -1.8211514949798584, -1.615126132965088, -1.4091007709503174, -1.2030755281448364, -0.9970502257347107, -0.791024923324585, -0.5849995613098145, -0.3789743185043335, -0.17294907569885254, 0.03307628631591797, 0.2391015887260437, 0.44512689113616943, 0.6511521935462952, 0.8571774959564209, 1.0632028579711914, 1.2692281007766724, 1.4752533435821533, 1.6812787055969238, 1.8873040676116943, 2.093329429626465, 2.2993545532226562, 2.5053799152374268, 2.7114052772521973, 2.9174304008483887, 3.123455762863159, 3.3294811248779297, 3.5355064868927, 3.7415318489074707, 3.947556972503662, 4.153582572937012, 4.359607696533203, 4.5656328201293945, 4.771657943725586, 4.9776835441589355, 5.183708667755127, 5.389734268188477, 5.595759391784668, 5.801784515380859, 6.007810115814209, 6.2138352394104, 6.41986083984375, 6.625885963439941]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 2.0, 4.0, 7.0, 4.0, 13.0, 16.0, 11.0, 7.0, 23.0, 11.0, 11.0, 22.0, 20.0, 27.0, 24.0, 30.0, 38.0, 27.0, 45.0, 47.0, 44.0, 41.0, 45.0, 44.0, 35.0, 47.0, 32.0, 35.0, 25.0, 19.0, 32.0, 33.0, 27.0, 30.0, 24.0, 10.0, 17.0, 8.0, 23.0, 14.0, 5.0, 5.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.7564151287078857, -3.6334409713745117, -3.5104668140411377, -3.3874926567077637, -3.2645184993743896, -3.1415443420410156, -3.0185699462890625, -2.8955960273742676, -2.7726216316223145, -2.6496474742889404, -2.5266733169555664, -2.4036991596221924, -2.2807250022888184, -2.1577508449554443, -2.0347766876220703, -1.9118024110794067, -1.7888283729553223, -1.6658542156219482, -1.5428800582885742, -1.4199059009552002, -1.2969317436218262, -1.1739575862884521, -1.0509833097457886, -0.9280091524124146, -0.8050349950790405, -0.6820608377456665, -0.5590866804122925, -0.4361124634742737, -0.31313830614089966, -0.19016414880752563, -0.06718993186950684, 0.05578422546386719, 0.1787581443786621, 0.30173230171203613, 0.42470648884773254, 0.547680675983429, 0.670654833316803, 0.793628990650177, 0.9166032075881958, 1.0395773649215698, 1.1625515222549438, 1.2855256795883179, 1.408499836921692, 1.5314741134643555, 1.6544482707977295, 1.7774224281311035, 1.9003965854644775, 2.0233707427978516, 2.1463449001312256, 2.2693190574645996, 2.3922932147979736, 2.5152673721313477, 2.6382415294647217, 2.7612156867980957, 2.884190082550049, 3.0071640014648438, 3.130138397216797, 3.253112554550171, 3.376086711883545, 3.499060869216919, 3.622035026550293, 3.745009183883667, 3.867983341217041, 3.990957736968994, 4.113931655883789]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 10.0, 19.0, 22.0, 30.0, 51.0, 62.0, 83.0, 128.0, 184.0, 233.0, 326.0, 441.0, 710.0, 1045.0, 1594.0, 2482.0, 3885.0, 6365.0, 10566.0, 18126.0, 33211.0, 64498.0, 135525.0, 309109.0, 717012.0, 1165761.0, 925460.0, 431697.0, 182455.0, 84255.0, 42637.0, 22699.0, 13077.0, 7660.0, 4612.0, 2842.0, 1826.0, 1171.0, 764.0, 489.0, 360.0, 227.0, 179.0, 115.0, 95.0, 56.0, 40.0, 28.0, 18.0, 10.0, 8.0, 5.0, 10.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.90625, -5.7255859375, -5.544921875, -5.3642578125, -5.18359375, -5.0029296875, -4.822265625, -4.6416015625, -4.4609375, -4.2802734375, -4.099609375, -3.9189453125, -3.73828125, -3.5576171875, -3.376953125, -3.1962890625, -3.015625, -2.8349609375, -2.654296875, -2.4736328125, -2.29296875, -2.1123046875, -1.931640625, -1.7509765625, -1.5703125, -1.3896484375, -1.208984375, -1.0283203125, -0.84765625, -0.6669921875, -0.486328125, -0.3056640625, -0.125, 0.0556640625, 0.236328125, 0.4169921875, 0.59765625, 0.7783203125, 0.958984375, 1.1396484375, 1.3203125, 1.5009765625, 1.681640625, 1.8623046875, 2.04296875, 2.2236328125, 2.404296875, 2.5849609375, 2.765625, 2.9462890625, 3.126953125, 3.3076171875, 3.48828125, 3.6689453125, 3.849609375, 4.0302734375, 4.2109375, 4.3916015625, 4.572265625, 4.7529296875, 4.93359375, 5.1142578125, 5.294921875, 5.4755859375, 5.65625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 12.0, 6.0, 8.0, 8.0, 14.0, 10.0, 21.0, 14.0, 19.0, 20.0, 24.0, 28.0, 38.0, 16.0, 39.0, 37.0, 41.0, 41.0, 33.0, 50.0, 42.0, 42.0, 27.0, 34.0, 43.0, 38.0, 26.0, 23.0, 37.0, 32.0, 23.0, 23.0, 21.0, 19.0, 16.0, 16.0, 7.0, 11.0, 10.0, 4.0, 2.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.525390625, -2.439788818359375, -2.35418701171875, -2.268585205078125, -2.1829833984375, -2.097381591796875, -2.01177978515625, -1.926177978515625, -1.840576171875, -1.754974365234375, -1.66937255859375, -1.583770751953125, -1.4981689453125, -1.412567138671875, -1.32696533203125, -1.241363525390625, -1.15576171875, -1.070159912109375, -0.98455810546875, -0.898956298828125, -0.8133544921875, -0.727752685546875, -0.64215087890625, -0.556549072265625, -0.470947265625, -0.385345458984375, -0.29974365234375, -0.214141845703125, -0.1285400390625, -0.042938232421875, 0.04266357421875, 0.128265380859375, 0.2138671875, 0.299468994140625, 0.38507080078125, 0.470672607421875, 0.5562744140625, 0.641876220703125, 0.72747802734375, 0.813079833984375, 0.898681640625, 0.984283447265625, 1.06988525390625, 1.155487060546875, 1.2410888671875, 1.326690673828125, 1.41229248046875, 1.497894287109375, 1.58349609375, 1.669097900390625, 1.75469970703125, 1.840301513671875, 1.9259033203125, 2.011505126953125, 2.09710693359375, 2.182708740234375, 2.268310546875, 2.353912353515625, 2.43951416015625, 2.525115966796875, 2.6107177734375, 2.696319580078125, 2.78192138671875, 2.867523193359375, 2.953125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 4.0, 12.0, 14.0, 26.0, 32.0, 40.0, 59.0, 91.0, 129.0, 202.0, 332.0, 505.0, 710.0, 1075.0, 1772.0, 2659.0, 4461.0, 7353.0, 12579.0, 22691.0, 41700.0, 81873.0, 170895.0, 379486.0, 830819.0, 1207709.0, 762219.0, 343970.0, 156100.0, 74901.0, 38545.0, 20995.0, 11819.0, 6976.0, 4150.0, 2615.0, 1661.0, 1056.0, 711.0, 449.0, 317.0, 191.0, 129.0, 85.0, 54.0, 34.0, 34.0, 13.0, 11.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.6328125, -6.4283447265625, -6.223876953125, -6.0194091796875, -5.81494140625, -5.6104736328125, -5.406005859375, -5.2015380859375, -4.9970703125, -4.7926025390625, -4.588134765625, -4.3836669921875, -4.17919921875, -3.9747314453125, -3.770263671875, -3.5657958984375, -3.361328125, -3.1568603515625, -2.952392578125, -2.7479248046875, -2.54345703125, -2.3389892578125, -2.134521484375, -1.9300537109375, -1.7255859375, -1.5211181640625, -1.316650390625, -1.1121826171875, -0.90771484375, -0.7032470703125, -0.498779296875, -0.2943115234375, -0.08984375, 0.1146240234375, 0.319091796875, 0.5235595703125, 0.72802734375, 0.9324951171875, 1.136962890625, 1.3414306640625, 1.5458984375, 1.7503662109375, 1.954833984375, 2.1593017578125, 2.36376953125, 2.5682373046875, 2.772705078125, 2.9771728515625, 3.181640625, 3.3861083984375, 3.590576171875, 3.7950439453125, 3.99951171875, 4.2039794921875, 4.408447265625, 4.6129150390625, 4.8173828125, 5.0218505859375, 5.226318359375, 5.4307861328125, 5.63525390625, 5.8397216796875, 6.044189453125, 6.2486572265625, 6.453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 10.0, 9.0, 9.0, 5.0, 19.0, 19.0, 35.0, 43.0, 45.0, 74.0, 95.0, 133.0, 159.0, 194.0, 283.0, 323.0, 393.0, 376.0, 374.0, 302.0, 267.0, 209.0, 166.0, 113.0, 88.0, 81.0, 55.0, 62.0, 23.0, 29.0, 17.0, 16.0, 11.0, 11.0, 7.0, 5.0, 5.0, 10.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.16363525390625, -2.0928955078125, -2.02215576171875, -1.951416015625, -1.88067626953125, -1.8099365234375, -1.73919677734375, -1.66845703125, -1.59771728515625, -1.5269775390625, -1.45623779296875, -1.385498046875, -1.31475830078125, -1.2440185546875, -1.17327880859375, -1.1025390625, -1.03179931640625, -0.9610595703125, -0.89031982421875, -0.819580078125, -0.74884033203125, -0.6781005859375, -0.60736083984375, -0.53662109375, -0.46588134765625, -0.3951416015625, -0.32440185546875, -0.253662109375, -0.18292236328125, -0.1121826171875, -0.04144287109375, 0.029296875, 0.10003662109375, 0.1707763671875, 0.24151611328125, 0.312255859375, 0.38299560546875, 0.4537353515625, 0.52447509765625, 0.59521484375, 0.66595458984375, 0.7366943359375, 0.80743408203125, 0.878173828125, 0.94891357421875, 1.0196533203125, 1.09039306640625, 1.1611328125, 1.23187255859375, 1.3026123046875, 1.37335205078125, 1.444091796875, 1.51483154296875, 1.5855712890625, 1.65631103515625, 1.72705078125, 1.79779052734375, 1.8685302734375, 1.93927001953125, 2.010009765625, 2.08074951171875, 2.1514892578125, 2.22222900390625, 2.29296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 10.0, 13.0, 15.0, 11.0, 25.0, 26.0, 27.0, 34.0, 32.0, 63.0, 54.0, 72.0, 75.0, 87.0, 72.0, 67.0, 58.0, 57.0, 37.0, 39.0, 23.0, 24.0, 20.0, 8.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.557711601257324, -9.31735897064209, -9.077007293701172, -8.836654663085938, -8.59630298614502, -8.355950355529785, -8.115598678588867, -7.875246047973633, -7.634894371032715, -7.394542217254639, -7.1541900634765625, -6.913837909698486, -6.67348575592041, -6.433133602142334, -6.192781448364258, -5.952428817749023, -5.712076663970947, -5.471724510192871, -5.231372356414795, -4.991020202636719, -4.750668048858643, -4.510315895080566, -4.269963264465332, -4.029611587524414, -3.789259195327759, -3.5489070415496826, -3.3085548877716064, -3.068202495574951, -2.827850341796875, -2.587498188018799, -2.3471460342407227, -2.1067938804626465, -1.8664422035217285, -1.6260900497436523, -1.3857378959655762, -1.1453856229782104, -0.9050334692001343, -0.6646813154220581, -0.4243290424346924, -0.1839768886566162, 0.05637526512145996, 0.2967274487018585, 0.5370796322822571, 0.777431845664978, 1.0177839994430542, 1.2581361532211304, 1.498488426208496, 1.7388405799865723, 1.9791927337646484, 2.2195448875427246, 2.459897041320801, 2.700249195098877, 2.940601348876953, 3.1809535026550293, 3.4213058948516846, 3.6616580486297607, 3.902010202407837, 4.142362594604492, 4.382714748382568, 4.6230669021606445, 4.863419055938721, 5.103771209716797, 5.344123363494873, 5.584475517272949, 5.824827671051025]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 3.0, 5.0, 9.0, 17.0, 8.0, 8.0, 13.0, 13.0, 15.0, 17.0, 19.0, 20.0, 17.0, 23.0, 32.0, 25.0, 26.0, 35.0, 26.0, 33.0, 33.0, 34.0, 28.0, 36.0, 31.0, 40.0, 42.0, 38.0, 31.0, 29.0, 47.0, 31.0, 20.0, 17.0, 15.0, 26.0, 20.0, 16.0, 23.0, 16.0, 9.0, 10.0, 6.0, 2.0, 13.0, 5.0, 6.0, 4.0, 3.0, 4.0, 0.0, 2.0], "bins": [-3.6355714797973633, -3.5323939323425293, -3.4292166233062744, -3.3260390758514404, -3.2228617668151855, -3.1196842193603516, -3.0165066719055176, -2.9133291244506836, -2.8101518154144287, -2.7069742679595947, -2.60379695892334, -2.500619411468506, -2.397441864013672, -2.294264554977417, -2.191087007522583, -2.087909698486328, -1.9847321510314941, -1.8815547227859497, -1.7783772945404053, -1.6751997470855713, -1.5720223188400269, -1.4688448905944824, -1.3656673431396484, -1.262489914894104, -1.1593124866485596, -1.0561350584030151, -0.9529575705528259, -0.8497800827026367, -0.7466026544570923, -0.6434252262115479, -0.5402477383613586, -0.43707025051116943, -0.3338925838470459, -0.23071512579917908, -0.12753766775131226, -0.024360209703445435, 0.07881724834442139, 0.18199467658996582, 0.28517216444015503, 0.38834965229034424, 0.49152708053588867, 0.5947045087814331, 0.6978819966316223, 0.8010594844818115, 0.904236912727356, 1.0074143409729004, 1.1105918884277344, 1.2137693166732788, 1.3169467449188232, 1.4201241731643677, 1.523301601409912, 1.626479148864746, 1.7296565771102905, 1.832834005355835, 1.936011552810669, 2.039188861846924, 2.142366409301758, 2.245543956756592, 2.3487212657928467, 2.4518988132476807, 2.5550761222839355, 2.6582536697387695, 2.7614312171936035, 2.8646087646484375, 2.9677860736846924]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 14.0, 23.0, 27.0, 23.0, 57.0, 81.0, 123.0, 168.0, 289.0, 388.0, 600.0, 1008.0, 1487.0, 2410.0, 3764.0, 6143.0, 10218.0, 16859.0, 28306.0, 46978.0, 76777.0, 118182.0, 159700.0, 172021.0, 143168.0, 100203.0, 62727.0, 38207.0, 22756.0, 13832.0, 8160.0, 5065.0, 3130.0, 1994.0, 1272.0, 798.0, 514.0, 363.0, 244.0, 151.0, 107.0, 68.0, 43.0, 43.0, 17.0, 17.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.63671875, -2.552459716796875, -2.46820068359375, -2.383941650390625, -2.2996826171875, -2.215423583984375, -2.13116455078125, -2.046905517578125, -1.962646484375, -1.878387451171875, -1.79412841796875, -1.709869384765625, -1.6256103515625, -1.541351318359375, -1.45709228515625, -1.372833251953125, -1.28857421875, -1.204315185546875, -1.12005615234375, -1.035797119140625, -0.9515380859375, -0.867279052734375, -0.78302001953125, -0.698760986328125, -0.614501953125, -0.530242919921875, -0.44598388671875, -0.361724853515625, -0.2774658203125, -0.193206787109375, -0.10894775390625, -0.024688720703125, 0.0595703125, 0.143829345703125, 0.22808837890625, 0.312347412109375, 0.3966064453125, 0.480865478515625, 0.56512451171875, 0.649383544921875, 0.733642578125, 0.817901611328125, 0.90216064453125, 0.986419677734375, 1.0706787109375, 1.154937744140625, 1.23919677734375, 1.323455810546875, 1.40771484375, 1.491973876953125, 1.57623291015625, 1.660491943359375, 1.7447509765625, 1.829010009765625, 1.91326904296875, 1.997528076171875, 2.081787109375, 2.166046142578125, 2.25030517578125, 2.334564208984375, 2.4188232421875, 2.503082275390625, 2.58734130859375, 2.671600341796875, 2.755859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 5.0, 9.0, 8.0, 10.0, 9.0, 14.0, 13.0, 11.0, 23.0, 14.0, 22.0, 27.0, 29.0, 32.0, 28.0, 31.0, 32.0, 43.0, 31.0, 30.0, 46.0, 42.0, 37.0, 48.0, 42.0, 50.0, 36.0, 33.0, 45.0, 25.0, 20.0, 19.0, 18.0, 23.0, 16.0, 14.0, 13.0, 15.0, 8.0, 7.0, 8.0, 8.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.895751953125, -3.76806640625, -3.640380859375, -3.5126953125, -3.385009765625, -3.25732421875, -3.129638671875, -3.001953125, -2.874267578125, -2.74658203125, -2.618896484375, -2.4912109375, -2.363525390625, -2.23583984375, -2.108154296875, -1.98046875, -1.852783203125, -1.72509765625, -1.597412109375, -1.4697265625, -1.342041015625, -1.21435546875, -1.086669921875, -0.958984375, -0.831298828125, -0.70361328125, -0.575927734375, -0.4482421875, -0.320556640625, -0.19287109375, -0.065185546875, 0.0625, 0.190185546875, 0.31787109375, 0.445556640625, 0.5732421875, 0.700927734375, 0.82861328125, 0.956298828125, 1.083984375, 1.211669921875, 1.33935546875, 1.467041015625, 1.5947265625, 1.722412109375, 1.85009765625, 1.977783203125, 2.10546875, 2.233154296875, 2.36083984375, 2.488525390625, 2.6162109375, 2.743896484375, 2.87158203125, 2.999267578125, 3.126953125, 3.254638671875, 3.38232421875, 3.510009765625, 3.6376953125, 3.765380859375, 3.89306640625, 4.020751953125, 4.1484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 12.0, 27.0, 45.0, 67.0, 108.0, 183.0, 311.0, 538.0, 896.0, 1640.0, 3281.0, 6349.0, 13309.0, 28714.0, 64424.0, 142757.0, 265850.0, 263109.0, 139440.0, 63047.0, 28286.0, 12855.0, 6283.0, 3171.0, 1681.0, 909.0, 516.0, 292.0, 159.0, 85.0, 57.0, 50.0, 35.0, 21.0, 4.0, 12.0, 3.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.14453125, -4.9931640625, -4.841796875, -4.6904296875, -4.5390625, -4.3876953125, -4.236328125, -4.0849609375, -3.93359375, -3.7822265625, -3.630859375, -3.4794921875, -3.328125, -3.1767578125, -3.025390625, -2.8740234375, -2.72265625, -2.5712890625, -2.419921875, -2.2685546875, -2.1171875, -1.9658203125, -1.814453125, -1.6630859375, -1.51171875, -1.3603515625, -1.208984375, -1.0576171875, -0.90625, -0.7548828125, -0.603515625, -0.4521484375, -0.30078125, -0.1494140625, 0.001953125, 0.1533203125, 0.3046875, 0.4560546875, 0.607421875, 0.7587890625, 0.91015625, 1.0615234375, 1.212890625, 1.3642578125, 1.515625, 1.6669921875, 1.818359375, 1.9697265625, 2.12109375, 2.2724609375, 2.423828125, 2.5751953125, 2.7265625, 2.8779296875, 3.029296875, 3.1806640625, 3.33203125, 3.4833984375, 3.634765625, 3.7861328125, 3.9375, 4.0888671875, 4.240234375, 4.3916015625, 4.54296875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 9.0, 6.0, 15.0, 19.0, 16.0, 17.0, 23.0, 28.0, 21.0, 27.0, 31.0, 29.0, 43.0, 29.0, 42.0, 38.0, 36.0, 44.0, 36.0, 47.0, 31.0, 35.0, 53.0, 31.0, 36.0, 29.0, 27.0, 21.0, 31.0, 25.0, 17.0, 12.0, 11.0, 13.0, 17.0, 9.0, 10.0, 7.0, 4.0, 4.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.20703125, -2.133636474609375, -2.06024169921875, -1.986846923828125, -1.9134521484375, -1.840057373046875, -1.76666259765625, -1.693267822265625, -1.619873046875, -1.546478271484375, -1.47308349609375, -1.399688720703125, -1.3262939453125, -1.252899169921875, -1.17950439453125, -1.106109619140625, -1.03271484375, -0.959320068359375, -0.88592529296875, -0.812530517578125, -0.7391357421875, -0.665740966796875, -0.59234619140625, -0.518951416015625, -0.445556640625, -0.372161865234375, -0.29876708984375, -0.225372314453125, -0.1519775390625, -0.078582763671875, -0.00518798828125, 0.068206787109375, 0.1416015625, 0.214996337890625, 0.28839111328125, 0.361785888671875, 0.4351806640625, 0.508575439453125, 0.58197021484375, 0.655364990234375, 0.728759765625, 0.802154541015625, 0.87554931640625, 0.948944091796875, 1.0223388671875, 1.095733642578125, 1.16912841796875, 1.242523193359375, 1.31591796875, 1.389312744140625, 1.46270751953125, 1.536102294921875, 1.6094970703125, 1.682891845703125, 1.75628662109375, 1.829681396484375, 1.903076171875, 1.976470947265625, 2.04986572265625, 2.123260498046875, 2.1966552734375, 2.270050048828125, 2.34344482421875, 2.416839599609375, 2.490234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 6.0, 1.0, 4.0, 10.0, 11.0, 21.0, 22.0, 38.0, 38.0, 53.0, 89.0, 93.0, 165.0, 188.0, 308.0, 477.0, 770.0, 1027.0, 1611.0, 2614.0, 3931.0, 6546.0, 10996.0, 19104.0, 35184.0, 67554.0, 131654.0, 232806.0, 238789.0, 137610.0, 70605.0, 36420.0, 20229.0, 11242.0, 6686.0, 4068.0, 2569.0, 1598.0, 1111.0, 714.0, 490.0, 351.0, 228.0, 157.0, 117.0, 71.0, 50.0, 37.0, 39.0, 24.0, 13.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.693359375, -1.6369781494140625, -1.580596923828125, -1.5242156982421875, -1.46783447265625, -1.4114532470703125, -1.355072021484375, -1.2986907958984375, -1.2423095703125, -1.1859283447265625, -1.129547119140625, -1.0731658935546875, -1.01678466796875, -0.9604034423828125, -0.904022216796875, -0.8476409912109375, -0.791259765625, -0.7348785400390625, -0.678497314453125, -0.6221160888671875, -0.56573486328125, -0.5093536376953125, -0.452972412109375, -0.3965911865234375, -0.3402099609375, -0.2838287353515625, -0.227447509765625, -0.1710662841796875, -0.11468505859375, -0.0583038330078125, -0.001922607421875, 0.0544586181640625, 0.11083984375, 0.1672210693359375, 0.223602294921875, 0.2799835205078125, 0.33636474609375, 0.3927459716796875, 0.449127197265625, 0.5055084228515625, 0.5618896484375, 0.6182708740234375, 0.674652099609375, 0.7310333251953125, 0.78741455078125, 0.8437957763671875, 0.900177001953125, 0.9565582275390625, 1.012939453125, 1.0693206787109375, 1.125701904296875, 1.1820831298828125, 1.23846435546875, 1.2948455810546875, 1.351226806640625, 1.4076080322265625, 1.4639892578125, 1.5203704833984375, 1.576751708984375, 1.6331329345703125, 1.68951416015625, 1.7458953857421875, 1.802276611328125, 1.8586578369140625, 1.9150390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 7.0, 5.0, 8.0, 8.0, 8.0, 10.0, 13.0, 22.0, 23.0, 30.0, 41.0, 45.0, 48.0, 45.0, 56.0, 51.0, 66.0, 75.0, 68.0, 53.0, 47.0, 58.0, 46.0, 35.0, 22.0, 21.0, 11.0, 18.0, 12.0, 9.0, 7.0, 5.0, 4.0, 6.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.355213165283203e-05, -7.102359086275101e-05, -6.849505007266998e-05, -6.596650928258896e-05, -6.343796849250793e-05, -6.090942770242691e-05, -5.8380886912345886e-05, -5.585234612226486e-05, -5.332380533218384e-05, -5.0795264542102814e-05, -4.826672375202179e-05, -4.5738182961940765e-05, -4.320964217185974e-05, -4.068110138177872e-05, -3.815256059169769e-05, -3.562401980161667e-05, -3.3095479011535645e-05, -3.056693822145462e-05, -2.8038397431373596e-05, -2.5509856641292572e-05, -2.2981315851211548e-05, -2.0452775061130524e-05, -1.79242342710495e-05, -1.5395693480968475e-05, -1.2867152690887451e-05, -1.0338611900806427e-05, -7.810071110725403e-06, -5.281530320644379e-06, -2.7529895305633545e-06, -2.2444874048233032e-07, 2.304092049598694e-06, 4.832632839679718e-06, 7.361173629760742e-06, 9.889714419841766e-06, 1.241825520992279e-05, 1.4946796000003815e-05, 1.747533679008484e-05, 2.0003877580165863e-05, 2.2532418370246887e-05, 2.506095916032791e-05, 2.7589499950408936e-05, 3.011804074048996e-05, 3.2646581530570984e-05, 3.517512232065201e-05, 3.770366311073303e-05, 4.0232203900814056e-05, 4.276074469089508e-05, 4.5289285480976105e-05, 4.781782627105713e-05, 5.034636706113815e-05, 5.287490785121918e-05, 5.54034486413002e-05, 5.7931989431381226e-05, 6.046053022146225e-05, 6.298907101154327e-05, 6.55176118016243e-05, 6.804615259170532e-05, 7.057469338178635e-05, 7.310323417186737e-05, 7.56317749619484e-05, 7.816031575202942e-05, 8.068885654211044e-05, 8.321739733219147e-05, 8.574593812227249e-05, 8.827447891235352e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 11.0, 18.0, 18.0, 34.0, 47.0, 73.0, 91.0, 134.0, 209.0, 342.0, 477.0, 823.0, 1339.0, 2148.0, 3463.0, 5918.0, 10016.0, 17548.0, 31933.0, 60324.0, 111744.0, 181044.0, 216654.0, 173557.0, 104699.0, 56108.0, 29780.0, 16360.0, 9354.0, 5498.0, 3262.0, 1961.0, 1304.0, 780.0, 511.0, 363.0, 186.0, 126.0, 97.0, 54.0, 39.0, 20.0, 22.0, 17.0, 5.0, 17.0, 8.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.5751953125, -1.526641845703125, -1.47808837890625, -1.429534912109375, -1.3809814453125, -1.332427978515625, -1.28387451171875, -1.235321044921875, -1.186767578125, -1.138214111328125, -1.08966064453125, -1.041107177734375, -0.9925537109375, -0.944000244140625, -0.89544677734375, -0.846893310546875, -0.79833984375, -0.749786376953125, -0.70123291015625, -0.652679443359375, -0.6041259765625, -0.555572509765625, -0.50701904296875, -0.458465576171875, -0.409912109375, -0.361358642578125, -0.31280517578125, -0.264251708984375, -0.2156982421875, -0.167144775390625, -0.11859130859375, -0.070037841796875, -0.021484375, 0.027069091796875, 0.07562255859375, 0.124176025390625, 0.1727294921875, 0.221282958984375, 0.26983642578125, 0.318389892578125, 0.366943359375, 0.415496826171875, 0.46405029296875, 0.512603759765625, 0.5611572265625, 0.609710693359375, 0.65826416015625, 0.706817626953125, 0.75537109375, 0.803924560546875, 0.85247802734375, 0.901031494140625, 0.9495849609375, 0.998138427734375, 1.04669189453125, 1.095245361328125, 1.143798828125, 1.192352294921875, 1.24090576171875, 1.289459228515625, 1.3380126953125, 1.386566162109375, 1.43511962890625, 1.483673095703125, 1.5322265625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 4.0, 8.0, 5.0, 3.0, 7.0, 19.0, 12.0, 22.0, 25.0, 33.0, 37.0, 57.0, 53.0, 73.0, 68.0, 70.0, 73.0, 69.0, 67.0, 53.0, 43.0, 46.0, 25.0, 21.0, 29.0, 13.0, 10.0, 14.0, 3.0, 11.0, 4.0, 8.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5146484375, -0.4990501403808594, -0.48345184326171875, -0.4678535461425781, -0.4522552490234375, -0.4366569519042969, -0.42105865478515625, -0.4054603576660156, -0.389862060546875, -0.3742637634277344, -0.35866546630859375, -0.3430671691894531, -0.3274688720703125, -0.3118705749511719, -0.29627227783203125, -0.2806739807128906, -0.26507568359375, -0.24947738647460938, -0.23387908935546875, -0.21828079223632812, -0.2026824951171875, -0.18708419799804688, -0.17148590087890625, -0.15588760375976562, -0.140289306640625, -0.12469100952148438, -0.10909271240234375, -0.09349441528320312, -0.0778961181640625, -0.062297821044921875, -0.04669952392578125, -0.031101226806640625, -0.0155029296875, 9.5367431640625e-05, 0.01569366455078125, 0.031291961669921875, 0.0468902587890625, 0.062488555908203125, 0.07808685302734375, 0.09368515014648438, 0.109283447265625, 0.12488174438476562, 0.14048004150390625, 0.15607833862304688, 0.1716766357421875, 0.18727493286132812, 0.20287322998046875, 0.21847152709960938, 0.23406982421875, 0.24966812133789062, 0.26526641845703125, 0.2808647155761719, 0.2964630126953125, 0.3120613098144531, 0.32765960693359375, 0.3432579040527344, 0.358856201171875, 0.3744544982910156, 0.39005279541015625, 0.4056510925292969, 0.4212493896484375, 0.4368476867675781, 0.45244598388671875, 0.4680442810058594, 0.483642578125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 5.0, 6.0, 6.0, 12.0, 18.0, 10.0, 17.0, 22.0, 32.0, 21.0, 38.0, 51.0, 60.0, 63.0, 66.0, 91.0, 86.0, 70.0, 69.0, 57.0, 46.0, 30.0, 33.0, 30.0, 20.0, 6.0, 6.0, 8.0, 6.0, 2.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.940326690673828, -9.692682266235352, -9.445038795471191, -9.197394371032715, -8.949750900268555, -8.702106475830078, -8.454462051391602, -8.206818580627441, -7.959174156188965, -7.7115302085876465, -7.463886260986328, -7.216241836547852, -6.968597888946533, -6.720953941345215, -6.473309516906738, -6.22566556930542, -5.978021621704102, -5.730377674102783, -5.482733726501465, -5.235089302062988, -4.98744535446167, -4.739801406860352, -4.492156982421875, -4.244513034820557, -3.9968690872192383, -3.74922513961792, -3.5015809535980225, -3.253936767578125, -3.0062928199768066, -2.7586488723754883, -2.511004686355591, -2.2633605003356934, -2.015716552734375, -1.768072485923767, -1.5204284191131592, -1.2727843523025513, -1.0251402854919434, -0.7774962186813354, -0.5298521518707275, -0.28220808506011963, -0.03456401824951172, 0.2130800485610962, 0.4607241153717041, 0.708368182182312, 0.9560122489929199, 1.2036563158035278, 1.4513003826141357, 1.6989444494247437, 1.9465885162353516, 2.19423246383667, 2.4418766498565674, 2.689520835876465, 2.937164783477783, 3.1848087310791016, 3.432452917098999, 3.6800971031188965, 3.927741050720215, 4.175384998321533, 4.423028945922852, 4.670673370361328, 4.9183173179626465, 5.165961265563965, 5.413605690002441, 5.66124963760376, 5.908893585205078]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 5.0, 6.0, 6.0, 5.0, 10.0, 10.0, 10.0, 6.0, 15.0, 16.0, 15.0, 18.0, 17.0, 20.0, 14.0, 26.0, 29.0, 29.0, 27.0, 22.0, 34.0, 28.0, 30.0, 42.0, 28.0, 39.0, 29.0, 43.0, 32.0, 34.0, 41.0, 32.0, 40.0, 31.0, 22.0, 20.0, 19.0, 13.0, 20.0, 27.0, 15.0, 10.0, 19.0, 8.0, 8.0, 4.0, 5.0, 11.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0], "bins": [-3.5719351768493652, -3.4707858562469482, -3.369636297225952, -3.268486976623535, -3.167337656021118, -3.066188335418701, -2.965038776397705, -2.863889455795288, -2.762740135192871, -2.661590814590454, -2.560441255569458, -2.459291934967041, -2.358142614364624, -2.256993293762207, -2.155843734741211, -2.054694414138794, -1.9535448551177979, -1.8523954153060913, -1.7512460947036743, -1.6500966548919678, -1.5489473342895508, -1.4477978944778442, -1.3466484546661377, -1.2454991340637207, -1.1443496942520142, -1.0432002544403076, -0.9420509338378906, -0.8409014940261841, -0.7397521138191223, -0.6386027336120605, -0.537453293800354, -0.43630391359329224, -0.33515477180480957, -0.2340053766965866, -0.13285598158836365, -0.03170657157897949, 0.06944280862808228, 0.17059218883514404, 0.2717416286468506, 0.37289100885391235, 0.4740403890609741, 0.5751897692680359, 0.6763391494750977, 0.7774885892868042, 0.878637969493866, 0.9797873497009277, 1.0809367895126343, 1.1820862293243408, 1.2832355499267578, 1.3843849897384644, 1.4855343103408813, 1.586683750152588, 1.6878330707550049, 1.7889825105667114, 1.890131950378418, 1.991281270980835, 2.092430591583252, 2.193579912185669, 2.294729471206665, 2.395878791809082, 2.497028112411499, 2.598177433013916, 2.699326992034912, 2.800476312637329, 2.901625871658325]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 10.0, 11.0, 16.0, 21.0, 31.0, 41.0, 69.0, 90.0, 146.0, 241.0, 400.0, 679.0, 1304.0, 2460.0, 4718.0, 9633.0, 20038.0, 40699.0, 80288.0, 144386.0, 208855.0, 211954.0, 151040.0, 85480.0, 43589.0, 21279.0, 10263.0, 5140.0, 2552.0, 1303.0, 718.0, 386.0, 235.0, 167.0, 82.0, 57.0, 42.0, 42.0, 23.0, 18.0, 11.0, 10.0, 7.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.265625, -5.1109619140625, -4.956298828125, -4.8016357421875, -4.64697265625, -4.4923095703125, -4.337646484375, -4.1829833984375, -4.0283203125, -3.8736572265625, -3.718994140625, -3.5643310546875, -3.40966796875, -3.2550048828125, -3.100341796875, -2.9456787109375, -2.791015625, -2.6363525390625, -2.481689453125, -2.3270263671875, -2.17236328125, -2.0177001953125, -1.863037109375, -1.7083740234375, -1.5537109375, -1.3990478515625, -1.244384765625, -1.0897216796875, -0.93505859375, -0.7803955078125, -0.625732421875, -0.4710693359375, -0.31640625, -0.1617431640625, -0.007080078125, 0.1475830078125, 0.30224609375, 0.4569091796875, 0.611572265625, 0.7662353515625, 0.9208984375, 1.0755615234375, 1.230224609375, 1.3848876953125, 1.53955078125, 1.6942138671875, 1.848876953125, 2.0035400390625, 2.158203125, 2.3128662109375, 2.467529296875, 2.6221923828125, 2.77685546875, 2.9315185546875, 3.086181640625, 3.2408447265625, 3.3955078125, 3.5501708984375, 3.704833984375, 3.8594970703125, 4.01416015625, 4.1688232421875, 4.323486328125, 4.4781494140625, 4.6328125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 4.0, 3.0, 12.0, 10.0, 7.0, 15.0, 9.0, 22.0, 14.0, 13.0, 21.0, 38.0, 28.0, 23.0, 23.0, 32.0, 31.0, 37.0, 30.0, 35.0, 35.0, 41.0, 29.0, 46.0, 42.0, 50.0, 40.0, 39.0, 35.0, 32.0, 31.0, 23.0, 14.0, 15.0, 16.0, 19.0, 9.0, 16.0, 15.0, 9.0, 8.0, 11.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.79296875, -3.67401123046875, -3.5550537109375, -3.43609619140625, -3.317138671875, -3.19818115234375, -3.0792236328125, -2.96026611328125, -2.84130859375, -2.72235107421875, -2.6033935546875, -2.48443603515625, -2.365478515625, -2.24652099609375, -2.1275634765625, -2.00860595703125, -1.8896484375, -1.77069091796875, -1.6517333984375, -1.53277587890625, -1.413818359375, -1.29486083984375, -1.1759033203125, -1.05694580078125, -0.93798828125, -0.81903076171875, -0.7000732421875, -0.58111572265625, -0.462158203125, -0.34320068359375, -0.2242431640625, -0.10528564453125, 0.013671875, 0.13262939453125, 0.2515869140625, 0.37054443359375, 0.489501953125, 0.60845947265625, 0.7274169921875, 0.84637451171875, 0.96533203125, 1.08428955078125, 1.2032470703125, 1.32220458984375, 1.441162109375, 1.56011962890625, 1.6790771484375, 1.79803466796875, 1.9169921875, 2.03594970703125, 2.1549072265625, 2.27386474609375, 2.392822265625, 2.51177978515625, 2.6307373046875, 2.74969482421875, 2.86865234375, 2.98760986328125, 3.1065673828125, 3.22552490234375, 3.344482421875, 3.46343994140625, 3.5823974609375, 3.70135498046875, 3.8203125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 8.0, 4.0, 4.0, 5.0, 9.0, 11.0, 15.0, 21.0, 21.0, 29.0, 46.0, 64.0, 80.0, 135.0, 171.0, 248.0, 341.0, 451.0, 685.0, 990.0, 1574.0, 2443.0, 4270.0, 7446.0, 13901.0, 25769.0, 49192.0, 90109.0, 148878.0, 199649.0, 192603.0, 135621.0, 78888.0, 43133.0, 22536.0, 12072.0, 6771.0, 3823.0, 2234.0, 1385.0, 943.0, 590.0, 381.0, 280.0, 202.0, 150.0, 107.0, 82.0, 49.0, 41.0, 26.0, 20.0, 19.0, 20.0, 14.0, 5.0, 2.0, 5.0, 2.0, 2.0], "bins": [-4.69140625, -4.552978515625, -4.41455078125, -4.276123046875, -4.1376953125, -3.999267578125, -3.86083984375, -3.722412109375, -3.583984375, -3.445556640625, -3.30712890625, -3.168701171875, -3.0302734375, -2.891845703125, -2.75341796875, -2.614990234375, -2.4765625, -2.338134765625, -2.19970703125, -2.061279296875, -1.9228515625, -1.784423828125, -1.64599609375, -1.507568359375, -1.369140625, -1.230712890625, -1.09228515625, -0.953857421875, -0.8154296875, -0.677001953125, -0.53857421875, -0.400146484375, -0.26171875, -0.123291015625, 0.01513671875, 0.153564453125, 0.2919921875, 0.430419921875, 0.56884765625, 0.707275390625, 0.845703125, 0.984130859375, 1.12255859375, 1.260986328125, 1.3994140625, 1.537841796875, 1.67626953125, 1.814697265625, 1.953125, 2.091552734375, 2.22998046875, 2.368408203125, 2.5068359375, 2.645263671875, 2.78369140625, 2.922119140625, 3.060546875, 3.198974609375, 3.33740234375, 3.475830078125, 3.6142578125, 3.752685546875, 3.89111328125, 4.029541015625, 4.16796875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 14.0, 15.0, 17.0, 14.0, 10.0, 17.0, 28.0, 26.0, 34.0, 27.0, 33.0, 32.0, 34.0, 37.0, 36.0, 43.0, 45.0, 44.0, 45.0, 39.0, 50.0, 36.0, 35.0, 36.0, 35.0, 28.0, 21.0, 35.0, 17.0, 16.0, 15.0, 19.0, 16.0, 10.0, 7.0, 5.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.720703125, -2.64007568359375, -2.5594482421875, -2.47882080078125, -2.398193359375, -2.31756591796875, -2.2369384765625, -2.15631103515625, -2.07568359375, -1.99505615234375, -1.9144287109375, -1.83380126953125, -1.753173828125, -1.67254638671875, -1.5919189453125, -1.51129150390625, -1.4306640625, -1.35003662109375, -1.2694091796875, -1.18878173828125, -1.108154296875, -1.02752685546875, -0.9468994140625, -0.86627197265625, -0.78564453125, -0.70501708984375, -0.6243896484375, -0.54376220703125, -0.463134765625, -0.38250732421875, -0.3018798828125, -0.22125244140625, -0.140625, -0.05999755859375, 0.0206298828125, 0.10125732421875, 0.181884765625, 0.26251220703125, 0.3431396484375, 0.42376708984375, 0.50439453125, 0.58502197265625, 0.6656494140625, 0.74627685546875, 0.826904296875, 0.90753173828125, 0.9881591796875, 1.06878662109375, 1.1494140625, 1.23004150390625, 1.3106689453125, 1.39129638671875, 1.471923828125, 1.55255126953125, 1.6331787109375, 1.71380615234375, 1.79443359375, 1.87506103515625, 1.9556884765625, 2.03631591796875, 2.116943359375, 2.19757080078125, 2.2781982421875, 2.35882568359375, 2.439453125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 12.0, 17.0, 31.0, 34.0, 40.0, 68.0, 96.0, 139.0, 225.0, 321.0, 477.0, 674.0, 1072.0, 1766.0, 2825.0, 5208.0, 10283.0, 23304.0, 58100.0, 145348.0, 280048.0, 275963.0, 141000.0, 55981.0, 22656.0, 10029.0, 5071.0, 2780.0, 1743.0, 1074.0, 715.0, 453.0, 314.0, 187.0, 160.0, 113.0, 67.0, 54.0, 32.0, 22.0, 16.0, 9.0, 4.0, 7.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.4765625, -3.37115478515625, -3.2657470703125, -3.16033935546875, -3.054931640625, -2.94952392578125, -2.8441162109375, -2.73870849609375, -2.63330078125, -2.52789306640625, -2.4224853515625, -2.31707763671875, -2.211669921875, -2.10626220703125, -2.0008544921875, -1.89544677734375, -1.7900390625, -1.68463134765625, -1.5792236328125, -1.47381591796875, -1.368408203125, -1.26300048828125, -1.1575927734375, -1.05218505859375, -0.94677734375, -0.84136962890625, -0.7359619140625, -0.63055419921875, -0.525146484375, -0.41973876953125, -0.3143310546875, -0.20892333984375, -0.103515625, 0.00189208984375, 0.1072998046875, 0.21270751953125, 0.318115234375, 0.42352294921875, 0.5289306640625, 0.63433837890625, 0.73974609375, 0.84515380859375, 0.9505615234375, 1.05596923828125, 1.161376953125, 1.26678466796875, 1.3721923828125, 1.47760009765625, 1.5830078125, 1.68841552734375, 1.7938232421875, 1.89923095703125, 2.004638671875, 2.11004638671875, 2.2154541015625, 2.32086181640625, 2.42626953125, 2.53167724609375, 2.6370849609375, 2.74249267578125, 2.847900390625, 2.95330810546875, 3.0587158203125, 3.16412353515625, 3.26953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 9.0, 8.0, 7.0, 12.0, 16.0, 27.0, 52.0, 64.0, 103.0, 110.0, 115.0, 124.0, 81.0, 79.0, 58.0, 46.0, 31.0, 18.0, 8.0, 6.0, 7.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00029468536376953125, -0.00028366968035697937, -0.0002726539969444275, -0.0002616383135318756, -0.00025062263011932373, -0.00023960694670677185, -0.00022859126329421997, -0.0002175755798816681, -0.0002065598964691162, -0.00019554421305656433, -0.00018452852964401245, -0.00017351284623146057, -0.0001624971628189087, -0.0001514814794063568, -0.00014046579599380493, -0.00012945011258125305, -0.00011843442916870117, -0.00010741874575614929, -9.640306234359741e-05, -8.538737893104553e-05, -7.437169551849365e-05, -6.335601210594177e-05, -5.234032869338989e-05, -4.132464528083801e-05, -3.0308961868286133e-05, -1.9293278455734253e-05, -8.277595043182373e-06, 2.738088369369507e-06, 1.3753771781921387e-05, 2.4769455194473267e-05, 3.5785138607025146e-05, 4.6800822019577026e-05, 5.7816505432128906e-05, 6.883218884468079e-05, 7.984787225723267e-05, 9.086355566978455e-05, 0.00010187923908233643, 0.0001128949224948883, 0.00012391060590744019, 0.00013492628931999207, 0.00014594197273254395, 0.00015695765614509583, 0.0001679733395576477, 0.00017898902297019958, 0.00019000470638275146, 0.00020102038979530334, 0.00021203607320785522, 0.0002230517566204071, 0.00023406744003295898, 0.00024508312344551086, 0.00025609880685806274, 0.0002671144902706146, 0.0002781301736831665, 0.0002891458570957184, 0.00030016154050827026, 0.00031117722392082214, 0.000322192907333374, 0.0003332085907459259, 0.0003442242741584778, 0.00035523995757102966, 0.00036625564098358154, 0.0003772713243961334, 0.0003882870078086853, 0.0003993026912212372, 0.00041031837463378906]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 4.0, 3.0, 10.0, 12.0, 10.0, 33.0, 26.0, 30.0, 49.0, 69.0, 101.0, 132.0, 163.0, 235.0, 328.0, 475.0, 759.0, 1060.0, 1663.0, 2686.0, 5081.0, 10167.0, 23447.0, 61134.0, 160717.0, 304357.0, 269175.0, 123243.0, 45725.0, 18257.0, 8249.0, 4192.0, 2405.0, 1413.0, 962.0, 661.0, 448.0, 274.0, 218.0, 164.0, 131.0, 72.0, 68.0, 36.0, 32.0, 24.0, 16.0, 14.0, 10.0, 4.0, 10.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.109375, -3.001617431640625, -2.89385986328125, -2.786102294921875, -2.6783447265625, -2.570587158203125, -2.46282958984375, -2.355072021484375, -2.247314453125, -2.139556884765625, -2.03179931640625, -1.924041748046875, -1.8162841796875, -1.708526611328125, -1.60076904296875, -1.493011474609375, -1.38525390625, -1.277496337890625, -1.16973876953125, -1.061981201171875, -0.9542236328125, -0.846466064453125, -0.73870849609375, -0.630950927734375, -0.523193359375, -0.415435791015625, -0.30767822265625, -0.199920654296875, -0.0921630859375, 0.015594482421875, 0.12335205078125, 0.231109619140625, 0.3388671875, 0.446624755859375, 0.55438232421875, 0.662139892578125, 0.7698974609375, 0.877655029296875, 0.98541259765625, 1.093170166015625, 1.200927734375, 1.308685302734375, 1.41644287109375, 1.524200439453125, 1.6319580078125, 1.739715576171875, 1.84747314453125, 1.955230712890625, 2.06298828125, 2.170745849609375, 2.27850341796875, 2.386260986328125, 2.4940185546875, 2.601776123046875, 2.70953369140625, 2.817291259765625, 2.925048828125, 3.032806396484375, 3.14056396484375, 3.248321533203125, 3.3560791015625, 3.463836669921875, 3.57159423828125, 3.679351806640625, 3.787109375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 4.0, 5.0, 11.0, 10.0, 15.0, 22.0, 39.0, 47.0, 74.0, 70.0, 83.0, 97.0, 91.0, 86.0, 104.0, 68.0, 56.0, 34.0, 35.0, 13.0, 8.0, 6.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9140625, -0.8826446533203125, -0.851226806640625, -0.8198089599609375, -0.78839111328125, -0.7569732666015625, -0.725555419921875, -0.6941375732421875, -0.6627197265625, -0.6313018798828125, -0.599884033203125, -0.5684661865234375, -0.53704833984375, -0.5056304931640625, -0.474212646484375, -0.4427947998046875, -0.411376953125, -0.3799591064453125, -0.348541259765625, -0.3171234130859375, -0.28570556640625, -0.2542877197265625, -0.222869873046875, -0.1914520263671875, -0.1600341796875, -0.1286163330078125, -0.097198486328125, -0.0657806396484375, -0.03436279296875, -0.0029449462890625, 0.028472900390625, 0.0598907470703125, 0.09130859375, 0.1227264404296875, 0.154144287109375, 0.1855621337890625, 0.21697998046875, 0.2483978271484375, 0.279815673828125, 0.3112335205078125, 0.3426513671875, 0.3740692138671875, 0.405487060546875, 0.4369049072265625, 0.46832275390625, 0.4997406005859375, 0.531158447265625, 0.5625762939453125, 0.593994140625, 0.6254119873046875, 0.656829833984375, 0.6882476806640625, 0.71966552734375, 0.7510833740234375, 0.782501220703125, 0.8139190673828125, 0.8453369140625, 0.8767547607421875, 0.908172607421875, 0.9395904541015625, 0.97100830078125, 1.0024261474609375, 1.033843994140625, 1.0652618408203125, 1.0966796875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 8.0, 2.0, 3.0, 12.0, 12.0, 20.0, 14.0, 18.0, 22.0, 37.0, 36.0, 36.0, 57.0, 64.0, 59.0, 77.0, 69.0, 73.0, 59.0, 64.0, 56.0, 41.0, 37.0, 34.0, 24.0, 16.0, 7.0, 13.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.231340408325195, -8.999356269836426, -8.767373085021973, -8.535388946533203, -8.30340576171875, -8.07142162322998, -7.839438438415527, -7.607454299926758, -7.3754706382751465, -7.143486976623535, -6.911503314971924, -6.6795196533203125, -6.447535991668701, -6.21555233001709, -5.98356819152832, -5.751584529876709, -5.519600868225098, -5.287617206573486, -5.055633544921875, -4.823649883270264, -4.591666221618652, -4.359682083129883, -4.12769889831543, -3.89571475982666, -3.663731575012207, -3.4317479133605957, -3.1997642517089844, -2.967780590057373, -2.7357966899871826, -2.5038130283355713, -2.27182936668396, -2.0398454666137695, -1.8078618049621582, -1.5758781433105469, -1.343894362449646, -1.1119107007980347, -0.8799269795417786, -0.6479432582855225, -0.41595959663391113, -0.18397581577301025, 0.048007845878601074, 0.2799915671348572, 0.5119752883911133, 0.7439589500427246, 0.9759426712989807, 1.2079263925552368, 1.4399100542068481, 1.671893835067749, 1.9038774967193604, 2.1358611583709717, 2.367844820022583, 2.5998287200927734, 2.8318123817443848, 3.063796043395996, 3.2957797050476074, 3.5277633666992188, 3.75974702835083, 3.9917306900024414, 4.223714351654053, 4.455698013305664, 4.687681674957275, 4.919665336608887, 5.151649475097656, 5.383633136749268, 5.615616798400879]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 6.0, 8.0, 4.0, 5.0, 12.0, 8.0, 13.0, 15.0, 8.0, 22.0, 16.0, 23.0, 12.0, 21.0, 24.0, 21.0, 27.0, 28.0, 34.0, 37.0, 38.0, 40.0, 32.0, 41.0, 42.0, 53.0, 28.0, 34.0, 35.0, 33.0, 32.0, 26.0, 31.0, 29.0, 25.0, 23.0, 16.0, 18.0, 12.0, 12.0, 10.0, 10.0, 12.0, 5.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.342905044555664, -3.2374014854431152, -3.1318979263305664, -3.0263943672180176, -2.9208908081054688, -2.81538724899292, -2.70988392829895, -2.6043803691864014, -2.4988768100738525, -2.3933732509613037, -2.287869691848755, -2.182366132736206, -2.0768628120422363, -1.971359133720398, -1.8658556938171387, -1.7603521347045898, -1.654848575592041, -1.5493450164794922, -1.4438414573669434, -1.338338017463684, -1.2328344583511353, -1.1273308992385864, -1.0218274593353271, -0.9163239002227783, -0.8108203411102295, -0.7053167819976807, -0.5998132824897766, -0.49430975317955017, -0.38880622386932373, -0.2833026647567749, -0.17779916524887085, -0.0722956657409668, 0.03320789337158203, 0.13871142268180847, 0.2442149519920349, 0.34971848130226135, 0.4552220106124878, 0.5607255697250366, 0.6662290692329407, 0.7717325687408447, 0.8772361278533936, 0.9827396869659424, 1.0882432460784912, 1.1937466859817505, 1.2992502450942993, 1.4047538042068481, 1.5102572441101074, 1.6157608032226562, 1.721264362335205, 1.826767921447754, 1.9322714805603027, 2.0377750396728516, 2.1432785987854004, 2.248782157897949, 2.354285478591919, 2.4597890377044678, 2.5652925968170166, 2.6707961559295654, 2.7762997150421143, 2.881803274154663, 2.987306594848633, 3.0928101539611816, 3.1983137130737305, 3.3038172721862793, 3.409320831298828]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 5.0, 12.0, 20.0, 15.0, 22.0, 34.0, 57.0, 58.0, 105.0, 137.0, 184.0, 290.0, 386.0, 599.0, 908.0, 1338.0, 1946.0, 3068.0, 4787.0, 7945.0, 13741.0, 24741.0, 47206.0, 97477.0, 221553.0, 558049.0, 1154140.0, 1120302.0, 528408.0, 211373.0, 92585.0, 44845.0, 23650.0, 13120.0, 7628.0, 4730.0, 2912.0, 1915.0, 1285.0, 844.0, 590.0, 384.0, 269.0, 196.0, 113.0, 97.0, 71.0, 41.0, 41.0, 16.0, 13.0, 12.0, 7.0, 8.0, 1.0, 2.0, 3.0], "bins": [-6.5, -6.30865478515625, -6.1173095703125, -5.92596435546875, -5.734619140625, -5.54327392578125, -5.3519287109375, -5.16058349609375, -4.96923828125, -4.77789306640625, -4.5865478515625, -4.39520263671875, -4.203857421875, -4.01251220703125, -3.8211669921875, -3.62982177734375, -3.4384765625, -3.24713134765625, -3.0557861328125, -2.86444091796875, -2.673095703125, -2.48175048828125, -2.2904052734375, -2.09906005859375, -1.90771484375, -1.71636962890625, -1.5250244140625, -1.33367919921875, -1.142333984375, -0.95098876953125, -0.7596435546875, -0.56829833984375, -0.376953125, -0.18560791015625, 0.0057373046875, 0.19708251953125, 0.388427734375, 0.57977294921875, 0.7711181640625, 0.96246337890625, 1.15380859375, 1.34515380859375, 1.5364990234375, 1.72784423828125, 1.919189453125, 2.11053466796875, 2.3018798828125, 2.49322509765625, 2.6845703125, 2.87591552734375, 3.0672607421875, 3.25860595703125, 3.449951171875, 3.64129638671875, 3.8326416015625, 4.02398681640625, 4.21533203125, 4.40667724609375, 4.5980224609375, 4.78936767578125, 4.980712890625, 5.17205810546875, 5.3634033203125, 5.55474853515625, 5.74609375]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 12.0, 6.0, 12.0, 14.0, 17.0, 12.0, 8.0, 18.0, 27.0, 18.0, 17.0, 21.0, 34.0, 26.0, 26.0, 26.0, 26.0, 43.0, 36.0, 37.0, 34.0, 45.0, 45.0, 41.0, 35.0, 39.0, 35.0, 28.0, 37.0, 27.0, 20.0, 24.0, 22.0, 21.0, 12.0, 10.0, 16.0, 15.0, 9.0, 5.0, 6.0, 6.0, 8.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.548828125, -2.472869873046875, -2.39691162109375, -2.320953369140625, -2.2449951171875, -2.169036865234375, -2.09307861328125, -2.017120361328125, -1.941162109375, -1.865203857421875, -1.78924560546875, -1.713287353515625, -1.6373291015625, -1.561370849609375, -1.48541259765625, -1.409454345703125, -1.33349609375, -1.257537841796875, -1.18157958984375, -1.105621337890625, -1.0296630859375, -0.953704833984375, -0.87774658203125, -0.801788330078125, -0.725830078125, -0.649871826171875, -0.57391357421875, -0.497955322265625, -0.4219970703125, -0.346038818359375, -0.27008056640625, -0.194122314453125, -0.1181640625, -0.042205810546875, 0.03375244140625, 0.109710693359375, 0.1856689453125, 0.261627197265625, 0.33758544921875, 0.413543701171875, 0.489501953125, 0.565460205078125, 0.64141845703125, 0.717376708984375, 0.7933349609375, 0.869293212890625, 0.94525146484375, 1.021209716796875, 1.09716796875, 1.173126220703125, 1.24908447265625, 1.325042724609375, 1.4010009765625, 1.476959228515625, 1.55291748046875, 1.628875732421875, 1.704833984375, 1.780792236328125, 1.85675048828125, 1.932708740234375, 2.0086669921875, 2.084625244140625, 2.16058349609375, 2.236541748046875, 2.3125]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 13.0, 17.0, 12.0, 14.0, 44.0, 72.0, 96.0, 134.0, 225.0, 291.0, 450.0, 712.0, 991.0, 1609.0, 2463.0, 3789.0, 6025.0, 9727.0, 16247.0, 27177.0, 47295.0, 85426.0, 160703.0, 320625.0, 641484.0, 1034483.0, 868500.0, 461940.0, 229935.0, 118966.0, 63683.0, 36316.0, 20888.0, 12667.0, 7726.0, 4805.0, 2997.0, 1996.0, 1265.0, 809.0, 536.0, 367.0, 276.0, 152.0, 106.0, 73.0, 62.0, 26.0, 24.0, 24.0, 9.0, 10.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.640625, -5.46844482421875, -5.2962646484375, -5.12408447265625, -4.951904296875, -4.77972412109375, -4.6075439453125, -4.43536376953125, -4.26318359375, -4.09100341796875, -3.9188232421875, -3.74664306640625, -3.574462890625, -3.40228271484375, -3.2301025390625, -3.05792236328125, -2.8857421875, -2.71356201171875, -2.5413818359375, -2.36920166015625, -2.197021484375, -2.02484130859375, -1.8526611328125, -1.68048095703125, -1.50830078125, -1.33612060546875, -1.1639404296875, -0.99176025390625, -0.819580078125, -0.64739990234375, -0.4752197265625, -0.30303955078125, -0.130859375, 0.04132080078125, 0.2135009765625, 0.38568115234375, 0.557861328125, 0.73004150390625, 0.9022216796875, 1.07440185546875, 1.24658203125, 1.41876220703125, 1.5909423828125, 1.76312255859375, 1.935302734375, 2.10748291015625, 2.2796630859375, 2.45184326171875, 2.6240234375, 2.79620361328125, 2.9683837890625, 3.14056396484375, 3.312744140625, 3.48492431640625, 3.6571044921875, 3.82928466796875, 4.00146484375, 4.17364501953125, 4.3458251953125, 4.51800537109375, 4.690185546875, 4.86236572265625, 5.0345458984375, 5.20672607421875, 5.37890625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 11.0, 9.0, 11.0, 14.0, 17.0, 14.0, 24.0, 38.0, 39.0, 53.0, 74.0, 93.0, 122.0, 146.0, 180.0, 202.0, 233.0, 284.0, 285.0, 268.0, 292.0, 271.0, 254.0, 247.0, 194.0, 129.0, 115.0, 90.0, 82.0, 63.0, 30.0, 42.0, 32.0, 25.0, 22.0, 18.0, 15.0, 9.0, 4.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6572265625, -1.6015777587890625, -1.545928955078125, -1.4902801513671875, -1.43463134765625, -1.3789825439453125, -1.323333740234375, -1.2676849365234375, -1.2120361328125, -1.1563873291015625, -1.100738525390625, -1.0450897216796875, -0.98944091796875, -0.9337921142578125, -0.878143310546875, -0.8224945068359375, -0.766845703125, -0.7111968994140625, -0.655548095703125, -0.5998992919921875, -0.54425048828125, -0.4886016845703125, -0.432952880859375, -0.3773040771484375, -0.3216552734375, -0.2660064697265625, -0.210357666015625, -0.1547088623046875, -0.09906005859375, -0.0434112548828125, 0.012237548828125, 0.0678863525390625, 0.12353515625, 0.1791839599609375, 0.234832763671875, 0.2904815673828125, 0.34613037109375, 0.4017791748046875, 0.457427978515625, 0.5130767822265625, 0.5687255859375, 0.6243743896484375, 0.680023193359375, 0.7356719970703125, 0.79132080078125, 0.8469696044921875, 0.902618408203125, 0.9582672119140625, 1.013916015625, 1.0695648193359375, 1.125213623046875, 1.1808624267578125, 1.23651123046875, 1.2921600341796875, 1.347808837890625, 1.4034576416015625, 1.4591064453125, 1.5147552490234375, 1.570404052734375, 1.6260528564453125, 1.68170166015625, 1.7373504638671875, 1.792999267578125, 1.8486480712890625, 1.904296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 7.0, 7.0, 9.0, 13.0, 19.0, 23.0, 29.0, 34.0, 38.0, 58.0, 66.0, 68.0, 77.0, 77.0, 74.0, 82.0, 56.0, 54.0, 48.0, 41.0, 35.0, 24.0, 17.0, 14.0, 8.0, 1.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.406835556030273, -11.148826599121094, -10.890816688537598, -10.632807731628418, -10.374797821044922, -10.116788864135742, -9.858778953552246, -9.600769996643066, -9.34276008605957, -9.08475112915039, -8.826741218566895, -8.568732261657715, -8.310722351074219, -8.052713394165039, -7.794703960418701, -7.536694526672363, -7.278685569763184, -7.020676136016846, -6.762666702270508, -6.50465726852417, -6.246647834777832, -5.988638877868652, -5.7306294441223145, -5.472620010375977, -5.214610576629639, -4.956601142883301, -4.698591709136963, -4.440582275390625, -4.182573318481445, -3.9245636463165283, -3.6665544509887695, -3.4085450172424316, -3.1505351066589355, -2.8925256729125977, -2.6345162391662598, -2.376507043838501, -2.118497610092163, -1.8604881763458252, -1.6024788618087769, -1.3444695472717285, -1.0864601135253906, -0.8284507393836975, -0.5704413652420044, -0.3124319911003113, -0.054422616958618164, 0.20358681678771973, 0.46159613132476807, 0.7196054458618164, 0.9776148796081543, 1.2356243133544922, 1.4936336278915405, 1.7516429424285889, 2.0096523761749268, 2.2676618099212646, 2.5256710052490234, 2.7836804389953613, 3.041689872741699, 3.299699306488037, 3.557708740234375, 3.815717935562134, 4.073727607727051, 4.3317365646362305, 4.589745998382568, 4.847755432128906, 5.105764865875244]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 7.0, 5.0, 9.0, 11.0, 13.0, 15.0, 17.0, 13.0, 23.0, 24.0, 30.0, 17.0, 27.0, 38.0, 35.0, 38.0, 43.0, 24.0, 40.0, 40.0, 35.0, 32.0, 47.0, 39.0, 33.0, 36.0, 34.0, 25.0, 28.0, 26.0, 28.0, 17.0, 27.0, 27.0, 9.0, 18.0, 6.0, 14.0, 14.0, 4.0, 6.0, 3.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.7236645221710205, -3.6212408542633057, -3.518817186355591, -3.416393518447876, -3.313969850540161, -3.2115461826324463, -3.1091222763061523, -3.0066986083984375, -2.9042749404907227, -2.801851272583008, -2.699427604675293, -2.597003936767578, -2.4945802688598633, -2.3921566009521484, -2.2897329330444336, -2.1873092651367188, -2.084885597229004, -1.982461929321289, -1.8800382614135742, -1.7776145935058594, -1.6751909255981445, -1.5727672576904297, -1.4703434705734253, -1.3679198026657104, -1.2654961347579956, -1.1630724668502808, -1.060648798942566, -0.9582250714302063, -0.8558014035224915, -0.7533777356147766, -0.650954008102417, -0.5485303401947021, -0.4461069107055664, -0.34368324279785156, -0.24125954508781433, -0.1388358473777771, -0.036412179470062256, 0.06601148843765259, 0.1684352159500122, 0.27085888385772705, 0.3732825517654419, 0.47570621967315674, 0.5781298875808716, 0.6805536150932312, 0.782977283000946, 0.8854009509086609, 0.9878246784210205, 1.0902483463287354, 1.1926720142364502, 1.295095682144165, 1.3975193500518799, 1.4999430179595947, 1.6023666858673096, 1.7047903537750244, 1.8072141408920288, 1.9096378087997437, 2.012061595916748, 2.114485263824463, 2.2169089317321777, 2.3193325996398926, 2.4217562675476074, 2.5241799354553223, 2.626603603363037, 2.729027271270752, 2.831450939178467]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 12.0, 7.0, 16.0, 22.0, 17.0, 47.0, 53.0, 83.0, 117.0, 163.0, 199.0, 246.0, 376.0, 584.0, 869.0, 1307.0, 2290.0, 4018.0, 7399.0, 14255.0, 28620.0, 57793.0, 112151.0, 189819.0, 233841.0, 180748.0, 103709.0, 53671.0, 26241.0, 13230.0, 6853.0, 3724.0, 2094.0, 1268.0, 836.0, 580.0, 344.0, 252.0, 173.0, 148.0, 99.0, 69.0, 60.0, 45.0, 27.0, 27.0, 14.0, 10.0, 5.0, 11.0, 4.0, 2.0, 4.0], "bins": [-3.7421875, -3.6365966796875, -3.531005859375, -3.4254150390625, -3.31982421875, -3.2142333984375, -3.108642578125, -3.0030517578125, -2.8974609375, -2.7918701171875, -2.686279296875, -2.5806884765625, -2.47509765625, -2.3695068359375, -2.263916015625, -2.1583251953125, -2.052734375, -1.9471435546875, -1.841552734375, -1.7359619140625, -1.63037109375, -1.5247802734375, -1.419189453125, -1.3135986328125, -1.2080078125, -1.1024169921875, -0.996826171875, -0.8912353515625, -0.78564453125, -0.6800537109375, -0.574462890625, -0.4688720703125, -0.36328125, -0.2576904296875, -0.152099609375, -0.0465087890625, 0.05908203125, 0.1646728515625, 0.270263671875, 0.3758544921875, 0.4814453125, 0.5870361328125, 0.692626953125, 0.7982177734375, 0.90380859375, 1.0093994140625, 1.114990234375, 1.2205810546875, 1.326171875, 1.4317626953125, 1.537353515625, 1.6429443359375, 1.74853515625, 1.8541259765625, 1.959716796875, 2.0653076171875, 2.1708984375, 2.2764892578125, 2.382080078125, 2.4876708984375, 2.59326171875, 2.6988525390625, 2.804443359375, 2.9100341796875, 3.015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 9.0, 6.0, 8.0, 7.0, 12.0, 9.0, 12.0, 16.0, 22.0, 19.0, 28.0, 24.0, 32.0, 31.0, 43.0, 28.0, 30.0, 32.0, 32.0, 51.0, 35.0, 39.0, 41.0, 33.0, 38.0, 32.0, 31.0, 33.0, 35.0, 27.0, 38.0, 19.0, 28.0, 16.0, 22.0, 13.0, 11.0, 10.0, 12.0, 5.0, 7.0, 8.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.83984375, -3.7265625, -3.61328125, -3.5, -3.38671875, -3.2734375, -3.16015625, -3.046875, -2.93359375, -2.8203125, -2.70703125, -2.59375, -2.48046875, -2.3671875, -2.25390625, -2.140625, -2.02734375, -1.9140625, -1.80078125, -1.6875, -1.57421875, -1.4609375, -1.34765625, -1.234375, -1.12109375, -1.0078125, -0.89453125, -0.78125, -0.66796875, -0.5546875, -0.44140625, -0.328125, -0.21484375, -0.1015625, 0.01171875, 0.125, 0.23828125, 0.3515625, 0.46484375, 0.578125, 0.69140625, 0.8046875, 0.91796875, 1.03125, 1.14453125, 1.2578125, 1.37109375, 1.484375, 1.59765625, 1.7109375, 1.82421875, 1.9375, 2.05078125, 2.1640625, 2.27734375, 2.390625, 2.50390625, 2.6171875, 2.73046875, 2.84375, 2.95703125, 3.0703125, 3.18359375, 3.296875, 3.41015625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 0.0, 5.0, 10.0, 8.0, 13.0, 18.0, 30.0, 18.0, 30.0, 57.0, 84.0, 146.0, 209.0, 269.0, 437.0, 691.0, 1167.0, 2097.0, 4072.0, 8073.0, 18181.0, 43181.0, 106174.0, 246194.0, 320853.0, 171781.0, 70393.0, 28883.0, 12485.0, 5905.0, 2964.0, 1615.0, 959.0, 508.0, 303.0, 229.0, 156.0, 115.0, 60.0, 60.0, 33.0, 27.0, 19.0, 8.0, 4.0, 9.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-5.21484375, -5.05810546875, -4.9013671875, -4.74462890625, -4.587890625, -4.43115234375, -4.2744140625, -4.11767578125, -3.9609375, -3.80419921875, -3.6474609375, -3.49072265625, -3.333984375, -3.17724609375, -3.0205078125, -2.86376953125, -2.70703125, -2.55029296875, -2.3935546875, -2.23681640625, -2.080078125, -1.92333984375, -1.7666015625, -1.60986328125, -1.453125, -1.29638671875, -1.1396484375, -0.98291015625, -0.826171875, -0.66943359375, -0.5126953125, -0.35595703125, -0.19921875, -0.04248046875, 0.1142578125, 0.27099609375, 0.427734375, 0.58447265625, 0.7412109375, 0.89794921875, 1.0546875, 1.21142578125, 1.3681640625, 1.52490234375, 1.681640625, 1.83837890625, 1.9951171875, 2.15185546875, 2.30859375, 2.46533203125, 2.6220703125, 2.77880859375, 2.935546875, 3.09228515625, 3.2490234375, 3.40576171875, 3.5625, 3.71923828125, 3.8759765625, 4.03271484375, 4.189453125, 4.34619140625, 4.5029296875, 4.65966796875, 4.81640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 12.0, 9.0, 11.0, 17.0, 13.0, 20.0, 23.0, 24.0, 25.0, 24.0, 35.0, 21.0, 45.0, 50.0, 39.0, 39.0, 33.0, 34.0, 35.0, 50.0, 38.0, 32.0, 33.0, 36.0, 42.0, 31.0, 25.0, 28.0, 18.0, 16.0, 26.0, 16.0, 19.0, 10.0, 10.0, 11.0, 10.0, 6.0, 8.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.2265625, -2.15716552734375, -2.0877685546875, -2.01837158203125, -1.948974609375, -1.87957763671875, -1.8101806640625, -1.74078369140625, -1.67138671875, -1.60198974609375, -1.5325927734375, -1.46319580078125, -1.393798828125, -1.32440185546875, -1.2550048828125, -1.18560791015625, -1.1162109375, -1.04681396484375, -0.9774169921875, -0.90802001953125, -0.838623046875, -0.76922607421875, -0.6998291015625, -0.63043212890625, -0.56103515625, -0.49163818359375, -0.4222412109375, -0.35284423828125, -0.283447265625, -0.21405029296875, -0.1446533203125, -0.07525634765625, -0.005859375, 0.06353759765625, 0.1329345703125, 0.20233154296875, 0.271728515625, 0.34112548828125, 0.4105224609375, 0.47991943359375, 0.54931640625, 0.61871337890625, 0.6881103515625, 0.75750732421875, 0.826904296875, 0.89630126953125, 0.9656982421875, 1.03509521484375, 1.1044921875, 1.17388916015625, 1.2432861328125, 1.31268310546875, 1.382080078125, 1.45147705078125, 1.5208740234375, 1.59027099609375, 1.65966796875, 1.72906494140625, 1.7984619140625, 1.86785888671875, 1.937255859375, 2.00665283203125, 2.0760498046875, 2.14544677734375, 2.21484375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 7.0, 16.0, 21.0, 24.0, 37.0, 56.0, 60.0, 93.0, 102.0, 151.0, 217.0, 297.0, 417.0, 564.0, 875.0, 1434.0, 2401.0, 4345.0, 9820.0, 27215.0, 92287.0, 327317.0, 398942.0, 122451.0, 34484.0, 12239.0, 5112.0, 2649.0, 1553.0, 1041.0, 629.0, 484.0, 328.0, 255.0, 173.0, 114.0, 98.0, 78.0, 48.0, 32.0, 19.0, 21.0, 13.0, 9.0, 10.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.1640625, -3.065521240234375, -2.96697998046875, -2.868438720703125, -2.7698974609375, -2.671356201171875, -2.57281494140625, -2.474273681640625, -2.375732421875, -2.277191162109375, -2.17864990234375, -2.080108642578125, -1.9815673828125, -1.883026123046875, -1.78448486328125, -1.685943603515625, -1.58740234375, -1.488861083984375, -1.39031982421875, -1.291778564453125, -1.1932373046875, -1.094696044921875, -0.99615478515625, -0.897613525390625, -0.799072265625, -0.700531005859375, -0.60198974609375, -0.503448486328125, -0.4049072265625, -0.306365966796875, -0.20782470703125, -0.109283447265625, -0.0107421875, 0.087799072265625, 0.18634033203125, 0.284881591796875, 0.3834228515625, 0.481964111328125, 0.58050537109375, 0.679046630859375, 0.777587890625, 0.876129150390625, 0.97467041015625, 1.073211669921875, 1.1717529296875, 1.270294189453125, 1.36883544921875, 1.467376708984375, 1.56591796875, 1.664459228515625, 1.76300048828125, 1.861541748046875, 1.9600830078125, 2.058624267578125, 2.15716552734375, 2.255706787109375, 2.354248046875, 2.452789306640625, 2.55133056640625, 2.649871826171875, 2.7484130859375, 2.846954345703125, 2.94549560546875, 3.044036865234375, 3.142578125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 14.0, 35.0, 36.0, 48.0, 65.0, 92.0, 117.0, 135.0, 124.0, 95.0, 71.0, 44.0, 31.0, 25.0, 21.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014281272888183594, -0.00013865530490875244, -0.00013449788093566895, -0.00013034045696258545, -0.00012618303298950195, -0.00012202560901641846, -0.00011786818504333496, -0.00011371076107025146, -0.00010955333709716797, -0.00010539591312408447, -0.00010123848915100098, -9.708106517791748e-05, -9.292364120483398e-05, -8.876621723175049e-05, -8.460879325866699e-05, -8.04513692855835e-05, -7.62939453125e-05, -7.21365213394165e-05, -6.797909736633301e-05, -6.382167339324951e-05, -5.9664249420166016e-05, -5.550682544708252e-05, -5.1349401473999023e-05, -4.719197750091553e-05, -4.303455352783203e-05, -3.8877129554748535e-05, -3.471970558166504e-05, -3.056228160858154e-05, -2.6404857635498047e-05, -2.224743366241455e-05, -1.8090009689331055e-05, -1.3932585716247559e-05, -9.775161743164062e-06, -5.617737770080566e-06, -1.4603137969970703e-06, 2.6971101760864258e-06, 6.854534149169922e-06, 1.1011958122253418e-05, 1.5169382095336914e-05, 1.932680606842041e-05, 2.3484230041503906e-05, 2.7641654014587402e-05, 3.17990779876709e-05, 3.5956501960754395e-05, 4.011392593383789e-05, 4.427134990692139e-05, 4.842877388000488e-05, 5.258619785308838e-05, 5.6743621826171875e-05, 6.090104579925537e-05, 6.505846977233887e-05, 6.921589374542236e-05, 7.337331771850586e-05, 7.753074169158936e-05, 8.168816566467285e-05, 8.584558963775635e-05, 9.000301361083984e-05, 9.416043758392334e-05, 9.831786155700684e-05, 0.00010247528553009033, 0.00010663270950317383, 0.00011079013347625732, 0.00011494755744934082, 0.00011910498142242432, 0.0001232624053955078]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 13.0, 20.0, 17.0, 23.0, 42.0, 61.0, 88.0, 150.0, 220.0, 293.0, 459.0, 724.0, 1050.0, 1718.0, 2976.0, 6416.0, 17414.0, 60659.0, 216050.0, 422717.0, 222656.0, 62230.0, 18080.0, 6459.0, 3046.0, 1755.0, 1093.0, 718.0, 489.0, 290.0, 205.0, 151.0, 101.0, 55.0, 35.0, 33.0, 20.0, 6.0, 13.0, 3.0, 4.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.0859375, -2.99652099609375, -2.9071044921875, -2.81768798828125, -2.728271484375, -2.63885498046875, -2.5494384765625, -2.46002197265625, -2.37060546875, -2.28118896484375, -2.1917724609375, -2.10235595703125, -2.012939453125, -1.92352294921875, -1.8341064453125, -1.74468994140625, -1.6552734375, -1.56585693359375, -1.4764404296875, -1.38702392578125, -1.297607421875, -1.20819091796875, -1.1187744140625, -1.02935791015625, -0.93994140625, -0.85052490234375, -0.7611083984375, -0.67169189453125, -0.582275390625, -0.49285888671875, -0.4034423828125, -0.31402587890625, -0.224609375, -0.13519287109375, -0.0457763671875, 0.04364013671875, 0.133056640625, 0.22247314453125, 0.3118896484375, 0.40130615234375, 0.49072265625, 0.58013916015625, 0.6695556640625, 0.75897216796875, 0.848388671875, 0.93780517578125, 1.0272216796875, 1.11663818359375, 1.2060546875, 1.29547119140625, 1.3848876953125, 1.47430419921875, 1.563720703125, 1.65313720703125, 1.7425537109375, 1.83197021484375, 1.92138671875, 2.01080322265625, 2.1002197265625, 2.18963623046875, 2.279052734375, 2.36846923828125, 2.4578857421875, 2.54730224609375, 2.63671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 2.0, 7.0, 6.0, 10.0, 21.0, 16.0, 34.0, 53.0, 47.0, 46.0, 69.0, 82.0, 99.0, 92.0, 75.0, 63.0, 75.0, 47.0, 40.0, 29.0, 24.0, 19.0, 14.0, 7.0, 9.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.537109375, -0.519195556640625, -0.50128173828125, -0.483367919921875, -0.4654541015625, -0.447540283203125, -0.42962646484375, -0.411712646484375, -0.393798828125, -0.375885009765625, -0.35797119140625, -0.340057373046875, -0.3221435546875, -0.304229736328125, -0.28631591796875, -0.268402099609375, -0.25048828125, -0.232574462890625, -0.21466064453125, -0.196746826171875, -0.1788330078125, -0.160919189453125, -0.14300537109375, -0.125091552734375, -0.107177734375, -0.089263916015625, -0.07135009765625, -0.053436279296875, -0.0355224609375, -0.017608642578125, 0.00030517578125, 0.018218994140625, 0.0361328125, 0.054046630859375, 0.07196044921875, 0.089874267578125, 0.1077880859375, 0.125701904296875, 0.14361572265625, 0.161529541015625, 0.179443359375, 0.197357177734375, 0.21527099609375, 0.233184814453125, 0.2510986328125, 0.269012451171875, 0.28692626953125, 0.304840087890625, 0.32275390625, 0.340667724609375, 0.35858154296875, 0.376495361328125, 0.3944091796875, 0.412322998046875, 0.43023681640625, 0.448150634765625, 0.466064453125, 0.483978271484375, 0.50189208984375, 0.519805908203125, 0.5377197265625, 0.555633544921875, 0.57354736328125, 0.591461181640625, 0.609375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 9.0, 6.0, 19.0, 17.0, 27.0, 32.0, 36.0, 50.0, 53.0, 68.0, 84.0, 77.0, 84.0, 85.0, 71.0, 45.0, 57.0, 45.0, 32.0, 21.0, 21.0, 13.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.466853141784668, -11.204253196716309, -10.941654205322266, -10.679054260253906, -10.416454315185547, -10.153854370117188, -9.891255378723145, -9.628655433654785, -9.366056442260742, -9.103456497192383, -8.84085750579834, -8.57825756072998, -8.315657615661621, -8.053058624267578, -7.790458679199219, -7.527858734130859, -7.2652587890625, -7.002659320831299, -6.7400593757629395, -6.477459907531738, -6.214859962463379, -5.952260494232178, -5.689661026000977, -5.427061080932617, -5.164461612701416, -4.901862144470215, -4.6392621994018555, -4.376662731170654, -4.114063262939453, -3.8514633178710938, -3.5888638496398926, -3.3262641429901123, -3.0636649131774902, -2.80106520652771, -2.5384654998779297, -2.2758660316467285, -2.0132663249969482, -1.750666618347168, -1.4880670309066772, -1.2254674434661865, -0.9628677368164062, -0.7002680897712708, -0.43766844272613525, -0.17506879568099976, 0.08753085136413574, 0.350130558013916, 0.6127301454544067, 0.8753297328948975, 1.1379294395446777, 1.400529146194458, 1.6631287336349487, 1.9257283210754395, 2.1883280277252197, 2.450927734375, 2.713527202606201, 2.9761269092559814, 3.2387266159057617, 3.501326322555542, 3.7639260292053223, 4.026525497436523, 4.289125442504883, 4.551724910736084, 4.814324378967285, 5.0769243240356445, 5.339523792266846]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 6.0, 11.0, 7.0, 10.0, 9.0, 18.0, 16.0, 9.0, 19.0, 22.0, 23.0, 24.0, 34.0, 17.0, 30.0, 46.0, 38.0, 37.0, 27.0, 32.0, 40.0, 36.0, 34.0, 40.0, 37.0, 34.0, 35.0, 30.0, 34.0, 27.0, 22.0, 28.0, 20.0, 24.0, 27.0, 13.0, 15.0, 7.0, 9.0, 13.0, 7.0, 8.0, 3.0, 2.0, 6.0, 2.0, 3.0, 3.0], "bins": [-3.6605007648468018, -3.561526298522949, -3.4625518321990967, -3.363577365875244, -3.2646028995513916, -3.165628433227539, -3.0666542053222656, -2.967679500579834, -2.8687052726745605, -2.769730806350708, -2.6707563400268555, -2.571781873703003, -2.4728074073791504, -2.373832941055298, -2.2748584747314453, -2.175884246826172, -2.0769095420837402, -1.9779350757598877, -1.8789606094360352, -1.7799861431121826, -1.68101167678833, -1.5820372104644775, -1.4830628633499146, -1.384088397026062, -1.2851139307022095, -1.186139464378357, -1.0871649980545044, -0.9881905913352966, -0.8892161250114441, -0.7902416586875916, -0.6912672519683838, -0.5922927856445312, -0.4933185577392578, -0.3943440914154053, -0.2953696548938751, -0.19639521837234497, -0.09742075204849243, 0.0015537142753601074, 0.10052812099456787, 0.1995025873184204, 0.29847705364227295, 0.3974515199661255, 0.49642595648765564, 0.5954003930091858, 0.6943748593330383, 0.7933493256568909, 0.8923237323760986, 0.9912981986999512, 1.0902726650238037, 1.1892471313476562, 1.2882215976715088, 1.3871960639953613, 1.4861705303192139, 1.5851449966430664, 1.6841193437576294, 1.783093810081482, 1.8820682764053345, 1.981042742729187, 2.08001708984375, 2.1789915561676025, 2.277966022491455, 2.3769404888153076, 2.47591495513916, 2.5748894214630127, 2.6738638877868652]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 10.0, 9.0, 15.0, 20.0, 41.0, 70.0, 89.0, 150.0, 205.0, 336.0, 542.0, 804.0, 1235.0, 1962.0, 2972.0, 4838.0, 7735.0, 12120.0, 19637.0, 30766.0, 47737.0, 72049.0, 102205.0, 131174.0, 145811.0, 136303.0, 107896.0, 77880.0, 52051.0, 33947.0, 21338.0, 13611.0, 8305.0, 5409.0, 3276.0, 2182.0, 1372.0, 853.0, 549.0, 373.0, 241.0, 145.0, 108.0, 55.0, 44.0, 28.0, 19.0, 18.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.134765625, -3.041473388671875, -2.94818115234375, -2.854888916015625, -2.7615966796875, -2.668304443359375, -2.57501220703125, -2.481719970703125, -2.388427734375, -2.295135498046875, -2.20184326171875, -2.108551025390625, -2.0152587890625, -1.921966552734375, -1.82867431640625, -1.735382080078125, -1.64208984375, -1.548797607421875, -1.45550537109375, -1.362213134765625, -1.2689208984375, -1.175628662109375, -1.08233642578125, -0.989044189453125, -0.895751953125, -0.802459716796875, -0.70916748046875, -0.615875244140625, -0.5225830078125, -0.429290771484375, -0.33599853515625, -0.242706298828125, -0.1494140625, -0.056121826171875, 0.03717041015625, 0.130462646484375, 0.2237548828125, 0.317047119140625, 0.41033935546875, 0.503631591796875, 0.596923828125, 0.690216064453125, 0.78350830078125, 0.876800537109375, 0.9700927734375, 1.063385009765625, 1.15667724609375, 1.249969482421875, 1.34326171875, 1.436553955078125, 1.52984619140625, 1.623138427734375, 1.7164306640625, 1.809722900390625, 1.90301513671875, 1.996307373046875, 2.089599609375, 2.182891845703125, 2.27618408203125, 2.369476318359375, 2.4627685546875, 2.556060791015625, 2.64935302734375, 2.742645263671875, 2.8359375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 1.0, 8.0, 6.0, 10.0, 9.0, 18.0, 18.0, 12.0, 16.0, 24.0, 19.0, 25.0, 30.0, 34.0, 36.0, 32.0, 38.0, 52.0, 38.0, 41.0, 42.0, 37.0, 32.0, 40.0, 39.0, 39.0, 29.0, 35.0, 21.0, 30.0, 26.0, 32.0, 18.0, 24.0, 18.0, 13.0, 14.0, 10.0, 9.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.03125, -3.91534423828125, -3.7994384765625, -3.68353271484375, -3.567626953125, -3.45172119140625, -3.3358154296875, -3.21990966796875, -3.10400390625, -2.98809814453125, -2.8721923828125, -2.75628662109375, -2.640380859375, -2.52447509765625, -2.4085693359375, -2.29266357421875, -2.1767578125, -2.06085205078125, -1.9449462890625, -1.82904052734375, -1.713134765625, -1.59722900390625, -1.4813232421875, -1.36541748046875, -1.24951171875, -1.13360595703125, -1.0177001953125, -0.90179443359375, -0.785888671875, -0.66998291015625, -0.5540771484375, -0.43817138671875, -0.322265625, -0.20635986328125, -0.0904541015625, 0.02545166015625, 0.141357421875, 0.25726318359375, 0.3731689453125, 0.48907470703125, 0.60498046875, 0.72088623046875, 0.8367919921875, 0.95269775390625, 1.068603515625, 1.18450927734375, 1.3004150390625, 1.41632080078125, 1.5322265625, 1.64813232421875, 1.7640380859375, 1.87994384765625, 1.995849609375, 2.11175537109375, 2.2276611328125, 2.34356689453125, 2.45947265625, 2.57537841796875, 2.6912841796875, 2.80718994140625, 2.923095703125, 3.03900146484375, 3.1549072265625, 3.27081298828125, 3.38671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 6.0, 3.0, 12.0, 18.0, 19.0, 26.0, 61.0, 83.0, 98.0, 124.0, 254.0, 381.0, 624.0, 931.0, 1703.0, 2685.0, 4604.0, 8325.0, 14751.0, 26124.0, 46965.0, 80250.0, 126115.0, 168825.0, 179383.0, 147230.0, 99417.0, 60173.0, 34397.0, 19537.0, 10708.0, 5989.0, 3427.0, 2055.0, 1190.0, 730.0, 439.0, 311.0, 197.0, 131.0, 102.0, 50.0, 44.0, 22.0, 12.0, 7.0, 12.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.62890625, -3.50885009765625, -3.3887939453125, -3.26873779296875, -3.148681640625, -3.02862548828125, -2.9085693359375, -2.78851318359375, -2.66845703125, -2.54840087890625, -2.4283447265625, -2.30828857421875, -2.188232421875, -2.06817626953125, -1.9481201171875, -1.82806396484375, -1.7080078125, -1.58795166015625, -1.4678955078125, -1.34783935546875, -1.227783203125, -1.10772705078125, -0.9876708984375, -0.86761474609375, -0.74755859375, -0.62750244140625, -0.5074462890625, -0.38739013671875, -0.267333984375, -0.14727783203125, -0.0272216796875, 0.09283447265625, 0.212890625, 0.33294677734375, 0.4530029296875, 0.57305908203125, 0.693115234375, 0.81317138671875, 0.9332275390625, 1.05328369140625, 1.17333984375, 1.29339599609375, 1.4134521484375, 1.53350830078125, 1.653564453125, 1.77362060546875, 1.8936767578125, 2.01373291015625, 2.1337890625, 2.25384521484375, 2.3739013671875, 2.49395751953125, 2.614013671875, 2.73406982421875, 2.8541259765625, 2.97418212890625, 3.09423828125, 3.21429443359375, 3.3343505859375, 3.45440673828125, 3.574462890625, 3.69451904296875, 3.8145751953125, 3.93463134765625, 4.0546875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 9.0, 13.0, 19.0, 23.0, 11.0, 16.0, 27.0, 25.0, 33.0, 31.0, 29.0, 47.0, 30.0, 42.0, 41.0, 38.0, 40.0, 43.0, 34.0, 40.0, 36.0, 31.0, 35.0, 41.0, 26.0, 23.0, 38.0, 21.0, 20.0, 15.0, 17.0, 20.0, 17.0, 13.0, 6.0, 7.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.248046875, -2.1796875, -2.111328125, -2.04296875, -1.974609375, -1.90625, -1.837890625, -1.76953125, -1.701171875, -1.6328125, -1.564453125, -1.49609375, -1.427734375, -1.359375, -1.291015625, -1.22265625, -1.154296875, -1.0859375, -1.017578125, -0.94921875, -0.880859375, -0.8125, -0.744140625, -0.67578125, -0.607421875, -0.5390625, -0.470703125, -0.40234375, -0.333984375, -0.265625, -0.197265625, -0.12890625, -0.060546875, 0.0078125, 0.076171875, 0.14453125, 0.212890625, 0.28125, 0.349609375, 0.41796875, 0.486328125, 0.5546875, 0.623046875, 0.69140625, 0.759765625, 0.828125, 0.896484375, 0.96484375, 1.033203125, 1.1015625, 1.169921875, 1.23828125, 1.306640625, 1.375, 1.443359375, 1.51171875, 1.580078125, 1.6484375, 1.716796875, 1.78515625, 1.853515625, 1.921875, 1.990234375, 2.05859375, 2.126953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 14.0, 16.0, 20.0, 36.0, 53.0, 80.0, 85.0, 153.0, 244.0, 365.0, 548.0, 853.0, 1293.0, 1971.0, 3140.0, 5256.0, 8743.0, 14745.0, 26099.0, 45603.0, 80069.0, 132419.0, 186168.0, 192067.0, 142289.0, 87667.0, 49740.0, 28145.0, 15954.0, 9478.0, 5704.0, 3476.0, 2151.0, 1326.0, 886.0, 550.0, 372.0, 253.0, 167.0, 108.0, 82.0, 59.0, 35.0, 23.0, 20.0, 10.0, 3.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.01953125, -1.956573486328125, -1.89361572265625, -1.830657958984375, -1.7677001953125, -1.704742431640625, -1.64178466796875, -1.578826904296875, -1.515869140625, -1.452911376953125, -1.38995361328125, -1.326995849609375, -1.2640380859375, -1.201080322265625, -1.13812255859375, -1.075164794921875, -1.01220703125, -0.949249267578125, -0.88629150390625, -0.823333740234375, -0.7603759765625, -0.697418212890625, -0.63446044921875, -0.571502685546875, -0.508544921875, -0.445587158203125, -0.38262939453125, -0.319671630859375, -0.2567138671875, -0.193756103515625, -0.13079833984375, -0.067840576171875, -0.0048828125, 0.058074951171875, 0.12103271484375, 0.183990478515625, 0.2469482421875, 0.309906005859375, 0.37286376953125, 0.435821533203125, 0.498779296875, 0.561737060546875, 0.62469482421875, 0.687652587890625, 0.7506103515625, 0.813568115234375, 0.87652587890625, 0.939483642578125, 1.00244140625, 1.065399169921875, 1.12835693359375, 1.191314697265625, 1.2542724609375, 1.317230224609375, 1.38018798828125, 1.443145751953125, 1.506103515625, 1.569061279296875, 1.63201904296875, 1.694976806640625, 1.7579345703125, 1.820892333984375, 1.88385009765625, 1.946807861328125, 2.009765625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 7.0, 5.0, 7.0, 11.0, 6.0, 12.0, 21.0, 15.0, 20.0, 15.0, 35.0, 25.0, 33.0, 46.0, 62.0, 59.0, 73.0, 56.0, 70.0, 66.0, 57.0, 54.0, 36.0, 39.0, 30.0, 29.0, 20.0, 20.0, 13.0, 8.0, 10.0, 4.0, 4.0, 6.0, 4.0, 1.0, 5.0, 0.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00015461444854736328, -0.00014940090477466583, -0.00014418736100196838, -0.00013897381722927094, -0.00013376027345657349, -0.00012854672968387604, -0.0001233331859111786, -0.00011811964213848114, -0.00011290609836578369, -0.00010769255459308624, -0.0001024790108203888, -9.726546704769135e-05, -9.20519232749939e-05, -8.683837950229645e-05, -8.1624835729599e-05, -7.641129195690155e-05, -7.11977481842041e-05, -6.598420441150665e-05, -6.0770660638809204e-05, -5.5557116866111755e-05, -5.034357309341431e-05, -4.513002932071686e-05, -3.991648554801941e-05, -3.470294177532196e-05, -2.9489398002624512e-05, -2.4275854229927063e-05, -1.9062310457229614e-05, -1.3848766684532166e-05, -8.635222911834717e-06, -3.421679139137268e-06, 1.7918646335601807e-06, 7.005408406257629e-06, 1.2218952178955078e-05, 1.7432495951652527e-05, 2.2646039724349976e-05, 2.7859583497047424e-05, 3.307312726974487e-05, 3.828667104244232e-05, 4.350021481513977e-05, 4.871375858783722e-05, 5.392730236053467e-05, 5.914084613323212e-05, 6.435438990592957e-05, 6.956793367862701e-05, 7.478147745132446e-05, 7.999502122402191e-05, 8.520856499671936e-05, 9.042210876941681e-05, 9.563565254211426e-05, 0.0001008491963148117, 0.00010606274008750916, 0.0001112762838602066, 0.00011648982763290405, 0.0001217033714056015, 0.00012691691517829895, 0.0001321304589509964, 0.00013734400272369385, 0.0001425575464963913, 0.00014777109026908875, 0.0001529846340417862, 0.00015819817781448364, 0.0001634117215871811, 0.00016862526535987854, 0.000173838809132576, 0.00017905235290527344]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 9.0, 10.0, 15.0, 25.0, 43.0, 54.0, 78.0, 143.0, 183.0, 289.0, 476.0, 656.0, 942.0, 1556.0, 2350.0, 3634.0, 5619.0, 9003.0, 14003.0, 23070.0, 37773.0, 61837.0, 96545.0, 139649.0, 168504.0, 157702.0, 118754.0, 78360.0, 48307.0, 29741.0, 17999.0, 11352.0, 6998.0, 4576.0, 2754.0, 1883.0, 1205.0, 806.0, 514.0, 388.0, 222.0, 173.0, 116.0, 84.0, 54.0, 26.0, 25.0, 19.0, 8.0, 4.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8056640625, -1.7505340576171875, -1.695404052734375, -1.6402740478515625, -1.58514404296875, -1.5300140380859375, -1.474884033203125, -1.4197540283203125, -1.3646240234375, -1.3094940185546875, -1.254364013671875, -1.1992340087890625, -1.14410400390625, -1.0889739990234375, -1.033843994140625, -0.9787139892578125, -0.923583984375, -0.8684539794921875, -0.813323974609375, -0.7581939697265625, -0.70306396484375, -0.6479339599609375, -0.592803955078125, -0.5376739501953125, -0.4825439453125, -0.4274139404296875, -0.372283935546875, -0.3171539306640625, -0.26202392578125, -0.2068939208984375, -0.151763916015625, -0.0966339111328125, -0.04150390625, 0.0136260986328125, 0.068756103515625, 0.1238861083984375, 0.17901611328125, 0.2341461181640625, 0.289276123046875, 0.3444061279296875, 0.3995361328125, 0.4546661376953125, 0.509796142578125, 0.5649261474609375, 0.62005615234375, 0.6751861572265625, 0.730316162109375, 0.7854461669921875, 0.840576171875, 0.8957061767578125, 0.950836181640625, 1.0059661865234375, 1.06109619140625, 1.1162261962890625, 1.171356201171875, 1.2264862060546875, 1.2816162109375, 1.3367462158203125, 1.391876220703125, 1.4470062255859375, 1.50213623046875, 1.5572662353515625, 1.612396240234375, 1.6675262451171875, 1.72265625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 2.0, 4.0, 3.0, 7.0, 8.0, 4.0, 12.0, 13.0, 22.0, 13.0, 24.0, 21.0, 25.0, 29.0, 40.0, 39.0, 59.0, 40.0, 50.0, 54.0, 59.0, 55.0, 38.0, 45.0, 44.0, 52.0, 40.0, 35.0, 31.0, 26.0, 18.0, 11.0, 18.0, 7.0, 10.0, 7.0, 3.0, 7.0, 0.0, 8.0, 5.0, 3.0, 6.0, 0.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54296875, -0.5252151489257812, -0.5074615478515625, -0.48970794677734375, -0.471954345703125, -0.45420074462890625, -0.4364471435546875, -0.41869354248046875, -0.40093994140625, -0.38318634033203125, -0.3654327392578125, -0.34767913818359375, -0.329925537109375, -0.31217193603515625, -0.2944183349609375, -0.27666473388671875, -0.2589111328125, -0.24115753173828125, -0.2234039306640625, -0.20565032958984375, -0.187896728515625, -0.17014312744140625, -0.1523895263671875, -0.13463592529296875, -0.11688232421875, -0.09912872314453125, -0.0813751220703125, -0.06362152099609375, -0.045867919921875, -0.02811431884765625, -0.0103607177734375, 0.00739288330078125, 0.025146484375, 0.04290008544921875, 0.0606536865234375, 0.07840728759765625, 0.096160888671875, 0.11391448974609375, 0.1316680908203125, 0.14942169189453125, 0.16717529296875, 0.18492889404296875, 0.2026824951171875, 0.22043609619140625, 0.238189697265625, 0.25594329833984375, 0.2736968994140625, 0.29145050048828125, 0.3092041015625, 0.32695770263671875, 0.3447113037109375, 0.36246490478515625, 0.380218505859375, 0.39797210693359375, 0.4157257080078125, 0.43347930908203125, 0.45123291015625, 0.46898651123046875, 0.4867401123046875, 0.5044937133789062, 0.522247314453125, 0.5400009155273438, 0.5577545166015625, 0.5755081176757812, 0.59326171875]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 5.0, 10.0, 10.0, 14.0, 17.0, 24.0, 34.0, 45.0, 53.0, 55.0, 71.0, 69.0, 92.0, 76.0, 89.0, 56.0, 61.0, 44.0, 51.0, 38.0, 22.0, 18.0, 7.0, 8.0, 4.0, 8.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0], "bins": [-11.977826118469238, -11.709940910339355, -11.442055702209473, -11.17417049407959, -10.906285285949707, -10.638400077819824, -10.370514869689941, -10.102629661560059, -9.834744453430176, -9.566859245300293, -9.29897403717041, -9.031088829040527, -8.763203620910645, -8.495318412780762, -8.227433204650879, -7.959547996520996, -7.691662788391113, -7.4237775802612305, -7.155892372131348, -6.888007164001465, -6.620121955871582, -6.352236747741699, -6.084351539611816, -5.816466331481934, -5.548581123352051, -5.280695915222168, -5.012810707092285, -4.744925498962402, -4.4770402908325195, -4.209155082702637, -3.941269874572754, -3.673384666442871, -3.40549898147583, -3.1376137733459473, -2.8697285652160645, -2.6018433570861816, -2.333958148956299, -2.066072940826416, -1.7981877326965332, -1.5303025245666504, -1.2624173164367676, -0.9945321083068848, -0.726646900177002, -0.45876169204711914, -0.19087648391723633, 0.07700872421264648, 0.3448939323425293, 0.6127791404724121, 0.8806643486022949, 1.1485495567321777, 1.4164347648620605, 1.6843199729919434, 1.9522051811218262, 2.220090389251709, 2.487975597381592, 2.7558608055114746, 3.0237460136413574, 3.2916312217712402, 3.559516429901123, 3.827401638031006, 4.095286846160889, 4.3631720542907715, 4.631057262420654, 4.898942470550537, 5.16682767868042]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 7.0, 5.0, 4.0, 3.0, 7.0, 7.0, 9.0, 11.0, 11.0, 9.0, 17.0, 22.0, 13.0, 22.0, 28.0, 20.0, 31.0, 30.0, 36.0, 38.0, 41.0, 38.0, 33.0, 35.0, 32.0, 33.0, 35.0, 40.0, 39.0, 37.0, 41.0, 31.0, 23.0, 28.0, 25.0, 24.0, 21.0, 25.0, 17.0, 12.0, 11.0, 10.0, 13.0, 12.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.248361110687256, -3.1510603427886963, -3.0537595748901367, -2.956458806991577, -2.8591580390930176, -2.761857032775879, -2.6645562648773193, -2.5672554969787598, -2.4699547290802, -2.3726539611816406, -2.275353193283081, -2.1780524253845215, -2.080751419067383, -1.9834507703781128, -1.8861498832702637, -1.788849115371704, -1.6915483474731445, -1.594247579574585, -1.4969468116760254, -1.3996459245681763, -1.3023451566696167, -1.2050443887710571, -1.107743501663208, -1.0104427337646484, -0.9131419658660889, -0.8158411979675293, -0.718540370464325, -0.6212395429611206, -0.523938775062561, -0.4266379773616791, -0.3293371796607971, -0.23203635215759277, -0.1347355842590332, -0.037434786558151245, 0.05986601114273071, 0.15716680884361267, 0.25446760654449463, 0.3517684042453766, 0.44906920194625854, 0.5463700294494629, 0.6436707973480225, 0.740971565246582, 0.8382723927497864, 0.9355732202529907, 1.0328739881515503, 1.1301747560501099, 1.227475643157959, 1.3247764110565186, 1.4220771789550781, 1.5193779468536377, 1.6166787147521973, 1.7139796018600464, 1.811280369758606, 1.9085811376571655, 2.0058820247650146, 2.103182792663574, 2.200483560562134, 2.2977843284606934, 2.395085096359253, 2.4923858642578125, 2.589686870574951, 2.6869876384735107, 2.7842884063720703, 2.88158917427063, 2.9788899421691895]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 15.0, 12.0, 20.0, 36.0, 56.0, 79.0, 112.0, 177.0, 240.0, 410.0, 651.0, 936.0, 1416.0, 2296.0, 3555.0, 5917.0, 9694.0, 16779.0, 31459.0, 62304.0, 138526.0, 351733.0, 897125.0, 1328063.0, 790685.0, 306923.0, 123185.0, 55775.0, 28404.0, 15143.0, 8743.0, 5183.0, 3133.0, 1970.0, 1197.0, 833.0, 551.0, 324.0, 226.0, 141.0, 102.0, 54.0, 37.0, 24.0, 12.0, 7.0, 6.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.23046875, -6.038330078125, -5.84619140625, -5.654052734375, -5.4619140625, -5.269775390625, -5.07763671875, -4.885498046875, -4.693359375, -4.501220703125, -4.30908203125, -4.116943359375, -3.9248046875, -3.732666015625, -3.54052734375, -3.348388671875, -3.15625, -2.964111328125, -2.77197265625, -2.579833984375, -2.3876953125, -2.195556640625, -2.00341796875, -1.811279296875, -1.619140625, -1.427001953125, -1.23486328125, -1.042724609375, -0.8505859375, -0.658447265625, -0.46630859375, -0.274169921875, -0.08203125, 0.110107421875, 0.30224609375, 0.494384765625, 0.6865234375, 0.878662109375, 1.07080078125, 1.262939453125, 1.455078125, 1.647216796875, 1.83935546875, 2.031494140625, 2.2236328125, 2.415771484375, 2.60791015625, 2.800048828125, 2.9921875, 3.184326171875, 3.37646484375, 3.568603515625, 3.7607421875, 3.952880859375, 4.14501953125, 4.337158203125, 4.529296875, 4.721435546875, 4.91357421875, 5.105712890625, 5.2978515625, 5.489990234375, 5.68212890625, 5.874267578125, 6.06640625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 4.0, 6.0, 10.0, 9.0, 9.0, 16.0, 23.0, 23.0, 19.0, 34.0, 30.0, 30.0, 34.0, 32.0, 40.0, 40.0, 36.0, 50.0, 45.0, 37.0, 44.0, 47.0, 39.0, 29.0, 31.0, 25.0, 33.0, 31.0, 26.0, 25.0, 17.0, 21.0, 21.0, 15.0, 13.0, 10.0, 5.0, 6.0, 5.0, 0.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-2.873046875, -2.79534912109375, -2.7176513671875, -2.63995361328125, -2.562255859375, -2.48455810546875, -2.4068603515625, -2.32916259765625, -2.25146484375, -2.17376708984375, -2.0960693359375, -2.01837158203125, -1.940673828125, -1.86297607421875, -1.7852783203125, -1.70758056640625, -1.6298828125, -1.55218505859375, -1.4744873046875, -1.39678955078125, -1.319091796875, -1.24139404296875, -1.1636962890625, -1.08599853515625, -1.00830078125, -0.93060302734375, -0.8529052734375, -0.77520751953125, -0.697509765625, -0.61981201171875, -0.5421142578125, -0.46441650390625, -0.38671875, -0.30902099609375, -0.2313232421875, -0.15362548828125, -0.075927734375, 0.00177001953125, 0.0794677734375, 0.15716552734375, 0.23486328125, 0.31256103515625, 0.3902587890625, 0.46795654296875, 0.545654296875, 0.62335205078125, 0.7010498046875, 0.77874755859375, 0.8564453125, 0.93414306640625, 1.0118408203125, 1.08953857421875, 1.167236328125, 1.24493408203125, 1.3226318359375, 1.40032958984375, 1.47802734375, 1.55572509765625, 1.6334228515625, 1.71112060546875, 1.788818359375, 1.86651611328125, 1.9442138671875, 2.02191162109375, 2.099609375]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 12.0, 9.0, 9.0, 9.0, 19.0, 25.0, 43.0, 48.0, 86.0, 108.0, 182.0, 278.0, 412.0, 652.0, 1140.0, 1884.0, 3304.0, 6004.0, 11249.0, 21944.0, 45933.0, 101393.0, 246739.0, 643707.0, 1357316.0, 1039397.0, 411963.0, 162183.0, 69929.0, 32781.0, 16270.0, 8441.0, 4640.0, 2492.0, 1407.0, 865.0, 495.0, 315.0, 213.0, 112.0, 74.0, 72.0, 51.0, 23.0, 21.0, 15.0, 3.0, 14.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1328125, -6.9010009765625, -6.669189453125, -6.4373779296875, -6.20556640625, -5.9737548828125, -5.741943359375, -5.5101318359375, -5.2783203125, -5.0465087890625, -4.814697265625, -4.5828857421875, -4.35107421875, -4.1192626953125, -3.887451171875, -3.6556396484375, -3.423828125, -3.1920166015625, -2.960205078125, -2.7283935546875, -2.49658203125, -2.2647705078125, -2.032958984375, -1.8011474609375, -1.5693359375, -1.3375244140625, -1.105712890625, -0.8739013671875, -0.64208984375, -0.4102783203125, -0.178466796875, 0.0533447265625, 0.28515625, 0.5169677734375, 0.748779296875, 0.9805908203125, 1.21240234375, 1.4442138671875, 1.676025390625, 1.9078369140625, 2.1396484375, 2.3714599609375, 2.603271484375, 2.8350830078125, 3.06689453125, 3.2987060546875, 3.530517578125, 3.7623291015625, 3.994140625, 4.2259521484375, 4.457763671875, 4.6895751953125, 4.92138671875, 5.1531982421875, 5.385009765625, 5.6168212890625, 5.8486328125, 6.0804443359375, 6.312255859375, 6.5440673828125, 6.77587890625, 7.0076904296875, 7.239501953125, 7.4713134765625, 7.703125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 4.0, 5.0, 11.0, 18.0, 20.0, 27.0, 36.0, 47.0, 63.0, 67.0, 97.0, 118.0, 149.0, 172.0, 233.0, 264.0, 333.0, 308.0, 358.0, 289.0, 328.0, 242.0, 191.0, 143.0, 127.0, 77.0, 80.0, 60.0, 46.0, 37.0, 26.0, 21.0, 13.0, 11.0, 11.0, 11.0, 5.0, 7.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8330078125, -1.774169921875, -1.71533203125, -1.656494140625, -1.59765625, -1.538818359375, -1.47998046875, -1.421142578125, -1.3623046875, -1.303466796875, -1.24462890625, -1.185791015625, -1.126953125, -1.068115234375, -1.00927734375, -0.950439453125, -0.8916015625, -0.832763671875, -0.77392578125, -0.715087890625, -0.65625, -0.597412109375, -0.53857421875, -0.479736328125, -0.4208984375, -0.362060546875, -0.30322265625, -0.244384765625, -0.185546875, -0.126708984375, -0.06787109375, -0.009033203125, 0.0498046875, 0.108642578125, 0.16748046875, 0.226318359375, 0.28515625, 0.343994140625, 0.40283203125, 0.461669921875, 0.5205078125, 0.579345703125, 0.63818359375, 0.697021484375, 0.755859375, 0.814697265625, 0.87353515625, 0.932373046875, 0.9912109375, 1.050048828125, 1.10888671875, 1.167724609375, 1.2265625, 1.285400390625, 1.34423828125, 1.403076171875, 1.4619140625, 1.520751953125, 1.57958984375, 1.638427734375, 1.697265625, 1.756103515625, 1.81494140625, 1.873779296875, 1.9326171875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 8.0, 9.0, 10.0, 23.0, 31.0, 43.0, 59.0, 79.0, 94.0, 99.0, 109.0, 98.0, 91.0, 73.0, 52.0, 32.0, 33.0, 19.0, 12.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-16.24724769592285, -15.90961742401123, -15.571986198425293, -15.234355926513672, -14.89672565460205, -14.55909538269043, -14.221464157104492, -13.883833885192871, -13.54620361328125, -13.208573341369629, -12.870942115783691, -12.53331184387207, -12.19568157196045, -11.858051300048828, -11.52042007446289, -11.18278980255127, -10.845159530639648, -10.507529258728027, -10.16989803314209, -9.832267761230469, -9.494637489318848, -9.157007217407227, -8.819375991821289, -8.481745719909668, -8.14411449432373, -7.806483745574951, -7.46885347366333, -7.131222724914551, -6.79359245300293, -6.45596170425415, -6.118330955505371, -5.78070068359375, -5.443070411682129, -5.10543966293335, -4.7678093910217285, -4.430178642272949, -4.092548370361328, -3.754917621612549, -3.4172871112823486, -3.0796566009521484, -2.7420260906219482, -2.404395580291748, -2.066765069961548, -1.729134440422058, -1.391503930091858, -1.0538734197616577, -0.716242790222168, -0.3786122798919678, -0.04098176956176758, 0.296648770570755, 0.6342793107032776, 0.9719098806381226, 1.3095403909683228, 1.647170901298523, 1.9848015308380127, 2.322432041168213, 2.660062551498413, 2.9976930618286133, 3.3353235721588135, 3.6729540824890137, 4.010584831237793, 4.348215103149414, 4.685845851898193, 5.023476600646973, 5.361106872558594]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 4.0, 18.0, 5.0, 11.0, 14.0, 18.0, 14.0, 21.0, 23.0, 32.0, 23.0, 30.0, 31.0, 46.0, 39.0, 40.0, 43.0, 49.0, 31.0, 36.0, 42.0, 47.0, 43.0, 43.0, 38.0, 43.0, 29.0, 29.0, 21.0, 22.0, 25.0, 18.0, 11.0, 9.0, 14.0, 9.0, 7.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.53413724899292, -3.4264910221099854, -3.318844795227051, -3.211198329925537, -3.1035521030426025, -2.995905876159668, -2.8882596492767334, -2.780613422393799, -2.672966957092285, -2.5653207302093506, -2.457674503326416, -2.3500280380249023, -2.2423818111419678, -2.134735584259033, -2.0270893573760986, -1.919443130493164, -1.8117969036102295, -1.704150676727295, -1.5965043306350708, -1.4888581037521362, -1.381211757659912, -1.2735655307769775, -1.165919303894043, -1.0582730770111084, -0.9506267309188843, -0.8429804444313049, -0.7353341579437256, -0.627687931060791, -0.5200416445732117, -0.4123953580856323, -0.30474913120269775, -0.1971028447151184, -0.08945631980895996, 0.01818995177745819, 0.12583622336387634, 0.2334824800491333, 0.34112876653671265, 0.448775053024292, 0.5564212799072266, 0.6640675663948059, 0.7717138528823853, 0.8793601393699646, 0.987006425857544, 1.0946526527404785, 1.202298879623413, 1.3099452257156372, 1.4175914525985718, 1.525237798690796, 1.6328840255737305, 1.740530252456665, 1.8481765985488892, 1.9558228254318237, 2.063469171524048, 2.1711153984069824, 2.278761625289917, 2.3864078521728516, 2.4940543174743652, 2.6017005443573, 2.7093467712402344, 2.816993236541748, 2.9246394634246826, 3.032285690307617, 3.1399319171905518, 3.2475781440734863, 3.355224370956421]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 6.0, 1.0, 6.0, 11.0, 7.0, 18.0, 17.0, 33.0, 28.0, 49.0, 62.0, 94.0, 110.0, 170.0, 229.0, 368.0, 555.0, 844.0, 1390.0, 2547.0, 4944.0, 11641.0, 31167.0, 93130.0, 265344.0, 368857.0, 174081.0, 56532.0, 19768.0, 7764.0, 3635.0, 1929.0, 1061.0, 672.0, 449.0, 291.0, 203.0, 159.0, 127.0, 71.0, 41.0, 38.0, 28.0, 27.0, 11.0, 12.0, 6.0, 8.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-5.15625, -4.9859619140625, -4.815673828125, -4.6453857421875, -4.47509765625, -4.3048095703125, -4.134521484375, -3.9642333984375, -3.7939453125, -3.6236572265625, -3.453369140625, -3.2830810546875, -3.11279296875, -2.9425048828125, -2.772216796875, -2.6019287109375, -2.431640625, -2.2613525390625, -2.091064453125, -1.9207763671875, -1.75048828125, -1.5802001953125, -1.409912109375, -1.2396240234375, -1.0693359375, -0.8990478515625, -0.728759765625, -0.5584716796875, -0.38818359375, -0.2178955078125, -0.047607421875, 0.1226806640625, 0.29296875, 0.4632568359375, 0.633544921875, 0.8038330078125, 0.97412109375, 1.1444091796875, 1.314697265625, 1.4849853515625, 1.6552734375, 1.8255615234375, 1.995849609375, 2.1661376953125, 2.33642578125, 2.5067138671875, 2.677001953125, 2.8472900390625, 3.017578125, 3.1878662109375, 3.358154296875, 3.5284423828125, 3.69873046875, 3.8690185546875, 4.039306640625, 4.2095947265625, 4.3798828125, 4.5501708984375, 4.720458984375, 4.8907470703125, 5.06103515625, 5.2313232421875, 5.401611328125, 5.5718994140625, 5.7421875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 2.0, 6.0, 15.0, 7.0, 15.0, 16.0, 24.0, 15.0, 31.0, 26.0, 29.0, 37.0, 41.0, 49.0, 49.0, 39.0, 50.0, 43.0, 34.0, 47.0, 52.0, 43.0, 35.0, 44.0, 33.0, 25.0, 33.0, 18.0, 25.0, 17.0, 21.0, 19.0, 16.0, 4.0, 8.0, 5.0, 5.0, 8.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6875, -3.56463623046875, -3.4417724609375, -3.31890869140625, -3.196044921875, -3.07318115234375, -2.9503173828125, -2.82745361328125, -2.70458984375, -2.58172607421875, -2.4588623046875, -2.33599853515625, -2.213134765625, -2.09027099609375, -1.9674072265625, -1.84454345703125, -1.7216796875, -1.59881591796875, -1.4759521484375, -1.35308837890625, -1.230224609375, -1.10736083984375, -0.9844970703125, -0.86163330078125, -0.73876953125, -0.61590576171875, -0.4930419921875, -0.37017822265625, -0.247314453125, -0.12445068359375, -0.0015869140625, 0.12127685546875, 0.244140625, 0.36700439453125, 0.4898681640625, 0.61273193359375, 0.735595703125, 0.85845947265625, 0.9813232421875, 1.10418701171875, 1.22705078125, 1.34991455078125, 1.4727783203125, 1.59564208984375, 1.718505859375, 1.84136962890625, 1.9642333984375, 2.08709716796875, 2.2099609375, 2.33282470703125, 2.4556884765625, 2.57855224609375, 2.701416015625, 2.82427978515625, 2.9471435546875, 3.07000732421875, 3.19287109375, 3.31573486328125, 3.4385986328125, 3.56146240234375, 3.684326171875, 3.80718994140625, 3.9300537109375, 4.05291748046875, 4.17578125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 10.0, 7.0, 18.0, 14.0, 20.0, 29.0, 71.0, 71.0, 123.0, 164.0, 271.0, 411.0, 709.0, 1210.0, 2190.0, 4886.0, 12545.0, 37951.0, 141016.0, 420679.0, 301290.0, 84436.0, 24547.0, 8181.0, 3448.0, 1696.0, 906.0, 573.0, 367.0, 238.0, 143.0, 109.0, 81.0, 44.0, 27.0, 20.0, 11.0, 10.0, 7.0, 3.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.4517822265625, -6.227783203125, -6.0037841796875, -5.77978515625, -5.5557861328125, -5.331787109375, -5.1077880859375, -4.8837890625, -4.6597900390625, -4.435791015625, -4.2117919921875, -3.98779296875, -3.7637939453125, -3.539794921875, -3.3157958984375, -3.091796875, -2.8677978515625, -2.643798828125, -2.4197998046875, -2.19580078125, -1.9718017578125, -1.747802734375, -1.5238037109375, -1.2998046875, -1.0758056640625, -0.851806640625, -0.6278076171875, -0.40380859375, -0.1798095703125, 0.044189453125, 0.2681884765625, 0.4921875, 0.7161865234375, 0.940185546875, 1.1641845703125, 1.38818359375, 1.6121826171875, 1.836181640625, 2.0601806640625, 2.2841796875, 2.5081787109375, 2.732177734375, 2.9561767578125, 3.18017578125, 3.4041748046875, 3.628173828125, 3.8521728515625, 4.076171875, 4.3001708984375, 4.524169921875, 4.7481689453125, 4.97216796875, 5.1961669921875, 5.420166015625, 5.6441650390625, 5.8681640625, 6.0921630859375, 6.316162109375, 6.5401611328125, 6.76416015625, 6.9881591796875, 7.212158203125, 7.4361572265625, 7.66015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 9.0, 10.0, 11.0, 15.0, 17.0, 20.0, 28.0, 18.0, 28.0, 28.0, 41.0, 31.0, 33.0, 50.0, 38.0, 48.0, 50.0, 52.0, 38.0, 48.0, 28.0, 46.0, 33.0, 26.0, 38.0, 24.0, 37.0, 20.0, 26.0, 22.0, 9.0, 16.0, 9.0, 9.0, 6.0, 11.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.204193115234375, -2.13299560546875, -2.061798095703125, -1.9906005859375, -1.919403076171875, -1.84820556640625, -1.777008056640625, -1.705810546875, -1.634613037109375, -1.56341552734375, -1.492218017578125, -1.4210205078125, -1.349822998046875, -1.27862548828125, -1.207427978515625, -1.13623046875, -1.065032958984375, -0.99383544921875, -0.922637939453125, -0.8514404296875, -0.780242919921875, -0.70904541015625, -0.637847900390625, -0.566650390625, -0.495452880859375, -0.42425537109375, -0.353057861328125, -0.2818603515625, -0.210662841796875, -0.13946533203125, -0.068267822265625, 0.0029296875, 0.074127197265625, 0.14532470703125, 0.216522216796875, 0.2877197265625, 0.358917236328125, 0.43011474609375, 0.501312255859375, 0.572509765625, 0.643707275390625, 0.71490478515625, 0.786102294921875, 0.8572998046875, 0.928497314453125, 0.99969482421875, 1.070892333984375, 1.14208984375, 1.213287353515625, 1.28448486328125, 1.355682373046875, 1.4268798828125, 1.498077392578125, 1.56927490234375, 1.640472412109375, 1.711669921875, 1.782867431640625, 1.85406494140625, 1.925262451171875, 1.9964599609375, 2.067657470703125, 2.13885498046875, 2.210052490234375, 2.28125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 9.0, 10.0, 17.0, 22.0, 38.0, 54.0, 81.0, 96.0, 149.0, 186.0, 294.0, 483.0, 658.0, 1117.0, 1764.0, 2720.0, 4537.0, 7839.0, 13872.0, 26914.0, 56676.0, 123716.0, 259729.0, 278054.0, 139667.0, 62689.0, 30155.0, 15363.0, 8589.0, 4815.0, 3002.0, 1855.0, 1124.0, 699.0, 523.0, 320.0, 221.0, 144.0, 100.0, 71.0, 57.0, 31.0, 24.0, 22.0, 15.0, 11.0, 6.0, 2.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.805206298828125, -1.74517822265625, -1.685150146484375, -1.6251220703125, -1.565093994140625, -1.50506591796875, -1.445037841796875, -1.385009765625, -1.324981689453125, -1.26495361328125, -1.204925537109375, -1.1448974609375, -1.084869384765625, -1.02484130859375, -0.964813232421875, -0.90478515625, -0.844757080078125, -0.78472900390625, -0.724700927734375, -0.6646728515625, -0.604644775390625, -0.54461669921875, -0.484588623046875, -0.424560546875, -0.364532470703125, -0.30450439453125, -0.244476318359375, -0.1844482421875, -0.124420166015625, -0.06439208984375, -0.004364013671875, 0.0556640625, 0.115692138671875, 0.17572021484375, 0.235748291015625, 0.2957763671875, 0.355804443359375, 0.41583251953125, 0.475860595703125, 0.535888671875, 0.595916748046875, 0.65594482421875, 0.715972900390625, 0.7760009765625, 0.836029052734375, 0.89605712890625, 0.956085205078125, 1.01611328125, 1.076141357421875, 1.13616943359375, 1.196197509765625, 1.2562255859375, 1.316253662109375, 1.37628173828125, 1.436309814453125, 1.496337890625, 1.556365966796875, 1.61639404296875, 1.676422119140625, 1.7364501953125, 1.796478271484375, 1.85650634765625, 1.916534423828125, 1.9765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 4.0, 5.0, 9.0, 13.0, 22.0, 12.0, 44.0, 51.0, 85.0, 126.0, 125.0, 138.0, 109.0, 80.0, 52.0, 34.0, 18.0, 16.0, 13.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014209747314453125, -0.00013664178550243378, -0.0001311860978603363, -0.00012573041021823883, -0.00012027472257614136, -0.00011481903493404388, -0.00010936334729194641, -0.00010390765964984894, -9.845197200775146e-05, -9.299628436565399e-05, -8.754059672355652e-05, -8.208490908145905e-05, -7.662922143936157e-05, -7.11735337972641e-05, -6.571784615516663e-05, -6.026215851306915e-05, -5.480647087097168e-05, -4.9350783228874207e-05, -4.3895095586776733e-05, -3.843940794467926e-05, -3.298372030258179e-05, -2.7528032660484314e-05, -2.207234501838684e-05, -1.6616657376289368e-05, -1.1160969734191895e-05, -5.705282092094421e-06, -2.4959444999694824e-07, 5.206093192100525e-06, 1.0661780834197998e-05, 1.611746847629547e-05, 2.1573156118392944e-05, 2.7028843760490417e-05, 3.248453140258789e-05, 3.7940219044685364e-05, 4.339590668678284e-05, 4.885159432888031e-05, 5.430728197097778e-05, 5.9762969613075256e-05, 6.521865725517273e-05, 7.06743448972702e-05, 7.613003253936768e-05, 8.158572018146515e-05, 8.704140782356262e-05, 9.24970954656601e-05, 9.795278310775757e-05, 0.00010340847074985504, 0.00010886415839195251, 0.00011431984603404999, 0.00011977553367614746, 0.00012523122131824493, 0.0001306869089603424, 0.00013614259660243988, 0.00014159828424453735, 0.00014705397188663483, 0.0001525096595287323, 0.00015796534717082977, 0.00016342103481292725, 0.00016887672245502472, 0.0001743324100971222, 0.00017978809773921967, 0.00018524378538131714, 0.0001906994730234146, 0.00019615516066551208, 0.00020161084830760956, 0.00020706653594970703]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 10.0, 14.0, 17.0, 23.0, 42.0, 53.0, 93.0, 126.0, 162.0, 280.0, 354.0, 616.0, 925.0, 1400.0, 2241.0, 3558.0, 6031.0, 10549.0, 18927.0, 35148.0, 69503.0, 136819.0, 228302.0, 232155.0, 143547.0, 73611.0, 36735.0, 19548.0, 10920.0, 6429.0, 3826.0, 2369.0, 1449.0, 926.0, 650.0, 385.0, 246.0, 190.0, 111.0, 82.0, 56.0, 37.0, 33.0, 18.0, 13.0, 8.0, 3.0, 1.0, 6.0, 1.0, 1.0, 3.0, 2.0], "bins": [-1.65625, -1.6075897216796875, -1.558929443359375, -1.5102691650390625, -1.46160888671875, -1.4129486083984375, -1.364288330078125, -1.3156280517578125, -1.2669677734375, -1.2183074951171875, -1.169647216796875, -1.1209869384765625, -1.07232666015625, -1.0236663818359375, -0.975006103515625, -0.9263458251953125, -0.877685546875, -0.8290252685546875, -0.780364990234375, -0.7317047119140625, -0.68304443359375, -0.6343841552734375, -0.585723876953125, -0.5370635986328125, -0.4884033203125, -0.4397430419921875, -0.391082763671875, -0.3424224853515625, -0.29376220703125, -0.2451019287109375, -0.196441650390625, -0.1477813720703125, -0.09912109375, -0.0504608154296875, -0.001800537109375, 0.0468597412109375, 0.09552001953125, 0.1441802978515625, 0.192840576171875, 0.2415008544921875, 0.2901611328125, 0.3388214111328125, 0.387481689453125, 0.4361419677734375, 0.48480224609375, 0.5334625244140625, 0.582122802734375, 0.6307830810546875, 0.679443359375, 0.7281036376953125, 0.776763916015625, 0.8254241943359375, 0.87408447265625, 0.9227447509765625, 0.971405029296875, 1.0200653076171875, 1.0687255859375, 1.1173858642578125, 1.166046142578125, 1.2147064208984375, 1.26336669921875, 1.3120269775390625, 1.360687255859375, 1.4093475341796875, 1.4580078125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 10.0, 10.0, 10.0, 11.0, 20.0, 21.0, 31.0, 53.0, 43.0, 83.0, 78.0, 108.0, 123.0, 89.0, 74.0, 65.0, 48.0, 40.0, 34.0, 16.0, 19.0, 2.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63525390625, -0.6155776977539062, -0.5959014892578125, -0.5762252807617188, -0.556549072265625, -0.5368728637695312, -0.5171966552734375, -0.49752044677734375, -0.47784423828125, -0.45816802978515625, -0.4384918212890625, -0.41881561279296875, -0.399139404296875, -0.37946319580078125, -0.3597869873046875, -0.34011077880859375, -0.3204345703125, -0.30075836181640625, -0.2810821533203125, -0.26140594482421875, -0.241729736328125, -0.22205352783203125, -0.2023773193359375, -0.18270111083984375, -0.16302490234375, -0.14334869384765625, -0.1236724853515625, -0.10399627685546875, -0.084320068359375, -0.06464385986328125, -0.0449676513671875, -0.02529144287109375, -0.005615234375, 0.01406097412109375, 0.0337371826171875, 0.05341339111328125, 0.073089599609375, 0.09276580810546875, 0.1124420166015625, 0.13211822509765625, 0.15179443359375, 0.17147064208984375, 0.1911468505859375, 0.21082305908203125, 0.230499267578125, 0.25017547607421875, 0.2698516845703125, 0.28952789306640625, 0.3092041015625, 0.32888031005859375, 0.3485565185546875, 0.36823272705078125, 0.387908935546875, 0.40758514404296875, 0.4272613525390625, 0.44693756103515625, 0.46661376953125, 0.48628997802734375, 0.5059661865234375, 0.5256423950195312, 0.545318603515625, 0.5649948120117188, 0.5846710205078125, 0.6043472290039062, 0.6240234375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 5.0, 11.0, 11.0, 16.0, 25.0, 30.0, 43.0, 67.0, 75.0, 87.0, 103.0, 113.0, 90.0, 101.0, 66.0, 47.0, 23.0, 29.0, 21.0, 14.0, 8.0, 6.0, 6.0, 4.0, 0.0, 2.0], "bins": [-15.971409797668457, -15.644852638244629, -15.318296432495117, -14.991739273071289, -14.665182113647461, -14.338624954223633, -14.012068748474121, -13.685511589050293, -13.358954429626465, -13.032397270202637, -12.705841064453125, -12.379283905029297, -12.052726745605469, -11.72616958618164, -11.399613380432129, -11.0730562210083, -10.746500015258789, -10.419942855834961, -10.09338665008545, -9.766829490661621, -9.440272331237793, -9.113715171813965, -8.787158966064453, -8.460601806640625, -8.134044647216797, -7.807487964630127, -7.480930805206299, -7.154374122619629, -6.827816963195801, -6.501260280609131, -6.174703598022461, -5.848146438598633, -5.5215888023376465, -5.195032119750977, -4.868474960327148, -4.5419182777404785, -4.21536111831665, -3.8888044357299805, -3.5622475147247314, -3.2356905937194824, -2.9091336727142334, -2.5825767517089844, -2.2560198307037354, -1.9294630289077759, -1.6029061079025269, -1.2763491868972778, -0.9497923851013184, -0.6232354640960693, -0.2966785430908203, 0.029878348112106323, 0.35643523931503296, 0.6829921007156372, 1.0095490217208862, 1.3361059427261353, 1.6626627445220947, 1.9892196655273438, 2.3157765865325928, 2.642333507537842, 2.968890428543091, 3.29544734954834, 3.6220040321350098, 3.948561191558838, 4.275117874145508, 4.601675033569336, 4.928231716156006]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 10.0, 12.0, 7.0, 15.0, 19.0, 14.0, 24.0, 24.0, 27.0, 25.0, 24.0, 43.0, 42.0, 37.0, 42.0, 51.0, 42.0, 29.0, 36.0, 44.0, 40.0, 57.0, 31.0, 45.0, 38.0, 33.0, 20.0, 22.0, 24.0, 24.0, 19.0, 9.0, 11.0, 14.0, 8.0, 5.0, 3.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.4932479858398438, -3.386782169342041, -3.2803165912628174, -3.1738507747650146, -3.067385196685791, -2.9609193801879883, -2.8544535636901855, -2.747987747192383, -2.641522169113159, -2.5350563526153564, -2.428590774536133, -2.32212495803833, -2.2156591415405273, -2.1091935634613037, -2.002727746963501, -1.8962620496749878, -1.7897963523864746, -1.6833306550979614, -1.5768649578094482, -1.4703991413116455, -1.3639334440231323, -1.2574677467346191, -1.1510019302368164, -1.0445362329483032, -0.93807053565979, -0.8316048383712769, -0.7251390814781189, -0.6186733245849609, -0.5122076272964478, -0.40574193000793457, -0.2992761731147766, -0.19281041622161865, -0.08634471893310547, 0.020121008157730103, 0.12658673524856567, 0.23305246233940125, 0.3395181894302368, 0.44598388671875, 0.552449643611908, 0.6589154005050659, 0.7653810977935791, 0.8718467950820923, 0.9783125519752502, 1.0847783088684082, 1.1912440061569214, 1.2977097034454346, 1.4041755199432373, 1.5106412172317505, 1.6171069145202637, 1.7235726118087769, 1.83003830909729, 1.9365041255950928, 2.0429697036743164, 2.149435520172119, 2.255901336669922, 2.3623671531677246, 2.4688327312469482, 2.575298547744751, 2.6817641258239746, 2.7882299423217773, 2.89469575881958, 3.0011613368988037, 3.1076271533966064, 3.21409273147583, 3.320558547973633]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 7.0, 7.0, 13.0, 11.0, 25.0, 31.0, 42.0, 70.0, 93.0, 139.0, 266.0, 414.0, 741.0, 1412.0, 2700.0, 5752.0, 12439.0, 27864.0, 64168.0, 137252.0, 235085.0, 251486.0, 163850.0, 79615.0, 35376.0, 15490.0, 7007.0, 3343.0, 1711.0, 881.0, 516.0, 301.0, 174.0, 98.0, 58.0, 38.0, 26.0, 23.0, 10.0, 8.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.77557373046875, -4.6058349609375, -4.43609619140625, -4.266357421875, -4.09661865234375, -3.9268798828125, -3.75714111328125, -3.58740234375, -3.41766357421875, -3.2479248046875, -3.07818603515625, -2.908447265625, -2.73870849609375, -2.5689697265625, -2.39923095703125, -2.2294921875, -2.05975341796875, -1.8900146484375, -1.72027587890625, -1.550537109375, -1.38079833984375, -1.2110595703125, -1.04132080078125, -0.87158203125, -0.70184326171875, -0.5321044921875, -0.36236572265625, -0.192626953125, -0.02288818359375, 0.1468505859375, 0.31658935546875, 0.486328125, 0.65606689453125, 0.8258056640625, 0.99554443359375, 1.165283203125, 1.33502197265625, 1.5047607421875, 1.67449951171875, 1.84423828125, 2.01397705078125, 2.1837158203125, 2.35345458984375, 2.523193359375, 2.69293212890625, 2.8626708984375, 3.03240966796875, 3.2021484375, 3.37188720703125, 3.5416259765625, 3.71136474609375, 3.881103515625, 4.05084228515625, 4.2205810546875, 4.39031982421875, 4.56005859375, 4.72979736328125, 4.8995361328125, 5.06927490234375, 5.239013671875, 5.40875244140625, 5.5784912109375, 5.74822998046875, 5.91796875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 10.0, 15.0, 18.0, 17.0, 16.0, 16.0, 19.0, 24.0, 24.0, 30.0, 38.0, 46.0, 34.0, 45.0, 49.0, 39.0, 47.0, 36.0, 49.0, 44.0, 32.0, 42.0, 39.0, 37.0, 30.0, 27.0, 20.0, 27.0, 24.0, 22.0, 10.0, 16.0, 12.0, 10.0, 7.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.861328125, -3.745452880859375, -3.62957763671875, -3.513702392578125, -3.3978271484375, -3.281951904296875, -3.16607666015625, -3.050201416015625, -2.934326171875, -2.818450927734375, -2.70257568359375, -2.586700439453125, -2.4708251953125, -2.354949951171875, -2.23907470703125, -2.123199462890625, -2.00732421875, -1.891448974609375, -1.77557373046875, -1.659698486328125, -1.5438232421875, -1.427947998046875, -1.31207275390625, -1.196197509765625, -1.080322265625, -0.964447021484375, -0.84857177734375, -0.732696533203125, -0.6168212890625, -0.500946044921875, -0.38507080078125, -0.269195556640625, -0.1533203125, -0.037445068359375, 0.07843017578125, 0.194305419921875, 0.3101806640625, 0.426055908203125, 0.54193115234375, 0.657806396484375, 0.773681640625, 0.889556884765625, 1.00543212890625, 1.121307373046875, 1.2371826171875, 1.353057861328125, 1.46893310546875, 1.584808349609375, 1.70068359375, 1.816558837890625, 1.93243408203125, 2.048309326171875, 2.1641845703125, 2.280059814453125, 2.39593505859375, 2.511810302734375, 2.627685546875, 2.743560791015625, 2.85943603515625, 2.975311279296875, 3.0911865234375, 3.207061767578125, 3.32293701171875, 3.438812255859375, 3.5546875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 9.0, 10.0, 18.0, 37.0, 37.0, 54.0, 78.0, 106.0, 161.0, 210.0, 355.0, 509.0, 890.0, 1511.0, 2751.0, 5429.0, 10957.0, 23266.0, 50585.0, 105487.0, 189042.0, 241459.0, 197092.0, 113818.0, 54941.0, 25144.0, 11865.0, 5656.0, 2907.0, 1569.0, 936.0, 548.0, 334.0, 257.0, 167.0, 106.0, 62.0, 54.0, 31.0, 35.0, 12.0, 14.0, 16.0, 13.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.66253662109375, -4.5047607421875, -4.34698486328125, -4.189208984375, -4.03143310546875, -3.8736572265625, -3.71588134765625, -3.55810546875, -3.40032958984375, -3.2425537109375, -3.08477783203125, -2.927001953125, -2.76922607421875, -2.6114501953125, -2.45367431640625, -2.2958984375, -2.13812255859375, -1.9803466796875, -1.82257080078125, -1.664794921875, -1.50701904296875, -1.3492431640625, -1.19146728515625, -1.03369140625, -0.87591552734375, -0.7181396484375, -0.56036376953125, -0.402587890625, -0.24481201171875, -0.0870361328125, 0.07073974609375, 0.228515625, 0.38629150390625, 0.5440673828125, 0.70184326171875, 0.859619140625, 1.01739501953125, 1.1751708984375, 1.33294677734375, 1.49072265625, 1.64849853515625, 1.8062744140625, 1.96405029296875, 2.121826171875, 2.27960205078125, 2.4373779296875, 2.59515380859375, 2.7529296875, 2.91070556640625, 3.0684814453125, 3.22625732421875, 3.384033203125, 3.54180908203125, 3.6995849609375, 3.85736083984375, 4.01513671875, 4.17291259765625, 4.3306884765625, 4.48846435546875, 4.646240234375, 4.80401611328125, 4.9617919921875, 5.11956787109375, 5.27734375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 3.0, 7.0, 7.0, 8.0, 5.0, 14.0, 12.0, 14.0, 14.0, 14.0, 27.0, 25.0, 25.0, 18.0, 42.0, 35.0, 47.0, 34.0, 55.0, 44.0, 42.0, 36.0, 55.0, 42.0, 39.0, 35.0, 48.0, 33.0, 33.0, 31.0, 21.0, 25.0, 21.0, 23.0, 15.0, 14.0, 7.0, 9.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.05645751953125, -1.9879150390625, -1.91937255859375, -1.850830078125, -1.78228759765625, -1.7137451171875, -1.64520263671875, -1.57666015625, -1.50811767578125, -1.4395751953125, -1.37103271484375, -1.302490234375, -1.23394775390625, -1.1654052734375, -1.09686279296875, -1.0283203125, -0.95977783203125, -0.8912353515625, -0.82269287109375, -0.754150390625, -0.68560791015625, -0.6170654296875, -0.54852294921875, -0.47998046875, -0.41143798828125, -0.3428955078125, -0.27435302734375, -0.205810546875, -0.13726806640625, -0.0687255859375, -0.00018310546875, 0.068359375, 0.13690185546875, 0.2054443359375, 0.27398681640625, 0.342529296875, 0.41107177734375, 0.4796142578125, 0.54815673828125, 0.61669921875, 0.68524169921875, 0.7537841796875, 0.82232666015625, 0.890869140625, 0.95941162109375, 1.0279541015625, 1.09649658203125, 1.1650390625, 1.23358154296875, 1.3021240234375, 1.37066650390625, 1.439208984375, 1.50775146484375, 1.5762939453125, 1.64483642578125, 1.71337890625, 1.78192138671875, 1.8504638671875, 1.91900634765625, 1.987548828125, 2.05609130859375, 2.1246337890625, 2.19317626953125, 2.26171875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 5.0, 6.0, 6.0, 14.0, 18.0, 29.0, 34.0, 69.0, 100.0, 152.0, 207.0, 311.0, 424.0, 675.0, 1044.0, 1653.0, 2712.0, 4327.0, 7306.0, 13484.0, 26196.0, 52323.0, 105575.0, 189386.0, 242239.0, 187344.0, 103936.0, 51186.0, 25747.0, 13057.0, 7412.0, 4274.0, 2523.0, 1665.0, 1061.0, 741.0, 437.0, 320.0, 178.0, 133.0, 92.0, 58.0, 39.0, 24.0, 12.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.505859375, -2.433197021484375, -2.36053466796875, -2.287872314453125, -2.2152099609375, -2.142547607421875, -2.06988525390625, -1.997222900390625, -1.924560546875, -1.851898193359375, -1.77923583984375, -1.706573486328125, -1.6339111328125, -1.561248779296875, -1.48858642578125, -1.415924072265625, -1.34326171875, -1.270599365234375, -1.19793701171875, -1.125274658203125, -1.0526123046875, -0.979949951171875, -0.90728759765625, -0.834625244140625, -0.761962890625, -0.689300537109375, -0.61663818359375, -0.543975830078125, -0.4713134765625, -0.398651123046875, -0.32598876953125, -0.253326416015625, -0.1806640625, -0.108001708984375, -0.03533935546875, 0.037322998046875, 0.1099853515625, 0.182647705078125, 0.25531005859375, 0.327972412109375, 0.400634765625, 0.473297119140625, 0.54595947265625, 0.618621826171875, 0.6912841796875, 0.763946533203125, 0.83660888671875, 0.909271240234375, 0.98193359375, 1.054595947265625, 1.12725830078125, 1.199920654296875, 1.2725830078125, 1.345245361328125, 1.41790771484375, 1.490570068359375, 1.563232421875, 1.635894775390625, 1.70855712890625, 1.781219482421875, 1.8538818359375, 1.926544189453125, 1.99920654296875, 2.071868896484375, 2.14453125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 6.0, 1.0, 9.0, 8.0, 6.0, 20.0, 29.0, 21.0, 36.0, 42.0, 52.0, 73.0, 101.0, 99.0, 99.0, 87.0, 91.0, 55.0, 37.0, 37.0, 31.0, 14.0, 7.0, 12.0, 1.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024056434631347656, -0.00023252889513969421, -0.00022449344396591187, -0.00021645799279212952, -0.00020842254161834717, -0.00020038709044456482, -0.00019235163927078247, -0.00018431618809700012, -0.00017628073692321777, -0.00016824528574943542, -0.00016020983457565308, -0.00015217438340187073, -0.00014413893222808838, -0.00013610348105430603, -0.00012806802988052368, -0.00012003257870674133, -0.00011199712753295898, -0.00010396167635917664, -9.592622518539429e-05, -8.789077401161194e-05, -7.985532283782959e-05, -7.181987166404724e-05, -6.378442049026489e-05, -5.5748969316482544e-05, -4.7713518142700195e-05, -3.967806696891785e-05, -3.16426157951355e-05, -2.360716462135315e-05, -1.55717134475708e-05, -7.536262273788452e-06, 4.991888999938965e-07, 8.534640073776245e-06, 1.6570091247558594e-05, 2.4605542421340942e-05, 3.264099359512329e-05, 4.067644476890564e-05, 4.871189594268799e-05, 5.674734711647034e-05, 6.478279829025269e-05, 7.281824946403503e-05, 8.085370063781738e-05, 8.888915181159973e-05, 9.692460298538208e-05, 0.00010496005415916443, 0.00011299550533294678, 0.00012103095650672913, 0.00012906640768051147, 0.00013710185885429382, 0.00014513731002807617, 0.00015317276120185852, 0.00016120821237564087, 0.00016924366354942322, 0.00017727911472320557, 0.00018531456589698792, 0.00019335001707077026, 0.0002013854682445526, 0.00020942091941833496, 0.0002174563705921173, 0.00022549182176589966, 0.000233527272939682, 0.00024156272411346436, 0.0002495981752872467, 0.00025763362646102905, 0.0002656690776348114, 0.00027370452880859375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 15.0, 23.0, 38.0, 42.0, 36.0, 73.0, 116.0, 144.0, 197.0, 279.0, 411.0, 547.0, 850.0, 1201.0, 1729.0, 2547.0, 3876.0, 6216.0, 9636.0, 15931.0, 26666.0, 45169.0, 74752.0, 117525.0, 160158.0, 175088.0, 146717.0, 100379.0, 62192.0, 36948.0, 21926.0, 13171.0, 8191.0, 5151.0, 3300.0, 2216.0, 1552.0, 1079.0, 664.0, 495.0, 372.0, 261.0, 209.0, 143.0, 101.0, 62.0, 40.0, 36.0, 21.0, 17.0, 16.0, 6.0, 4.0, 7.0, 3.0, 4.0], "bins": [-1.7197265625, -1.6681060791015625, -1.616485595703125, -1.5648651123046875, -1.51324462890625, -1.4616241455078125, -1.410003662109375, -1.3583831787109375, -1.3067626953125, -1.2551422119140625, -1.203521728515625, -1.1519012451171875, -1.10028076171875, -1.0486602783203125, -0.997039794921875, -0.9454193115234375, -0.893798828125, -0.8421783447265625, -0.790557861328125, -0.7389373779296875, -0.68731689453125, -0.6356964111328125, -0.584075927734375, -0.5324554443359375, -0.4808349609375, -0.4292144775390625, -0.377593994140625, -0.3259735107421875, -0.27435302734375, -0.2227325439453125, -0.171112060546875, -0.1194915771484375, -0.06787109375, -0.0162506103515625, 0.035369873046875, 0.0869903564453125, 0.13861083984375, 0.1902313232421875, 0.241851806640625, 0.2934722900390625, 0.3450927734375, 0.3967132568359375, 0.448333740234375, 0.4999542236328125, 0.55157470703125, 0.6031951904296875, 0.654815673828125, 0.7064361572265625, 0.758056640625, 0.8096771240234375, 0.861297607421875, 0.9129180908203125, 0.96453857421875, 1.0161590576171875, 1.067779541015625, 1.1194000244140625, 1.1710205078125, 1.2226409912109375, 1.274261474609375, 1.3258819580078125, 1.37750244140625, 1.4291229248046875, 1.480743408203125, 1.5323638916015625, 1.583984375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 2.0, 5.0, 3.0, 5.0, 10.0, 5.0, 13.0, 14.0, 13.0, 19.0, 23.0, 36.0, 33.0, 48.0, 44.0, 51.0, 50.0, 57.0, 68.0, 62.0, 71.0, 65.0, 44.0, 41.0, 36.0, 31.0, 35.0, 23.0, 17.0, 21.0, 12.0, 11.0, 10.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.548828125, -0.5321578979492188, -0.5154876708984375, -0.49881744384765625, -0.482147216796875, -0.46547698974609375, -0.4488067626953125, -0.43213653564453125, -0.41546630859375, -0.39879608154296875, -0.3821258544921875, -0.36545562744140625, -0.348785400390625, -0.33211517333984375, -0.3154449462890625, -0.29877471923828125, -0.2821044921875, -0.26543426513671875, -0.2487640380859375, -0.23209381103515625, -0.215423583984375, -0.19875335693359375, -0.1820831298828125, -0.16541290283203125, -0.14874267578125, -0.13207244873046875, -0.1154022216796875, -0.09873199462890625, -0.082061767578125, -0.06539154052734375, -0.0487213134765625, -0.03205108642578125, -0.015380859375, 0.00128936767578125, 0.0179595947265625, 0.03462982177734375, 0.051300048828125, 0.06797027587890625, 0.0846405029296875, 0.10131072998046875, 0.11798095703125, 0.13465118408203125, 0.1513214111328125, 0.16799163818359375, 0.184661865234375, 0.20133209228515625, 0.2180023193359375, 0.23467254638671875, 0.2513427734375, 0.26801300048828125, 0.2846832275390625, 0.30135345458984375, 0.318023681640625, 0.33469390869140625, 0.3513641357421875, 0.36803436279296875, 0.38470458984375, 0.40137481689453125, 0.4180450439453125, 0.43471527099609375, 0.451385498046875, 0.46805572509765625, 0.4847259521484375, 0.5013961791992188, 0.51806640625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 7.0, 14.0, 10.0, 21.0, 32.0, 44.0, 53.0, 62.0, 103.0, 99.0, 121.0, 104.0, 89.0, 65.0, 59.0, 30.0, 35.0, 18.0, 14.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0], "bins": [-16.5013484954834, -16.165313720703125, -15.829277038574219, -15.493241310119629, -15.157205581665039, -14.82116985321045, -14.48513412475586, -14.149099349975586, -13.81306266784668, -13.47702693939209, -13.1409912109375, -12.80495548248291, -12.46891975402832, -12.13288402557373, -11.79684829711914, -11.460813522338867, -11.124777793884277, -10.788742065429688, -10.452706336975098, -10.116670608520508, -9.780634880065918, -9.444599151611328, -9.108564376831055, -8.772527694702148, -8.436492919921875, -8.100457191467285, -7.764421463012695, -7.4283857345581055, -7.092350006103516, -6.756314277648926, -6.420279026031494, -6.084243297576904, -5.74820613861084, -5.41217041015625, -5.07613468170166, -4.74009895324707, -4.4040632247924805, -4.068027496337891, -3.731992244720459, -3.395956516265869, -3.0599207878112793, -2.7238850593566895, -2.3878493309020996, -2.051813840866089, -1.715778112411499, -1.3797423839569092, -1.0437068939208984, -0.7076711654663086, -0.37163543701171875, -0.03559976816177368, 0.3004359006881714, 0.6364715099334717, 0.9725072383880615, 1.3085429668426514, 1.644578456878662, 1.980614185333252, 2.316649913787842, 2.6526856422424316, 2.9887213706970215, 3.3247568607330322, 3.660792589187622, 3.996828317642212, 4.332863807678223, 4.6688995361328125, 5.004935264587402]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 6.0, 4.0, 11.0, 6.0, 9.0, 17.0, 17.0, 29.0, 26.0, 21.0, 29.0, 39.0, 35.0, 27.0, 37.0, 50.0, 51.0, 46.0, 37.0, 45.0, 48.0, 34.0, 59.0, 37.0, 27.0, 30.0, 24.0, 28.0, 38.0, 23.0, 18.0, 16.0, 14.0, 9.0, 15.0, 6.0, 5.0, 8.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.512770891189575, -3.4048044681549072, -3.2968382835388184, -3.1888718605041504, -3.0809054374694824, -2.9729392528533936, -2.8649728298187256, -2.7570066452026367, -2.6490402221679688, -2.541073799133301, -2.433107614517212, -2.325141191482544, -2.217174768447876, -2.109208583831787, -2.001242160797119, -1.8932758569717407, -1.7853094339370728, -1.6773431301116943, -1.5693767070770264, -1.461410403251648, -1.3534440994262695, -1.2454776763916016, -1.1375113725662231, -1.0295450687408447, -0.9215787053108215, -0.8136123418807983, -0.7056460380554199, -0.5976796746253967, -0.4897133409976959, -0.3817470073699951, -0.2737806439399719, -0.1658143401145935, -0.05784797668457031, 0.05011836439371109, 0.1580847054719925, 0.2660510540008545, 0.3740173876285553, 0.4819837212562561, 0.5899500846862793, 0.6979163885116577, 0.8058827519416809, 0.9138491153717041, 1.0218154191970825, 1.129781723022461, 1.237748146057129, 1.3457144498825073, 1.4536807537078857, 1.5616471767425537, 1.6696134805679321, 1.7775797843933105, 1.8855462074279785, 1.993512511253357, 2.1014788150787354, 2.2094452381134033, 2.317411422729492, 2.42537784576416, 2.533344268798828, 2.641310691833496, 2.749276876449585, 2.857243299484253, 2.965209722518921, 3.0731759071350098, 3.1811423301696777, 3.2891087532043457, 3.3970749378204346]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 5.0, 6.0, 11.0, 12.0, 13.0, 24.0, 37.0, 45.0, 57.0, 106.0, 146.0, 237.0, 360.0, 532.0, 854.0, 1361.0, 2371.0, 4033.0, 7270.0, 13569.0, 27120.0, 59095.0, 144953.0, 402818.0, 1122442.0, 1422214.0, 615033.0, 210433.0, 82244.0, 36885.0, 17809.0, 9403.0, 5183.0, 2924.0, 1723.0, 1074.0, 671.0, 392.0, 275.0, 164.0, 107.0, 80.0, 60.0, 40.0, 30.0, 17.0, 20.0, 14.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.12109375, -6.89990234375, -6.6787109375, -6.45751953125, -6.236328125, -6.01513671875, -5.7939453125, -5.57275390625, -5.3515625, -5.13037109375, -4.9091796875, -4.68798828125, -4.466796875, -4.24560546875, -4.0244140625, -3.80322265625, -3.58203125, -3.36083984375, -3.1396484375, -2.91845703125, -2.697265625, -2.47607421875, -2.2548828125, -2.03369140625, -1.8125, -1.59130859375, -1.3701171875, -1.14892578125, -0.927734375, -0.70654296875, -0.4853515625, -0.26416015625, -0.04296875, 0.17822265625, 0.3994140625, 0.62060546875, 0.841796875, 1.06298828125, 1.2841796875, 1.50537109375, 1.7265625, 1.94775390625, 2.1689453125, 2.39013671875, 2.611328125, 2.83251953125, 3.0537109375, 3.27490234375, 3.49609375, 3.71728515625, 3.9384765625, 4.15966796875, 4.380859375, 4.60205078125, 4.8232421875, 5.04443359375, 5.265625, 5.48681640625, 5.7080078125, 5.92919921875, 6.150390625, 6.37158203125, 6.5927734375, 6.81396484375, 7.03515625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 7.0, 12.0, 14.0, 15.0, 9.0, 17.0, 28.0, 34.0, 40.0, 43.0, 40.0, 40.0, 44.0, 47.0, 54.0, 48.0, 46.0, 48.0, 49.0, 44.0, 40.0, 40.0, 38.0, 44.0, 33.0, 25.0, 25.0, 15.0, 12.0, 10.0, 7.0, 9.0, 5.0, 8.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.538330078125, -2.44775390625, -2.357177734375, -2.2666015625, -2.176025390625, -2.08544921875, -1.994873046875, -1.904296875, -1.813720703125, -1.72314453125, -1.632568359375, -1.5419921875, -1.451416015625, -1.36083984375, -1.270263671875, -1.1796875, -1.089111328125, -0.99853515625, -0.907958984375, -0.8173828125, -0.726806640625, -0.63623046875, -0.545654296875, -0.455078125, -0.364501953125, -0.27392578125, -0.183349609375, -0.0927734375, -0.002197265625, 0.08837890625, 0.178955078125, 0.26953125, 0.360107421875, 0.45068359375, 0.541259765625, 0.6318359375, 0.722412109375, 0.81298828125, 0.903564453125, 0.994140625, 1.084716796875, 1.17529296875, 1.265869140625, 1.3564453125, 1.447021484375, 1.53759765625, 1.628173828125, 1.71875, 1.809326171875, 1.89990234375, 1.990478515625, 2.0810546875, 2.171630859375, 2.26220703125, 2.352783203125, 2.443359375, 2.533935546875, 2.62451171875, 2.715087890625, 2.8056640625, 2.896240234375, 2.98681640625, 3.077392578125, 3.16796875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 8.0, 10.0, 21.0, 17.0, 31.0, 36.0, 36.0, 70.0, 99.0, 142.0, 192.0, 271.0, 380.0, 598.0, 901.0, 1374.0, 2027.0, 3173.0, 4972.0, 7792.0, 12632.0, 21437.0, 37443.0, 68044.0, 127793.0, 254104.0, 514208.0, 944363.0, 1008026.0, 575753.0, 285919.0, 143820.0, 75438.0, 41324.0, 24209.0, 14016.0, 8482.0, 5315.0, 3394.0, 2091.0, 1442.0, 958.0, 576.0, 425.0, 290.0, 213.0, 133.0, 82.0, 55.0, 46.0, 32.0, 26.0, 19.0, 6.0, 8.0, 10.0, 3.0, 7.0, 3.0, 3.0, 1.0], "bins": [-5.3046875, -5.134033203125, -4.96337890625, -4.792724609375, -4.6220703125, -4.451416015625, -4.28076171875, -4.110107421875, -3.939453125, -3.768798828125, -3.59814453125, -3.427490234375, -3.2568359375, -3.086181640625, -2.91552734375, -2.744873046875, -2.57421875, -2.403564453125, -2.23291015625, -2.062255859375, -1.8916015625, -1.720947265625, -1.55029296875, -1.379638671875, -1.208984375, -1.038330078125, -0.86767578125, -0.697021484375, -0.5263671875, -0.355712890625, -0.18505859375, -0.014404296875, 0.15625, 0.326904296875, 0.49755859375, 0.668212890625, 0.8388671875, 1.009521484375, 1.18017578125, 1.350830078125, 1.521484375, 1.692138671875, 1.86279296875, 2.033447265625, 2.2041015625, 2.374755859375, 2.54541015625, 2.716064453125, 2.88671875, 3.057373046875, 3.22802734375, 3.398681640625, 3.5693359375, 3.739990234375, 3.91064453125, 4.081298828125, 4.251953125, 4.422607421875, 4.59326171875, 4.763916015625, 4.9345703125, 5.105224609375, 5.27587890625, 5.446533203125, 5.6171875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 3.0, 7.0, 11.0, 14.0, 15.0, 17.0, 21.0, 39.0, 34.0, 46.0, 79.0, 90.0, 128.0, 123.0, 175.0, 239.0, 279.0, 265.0, 294.0, 317.0, 331.0, 276.0, 252.0, 217.0, 178.0, 130.0, 116.0, 84.0, 52.0, 53.0, 33.0, 28.0, 24.0, 26.0, 13.0, 12.0, 10.0, 11.0, 8.0, 5.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.633148193359375, -1.57781982421875, -1.522491455078125, -1.4671630859375, -1.411834716796875, -1.35650634765625, -1.301177978515625, -1.245849609375, -1.190521240234375, -1.13519287109375, -1.079864501953125, -1.0245361328125, -0.969207763671875, -0.91387939453125, -0.858551025390625, -0.80322265625, -0.747894287109375, -0.69256591796875, -0.637237548828125, -0.5819091796875, -0.526580810546875, -0.47125244140625, -0.415924072265625, -0.360595703125, -0.305267333984375, -0.24993896484375, -0.194610595703125, -0.1392822265625, -0.083953857421875, -0.02862548828125, 0.026702880859375, 0.08203125, 0.137359619140625, 0.19268798828125, 0.248016357421875, 0.3033447265625, 0.358673095703125, 0.41400146484375, 0.469329833984375, 0.524658203125, 0.579986572265625, 0.63531494140625, 0.690643310546875, 0.7459716796875, 0.801300048828125, 0.85662841796875, 0.911956787109375, 0.96728515625, 1.022613525390625, 1.07794189453125, 1.133270263671875, 1.1885986328125, 1.243927001953125, 1.29925537109375, 1.354583740234375, 1.409912109375, 1.465240478515625, 1.52056884765625, 1.575897216796875, 1.6312255859375, 1.686553955078125, 1.74188232421875, 1.797210693359375, 1.8525390625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 8.0, 9.0, 16.0, 22.0, 24.0, 23.0, 36.0, 61.0, 66.0, 86.0, 84.0, 83.0, 96.0, 94.0, 62.0, 60.0, 40.0, 37.0, 26.0, 15.0, 11.0, 16.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-13.311237335205078, -13.022732734680176, -12.73422908782959, -12.445724487304688, -12.157219886779785, -11.8687162399292, -11.580211639404297, -11.291707992553711, -11.003203392028809, -10.714698791503906, -10.42619514465332, -10.137690544128418, -9.849185943603516, -9.56068229675293, -9.272177696228027, -8.983673095703125, -8.695169448852539, -8.406664848327637, -8.11816120147705, -7.829656600952148, -7.541152477264404, -7.25264835357666, -6.964143753051758, -6.675639629364014, -6.387134552001953, -6.098630428314209, -5.810125827789307, -5.5216217041015625, -5.233117580413818, -4.944613456726074, -4.656108856201172, -4.367604732513428, -4.079100608825684, -3.7905962467193604, -3.502092123031616, -3.213587760925293, -2.925083637237549, -2.6365792751312256, -2.3480749130249023, -2.059570789337158, -1.771066427230835, -1.4825621843338013, -1.1940579414367676, -0.9055535793304443, -0.6170493364334106, -0.32854509353637695, -0.04004073143005371, 0.24846339225769043, 0.5369677543640137, 0.8254719972610474, 1.113976240158081, 1.4024806022644043, 1.690984845161438, 1.9794890880584717, 2.267993450164795, 2.556497573852539, 2.8450019359588623, 3.1335062980651855, 3.4220104217529297, 3.710514783859253, 3.999019145965576, 4.28752326965332, 4.576027870178223, 4.864531517028809, 5.153036117553711]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 9.0, 13.0, 12.0, 13.0, 20.0, 21.0, 27.0, 27.0, 25.0, 27.0, 31.0, 30.0, 31.0, 43.0, 53.0, 42.0, 40.0, 53.0, 42.0, 44.0, 39.0, 31.0, 40.0, 37.0, 42.0, 39.0, 32.0, 17.0, 18.0, 21.0, 14.0, 15.0, 11.0, 8.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.712069272994995, -3.6039493083953857, -3.4958291053771973, -3.387709140777588, -3.2795891761779785, -3.17146897315979, -3.0633490085601807, -2.955228805541992, -2.847108840942383, -2.7389888763427734, -2.630868673324585, -2.5227487087249756, -2.414628505706787, -2.3065085411071777, -2.1983885765075684, -2.090268611907959, -1.9821484088897705, -1.8740283250808716, -1.7659082412719727, -1.6577882766723633, -1.5496681928634644, -1.4415481090545654, -1.333428144454956, -1.2253080606460571, -1.1171879768371582, -1.0090678930282593, -0.9009478688240051, -0.792827844619751, -0.684707760810852, -0.5765876770019531, -0.468467652797699, -0.3603476285934448, -0.2522275447845459, -0.14410749077796936, -0.03598743677139282, 0.07213261723518372, 0.18025267124176025, 0.2883727550506592, 0.39649277925491333, 0.5046128034591675, 0.6127328872680664, 0.7208529710769653, 0.8289729952812195, 0.9370930194854736, 1.0452131032943726, 1.1533331871032715, 1.2614531517028809, 1.3695732355117798, 1.4776933193206787, 1.5858134031295776, 1.6939334869384766, 1.802053451538086, 1.9101735353469849, 2.018293619155884, 2.126413583755493, 2.2345337867736816, 2.342653751373291, 2.4507737159729004, 2.558893918991089, 2.6670138835906982, 2.7751340866088867, 2.883254051208496, 2.9913740158081055, 3.099493980407715, 3.2076141834259033]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 13.0, 24.0, 27.0, 64.0, 94.0, 140.0, 241.0, 353.0, 555.0, 888.0, 1451.0, 2428.0, 4078.0, 6713.0, 11546.0, 20003.0, 33070.0, 55845.0, 88426.0, 128453.0, 161271.0, 163959.0, 132331.0, 92205.0, 58109.0, 35324.0, 20744.0, 12261.0, 7190.0, 4268.0, 2595.0, 1507.0, 880.0, 556.0, 342.0, 201.0, 126.0, 98.0, 52.0, 37.0, 25.0, 17.0, 9.0, 12.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.9849395751953125, -1.923004150390625, -1.8610687255859375, -1.79913330078125, -1.7371978759765625, -1.675262451171875, -1.6133270263671875, -1.5513916015625, -1.4894561767578125, -1.427520751953125, -1.3655853271484375, -1.30364990234375, -1.2417144775390625, -1.179779052734375, -1.1178436279296875, -1.055908203125, -0.9939727783203125, -0.932037353515625, -0.8701019287109375, -0.80816650390625, -0.7462310791015625, -0.684295654296875, -0.6223602294921875, -0.5604248046875, -0.4984893798828125, -0.436553955078125, -0.3746185302734375, -0.31268310546875, -0.2507476806640625, -0.188812255859375, -0.1268768310546875, -0.06494140625, -0.0030059814453125, 0.058929443359375, 0.1208648681640625, 0.18280029296875, 0.2447357177734375, 0.306671142578125, 0.3686065673828125, 0.4305419921875, 0.4924774169921875, 0.554412841796875, 0.6163482666015625, 0.67828369140625, 0.7402191162109375, 0.802154541015625, 0.8640899658203125, 0.926025390625, 0.9879608154296875, 1.049896240234375, 1.1118316650390625, 1.17376708984375, 1.2357025146484375, 1.297637939453125, 1.3595733642578125, 1.4215087890625, 1.4834442138671875, 1.545379638671875, 1.6073150634765625, 1.66925048828125, 1.7311859130859375, 1.793121337890625, 1.8550567626953125, 1.9169921875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 7.0, 9.0, 19.0, 14.0, 11.0, 19.0, 27.0, 26.0, 25.0, 32.0, 36.0, 38.0, 30.0, 47.0, 38.0, 38.0, 57.0, 42.0, 39.0, 51.0, 35.0, 29.0, 42.0, 34.0, 44.0, 25.0, 27.0, 23.0, 24.0, 17.0, 27.0, 17.0, 12.0, 7.0, 6.0, 8.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.580078125, -3.46234130859375, -3.3446044921875, -3.22686767578125, -3.109130859375, -2.99139404296875, -2.8736572265625, -2.75592041015625, -2.63818359375, -2.52044677734375, -2.4027099609375, -2.28497314453125, -2.167236328125, -2.04949951171875, -1.9317626953125, -1.81402587890625, -1.6962890625, -1.57855224609375, -1.4608154296875, -1.34307861328125, -1.225341796875, -1.10760498046875, -0.9898681640625, -0.87213134765625, -0.75439453125, -0.63665771484375, -0.5189208984375, -0.40118408203125, -0.283447265625, -0.16571044921875, -0.0479736328125, 0.06976318359375, 0.1875, 0.30523681640625, 0.4229736328125, 0.54071044921875, 0.658447265625, 0.77618408203125, 0.8939208984375, 1.01165771484375, 1.12939453125, 1.24713134765625, 1.3648681640625, 1.48260498046875, 1.600341796875, 1.71807861328125, 1.8358154296875, 1.95355224609375, 2.0712890625, 2.18902587890625, 2.3067626953125, 2.42449951171875, 2.542236328125, 2.65997314453125, 2.7777099609375, 2.89544677734375, 3.01318359375, 3.13092041015625, 3.2486572265625, 3.36639404296875, 3.484130859375, 3.60186767578125, 3.7196044921875, 3.83734130859375, 3.955078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 11.0, 20.0, 32.0, 35.0, 87.0, 96.0, 182.0, 309.0, 512.0, 842.0, 1567.0, 2506.0, 4311.0, 7670.0, 13648.0, 24449.0, 44108.0, 78955.0, 133882.0, 197727.0, 202849.0, 141843.0, 84922.0, 47713.0, 26111.0, 14774.0, 8193.0, 4600.0, 2641.0, 1642.0, 937.0, 553.0, 342.0, 170.0, 116.0, 68.0, 50.0, 32.0, 21.0, 9.0, 6.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.876953125, -2.789947509765625, -2.70294189453125, -2.615936279296875, -2.5289306640625, -2.441925048828125, -2.35491943359375, -2.267913818359375, -2.180908203125, -2.093902587890625, -2.00689697265625, -1.919891357421875, -1.8328857421875, -1.745880126953125, -1.65887451171875, -1.571868896484375, -1.48486328125, -1.397857666015625, -1.31085205078125, -1.223846435546875, -1.1368408203125, -1.049835205078125, -0.96282958984375, -0.875823974609375, -0.788818359375, -0.701812744140625, -0.61480712890625, -0.527801513671875, -0.4407958984375, -0.353790283203125, -0.26678466796875, -0.179779052734375, -0.0927734375, -0.005767822265625, 0.08123779296875, 0.168243408203125, 0.2552490234375, 0.342254638671875, 0.42926025390625, 0.516265869140625, 0.603271484375, 0.690277099609375, 0.77728271484375, 0.864288330078125, 0.9512939453125, 1.038299560546875, 1.12530517578125, 1.212310791015625, 1.29931640625, 1.386322021484375, 1.47332763671875, 1.560333251953125, 1.6473388671875, 1.734344482421875, 1.82135009765625, 1.908355712890625, 1.995361328125, 2.082366943359375, 2.16937255859375, 2.256378173828125, 2.3433837890625, 2.430389404296875, 2.51739501953125, 2.604400634765625, 2.69140625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 8.0, 6.0, 14.0, 8.0, 14.0, 24.0, 30.0, 22.0, 17.0, 32.0, 24.0, 32.0, 28.0, 36.0, 30.0, 28.0, 35.0, 38.0, 34.0, 44.0, 49.0, 33.0, 33.0, 26.0, 38.0, 37.0, 28.0, 25.0, 25.0, 24.0, 21.0, 18.0, 18.0, 16.0, 13.0, 15.0, 11.0, 13.0, 7.0, 8.0, 4.0, 7.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.009765625, -1.949462890625, -1.88916015625, -1.828857421875, -1.7685546875, -1.708251953125, -1.64794921875, -1.587646484375, -1.52734375, -1.467041015625, -1.40673828125, -1.346435546875, -1.2861328125, -1.225830078125, -1.16552734375, -1.105224609375, -1.044921875, -0.984619140625, -0.92431640625, -0.864013671875, -0.8037109375, -0.743408203125, -0.68310546875, -0.622802734375, -0.5625, -0.502197265625, -0.44189453125, -0.381591796875, -0.3212890625, -0.260986328125, -0.20068359375, -0.140380859375, -0.080078125, -0.019775390625, 0.04052734375, 0.100830078125, 0.1611328125, 0.221435546875, 0.28173828125, 0.342041015625, 0.40234375, 0.462646484375, 0.52294921875, 0.583251953125, 0.6435546875, 0.703857421875, 0.76416015625, 0.824462890625, 0.884765625, 0.945068359375, 1.00537109375, 1.065673828125, 1.1259765625, 1.186279296875, 1.24658203125, 1.306884765625, 1.3671875, 1.427490234375, 1.48779296875, 1.548095703125, 1.6083984375, 1.668701171875, 1.72900390625, 1.789306640625, 1.849609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 8.0, 11.0, 7.0, 22.0, 30.0, 52.0, 59.0, 60.0, 131.0, 168.0, 235.0, 378.0, 543.0, 727.0, 1133.0, 1729.0, 2656.0, 4113.0, 6410.0, 10462.0, 17062.0, 28824.0, 48409.0, 81886.0, 134337.0, 193476.0, 190073.0, 129230.0, 78244.0, 46217.0, 27506.0, 16461.0, 10002.0, 6312.0, 4039.0, 2452.0, 1645.0, 1110.0, 753.0, 494.0, 354.0, 232.0, 173.0, 100.0, 86.0, 44.0, 28.0, 30.0, 16.0, 10.0, 13.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.1396484375, -1.105072021484375, -1.07049560546875, -1.035919189453125, -1.0013427734375, -0.966766357421875, -0.93218994140625, -0.897613525390625, -0.863037109375, -0.828460693359375, -0.79388427734375, -0.759307861328125, -0.7247314453125, -0.690155029296875, -0.65557861328125, -0.621002197265625, -0.58642578125, -0.551849365234375, -0.51727294921875, -0.482696533203125, -0.4481201171875, -0.413543701171875, -0.37896728515625, -0.344390869140625, -0.309814453125, -0.275238037109375, -0.24066162109375, -0.206085205078125, -0.1715087890625, -0.136932373046875, -0.10235595703125, -0.067779541015625, -0.033203125, 0.001373291015625, 0.03594970703125, 0.070526123046875, 0.1051025390625, 0.139678955078125, 0.17425537109375, 0.208831787109375, 0.243408203125, 0.277984619140625, 0.31256103515625, 0.347137451171875, 0.3817138671875, 0.416290283203125, 0.45086669921875, 0.485443115234375, 0.52001953125, 0.554595947265625, 0.58917236328125, 0.623748779296875, 0.6583251953125, 0.692901611328125, 0.72747802734375, 0.762054443359375, 0.796630859375, 0.831207275390625, 0.86578369140625, 0.900360107421875, 0.9349365234375, 0.969512939453125, 1.00408935546875, 1.038665771484375, 1.0732421875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 12.0, 16.0, 10.0, 13.0, 21.0, 21.0, 33.0, 36.0, 47.0, 52.0, 49.0, 79.0, 69.0, 64.0, 69.0, 78.0, 55.0, 50.0, 51.0, 31.0, 26.0, 19.0, 28.0, 16.0, 9.0, 10.0, 5.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.151199340820312e-05, -5.941465497016907e-05, -5.731731653213501e-05, -5.521997809410095e-05, -5.3122639656066895e-05, -5.102530121803284e-05, -4.892796277999878e-05, -4.683062434196472e-05, -4.4733285903930664e-05, -4.2635947465896606e-05, -4.053860902786255e-05, -3.844127058982849e-05, -3.6343932151794434e-05, -3.4246593713760376e-05, -3.214925527572632e-05, -3.005191683769226e-05, -2.7954578399658203e-05, -2.5857239961624146e-05, -2.3759901523590088e-05, -2.166256308555603e-05, -1.9565224647521973e-05, -1.7467886209487915e-05, -1.5370547771453857e-05, -1.32732093334198e-05, -1.1175870895385742e-05, -9.078532457351685e-06, -6.981194019317627e-06, -4.883855581283569e-06, -2.7865171432495117e-06, -6.891787052154541e-07, 1.4081597328186035e-06, 3.505498170852661e-06, 5.602836608886719e-06, 7.700175046920776e-06, 9.797513484954834e-06, 1.1894851922988892e-05, 1.399219036102295e-05, 1.6089528799057007e-05, 1.8186867237091064e-05, 2.0284205675125122e-05, 2.238154411315918e-05, 2.4478882551193237e-05, 2.6576220989227295e-05, 2.8673559427261353e-05, 3.077089786529541e-05, 3.286823630332947e-05, 3.4965574741363525e-05, 3.706291317939758e-05, 3.916025161743164e-05, 4.12575900554657e-05, 4.3354928493499756e-05, 4.5452266931533813e-05, 4.754960536956787e-05, 4.964694380760193e-05, 5.1744282245635986e-05, 5.3841620683670044e-05, 5.59389591217041e-05, 5.803629755973816e-05, 6.013363599777222e-05, 6.223097443580627e-05, 6.432831287384033e-05, 6.642565131187439e-05, 6.852298974990845e-05, 7.06203281879425e-05, 7.271766662597656e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 13.0, 14.0, 16.0, 30.0, 57.0, 71.0, 122.0, 182.0, 272.0, 475.0, 738.0, 1186.0, 1820.0, 3155.0, 5187.0, 8624.0, 14440.0, 24772.0, 42069.0, 70378.0, 111882.0, 156567.0, 176724.0, 153709.0, 108787.0, 67693.0, 40660.0, 23716.0, 14127.0, 8346.0, 4898.0, 2965.0, 1822.0, 1088.0, 682.0, 476.0, 270.0, 178.0, 127.0, 80.0, 34.0, 35.0, 14.0, 16.0, 16.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.0439453125, -1.0127487182617188, -0.9815521240234375, -0.9503555297851562, -0.919158935546875, -0.8879623413085938, -0.8567657470703125, -0.8255691528320312, -0.79437255859375, -0.7631759643554688, -0.7319793701171875, -0.7007827758789062, -0.669586181640625, -0.6383895874023438, -0.6071929931640625, -0.5759963989257812, -0.5447998046875, -0.5136032104492188, -0.4824066162109375, -0.45121002197265625, -0.420013427734375, -0.38881683349609375, -0.3576202392578125, -0.32642364501953125, -0.29522705078125, -0.26403045654296875, -0.2328338623046875, -0.20163726806640625, -0.170440673828125, -0.13924407958984375, -0.1080474853515625, -0.07685089111328125, -0.045654296875, -0.01445770263671875, 0.0167388916015625, 0.04793548583984375, 0.079132080078125, 0.11032867431640625, 0.1415252685546875, 0.17272186279296875, 0.20391845703125, 0.23511505126953125, 0.2663116455078125, 0.29750823974609375, 0.328704833984375, 0.35990142822265625, 0.3910980224609375, 0.42229461669921875, 0.4534912109375, 0.48468780517578125, 0.5158843994140625, 0.5470809936523438, 0.578277587890625, 0.6094741821289062, 0.6406707763671875, 0.6718673706054688, 0.70306396484375, 0.7342605590820312, 0.7654571533203125, 0.7966537475585938, 0.827850341796875, 0.8590469360351562, 0.8902435302734375, 0.9214401245117188, 0.95263671875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 8.0, 5.0, 9.0, 10.0, 19.0, 15.0, 14.0, 26.0, 22.0, 26.0, 24.0, 34.0, 44.0, 33.0, 52.0, 39.0, 33.0, 45.0, 47.0, 45.0, 55.0, 45.0, 33.0, 38.0, 52.0, 28.0, 23.0, 25.0, 22.0, 21.0, 16.0, 13.0, 8.0, 8.0, 11.0, 11.0, 7.0, 2.0, 4.0, 0.0, 4.0, 5.0, 1.0, 4.0, 4.0], "bins": [-0.301025390625, -0.2930259704589844, -0.28502655029296875, -0.2770271301269531, -0.2690277099609375, -0.2610282897949219, -0.25302886962890625, -0.24502944946289062, -0.237030029296875, -0.22903060913085938, -0.22103118896484375, -0.21303176879882812, -0.2050323486328125, -0.19703292846679688, -0.18903350830078125, -0.18103408813476562, -0.17303466796875, -0.16503524780273438, -0.15703582763671875, -0.14903640747070312, -0.1410369873046875, -0.13303756713867188, -0.12503814697265625, -0.11703872680664062, -0.109039306640625, -0.10103988647460938, -0.09304046630859375, -0.08504104614257812, -0.0770416259765625, -0.06904220581054688, -0.06104278564453125, -0.053043365478515625, -0.0450439453125, -0.037044525146484375, -0.02904510498046875, -0.021045684814453125, -0.0130462646484375, -0.005046844482421875, 0.00295257568359375, 0.010951995849609375, 0.018951416015625, 0.026950836181640625, 0.03495025634765625, 0.042949676513671875, 0.0509490966796875, 0.058948516845703125, 0.06694793701171875, 0.07494735717773438, 0.08294677734375, 0.09094619750976562, 0.09894561767578125, 0.10694503784179688, 0.1149444580078125, 0.12294387817382812, 0.13094329833984375, 0.13894271850585938, 0.146942138671875, 0.15494155883789062, 0.16294097900390625, 0.17094039916992188, 0.1789398193359375, 0.18693923950195312, 0.19493865966796875, 0.20293807983398438, 0.2109375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 10.0, 11.0, 16.0, 25.0, 23.0, 30.0, 52.0, 67.0, 68.0, 88.0, 94.0, 93.0, 97.0, 76.0, 64.0, 38.0, 48.0, 28.0, 18.0, 13.0, 12.0, 8.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.480181694030762, -13.184569358825684, -12.888957023620605, -12.593343734741211, -12.297731399536133, -12.002119064331055, -11.706506729125977, -11.410894393920898, -11.11528205871582, -10.819669723510742, -10.524057388305664, -10.22844409942627, -9.932831764221191, -9.637219429016113, -9.341607093811035, -9.045994758605957, -8.750381469726562, -8.454769134521484, -8.159156799316406, -7.86354398727417, -7.567931175231934, -7.2723188400268555, -6.976706504821777, -6.681094169616699, -6.385481357574463, -6.089869022369385, -5.794256210327148, -5.49864387512207, -5.203031539916992, -4.907418727874756, -4.611806392669678, -4.316193580627441, -4.020580291748047, -3.7249677181243896, -3.4293551445007324, -3.1337428092956543, -2.838130235671997, -2.54251766204834, -2.2469053268432617, -1.9512927532196045, -1.6556801795959473, -1.36006760597229, -1.0644551515579224, -0.7688426375389099, -0.47323012351989746, -0.17761754989624023, 0.11799490451812744, 0.4136073589324951, 0.7092199325561523, 1.0048325061798096, 1.3004449605941772, 1.596057415008545, 1.8916699886322021, 2.1872825622558594, 2.4828948974609375, 2.7785074710845947, 3.074120044708252, 3.369732618331909, 3.6653451919555664, 3.9609575271606445, 4.256569862365723, 4.552182674407959, 4.847795009613037, 5.143407821655273, 5.439020156860352]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 4.0, 3.0, 10.0, 11.0, 14.0, 11.0, 18.0, 15.0, 21.0, 30.0, 30.0, 20.0, 38.0, 27.0, 37.0, 40.0, 38.0, 48.0, 40.0, 55.0, 37.0, 45.0, 43.0, 33.0, 39.0, 34.0, 42.0, 36.0, 38.0, 23.0, 16.0, 20.0, 14.0, 22.0, 11.0, 13.0, 8.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.694929361343384, -3.5890119075775146, -3.4830944538116455, -3.3771772384643555, -3.2712597846984863, -3.165342330932617, -3.059424877166748, -2.953507423400879, -2.8475899696350098, -2.7416725158691406, -2.6357550621032715, -2.5298376083374023, -2.4239203929901123, -2.318002939224243, -2.212085485458374, -2.106168031692505, -2.000250816345215, -1.8943333625793457, -1.7884160280227661, -1.682498574256897, -1.5765811204910278, -1.4706637859344482, -1.364746332168579, -1.25882887840271, -1.1529114246368408, -1.0469939708709717, -0.9410765767097473, -0.835159182548523, -0.7292417287826538, -0.6233243346214294, -0.5174069404602051, -0.41148948669433594, -0.3055720329284668, -0.19965460896492004, -0.09373719990253448, 0.012180209159851074, 0.11809763312339783, 0.22401505708694458, 0.32993245124816895, 0.4358499050140381, 0.5417672991752625, 0.6476846933364868, 0.753602147102356, 0.8595195412635803, 0.9654369354248047, 1.0713543891906738, 1.177271842956543, 1.283189296722412, 1.3891066312789917, 1.4950240850448608, 1.6009414196014404, 1.7068588733673096, 1.8127763271331787, 1.9186937808990479, 2.024610996246338, 2.130528450012207, 2.236445903778076, 2.3423633575439453, 2.4482808113098145, 2.5541982650756836, 2.6601154804229736, 2.7660329341888428, 2.871950387954712, 2.977867841720581, 3.08378529548645]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 6.0, 11.0, 13.0, 26.0, 35.0, 43.0, 79.0, 156.0, 189.0, 336.0, 529.0, 854.0, 1511.0, 2539.0, 4221.0, 7151.0, 12325.0, 20584.0, 34839.0, 56570.0, 87769.0, 124462.0, 151877.0, 155933.0, 131961.0, 96067.0, 62815.0, 38732.0, 23442.0, 13597.0, 8117.0, 4768.0, 2877.0, 1606.0, 989.0, 587.0, 351.0, 205.0, 143.0, 92.0, 57.0, 40.0, 22.0, 12.0, 9.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.3828125, -3.286468505859375, -3.19012451171875, -3.093780517578125, -2.9974365234375, -2.901092529296875, -2.80474853515625, -2.708404541015625, -2.612060546875, -2.515716552734375, -2.41937255859375, -2.323028564453125, -2.2266845703125, -2.130340576171875, -2.03399658203125, -1.937652587890625, -1.84130859375, -1.744964599609375, -1.64862060546875, -1.552276611328125, -1.4559326171875, -1.359588623046875, -1.26324462890625, -1.166900634765625, -1.070556640625, -0.974212646484375, -0.87786865234375, -0.781524658203125, -0.6851806640625, -0.588836669921875, -0.49249267578125, -0.396148681640625, -0.2998046875, -0.203460693359375, -0.10711669921875, -0.010772705078125, 0.0855712890625, 0.181915283203125, 0.27825927734375, 0.374603271484375, 0.470947265625, 0.567291259765625, 0.66363525390625, 0.759979248046875, 0.8563232421875, 0.952667236328125, 1.04901123046875, 1.145355224609375, 1.24169921875, 1.338043212890625, 1.43438720703125, 1.530731201171875, 1.6270751953125, 1.723419189453125, 1.81976318359375, 1.916107177734375, 2.012451171875, 2.108795166015625, 2.20513916015625, 2.301483154296875, 2.3978271484375, 2.494171142578125, 2.59051513671875, 2.686859130859375, 2.783203125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 1.0, 8.0, 9.0, 10.0, 7.0, 12.0, 14.0, 22.0, 19.0, 28.0, 15.0, 40.0, 32.0, 35.0, 30.0, 42.0, 41.0, 51.0, 46.0, 43.0, 53.0, 49.0, 46.0, 31.0, 40.0, 35.0, 38.0, 43.0, 25.0, 24.0, 21.0, 18.0, 16.0, 14.0, 17.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.37890625, -4.260101318359375, -4.14129638671875, -4.022491455078125, -3.9036865234375, -3.784881591796875, -3.66607666015625, -3.547271728515625, -3.428466796875, -3.309661865234375, -3.19085693359375, -3.072052001953125, -2.9532470703125, -2.834442138671875, -2.71563720703125, -2.596832275390625, -2.47802734375, -2.359222412109375, -2.24041748046875, -2.121612548828125, -2.0028076171875, -1.884002685546875, -1.76519775390625, -1.646392822265625, -1.527587890625, -1.408782958984375, -1.28997802734375, -1.171173095703125, -1.0523681640625, -0.933563232421875, -0.81475830078125, -0.695953369140625, -0.5771484375, -0.458343505859375, -0.33953857421875, -0.220733642578125, -0.1019287109375, 0.016876220703125, 0.13568115234375, 0.254486083984375, 0.373291015625, 0.492095947265625, 0.61090087890625, 0.729705810546875, 0.8485107421875, 0.967315673828125, 1.08612060546875, 1.204925537109375, 1.32373046875, 1.442535400390625, 1.56134033203125, 1.680145263671875, 1.7989501953125, 1.917755126953125, 2.03656005859375, 2.155364990234375, 2.274169921875, 2.392974853515625, 2.51177978515625, 2.630584716796875, 2.7493896484375, 2.868194580078125, 2.98699951171875, 3.105804443359375, 3.224609375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 12.0, 16.0, 28.0, 46.0, 79.0, 124.0, 183.0, 248.0, 388.0, 600.0, 839.0, 1302.0, 1947.0, 3113.0, 4703.0, 7106.0, 10879.0, 16573.0, 25233.0, 37377.0, 54470.0, 75801.0, 99057.0, 116973.0, 124759.0, 118748.0, 100438.0, 77252.0, 55899.0, 38738.0, 25799.0, 17174.0, 11225.0, 7477.0, 4774.0, 3078.0, 2037.0, 1368.0, 944.0, 591.0, 394.0, 294.0, 153.0, 121.0, 66.0, 41.0, 33.0, 20.0, 14.0, 7.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.462890625, -2.384796142578125, -2.30670166015625, -2.228607177734375, -2.1505126953125, -2.072418212890625, -1.99432373046875, -1.916229248046875, -1.838134765625, -1.760040283203125, -1.68194580078125, -1.603851318359375, -1.5257568359375, -1.447662353515625, -1.36956787109375, -1.291473388671875, -1.21337890625, -1.135284423828125, -1.05718994140625, -0.979095458984375, -0.9010009765625, -0.822906494140625, -0.74481201171875, -0.666717529296875, -0.588623046875, -0.510528564453125, -0.43243408203125, -0.354339599609375, -0.2762451171875, -0.198150634765625, -0.12005615234375, -0.041961669921875, 0.0361328125, 0.114227294921875, 0.19232177734375, 0.270416259765625, 0.3485107421875, 0.426605224609375, 0.50469970703125, 0.582794189453125, 0.660888671875, 0.738983154296875, 0.81707763671875, 0.895172119140625, 0.9732666015625, 1.051361083984375, 1.12945556640625, 1.207550048828125, 1.28564453125, 1.363739013671875, 1.44183349609375, 1.519927978515625, 1.5980224609375, 1.676116943359375, 1.75421142578125, 1.832305908203125, 1.910400390625, 1.988494873046875, 2.06658935546875, 2.144683837890625, 2.2227783203125, 2.300872802734375, 2.37896728515625, 2.457061767578125, 2.53515625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 10.0, 8.0, 12.0, 22.0, 18.0, 9.0, 22.0, 32.0, 28.0, 14.0, 23.0, 26.0, 52.0, 39.0, 38.0, 41.0, 37.0, 47.0, 42.0, 42.0, 44.0, 41.0, 26.0, 26.0, 31.0, 33.0, 30.0, 27.0, 27.0, 20.0, 20.0, 14.0, 15.0, 15.0, 11.0, 12.0, 10.0, 6.0, 9.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.9975433349609375, -1.934539794921875, -1.8715362548828125, -1.80853271484375, -1.7455291748046875, -1.682525634765625, -1.6195220947265625, -1.5565185546875, -1.4935150146484375, -1.430511474609375, -1.3675079345703125, -1.30450439453125, -1.2415008544921875, -1.178497314453125, -1.1154937744140625, -1.052490234375, -0.9894866943359375, -0.926483154296875, -0.8634796142578125, -0.80047607421875, -0.7374725341796875, -0.674468994140625, -0.6114654541015625, -0.5484619140625, -0.4854583740234375, -0.422454833984375, -0.3594512939453125, -0.29644775390625, -0.2334442138671875, -0.170440673828125, -0.1074371337890625, -0.04443359375, 0.0185699462890625, 0.081573486328125, 0.1445770263671875, 0.20758056640625, 0.2705841064453125, 0.333587646484375, 0.3965911865234375, 0.4595947265625, 0.5225982666015625, 0.585601806640625, 0.6486053466796875, 0.71160888671875, 0.7746124267578125, 0.837615966796875, 0.9006195068359375, 0.963623046875, 1.0266265869140625, 1.089630126953125, 1.1526336669921875, 1.21563720703125, 1.2786407470703125, 1.341644287109375, 1.4046478271484375, 1.4676513671875, 1.5306549072265625, 1.593658447265625, 1.6566619873046875, 1.71966552734375, 1.7826690673828125, 1.845672607421875, 1.9086761474609375, 1.9716796875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 15.0, 24.0, 27.0, 48.0, 92.0, 142.0, 205.0, 348.0, 573.0, 860.0, 1378.0, 2175.0, 3427.0, 5931.0, 9927.0, 16736.0, 28126.0, 47756.0, 78198.0, 120046.0, 158888.0, 171230.0, 143772.0, 100732.0, 63619.0, 38286.0, 22635.0, 13138.0, 7801.0, 4749.0, 2849.0, 1771.0, 1095.0, 685.0, 454.0, 296.0, 193.0, 115.0, 71.0, 47.0, 35.0, 19.0, 10.0, 9.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5107421875, -1.4666748046875, -1.422607421875, -1.3785400390625, -1.33447265625, -1.2904052734375, -1.246337890625, -1.2022705078125, -1.158203125, -1.1141357421875, -1.070068359375, -1.0260009765625, -0.98193359375, -0.9378662109375, -0.893798828125, -0.8497314453125, -0.8056640625, -0.7615966796875, -0.717529296875, -0.6734619140625, -0.62939453125, -0.5853271484375, -0.541259765625, -0.4971923828125, -0.453125, -0.4090576171875, -0.364990234375, -0.3209228515625, -0.27685546875, -0.2327880859375, -0.188720703125, -0.1446533203125, -0.1005859375, -0.0565185546875, -0.012451171875, 0.0316162109375, 0.07568359375, 0.1197509765625, 0.163818359375, 0.2078857421875, 0.251953125, 0.2960205078125, 0.340087890625, 0.3841552734375, 0.42822265625, 0.4722900390625, 0.516357421875, 0.5604248046875, 0.6044921875, 0.6485595703125, 0.692626953125, 0.7366943359375, 0.78076171875, 0.8248291015625, 0.868896484375, 0.9129638671875, 0.95703125, 1.0010986328125, 1.045166015625, 1.0892333984375, 1.13330078125, 1.1773681640625, 1.221435546875, 1.2655029296875, 1.3095703125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 3.0, 2.0, 10.0, 6.0, 14.0, 21.0, 21.0, 29.0, 35.0, 37.0, 45.0, 49.0, 51.0, 61.0, 56.0, 72.0, 58.0, 64.0, 59.0, 60.0, 46.0, 40.0, 35.0, 27.0, 18.0, 20.0, 12.0, 10.0, 10.0, 5.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0001633167266845703, -0.0001587122678756714, -0.00015410780906677246, -0.00014950335025787354, -0.0001448988914489746, -0.00014029443264007568, -0.00013568997383117676, -0.00013108551502227783, -0.0001264810562133789, -0.00012187659740447998, -0.00011727213859558105, -0.00011266767978668213, -0.0001080632209777832, -0.00010345876216888428, -9.885430335998535e-05, -9.424984455108643e-05, -8.96453857421875e-05, -8.504092693328857e-05, -8.043646812438965e-05, -7.583200931549072e-05, -7.12275505065918e-05, -6.662309169769287e-05, -6.201863288879395e-05, -5.741417407989502e-05, -5.2809715270996094e-05, -4.820525646209717e-05, -4.360079765319824e-05, -3.8996338844299316e-05, -3.439188003540039e-05, -2.9787421226501465e-05, -2.518296241760254e-05, -2.0578503608703613e-05, -1.5974044799804688e-05, -1.1369585990905762e-05, -6.765127182006836e-06, -2.16066837310791e-06, 2.4437904357910156e-06, 7.048249244689941e-06, 1.1652708053588867e-05, 1.6257166862487793e-05, 2.086162567138672e-05, 2.5466084480285645e-05, 3.007054328918457e-05, 3.4675002098083496e-05, 3.927946090698242e-05, 4.388391971588135e-05, 4.8488378524780273e-05, 5.30928373336792e-05, 5.7697296142578125e-05, 6.230175495147705e-05, 6.690621376037598e-05, 7.15106725692749e-05, 7.611513137817383e-05, 8.071959018707275e-05, 8.532404899597168e-05, 8.99285078048706e-05, 9.453296661376953e-05, 9.913742542266846e-05, 0.00010374188423156738, 0.00010834634304046631, 0.00011295080184936523, 0.00011755526065826416, 0.00012215971946716309, 0.000126764178276062, 0.00013136863708496094]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 10.0, 21.0, 19.0, 26.0, 48.0, 69.0, 99.0, 179.0, 261.0, 492.0, 844.0, 1447.0, 2467.0, 4469.0, 7932.0, 14283.0, 26335.0, 47849.0, 83905.0, 135459.0, 183642.0, 187078.0, 143315.0, 91260.0, 52078.0, 29050.0, 15789.0, 8736.0, 4756.0, 2782.0, 1562.0, 881.0, 557.0, 287.0, 199.0, 114.0, 83.0, 51.0, 22.0, 22.0, 15.0, 14.0, 11.0, 8.0, 2.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.658203125, -1.6095428466796875, -1.560882568359375, -1.5122222900390625, -1.46356201171875, -1.4149017333984375, -1.366241455078125, -1.3175811767578125, -1.2689208984375, -1.2202606201171875, -1.171600341796875, -1.1229400634765625, -1.07427978515625, -1.0256195068359375, -0.976959228515625, -0.9282989501953125, -0.879638671875, -0.8309783935546875, -0.782318115234375, -0.7336578369140625, -0.68499755859375, -0.6363372802734375, -0.587677001953125, -0.5390167236328125, -0.4903564453125, -0.4416961669921875, -0.393035888671875, -0.3443756103515625, -0.29571533203125, -0.2470550537109375, -0.198394775390625, -0.1497344970703125, -0.10107421875, -0.0524139404296875, -0.003753662109375, 0.0449066162109375, 0.09356689453125, 0.1422271728515625, 0.190887451171875, 0.2395477294921875, 0.2882080078125, 0.3368682861328125, 0.385528564453125, 0.4341888427734375, 0.48284912109375, 0.5315093994140625, 0.580169677734375, 0.6288299560546875, 0.677490234375, 0.7261505126953125, 0.774810791015625, 0.8234710693359375, 0.87213134765625, 0.9207916259765625, 0.969451904296875, 1.0181121826171875, 1.0667724609375, 1.1154327392578125, 1.164093017578125, 1.2127532958984375, 1.26141357421875, 1.3100738525390625, 1.358734130859375, 1.4073944091796875, 1.4560546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 10.0, 13.0, 9.0, 16.0, 17.0, 23.0, 31.0, 19.0, 29.0, 31.0, 54.0, 49.0, 45.0, 43.0, 51.0, 45.0, 45.0, 55.0, 50.0, 43.0, 40.0, 40.0, 37.0, 26.0, 29.0, 21.0, 28.0, 22.0, 12.0, 10.0, 12.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3974609375, -0.38423919677734375, -0.3710174560546875, -0.35779571533203125, -0.344573974609375, -0.33135223388671875, -0.3181304931640625, -0.30490875244140625, -0.29168701171875, -0.27846527099609375, -0.2652435302734375, -0.25202178955078125, -0.238800048828125, -0.22557830810546875, -0.2123565673828125, -0.19913482666015625, -0.1859130859375, -0.17269134521484375, -0.1594696044921875, -0.14624786376953125, -0.133026123046875, -0.11980438232421875, -0.1065826416015625, -0.09336090087890625, -0.08013916015625, -0.06691741943359375, -0.0536956787109375, -0.04047393798828125, -0.027252197265625, -0.01403045654296875, -0.0008087158203125, 0.01241302490234375, 0.025634765625, 0.03885650634765625, 0.0520782470703125, 0.06529998779296875, 0.078521728515625, 0.09174346923828125, 0.1049652099609375, 0.11818695068359375, 0.13140869140625, 0.14463043212890625, 0.1578521728515625, 0.17107391357421875, 0.184295654296875, 0.19751739501953125, 0.2107391357421875, 0.22396087646484375, 0.2371826171875, 0.25040435791015625, 0.2636260986328125, 0.27684783935546875, 0.290069580078125, 0.30329132080078125, 0.3165130615234375, 0.32973480224609375, 0.34295654296875, 0.35617828369140625, 0.3694000244140625, 0.38262176513671875, 0.395843505859375, 0.40906524658203125, 0.4222869873046875, 0.43550872802734375, 0.44873046875]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 8.0, 12.0, 11.0, 25.0, 33.0, 33.0, 42.0, 55.0, 74.0, 79.0, 87.0, 91.0, 107.0, 87.0, 66.0, 41.0, 35.0, 40.0, 19.0, 16.0, 12.0, 8.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-13.601099967956543, -13.304840087890625, -13.008581161499023, -12.712321281433105, -12.416061401367188, -12.119802474975586, -11.823542594909668, -11.52728271484375, -11.231023788452148, -10.93476390838623, -10.638504981994629, -10.342245101928711, -10.04598617553711, -9.749726295471191, -9.453466415405273, -9.157207489013672, -8.860947608947754, -8.564687728881836, -8.268428802490234, -7.972168922424316, -7.675909519195557, -7.379650115966797, -7.083390235900879, -6.787130832672119, -6.490871429443359, -6.1946120262146, -5.89835262298584, -5.602092742919922, -5.305833339691162, -5.009573936462402, -4.713314056396484, -4.417054653167725, -4.120794296264648, -3.8245348930358887, -3.52827525138855, -3.232015609741211, -2.935756206512451, -2.6394968032836914, -2.3432371616363525, -2.0469775199890137, -1.750718116760254, -1.4544585943222046, -1.1581990718841553, -0.861939549446106, -0.5656800270080566, -0.2694205045700073, 0.026839017868041992, 0.32309865951538086, 0.6193580627441406, 0.9156175851821899, 1.2118771076202393, 1.5081366300582886, 1.804396152496338, 2.1006555557250977, 2.3969151973724365, 2.6931748390197754, 2.989434242248535, 3.285693645477295, 3.581953287124634, 3.8782129287719727, 4.174472332000732, 4.470731735229492, 4.76699161529541, 5.06325101852417, 5.35951042175293]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 10.0, 14.0, 20.0, 21.0, 30.0, 30.0, 25.0, 32.0, 26.0, 33.0, 40.0, 44.0, 40.0, 36.0, 50.0, 54.0, 59.0, 54.0, 35.0, 53.0, 43.0, 42.0, 34.0, 30.0, 31.0, 26.0, 11.0, 16.0, 9.0, 11.0, 6.0, 8.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.361629009246826, -4.244543075561523, -4.1274566650390625, -4.01037073135376, -3.893284797668457, -3.776198625564575, -3.6591124534606934, -3.5420265197753906, -3.424940347671509, -3.307854175567627, -3.190768241882324, -3.0736820697784424, -2.9565958976745605, -2.839509963989258, -2.722423791885376, -2.605337619781494, -2.4882516860961914, -2.3711655139923096, -2.254079580307007, -2.136993408203125, -2.0199074745178223, -1.9028213024139404, -1.7857351303100586, -1.6686490774154663, -1.551563024520874, -1.4344769716262817, -1.3173909187316895, -1.2003047466278076, -1.0832186937332153, -0.966132640838623, -0.849046528339386, -0.7319604158401489, -0.6148743629455566, -0.49778828024864197, -0.3807021975517273, -0.2636161148548126, -0.14653003215789795, -0.029443979263305664, 0.0876421332359314, 0.20472824573516846, 0.32181429862976074, 0.4389003813266754, 0.5559864640235901, 0.6730725765228271, 0.7901586294174194, 0.9072446823120117, 1.0243308544158936, 1.1414169073104858, 1.2585029602050781, 1.3755890130996704, 1.4926750659942627, 1.6097612380981445, 1.7268472909927368, 1.843933343887329, 1.961019515991211, 2.0781054496765137, 2.1951916217803955, 2.3122777938842773, 2.42936372756958, 2.546449899673462, 2.6635360717773438, 2.7806220054626465, 2.8977081775665283, 3.01479434967041, 3.131880283355713]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 6.0, 15.0, 13.0, 16.0, 29.0, 41.0, 49.0, 50.0, 92.0, 113.0, 222.0, 299.0, 445.0, 733.0, 1168.0, 2006.0, 3221.0, 5654.0, 10816.0, 20380.0, 42956.0, 101702.0, 281230.0, 863378.0, 1570182.0, 839419.0, 267896.0, 97368.0, 41311.0, 19769.0, 9995.0, 5636.0, 3166.0, 1766.0, 1080.0, 730.0, 465.0, 270.0, 197.0, 116.0, 76.0, 68.0, 40.0, 32.0, 19.0, 14.0, 9.0, 6.0, 4.0, 1.0, 5.0, 4.0, 2.0, 4.0], "bins": [-7.8671875, -7.6390380859375, -7.410888671875, -7.1827392578125, -6.95458984375, -6.7264404296875, -6.498291015625, -6.2701416015625, -6.0419921875, -5.8138427734375, -5.585693359375, -5.3575439453125, -5.12939453125, -4.9012451171875, -4.673095703125, -4.4449462890625, -4.216796875, -3.9886474609375, -3.760498046875, -3.5323486328125, -3.30419921875, -3.0760498046875, -2.847900390625, -2.6197509765625, -2.3916015625, -2.1634521484375, -1.935302734375, -1.7071533203125, -1.47900390625, -1.2508544921875, -1.022705078125, -0.7945556640625, -0.56640625, -0.3382568359375, -0.110107421875, 0.1180419921875, 0.34619140625, 0.5743408203125, 0.802490234375, 1.0306396484375, 1.2587890625, 1.4869384765625, 1.715087890625, 1.9432373046875, 2.17138671875, 2.3995361328125, 2.627685546875, 2.8558349609375, 3.083984375, 3.3121337890625, 3.540283203125, 3.7684326171875, 3.99658203125, 4.2247314453125, 4.452880859375, 4.6810302734375, 4.9091796875, 5.1373291015625, 5.365478515625, 5.5936279296875, 5.82177734375, 6.0499267578125, 6.278076171875, 6.5062255859375, 6.734375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 9.0, 3.0, 8.0, 9.0, 12.0, 18.0, 16.0, 17.0, 17.0, 31.0, 23.0, 38.0, 35.0, 37.0, 46.0, 31.0, 57.0, 44.0, 46.0, 42.0, 43.0, 52.0, 40.0, 41.0, 31.0, 40.0, 44.0, 28.0, 23.0, 20.0, 22.0, 15.0, 9.0, 13.0, 6.0, 6.0, 9.0, 8.0, 2.0, 8.0, 2.0, 3.0], "bins": [-3.458984375, -3.3746337890625, -3.290283203125, -3.2059326171875, -3.12158203125, -3.0372314453125, -2.952880859375, -2.8685302734375, -2.7841796875, -2.6998291015625, -2.615478515625, -2.5311279296875, -2.44677734375, -2.3624267578125, -2.278076171875, -2.1937255859375, -2.109375, -2.0250244140625, -1.940673828125, -1.8563232421875, -1.77197265625, -1.6876220703125, -1.603271484375, -1.5189208984375, -1.4345703125, -1.3502197265625, -1.265869140625, -1.1815185546875, -1.09716796875, -1.0128173828125, -0.928466796875, -0.8441162109375, -0.759765625, -0.6754150390625, -0.591064453125, -0.5067138671875, -0.42236328125, -0.3380126953125, -0.253662109375, -0.1693115234375, -0.0849609375, -0.0006103515625, 0.083740234375, 0.1680908203125, 0.25244140625, 0.3367919921875, 0.421142578125, 0.5054931640625, 0.58984375, 0.6741943359375, 0.758544921875, 0.8428955078125, 0.92724609375, 1.0115966796875, 1.095947265625, 1.1802978515625, 1.2646484375, 1.3489990234375, 1.433349609375, 1.5177001953125, 1.60205078125, 1.6864013671875, 1.770751953125, 1.8551025390625, 1.939453125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 9.0, 18.0, 35.0, 35.0, 85.0, 94.0, 157.0, 202.0, 360.0, 568.0, 905.0, 1489.0, 2313.0, 3727.0, 6302.0, 10371.0, 17859.0, 31956.0, 60561.0, 119291.0, 252675.0, 552885.0, 1064235.0, 1041923.0, 533769.0, 243963.0, 115686.0, 58350.0, 31262.0, 17245.0, 10099.0, 6010.0, 3711.0, 2347.0, 1396.0, 838.0, 536.0, 352.0, 248.0, 139.0, 93.0, 60.0, 42.0, 28.0, 20.0, 11.0, 8.0, 4.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.91015625, -5.7193603515625, -5.528564453125, -5.3377685546875, -5.14697265625, -4.9561767578125, -4.765380859375, -4.5745849609375, -4.3837890625, -4.1929931640625, -4.002197265625, -3.8114013671875, -3.62060546875, -3.4298095703125, -3.239013671875, -3.0482177734375, -2.857421875, -2.6666259765625, -2.475830078125, -2.2850341796875, -2.09423828125, -1.9034423828125, -1.712646484375, -1.5218505859375, -1.3310546875, -1.1402587890625, -0.949462890625, -0.7586669921875, -0.56787109375, -0.3770751953125, -0.186279296875, 0.0045166015625, 0.1953125, 0.3861083984375, 0.576904296875, 0.7677001953125, 0.95849609375, 1.1492919921875, 1.340087890625, 1.5308837890625, 1.7216796875, 1.9124755859375, 2.103271484375, 2.2940673828125, 2.48486328125, 2.6756591796875, 2.866455078125, 3.0572509765625, 3.248046875, 3.4388427734375, 3.629638671875, 3.8204345703125, 4.01123046875, 4.2020263671875, 4.392822265625, 4.5836181640625, 4.7744140625, 4.9652099609375, 5.156005859375, 5.3468017578125, 5.53759765625, 5.7283935546875, 5.919189453125, 6.1099853515625, 6.30078125]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 11.0, 8.0, 15.0, 23.0, 35.0, 46.0, 49.0, 55.0, 88.0, 106.0, 138.0, 193.0, 237.0, 280.0, 336.0, 385.0, 392.0, 339.0, 318.0, 239.0, 192.0, 148.0, 109.0, 93.0, 58.0, 46.0, 31.0, 28.0, 20.0, 14.0, 9.0, 7.0, 8.0, 5.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9619140625, -1.8965301513671875, -1.831146240234375, -1.7657623291015625, -1.70037841796875, -1.6349945068359375, -1.569610595703125, -1.5042266845703125, -1.4388427734375, -1.3734588623046875, -1.308074951171875, -1.2426910400390625, -1.17730712890625, -1.1119232177734375, -1.046539306640625, -0.9811553955078125, -0.915771484375, -0.8503875732421875, -0.785003662109375, -0.7196197509765625, -0.65423583984375, -0.5888519287109375, -0.523468017578125, -0.4580841064453125, -0.3927001953125, -0.3273162841796875, -0.261932373046875, -0.1965484619140625, -0.13116455078125, -0.0657806396484375, -0.000396728515625, 0.0649871826171875, 0.13037109375, 0.1957550048828125, 0.261138916015625, 0.3265228271484375, 0.39190673828125, 0.4572906494140625, 0.522674560546875, 0.5880584716796875, 0.6534423828125, 0.7188262939453125, 0.784210205078125, 0.8495941162109375, 0.91497802734375, 0.9803619384765625, 1.045745849609375, 1.1111297607421875, 1.176513671875, 1.2418975830078125, 1.307281494140625, 1.3726654052734375, 1.43804931640625, 1.5034332275390625, 1.568817138671875, 1.6342010498046875, 1.6995849609375, 1.7649688720703125, 1.830352783203125, 1.8957366943359375, 1.96112060546875, 2.0265045166015625, 2.091888427734375, 2.1572723388671875, 2.22265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 9.0, 8.0, 6.0, 8.0, 22.0, 27.0, 34.0, 35.0, 65.0, 62.0, 101.0, 115.0, 118.0, 107.0, 85.0, 58.0, 47.0, 24.0, 25.0, 18.0, 11.0, 10.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.51675796508789, -16.16375160217285, -15.810744285583496, -15.45773696899414, -15.104729652404785, -14.75172233581543, -14.39871597290039, -14.045708656311035, -13.69270133972168, -13.339694023132324, -12.986687660217285, -12.63368034362793, -12.280673027038574, -11.927665710449219, -11.57465934753418, -11.221652030944824, -10.868644714355469, -10.515637397766113, -10.162631034851074, -9.809623718261719, -9.456616401672363, -9.103609085083008, -8.750602722167969, -8.397595405578613, -8.044589042663574, -7.691582202911377, -7.3385748863220215, -6.985568046569824, -6.632560729980469, -6.2795538902282715, -5.926547050476074, -5.573539733886719, -5.220532417297363, -4.867525577545166, -4.5145182609558105, -4.161511421203613, -3.808504104614258, -3.4554972648620605, -3.102490186691284, -2.749483108520508, -2.3964760303497314, -2.043468952178955, -1.6904618740081787, -1.337454915046692, -0.9844478368759155, -0.6314407587051392, -0.27843379974365234, 0.07457327842712402, 0.4275803565979004, 0.7805874347686768, 1.1335945129394531, 1.48660147190094, 1.8396085500717163, 2.192615509033203, 2.5456225872039795, 2.898629665374756, 3.2516367435455322, 3.6046438217163086, 3.957650899887085, 4.310657978057861, 4.663664817810059, 5.016672134399414, 5.369678974151611, 5.722685813903809, 6.075693130493164]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 3.0, 11.0, 16.0, 15.0, 15.0, 13.0, 20.0, 29.0, 21.0, 30.0, 18.0, 33.0, 35.0, 29.0, 32.0, 33.0, 41.0, 32.0, 39.0, 39.0, 34.0, 51.0, 44.0, 41.0, 45.0, 32.0, 32.0, 32.0, 24.0, 25.0, 17.0, 21.0, 14.0, 17.0, 16.0, 11.0, 17.0, 7.0, 4.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.3351566791534424, -3.2348620891571045, -3.1345677375793457, -3.034273147583008, -2.933978796005249, -2.833684206008911, -2.7333898544311523, -2.6330952644348145, -2.5328006744384766, -2.4325060844421387, -2.33221173286438, -2.231917142868042, -2.131622791290283, -2.0313282012939453, -1.931033730506897, -1.8307392597198486, -1.7304449081420898, -1.6301504373550415, -1.5298559665679932, -1.4295613765716553, -1.3292670249938965, -1.2289724349975586, -1.1286779642105103, -1.028383493423462, -0.9280890226364136, -0.8277945518493652, -0.7275000810623169, -0.6272055506706238, -0.5269110798835754, -0.4266166090965271, -0.326322078704834, -0.22602760791778564, -0.1257328987121582, -0.02543841302394867, 0.07485607266426086, 0.1751505732536316, 0.27544504404067993, 0.37573951482772827, 0.4760340452194214, 0.5763285160064697, 0.6766229867935181, 0.7769174575805664, 0.8772119283676147, 0.9775064587593079, 1.077800989151001, 1.1780953407287598, 1.2783899307250977, 1.378684401512146, 1.4789788722991943, 1.5792733430862427, 1.679567813873291, 1.779862403869629, 1.8801567554473877, 1.9804513454437256, 2.0807456970214844, 2.1810402870178223, 2.28133487701416, 2.381629467010498, 2.481923818588257, 2.5822184085845947, 2.6825127601623535, 2.7828073501586914, 2.8831019401550293, 2.983396291732788, 3.083690643310547]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 8.0, 12.0, 23.0, 31.0, 50.0, 109.0, 147.0, 262.0, 408.0, 773.0, 1273.0, 2444.0, 4289.0, 7693.0, 13997.0, 26017.0, 47732.0, 85928.0, 141485.0, 192018.0, 192486.0, 140728.0, 85264.0, 47643.0, 26013.0, 14175.0, 7729.0, 4264.0, 2352.0, 1322.0, 737.0, 432.0, 275.0, 153.0, 108.0, 52.0, 44.0, 24.0, 21.0, 5.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.5546875, -2.481689453125, -2.40869140625, -2.335693359375, -2.2626953125, -2.189697265625, -2.11669921875, -2.043701171875, -1.970703125, -1.897705078125, -1.82470703125, -1.751708984375, -1.6787109375, -1.605712890625, -1.53271484375, -1.459716796875, -1.38671875, -1.313720703125, -1.24072265625, -1.167724609375, -1.0947265625, -1.021728515625, -0.94873046875, -0.875732421875, -0.802734375, -0.729736328125, -0.65673828125, -0.583740234375, -0.5107421875, -0.437744140625, -0.36474609375, -0.291748046875, -0.21875, -0.145751953125, -0.07275390625, 0.000244140625, 0.0732421875, 0.146240234375, 0.21923828125, 0.292236328125, 0.365234375, 0.438232421875, 0.51123046875, 0.584228515625, 0.6572265625, 0.730224609375, 0.80322265625, 0.876220703125, 0.94921875, 1.022216796875, 1.09521484375, 1.168212890625, 1.2412109375, 1.314208984375, 1.38720703125, 1.460205078125, 1.533203125, 1.606201171875, 1.67919921875, 1.752197265625, 1.8251953125, 1.898193359375, 1.97119140625, 2.044189453125, 2.1171875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 5.0, 12.0, 7.0, 8.0, 7.0, 10.0, 24.0, 15.0, 22.0, 16.0, 28.0, 26.0, 27.0, 22.0, 28.0, 32.0, 29.0, 33.0, 38.0, 30.0, 43.0, 35.0, 33.0, 35.0, 45.0, 40.0, 26.0, 43.0, 33.0, 40.0, 24.0, 21.0, 29.0, 11.0, 21.0, 23.0, 17.0, 12.0, 11.0, 9.0, 7.0, 6.0, 7.0, 9.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.30859375, -3.208160400390625, -3.10772705078125, -3.007293701171875, -2.9068603515625, -2.806427001953125, -2.70599365234375, -2.605560302734375, -2.505126953125, -2.404693603515625, -2.30426025390625, -2.203826904296875, -2.1033935546875, -2.002960205078125, -1.90252685546875, -1.802093505859375, -1.70166015625, -1.601226806640625, -1.50079345703125, -1.400360107421875, -1.2999267578125, -1.199493408203125, -1.09906005859375, -0.998626708984375, -0.898193359375, -0.797760009765625, -0.69732666015625, -0.596893310546875, -0.4964599609375, -0.396026611328125, -0.29559326171875, -0.195159912109375, -0.0947265625, 0.005706787109375, 0.10614013671875, 0.206573486328125, 0.3070068359375, 0.407440185546875, 0.50787353515625, 0.608306884765625, 0.708740234375, 0.809173583984375, 0.90960693359375, 1.010040283203125, 1.1104736328125, 1.210906982421875, 1.31134033203125, 1.411773681640625, 1.51220703125, 1.612640380859375, 1.71307373046875, 1.813507080078125, 1.9139404296875, 2.014373779296875, 2.11480712890625, 2.215240478515625, 2.315673828125, 2.416107177734375, 2.51654052734375, 2.616973876953125, 2.7174072265625, 2.817840576171875, 2.91827392578125, 3.018707275390625, 3.119140625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 9.0, 19.0, 34.0, 27.0, 57.0, 74.0, 121.0, 213.0, 301.0, 453.0, 769.0, 1173.0, 1786.0, 2984.0, 4625.0, 7577.0, 12425.0, 19949.0, 32829.0, 53371.0, 85742.0, 130964.0, 174308.0, 172761.0, 128386.0, 83422.0, 51649.0, 31918.0, 19119.0, 11813.0, 7318.0, 4519.0, 2871.0, 1765.0, 1161.0, 769.0, 455.0, 289.0, 185.0, 122.0, 79.0, 44.0, 29.0, 31.0, 14.0, 7.0, 3.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08984375, -2.020111083984375, -1.95037841796875, -1.880645751953125, -1.8109130859375, -1.741180419921875, -1.67144775390625, -1.601715087890625, -1.531982421875, -1.462249755859375, -1.39251708984375, -1.322784423828125, -1.2530517578125, -1.183319091796875, -1.11358642578125, -1.043853759765625, -0.97412109375, -0.904388427734375, -0.83465576171875, -0.764923095703125, -0.6951904296875, -0.625457763671875, -0.55572509765625, -0.485992431640625, -0.416259765625, -0.346527099609375, -0.27679443359375, -0.207061767578125, -0.1373291015625, -0.067596435546875, 0.00213623046875, 0.071868896484375, 0.1416015625, 0.211334228515625, 0.28106689453125, 0.350799560546875, 0.4205322265625, 0.490264892578125, 0.55999755859375, 0.629730224609375, 0.699462890625, 0.769195556640625, 0.83892822265625, 0.908660888671875, 0.9783935546875, 1.048126220703125, 1.11785888671875, 1.187591552734375, 1.25732421875, 1.327056884765625, 1.39678955078125, 1.466522216796875, 1.5362548828125, 1.605987548828125, 1.67572021484375, 1.745452880859375, 1.815185546875, 1.884918212890625, 1.95465087890625, 2.024383544921875, 2.0941162109375, 2.163848876953125, 2.23358154296875, 2.303314208984375, 2.373046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 8.0, 7.0, 14.0, 10.0, 10.0, 6.0, 12.0, 12.0, 23.0, 21.0, 25.0, 25.0, 26.0, 30.0, 28.0, 39.0, 33.0, 34.0, 44.0, 48.0, 27.0, 35.0, 41.0, 38.0, 37.0, 39.0, 47.0, 35.0, 29.0, 27.0, 21.0, 24.0, 23.0, 16.0, 14.0, 19.0, 17.0, 15.0, 5.0, 6.0, 7.0, 3.0, 5.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-1.990234375, -1.931304931640625, -1.87237548828125, -1.813446044921875, -1.7545166015625, -1.695587158203125, -1.63665771484375, -1.577728271484375, -1.518798828125, -1.459869384765625, -1.40093994140625, -1.342010498046875, -1.2830810546875, -1.224151611328125, -1.16522216796875, -1.106292724609375, -1.04736328125, -0.988433837890625, -0.92950439453125, -0.870574951171875, -0.8116455078125, -0.752716064453125, -0.69378662109375, -0.634857177734375, -0.575927734375, -0.516998291015625, -0.45806884765625, -0.399139404296875, -0.3402099609375, -0.281280517578125, -0.22235107421875, -0.163421630859375, -0.1044921875, -0.045562744140625, 0.01336669921875, 0.072296142578125, 0.1312255859375, 0.190155029296875, 0.24908447265625, 0.308013916015625, 0.366943359375, 0.425872802734375, 0.48480224609375, 0.543731689453125, 0.6026611328125, 0.661590576171875, 0.72052001953125, 0.779449462890625, 0.83837890625, 0.897308349609375, 0.95623779296875, 1.015167236328125, 1.0740966796875, 1.133026123046875, 1.19195556640625, 1.250885009765625, 1.309814453125, 1.368743896484375, 1.42767333984375, 1.486602783203125, 1.5455322265625, 1.604461669921875, 1.66339111328125, 1.722320556640625, 1.78125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 11.0, 13.0, 20.0, 22.0, 28.0, 56.0, 86.0, 94.0, 166.0, 221.0, 397.0, 650.0, 1221.0, 2019.0, 3674.0, 7293.0, 14174.0, 29187.0, 61636.0, 131734.0, 245086.0, 263779.0, 149585.0, 70906.0, 33098.0, 15871.0, 8007.0, 4234.0, 2160.0, 1196.0, 710.0, 414.0, 276.0, 166.0, 106.0, 77.0, 44.0, 41.0, 32.0, 16.0, 11.0, 10.0, 7.0, 7.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5849609375, -1.5370635986328125, -1.489166259765625, -1.4412689208984375, -1.39337158203125, -1.3454742431640625, -1.297576904296875, -1.2496795654296875, -1.2017822265625, -1.1538848876953125, -1.105987548828125, -1.0580902099609375, -1.01019287109375, -0.9622955322265625, -0.914398193359375, -0.8665008544921875, -0.818603515625, -0.7707061767578125, -0.722808837890625, -0.6749114990234375, -0.62701416015625, -0.5791168212890625, -0.531219482421875, -0.4833221435546875, -0.4354248046875, -0.3875274658203125, -0.339630126953125, -0.2917327880859375, -0.24383544921875, -0.1959381103515625, -0.148040771484375, -0.1001434326171875, -0.05224609375, -0.0043487548828125, 0.043548583984375, 0.0914459228515625, 0.13934326171875, 0.1872406005859375, 0.235137939453125, 0.2830352783203125, 0.3309326171875, 0.3788299560546875, 0.426727294921875, 0.4746246337890625, 0.52252197265625, 0.5704193115234375, 0.618316650390625, 0.6662139892578125, 0.714111328125, 0.7620086669921875, 0.809906005859375, 0.8578033447265625, 0.90570068359375, 0.9535980224609375, 1.001495361328125, 1.0493927001953125, 1.0972900390625, 1.1451873779296875, 1.193084716796875, 1.2409820556640625, 1.28887939453125, 1.3367767333984375, 1.384674072265625, 1.4325714111328125, 1.48046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 9.0, 7.0, 11.0, 11.0, 24.0, 19.0, 19.0, 22.0, 30.0, 41.0, 49.0, 43.0, 43.0, 56.0, 55.0, 55.0, 48.0, 59.0, 52.0, 47.0, 52.0, 47.0, 29.0, 34.0, 20.0, 17.0, 21.0, 14.0, 11.0, 9.0, 6.0, 7.0, 9.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.857778549194336e-05, -4.682503640651703e-05, -4.50722873210907e-05, -4.331953823566437e-05, -4.156678915023804e-05, -3.9814040064811707e-05, -3.8061290979385376e-05, -3.6308541893959045e-05, -3.4555792808532715e-05, -3.2803043723106384e-05, -3.1050294637680054e-05, -2.9297545552253723e-05, -2.7544796466827393e-05, -2.5792047381401062e-05, -2.403929829597473e-05, -2.22865492105484e-05, -2.053380012512207e-05, -1.878105103969574e-05, -1.702830195426941e-05, -1.527555286884308e-05, -1.3522803783416748e-05, -1.1770054697990417e-05, -1.0017305612564087e-05, -8.264556527137756e-06, -6.511807441711426e-06, -4.759058356285095e-06, -3.0063092708587646e-06, -1.253560185432434e-06, 4.991888999938965e-07, 2.251937985420227e-06, 4.004687070846558e-06, 5.757436156272888e-06, 7.510185241699219e-06, 9.26293432712555e-06, 1.101568341255188e-05, 1.276843249797821e-05, 1.4521181583404541e-05, 1.627393066883087e-05, 1.8026679754257202e-05, 1.9779428839683533e-05, 2.1532177925109863e-05, 2.3284927010536194e-05, 2.5037676095962524e-05, 2.6790425181388855e-05, 2.8543174266815186e-05, 3.0295923352241516e-05, 3.204867243766785e-05, 3.380142152309418e-05, 3.555417060852051e-05, 3.730691969394684e-05, 3.905966877937317e-05, 4.08124178647995e-05, 4.256516695022583e-05, 4.431791603565216e-05, 4.607066512107849e-05, 4.782341420650482e-05, 4.957616329193115e-05, 5.132891237735748e-05, 5.3081661462783813e-05, 5.4834410548210144e-05, 5.6587159633636475e-05, 5.8339908719062805e-05, 6.0092657804489136e-05, 6.184540688991547e-05, 6.35981559753418e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 16.0, 21.0, 37.0, 63.0, 70.0, 116.0, 207.0, 260.0, 397.0, 705.0, 1054.0, 1552.0, 2446.0, 3774.0, 5988.0, 9560.0, 15209.0, 24832.0, 38735.0, 60572.0, 89129.0, 121649.0, 145790.0, 145514.0, 122064.0, 90092.0, 61502.0, 39877.0, 25019.0, 15601.0, 9636.0, 6210.0, 3788.0, 2541.0, 1579.0, 1018.0, 683.0, 439.0, 276.0, 186.0, 116.0, 78.0, 60.0, 26.0, 21.0, 14.0, 11.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.8828125, -0.8552398681640625, -0.827667236328125, -0.8000946044921875, -0.77252197265625, -0.7449493408203125, -0.717376708984375, -0.6898040771484375, -0.6622314453125, -0.6346588134765625, -0.607086181640625, -0.5795135498046875, -0.55194091796875, -0.5243682861328125, -0.496795654296875, -0.4692230224609375, -0.441650390625, -0.4140777587890625, -0.386505126953125, -0.3589324951171875, -0.33135986328125, -0.3037872314453125, -0.276214599609375, -0.2486419677734375, -0.2210693359375, -0.1934967041015625, -0.165924072265625, -0.1383514404296875, -0.11077880859375, -0.0832061767578125, -0.055633544921875, -0.0280609130859375, -0.00048828125, 0.0270843505859375, 0.054656982421875, 0.0822296142578125, 0.10980224609375, 0.1373748779296875, 0.164947509765625, 0.1925201416015625, 0.2200927734375, 0.2476654052734375, 0.275238037109375, 0.3028106689453125, 0.33038330078125, 0.3579559326171875, 0.385528564453125, 0.4131011962890625, 0.440673828125, 0.4682464599609375, 0.495819091796875, 0.5233917236328125, 0.55096435546875, 0.5785369873046875, 0.606109619140625, 0.6336822509765625, 0.6612548828125, 0.6888275146484375, 0.716400146484375, 0.7439727783203125, 0.77154541015625, 0.7991180419921875, 0.826690673828125, 0.8542633056640625, 0.8818359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 6.0, 6.0, 4.0, 2.0, 6.0, 10.0, 10.0, 10.0, 10.0, 19.0, 21.0, 29.0, 38.0, 36.0, 46.0, 55.0, 79.0, 48.0, 63.0, 49.0, 57.0, 61.0, 53.0, 47.0, 41.0, 32.0, 24.0, 23.0, 14.0, 18.0, 14.0, 16.0, 12.0, 7.0, 8.0, 6.0, 6.0, 6.0, 4.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298828125, -0.28974151611328125, -0.2806549072265625, -0.27156829833984375, -0.262481689453125, -0.25339508056640625, -0.2443084716796875, -0.23522186279296875, -0.22613525390625, -0.21704864501953125, -0.2079620361328125, -0.19887542724609375, -0.189788818359375, -0.18070220947265625, -0.1716156005859375, -0.16252899169921875, -0.1534423828125, -0.14435577392578125, -0.1352691650390625, -0.12618255615234375, -0.117095947265625, -0.10800933837890625, -0.0989227294921875, -0.08983612060546875, -0.08074951171875, -0.07166290283203125, -0.0625762939453125, -0.05348968505859375, -0.044403076171875, -0.03531646728515625, -0.0262298583984375, -0.01714324951171875, -0.008056640625, 0.00102996826171875, 0.0101165771484375, 0.01920318603515625, 0.028289794921875, 0.03737640380859375, 0.0464630126953125, 0.05554962158203125, 0.06463623046875, 0.07372283935546875, 0.0828094482421875, 0.09189605712890625, 0.100982666015625, 0.11006927490234375, 0.1191558837890625, 0.12824249267578125, 0.1373291015625, 0.14641571044921875, 0.1555023193359375, 0.16458892822265625, 0.173675537109375, 0.18276214599609375, 0.1918487548828125, 0.20093536376953125, 0.21002197265625, 0.21910858154296875, 0.2281951904296875, 0.23728179931640625, 0.246368408203125, 0.25545501708984375, 0.2645416259765625, 0.27362823486328125, 0.28271484375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 6.0, 7.0, 6.0, 9.0, 24.0, 43.0, 31.0, 40.0, 63.0, 66.0, 106.0, 109.0, 121.0, 94.0, 77.0, 58.0, 38.0, 33.0, 17.0, 21.0, 10.0, 3.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.761994361877441, -15.422834396362305, -15.083675384521484, -14.744515419006348, -14.405355453491211, -14.066195487976074, -13.727036476135254, -13.387876510620117, -13.04871654510498, -12.709556579589844, -12.370397567749023, -12.031237602233887, -11.69207763671875, -11.352917671203613, -11.013758659362793, -10.674598693847656, -10.335439682006836, -9.9962797164917, -9.657120704650879, -9.317960739135742, -8.978800773620605, -8.639640808105469, -8.300481796264648, -7.961321830749512, -7.622161865234375, -7.2830023765563965, -6.94384241104126, -6.604682922363281, -6.2655229568481445, -5.926363468170166, -5.5872039794921875, -5.248044013977051, -4.908884525299072, -4.569725036621094, -4.230565071105957, -3.8914055824279785, -3.552245616912842, -3.2130861282348633, -2.8739264011383057, -2.534766674041748, -2.1956069469451904, -1.8564472198486328, -1.5172874927520752, -1.1781278848648071, -0.8389681577682495, -0.4998084306716919, -0.16064882278442383, 0.1785109043121338, 0.5176706314086914, 0.856830358505249, 1.1959900856018066, 1.5351496934890747, 1.8743094205856323, 2.2134690284729004, 2.552628755569458, 2.8917884826660156, 3.2309482097625732, 3.570107936859131, 3.9092676639556885, 4.248427391052246, 4.587586879730225, 4.926746845245361, 5.26590633392334, 5.605066299438477, 5.944225788116455]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 15.0, 11.0, 14.0, 18.0, 15.0, 19.0, 28.0, 24.0, 26.0, 19.0, 32.0, 39.0, 25.0, 34.0, 35.0, 36.0, 31.0, 47.0, 34.0, 41.0, 46.0, 36.0, 43.0, 52.0, 27.0, 32.0, 25.0, 28.0, 22.0, 22.0, 15.0, 16.0, 19.0, 16.0, 15.0, 10.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2714529037475586, -3.1733615398406982, -3.075270175933838, -2.9771788120269775, -2.879087448120117, -2.780996084213257, -2.6829047203063965, -2.5848135948181152, -2.486721992492676, -2.3886306285858154, -2.290539264678955, -2.1924479007720947, -2.0943565368652344, -1.996265172958374, -1.8981739282608032, -1.8000825643539429, -1.701991319656372, -1.6038999557495117, -1.5058085918426514, -1.407717227935791, -1.3096258640289307, -1.2115345001220703, -1.1134432554244995, -1.0153518915176392, -0.9172605276107788, -0.8191691637039185, -0.7210777997970581, -0.6229864954948425, -0.5248951315879822, -0.4268037676811218, -0.32871246337890625, -0.2306210994720459, -0.13252949714660645, -0.03443814814090729, 0.06365320086479187, 0.16174453496932983, 0.2598358988761902, 0.35792726278305054, 0.4560185670852661, 0.5541099309921265, 0.6522012948989868, 0.7502926588058472, 0.8483840227127075, 0.9464753270149231, 1.0445666313171387, 1.142657995223999, 1.2407493591308594, 1.3388407230377197, 1.43693208694458, 1.5350234508514404, 1.6331148147583008, 1.7312061786651611, 1.8292975425720215, 1.9273889064788818, 2.025480270385742, 2.1235713958740234, 2.221662998199463, 2.3197543621063232, 2.4178457260131836, 2.515937089920044, 2.6140284538269043, 2.7121198177337646, 2.810211181640625, 2.9083023071289062, 3.0063936710357666]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 10.0, 14.0, 11.0, 28.0, 45.0, 71.0, 123.0, 185.0, 299.0, 558.0, 967.0, 1699.0, 3090.0, 5594.0, 10329.0, 18542.0, 33287.0, 58317.0, 96273.0, 141888.0, 174180.0, 169834.0, 130860.0, 86237.0, 51181.0, 28795.0, 16042.0, 8801.0, 4974.0, 2699.0, 1570.0, 856.0, 508.0, 281.0, 188.0, 79.0, 56.0, 36.0, 12.0, 19.0, 12.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.48870849609375, -3.3719482421875, -3.25518798828125, -3.138427734375, -3.02166748046875, -2.9049072265625, -2.78814697265625, -2.67138671875, -2.55462646484375, -2.4378662109375, -2.32110595703125, -2.204345703125, -2.08758544921875, -1.9708251953125, -1.85406494140625, -1.7373046875, -1.62054443359375, -1.5037841796875, -1.38702392578125, -1.270263671875, -1.15350341796875, -1.0367431640625, -0.91998291015625, -0.80322265625, -0.68646240234375, -0.5697021484375, -0.45294189453125, -0.336181640625, -0.21942138671875, -0.1026611328125, 0.01409912109375, 0.130859375, 0.24761962890625, 0.3643798828125, 0.48114013671875, 0.597900390625, 0.71466064453125, 0.8314208984375, 0.94818115234375, 1.06494140625, 1.18170166015625, 1.2984619140625, 1.41522216796875, 1.531982421875, 1.64874267578125, 1.7655029296875, 1.88226318359375, 1.9990234375, 2.11578369140625, 2.2325439453125, 2.34930419921875, 2.466064453125, 2.58282470703125, 2.6995849609375, 2.81634521484375, 2.93310546875, 3.04986572265625, 3.1666259765625, 3.28338623046875, 3.400146484375, 3.51690673828125, 3.6336669921875, 3.75042724609375, 3.8671875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 6.0, 11.0, 10.0, 13.0, 18.0, 24.0, 25.0, 29.0, 24.0, 23.0, 31.0, 23.0, 29.0, 37.0, 44.0, 40.0, 35.0, 29.0, 31.0, 43.0, 44.0, 45.0, 42.0, 43.0, 47.0, 26.0, 22.0, 29.0, 26.0, 25.0, 18.0, 18.0, 10.0, 16.0, 12.0, 10.0, 9.0, 8.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.654296875, -3.544403076171875, -3.43450927734375, -3.324615478515625, -3.2147216796875, -3.104827880859375, -2.99493408203125, -2.885040283203125, -2.775146484375, -2.665252685546875, -2.55535888671875, -2.445465087890625, -2.3355712890625, -2.225677490234375, -2.11578369140625, -2.005889892578125, -1.89599609375, -1.786102294921875, -1.67620849609375, -1.566314697265625, -1.4564208984375, -1.346527099609375, -1.23663330078125, -1.126739501953125, -1.016845703125, -0.906951904296875, -0.79705810546875, -0.687164306640625, -0.5772705078125, -0.467376708984375, -0.35748291015625, -0.247589111328125, -0.1376953125, -0.027801513671875, 0.08209228515625, 0.191986083984375, 0.3018798828125, 0.411773681640625, 0.52166748046875, 0.631561279296875, 0.741455078125, 0.851348876953125, 0.96124267578125, 1.071136474609375, 1.1810302734375, 1.290924072265625, 1.40081787109375, 1.510711669921875, 1.62060546875, 1.730499267578125, 1.84039306640625, 1.950286865234375, 2.0601806640625, 2.170074462890625, 2.27996826171875, 2.389862060546875, 2.499755859375, 2.609649658203125, 2.71954345703125, 2.829437255859375, 2.9393310546875, 3.049224853515625, 3.15911865234375, 3.269012451171875, 3.37890625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 19.0, 23.0, 34.0, 39.0, 76.0, 86.0, 147.0, 243.0, 436.0, 799.0, 1436.0, 2774.0, 5245.0, 10056.0, 19264.0, 36707.0, 68123.0, 117276.0, 172693.0, 198573.0, 167392.0, 110618.0, 63877.0, 34548.0, 18036.0, 9518.0, 4781.0, 2532.0, 1344.0, 737.0, 434.0, 253.0, 132.0, 106.0, 58.0, 46.0, 23.0, 16.0, 13.0, 8.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.21484375, -4.080810546875, -3.94677734375, -3.812744140625, -3.6787109375, -3.544677734375, -3.41064453125, -3.276611328125, -3.142578125, -3.008544921875, -2.87451171875, -2.740478515625, -2.6064453125, -2.472412109375, -2.33837890625, -2.204345703125, -2.0703125, -1.936279296875, -1.80224609375, -1.668212890625, -1.5341796875, -1.400146484375, -1.26611328125, -1.132080078125, -0.998046875, -0.864013671875, -0.72998046875, -0.595947265625, -0.4619140625, -0.327880859375, -0.19384765625, -0.059814453125, 0.07421875, 0.208251953125, 0.34228515625, 0.476318359375, 0.6103515625, 0.744384765625, 0.87841796875, 1.012451171875, 1.146484375, 1.280517578125, 1.41455078125, 1.548583984375, 1.6826171875, 1.816650390625, 1.95068359375, 2.084716796875, 2.21875, 2.352783203125, 2.48681640625, 2.620849609375, 2.7548828125, 2.888916015625, 3.02294921875, 3.156982421875, 3.291015625, 3.425048828125, 3.55908203125, 3.693115234375, 3.8271484375, 3.961181640625, 4.09521484375, 4.229248046875, 4.36328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 13.0, 11.0, 14.0, 14.0, 17.0, 15.0, 18.0, 12.0, 21.0, 17.0, 27.0, 22.0, 32.0, 28.0, 32.0, 31.0, 38.0, 43.0, 46.0, 29.0, 42.0, 44.0, 34.0, 29.0, 34.0, 40.0, 27.0, 26.0, 21.0, 29.0, 24.0, 19.0, 22.0, 24.0, 19.0, 12.0, 12.0, 9.0, 5.0, 9.0, 9.0, 8.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.8515625, -1.79150390625, -1.7314453125, -1.67138671875, -1.611328125, -1.55126953125, -1.4912109375, -1.43115234375, -1.37109375, -1.31103515625, -1.2509765625, -1.19091796875, -1.130859375, -1.07080078125, -1.0107421875, -0.95068359375, -0.890625, -0.83056640625, -0.7705078125, -0.71044921875, -0.650390625, -0.59033203125, -0.5302734375, -0.47021484375, -0.41015625, -0.35009765625, -0.2900390625, -0.22998046875, -0.169921875, -0.10986328125, -0.0498046875, 0.01025390625, 0.0703125, 0.13037109375, 0.1904296875, 0.25048828125, 0.310546875, 0.37060546875, 0.4306640625, 0.49072265625, 0.55078125, 0.61083984375, 0.6708984375, 0.73095703125, 0.791015625, 0.85107421875, 0.9111328125, 0.97119140625, 1.03125, 1.09130859375, 1.1513671875, 1.21142578125, 1.271484375, 1.33154296875, 1.3916015625, 1.45166015625, 1.51171875, 1.57177734375, 1.6318359375, 1.69189453125, 1.751953125, 1.81201171875, 1.8720703125, 1.93212890625, 1.9921875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 9.0, 27.0, 21.0, 36.0, 48.0, 66.0, 92.0, 123.0, 200.0, 265.0, 381.0, 638.0, 1064.0, 1640.0, 3060.0, 5351.0, 10679.0, 21784.0, 45994.0, 98174.0, 186310.0, 252912.0, 203371.0, 111661.0, 53267.0, 24623.0, 11931.0, 6184.0, 3374.0, 1886.0, 1156.0, 778.0, 489.0, 279.0, 231.0, 133.0, 82.0, 73.0, 41.0, 33.0, 22.0, 24.0, 8.0, 10.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.4375, -2.367034912109375, -2.29656982421875, -2.226104736328125, -2.1556396484375, -2.085174560546875, -2.01470947265625, -1.944244384765625, -1.873779296875, -1.803314208984375, -1.73284912109375, -1.662384033203125, -1.5919189453125, -1.521453857421875, -1.45098876953125, -1.380523681640625, -1.31005859375, -1.239593505859375, -1.16912841796875, -1.098663330078125, -1.0281982421875, -0.957733154296875, -0.88726806640625, -0.816802978515625, -0.746337890625, -0.675872802734375, -0.60540771484375, -0.534942626953125, -0.4644775390625, -0.394012451171875, -0.32354736328125, -0.253082275390625, -0.1826171875, -0.112152099609375, -0.04168701171875, 0.028778076171875, 0.0992431640625, 0.169708251953125, 0.24017333984375, 0.310638427734375, 0.381103515625, 0.451568603515625, 0.52203369140625, 0.592498779296875, 0.6629638671875, 0.733428955078125, 0.80389404296875, 0.874359130859375, 0.94482421875, 1.015289306640625, 1.08575439453125, 1.156219482421875, 1.2266845703125, 1.297149658203125, 1.36761474609375, 1.438079833984375, 1.508544921875, 1.579010009765625, 1.64947509765625, 1.719940185546875, 1.7904052734375, 1.860870361328125, 1.93133544921875, 2.001800537109375, 2.072265625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 11.0, 9.0, 16.0, 24.0, 25.0, 27.0, 29.0, 43.0, 45.0, 62.0, 70.0, 58.0, 69.0, 76.0, 76.0, 69.0, 52.0, 44.0, 42.0, 32.0, 27.0, 22.0, 9.0, 15.0, 6.0, 6.0, 8.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015020370483398438, -0.00014432333409786224, -0.0001384429633617401, -0.00013256259262561798, -0.00012668222188949585, -0.00012080185115337372, -0.00011492148041725159, -0.00010904110968112946, -0.00010316073894500732, -9.728036820888519e-05, -9.139999747276306e-05, -8.551962673664093e-05, -7.96392560005188e-05, -7.375888526439667e-05, -6.787851452827454e-05, -6.19981437921524e-05, -5.6117773056030273e-05, -5.023740231990814e-05, -4.435703158378601e-05, -3.847666084766388e-05, -3.259629011154175e-05, -2.6715919375419617e-05, -2.0835548639297485e-05, -1.4955177903175354e-05, -9.074807167053223e-06, -3.1944364309310913e-06, 2.68593430519104e-06, 8.566305041313171e-06, 1.4446675777435303e-05, 2.0327046513557434e-05, 2.6207417249679565e-05, 3.20877879858017e-05, 3.796815872192383e-05, 4.384852945804596e-05, 4.972890019416809e-05, 5.560927093029022e-05, 6.148964166641235e-05, 6.737001240253448e-05, 7.325038313865662e-05, 7.913075387477875e-05, 8.501112461090088e-05, 9.089149534702301e-05, 9.677186608314514e-05, 0.00010265223681926727, 0.0001085326075553894, 0.00011441297829151154, 0.00012029334902763367, 0.0001261737197637558, 0.00013205409049987793, 0.00013793446123600006, 0.0001438148319721222, 0.00014969520270824432, 0.00015557557344436646, 0.00016145594418048859, 0.00016733631491661072, 0.00017321668565273285, 0.00017909705638885498, 0.0001849774271249771, 0.00019085779786109924, 0.00019673816859722137, 0.0002026185393333435, 0.00020849891006946564, 0.00021437928080558777, 0.0002202596515417099, 0.00022614002227783203]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 14.0, 25.0, 24.0, 37.0, 53.0, 88.0, 112.0, 150.0, 210.0, 306.0, 447.0, 676.0, 1008.0, 1543.0, 2480.0, 4061.0, 6585.0, 11231.0, 19460.0, 34195.0, 60789.0, 101152.0, 152154.0, 184638.0, 169267.0, 120976.0, 74575.0, 42931.0, 24184.0, 13873.0, 7993.0, 4791.0, 3014.0, 1909.0, 1167.0, 752.0, 496.0, 346.0, 226.0, 183.0, 120.0, 86.0, 68.0, 38.0, 36.0, 23.0, 21.0, 12.0, 10.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.6357421875, -1.5857086181640625, -1.535675048828125, -1.4856414794921875, -1.43560791015625, -1.3855743408203125, -1.335540771484375, -1.2855072021484375, -1.2354736328125, -1.1854400634765625, -1.135406494140625, -1.0853729248046875, -1.03533935546875, -0.9853057861328125, -0.935272216796875, -0.8852386474609375, -0.835205078125, -0.7851715087890625, -0.735137939453125, -0.6851043701171875, -0.63507080078125, -0.5850372314453125, -0.535003662109375, -0.4849700927734375, -0.4349365234375, -0.3849029541015625, -0.334869384765625, -0.2848358154296875, -0.23480224609375, -0.1847686767578125, -0.134735107421875, -0.0847015380859375, -0.03466796875, 0.0153656005859375, 0.065399169921875, 0.1154327392578125, 0.16546630859375, 0.2154998779296875, 0.265533447265625, 0.3155670166015625, 0.3656005859375, 0.4156341552734375, 0.465667724609375, 0.5157012939453125, 0.56573486328125, 0.6157684326171875, 0.665802001953125, 0.7158355712890625, 0.765869140625, 0.8159027099609375, 0.865936279296875, 0.9159698486328125, 0.96600341796875, 1.0160369873046875, 1.066070556640625, 1.1161041259765625, 1.1661376953125, 1.2161712646484375, 1.266204833984375, 1.3162384033203125, 1.36627197265625, 1.4163055419921875, 1.466339111328125, 1.5163726806640625, 1.56640625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 7.0, 12.0, 17.0, 10.0, 24.0, 20.0, 19.0, 30.0, 37.0, 32.0, 37.0, 50.0, 49.0, 51.0, 70.0, 43.0, 57.0, 45.0, 51.0, 48.0, 52.0, 42.0, 29.0, 26.0, 31.0, 20.0, 24.0, 12.0, 11.0, 7.0, 5.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.52490234375, -0.5104942321777344, -0.49608612060546875, -0.4816780090332031, -0.4672698974609375, -0.4528617858886719, -0.43845367431640625, -0.4240455627441406, -0.409637451171875, -0.3952293395996094, -0.38082122802734375, -0.3664131164550781, -0.3520050048828125, -0.3375968933105469, -0.32318878173828125, -0.3087806701660156, -0.29437255859375, -0.2799644470214844, -0.26555633544921875, -0.2511482238769531, -0.2367401123046875, -0.22233200073242188, -0.20792388916015625, -0.19351577758789062, -0.179107666015625, -0.16469955444335938, -0.15029144287109375, -0.13588333129882812, -0.1214752197265625, -0.10706710815429688, -0.09265899658203125, -0.07825088500976562, -0.0638427734375, -0.049434661865234375, -0.03502655029296875, -0.020618438720703125, -0.0062103271484375, 0.008197784423828125, 0.02260589599609375, 0.037014007568359375, 0.051422119140625, 0.06583023071289062, 0.08023834228515625, 0.09464645385742188, 0.1090545654296875, 0.12346267700195312, 0.13787078857421875, 0.15227890014648438, 0.16668701171875, 0.18109512329101562, 0.19550323486328125, 0.20991134643554688, 0.2243194580078125, 0.23872756958007812, 0.25313568115234375, 0.2675437927246094, 0.281951904296875, 0.2963600158691406, 0.31076812744140625, 0.3251762390136719, 0.3395843505859375, 0.3539924621582031, 0.36840057373046875, 0.3828086853027344, 0.397216796875]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 9.0, 4.0, 5.0, 9.0, 13.0, 27.0, 35.0, 47.0, 45.0, 77.0, 78.0, 100.0, 110.0, 129.0, 80.0, 70.0, 55.0, 29.0, 29.0, 17.0, 8.0, 9.0, 6.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.795585632324219, -15.452794075012207, -15.110002517700195, -14.767210006713867, -14.424418449401855, -14.081626892089844, -13.738835334777832, -13.39604377746582, -13.053252220153809, -12.710460662841797, -12.367669105529785, -12.024877548217773, -11.682085037231445, -11.339293479919434, -10.996501922607422, -10.65371036529541, -10.310918807983398, -9.968127250671387, -9.625335693359375, -9.282543182373047, -8.939751625061035, -8.596960067749023, -8.254168510437012, -7.911376953125, -7.568584442138672, -7.22579288482666, -6.88300085067749, -6.5402092933654785, -6.197417736053467, -5.854625701904297, -5.511834144592285, -5.169042587280273, -4.82625150680542, -4.483459949493408, -4.140667915344238, -3.7978763580322266, -3.455084800720215, -3.112293004989624, -2.769501209259033, -2.4267096519470215, -2.0839178562164307, -1.7411261796951294, -1.3983345031738281, -1.0555427074432373, -0.712751030921936, -0.36995935440063477, -0.027167558670043945, 0.3156239986419678, 0.6584157943725586, 1.0012074708938599, 1.3439991474151611, 1.686790943145752, 2.0295825004577637, 2.3723742961883545, 2.7151660919189453, 3.057957649230957, 3.400749444961548, 3.7435412406921387, 4.08633279800415, 4.42912483215332, 4.771916389465332, 5.114707946777344, 5.4574995040893555, 5.800291061401367, 6.143083095550537]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 10.0, 7.0, 11.0, 10.0, 11.0, 12.0, 15.0, 14.0, 19.0, 32.0, 28.0, 33.0, 25.0, 27.0, 29.0, 25.0, 39.0, 29.0, 33.0, 41.0, 45.0, 48.0, 45.0, 41.0, 36.0, 41.0, 32.0, 33.0, 33.0, 24.0, 23.0, 20.0, 23.0, 12.0, 14.0, 18.0, 7.0, 9.0, 15.0, 6.0, 10.0, 3.0, 8.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.327981472015381, -3.231311798095703, -3.1346421241760254, -3.0379726886749268, -2.941303014755249, -2.8446333408355713, -2.7479639053344727, -2.651294231414795, -2.554624557495117, -2.4579548835754395, -2.3612852096557617, -2.264615774154663, -2.1679461002349854, -2.0712764263153076, -1.9746068716049194, -1.8779373168945312, -1.7812676429748535, -1.6845979690551758, -1.5879284143447876, -1.4912588596343994, -1.3945891857147217, -1.297919511795044, -1.2012499570846558, -1.1045804023742676, -1.0079107284545898, -0.9112411141395569, -0.8145714998245239, -0.717901885509491, -0.621232271194458, -0.524562656879425, -0.4278930425643921, -0.33122342824935913, -0.23455405235290527, -0.13788443803787231, -0.041214823722839355, 0.055454790592193604, 0.15212440490722656, 0.24879401922225952, 0.3454636335372925, 0.44213324785232544, 0.5388028621673584, 0.6354724764823914, 0.7321420907974243, 0.8288117051124573, 0.9254813194274902, 1.022150993347168, 1.1188205480575562, 1.2154901027679443, 1.312159776687622, 1.4088294506072998, 1.505499005317688, 1.6021685600280762, 1.698838233947754, 1.7955079078674316, 1.8921774625778198, 1.988847017288208, 2.0855166912078857, 2.1821863651275635, 2.278855800628662, 2.37552547454834, 2.4721951484680176, 2.5688648223876953, 2.665534496307373, 2.7622039318084717, 2.8588736057281494]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 13.0, 16.0, 25.0, 29.0, 54.0, 94.0, 116.0, 215.0, 252.0, 438.0, 733.0, 1049.0, 1792.0, 3020.0, 4981.0, 8764.0, 16216.0, 30579.0, 63105.0, 142093.0, 357360.0, 929564.0, 1371347.0, 755804.0, 280866.0, 113867.0, 52218.0, 25952.0, 14038.0, 7786.0, 4572.0, 2704.0, 1683.0, 1040.0, 693.0, 415.0, 279.0, 174.0, 109.0, 72.0, 48.0, 39.0, 16.0, 15.0, 4.0, 8.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.82421875, -6.6197509765625, -6.415283203125, -6.2108154296875, -6.00634765625, -5.8018798828125, -5.597412109375, -5.3929443359375, -5.1884765625, -4.9840087890625, -4.779541015625, -4.5750732421875, -4.37060546875, -4.1661376953125, -3.961669921875, -3.7572021484375, -3.552734375, -3.3482666015625, -3.143798828125, -2.9393310546875, -2.73486328125, -2.5303955078125, -2.325927734375, -2.1214599609375, -1.9169921875, -1.7125244140625, -1.508056640625, -1.3035888671875, -1.09912109375, -0.8946533203125, -0.690185546875, -0.4857177734375, -0.28125, -0.0767822265625, 0.127685546875, 0.3321533203125, 0.53662109375, 0.7410888671875, 0.945556640625, 1.1500244140625, 1.3544921875, 1.5589599609375, 1.763427734375, 1.9678955078125, 2.17236328125, 2.3768310546875, 2.581298828125, 2.7857666015625, 2.990234375, 3.1947021484375, 3.399169921875, 3.6036376953125, 3.80810546875, 4.0125732421875, 4.217041015625, 4.4215087890625, 4.6259765625, 4.8304443359375, 5.034912109375, 5.2393798828125, 5.44384765625, 5.6483154296875, 5.852783203125, 6.0572509765625, 6.26171875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 10.0, 15.0, 11.0, 10.0, 7.0, 23.0, 22.0, 39.0, 31.0, 27.0, 31.0, 24.0, 24.0, 31.0, 44.0, 43.0, 38.0, 55.0, 27.0, 50.0, 49.0, 48.0, 34.0, 34.0, 36.0, 28.0, 25.0, 27.0, 26.0, 15.0, 17.0, 13.0, 18.0, 7.0, 5.0, 9.0, 10.0, 9.0, 3.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.261138916015625, -2.18243408203125, -2.103729248046875, -2.0250244140625, -1.946319580078125, -1.86761474609375, -1.788909912109375, -1.710205078125, -1.631500244140625, -1.55279541015625, -1.474090576171875, -1.3953857421875, -1.316680908203125, -1.23797607421875, -1.159271240234375, -1.08056640625, -1.001861572265625, -0.92315673828125, -0.844451904296875, -0.7657470703125, -0.687042236328125, -0.60833740234375, -0.529632568359375, -0.450927734375, -0.372222900390625, -0.29351806640625, -0.214813232421875, -0.1361083984375, -0.057403564453125, 0.02130126953125, 0.100006103515625, 0.1787109375, 0.257415771484375, 0.33612060546875, 0.414825439453125, 0.4935302734375, 0.572235107421875, 0.65093994140625, 0.729644775390625, 0.808349609375, 0.887054443359375, 0.96575927734375, 1.044464111328125, 1.1231689453125, 1.201873779296875, 1.28057861328125, 1.359283447265625, 1.43798828125, 1.516693115234375, 1.59539794921875, 1.674102783203125, 1.7528076171875, 1.831512451171875, 1.91021728515625, 1.988922119140625, 2.067626953125, 2.146331787109375, 2.22503662109375, 2.303741455078125, 2.3824462890625, 2.461151123046875, 2.53985595703125, 2.618560791015625, 2.697265625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 9.0, 14.0, 17.0, 30.0, 39.0, 63.0, 65.0, 137.0, 217.0, 330.0, 521.0, 736.0, 1184.0, 1833.0, 2878.0, 4675.0, 7796.0, 13230.0, 23271.0, 42048.0, 81759.0, 166861.0, 356853.0, 759733.0, 1165215.0, 809641.0, 384403.0, 179110.0, 86918.0, 45059.0, 24545.0, 13730.0, 8173.0, 4798.0, 2995.0, 1932.0, 1160.0, 820.0, 474.0, 345.0, 256.0, 137.0, 105.0, 60.0, 42.0, 28.0, 16.0, 13.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.3289794921875, -6.134521484375, -5.9400634765625, -5.74560546875, -5.5511474609375, -5.356689453125, -5.1622314453125, -4.9677734375, -4.7733154296875, -4.578857421875, -4.3843994140625, -4.18994140625, -3.9954833984375, -3.801025390625, -3.6065673828125, -3.412109375, -3.2176513671875, -3.023193359375, -2.8287353515625, -2.63427734375, -2.4398193359375, -2.245361328125, -2.0509033203125, -1.8564453125, -1.6619873046875, -1.467529296875, -1.2730712890625, -1.07861328125, -0.8841552734375, -0.689697265625, -0.4952392578125, -0.30078125, -0.1063232421875, 0.088134765625, 0.2825927734375, 0.47705078125, 0.6715087890625, 0.865966796875, 1.0604248046875, 1.2548828125, 1.4493408203125, 1.643798828125, 1.8382568359375, 2.03271484375, 2.2271728515625, 2.421630859375, 2.6160888671875, 2.810546875, 3.0050048828125, 3.199462890625, 3.3939208984375, 3.58837890625, 3.7828369140625, 3.977294921875, 4.1717529296875, 4.3662109375, 4.5606689453125, 4.755126953125, 4.9495849609375, 5.14404296875, 5.3385009765625, 5.532958984375, 5.7274169921875, 5.921875]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 6.0, 2.0, 7.0, 10.0, 11.0, 18.0, 20.0, 31.0, 33.0, 46.0, 58.0, 74.0, 106.0, 97.0, 157.0, 195.0, 233.0, 261.0, 289.0, 286.0, 306.0, 344.0, 274.0, 250.0, 194.0, 172.0, 138.0, 87.0, 67.0, 55.0, 49.0, 42.0, 31.0, 28.0, 15.0, 13.0, 12.0, 5.0, 10.0, 8.0, 5.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.586395263671875, -1.53021240234375, -1.474029541015625, -1.4178466796875, -1.361663818359375, -1.30548095703125, -1.249298095703125, -1.193115234375, -1.136932373046875, -1.08074951171875, -1.024566650390625, -0.9683837890625, -0.912200927734375, -0.85601806640625, -0.799835205078125, -0.74365234375, -0.687469482421875, -0.63128662109375, -0.575103759765625, -0.5189208984375, -0.462738037109375, -0.40655517578125, -0.350372314453125, -0.294189453125, -0.238006591796875, -0.18182373046875, -0.125640869140625, -0.0694580078125, -0.013275146484375, 0.04290771484375, 0.099090576171875, 0.1552734375, 0.211456298828125, 0.26763916015625, 0.323822021484375, 0.3800048828125, 0.436187744140625, 0.49237060546875, 0.548553466796875, 0.604736328125, 0.660919189453125, 0.71710205078125, 0.773284912109375, 0.8294677734375, 0.885650634765625, 0.94183349609375, 0.998016357421875, 1.05419921875, 1.110382080078125, 1.16656494140625, 1.222747802734375, 1.2789306640625, 1.335113525390625, 1.39129638671875, 1.447479248046875, 1.503662109375, 1.559844970703125, 1.61602783203125, 1.672210693359375, 1.7283935546875, 1.784576416015625, 1.84075927734375, 1.896942138671875, 1.953125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 10.0, 7.0, 15.0, 26.0, 22.0, 30.0, 49.0, 64.0, 62.0, 97.0, 116.0, 133.0, 105.0, 90.0, 56.0, 36.0, 20.0, 22.0, 16.0, 11.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.101999282836914, -13.726221084594727, -13.350443840026855, -12.974665641784668, -12.598888397216797, -12.22311019897461, -11.847332000732422, -11.471553802490234, -11.095776557922363, -10.719998359680176, -10.344221115112305, -9.968442916870117, -9.59266471862793, -9.216887474060059, -8.841109275817871, -8.46533203125, -8.089553833007812, -7.713776111602783, -7.337998390197754, -6.962220191955566, -6.586442470550537, -6.210664749145508, -5.83488655090332, -5.459108829498291, -5.083331108093262, -4.707553386688232, -4.331775665283203, -3.9559974670410156, -3.5802197456359863, -3.204442024230957, -2.8286640644073486, -2.4528861045837402, -2.077108383178711, -1.701330542564392, -1.3255527019500732, -0.9497748613357544, -0.5739970207214355, -0.1982191801071167, 0.17755866050720215, 0.5533366203308105, 0.9291143417358398, 1.3048921823501587, 1.6806700229644775, 2.056447982788086, 2.4322257041931152, 2.8080034255981445, 3.183781385421753, 3.5595593452453613, 3.9353370666503906, 4.31111478805542, 4.686892509460449, 5.062670707702637, 5.438448429107666, 5.814226150512695, 6.190004348754883, 6.565782070159912, 6.941559791564941, 7.317337512969971, 7.693115234375, 8.068893432617188, 8.444671630859375, 8.820448875427246, 9.196227073669434, 9.572004318237305, 9.947782516479492]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 11.0, 9.0, 16.0, 20.0, 15.0, 14.0, 19.0, 25.0, 20.0, 22.0, 26.0, 32.0, 46.0, 46.0, 39.0, 34.0, 47.0, 40.0, 44.0, 36.0, 46.0, 50.0, 35.0, 31.0, 31.0, 32.0, 26.0, 23.0, 19.0, 12.0, 12.0, 23.0, 18.0, 12.0, 11.0, 8.0, 13.0, 5.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.4018402099609375, -3.298731565475464, -3.1956229209899902, -3.0925140380859375, -2.989405393600464, -2.8862967491149902, -2.7831878662109375, -2.680079221725464, -2.5769705772399902, -2.4738619327545166, -2.370753288269043, -2.2676444053649902, -2.1645357608795166, -2.061427116394043, -1.9583183526992798, -1.8552095890045166, -1.752100944519043, -1.6489923000335693, -1.5458835363388062, -1.442774772644043, -1.3396661281585693, -1.2365574836730957, -1.1334487199783325, -1.0303399562835693, -0.9272313117980957, -0.8241226077079773, -0.7210139036178589, -0.6179051995277405, -0.5147964954376221, -0.41168779134750366, -0.30857908725738525, -0.20547038316726685, -0.10236191749572754, 0.0007467865943908691, 0.10385549068450928, 0.20696419477462769, 0.3100728988647461, 0.4131816029548645, 0.5162903070449829, 0.6193990111351013, 0.7225077152252197, 0.8256164193153381, 0.9287251234054565, 1.0318338871002197, 1.1349425315856934, 1.238051176071167, 1.3411599397659302, 1.4442687034606934, 1.547377347946167, 1.6504859924316406, 1.7535947561264038, 1.856703519821167, 1.9598121643066406, 2.0629208087921143, 2.166029453277588, 2.2691383361816406, 2.3722469806671143, 2.475355625152588, 2.5784645080566406, 2.6815731525421143, 2.784681797027588, 2.8877904415130615, 2.990899085998535, 3.094007968902588, 3.1971166133880615]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 19.0, 11.0, 11.0, 24.0, 42.0, 75.0, 82.0, 124.0, 205.0, 286.0, 422.0, 655.0, 998.0, 1609.0, 2759.0, 5683.0, 12671.0, 35532.0, 112483.0, 319738.0, 351549.0, 133306.0, 41429.0, 14897.0, 6152.0, 3036.0, 1659.0, 999.0, 648.0, 451.0, 293.0, 214.0, 145.0, 94.0, 54.0, 47.0, 33.0, 37.0, 15.0, 16.0, 6.0, 11.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.078125, -5.88861083984375, -5.6990966796875, -5.50958251953125, -5.320068359375, -5.13055419921875, -4.9410400390625, -4.75152587890625, -4.56201171875, -4.37249755859375, -4.1829833984375, -3.99346923828125, -3.803955078125, -3.61444091796875, -3.4249267578125, -3.23541259765625, -3.0458984375, -2.85638427734375, -2.6668701171875, -2.47735595703125, -2.287841796875, -2.09832763671875, -1.9088134765625, -1.71929931640625, -1.52978515625, -1.34027099609375, -1.1507568359375, -0.96124267578125, -0.771728515625, -0.58221435546875, -0.3927001953125, -0.20318603515625, -0.013671875, 0.17584228515625, 0.3653564453125, 0.55487060546875, 0.744384765625, 0.93389892578125, 1.1234130859375, 1.31292724609375, 1.50244140625, 1.69195556640625, 1.8814697265625, 2.07098388671875, 2.260498046875, 2.45001220703125, 2.6395263671875, 2.82904052734375, 3.0185546875, 3.20806884765625, 3.3975830078125, 3.58709716796875, 3.776611328125, 3.96612548828125, 4.1556396484375, 4.34515380859375, 4.53466796875, 4.72418212890625, 4.9136962890625, 5.10321044921875, 5.292724609375, 5.48223876953125, 5.6717529296875, 5.86126708984375, 6.05078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 1.0, 4.0, 4.0, 5.0, 8.0, 11.0, 6.0, 9.0, 10.0, 18.0, 27.0, 17.0, 31.0, 26.0, 35.0, 28.0, 31.0, 34.0, 35.0, 36.0, 42.0, 55.0, 46.0, 35.0, 48.0, 40.0, 39.0, 40.0, 28.0, 25.0, 26.0, 24.0, 25.0, 23.0, 20.0, 20.0, 16.0, 8.0, 17.0, 10.0, 11.0, 10.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.62109375, -3.507659912109375, -3.39422607421875, -3.280792236328125, -3.1673583984375, -3.053924560546875, -2.94049072265625, -2.827056884765625, -2.713623046875, -2.600189208984375, -2.48675537109375, -2.373321533203125, -2.2598876953125, -2.146453857421875, -2.03302001953125, -1.919586181640625, -1.80615234375, -1.692718505859375, -1.57928466796875, -1.465850830078125, -1.3524169921875, -1.238983154296875, -1.12554931640625, -1.012115478515625, -0.898681640625, -0.785247802734375, -0.67181396484375, -0.558380126953125, -0.4449462890625, -0.331512451171875, -0.21807861328125, -0.104644775390625, 0.0087890625, 0.122222900390625, 0.23565673828125, 0.349090576171875, 0.4625244140625, 0.575958251953125, 0.68939208984375, 0.802825927734375, 0.916259765625, 1.029693603515625, 1.14312744140625, 1.256561279296875, 1.3699951171875, 1.483428955078125, 1.59686279296875, 1.710296630859375, 1.82373046875, 1.937164306640625, 2.05059814453125, 2.164031982421875, 2.2774658203125, 2.390899658203125, 2.50433349609375, 2.617767333984375, 2.731201171875, 2.844635009765625, 2.95806884765625, 3.071502685546875, 3.1849365234375, 3.298370361328125, 3.41180419921875, 3.525238037109375, 3.638671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 4.0, 11.0, 8.0, 15.0, 12.0, 17.0, 30.0, 50.0, 50.0, 83.0, 101.0, 132.0, 169.0, 292.0, 429.0, 587.0, 838.0, 1340.0, 2138.0, 4410.0, 13175.0, 63857.0, 403338.0, 456575.0, 74806.0, 14596.0, 4877.0, 2238.0, 1370.0, 903.0, 599.0, 412.0, 292.0, 213.0, 151.0, 111.0, 80.0, 60.0, 42.0, 30.0, 22.0, 19.0, 18.0, 12.0, 9.0, 7.0, 3.0, 2.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-10.390625, -10.055908203125, -9.72119140625, -9.386474609375, -9.0517578125, -8.717041015625, -8.38232421875, -8.047607421875, -7.712890625, -7.378173828125, -7.04345703125, -6.708740234375, -6.3740234375, -6.039306640625, -5.70458984375, -5.369873046875, -5.03515625, -4.700439453125, -4.36572265625, -4.031005859375, -3.6962890625, -3.361572265625, -3.02685546875, -2.692138671875, -2.357421875, -2.022705078125, -1.68798828125, -1.353271484375, -1.0185546875, -0.683837890625, -0.34912109375, -0.014404296875, 0.3203125, 0.655029296875, 0.98974609375, 1.324462890625, 1.6591796875, 1.993896484375, 2.32861328125, 2.663330078125, 2.998046875, 3.332763671875, 3.66748046875, 4.002197265625, 4.3369140625, 4.671630859375, 5.00634765625, 5.341064453125, 5.67578125, 6.010498046875, 6.34521484375, 6.679931640625, 7.0146484375, 7.349365234375, 7.68408203125, 8.018798828125, 8.353515625, 8.688232421875, 9.02294921875, 9.357666015625, 9.6923828125, 10.027099609375, 10.36181640625, 10.696533203125, 11.03125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 7.0, 7.0, 10.0, 7.0, 5.0, 13.0, 11.0, 17.0, 17.0, 23.0, 23.0, 13.0, 25.0, 24.0, 25.0, 34.0, 44.0, 37.0, 46.0, 53.0, 47.0, 35.0, 36.0, 38.0, 32.0, 37.0, 43.0, 34.0, 40.0, 23.0, 28.0, 29.0, 23.0, 14.0, 15.0, 19.0, 12.0, 9.0, 6.0, 11.0, 13.0, 4.0, 3.0, 6.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.091796875, -2.026336669921875, -1.96087646484375, -1.895416259765625, -1.8299560546875, -1.764495849609375, -1.69903564453125, -1.633575439453125, -1.568115234375, -1.502655029296875, -1.43719482421875, -1.371734619140625, -1.3062744140625, -1.240814208984375, -1.17535400390625, -1.109893798828125, -1.04443359375, -0.978973388671875, -0.91351318359375, -0.848052978515625, -0.7825927734375, -0.717132568359375, -0.65167236328125, -0.586212158203125, -0.520751953125, -0.455291748046875, -0.38983154296875, -0.324371337890625, -0.2589111328125, -0.193450927734375, -0.12799072265625, -0.062530517578125, 0.0029296875, 0.068389892578125, 0.13385009765625, 0.199310302734375, 0.2647705078125, 0.330230712890625, 0.39569091796875, 0.461151123046875, 0.526611328125, 0.592071533203125, 0.65753173828125, 0.722991943359375, 0.7884521484375, 0.853912353515625, 0.91937255859375, 0.984832763671875, 1.05029296875, 1.115753173828125, 1.18121337890625, 1.246673583984375, 1.3121337890625, 1.377593994140625, 1.44305419921875, 1.508514404296875, 1.573974609375, 1.639434814453125, 1.70489501953125, 1.770355224609375, 1.8358154296875, 1.901275634765625, 1.96673583984375, 2.032196044921875, 2.09765625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 8.0, 6.0, 6.0, 5.0, 10.0, 22.0, 30.0, 45.0, 62.0, 104.0, 143.0, 228.0, 318.0, 554.0, 821.0, 1460.0, 2509.0, 4699.0, 10547.0, 32031.0, 143147.0, 530062.0, 243936.0, 49725.0, 14506.0, 6136.0, 2959.0, 1731.0, 1048.0, 620.0, 377.0, 236.0, 164.0, 101.0, 79.0, 38.0, 26.0, 24.0, 14.0, 11.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.53515625, -3.4073486328125, -3.279541015625, -3.1517333984375, -3.02392578125, -2.8961181640625, -2.768310546875, -2.6405029296875, -2.5126953125, -2.3848876953125, -2.257080078125, -2.1292724609375, -2.00146484375, -1.8736572265625, -1.745849609375, -1.6180419921875, -1.490234375, -1.3624267578125, -1.234619140625, -1.1068115234375, -0.97900390625, -0.8511962890625, -0.723388671875, -0.5955810546875, -0.4677734375, -0.3399658203125, -0.212158203125, -0.0843505859375, 0.04345703125, 0.1712646484375, 0.299072265625, 0.4268798828125, 0.5546875, 0.6824951171875, 0.810302734375, 0.9381103515625, 1.06591796875, 1.1937255859375, 1.321533203125, 1.4493408203125, 1.5771484375, 1.7049560546875, 1.832763671875, 1.9605712890625, 2.08837890625, 2.2161865234375, 2.343994140625, 2.4718017578125, 2.599609375, 2.7274169921875, 2.855224609375, 2.9830322265625, 3.11083984375, 3.2386474609375, 3.366455078125, 3.4942626953125, 3.6220703125, 3.7498779296875, 3.877685546875, 4.0054931640625, 4.13330078125, 4.2611083984375, 4.388916015625, 4.5167236328125, 4.64453125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 4.0, 2.0, 5.0, 2.0, 5.0, 9.0, 19.0, 31.0, 68.0, 100.0, 174.0, 199.0, 155.0, 100.0, 54.0, 29.0, 22.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014770030975341797, -0.00014081411063671112, -0.00013392791152000427, -0.00012704171240329742, -0.00012015551328659058, -0.00011326931416988373, -0.00010638311505317688, -9.949691593647003e-05, -9.261071681976318e-05, -8.572451770305634e-05, -7.883831858634949e-05, -7.195211946964264e-05, -6.506592035293579e-05, -5.817972123622894e-05, -5.1293522119522095e-05, -4.4407323002815247e-05, -3.75211238861084e-05, -3.063492476940155e-05, -2.3748725652694702e-05, -1.6862526535987854e-05, -9.976327419281006e-06, -3.0901283025741577e-06, 3.7960708141326904e-06, 1.0682269930839539e-05, 1.7568469047546387e-05, 2.4454668164253235e-05, 3.134086728096008e-05, 3.822706639766693e-05, 4.511326551437378e-05, 5.199946463108063e-05, 5.8885663747787476e-05, 6.577186286449432e-05, 7.265806198120117e-05, 7.954426109790802e-05, 8.643046021461487e-05, 9.331665933132172e-05, 0.00010020285844802856, 0.00010708905756473541, 0.00011397525668144226, 0.00012086145579814911, 0.00012774765491485596, 0.0001346338540315628, 0.00014152005314826965, 0.0001484062522649765, 0.00015529245138168335, 0.0001621786504983902, 0.00016906484961509705, 0.0001759510487318039, 0.00018283724784851074, 0.0001897234469652176, 0.00019660964608192444, 0.0002034958451986313, 0.00021038204431533813, 0.00021726824343204498, 0.00022415444254875183, 0.00023104064166545868, 0.00023792684078216553, 0.0002448130398988724, 0.0002516992390155792, 0.00025858543813228607, 0.0002654716372489929, 0.00027235783636569977, 0.0002792440354824066, 0.00028613023459911346, 0.0002930164337158203]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 15.0, 20.0, 19.0, 44.0, 74.0, 111.0, 125.0, 173.0, 233.0, 341.0, 434.0, 629.0, 871.0, 1222.0, 1640.0, 2257.0, 3433.0, 5900.0, 12124.0, 33001.0, 108060.0, 307665.0, 351398.0, 141473.0, 42978.0, 14975.0, 6715.0, 3740.0, 2480.0, 1778.0, 1252.0, 921.0, 689.0, 498.0, 371.0, 283.0, 180.0, 120.0, 84.0, 76.0, 46.0, 39.0, 14.0, 15.0, 9.0, 4.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.5546875, -2.4698486328125, -2.385009765625, -2.3001708984375, -2.21533203125, -2.1304931640625, -2.045654296875, -1.9608154296875, -1.8759765625, -1.7911376953125, -1.706298828125, -1.6214599609375, -1.53662109375, -1.4517822265625, -1.366943359375, -1.2821044921875, -1.197265625, -1.1124267578125, -1.027587890625, -0.9427490234375, -0.85791015625, -0.7730712890625, -0.688232421875, -0.6033935546875, -0.5185546875, -0.4337158203125, -0.348876953125, -0.2640380859375, -0.17919921875, -0.0943603515625, -0.009521484375, 0.0753173828125, 0.16015625, 0.2449951171875, 0.329833984375, 0.4146728515625, 0.49951171875, 0.5843505859375, 0.669189453125, 0.7540283203125, 0.8388671875, 0.9237060546875, 1.008544921875, 1.0933837890625, 1.17822265625, 1.2630615234375, 1.347900390625, 1.4327392578125, 1.517578125, 1.6024169921875, 1.687255859375, 1.7720947265625, 1.85693359375, 1.9417724609375, 2.026611328125, 2.1114501953125, 2.1962890625, 2.2811279296875, 2.365966796875, 2.4508056640625, 2.53564453125, 2.6204833984375, 2.705322265625, 2.7901611328125, 2.875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 6.0, 6.0, 14.0, 17.0, 28.0, 42.0, 62.0, 128.0, 163.0, 163.0, 118.0, 85.0, 66.0, 40.0, 15.0, 15.0, 10.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9342193603515625, -0.906036376953125, -0.8778533935546875, -0.84967041015625, -0.8214874267578125, -0.793304443359375, -0.7651214599609375, -0.7369384765625, -0.7087554931640625, -0.680572509765625, -0.6523895263671875, -0.62420654296875, -0.5960235595703125, -0.567840576171875, -0.5396575927734375, -0.511474609375, -0.4832916259765625, -0.455108642578125, -0.4269256591796875, -0.39874267578125, -0.3705596923828125, -0.342376708984375, -0.3141937255859375, -0.2860107421875, -0.2578277587890625, -0.229644775390625, -0.2014617919921875, -0.17327880859375, -0.1450958251953125, -0.116912841796875, -0.0887298583984375, -0.060546875, -0.0323638916015625, -0.004180908203125, 0.0240020751953125, 0.05218505859375, 0.0803680419921875, 0.108551025390625, 0.1367340087890625, 0.1649169921875, 0.1930999755859375, 0.221282958984375, 0.2494659423828125, 0.27764892578125, 0.3058319091796875, 0.334014892578125, 0.3621978759765625, 0.390380859375, 0.4185638427734375, 0.446746826171875, 0.4749298095703125, 0.50311279296875, 0.5312957763671875, 0.559478759765625, 0.5876617431640625, 0.6158447265625, 0.6440277099609375, 0.672210693359375, 0.7003936767578125, 0.72857666015625, 0.7567596435546875, 0.784942626953125, 0.8131256103515625, 0.84130859375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 16.0, 16.0, 21.0, 25.0, 47.0, 56.0, 65.0, 79.0, 124.0, 114.0, 112.0, 82.0, 85.0, 44.0, 24.0, 23.0, 16.0, 18.0, 7.0, 3.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.908937454223633, -13.542439460754395, -13.175941467285156, -12.809443473815918, -12.44294548034668, -12.076448440551758, -11.70995044708252, -11.343452453613281, -10.976954460144043, -10.610456466674805, -10.243958473205566, -9.877460479736328, -9.510963439941406, -9.144465446472168, -8.77796745300293, -8.411469459533691, -8.044971466064453, -7.678473472595215, -7.311975479125977, -6.9454779624938965, -6.578979969024658, -6.21248197555542, -5.84598445892334, -5.479486465454102, -5.112988471984863, -4.746490478515625, -4.379992485046387, -4.013494968414307, -3.6469969749450684, -3.28049898147583, -2.914001226425171, -2.5475034713745117, -2.1810054779052734, -1.8145076036453247, -1.448009729385376, -1.0815118551254272, -0.7150139808654785, -0.3485161066055298, 0.017981767654418945, 0.3844795227050781, 0.7509775161743164, 1.1174753904342651, 1.4839732646942139, 1.8504711389541626, 2.2169690132141113, 2.5834670066833496, 2.949964761734009, 3.316462516784668, 3.6829605102539062, 4.0494585037231445, 4.415956497192383, 4.782454013824463, 5.148952007293701, 5.5154500007629395, 5.8819475173950195, 6.248445510864258, 6.614943504333496, 6.981441497802734, 7.347939491271973, 7.714437007904053, 8.080934524536133, 8.447432518005371, 8.81393051147461, 9.180428504943848, 9.546926498413086]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 7.0, 7.0, 12.0, 16.0, 15.0, 24.0, 15.0, 21.0, 16.0, 24.0, 26.0, 27.0, 37.0, 45.0, 43.0, 38.0, 37.0, 39.0, 46.0, 45.0, 41.0, 45.0, 50.0, 38.0, 28.0, 26.0, 40.0, 18.0, 20.0, 19.0, 16.0, 12.0, 21.0, 18.0, 12.0, 10.0, 11.0, 3.0, 7.0, 5.0, 8.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.3787872791290283, -3.276102066040039, -3.173417091369629, -3.0707318782806396, -2.9680469036102295, -2.8653616905212402, -2.76267671585083, -2.659991502761841, -2.5573062896728516, -2.4546210765838623, -2.351936101913452, -2.249250888824463, -2.1465659141540527, -2.0438807010650635, -1.9411956071853638, -1.838510513305664, -1.735825538635254, -1.6331404447555542, -1.5304553508758545, -1.4277701377868652, -1.325085163116455, -1.2223999500274658, -1.1197148561477661, -1.0170297622680664, -0.9143446683883667, -0.811659574508667, -0.7089744806289673, -0.6062893271446228, -0.5036042332649231, -0.4009191393852234, -0.2982339859008789, -0.1955488920211792, -0.09286355972290039, 0.00982154905796051, 0.11250665783882141, 0.2151917815208435, 0.3178768754005432, 0.4205619692802429, 0.5232471227645874, 0.6259322166442871, 0.7286173105239868, 0.8313024044036865, 0.9339874982833862, 1.036672592163086, 1.1393578052520752, 1.2420427799224854, 1.3447279930114746, 1.4474130868911743, 1.550098180770874, 1.6527832746505737, 1.7554683685302734, 1.8581535816192627, 1.9608385562896729, 2.063523769378662, 2.1662087440490723, 2.2688939571380615, 2.371579170227051, 2.47426438331604, 2.57694935798645, 2.6796345710754395, 2.7823195457458496, 2.885004758834839, 2.987689971923828, 3.0903749465942383, 3.1930599212646484]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 8.0, 16.0, 18.0, 18.0, 45.0, 80.0, 104.0, 184.0, 313.0, 499.0, 977.0, 2166.0, 4796.0, 11960.0, 31953.0, 85951.0, 206862.0, 313321.0, 228329.0, 99760.0, 37080.0, 13875.0, 5466.0, 2323.0, 1062.0, 575.0, 292.0, 173.0, 122.0, 81.0, 43.0, 27.0, 20.0, 10.0, 13.0, 12.0, 9.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.859375, -7.61810302734375, -7.3768310546875, -7.13555908203125, -6.894287109375, -6.65301513671875, -6.4117431640625, -6.17047119140625, -5.92919921875, -5.68792724609375, -5.4466552734375, -5.20538330078125, -4.964111328125, -4.72283935546875, -4.4815673828125, -4.24029541015625, -3.9990234375, -3.75775146484375, -3.5164794921875, -3.27520751953125, -3.033935546875, -2.79266357421875, -2.5513916015625, -2.31011962890625, -2.06884765625, -1.82757568359375, -1.5863037109375, -1.34503173828125, -1.103759765625, -0.86248779296875, -0.6212158203125, -0.37994384765625, -0.138671875, 0.10260009765625, 0.3438720703125, 0.58514404296875, 0.826416015625, 1.06768798828125, 1.3089599609375, 1.55023193359375, 1.79150390625, 2.03277587890625, 2.2740478515625, 2.51531982421875, 2.756591796875, 2.99786376953125, 3.2391357421875, 3.48040771484375, 3.7216796875, 3.96295166015625, 4.2042236328125, 4.44549560546875, 4.686767578125, 4.92803955078125, 5.1693115234375, 5.41058349609375, 5.65185546875, 5.89312744140625, 6.1343994140625, 6.37567138671875, 6.616943359375, 6.85821533203125, 7.0994873046875, 7.34075927734375, 7.58203125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 0.0, 9.0, 6.0, 8.0, 8.0, 13.0, 20.0, 18.0, 19.0, 21.0, 23.0, 20.0, 27.0, 47.0, 29.0, 41.0, 44.0, 35.0, 47.0, 33.0, 35.0, 45.0, 40.0, 41.0, 43.0, 24.0, 38.0, 33.0, 27.0, 28.0, 27.0, 18.0, 21.0, 21.0, 12.0, 15.0, 16.0, 10.0, 4.0, 8.0, 3.0, 8.0, 8.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.666015625, -3.554962158203125, -3.44390869140625, -3.332855224609375, -3.2218017578125, -3.110748291015625, -2.99969482421875, -2.888641357421875, -2.777587890625, -2.666534423828125, -2.55548095703125, -2.444427490234375, -2.3333740234375, -2.222320556640625, -2.11126708984375, -2.000213623046875, -1.88916015625, -1.778106689453125, -1.66705322265625, -1.555999755859375, -1.4449462890625, -1.333892822265625, -1.22283935546875, -1.111785888671875, -1.000732421875, -0.889678955078125, -0.77862548828125, -0.667572021484375, -0.5565185546875, -0.445465087890625, -0.33441162109375, -0.223358154296875, -0.1123046875, -0.001251220703125, 0.10980224609375, 0.220855712890625, 0.3319091796875, 0.442962646484375, 0.55401611328125, 0.665069580078125, 0.776123046875, 0.887176513671875, 0.99822998046875, 1.109283447265625, 1.2203369140625, 1.331390380859375, 1.44244384765625, 1.553497314453125, 1.66455078125, 1.775604248046875, 1.88665771484375, 1.997711181640625, 2.1087646484375, 2.219818115234375, 2.33087158203125, 2.441925048828125, 2.552978515625, 2.664031982421875, 2.77508544921875, 2.886138916015625, 2.9971923828125, 3.108245849609375, 3.21929931640625, 3.330352783203125, 3.44140625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 8.0, 19.0, 29.0, 42.0, 69.0, 98.0, 104.0, 171.0, 290.0, 392.0, 626.0, 1005.0, 1548.0, 2761.0, 4631.0, 8008.0, 14098.0, 25776.0, 45792.0, 80002.0, 128032.0, 175111.0, 185226.0, 147244.0, 96989.0, 56972.0, 31628.0, 17552.0, 10135.0, 5670.0, 3296.0, 1944.0, 1183.0, 730.0, 453.0, 297.0, 197.0, 141.0, 98.0, 59.0, 40.0, 24.0, 14.0, 15.0, 9.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.30560302734375, -4.1580810546875, -4.01055908203125, -3.863037109375, -3.71551513671875, -3.5679931640625, -3.42047119140625, -3.27294921875, -3.12542724609375, -2.9779052734375, -2.83038330078125, -2.682861328125, -2.53533935546875, -2.3878173828125, -2.24029541015625, -2.0927734375, -1.94525146484375, -1.7977294921875, -1.65020751953125, -1.502685546875, -1.35516357421875, -1.2076416015625, -1.06011962890625, -0.91259765625, -0.76507568359375, -0.6175537109375, -0.47003173828125, -0.322509765625, -0.17498779296875, -0.0274658203125, 0.12005615234375, 0.267578125, 0.41510009765625, 0.5626220703125, 0.71014404296875, 0.857666015625, 1.00518798828125, 1.1527099609375, 1.30023193359375, 1.44775390625, 1.59527587890625, 1.7427978515625, 1.89031982421875, 2.037841796875, 2.18536376953125, 2.3328857421875, 2.48040771484375, 2.6279296875, 2.77545166015625, 2.9229736328125, 3.07049560546875, 3.218017578125, 3.36553955078125, 3.5130615234375, 3.66058349609375, 3.80810546875, 3.95562744140625, 4.1031494140625, 4.25067138671875, 4.398193359375, 4.54571533203125, 4.6932373046875, 4.84075927734375, 4.98828125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 4.0, 10.0, 5.0, 6.0, 12.0, 6.0, 14.0, 9.0, 15.0, 20.0, 17.0, 16.0, 28.0, 23.0, 35.0, 27.0, 31.0, 36.0, 37.0, 50.0, 38.0, 33.0, 38.0, 39.0, 42.0, 35.0, 40.0, 34.0, 28.0, 32.0, 29.0, 34.0, 33.0, 22.0, 12.0, 19.0, 16.0, 10.0, 18.0, 9.0, 10.0, 6.0, 8.0, 3.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9427490234375, -1.879638671875, -1.8165283203125, -1.75341796875, -1.6903076171875, -1.627197265625, -1.5640869140625, -1.5009765625, -1.4378662109375, -1.374755859375, -1.3116455078125, -1.24853515625, -1.1854248046875, -1.122314453125, -1.0592041015625, -0.99609375, -0.9329833984375, -0.869873046875, -0.8067626953125, -0.74365234375, -0.6805419921875, -0.617431640625, -0.5543212890625, -0.4912109375, -0.4281005859375, -0.364990234375, -0.3018798828125, -0.23876953125, -0.1756591796875, -0.112548828125, -0.0494384765625, 0.013671875, 0.0767822265625, 0.139892578125, 0.2030029296875, 0.26611328125, 0.3292236328125, 0.392333984375, 0.4554443359375, 0.5185546875, 0.5816650390625, 0.644775390625, 0.7078857421875, 0.77099609375, 0.8341064453125, 0.897216796875, 0.9603271484375, 1.0234375, 1.0865478515625, 1.149658203125, 1.2127685546875, 1.27587890625, 1.3389892578125, 1.402099609375, 1.4652099609375, 1.5283203125, 1.5914306640625, 1.654541015625, 1.7176513671875, 1.78076171875, 1.8438720703125, 1.906982421875, 1.9700927734375, 2.033203125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 13.0, 15.0, 32.0, 25.0, 55.0, 55.0, 120.0, 184.0, 248.0, 388.0, 550.0, 876.0, 1449.0, 2133.0, 3683.0, 6080.0, 10297.0, 17393.0, 30449.0, 52338.0, 88515.0, 137804.0, 179434.0, 177607.0, 132912.0, 84644.0, 50231.0, 29193.0, 16762.0, 9750.0, 5821.0, 3583.0, 2124.0, 1306.0, 847.0, 531.0, 370.0, 252.0, 151.0, 121.0, 74.0, 46.0, 20.0, 21.0, 13.0, 15.0, 9.0, 12.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8779296875, -1.8191680908203125, -1.760406494140625, -1.7016448974609375, -1.64288330078125, -1.5841217041015625, -1.525360107421875, -1.4665985107421875, -1.4078369140625, -1.3490753173828125, -1.290313720703125, -1.2315521240234375, -1.17279052734375, -1.1140289306640625, -1.055267333984375, -0.9965057373046875, -0.937744140625, -0.8789825439453125, -0.820220947265625, -0.7614593505859375, -0.70269775390625, -0.6439361572265625, -0.585174560546875, -0.5264129638671875, -0.4676513671875, -0.4088897705078125, -0.350128173828125, -0.2913665771484375, -0.23260498046875, -0.1738433837890625, -0.115081787109375, -0.0563201904296875, 0.00244140625, 0.0612030029296875, 0.119964599609375, 0.1787261962890625, 0.23748779296875, 0.2962493896484375, 0.355010986328125, 0.4137725830078125, 0.4725341796875, 0.5312957763671875, 0.590057373046875, 0.6488189697265625, 0.70758056640625, 0.7663421630859375, 0.825103759765625, 0.8838653564453125, 0.942626953125, 1.0013885498046875, 1.060150146484375, 1.1189117431640625, 1.17767333984375, 1.2364349365234375, 1.295196533203125, 1.3539581298828125, 1.4127197265625, 1.4714813232421875, 1.530242919921875, 1.5890045166015625, 1.64776611328125, 1.7065277099609375, 1.765289306640625, 1.8240509033203125, 1.8828125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 10.0, 5.0, 12.0, 18.0, 20.0, 16.0, 32.0, 44.0, 46.0, 58.0, 78.0, 84.0, 89.0, 90.0, 80.0, 78.0, 51.0, 48.0, 31.0, 25.0, 28.0, 10.0, 7.0, 9.0, 6.0, 7.0, 4.0, 6.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031113624572753906, -0.00030315108597278595, -0.00029516592621803284, -0.0002871807664632797, -0.0002791956067085266, -0.0002712104469537735, -0.0002632252871990204, -0.0002552401274442673, -0.00024725496768951416, -0.00023926980793476105, -0.00023128464818000793, -0.00022329948842525482, -0.0002153143286705017, -0.0002073291689157486, -0.00019934400916099548, -0.00019135884940624237, -0.00018337368965148926, -0.00017538852989673615, -0.00016740337014198303, -0.00015941821038722992, -0.0001514330506324768, -0.0001434478908777237, -0.00013546273112297058, -0.00012747757136821747, -0.00011949241161346436, -0.00011150725185871124, -0.00010352209210395813, -9.553693234920502e-05, -8.75517725944519e-05, -7.956661283969879e-05, -7.158145308494568e-05, -6.359629333019257e-05, -5.561113357543945e-05, -4.762597382068634e-05, -3.964081406593323e-05, -3.1655654311180115e-05, -2.3670494556427002e-05, -1.568533480167389e-05, -7.700175046920776e-06, 2.849847078323364e-07, 8.27014446258545e-06, 1.6255304217338562e-05, 2.4240463972091675e-05, 3.222562372684479e-05, 4.02107834815979e-05, 4.819594323635101e-05, 5.6181102991104126e-05, 6.416626274585724e-05, 7.215142250061035e-05, 8.013658225536346e-05, 8.812174201011658e-05, 9.610690176486969e-05, 0.0001040920615196228, 0.00011207722127437592, 0.00012006238102912903, 0.00012804754078388214, 0.00013603270053863525, 0.00014401786029338837, 0.00015200302004814148, 0.0001599881798028946, 0.0001679733395576477, 0.00017595849931240082, 0.00018394365906715393, 0.00019192881882190704, 0.00019991397857666016]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 5.0, 2.0, 7.0, 8.0, 3.0, 8.0, 18.0, 26.0, 48.0, 70.0, 95.0, 130.0, 219.0, 304.0, 482.0, 701.0, 1107.0, 1781.0, 3022.0, 5066.0, 8376.0, 15192.0, 26623.0, 48199.0, 87002.0, 142755.0, 194264.0, 190003.0, 136457.0, 81662.0, 45184.0, 25384.0, 13913.0, 8023.0, 4604.0, 2832.0, 1738.0, 1104.0, 751.0, 437.0, 329.0, 201.0, 136.0, 89.0, 64.0, 47.0, 41.0, 16.0, 12.0, 11.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8515625, -1.78973388671875, -1.7279052734375, -1.66607666015625, -1.604248046875, -1.54241943359375, -1.4805908203125, -1.41876220703125, -1.35693359375, -1.29510498046875, -1.2332763671875, -1.17144775390625, -1.109619140625, -1.04779052734375, -0.9859619140625, -0.92413330078125, -0.8623046875, -0.80047607421875, -0.7386474609375, -0.67681884765625, -0.614990234375, -0.55316162109375, -0.4913330078125, -0.42950439453125, -0.36767578125, -0.30584716796875, -0.2440185546875, -0.18218994140625, -0.120361328125, -0.05853271484375, 0.0032958984375, 0.06512451171875, 0.126953125, 0.18878173828125, 0.2506103515625, 0.31243896484375, 0.374267578125, 0.43609619140625, 0.4979248046875, 0.55975341796875, 0.62158203125, 0.68341064453125, 0.7452392578125, 0.80706787109375, 0.868896484375, 0.93072509765625, 0.9925537109375, 1.05438232421875, 1.1162109375, 1.17803955078125, 1.2398681640625, 1.30169677734375, 1.363525390625, 1.42535400390625, 1.4871826171875, 1.54901123046875, 1.61083984375, 1.67266845703125, 1.7344970703125, 1.79632568359375, 1.858154296875, 1.91998291015625, 1.9818115234375, 2.04364013671875, 2.10546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 7.0, 8.0, 9.0, 13.0, 13.0, 13.0, 14.0, 16.0, 24.0, 32.0, 32.0, 37.0, 30.0, 35.0, 52.0, 40.0, 41.0, 50.0, 48.0, 58.0, 57.0, 32.0, 44.0, 45.0, 35.0, 34.0, 28.0, 13.0, 23.0, 14.0, 11.0, 14.0, 14.0, 10.0, 5.0, 6.0, 4.0, 1.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.5068359375, -0.4926567077636719, -0.47847747802734375, -0.4642982482910156, -0.4501190185546875, -0.4359397888183594, -0.42176055908203125, -0.4075813293457031, -0.393402099609375, -0.3792228698730469, -0.36504364013671875, -0.3508644104003906, -0.3366851806640625, -0.3225059509277344, -0.30832672119140625, -0.2941474914550781, -0.27996826171875, -0.2657890319824219, -0.25160980224609375, -0.23743057250976562, -0.2232513427734375, -0.20907211303710938, -0.19489288330078125, -0.18071365356445312, -0.166534423828125, -0.15235519409179688, -0.13817596435546875, -0.12399673461914062, -0.1098175048828125, -0.09563827514648438, -0.08145904541015625, -0.06727981567382812, -0.0531005859375, -0.038921356201171875, -0.02474212646484375, -0.010562896728515625, 0.0036163330078125, 0.017795562744140625, 0.03197479248046875, 0.046154022216796875, 0.060333251953125, 0.07451248168945312, 0.08869171142578125, 0.10287094116210938, 0.1170501708984375, 0.13122940063476562, 0.14540863037109375, 0.15958786010742188, 0.17376708984375, 0.18794631958007812, 0.20212554931640625, 0.21630477905273438, 0.2304840087890625, 0.24466323852539062, 0.25884246826171875, 0.2730216979980469, 0.287200927734375, 0.3013801574707031, 0.31555938720703125, 0.3297386169433594, 0.3439178466796875, 0.3580970764160156, 0.37227630615234375, 0.3864555358886719, 0.400634765625]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 3.0, 4.0, 5.0, 7.0, 16.0, 16.0, 21.0, 21.0, 37.0, 49.0, 56.0, 75.0, 95.0, 124.0, 115.0, 103.0, 75.0, 62.0, 41.0, 23.0, 20.0, 16.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.230144500732422, -13.869439125061035, -13.508734703063965, -13.148029327392578, -12.787324905395508, -12.426619529724121, -12.065914154052734, -11.705209732055664, -11.344504356384277, -10.98379898071289, -10.62309455871582, -10.262389183044434, -9.901684761047363, -9.540979385375977, -9.180274963378906, -8.81956958770752, -8.458864212036133, -8.098158836364746, -7.737454414367676, -7.376749038696289, -7.0160441398620605, -6.655339241027832, -6.2946343421936035, -5.933929443359375, -5.573225021362305, -5.212520122528076, -4.851815223693848, -4.491109848022461, -4.130404949188232, -3.769700050354004, -3.4089951515197754, -3.0482900142669678, -2.68758487701416, -2.3268799781799316, -1.966174840927124, -1.6054699420928955, -1.2447649240493774, -0.8840599060058594, -0.5233550071716309, -0.16264986991882324, 0.19805502891540527, 0.5587600469589233, 0.9194650053977966, 1.28016996383667, 1.640874981880188, 2.001579999923706, 2.3622848987579346, 2.722990036010742, 3.0836949348449707, 3.444399833679199, 3.805104970932007, 4.165809631347656, 4.526515007019043, 4.8872199058532715, 5.2479248046875, 5.608630180358887, 5.969334602355957, 6.3300395011901855, 6.690744400024414, 7.051449775695801, 7.412154674530029, 7.772859573364258, 8.133563995361328, 8.494269371032715, 8.854974746704102]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 9.0, 7.0, 6.0, 9.0, 11.0, 16.0, 15.0, 20.0, 25.0, 23.0, 19.0, 39.0, 36.0, 31.0, 41.0, 32.0, 39.0, 44.0, 41.0, 37.0, 48.0, 48.0, 46.0, 43.0, 39.0, 29.0, 25.0, 28.0, 28.0, 25.0, 25.0, 21.0, 18.0, 16.0, 11.0, 13.0, 7.0, 11.0, 7.0, 6.0, 7.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.568134069442749, -3.462757110595703, -3.3573801517486572, -3.2520031929016113, -3.1466259956359863, -3.0412490367889404, -2.9358720779418945, -2.8304951190948486, -2.7251181602478027, -2.619741201400757, -2.514364242553711, -2.408987045288086, -2.30361008644104, -2.198233127593994, -2.0928561687469482, -1.9874792098999023, -1.8821020126342773, -1.7767250537872314, -1.671347975730896, -1.56597101688385, -1.4605939388275146, -1.3552169799804688, -1.2498400211334229, -1.144463062286377, -1.0390859842300415, -0.9337089657783508, -0.8283319473266602, -0.7229549884796143, -0.6175779700279236, -0.5122009515762329, -0.406823992729187, -0.30144697427749634, -0.19607019424438477, -0.09069319069385529, 0.014683812856674194, 0.12006080150604248, 0.22543781995773315, 0.33081483840942383, 0.4361917972564697, 0.5415688157081604, 0.6469458341598511, 0.7523228526115417, 0.8576998710632324, 0.9630768299102783, 1.0684537887573242, 1.1738308668136597, 1.2792078256607056, 1.384584903717041, 1.489961862564087, 1.5953388214111328, 1.7007158994674683, 1.8060928583145142, 1.9114699363708496, 2.0168468952178955, 2.1222238540649414, 2.2276008129119873, 2.332977771759033, 2.438354730606079, 2.543731689453125, 2.64910888671875, 2.754485845565796, 2.859862804412842, 2.9652397632598877, 3.0706167221069336, 3.1759939193725586]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 9.0, 3.0, 11.0, 9.0, 8.0, 23.0, 34.0, 59.0, 82.0, 115.0, 233.0, 316.0, 559.0, 1038.0, 1756.0, 3485.0, 6567.0, 13468.0, 29103.0, 68296.0, 184543.0, 588295.0, 1542454.0, 1181063.0, 363582.0, 119565.0, 47219.0, 21063.0, 10033.0, 5162.0, 2721.0, 1448.0, 793.0, 482.0, 260.0, 170.0, 88.0, 58.0, 48.0, 33.0, 14.0, 10.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.828125, -9.56109619140625, -9.2940673828125, -9.02703857421875, -8.760009765625, -8.49298095703125, -8.2259521484375, -7.95892333984375, -7.69189453125, -7.42486572265625, -7.1578369140625, -6.89080810546875, -6.623779296875, -6.35675048828125, -6.0897216796875, -5.82269287109375, -5.5556640625, -5.28863525390625, -5.0216064453125, -4.75457763671875, -4.487548828125, -4.22052001953125, -3.9534912109375, -3.68646240234375, -3.41943359375, -3.15240478515625, -2.8853759765625, -2.61834716796875, -2.351318359375, -2.08428955078125, -1.8172607421875, -1.55023193359375, -1.283203125, -1.01617431640625, -0.7491455078125, -0.48211669921875, -0.215087890625, 0.05194091796875, 0.3189697265625, 0.58599853515625, 0.85302734375, 1.12005615234375, 1.3870849609375, 1.65411376953125, 1.921142578125, 2.18817138671875, 2.4552001953125, 2.72222900390625, 2.9892578125, 3.25628662109375, 3.5233154296875, 3.79034423828125, 4.057373046875, 4.32440185546875, 4.5914306640625, 4.85845947265625, 5.12548828125, 5.39251708984375, 5.6595458984375, 5.92657470703125, 6.193603515625, 6.46063232421875, 6.7276611328125, 6.99468994140625, 7.26171875]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 12.0, 10.0, 10.0, 6.0, 12.0, 17.0, 20.0, 24.0, 26.0, 28.0, 37.0, 24.0, 19.0, 45.0, 33.0, 34.0, 53.0, 52.0, 46.0, 48.0, 33.0, 34.0, 39.0, 32.0, 45.0, 33.0, 31.0, 25.0, 26.0, 33.0, 11.0, 22.0, 16.0, 11.0, 10.0, 10.0, 11.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.830078125, -2.7470703125, -2.6640625, -2.5810546875, -2.498046875, -2.4150390625, -2.33203125, -2.2490234375, -2.166015625, -2.0830078125, -2.0, -1.9169921875, -1.833984375, -1.7509765625, -1.66796875, -1.5849609375, -1.501953125, -1.4189453125, -1.3359375, -1.2529296875, -1.169921875, -1.0869140625, -1.00390625, -0.9208984375, -0.837890625, -0.7548828125, -0.671875, -0.5888671875, -0.505859375, -0.4228515625, -0.33984375, -0.2568359375, -0.173828125, -0.0908203125, -0.0078125, 0.0751953125, 0.158203125, 0.2412109375, 0.32421875, 0.4072265625, 0.490234375, 0.5732421875, 0.65625, 0.7392578125, 0.822265625, 0.9052734375, 0.98828125, 1.0712890625, 1.154296875, 1.2373046875, 1.3203125, 1.4033203125, 1.486328125, 1.5693359375, 1.65234375, 1.7353515625, 1.818359375, 1.9013671875, 1.984375, 2.0673828125, 2.150390625, 2.2333984375, 2.31640625, 2.3994140625, 2.482421875]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 17.0, 23.0, 38.0, 70.0, 79.0, 149.0, 176.0, 289.0, 455.0, 641.0, 938.0, 1443.0, 2120.0, 3450.0, 5529.0, 8960.0, 14977.0, 25365.0, 45688.0, 83755.0, 162684.0, 327882.0, 661097.0, 1070692.0, 861286.0, 446648.0, 218567.0, 111505.0, 58797.0, 32582.0, 18614.0, 11028.0, 6664.0, 4163.0, 2688.0, 1692.0, 1199.0, 777.0, 522.0, 344.0, 223.0, 128.0, 99.0, 93.0, 48.0, 28.0, 17.0, 14.0, 12.0, 8.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.0859375, -5.89404296875, -5.7021484375, -5.51025390625, -5.318359375, -5.12646484375, -4.9345703125, -4.74267578125, -4.55078125, -4.35888671875, -4.1669921875, -3.97509765625, -3.783203125, -3.59130859375, -3.3994140625, -3.20751953125, -3.015625, -2.82373046875, -2.6318359375, -2.43994140625, -2.248046875, -2.05615234375, -1.8642578125, -1.67236328125, -1.48046875, -1.28857421875, -1.0966796875, -0.90478515625, -0.712890625, -0.52099609375, -0.3291015625, -0.13720703125, 0.0546875, 0.24658203125, 0.4384765625, 0.63037109375, 0.822265625, 1.01416015625, 1.2060546875, 1.39794921875, 1.58984375, 1.78173828125, 1.9736328125, 2.16552734375, 2.357421875, 2.54931640625, 2.7412109375, 2.93310546875, 3.125, 3.31689453125, 3.5087890625, 3.70068359375, 3.892578125, 4.08447265625, 4.2763671875, 4.46826171875, 4.66015625, 4.85205078125, 5.0439453125, 5.23583984375, 5.427734375, 5.61962890625, 5.8115234375, 6.00341796875, 6.1953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 1.0, 5.0, 5.0, 7.0, 17.0, 16.0, 18.0, 26.0, 48.0, 56.0, 75.0, 108.0, 112.0, 149.0, 204.0, 266.0, 296.0, 361.0, 385.0, 386.0, 334.0, 261.0, 224.0, 179.0, 120.0, 99.0, 81.0, 62.0, 42.0, 30.0, 23.0, 21.0, 13.0, 14.0, 5.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9697265625, -1.8986663818359375, -1.827606201171875, -1.7565460205078125, -1.68548583984375, -1.6144256591796875, -1.543365478515625, -1.4723052978515625, -1.4012451171875, -1.3301849365234375, -1.259124755859375, -1.1880645751953125, -1.11700439453125, -1.0459442138671875, -0.974884033203125, -0.9038238525390625, -0.832763671875, -0.7617034912109375, -0.690643310546875, -0.6195831298828125, -0.54852294921875, -0.4774627685546875, -0.406402587890625, -0.3353424072265625, -0.2642822265625, -0.1932220458984375, -0.122161865234375, -0.0511016845703125, 0.01995849609375, 0.0910186767578125, 0.162078857421875, 0.2331390380859375, 0.30419921875, 0.3752593994140625, 0.446319580078125, 0.5173797607421875, 0.58843994140625, 0.6595001220703125, 0.730560302734375, 0.8016204833984375, 0.8726806640625, 0.9437408447265625, 1.014801025390625, 1.0858612060546875, 1.15692138671875, 1.2279815673828125, 1.299041748046875, 1.3701019287109375, 1.441162109375, 1.5122222900390625, 1.583282470703125, 1.6543426513671875, 1.72540283203125, 1.7964630126953125, 1.867523193359375, 1.9385833740234375, 2.0096435546875, 2.0807037353515625, 2.151763916015625, 2.2228240966796875, 2.29388427734375, 2.3649444580078125, 2.436004638671875, 2.5070648193359375, 2.578125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 8.0, 4.0, 0.0, 7.0, 12.0, 11.0, 17.0, 16.0, 20.0, 42.0, 36.0, 52.0, 55.0, 73.0, 94.0, 93.0, 84.0, 86.0, 67.0, 59.0, 46.0, 38.0, 22.0, 22.0, 20.0, 8.0, 5.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.97739315032959, -10.66610336303711, -10.354814529418945, -10.043524742126465, -9.732234954833984, -9.42094612121582, -9.10965633392334, -8.79836654663086, -8.487077713012695, -8.175787925720215, -7.864498615264893, -7.55320930480957, -7.24191951751709, -6.930630207061768, -6.619340896606445, -6.308051109313965, -5.996761322021484, -5.685472011566162, -5.374182224273682, -5.062892913818359, -4.751603126525879, -4.440313816070557, -4.129024505615234, -3.817734956741333, -3.5064454078674316, -3.1951558589935303, -2.883866310119629, -2.5725769996643066, -2.2612874507904053, -1.949997901916504, -1.638708472251892, -1.3274190425872803, -1.0161304473876953, -0.7048409581184387, -0.39355146884918213, -0.08226197957992554, 0.22902750968933105, 0.5403170585632324, 0.8516064882278442, 1.162895917892456, 1.4741854667663574, 1.7854750156402588, 2.09676456451416, 2.4080538749694824, 2.719343423843384, 3.030632972717285, 3.3419222831726074, 3.653211832046509, 3.96450138092041, 4.275790691375732, 4.587080478668213, 4.898369789123535, 5.209659576416016, 5.520948886871338, 5.83223819732666, 6.143527984619141, 6.454817295074463, 6.766106605529785, 7.077396392822266, 7.388685703277588, 7.69997501373291, 8.01126480102539, 8.322554588317871, 8.633843421936035, 8.945133209228516]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 11.0, 13.0, 6.0, 18.0, 15.0, 30.0, 27.0, 32.0, 32.0, 36.0, 36.0, 35.0, 36.0, 38.0, 36.0, 36.0, 45.0, 48.0, 35.0, 36.0, 50.0, 35.0, 37.0, 28.0, 37.0, 24.0, 20.0, 28.0, 26.0, 14.0, 16.0, 10.0, 12.0, 10.0, 6.0, 4.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7475574016571045, -3.6351704597473145, -3.5227832794189453, -3.4103963375091553, -3.2980093955993652, -3.185622215270996, -3.073235273361206, -2.960848331451416, -2.848461151123047, -2.736074209213257, -2.6236870288848877, -2.5113000869750977, -2.3989131450653076, -2.2865259647369385, -2.1741390228271484, -2.0617518424987793, -1.9493650197982788, -1.8369779586791992, -1.7245910167694092, -1.6122039556503296, -1.49981689453125, -1.38742995262146, -1.2750428915023804, -1.1626558303833008, -1.0502688884735107, -0.9378818869590759, -0.8254948258399963, -0.7131078243255615, -0.6007207632064819, -0.4883337616920471, -0.3759467601776123, -0.2635596990585327, -0.15117263793945312, -0.03878561407327652, 0.07360140979290009, 0.1859884262084961, 0.2983754575252533, 0.4107624888420105, 0.5231494903564453, 0.6355365514755249, 0.7479235529899597, 0.8603105545043945, 0.9726976156234741, 1.0850846767425537, 1.1974716186523438, 1.3098586797714233, 1.422245740890503, 1.534632682800293, 1.6470197439193726, 1.7594068050384521, 1.8717937469482422, 1.9841808080673218, 2.0965678691864014, 2.2089548110961914, 2.3213419914245605, 2.4337289333343506, 2.5461158752441406, 2.6585028171539307, 2.7708899974823, 2.88327693939209, 2.99566388130188, 3.108051061630249, 3.220438003540039, 3.332825183868408, 3.4452121257781982]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 6.0, 10.0, 17.0, 28.0, 28.0, 41.0, 56.0, 105.0, 152.0, 218.0, 370.0, 632.0, 1127.0, 2162.0, 4173.0, 9078.0, 21074.0, 51938.0, 129165.0, 266679.0, 293260.0, 156473.0, 64576.0, 25832.0, 10858.0, 4887.0, 2421.0, 1264.0, 696.0, 430.0, 269.0, 173.0, 111.0, 71.0, 51.0, 42.0, 35.0, 14.0, 12.0, 6.0, 3.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.713134765625, -4.57080078125, -4.428466796875, -4.2861328125, -4.143798828125, -4.00146484375, -3.859130859375, -3.716796875, -3.574462890625, -3.43212890625, -3.289794921875, -3.1474609375, -3.005126953125, -2.86279296875, -2.720458984375, -2.578125, -2.435791015625, -2.29345703125, -2.151123046875, -2.0087890625, -1.866455078125, -1.72412109375, -1.581787109375, -1.439453125, -1.297119140625, -1.15478515625, -1.012451171875, -0.8701171875, -0.727783203125, -0.58544921875, -0.443115234375, -0.30078125, -0.158447265625, -0.01611328125, 0.126220703125, 0.2685546875, 0.410888671875, 0.55322265625, 0.695556640625, 0.837890625, 0.980224609375, 1.12255859375, 1.264892578125, 1.4072265625, 1.549560546875, 1.69189453125, 1.834228515625, 1.9765625, 2.118896484375, 2.26123046875, 2.403564453125, 2.5458984375, 2.688232421875, 2.83056640625, 2.972900390625, 3.115234375, 3.257568359375, 3.39990234375, 3.542236328125, 3.6845703125, 3.826904296875, 3.96923828125, 4.111572265625, 4.25390625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 17.0, 15.0, 16.0, 15.0, 22.0, 19.0, 28.0, 22.0, 35.0, 42.0, 35.0, 35.0, 35.0, 43.0, 44.0, 50.0, 41.0, 45.0, 36.0, 35.0, 44.0, 33.0, 31.0, 41.0, 25.0, 28.0, 24.0, 22.0, 23.0, 12.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.98114013671875, -3.8529052734375, -3.72467041015625, -3.596435546875, -3.46820068359375, -3.3399658203125, -3.21173095703125, -3.08349609375, -2.95526123046875, -2.8270263671875, -2.69879150390625, -2.570556640625, -2.44232177734375, -2.3140869140625, -2.18585205078125, -2.0576171875, -1.92938232421875, -1.8011474609375, -1.67291259765625, -1.544677734375, -1.41644287109375, -1.2882080078125, -1.15997314453125, -1.03173828125, -0.90350341796875, -0.7752685546875, -0.64703369140625, -0.518798828125, -0.39056396484375, -0.2623291015625, -0.13409423828125, -0.005859375, 0.12237548828125, 0.2506103515625, 0.37884521484375, 0.507080078125, 0.63531494140625, 0.7635498046875, 0.89178466796875, 1.02001953125, 1.14825439453125, 1.2764892578125, 1.40472412109375, 1.532958984375, 1.66119384765625, 1.7894287109375, 1.91766357421875, 2.0458984375, 2.17413330078125, 2.3023681640625, 2.43060302734375, 2.558837890625, 2.68707275390625, 2.8153076171875, 2.94354248046875, 3.07177734375, 3.20001220703125, 3.3282470703125, 3.45648193359375, 3.584716796875, 3.71295166015625, 3.8411865234375, 3.96942138671875, 4.09765625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 7.0, 7.0, 18.0, 22.0, 24.0, 37.0, 63.0, 63.0, 100.0, 143.0, 198.0, 272.0, 444.0, 680.0, 997.0, 1678.0, 2810.0, 4778.0, 9095.0, 17394.0, 35275.0, 72610.0, 146892.0, 248566.0, 236627.0, 134408.0, 66748.0, 32507.0, 16047.0, 8477.0, 4530.0, 2569.0, 1567.0, 917.0, 594.0, 429.0, 293.0, 185.0, 125.0, 100.0, 71.0, 52.0, 39.0, 23.0, 28.0, 9.0, 10.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.0, -3.874755859375, -3.74951171875, -3.624267578125, -3.4990234375, -3.373779296875, -3.24853515625, -3.123291015625, -2.998046875, -2.872802734375, -2.74755859375, -2.622314453125, -2.4970703125, -2.371826171875, -2.24658203125, -2.121337890625, -1.99609375, -1.870849609375, -1.74560546875, -1.620361328125, -1.4951171875, -1.369873046875, -1.24462890625, -1.119384765625, -0.994140625, -0.868896484375, -0.74365234375, -0.618408203125, -0.4931640625, -0.367919921875, -0.24267578125, -0.117431640625, 0.0078125, 0.133056640625, 0.25830078125, 0.383544921875, 0.5087890625, 0.634033203125, 0.75927734375, 0.884521484375, 1.009765625, 1.135009765625, 1.26025390625, 1.385498046875, 1.5107421875, 1.635986328125, 1.76123046875, 1.886474609375, 2.01171875, 2.136962890625, 2.26220703125, 2.387451171875, 2.5126953125, 2.637939453125, 2.76318359375, 2.888427734375, 3.013671875, 3.138916015625, 3.26416015625, 3.389404296875, 3.5146484375, 3.639892578125, 3.76513671875, 3.890380859375, 4.015625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 12.0, 9.0, 10.0, 15.0, 23.0, 23.0, 29.0, 31.0, 25.0, 24.0, 22.0, 31.0, 45.0, 40.0, 41.0, 40.0, 49.0, 33.0, 51.0, 44.0, 44.0, 38.0, 36.0, 28.0, 31.0, 30.0, 20.0, 32.0, 27.0, 22.0, 13.0, 13.0, 11.0, 12.0, 13.0, 1.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9066925048828125, -1.833892822265625, -1.7610931396484375, -1.68829345703125, -1.6154937744140625, -1.542694091796875, -1.4698944091796875, -1.3970947265625, -1.3242950439453125, -1.251495361328125, -1.1786956787109375, -1.10589599609375, -1.0330963134765625, -0.960296630859375, -0.8874969482421875, -0.814697265625, -0.7418975830078125, -0.669097900390625, -0.5962982177734375, -0.52349853515625, -0.4506988525390625, -0.377899169921875, -0.3050994873046875, -0.2322998046875, -0.1595001220703125, -0.086700439453125, -0.0139007568359375, 0.05889892578125, 0.1316986083984375, 0.204498291015625, 0.2772979736328125, 0.35009765625, 0.4228973388671875, 0.495697021484375, 0.5684967041015625, 0.64129638671875, 0.7140960693359375, 0.786895751953125, 0.8596954345703125, 0.9324951171875, 1.0052947998046875, 1.078094482421875, 1.1508941650390625, 1.22369384765625, 1.2964935302734375, 1.369293212890625, 1.4420928955078125, 1.514892578125, 1.5876922607421875, 1.660491943359375, 1.7332916259765625, 1.80609130859375, 1.8788909912109375, 1.951690673828125, 2.0244903564453125, 2.0972900390625, 2.1700897216796875, 2.242889404296875, 2.3156890869140625, 2.38848876953125, 2.4612884521484375, 2.534088134765625, 2.6068878173828125, 2.6796875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [6.0, 2.0, 2.0, 3.0, 5.0, 9.0, 10.0, 12.0, 17.0, 16.0, 28.0, 46.0, 59.0, 75.0, 132.0, 171.0, 271.0, 352.0, 546.0, 795.0, 1271.0, 2047.0, 3299.0, 5585.0, 9786.0, 18455.0, 36346.0, 74646.0, 156431.0, 271863.0, 230667.0, 117760.0, 56039.0, 27531.0, 14359.0, 7896.0, 4467.0, 2655.0, 1682.0, 1045.0, 660.0, 469.0, 309.0, 214.0, 163.0, 101.0, 68.0, 53.0, 45.0, 27.0, 18.0, 15.0, 12.0, 8.0, 5.0, 8.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7601776123046875, -1.699066162109375, -1.6379547119140625, -1.57684326171875, -1.5157318115234375, -1.454620361328125, -1.3935089111328125, -1.3323974609375, -1.2712860107421875, -1.210174560546875, -1.1490631103515625, -1.08795166015625, -1.0268402099609375, -0.965728759765625, -0.9046173095703125, -0.843505859375, -0.7823944091796875, -0.721282958984375, -0.6601715087890625, -0.59906005859375, -0.5379486083984375, -0.476837158203125, -0.4157257080078125, -0.3546142578125, -0.2935028076171875, -0.232391357421875, -0.1712799072265625, -0.11016845703125, -0.0490570068359375, 0.012054443359375, 0.0731658935546875, 0.13427734375, 0.1953887939453125, 0.256500244140625, 0.3176116943359375, 0.37872314453125, 0.4398345947265625, 0.500946044921875, 0.5620574951171875, 0.6231689453125, 0.6842803955078125, 0.745391845703125, 0.8065032958984375, 0.86761474609375, 0.9287261962890625, 0.989837646484375, 1.0509490966796875, 1.112060546875, 1.1731719970703125, 1.234283447265625, 1.2953948974609375, 1.35650634765625, 1.4176177978515625, 1.478729248046875, 1.5398406982421875, 1.6009521484375, 1.6620635986328125, 1.723175048828125, 1.7842864990234375, 1.84539794921875, 1.9065093994140625, 1.967620849609375, 2.0287322998046875, 2.08984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 8.0, 22.0, 17.0, 22.0, 25.0, 28.0, 47.0, 50.0, 70.0, 62.0, 74.0, 91.0, 88.0, 72.0, 56.0, 54.0, 47.0, 34.0, 20.0, 22.0, 14.0, 18.0, 7.0, 3.0, 5.0, 8.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00012350082397460938, -0.00012022629380226135, -0.00011695176362991333, -0.00011367723345756531, -0.00011040270328521729, -0.00010712817311286926, -0.00010385364294052124, -0.00010057911276817322, -9.73045825958252e-05, -9.403005242347717e-05, -9.075552225112915e-05, -8.748099207878113e-05, -8.42064619064331e-05, -8.093193173408508e-05, -7.765740156173706e-05, -7.438287138938904e-05, -7.110834121704102e-05, -6.783381104469299e-05, -6.455928087234497e-05, -6.128475069999695e-05, -5.8010220527648926e-05, -5.47356903553009e-05, -5.146116018295288e-05, -4.818663001060486e-05, -4.4912099838256836e-05, -4.1637569665908813e-05, -3.836303949356079e-05, -3.508850932121277e-05, -3.1813979148864746e-05, -2.8539448976516724e-05, -2.52649188041687e-05, -2.199038863182068e-05, -1.8715858459472656e-05, -1.5441328287124634e-05, -1.2166798114776611e-05, -8.892267942428589e-06, -5.617737770080566e-06, -2.343207597732544e-06, 9.313225746154785e-07, 4.205852746963501e-06, 7.4803829193115234e-06, 1.0754913091659546e-05, 1.4029443264007568e-05, 1.730397343635559e-05, 2.0578503608703613e-05, 2.3853033781051636e-05, 2.7127563953399658e-05, 3.040209412574768e-05, 3.36766242980957e-05, 3.6951154470443726e-05, 4.022568464279175e-05, 4.350021481513977e-05, 4.677474498748779e-05, 5.0049275159835815e-05, 5.332380533218384e-05, 5.659833550453186e-05, 5.987286567687988e-05, 6.31473958492279e-05, 6.642192602157593e-05, 6.969645619392395e-05, 7.297098636627197e-05, 7.624551653862e-05, 7.952004671096802e-05, 8.279457688331604e-05, 8.606910705566406e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 10.0, 13.0, 19.0, 25.0, 41.0, 80.0, 123.0, 168.0, 224.0, 381.0, 577.0, 900.0, 1442.0, 2655.0, 4607.0, 9008.0, 19278.0, 45429.0, 110682.0, 235172.0, 294712.0, 181672.0, 78491.0, 32730.0, 14067.0, 6838.0, 3654.0, 2133.0, 1285.0, 741.0, 508.0, 284.0, 194.0, 144.0, 77.0, 70.0, 45.0, 32.0, 22.0, 7.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.86328125, -1.7950439453125, -1.726806640625, -1.6585693359375, -1.59033203125, -1.5220947265625, -1.453857421875, -1.3856201171875, -1.3173828125, -1.2491455078125, -1.180908203125, -1.1126708984375, -1.04443359375, -0.9761962890625, -0.907958984375, -0.8397216796875, -0.771484375, -0.7032470703125, -0.635009765625, -0.5667724609375, -0.49853515625, -0.4302978515625, -0.362060546875, -0.2938232421875, -0.2255859375, -0.1573486328125, -0.089111328125, -0.0208740234375, 0.04736328125, 0.1156005859375, 0.183837890625, 0.2520751953125, 0.3203125, 0.3885498046875, 0.456787109375, 0.5250244140625, 0.59326171875, 0.6614990234375, 0.729736328125, 0.7979736328125, 0.8662109375, 0.9344482421875, 1.002685546875, 1.0709228515625, 1.13916015625, 1.2073974609375, 1.275634765625, 1.3438720703125, 1.412109375, 1.4803466796875, 1.548583984375, 1.6168212890625, 1.68505859375, 1.7532958984375, 1.821533203125, 1.8897705078125, 1.9580078125, 2.0262451171875, 2.094482421875, 2.1627197265625, 2.23095703125, 2.2991943359375, 2.367431640625, 2.4356689453125, 2.50390625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 3.0, 3.0, 5.0, 7.0, 13.0, 17.0, 15.0, 17.0, 23.0, 28.0, 30.0, 39.0, 46.0, 50.0, 64.0, 55.0, 73.0, 56.0, 63.0, 73.0, 64.0, 54.0, 34.0, 31.0, 27.0, 22.0, 20.0, 11.0, 11.0, 7.0, 10.0, 5.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404541015625, -0.3915138244628906, -0.37848663330078125, -0.3654594421386719, -0.3524322509765625, -0.3394050598144531, -0.32637786865234375, -0.3133506774902344, -0.300323486328125, -0.2872962951660156, -0.27426910400390625, -0.2612419128417969, -0.2482147216796875, -0.23518753051757812, -0.22216033935546875, -0.20913314819335938, -0.19610595703125, -0.18307876586914062, -0.17005157470703125, -0.15702438354492188, -0.1439971923828125, -0.13097000122070312, -0.11794281005859375, -0.10491561889648438, -0.091888427734375, -0.07886123657226562, -0.06583404541015625, -0.052806854248046875, -0.0397796630859375, -0.026752471923828125, -0.01372528076171875, -0.000698089599609375, 0.0123291015625, 0.025356292724609375, 0.03838348388671875, 0.051410675048828125, 0.0644378662109375, 0.07746505737304688, 0.09049224853515625, 0.10351943969726562, 0.116546630859375, 0.12957382202148438, 0.14260101318359375, 0.15562820434570312, 0.1686553955078125, 0.18168258666992188, 0.19470977783203125, 0.20773696899414062, 0.22076416015625, 0.23379135131835938, 0.24681854248046875, 0.2598457336425781, 0.2728729248046875, 0.2859001159667969, 0.29892730712890625, 0.3119544982910156, 0.324981689453125, 0.3380088806152344, 0.35103607177734375, 0.3640632629394531, 0.3770904541015625, 0.3901176452636719, 0.40314483642578125, 0.4161720275878906, 0.42919921875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 6.0, 9.0, 7.0, 9.0, 20.0, 22.0, 33.0, 36.0, 49.0, 57.0, 76.0, 83.0, 95.0, 87.0, 92.0, 68.0, 65.0, 54.0, 27.0, 32.0, 15.0, 28.0, 12.0, 3.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.881915092468262, -10.567342758178711, -10.25277042388916, -9.938197135925293, -9.623624801635742, -9.309052467346191, -8.99448013305664, -8.67990779876709, -8.365335464477539, -8.050763130187988, -7.736190319061279, -7.4216179847717285, -7.1070451736450195, -6.792472839355469, -6.477900505065918, -6.163328170776367, -5.8487548828125, -5.534182548522949, -5.21960973739624, -4.9050374031066895, -4.5904645919799805, -4.27589225769043, -3.961319923400879, -3.646747350692749, -3.332174777984619, -3.0176022052764893, -2.7030296325683594, -2.3884572982788086, -2.0738847255706787, -1.7593121528625488, -1.4447396993637085, -1.1301672458648682, -0.8155937194824219, -0.5010212063789368, -0.18644869327545166, 0.12812381982803345, 0.44269633293151855, 0.7572689056396484, 1.0718413591384888, 1.386413812637329, 1.700986385345459, 2.015558958053589, 2.3301315307617188, 2.6447038650512695, 2.9592764377593994, 3.2738490104675293, 3.58842134475708, 3.90299391746521, 4.21756649017334, 4.532138824462891, 4.8467116355896, 5.16128396987915, 5.475856781005859, 5.79042911529541, 6.105001449584961, 6.419573783874512, 6.734146595001221, 7.0487189292907715, 7.3632917404174805, 7.677864074707031, 7.992436408996582, 8.307008743286133, 8.62158203125, 8.93615436553955, 9.250726699829102]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 11.0, 8.0, 11.0, 10.0, 12.0, 9.0, 24.0, 31.0, 25.0, 29.0, 31.0, 41.0, 36.0, 37.0, 37.0, 31.0, 40.0, 37.0, 42.0, 53.0, 32.0, 37.0, 44.0, 29.0, 39.0, 31.0, 29.0, 34.0, 21.0, 26.0, 23.0, 15.0, 13.0, 11.0, 12.0, 10.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.650895357131958, -3.541168689727783, -3.4314420223236084, -3.3217153549194336, -3.211988687515259, -3.102262020111084, -2.992535352706909, -2.8828086853027344, -2.7730820178985596, -2.6633553504943848, -2.55362868309021, -2.443902015686035, -2.3341753482818604, -2.2244486808776855, -2.1147220134735107, -2.004995346069336, -1.8952686786651611, -1.7855420112609863, -1.6758153438568115, -1.5660886764526367, -1.456362009048462, -1.346635341644287, -1.2369086742401123, -1.1271820068359375, -1.0174553394317627, -0.9077286720275879, -0.7980020046234131, -0.6882753372192383, -0.5785486698150635, -0.46882200241088867, -0.35909533500671387, -0.24936866760253906, -0.13964200019836426, -0.029915332794189453, 0.07981133460998535, 0.18953800201416016, 0.29926466941833496, 0.40899133682250977, 0.5187180042266846, 0.6284446716308594, 0.7381713390350342, 0.847898006439209, 0.9576246738433838, 1.0673513412475586, 1.1770780086517334, 1.2868046760559082, 1.396531343460083, 1.5062580108642578, 1.6159846782684326, 1.7257113456726074, 1.8354380130767822, 1.945164680480957, 2.054891347885132, 2.1646180152893066, 2.2743446826934814, 2.3840713500976562, 2.493798017501831, 2.603524684906006, 2.7132513523101807, 2.8229780197143555, 2.9327046871185303, 3.042431354522705, 3.15215802192688, 3.2618846893310547, 3.3716113567352295]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 9.0, 13.0, 25.0, 28.0, 58.0, 76.0, 117.0, 176.0, 269.0, 387.0, 665.0, 1134.0, 1796.0, 3065.0, 5379.0, 9753.0, 18085.0, 34661.0, 65334.0, 118796.0, 184177.0, 211898.0, 168341.0, 103833.0, 55745.0, 29240.0, 15454.0, 8384.0, 4786.0, 2625.0, 1600.0, 967.0, 570.0, 361.0, 216.0, 184.0, 120.0, 70.0, 36.0, 40.0, 30.0, 15.0, 13.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.52734375, -6.33746337890625, -6.1475830078125, -5.95770263671875, -5.767822265625, -5.57794189453125, -5.3880615234375, -5.19818115234375, -5.00830078125, -4.81842041015625, -4.6285400390625, -4.43865966796875, -4.248779296875, -4.05889892578125, -3.8690185546875, -3.67913818359375, -3.4892578125, -3.29937744140625, -3.1094970703125, -2.91961669921875, -2.729736328125, -2.53985595703125, -2.3499755859375, -2.16009521484375, -1.97021484375, -1.78033447265625, -1.5904541015625, -1.40057373046875, -1.210693359375, -1.02081298828125, -0.8309326171875, -0.64105224609375, -0.451171875, -0.26129150390625, -0.0714111328125, 0.11846923828125, 0.308349609375, 0.49822998046875, 0.6881103515625, 0.87799072265625, 1.06787109375, 1.25775146484375, 1.4476318359375, 1.63751220703125, 1.827392578125, 2.01727294921875, 2.2071533203125, 2.39703369140625, 2.5869140625, 2.77679443359375, 2.9666748046875, 3.15655517578125, 3.346435546875, 3.53631591796875, 3.7261962890625, 3.91607666015625, 4.10595703125, 4.29583740234375, 4.4857177734375, 4.67559814453125, 4.865478515625, 5.05535888671875, 5.2452392578125, 5.43511962890625, 5.625]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 2.0, 6.0, 9.0, 12.0, 9.0, 5.0, 10.0, 16.0, 16.0, 22.0, 25.0, 24.0, 27.0, 31.0, 21.0, 34.0, 36.0, 36.0, 38.0, 34.0, 44.0, 34.0, 29.0, 44.0, 31.0, 47.0, 37.0, 35.0, 33.0, 19.0, 33.0, 23.0, 23.0, 19.0, 18.0, 15.0, 16.0, 10.0, 9.0, 10.0, 6.0, 10.0, 5.0, 10.0, 5.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.703125, -3.59429931640625, -3.4854736328125, -3.37664794921875, -3.267822265625, -3.15899658203125, -3.0501708984375, -2.94134521484375, -2.83251953125, -2.72369384765625, -2.6148681640625, -2.50604248046875, -2.397216796875, -2.28839111328125, -2.1795654296875, -2.07073974609375, -1.9619140625, -1.85308837890625, -1.7442626953125, -1.63543701171875, -1.526611328125, -1.41778564453125, -1.3089599609375, -1.20013427734375, -1.09130859375, -0.98248291015625, -0.8736572265625, -0.76483154296875, -0.656005859375, -0.54718017578125, -0.4383544921875, -0.32952880859375, -0.220703125, -0.11187744140625, -0.0030517578125, 0.10577392578125, 0.214599609375, 0.32342529296875, 0.4322509765625, 0.54107666015625, 0.64990234375, 0.75872802734375, 0.8675537109375, 0.97637939453125, 1.085205078125, 1.19403076171875, 1.3028564453125, 1.41168212890625, 1.5205078125, 1.62933349609375, 1.7381591796875, 1.84698486328125, 1.955810546875, 2.06463623046875, 2.1734619140625, 2.28228759765625, 2.39111328125, 2.49993896484375, 2.6087646484375, 2.71759033203125, 2.826416015625, 2.93524169921875, 3.0440673828125, 3.15289306640625, 3.26171875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 6.0, 7.0, 7.0, 11.0, 12.0, 35.0, 22.0, 41.0, 62.0, 83.0, 169.0, 228.0, 384.0, 708.0, 1193.0, 2024.0, 3691.0, 6705.0, 12706.0, 24131.0, 45977.0, 85213.0, 141951.0, 192424.0, 194864.0, 145259.0, 88189.0, 48072.0, 25407.0, 12981.0, 7028.0, 3816.0, 2124.0, 1213.0, 698.0, 420.0, 239.0, 151.0, 100.0, 61.0, 52.0, 29.0, 18.0, 12.0, 7.0, 11.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.0078125, -5.82025146484375, -5.6326904296875, -5.44512939453125, -5.257568359375, -5.07000732421875, -4.8824462890625, -4.69488525390625, -4.50732421875, -4.31976318359375, -4.1322021484375, -3.94464111328125, -3.757080078125, -3.56951904296875, -3.3819580078125, -3.19439697265625, -3.0068359375, -2.81927490234375, -2.6317138671875, -2.44415283203125, -2.256591796875, -2.06903076171875, -1.8814697265625, -1.69390869140625, -1.50634765625, -1.31878662109375, -1.1312255859375, -0.94366455078125, -0.756103515625, -0.56854248046875, -0.3809814453125, -0.19342041015625, -0.005859375, 0.18170166015625, 0.3692626953125, 0.55682373046875, 0.744384765625, 0.93194580078125, 1.1195068359375, 1.30706787109375, 1.49462890625, 1.68218994140625, 1.8697509765625, 2.05731201171875, 2.244873046875, 2.43243408203125, 2.6199951171875, 2.80755615234375, 2.9951171875, 3.18267822265625, 3.3702392578125, 3.55780029296875, 3.745361328125, 3.93292236328125, 4.1204833984375, 4.30804443359375, 4.49560546875, 4.68316650390625, 4.8707275390625, 5.05828857421875, 5.245849609375, 5.43341064453125, 5.6209716796875, 5.80853271484375, 5.99609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 7.0, 10.0, 8.0, 10.0, 15.0, 17.0, 14.0, 26.0, 37.0, 23.0, 31.0, 39.0, 42.0, 35.0, 45.0, 40.0, 57.0, 47.0, 40.0, 52.0, 47.0, 49.0, 39.0, 42.0, 28.0, 25.0, 27.0, 19.0, 24.0, 20.0, 17.0, 15.0, 12.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6328125, -2.553680419921875, -2.47454833984375, -2.395416259765625, -2.3162841796875, -2.237152099609375, -2.15802001953125, -2.078887939453125, -1.999755859375, -1.920623779296875, -1.84149169921875, -1.762359619140625, -1.6832275390625, -1.604095458984375, -1.52496337890625, -1.445831298828125, -1.36669921875, -1.287567138671875, -1.20843505859375, -1.129302978515625, -1.0501708984375, -0.971038818359375, -0.89190673828125, -0.812774658203125, -0.733642578125, -0.654510498046875, -0.57537841796875, -0.496246337890625, -0.4171142578125, -0.337982177734375, -0.25885009765625, -0.179718017578125, -0.1005859375, -0.021453857421875, 0.05767822265625, 0.136810302734375, 0.2159423828125, 0.295074462890625, 0.37420654296875, 0.453338623046875, 0.532470703125, 0.611602783203125, 0.69073486328125, 0.769866943359375, 0.8489990234375, 0.928131103515625, 1.00726318359375, 1.086395263671875, 1.16552734375, 1.244659423828125, 1.32379150390625, 1.402923583984375, 1.4820556640625, 1.561187744140625, 1.64031982421875, 1.719451904296875, 1.798583984375, 1.877716064453125, 1.95684814453125, 2.035980224609375, 2.1151123046875, 2.194244384765625, 2.27337646484375, 2.352508544921875, 2.431640625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 11.0, 11.0, 19.0, 26.0, 35.0, 39.0, 70.0, 103.0, 175.0, 237.0, 376.0, 622.0, 894.0, 1536.0, 2449.0, 3710.0, 6020.0, 9949.0, 16590.0, 28698.0, 49650.0, 84404.0, 134556.0, 181993.0, 182640.0, 135569.0, 85288.0, 50206.0, 28886.0, 17128.0, 10133.0, 6132.0, 3859.0, 2361.0, 1525.0, 909.0, 611.0, 387.0, 277.0, 172.0, 102.0, 60.0, 50.0, 31.0, 17.0, 15.0, 11.0, 5.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.671875, -2.588409423828125, -2.50494384765625, -2.421478271484375, -2.3380126953125, -2.254547119140625, -2.17108154296875, -2.087615966796875, -2.004150390625, -1.920684814453125, -1.83721923828125, -1.753753662109375, -1.6702880859375, -1.586822509765625, -1.50335693359375, -1.419891357421875, -1.33642578125, -1.252960205078125, -1.16949462890625, -1.086029052734375, -1.0025634765625, -0.919097900390625, -0.83563232421875, -0.752166748046875, -0.668701171875, -0.585235595703125, -0.50177001953125, -0.418304443359375, -0.3348388671875, -0.251373291015625, -0.16790771484375, -0.084442138671875, -0.0009765625, 0.082489013671875, 0.16595458984375, 0.249420166015625, 0.3328857421875, 0.416351318359375, 0.49981689453125, 0.583282470703125, 0.666748046875, 0.750213623046875, 0.83367919921875, 0.917144775390625, 1.0006103515625, 1.084075927734375, 1.16754150390625, 1.251007080078125, 1.33447265625, 1.417938232421875, 1.50140380859375, 1.584869384765625, 1.6683349609375, 1.751800537109375, 1.83526611328125, 1.918731689453125, 2.002197265625, 2.085662841796875, 2.16912841796875, 2.252593994140625, 2.3360595703125, 2.419525146484375, 2.50299072265625, 2.586456298828125, 2.669921875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 8.0, 13.0, 12.0, 18.0, 17.0, 29.0, 35.0, 32.0, 58.0, 47.0, 62.0, 66.0, 67.0, 76.0, 83.0, 64.0, 56.0, 53.0, 42.0, 20.0, 30.0, 17.0, 14.0, 10.0, 9.0, 17.0, 8.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.0004024505615234375, -0.00039162859320640564, -0.0003808066248893738, -0.0003699846565723419, -0.00035916268825531006, -0.0003483407199382782, -0.00033751875162124634, -0.0003266967833042145, -0.0003158748149871826, -0.00030505284667015076, -0.0002942308783531189, -0.00028340891003608704, -0.0002725869417190552, -0.0002617649734020233, -0.00025094300508499146, -0.0002401210367679596, -0.00022929906845092773, -0.00021847710013389587, -0.00020765513181686401, -0.00019683316349983215, -0.0001860111951828003, -0.00017518922686576843, -0.00016436725854873657, -0.0001535452902317047, -0.00014272332191467285, -0.000131901353597641, -0.00012107938528060913, -0.00011025741696357727, -9.943544864654541e-05, -8.861348032951355e-05, -7.779151201248169e-05, -6.696954369544983e-05, -5.614757537841797e-05, -4.532560706138611e-05, -3.450363874435425e-05, -2.3681670427322388e-05, -1.2859702110290527e-05, -2.037733793258667e-06, 8.784234523773193e-06, 1.9606202840805054e-05, 3.0428171157836914e-05, 4.1250139474868774e-05, 5.2072107791900635e-05, 6.28940761089325e-05, 7.371604442596436e-05, 8.453801274299622e-05, 9.535998106002808e-05, 0.00010618194937705994, 0.0001170039176940918, 0.00012782588601112366, 0.00013864785432815552, 0.00014946982264518738, 0.00016029179096221924, 0.0001711137592792511, 0.00018193572759628296, 0.00019275769591331482, 0.00020357966423034668, 0.00021440163254737854, 0.0002252236008644104, 0.00023604556918144226, 0.0002468675374984741, 0.000257689505815506, 0.00026851147413253784, 0.0002793334424495697, 0.00029015541076660156]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 6.0, 7.0, 14.0, 15.0, 24.0, 27.0, 35.0, 58.0, 76.0, 79.0, 111.0, 152.0, 230.0, 311.0, 470.0, 729.0, 1156.0, 1699.0, 2753.0, 4398.0, 7269.0, 12256.0, 21314.0, 36587.0, 61967.0, 101222.0, 146394.0, 176023.0, 162473.0, 120441.0, 77193.0, 46312.0, 26897.0, 15906.0, 9003.0, 5451.0, 3377.0, 2087.0, 1288.0, 882.0, 534.0, 397.0, 264.0, 172.0, 126.0, 108.0, 69.0, 40.0, 38.0, 40.0, 26.0, 21.0, 10.0, 12.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-2.1015625, -2.03314208984375, -1.9647216796875, -1.89630126953125, -1.827880859375, -1.75946044921875, -1.6910400390625, -1.62261962890625, -1.55419921875, -1.48577880859375, -1.4173583984375, -1.34893798828125, -1.280517578125, -1.21209716796875, -1.1436767578125, -1.07525634765625, -1.0068359375, -0.93841552734375, -0.8699951171875, -0.80157470703125, -0.733154296875, -0.66473388671875, -0.5963134765625, -0.52789306640625, -0.45947265625, -0.39105224609375, -0.3226318359375, -0.25421142578125, -0.185791015625, -0.11737060546875, -0.0489501953125, 0.01947021484375, 0.087890625, 0.15631103515625, 0.2247314453125, 0.29315185546875, 0.361572265625, 0.42999267578125, 0.4984130859375, 0.56683349609375, 0.63525390625, 0.70367431640625, 0.7720947265625, 0.84051513671875, 0.908935546875, 0.97735595703125, 1.0457763671875, 1.11419677734375, 1.1826171875, 1.25103759765625, 1.3194580078125, 1.38787841796875, 1.456298828125, 1.52471923828125, 1.5931396484375, 1.66156005859375, 1.72998046875, 1.79840087890625, 1.8668212890625, 1.93524169921875, 2.003662109375, 2.07208251953125, 2.1405029296875, 2.20892333984375, 2.27734375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 16.0, 9.0, 22.0, 27.0, 36.0, 37.0, 54.0, 59.0, 67.0, 74.0, 66.0, 64.0, 73.0, 70.0, 59.0, 54.0, 49.0, 26.0, 23.0, 27.0, 23.0, 9.0, 15.0, 12.0, 3.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.0234375, -0.9976119995117188, -0.9717864990234375, -0.9459609985351562, -0.920135498046875, -0.8943099975585938, -0.8684844970703125, -0.8426589965820312, -0.81683349609375, -0.7910079956054688, -0.7651824951171875, -0.7393569946289062, -0.713531494140625, -0.6877059936523438, -0.6618804931640625, -0.6360549926757812, -0.6102294921875, -0.5844039916992188, -0.5585784912109375, -0.5327529907226562, -0.506927490234375, -0.48110198974609375, -0.4552764892578125, -0.42945098876953125, -0.40362548828125, -0.37779998779296875, -0.3519744873046875, -0.32614898681640625, -0.300323486328125, -0.27449798583984375, -0.2486724853515625, -0.22284698486328125, -0.197021484375, -0.17119598388671875, -0.1453704833984375, -0.11954498291015625, -0.093719482421875, -0.06789398193359375, -0.0420684814453125, -0.01624298095703125, 0.00958251953125, 0.03540802001953125, 0.0612335205078125, 0.08705902099609375, 0.112884521484375, 0.13871002197265625, 0.1645355224609375, 0.19036102294921875, 0.2161865234375, 0.24201202392578125, 0.2678375244140625, 0.29366302490234375, 0.319488525390625, 0.34531402587890625, 0.3711395263671875, 0.39696502685546875, 0.42279052734375, 0.44861602783203125, 0.4744415283203125, 0.5002670288085938, 0.526092529296875, 0.5519180297851562, 0.5777435302734375, 0.6035690307617188, 0.62939453125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 6.0, 5.0, 9.0, 2.0, 8.0, 14.0, 16.0, 20.0, 22.0, 27.0, 41.0, 63.0, 67.0, 65.0, 83.0, 79.0, 66.0, 99.0, 73.0, 66.0, 46.0, 33.0, 27.0, 26.0, 13.0, 16.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.698271751403809, -10.396517753601074, -10.094762802124023, -9.793008804321289, -9.491254806518555, -9.189499855041504, -8.88774585723877, -8.585990905761719, -8.284236907958984, -7.982482433319092, -7.680727958679199, -7.378973960876465, -7.077219486236572, -6.77546501159668, -6.473711013793945, -6.171956539154053, -5.87020206451416, -5.568447589874268, -5.266693115234375, -4.964939117431641, -4.663184642791748, -4.3614301681518555, -4.059676170349121, -3.7579216957092285, -3.456167221069336, -3.1544127464294434, -2.85265851020813, -2.5509042739868164, -2.249149799346924, -1.9473954439163208, -1.6456410884857178, -1.3438868522644043, -1.0421333312988281, -0.7403789758682251, -0.43862462043762207, -0.13687026500701904, 0.16488409042358398, 0.466638445854187, 0.76839280128479, 1.0701470375061035, 1.371901512145996, 1.6736558675765991, 1.9754102230072021, 2.2771644592285156, 2.578918933868408, 2.880673408508301, 3.1824276447296143, 3.4841818809509277, 3.7859363555908203, 4.087690830230713, 4.3894453048706055, 4.69119930267334, 4.992953777313232, 5.294708251953125, 5.596462249755859, 5.898216724395752, 6.1999711990356445, 6.501725673675537, 6.80348014831543, 7.105234146118164, 7.406988620758057, 7.708743095397949, 8.010497093200684, 8.312252044677734, 8.614006042480469]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 8.0, 13.0, 8.0, 11.0, 12.0, 12.0, 18.0, 25.0, 22.0, 14.0, 22.0, 17.0, 25.0, 24.0, 41.0, 42.0, 52.0, 53.0, 43.0, 49.0, 43.0, 39.0, 32.0, 34.0, 42.0, 35.0, 47.0, 29.0, 24.0, 36.0, 30.0, 22.0, 11.0, 7.0, 15.0, 12.0, 6.0, 5.0, 5.0, 8.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4548962116241455, -3.342690944671631, -3.2304859161376953, -3.1182806491851807, -3.006075620651245, -2.8938703536987305, -2.781665325164795, -2.6694600582122803, -2.5572547912597656, -2.445049524307251, -2.3328444957733154, -2.220639228820801, -2.1084342002868652, -1.9962289333343506, -1.8840237855911255, -1.7718186378479004, -1.6596136093139648, -1.5474084615707397, -1.4352033138275146, -1.322998046875, -1.2107930183410645, -1.0985877513885498, -0.9863826036453247, -0.8741774559020996, -0.7619723081588745, -0.6497671604156494, -0.5375620126724243, -0.42535680532455444, -0.31315165758132935, -0.20094650983810425, -0.08874130249023438, 0.023463845252990723, 0.13566923141479492, 0.2478743940591812, 0.3600795567035675, 0.472284734249115, 0.5844898819923401, 0.6966950297355652, 0.8089002370834351, 0.9211053848266602, 1.0333105325698853, 1.1455156803131104, 1.2577208280563354, 1.3699259757995605, 1.4821312427520752, 1.5943362712860107, 1.7065415382385254, 1.8187466859817505, 1.9309518337249756, 2.0431571006774902, 2.155362129211426, 2.2675673961639404, 2.379772424697876, 2.4919776916503906, 2.604182720184326, 2.716387987136841, 2.8285932540893555, 2.94079852104187, 3.0530035495758057, 3.1652088165283203, 3.277413845062256, 3.3896191120147705, 3.501824378967285, 3.6140294075012207, 3.7262344360351562]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 14.0, 17.0, 21.0, 45.0, 66.0, 96.0, 159.0, 251.0, 421.0, 680.0, 1234.0, 2283.0, 4486.0, 9188.0, 20588.0, 52667.0, 154775.0, 545847.0, 1652830.0, 1243638.0, 337328.0, 100276.0, 36429.0, 15417.0, 7322.0, 3640.0, 1941.0, 1063.0, 621.0, 380.0, 196.0, 144.0, 66.0, 57.0, 26.0, 19.0, 12.0, 13.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.984375, -10.6689453125, -10.353515625, -10.0380859375, -9.72265625, -9.4072265625, -9.091796875, -8.7763671875, -8.4609375, -8.1455078125, -7.830078125, -7.5146484375, -7.19921875, -6.8837890625, -6.568359375, -6.2529296875, -5.9375, -5.6220703125, -5.306640625, -4.9912109375, -4.67578125, -4.3603515625, -4.044921875, -3.7294921875, -3.4140625, -3.0986328125, -2.783203125, -2.4677734375, -2.15234375, -1.8369140625, -1.521484375, -1.2060546875, -0.890625, -0.5751953125, -0.259765625, 0.0556640625, 0.37109375, 0.6865234375, 1.001953125, 1.3173828125, 1.6328125, 1.9482421875, 2.263671875, 2.5791015625, 2.89453125, 3.2099609375, 3.525390625, 3.8408203125, 4.15625, 4.4716796875, 4.787109375, 5.1025390625, 5.41796875, 5.7333984375, 6.048828125, 6.3642578125, 6.6796875, 6.9951171875, 7.310546875, 7.6259765625, 7.94140625, 8.2568359375, 8.572265625, 8.8876953125, 9.203125]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 14.0, 9.0, 16.0, 12.0, 14.0, 12.0, 19.0, 19.0, 20.0, 21.0, 21.0, 34.0, 37.0, 41.0, 38.0, 47.0, 35.0, 52.0, 34.0, 56.0, 51.0, 38.0, 36.0, 49.0, 25.0, 30.0, 30.0, 32.0, 26.0, 25.0, 12.0, 17.0, 6.0, 5.0, 14.0, 7.0, 7.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.91015625, -2.81756591796875, -2.7249755859375, -2.63238525390625, -2.539794921875, -2.44720458984375, -2.3546142578125, -2.26202392578125, -2.16943359375, -2.07684326171875, -1.9842529296875, -1.89166259765625, -1.799072265625, -1.70648193359375, -1.6138916015625, -1.52130126953125, -1.4287109375, -1.33612060546875, -1.2435302734375, -1.15093994140625, -1.058349609375, -0.96575927734375, -0.8731689453125, -0.78057861328125, -0.68798828125, -0.59539794921875, -0.5028076171875, -0.41021728515625, -0.317626953125, -0.22503662109375, -0.1324462890625, -0.03985595703125, 0.052734375, 0.14532470703125, 0.2379150390625, 0.33050537109375, 0.423095703125, 0.51568603515625, 0.6082763671875, 0.70086669921875, 0.79345703125, 0.88604736328125, 0.9786376953125, 1.07122802734375, 1.163818359375, 1.25640869140625, 1.3489990234375, 1.44158935546875, 1.5341796875, 1.62677001953125, 1.7193603515625, 1.81195068359375, 1.904541015625, 1.99713134765625, 2.0897216796875, 2.18231201171875, 2.27490234375, 2.36749267578125, 2.4600830078125, 2.55267333984375, 2.645263671875, 2.73785400390625, 2.8304443359375, 2.92303466796875, 3.015625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 10.0, 14.0, 19.0, 40.0, 43.0, 61.0, 111.0, 130.0, 258.0, 345.0, 549.0, 772.0, 1204.0, 1840.0, 3016.0, 4834.0, 8046.0, 13798.0, 24314.0, 44747.0, 84682.0, 167328.0, 347530.0, 720056.0, 1121666.0, 830137.0, 408773.0, 194800.0, 97412.0, 50884.0, 28193.0, 15469.0, 8964.0, 5363.0, 3212.0, 2073.0, 1254.0, 829.0, 511.0, 364.0, 212.0, 146.0, 91.0, 65.0, 48.0, 22.0, 18.0, 10.0, 11.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-6.9296875, -6.7171630859375, -6.504638671875, -6.2921142578125, -6.07958984375, -5.8670654296875, -5.654541015625, -5.4420166015625, -5.2294921875, -5.0169677734375, -4.804443359375, -4.5919189453125, -4.37939453125, -4.1668701171875, -3.954345703125, -3.7418212890625, -3.529296875, -3.3167724609375, -3.104248046875, -2.8917236328125, -2.67919921875, -2.4666748046875, -2.254150390625, -2.0416259765625, -1.8291015625, -1.6165771484375, -1.404052734375, -1.1915283203125, -0.97900390625, -0.7664794921875, -0.553955078125, -0.3414306640625, -0.12890625, 0.0836181640625, 0.296142578125, 0.5086669921875, 0.72119140625, 0.9337158203125, 1.146240234375, 1.3587646484375, 1.5712890625, 1.7838134765625, 1.996337890625, 2.2088623046875, 2.42138671875, 2.6339111328125, 2.846435546875, 3.0589599609375, 3.271484375, 3.4840087890625, 3.696533203125, 3.9090576171875, 4.12158203125, 4.3341064453125, 4.546630859375, 4.7591552734375, 4.9716796875, 5.1842041015625, 5.396728515625, 5.6092529296875, 5.82177734375, 6.0343017578125, 6.246826171875, 6.4593505859375, 6.671875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 7.0, 16.0, 12.0, 17.0, 24.0, 39.0, 48.0, 57.0, 77.0, 100.0, 117.0, 151.0, 181.0, 257.0, 258.0, 297.0, 312.0, 328.0, 321.0, 295.0, 225.0, 213.0, 164.0, 129.0, 71.0, 73.0, 63.0, 44.0, 38.0, 22.0, 23.0, 11.0, 10.0, 14.0, 9.0, 6.0, 1.0, 7.0, 2.0, 10.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.240234375, -2.17242431640625, -2.1046142578125, -2.03680419921875, -1.968994140625, -1.90118408203125, -1.8333740234375, -1.76556396484375, -1.69775390625, -1.62994384765625, -1.5621337890625, -1.49432373046875, -1.426513671875, -1.35870361328125, -1.2908935546875, -1.22308349609375, -1.1552734375, -1.08746337890625, -1.0196533203125, -0.95184326171875, -0.884033203125, -0.81622314453125, -0.7484130859375, -0.68060302734375, -0.61279296875, -0.54498291015625, -0.4771728515625, -0.40936279296875, -0.341552734375, -0.27374267578125, -0.2059326171875, -0.13812255859375, -0.0703125, -0.00250244140625, 0.0653076171875, 0.13311767578125, 0.200927734375, 0.26873779296875, 0.3365478515625, 0.40435791015625, 0.47216796875, 0.53997802734375, 0.6077880859375, 0.67559814453125, 0.743408203125, 0.81121826171875, 0.8790283203125, 0.94683837890625, 1.0146484375, 1.08245849609375, 1.1502685546875, 1.21807861328125, 1.285888671875, 1.35369873046875, 1.4215087890625, 1.48931884765625, 1.55712890625, 1.62493896484375, 1.6927490234375, 1.76055908203125, 1.828369140625, 1.89617919921875, 1.9639892578125, 2.03179931640625, 2.099609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 2.0, 4.0, 9.0, 7.0, 10.0, 18.0, 17.0, 33.0, 32.0, 37.0, 45.0, 48.0, 70.0, 75.0, 64.0, 86.0, 69.0, 58.0, 65.0, 58.0, 40.0, 19.0, 33.0, 21.0, 8.0, 16.0, 9.0, 11.0, 7.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.09686279296875, -9.814611434936523, -9.532360076904297, -9.25010871887207, -8.967857360839844, -8.685606002807617, -8.40335464477539, -8.121103286743164, -7.838851451873779, -7.556600093841553, -7.274348735809326, -6.9920973777771, -6.709845542907715, -6.427594184875488, -6.145342826843262, -5.863091468811035, -5.580840110778809, -5.298588752746582, -5.0163373947143555, -4.734086036682129, -4.451834678649902, -4.169583320617676, -3.887331485748291, -3.6050801277160645, -3.322828769683838, -3.0405774116516113, -2.7583260536193848, -2.476074457168579, -2.1938230991363525, -1.911571741104126, -1.6293202638626099, -1.3470687866210938, -1.0648174285888672, -0.7825660109519958, -0.5003145933151245, -0.21806317567825317, 0.06418824195861816, 0.3464395999908447, 0.6286910772323608, 0.910942554473877, 1.1931939125061035, 1.47544527053833, 1.7576967477798462, 2.0399482250213623, 2.322199583053589, 2.6044509410858154, 2.886702537536621, 3.1689538955688477, 3.451205253601074, 3.733456611633301, 4.015707969665527, 4.297959327697754, 4.5802106857299805, 4.862462043762207, 5.144713878631592, 5.426965236663818, 5.709216594696045, 5.9914679527282715, 6.273719310760498, 6.555970668792725, 6.838222503662109, 7.120473861694336, 7.4027252197265625, 7.684976577758789, 7.967227935791016]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 11.0, 9.0, 3.0, 6.0, 15.0, 11.0, 17.0, 12.0, 19.0, 19.0, 29.0, 25.0, 30.0, 33.0, 31.0, 33.0, 39.0, 49.0, 39.0, 47.0, 37.0, 25.0, 27.0, 28.0, 30.0, 36.0, 34.0, 27.0, 33.0, 31.0, 22.0, 21.0, 25.0, 25.0, 17.0, 11.0, 13.0, 11.0, 9.0, 10.0, 9.0, 8.0, 1.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.54913330078125, -3.442233085632324, -3.3353331089019775, -3.2284328937530518, -3.121532678604126, -3.0146327018737793, -2.9077324867248535, -2.8008322715759277, -2.693932056427002, -2.587031841278076, -2.4801318645477295, -2.3732316493988037, -2.266331434249878, -2.1594314575195312, -2.0525312423706055, -1.9456310272216797, -1.838731050491333, -1.7318309545516968, -1.624930739402771, -1.5180306434631348, -1.411130428314209, -1.3042303323745728, -1.1973302364349365, -1.0904300212860107, -0.9835299253463745, -0.8766297698020935, -0.7697296142578125, -0.6628295183181763, -0.5559293627738953, -0.44902920722961426, -0.342129111289978, -0.23522895574569702, -0.12832880020141602, -0.021428659558296204, 0.08547148108482361, 0.19237160682678223, 0.29927176237106323, 0.40617191791534424, 0.5130720138549805, 0.6199721693992615, 0.7268723249435425, 0.8337724804878235, 0.9406726360321045, 1.0475727319717407, 1.154472827911377, 1.2613730430603027, 1.368273138999939, 1.4751732349395752, 1.582073450088501, 1.6889735460281372, 1.795873761177063, 1.9027738571166992, 2.009674072265625, 2.116574287414551, 2.2234742641448975, 2.3303744792938232, 2.43727445602417, 2.5441746711730957, 2.6510746479034424, 2.757974863052368, 2.864875078201294, 2.9717750549316406, 3.0786752700805664, 3.185575485229492, 3.292475700378418]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 9.0, 14.0, 13.0, 33.0, 43.0, 50.0, 78.0, 118.0, 167.0, 257.0, 395.0, 595.0, 884.0, 1445.0, 2536.0, 4963.0, 11020.0, 29728.0, 91461.0, 264497.0, 370764.0, 176477.0, 56954.0, 19289.0, 7579.0, 3687.0, 1998.0, 1224.0, 771.0, 511.0, 331.0, 230.0, 141.0, 95.0, 77.0, 35.0, 23.0, 25.0, 14.0, 11.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.753662109375, -5.55029296875, -5.346923828125, -5.1435546875, -4.940185546875, -4.73681640625, -4.533447265625, -4.330078125, -4.126708984375, -3.92333984375, -3.719970703125, -3.5166015625, -3.313232421875, -3.10986328125, -2.906494140625, -2.703125, -2.499755859375, -2.29638671875, -2.093017578125, -1.8896484375, -1.686279296875, -1.48291015625, -1.279541015625, -1.076171875, -0.872802734375, -0.66943359375, -0.466064453125, -0.2626953125, -0.059326171875, 0.14404296875, 0.347412109375, 0.55078125, 0.754150390625, 0.95751953125, 1.160888671875, 1.3642578125, 1.567626953125, 1.77099609375, 1.974365234375, 2.177734375, 2.381103515625, 2.58447265625, 2.787841796875, 2.9912109375, 3.194580078125, 3.39794921875, 3.601318359375, 3.8046875, 4.008056640625, 4.21142578125, 4.414794921875, 4.6181640625, 4.821533203125, 5.02490234375, 5.228271484375, 5.431640625, 5.635009765625, 5.83837890625, 6.041748046875, 6.2451171875, 6.448486328125, 6.65185546875, 6.855224609375, 7.05859375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 7.0, 4.0, 8.0, 9.0, 11.0, 8.0, 14.0, 9.0, 15.0, 23.0, 23.0, 23.0, 20.0, 25.0, 31.0, 31.0, 37.0, 36.0, 37.0, 40.0, 53.0, 33.0, 49.0, 40.0, 23.0, 44.0, 30.0, 35.0, 31.0, 24.0, 29.0, 39.0, 26.0, 20.0, 8.0, 16.0, 10.0, 9.0, 14.0, 12.0, 9.0, 6.0, 9.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.94921875, -3.8251953125, -3.701171875, -3.5771484375, -3.453125, -3.3291015625, -3.205078125, -3.0810546875, -2.95703125, -2.8330078125, -2.708984375, -2.5849609375, -2.4609375, -2.3369140625, -2.212890625, -2.0888671875, -1.96484375, -1.8408203125, -1.716796875, -1.5927734375, -1.46875, -1.3447265625, -1.220703125, -1.0966796875, -0.97265625, -0.8486328125, -0.724609375, -0.6005859375, -0.4765625, -0.3525390625, -0.228515625, -0.1044921875, 0.01953125, 0.1435546875, 0.267578125, 0.3916015625, 0.515625, 0.6396484375, 0.763671875, 0.8876953125, 1.01171875, 1.1357421875, 1.259765625, 1.3837890625, 1.5078125, 1.6318359375, 1.755859375, 1.8798828125, 2.00390625, 2.1279296875, 2.251953125, 2.3759765625, 2.5, 2.6240234375, 2.748046875, 2.8720703125, 2.99609375, 3.1201171875, 3.244140625, 3.3681640625, 3.4921875, 3.6162109375, 3.740234375, 3.8642578125, 3.98828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 6.0, 7.0, 9.0, 6.0, 21.0, 23.0, 36.0, 44.0, 45.0, 73.0, 82.0, 131.0, 188.0, 237.0, 374.0, 508.0, 849.0, 1552.0, 3279.0, 8959.0, 38398.0, 252772.0, 582163.0, 125710.0, 21327.0, 5786.0, 2380.0, 1265.0, 744.0, 423.0, 312.0, 228.0, 160.0, 115.0, 87.0, 64.0, 45.0, 35.0, 40.0, 21.0, 9.0, 15.0, 9.0, 6.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.34375, -10.9696044921875, -10.595458984375, -10.2213134765625, -9.84716796875, -9.4730224609375, -9.098876953125, -8.7247314453125, -8.3505859375, -7.9764404296875, -7.602294921875, -7.2281494140625, -6.85400390625, -6.4798583984375, -6.105712890625, -5.7315673828125, -5.357421875, -4.9832763671875, -4.609130859375, -4.2349853515625, -3.86083984375, -3.4866943359375, -3.112548828125, -2.7384033203125, -2.3642578125, -1.9901123046875, -1.615966796875, -1.2418212890625, -0.86767578125, -0.4935302734375, -0.119384765625, 0.2547607421875, 0.62890625, 1.0030517578125, 1.377197265625, 1.7513427734375, 2.12548828125, 2.4996337890625, 2.873779296875, 3.2479248046875, 3.6220703125, 3.9962158203125, 4.370361328125, 4.7445068359375, 5.11865234375, 5.4927978515625, 5.866943359375, 6.2410888671875, 6.615234375, 6.9893798828125, 7.363525390625, 7.7376708984375, 8.11181640625, 8.4859619140625, 8.860107421875, 9.2342529296875, 9.6083984375, 9.9825439453125, 10.356689453125, 10.7308349609375, 11.10498046875, 11.4791259765625, 11.853271484375, 12.2274169921875, 12.6015625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 1.0, 8.0, 8.0, 7.0, 5.0, 12.0, 7.0, 13.0, 14.0, 17.0, 10.0, 21.0, 17.0, 22.0, 20.0, 37.0, 36.0, 26.0, 35.0, 37.0, 40.0, 32.0, 39.0, 38.0, 40.0, 42.0, 40.0, 38.0, 32.0, 37.0, 36.0, 29.0, 16.0, 22.0, 20.0, 22.0, 19.0, 20.0, 12.0, 7.0, 8.0, 12.0, 8.0, 8.0, 7.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.169921875, -2.0987548828125, -2.027587890625, -1.9564208984375, -1.88525390625, -1.8140869140625, -1.742919921875, -1.6717529296875, -1.6005859375, -1.5294189453125, -1.458251953125, -1.3870849609375, -1.31591796875, -1.2447509765625, -1.173583984375, -1.1024169921875, -1.03125, -0.9600830078125, -0.888916015625, -0.8177490234375, -0.74658203125, -0.6754150390625, -0.604248046875, -0.5330810546875, -0.4619140625, -0.3907470703125, -0.319580078125, -0.2484130859375, -0.17724609375, -0.1060791015625, -0.034912109375, 0.0362548828125, 0.107421875, 0.1785888671875, 0.249755859375, 0.3209228515625, 0.39208984375, 0.4632568359375, 0.534423828125, 0.6055908203125, 0.6767578125, 0.7479248046875, 0.819091796875, 0.8902587890625, 0.96142578125, 1.0325927734375, 1.103759765625, 1.1749267578125, 1.24609375, 1.3172607421875, 1.388427734375, 1.4595947265625, 1.53076171875, 1.6019287109375, 1.673095703125, 1.7442626953125, 1.8154296875, 1.8865966796875, 1.957763671875, 2.0289306640625, 2.10009765625, 2.1712646484375, 2.242431640625, 2.3135986328125, 2.384765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 14.0, 31.0, 11.0, 36.0, 46.0, 79.0, 98.0, 164.0, 243.0, 369.0, 543.0, 823.0, 1340.0, 2093.0, 3631.0, 7646.0, 28531.0, 283712.0, 626540.0, 68492.0, 11970.0, 4835.0, 2669.0, 1560.0, 1049.0, 680.0, 414.0, 284.0, 181.0, 125.0, 91.0, 75.0, 48.0, 37.0, 22.0, 24.0, 12.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.0546875, -6.82867431640625, -6.6026611328125, -6.37664794921875, -6.150634765625, -5.92462158203125, -5.6986083984375, -5.47259521484375, -5.24658203125, -5.02056884765625, -4.7945556640625, -4.56854248046875, -4.342529296875, -4.11651611328125, -3.8905029296875, -3.66448974609375, -3.4384765625, -3.21246337890625, -2.9864501953125, -2.76043701171875, -2.534423828125, -2.30841064453125, -2.0823974609375, -1.85638427734375, -1.63037109375, -1.40435791015625, -1.1783447265625, -0.95233154296875, -0.726318359375, -0.50030517578125, -0.2742919921875, -0.04827880859375, 0.177734375, 0.40374755859375, 0.6297607421875, 0.85577392578125, 1.081787109375, 1.30780029296875, 1.5338134765625, 1.75982666015625, 1.98583984375, 2.21185302734375, 2.4378662109375, 2.66387939453125, 2.889892578125, 3.11590576171875, 3.3419189453125, 3.56793212890625, 3.7939453125, 4.01995849609375, 4.2459716796875, 4.47198486328125, 4.697998046875, 4.92401123046875, 5.1500244140625, 5.37603759765625, 5.60205078125, 5.82806396484375, 6.0540771484375, 6.28009033203125, 6.506103515625, 6.73211669921875, 6.9581298828125, 7.18414306640625, 7.41015625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 15.0, 18.0, 28.0, 47.0, 87.0, 127.0, 203.0, 180.0, 108.0, 77.0, 49.0, 16.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.0002760887145996094, -0.0002685803920030594, -0.0002610720694065094, -0.0002535637468099594, -0.0002460554242134094, -0.00023854710161685944, -0.00023103877902030945, -0.00022353045642375946, -0.00021602213382720947, -0.00020851381123065948, -0.0002010054886341095, -0.0001934971660375595, -0.00018598884344100952, -0.00017848052084445953, -0.00017097219824790955, -0.00016346387565135956, -0.00015595555305480957, -0.00014844723045825958, -0.0001409389078617096, -0.0001334305852651596, -0.00012592226266860962, -0.00011841394007205963, -0.00011090561747550964, -0.00010339729487895966, -9.588897228240967e-05, -8.838064968585968e-05, -8.087232708930969e-05, -7.33640044927597e-05, -6.585568189620972e-05, -5.834735929965973e-05, -5.083903670310974e-05, -4.3330714106559753e-05, -3.5822391510009766e-05, -2.8314068913459778e-05, -2.080574631690979e-05, -1.3297423720359802e-05, -5.7891011238098145e-06, 1.7192214727401733e-06, 9.227544069290161e-06, 1.673586666584015e-05, 2.4244189262390137e-05, 3.1752511858940125e-05, 3.926083445549011e-05, 4.67691570520401e-05, 5.427747964859009e-05, 6.178580224514008e-05, 6.929412484169006e-05, 7.680244743824005e-05, 8.431077003479004e-05, 9.181909263134003e-05, 9.932741522789001e-05, 0.00010683573782444, 0.00011434406042098999, 0.00012185238301753998, 0.00012936070561408997, 0.00013686902821063995, 0.00014437735080718994, 0.00015188567340373993, 0.00015939399600028992, 0.0001669023185968399, 0.0001744106411933899, 0.00018191896378993988, 0.00018942728638648987, 0.00019693560898303986, 0.00020444393157958984]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 6.0, 10.0, 10.0, 20.0, 20.0, 32.0, 44.0, 62.0, 87.0, 153.0, 154.0, 221.0, 371.0, 477.0, 675.0, 905.0, 1238.0, 1815.0, 2633.0, 3704.0, 6394.0, 14068.0, 46577.0, 197767.0, 460764.0, 222680.0, 52594.0, 15245.0, 6743.0, 3942.0, 2602.0, 1857.0, 1347.0, 959.0, 637.0, 481.0, 335.0, 286.0, 177.0, 136.0, 96.0, 78.0, 55.0, 33.0, 18.0, 13.0, 11.0, 5.0, 5.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-4.03515625, -3.911163330078125, -3.78717041015625, -3.663177490234375, -3.5391845703125, -3.415191650390625, -3.29119873046875, -3.167205810546875, -3.043212890625, -2.919219970703125, -2.79522705078125, -2.671234130859375, -2.5472412109375, -2.423248291015625, -2.29925537109375, -2.175262451171875, -2.05126953125, -1.927276611328125, -1.80328369140625, -1.679290771484375, -1.5552978515625, -1.431304931640625, -1.30731201171875, -1.183319091796875, -1.059326171875, -0.935333251953125, -0.81134033203125, -0.687347412109375, -0.5633544921875, -0.439361572265625, -0.31536865234375, -0.191375732421875, -0.0673828125, 0.056610107421875, 0.18060302734375, 0.304595947265625, 0.4285888671875, 0.552581787109375, 0.67657470703125, 0.800567626953125, 0.924560546875, 1.048553466796875, 1.17254638671875, 1.296539306640625, 1.4205322265625, 1.544525146484375, 1.66851806640625, 1.792510986328125, 1.91650390625, 2.040496826171875, 2.16448974609375, 2.288482666015625, 2.4124755859375, 2.536468505859375, 2.66046142578125, 2.784454345703125, 2.908447265625, 3.032440185546875, 3.15643310546875, 3.280426025390625, 3.4044189453125, 3.528411865234375, 3.65240478515625, 3.776397705078125, 3.900390625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 2.0, 14.0, 22.0, 74.0, 160.0, 227.0, 215.0, 147.0, 72.0, 23.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8193359375, -1.76055908203125, -1.7017822265625, -1.64300537109375, -1.584228515625, -1.52545166015625, -1.4666748046875, -1.40789794921875, -1.34912109375, -1.29034423828125, -1.2315673828125, -1.17279052734375, -1.114013671875, -1.05523681640625, -0.9964599609375, -0.93768310546875, -0.87890625, -0.82012939453125, -0.7613525390625, -0.70257568359375, -0.643798828125, -0.58502197265625, -0.5262451171875, -0.46746826171875, -0.40869140625, -0.34991455078125, -0.2911376953125, -0.23236083984375, -0.173583984375, -0.11480712890625, -0.0560302734375, 0.00274658203125, 0.0615234375, 0.12030029296875, 0.1790771484375, 0.23785400390625, 0.296630859375, 0.35540771484375, 0.4141845703125, 0.47296142578125, 0.53173828125, 0.59051513671875, 0.6492919921875, 0.70806884765625, 0.766845703125, 0.82562255859375, 0.8843994140625, 0.94317626953125, 1.001953125, 1.06072998046875, 1.1195068359375, 1.17828369140625, 1.237060546875, 1.29583740234375, 1.3546142578125, 1.41339111328125, 1.47216796875, 1.53094482421875, 1.5897216796875, 1.64849853515625, 1.707275390625, 1.76605224609375, 1.8248291015625, 1.88360595703125, 1.9423828125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 1.0, 5.0, 8.0, 1.0, 2.0, 10.0, 3.0, 12.0, 10.0, 13.0, 18.0, 28.0, 42.0, 35.0, 49.0, 46.0, 63.0, 75.0, 69.0, 84.0, 64.0, 60.0, 58.0, 57.0, 43.0, 24.0, 29.0, 22.0, 18.0, 15.0, 11.0, 7.0, 10.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.02247428894043, -9.74274730682373, -9.463020324707031, -9.183293342590332, -8.903566360473633, -8.623838424682617, -8.344111442565918, -8.064384460449219, -7.7846574783325195, -7.50493049621582, -7.225203514099121, -6.945476055145264, -6.6657490730285645, -6.386022090911865, -6.106294631958008, -5.826567649841309, -5.546840667724609, -5.26711368560791, -4.987386703491211, -4.7076592445373535, -4.427932262420654, -4.148205280303955, -3.8684780597686768, -3.5887508392333984, -3.309023857116699, -3.029296875, -2.7495696544647217, -2.4698424339294434, -2.190115451812744, -1.9103883504867554, -1.6306612491607666, -1.3509341478347778, -1.071207046508789, -0.7914799451828003, -0.5117528438568115, -0.23202574253082275, 0.047701358795166016, 0.3274284601211548, 0.6071555614471436, 0.8868826627731323, 1.166609764099121, 1.4463368654251099, 1.7260639667510986, 2.005791187286377, 2.285518169403076, 2.5652451515197754, 2.8449723720550537, 3.124699592590332, 3.4044265747070312, 3.6841535568237305, 3.963880777359009, 4.243607997894287, 4.523334980010986, 4.8030619621276855, 5.082789421081543, 5.362516403198242, 5.642243385314941, 5.921970367431641, 6.20169734954834, 6.481424808502197, 6.7611517906188965, 7.040878772735596, 7.320606231689453, 7.600333213806152, 7.880060195922852]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 11.0, 7.0, 2.0, 8.0, 7.0, 9.0, 9.0, 12.0, 11.0, 17.0, 16.0, 22.0, 27.0, 28.0, 22.0, 44.0, 27.0, 35.0, 39.0, 34.0, 40.0, 47.0, 37.0, 35.0, 31.0, 28.0, 32.0, 34.0, 30.0, 35.0, 26.0, 27.0, 30.0, 29.0, 22.0, 19.0, 18.0, 10.0, 13.0, 17.0, 11.0, 8.0, 8.0, 7.0, 6.0, 6.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5768890380859375, -3.4689245223999023, -3.360960006713867, -3.252995491027832, -3.145030975341797, -3.0370664596557617, -2.9291017055511475, -2.8211371898651123, -2.713172674179077, -2.605208158493042, -2.497243642807007, -2.3892791271209717, -2.2813143730163574, -2.1733498573303223, -2.065385341644287, -1.957420825958252, -1.8494563102722168, -1.7414917945861816, -1.6335272789001465, -1.5255626440048218, -1.4175981283187866, -1.3096336126327515, -1.2016689777374268, -1.0937044620513916, -0.9857399463653564, -0.8777754306793213, -0.7698108553886414, -0.6618462800979614, -0.5538817644119263, -0.4459172487258911, -0.3379526734352112, -0.22998809814453125, -0.12202334403991699, -0.014058798551559448, 0.0939057469367981, 0.20187029242515564, 0.3098348379135132, 0.41779935359954834, 0.5257639288902283, 0.6337285041809082, 0.7416930198669434, 0.8496575355529785, 0.9576221108436584, 1.0655866861343384, 1.1735512018203735, 1.2815157175064087, 1.3894803524017334, 1.4974448680877686, 1.6054093837738037, 1.7133738994598389, 1.821338415145874, 1.9293030500411987, 2.0372676849365234, 2.1452322006225586, 2.2531967163085938, 2.361161231994629, 2.469125747680664, 2.577090263366699, 2.6850547790527344, 2.7930192947387695, 2.9009838104248047, 3.00894832611084, 3.116913080215454, 3.2248775959014893, 3.3328421115875244]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 7.0, 5.0, 11.0, 17.0, 22.0, 26.0, 39.0, 71.0, 104.0, 141.0, 231.0, 390.0, 579.0, 889.0, 1374.0, 2266.0, 3772.0, 6196.0, 10300.0, 17323.0, 29887.0, 51315.0, 86017.0, 131655.0, 172841.0, 175128.0, 137086.0, 89733.0, 53970.0, 31486.0, 18131.0, 10696.0, 6308.0, 3920.0, 2382.0, 1476.0, 1002.0, 574.0, 363.0, 251.0, 167.0, 135.0, 81.0, 62.0, 43.0, 25.0, 26.0, 13.0, 13.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.44140625, -5.26031494140625, -5.0792236328125, -4.89813232421875, -4.717041015625, -4.53594970703125, -4.3548583984375, -4.17376708984375, -3.99267578125, -3.81158447265625, -3.6304931640625, -3.44940185546875, -3.268310546875, -3.08721923828125, -2.9061279296875, -2.72503662109375, -2.5439453125, -2.36285400390625, -2.1817626953125, -2.00067138671875, -1.819580078125, -1.63848876953125, -1.4573974609375, -1.27630615234375, -1.09521484375, -0.91412353515625, -0.7330322265625, -0.55194091796875, -0.370849609375, -0.18975830078125, -0.0086669921875, 0.17242431640625, 0.353515625, 0.53460693359375, 0.7156982421875, 0.89678955078125, 1.077880859375, 1.25897216796875, 1.4400634765625, 1.62115478515625, 1.80224609375, 1.98333740234375, 2.1644287109375, 2.34552001953125, 2.526611328125, 2.70770263671875, 2.8887939453125, 3.06988525390625, 3.2509765625, 3.43206787109375, 3.6131591796875, 3.79425048828125, 3.975341796875, 4.15643310546875, 4.3375244140625, 4.51861572265625, 4.69970703125, 4.88079833984375, 5.0618896484375, 5.24298095703125, 5.424072265625, 5.60516357421875, 5.7862548828125, 5.96734619140625, 6.1484375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 17.0, 15.0, 12.0, 11.0, 14.0, 21.0, 14.0, 21.0, 30.0, 35.0, 36.0, 29.0, 41.0, 34.0, 34.0, 38.0, 36.0, 59.0, 36.0, 40.0, 42.0, 38.0, 41.0, 30.0, 30.0, 24.0, 26.0, 27.0, 11.0, 14.0, 19.0, 19.0, 15.0, 16.0, 12.0, 7.0, 10.0, 3.0, 6.0, 7.0, 2.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.1484375, -4.02545166015625, -3.9024658203125, -3.77947998046875, -3.656494140625, -3.53350830078125, -3.4105224609375, -3.28753662109375, -3.16455078125, -3.04156494140625, -2.9185791015625, -2.79559326171875, -2.672607421875, -2.54962158203125, -2.4266357421875, -2.30364990234375, -2.1806640625, -2.05767822265625, -1.9346923828125, -1.81170654296875, -1.688720703125, -1.56573486328125, -1.4427490234375, -1.31976318359375, -1.19677734375, -1.07379150390625, -0.9508056640625, -0.82781982421875, -0.704833984375, -0.58184814453125, -0.4588623046875, -0.33587646484375, -0.212890625, -0.08990478515625, 0.0330810546875, 0.15606689453125, 0.279052734375, 0.40203857421875, 0.5250244140625, 0.64801025390625, 0.77099609375, 0.89398193359375, 1.0169677734375, 1.13995361328125, 1.262939453125, 1.38592529296875, 1.5089111328125, 1.63189697265625, 1.7548828125, 1.87786865234375, 2.0008544921875, 2.12384033203125, 2.246826171875, 2.36981201171875, 2.4927978515625, 2.61578369140625, 2.73876953125, 2.86175537109375, 2.9847412109375, 3.10772705078125, 3.230712890625, 3.35369873046875, 3.4766845703125, 3.59967041015625, 3.72265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 15.0, 24.0, 24.0, 46.0, 72.0, 113.0, 137.0, 207.0, 355.0, 579.0, 865.0, 1432.0, 2137.0, 3528.0, 5557.0, 8525.0, 13504.0, 21222.0, 33384.0, 52190.0, 77359.0, 107766.0, 135119.0, 145221.0, 130850.0, 103096.0, 72093.0, 47768.0, 31245.0, 19829.0, 12573.0, 7812.0, 4996.0, 3276.0, 2033.0, 1281.0, 798.0, 548.0, 325.0, 222.0, 148.0, 86.0, 74.0, 49.0, 28.0, 17.0, 8.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.15234375, -5.00262451171875, -4.8529052734375, -4.70318603515625, -4.553466796875, -4.40374755859375, -4.2540283203125, -4.10430908203125, -3.95458984375, -3.80487060546875, -3.6551513671875, -3.50543212890625, -3.355712890625, -3.20599365234375, -3.0562744140625, -2.90655517578125, -2.7568359375, -2.60711669921875, -2.4573974609375, -2.30767822265625, -2.157958984375, -2.00823974609375, -1.8585205078125, -1.70880126953125, -1.55908203125, -1.40936279296875, -1.2596435546875, -1.10992431640625, -0.960205078125, -0.81048583984375, -0.6607666015625, -0.51104736328125, -0.361328125, -0.21160888671875, -0.0618896484375, 0.08782958984375, 0.237548828125, 0.38726806640625, 0.5369873046875, 0.68670654296875, 0.83642578125, 0.98614501953125, 1.1358642578125, 1.28558349609375, 1.435302734375, 1.58502197265625, 1.7347412109375, 1.88446044921875, 2.0341796875, 2.18389892578125, 2.3336181640625, 2.48333740234375, 2.633056640625, 2.78277587890625, 2.9324951171875, 3.08221435546875, 3.23193359375, 3.38165283203125, 3.5313720703125, 3.68109130859375, 3.830810546875, 3.98052978515625, 4.1302490234375, 4.27996826171875, 4.4296875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 5.0, 7.0, 11.0, 13.0, 15.0, 6.0, 27.0, 21.0, 22.0, 28.0, 21.0, 54.0, 34.0, 46.0, 26.0, 33.0, 30.0, 33.0, 40.0, 50.0, 45.0, 34.0, 47.0, 41.0, 43.0, 36.0, 38.0, 28.0, 20.0, 28.0, 16.0, 14.0, 14.0, 12.0, 12.0, 9.0, 8.0, 7.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.690673828125, -2.60791015625, -2.525146484375, -2.4423828125, -2.359619140625, -2.27685546875, -2.194091796875, -2.111328125, -2.028564453125, -1.94580078125, -1.863037109375, -1.7802734375, -1.697509765625, -1.61474609375, -1.531982421875, -1.44921875, -1.366455078125, -1.28369140625, -1.200927734375, -1.1181640625, -1.035400390625, -0.95263671875, -0.869873046875, -0.787109375, -0.704345703125, -0.62158203125, -0.538818359375, -0.4560546875, -0.373291015625, -0.29052734375, -0.207763671875, -0.125, -0.042236328125, 0.04052734375, 0.123291015625, 0.2060546875, 0.288818359375, 0.37158203125, 0.454345703125, 0.537109375, 0.619873046875, 0.70263671875, 0.785400390625, 0.8681640625, 0.950927734375, 1.03369140625, 1.116455078125, 1.19921875, 1.281982421875, 1.36474609375, 1.447509765625, 1.5302734375, 1.613037109375, 1.69580078125, 1.778564453125, 1.861328125, 1.944091796875, 2.02685546875, 2.109619140625, 2.1923828125, 2.275146484375, 2.35791015625, 2.440673828125, 2.5234375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 13.0, 32.0, 29.0, 50.0, 68.0, 126.0, 167.0, 240.0, 325.0, 533.0, 757.0, 1178.0, 1777.0, 2722.0, 4218.0, 6489.0, 10618.0, 17071.0, 28490.0, 49149.0, 83861.0, 136944.0, 186947.0, 184698.0, 132740.0, 80585.0, 46441.0, 27354.0, 16557.0, 10070.0, 6354.0, 4196.0, 2622.0, 1727.0, 1129.0, 711.0, 478.0, 364.0, 241.0, 146.0, 106.0, 75.0, 46.0, 33.0, 29.0, 16.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.648773193359375, -2.55731201171875, -2.465850830078125, -2.3743896484375, -2.282928466796875, -2.19146728515625, -2.100006103515625, -2.008544921875, -1.917083740234375, -1.82562255859375, -1.734161376953125, -1.6427001953125, -1.551239013671875, -1.45977783203125, -1.368316650390625, -1.27685546875, -1.185394287109375, -1.09393310546875, -1.002471923828125, -0.9110107421875, -0.819549560546875, -0.72808837890625, -0.636627197265625, -0.545166015625, -0.453704833984375, -0.36224365234375, -0.270782470703125, -0.1793212890625, -0.087860107421875, 0.00360107421875, 0.095062255859375, 0.1865234375, 0.277984619140625, 0.36944580078125, 0.460906982421875, 0.5523681640625, 0.643829345703125, 0.73529052734375, 0.826751708984375, 0.918212890625, 1.009674072265625, 1.10113525390625, 1.192596435546875, 1.2840576171875, 1.375518798828125, 1.46697998046875, 1.558441162109375, 1.64990234375, 1.741363525390625, 1.83282470703125, 1.924285888671875, 2.0157470703125, 2.107208251953125, 2.19866943359375, 2.290130615234375, 2.381591796875, 2.473052978515625, 2.56451416015625, 2.655975341796875, 2.7474365234375, 2.838897705078125, 2.93035888671875, 3.021820068359375, 3.11328125]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 8.0, 6.0, 14.0, 15.0, 27.0, 28.0, 33.0, 35.0, 45.0, 67.0, 55.0, 90.0, 81.0, 94.0, 84.0, 52.0, 59.0, 46.0, 32.0, 23.0, 13.0, 10.0, 17.0, 9.0, 9.0, 8.0, 9.0, 2.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004417896270751953, -0.0004290565848350525, -0.00041632354259490967, -0.00040359050035476685, -0.000390857458114624, -0.0003781244158744812, -0.0003653913736343384, -0.00035265833139419556, -0.00033992528915405273, -0.0003271922469139099, -0.0003144592046737671, -0.00030172616243362427, -0.00028899312019348145, -0.0002762600779533386, -0.0002635270357131958, -0.000250793993473053, -0.00023806095123291016, -0.00022532790899276733, -0.0002125948667526245, -0.0001998618245124817, -0.00018712878227233887, -0.00017439574003219604, -0.00016166269779205322, -0.0001489296555519104, -0.00013619661331176758, -0.00012346357107162476, -0.00011073052883148193, -9.799748659133911e-05, -8.526444435119629e-05, -7.253140211105347e-05, -5.9798359870910645e-05, -4.706531763076782e-05, -3.4332275390625e-05, -2.1599233150482178e-05, -8.866190910339355e-06, 3.866851329803467e-06, 1.659989356994629e-05, 2.933293581008911e-05, 4.2065978050231934e-05, 5.4799020290374756e-05, 6.753206253051758e-05, 8.02651047706604e-05, 9.299814701080322e-05, 0.00010573118925094604, 0.00011846423149108887, 0.0001311972737312317, 0.0001439303159713745, 0.00015666335821151733, 0.00016939640045166016, 0.00018212944269180298, 0.0001948624849319458, 0.00020759552717208862, 0.00022032856941223145, 0.00023306161165237427, 0.0002457946538925171, 0.0002585276961326599, 0.00027126073837280273, 0.00028399378061294556, 0.0002967268228530884, 0.0003094598650932312, 0.000322192907333374, 0.00033492594957351685, 0.00034765899181365967, 0.0003603920340538025, 0.0003731250762939453]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 12.0, 20.0, 28.0, 43.0, 66.0, 100.0, 129.0, 218.0, 327.0, 508.0, 797.0, 1275.0, 1953.0, 3260.0, 5245.0, 8893.0, 15100.0, 25387.0, 43762.0, 74170.0, 119281.0, 169340.0, 184334.0, 149630.0, 99361.0, 59879.0, 34525.0, 20423.0, 11874.0, 7185.0, 4263.0, 2574.0, 1626.0, 1052.0, 674.0, 405.0, 281.0, 193.0, 109.0, 94.0, 54.0, 34.0, 26.0, 24.0, 11.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.273162841796875, -2.19281005859375, -2.112457275390625, -2.0321044921875, -1.951751708984375, -1.87139892578125, -1.791046142578125, -1.710693359375, -1.630340576171875, -1.54998779296875, -1.469635009765625, -1.3892822265625, -1.308929443359375, -1.22857666015625, -1.148223876953125, -1.06787109375, -0.987518310546875, -0.90716552734375, -0.826812744140625, -0.7464599609375, -0.666107177734375, -0.58575439453125, -0.505401611328125, -0.425048828125, -0.344696044921875, -0.26434326171875, -0.183990478515625, -0.1036376953125, -0.023284912109375, 0.05706787109375, 0.137420654296875, 0.2177734375, 0.298126220703125, 0.37847900390625, 0.458831787109375, 0.5391845703125, 0.619537353515625, 0.69989013671875, 0.780242919921875, 0.860595703125, 0.940948486328125, 1.02130126953125, 1.101654052734375, 1.1820068359375, 1.262359619140625, 1.34271240234375, 1.423065185546875, 1.50341796875, 1.583770751953125, 1.66412353515625, 1.744476318359375, 1.8248291015625, 1.905181884765625, 1.98553466796875, 2.065887451171875, 2.146240234375, 2.226593017578125, 2.30694580078125, 2.387298583984375, 2.4676513671875, 2.548004150390625, 2.62835693359375, 2.708709716796875, 2.7890625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 0.0, 6.0, 2.0, 13.0, 7.0, 13.0, 12.0, 16.0, 11.0, 18.0, 25.0, 22.0, 26.0, 43.0, 47.0, 50.0, 60.0, 52.0, 46.0, 61.0, 52.0, 56.0, 36.0, 39.0, 53.0, 37.0, 35.0, 33.0, 27.0, 20.0, 10.0, 12.0, 11.0, 11.0, 9.0, 3.0, 3.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.708984375, -0.6871337890625, -0.665283203125, -0.6434326171875, -0.62158203125, -0.5997314453125, -0.577880859375, -0.5560302734375, -0.5341796875, -0.5123291015625, -0.490478515625, -0.4686279296875, -0.44677734375, -0.4249267578125, -0.403076171875, -0.3812255859375, -0.359375, -0.3375244140625, -0.315673828125, -0.2938232421875, -0.27197265625, -0.2501220703125, -0.228271484375, -0.2064208984375, -0.1845703125, -0.1627197265625, -0.140869140625, -0.1190185546875, -0.09716796875, -0.0753173828125, -0.053466796875, -0.0316162109375, -0.009765625, 0.0120849609375, 0.033935546875, 0.0557861328125, 0.07763671875, 0.0994873046875, 0.121337890625, 0.1431884765625, 0.1650390625, 0.1868896484375, 0.208740234375, 0.2305908203125, 0.25244140625, 0.2742919921875, 0.296142578125, 0.3179931640625, 0.33984375, 0.3616943359375, 0.383544921875, 0.4053955078125, 0.42724609375, 0.4490966796875, 0.470947265625, 0.4927978515625, 0.5146484375, 0.5364990234375, 0.558349609375, 0.5802001953125, 0.60205078125, 0.6239013671875, 0.645751953125, 0.6676025390625, 0.689453125]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 2.0, 7.0, 9.0, 7.0, 5.0, 11.0, 13.0, 13.0, 15.0, 23.0, 30.0, 31.0, 59.0, 70.0, 69.0, 73.0, 59.0, 82.0, 60.0, 71.0, 56.0, 57.0, 43.0, 34.0, 20.0, 23.0, 12.0, 11.0, 9.0, 8.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.548230171203613, -10.262133598327637, -9.97603702545166, -9.689939498901367, -9.40384292602539, -9.117746353149414, -8.831649780273438, -8.545553207397461, -8.259455680847168, -7.973359107971191, -7.687262058258057, -7.40116548538208, -7.115068435668945, -6.828971862792969, -6.542875289916992, -6.256778240203857, -5.970681667327881, -5.684585094451904, -5.3984880447387695, -5.112391471862793, -4.826294422149658, -4.540197849273682, -4.254100799560547, -3.9680042266845703, -3.6819074153900146, -3.395810604095459, -3.1097137928009033, -2.8236169815063477, -2.537520408630371, -2.2514233589172363, -1.9653267860412598, -1.679229974746704, -1.3931326866149902, -1.1070358753204346, -0.8209391236305237, -0.5348423719406128, -0.24874556064605713, 0.037351250648498535, 0.32344794273376465, 0.6095447540283203, 0.895641565322876, 1.1817383766174316, 1.4678351879119873, 1.7539318799972534, 2.0400285720825195, 2.3261256217956543, 2.612222194671631, 2.8983190059661865, 3.184415817260742, 3.470512628555298, 3.7566094398498535, 4.04270601272583, 4.328803062438965, 4.614899635314941, 4.900996208190918, 5.187093257904053, 5.4731903076171875, 5.759286880493164, 6.045383930206299, 6.331480503082275, 6.61757755279541, 6.903674125671387, 7.189770698547363, 7.475867748260498, 7.761964321136475]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 9.0, 1.0, 8.0, 10.0, 11.0, 10.0, 8.0, 12.0, 26.0, 18.0, 15.0, 17.0, 20.0, 27.0, 23.0, 28.0, 35.0, 33.0, 27.0, 39.0, 32.0, 39.0, 29.0, 26.0, 42.0, 29.0, 41.0, 34.0, 34.0, 25.0, 33.0, 36.0, 29.0, 22.0, 21.0, 10.0, 22.0, 15.0, 19.0, 14.0, 9.0, 15.0, 8.0, 10.0, 9.0, 5.0, 7.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0], "bins": [-3.612844944000244, -3.507185459136963, -3.4015259742736816, -3.2958664894104004, -3.1902072429656982, -3.084547758102417, -2.9788882732391357, -2.8732287883758545, -2.7675695419311523, -2.661910057067871, -2.55625057220459, -2.4505910873413086, -2.3449318408966064, -2.239272356033325, -2.133612871170044, -2.0279533863067627, -1.9222939014434814, -1.8166344165802002, -1.7109750509262085, -1.6053155660629272, -1.4996562004089355, -1.3939967155456543, -1.288337230682373, -1.1826777458190918, -1.0770183801651, -0.9713589549064636, -0.8656995296478271, -0.7600400447845459, -0.6543806195259094, -0.548721194267273, -0.4430617094039917, -0.3374022841453552, -0.23174285888671875, -0.12608341872692108, -0.020423978567123413, 0.08523547649383545, 0.19089490175247192, 0.2965543270111084, 0.40221381187438965, 0.5078732371330261, 0.6135326623916626, 0.7191920876502991, 0.8248515129089355, 0.9305109977722168, 1.036170482635498, 1.1418298482894897, 1.247489333152771, 1.3531486988067627, 1.458808183670044, 1.5644676685333252, 1.670127034187317, 1.7757865190505981, 1.8814458847045898, 1.987105369567871, 2.0927648544311523, 2.1984243392944336, 2.304083824157715, 2.409743309020996, 2.5154027938842773, 2.6210622787475586, 2.7267215251922607, 2.832381010055542, 2.9380404949188232, 3.0436999797821045, 3.1493592262268066]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 2.0, 8.0, 9.0, 13.0, 17.0, 15.0, 35.0, 56.0, 87.0, 135.0, 189.0, 346.0, 587.0, 903.0, 1527.0, 2818.0, 5441.0, 10466.0, 22355.0, 51959.0, 134702.0, 403988.0, 1168476.0, 1473538.0, 597299.0, 188543.0, 69401.0, 29731.0, 14287.0, 7199.0, 4025.0, 2246.0, 1381.0, 820.0, 568.0, 353.0, 236.0, 166.0, 110.0, 80.0, 54.0, 35.0, 20.0, 16.0, 9.0, 15.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-9.7734375, -9.4874267578125, -9.201416015625, -8.9154052734375, -8.62939453125, -8.3433837890625, -8.057373046875, -7.7713623046875, -7.4853515625, -7.1993408203125, -6.913330078125, -6.6273193359375, -6.34130859375, -6.0552978515625, -5.769287109375, -5.4832763671875, -5.197265625, -4.9112548828125, -4.625244140625, -4.3392333984375, -4.05322265625, -3.7672119140625, -3.481201171875, -3.1951904296875, -2.9091796875, -2.6231689453125, -2.337158203125, -2.0511474609375, -1.76513671875, -1.4791259765625, -1.193115234375, -0.9071044921875, -0.62109375, -0.3350830078125, -0.049072265625, 0.2369384765625, 0.52294921875, 0.8089599609375, 1.094970703125, 1.3809814453125, 1.6669921875, 1.9530029296875, 2.239013671875, 2.5250244140625, 2.81103515625, 3.0970458984375, 3.383056640625, 3.6690673828125, 3.955078125, 4.2410888671875, 4.527099609375, 4.8131103515625, 5.09912109375, 5.3851318359375, 5.671142578125, 5.9571533203125, 6.2431640625, 6.5291748046875, 6.815185546875, 7.1011962890625, 7.38720703125, 7.6732177734375, 7.959228515625, 8.2452392578125, 8.53125]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 13.0, 11.0, 15.0, 17.0, 16.0, 13.0, 22.0, 22.0, 25.0, 34.0, 32.0, 35.0, 29.0, 47.0, 52.0, 40.0, 35.0, 52.0, 24.0, 39.0, 44.0, 43.0, 38.0, 36.0, 26.0, 25.0, 20.0, 23.0, 26.0, 16.0, 13.0, 20.0, 17.0, 13.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.142578125, -3.0423583984375, -2.942138671875, -2.8419189453125, -2.74169921875, -2.6414794921875, -2.541259765625, -2.4410400390625, -2.3408203125, -2.2406005859375, -2.140380859375, -2.0401611328125, -1.93994140625, -1.8397216796875, -1.739501953125, -1.6392822265625, -1.5390625, -1.4388427734375, -1.338623046875, -1.2384033203125, -1.13818359375, -1.0379638671875, -0.937744140625, -0.8375244140625, -0.7373046875, -0.6370849609375, -0.536865234375, -0.4366455078125, -0.33642578125, -0.2362060546875, -0.135986328125, -0.0357666015625, 0.064453125, 0.1646728515625, 0.264892578125, 0.3651123046875, 0.46533203125, 0.5655517578125, 0.665771484375, 0.7659912109375, 0.8662109375, 0.9664306640625, 1.066650390625, 1.1668701171875, 1.26708984375, 1.3673095703125, 1.467529296875, 1.5677490234375, 1.66796875, 1.7681884765625, 1.868408203125, 1.9686279296875, 2.06884765625, 2.1690673828125, 2.269287109375, 2.3695068359375, 2.4697265625, 2.5699462890625, 2.670166015625, 2.7703857421875, 2.87060546875, 2.9708251953125, 3.071044921875, 3.1712646484375, 3.271484375]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 20.0, 25.0, 34.0, 53.0, 104.0, 163.0, 251.0, 434.0, 761.0, 1428.0, 2452.0, 4558.0, 8724.0, 17776.0, 38274.0, 89123.0, 226184.0, 631933.0, 1435009.0, 1076413.0, 397374.0, 147987.0, 60958.0, 26992.0, 12984.0, 6490.0, 3466.0, 1846.0, 1038.0, 568.0, 322.0, 198.0, 112.0, 65.0, 62.0, 36.0, 20.0, 10.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.546875, -10.22509765625, -9.9033203125, -9.58154296875, -9.259765625, -8.93798828125, -8.6162109375, -8.29443359375, -7.97265625, -7.65087890625, -7.3291015625, -7.00732421875, -6.685546875, -6.36376953125, -6.0419921875, -5.72021484375, -5.3984375, -5.07666015625, -4.7548828125, -4.43310546875, -4.111328125, -3.78955078125, -3.4677734375, -3.14599609375, -2.82421875, -2.50244140625, -2.1806640625, -1.85888671875, -1.537109375, -1.21533203125, -0.8935546875, -0.57177734375, -0.25, 0.07177734375, 0.3935546875, 0.71533203125, 1.037109375, 1.35888671875, 1.6806640625, 2.00244140625, 2.32421875, 2.64599609375, 2.9677734375, 3.28955078125, 3.611328125, 3.93310546875, 4.2548828125, 4.57666015625, 4.8984375, 5.22021484375, 5.5419921875, 5.86376953125, 6.185546875, 6.50732421875, 6.8291015625, 7.15087890625, 7.47265625, 7.79443359375, 8.1162109375, 8.43798828125, 8.759765625, 9.08154296875, 9.4033203125, 9.72509765625, 10.046875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 7.0, 8.0, 11.0, 14.0, 21.0, 32.0, 38.0, 53.0, 71.0, 96.0, 152.0, 176.0, 228.0, 325.0, 346.0, 384.0, 411.0, 390.0, 332.0, 277.0, 179.0, 158.0, 94.0, 68.0, 65.0, 33.0, 25.0, 26.0, 11.0, 9.0, 7.0, 8.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.470703125, -3.37457275390625, -3.2784423828125, -3.18231201171875, -3.086181640625, -2.99005126953125, -2.8939208984375, -2.79779052734375, -2.70166015625, -2.60552978515625, -2.5093994140625, -2.41326904296875, -2.317138671875, -2.22100830078125, -2.1248779296875, -2.02874755859375, -1.9326171875, -1.83648681640625, -1.7403564453125, -1.64422607421875, -1.548095703125, -1.45196533203125, -1.3558349609375, -1.25970458984375, -1.16357421875, -1.06744384765625, -0.9713134765625, -0.87518310546875, -0.779052734375, -0.68292236328125, -0.5867919921875, -0.49066162109375, -0.39453125, -0.29840087890625, -0.2022705078125, -0.10614013671875, -0.010009765625, 0.08612060546875, 0.1822509765625, 0.27838134765625, 0.37451171875, 0.47064208984375, 0.5667724609375, 0.66290283203125, 0.759033203125, 0.85516357421875, 0.9512939453125, 1.04742431640625, 1.1435546875, 1.23968505859375, 1.3358154296875, 1.43194580078125, 1.528076171875, 1.62420654296875, 1.7203369140625, 1.81646728515625, 1.91259765625, 2.00872802734375, 2.1048583984375, 2.20098876953125, 2.297119140625, 2.39324951171875, 2.4893798828125, 2.58551025390625, 2.681640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 6.0, 12.0, 10.0, 17.0, 11.0, 22.0, 23.0, 34.0, 37.0, 39.0, 50.0, 72.0, 65.0, 81.0, 85.0, 62.0, 62.0, 73.0, 54.0, 37.0, 27.0, 31.0, 23.0, 15.0, 17.0, 8.0, 4.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.038509368896484, -12.719670295715332, -12.400830268859863, -12.081991195678711, -11.763152122497559, -11.444313049316406, -11.125473022460938, -10.806633949279785, -10.487794876098633, -10.16895580291748, -9.850115776062012, -9.53127670288086, -9.212437629699707, -8.893598556518555, -8.574758529663086, -8.255919456481934, -7.937079429626465, -7.618239879608154, -7.299400806427002, -6.980561256408691, -6.661722183227539, -6.3428826332092285, -6.024043083190918, -5.705204010009766, -5.386364459991455, -5.0675249099731445, -4.748685836791992, -4.429846286773682, -4.111006736755371, -3.7921676635742188, -3.473328113555908, -3.1544888019561768, -2.8356499671936035, -2.516810655593872, -2.1979713439941406, -1.87913179397583, -1.5602924823760986, -1.2414531707763672, -0.9226137399673462, -0.6037743091583252, -0.28493499755859375, 0.03390437364578247, 0.3527437448501587, 0.6715831160545349, 0.9904224872589111, 1.3092617988586426, 1.6281012296676636, 1.9469406604766846, 2.265779972076416, 2.5846192836761475, 2.903458595275879, 3.2222981452941895, 3.541137456893921, 3.8599767684936523, 4.178816318511963, 4.497655868530273, 4.816494941711426, 5.135334491729736, 5.454173564910889, 5.773013114929199, 6.091852188110352, 6.410691738128662, 6.729531288146973, 7.048370361328125, 7.3672099113464355]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 7.0, 4.0, 2.0, 5.0, 10.0, 10.0, 12.0, 19.0, 12.0, 21.0, 15.0, 20.0, 26.0, 25.0, 31.0, 29.0, 37.0, 35.0, 44.0, 40.0, 32.0, 41.0, 38.0, 45.0, 37.0, 37.0, 30.0, 28.0, 33.0, 34.0, 28.0, 34.0, 21.0, 27.0, 20.0, 17.0, 16.0, 11.0, 9.0, 8.0, 9.0, 11.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.489992618560791, -4.361401081085205, -4.232809543609619, -4.104218006134033, -3.9756264686584473, -3.8470349311828613, -3.7184433937072754, -3.5898518562316895, -3.4612603187561035, -3.3326687812805176, -3.2040772438049316, -3.0754857063293457, -2.9468941688537598, -2.818302631378174, -2.689711093902588, -2.561119556427002, -2.432528018951416, -2.30393648147583, -2.175344944000244, -2.046753406524658, -1.9181618690490723, -1.7895703315734863, -1.6609787940979004, -1.5323872566223145, -1.4037957191467285, -1.2752041816711426, -1.1466126441955566, -1.0180211067199707, -0.8894295692443848, -0.7608380317687988, -0.6322464942932129, -0.503654956817627, -0.3750631809234619, -0.24647164344787598, -0.11788010597229004, 0.010711431503295898, 0.13930296897888184, 0.2678945064544678, 0.3964860439300537, 0.5250775814056396, 0.6536691188812256, 0.7822606563568115, 0.9108521938323975, 1.0394437313079834, 1.1680352687835693, 1.2966268062591553, 1.4252183437347412, 1.5538098812103271, 1.682401418685913, 1.810992956161499, 1.939584493637085, 2.068176031112671, 2.196767568588257, 2.3253591060638428, 2.4539506435394287, 2.5825421810150146, 2.7111337184906006, 2.8397252559661865, 2.9683167934417725, 3.0969083309173584, 3.2254998683929443, 3.3540914058685303, 3.482682943344116, 3.611274480819702, 3.739866018295288]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 11.0, 17.0, 27.0, 28.0, 55.0, 83.0, 145.0, 220.0, 367.0, 546.0, 898.0, 1347.0, 2253.0, 3614.0, 5877.0, 9809.0, 16065.0, 26414.0, 42929.0, 68074.0, 103453.0, 142455.0, 163486.0, 149560.0, 111842.0, 74947.0, 47606.0, 29782.0, 18010.0, 11041.0, 6641.0, 4151.0, 2507.0, 1610.0, 990.0, 611.0, 385.0, 216.0, 168.0, 104.0, 74.0, 48.0, 24.0, 20.0, 10.0, 7.0, 10.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.74609375, -2.661895751953125, -2.57769775390625, -2.493499755859375, -2.4093017578125, -2.325103759765625, -2.24090576171875, -2.156707763671875, -2.072509765625, -1.988311767578125, -1.90411376953125, -1.819915771484375, -1.7357177734375, -1.651519775390625, -1.56732177734375, -1.483123779296875, -1.39892578125, -1.314727783203125, -1.23052978515625, -1.146331787109375, -1.0621337890625, -0.977935791015625, -0.89373779296875, -0.809539794921875, -0.725341796875, -0.641143798828125, -0.55694580078125, -0.472747802734375, -0.3885498046875, -0.304351806640625, -0.22015380859375, -0.135955810546875, -0.0517578125, 0.032440185546875, 0.11663818359375, 0.200836181640625, 0.2850341796875, 0.369232177734375, 0.45343017578125, 0.537628173828125, 0.621826171875, 0.706024169921875, 0.79022216796875, 0.874420166015625, 0.9586181640625, 1.042816162109375, 1.12701416015625, 1.211212158203125, 1.29541015625, 1.379608154296875, 1.46380615234375, 1.548004150390625, 1.6322021484375, 1.716400146484375, 1.80059814453125, 1.884796142578125, 1.968994140625, 2.053192138671875, 2.13739013671875, 2.221588134765625, 2.3057861328125, 2.389984130859375, 2.47418212890625, 2.558380126953125, 2.642578125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 3.0, 2.0, 8.0, 11.0, 10.0, 8.0, 20.0, 16.0, 16.0, 31.0, 24.0, 26.0, 32.0, 28.0, 30.0, 40.0, 33.0, 42.0, 35.0, 38.0, 38.0, 49.0, 43.0, 35.0, 37.0, 32.0, 31.0, 28.0, 24.0, 26.0, 28.0, 23.0, 16.0, 21.0, 18.0, 14.0, 22.0, 16.0, 6.0, 11.0, 3.0, 4.0, 2.0, 3.0, 3.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-4.80859375, -4.6680908203125, -4.527587890625, -4.3870849609375, -4.24658203125, -4.1060791015625, -3.965576171875, -3.8250732421875, -3.6845703125, -3.5440673828125, -3.403564453125, -3.2630615234375, -3.12255859375, -2.9820556640625, -2.841552734375, -2.7010498046875, -2.560546875, -2.4200439453125, -2.279541015625, -2.1390380859375, -1.99853515625, -1.8580322265625, -1.717529296875, -1.5770263671875, -1.4365234375, -1.2960205078125, -1.155517578125, -1.0150146484375, -0.87451171875, -0.7340087890625, -0.593505859375, -0.4530029296875, -0.3125, -0.1719970703125, -0.031494140625, 0.1090087890625, 0.24951171875, 0.3900146484375, 0.530517578125, 0.6710205078125, 0.8115234375, 0.9520263671875, 1.092529296875, 1.2330322265625, 1.37353515625, 1.5140380859375, 1.654541015625, 1.7950439453125, 1.935546875, 2.0760498046875, 2.216552734375, 2.3570556640625, 2.49755859375, 2.6380615234375, 2.778564453125, 2.9190673828125, 3.0595703125, 3.2000732421875, 3.340576171875, 3.4810791015625, 3.62158203125, 3.7620849609375, 3.902587890625, 4.0430908203125, 4.18359375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 14.0, 16.0, 25.0, 41.0, 58.0, 86.0, 160.0, 216.0, 358.0, 567.0, 908.0, 1341.0, 2097.0, 3384.0, 5395.0, 8590.0, 13861.0, 22577.0, 37153.0, 59953.0, 96685.0, 147856.0, 187504.0, 164790.0, 112137.0, 69944.0, 43215.0, 26360.0, 16346.0, 9906.0, 6310.0, 3955.0, 2398.0, 1478.0, 1032.0, 604.0, 445.0, 277.0, 181.0, 137.0, 73.0, 55.0, 26.0, 18.0, 8.0, 4.0, 9.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9375, -2.838470458984375, -2.73944091796875, -2.640411376953125, -2.5413818359375, -2.442352294921875, -2.34332275390625, -2.244293212890625, -2.145263671875, -2.046234130859375, -1.94720458984375, -1.848175048828125, -1.7491455078125, -1.650115966796875, -1.55108642578125, -1.452056884765625, -1.35302734375, -1.253997802734375, -1.15496826171875, -1.055938720703125, -0.9569091796875, -0.857879638671875, -0.75885009765625, -0.659820556640625, -0.560791015625, -0.461761474609375, -0.36273193359375, -0.263702392578125, -0.1646728515625, -0.065643310546875, 0.03338623046875, 0.132415771484375, 0.2314453125, 0.330474853515625, 0.42950439453125, 0.528533935546875, 0.6275634765625, 0.726593017578125, 0.82562255859375, 0.924652099609375, 1.023681640625, 1.122711181640625, 1.22174072265625, 1.320770263671875, 1.4197998046875, 1.518829345703125, 1.61785888671875, 1.716888427734375, 1.81591796875, 1.914947509765625, 2.01397705078125, 2.113006591796875, 2.2120361328125, 2.311065673828125, 2.41009521484375, 2.509124755859375, 2.608154296875, 2.707183837890625, 2.80621337890625, 2.905242919921875, 3.0042724609375, 3.103302001953125, 3.20233154296875, 3.301361083984375, 3.400390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 8.0, 7.0, 12.0, 14.0, 14.0, 16.0, 17.0, 20.0, 21.0, 24.0, 39.0, 31.0, 48.0, 47.0, 49.0, 48.0, 52.0, 45.0, 56.0, 47.0, 49.0, 35.0, 42.0, 29.0, 29.0, 31.0, 27.0, 24.0, 20.0, 20.0, 12.0, 16.0, 9.0, 8.0, 9.0, 7.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.998046875, -2.89984130859375, -2.8016357421875, -2.70343017578125, -2.605224609375, -2.50701904296875, -2.4088134765625, -2.31060791015625, -2.21240234375, -2.11419677734375, -2.0159912109375, -1.91778564453125, -1.819580078125, -1.72137451171875, -1.6231689453125, -1.52496337890625, -1.4267578125, -1.32855224609375, -1.2303466796875, -1.13214111328125, -1.033935546875, -0.93572998046875, -0.8375244140625, -0.73931884765625, -0.64111328125, -0.54290771484375, -0.4447021484375, -0.34649658203125, -0.248291015625, -0.15008544921875, -0.0518798828125, 0.04632568359375, 0.14453125, 0.24273681640625, 0.3409423828125, 0.43914794921875, 0.537353515625, 0.63555908203125, 0.7337646484375, 0.83197021484375, 0.93017578125, 1.02838134765625, 1.1265869140625, 1.22479248046875, 1.322998046875, 1.42120361328125, 1.5194091796875, 1.61761474609375, 1.7158203125, 1.81402587890625, 1.9122314453125, 2.01043701171875, 2.108642578125, 2.20684814453125, 2.3050537109375, 2.40325927734375, 2.50146484375, 2.59967041015625, 2.6978759765625, 2.79608154296875, 2.894287109375, 2.99249267578125, 3.0906982421875, 3.18890380859375, 3.287109375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 13.0, 21.0, 28.0, 34.0, 54.0, 88.0, 126.0, 210.0, 291.0, 498.0, 751.0, 1207.0, 1921.0, 3271.0, 5646.0, 9838.0, 18314.0, 36136.0, 75453.0, 157695.0, 276580.0, 230198.0, 115740.0, 54769.0, 26979.0, 14195.0, 7379.0, 4345.0, 2515.0, 1557.0, 977.0, 611.0, 369.0, 259.0, 150.0, 109.0, 69.0, 50.0, 37.0, 15.0, 25.0, 7.0, 8.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.951171875, -1.883392333984375, -1.81561279296875, -1.747833251953125, -1.6800537109375, -1.612274169921875, -1.54449462890625, -1.476715087890625, -1.408935546875, -1.341156005859375, -1.27337646484375, -1.205596923828125, -1.1378173828125, -1.070037841796875, -1.00225830078125, -0.934478759765625, -0.86669921875, -0.798919677734375, -0.73114013671875, -0.663360595703125, -0.5955810546875, -0.527801513671875, -0.46002197265625, -0.392242431640625, -0.324462890625, -0.256683349609375, -0.18890380859375, -0.121124267578125, -0.0533447265625, 0.014434814453125, 0.08221435546875, 0.149993896484375, 0.2177734375, 0.285552978515625, 0.35333251953125, 0.421112060546875, 0.4888916015625, 0.556671142578125, 0.62445068359375, 0.692230224609375, 0.760009765625, 0.827789306640625, 0.89556884765625, 0.963348388671875, 1.0311279296875, 1.098907470703125, 1.16668701171875, 1.234466552734375, 1.30224609375, 1.370025634765625, 1.43780517578125, 1.505584716796875, 1.5733642578125, 1.641143798828125, 1.70892333984375, 1.776702880859375, 1.844482421875, 1.912261962890625, 1.98004150390625, 2.047821044921875, 2.1156005859375, 2.183380126953125, 2.25115966796875, 2.318939208984375, 2.38671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 8.0, 9.0, 17.0, 13.0, 22.0, 26.0, 45.0, 43.0, 62.0, 64.0, 79.0, 89.0, 84.0, 88.0, 72.0, 61.0, 59.0, 36.0, 27.0, 25.0, 15.0, 15.0, 11.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00013518333435058594, -0.00013144686818122864, -0.00012771040201187134, -0.00012397393584251404, -0.00012023746967315674, -0.00011650100350379944, -0.00011276453733444214, -0.00010902807116508484, -0.00010529160499572754, -0.00010155513882637024, -9.781867265701294e-05, -9.408220648765564e-05, -9.034574031829834e-05, -8.660927414894104e-05, -8.287280797958374e-05, -7.913634181022644e-05, -7.539987564086914e-05, -7.166340947151184e-05, -6.792694330215454e-05, -6.419047713279724e-05, -6.045401096343994e-05, -5.671754479408264e-05, -5.298107862472534e-05, -4.924461245536804e-05, -4.550814628601074e-05, -4.177168011665344e-05, -3.803521394729614e-05, -3.429874777793884e-05, -3.056228160858154e-05, -2.6825815439224243e-05, -2.3089349269866943e-05, -1.9352883100509644e-05, -1.5616416931152344e-05, -1.1879950761795044e-05, -8.143484592437744e-06, -4.407018423080444e-06, -6.705522537231445e-07, 3.0659139156341553e-06, 6.802380084991455e-06, 1.0538846254348755e-05, 1.4275312423706055e-05, 1.8011778593063354e-05, 2.1748244762420654e-05, 2.5484710931777954e-05, 2.9221177101135254e-05, 3.2957643270492554e-05, 3.6694109439849854e-05, 4.043057560920715e-05, 4.416704177856445e-05, 4.790350794792175e-05, 5.163997411727905e-05, 5.537644028663635e-05, 5.911290645599365e-05, 6.284937262535095e-05, 6.658583879470825e-05, 7.032230496406555e-05, 7.405877113342285e-05, 7.779523730278015e-05, 8.153170347213745e-05, 8.526816964149475e-05, 8.900463581085205e-05, 9.274110198020935e-05, 9.647756814956665e-05, 0.00010021403431892395, 0.00010395050048828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 9.0, 18.0, 21.0, 25.0, 40.0, 63.0, 96.0, 129.0, 196.0, 270.0, 409.0, 664.0, 1035.0, 1520.0, 2564.0, 4085.0, 6591.0, 10849.0, 17641.0, 29810.0, 49855.0, 81558.0, 124626.0, 165253.0, 172013.0, 138372.0, 93880.0, 57888.0, 34945.0, 20960.0, 12527.0, 7669.0, 4716.0, 3029.0, 1832.0, 1117.0, 771.0, 482.0, 340.0, 235.0, 142.0, 83.0, 73.0, 63.0, 34.0, 24.0, 13.0, 9.0, 5.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4287109375, -1.38427734375, -1.33984375, -1.29541015625, -1.2509765625, -1.20654296875, -1.162109375, -1.11767578125, -1.0732421875, -1.02880859375, -0.984375, -0.93994140625, -0.8955078125, -0.85107421875, -0.806640625, -0.76220703125, -0.7177734375, -0.67333984375, -0.62890625, -0.58447265625, -0.5400390625, -0.49560546875, -0.451171875, -0.40673828125, -0.3623046875, -0.31787109375, -0.2734375, -0.22900390625, -0.1845703125, -0.14013671875, -0.095703125, -0.05126953125, -0.0068359375, 0.03759765625, 0.08203125, 0.12646484375, 0.1708984375, 0.21533203125, 0.259765625, 0.30419921875, 0.3486328125, 0.39306640625, 0.4375, 0.48193359375, 0.5263671875, 0.57080078125, 0.615234375, 0.65966796875, 0.7041015625, 0.74853515625, 0.79296875, 0.83740234375, 0.8818359375, 0.92626953125, 0.970703125, 1.01513671875, 1.0595703125, 1.10400390625, 1.1484375, 1.19287109375, 1.2373046875, 1.28173828125, 1.326171875, 1.37060546875, 1.4150390625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 5.0, 6.0, 9.0, 8.0, 15.0, 17.0, 24.0, 30.0, 37.0, 31.0, 42.0, 42.0, 51.0, 50.0, 50.0, 46.0, 58.0, 59.0, 66.0, 52.0, 39.0, 43.0, 39.0, 24.0, 33.0, 13.0, 18.0, 15.0, 12.0, 15.0, 6.0, 11.0, 3.0, 7.0, 6.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4138031005859375, -0.400115966796875, -0.3864288330078125, -0.37274169921875, -0.3590545654296875, -0.345367431640625, -0.3316802978515625, -0.3179931640625, -0.3043060302734375, -0.290618896484375, -0.2769317626953125, -0.26324462890625, -0.2495574951171875, -0.235870361328125, -0.2221832275390625, -0.20849609375, -0.1948089599609375, -0.181121826171875, -0.1674346923828125, -0.15374755859375, -0.1400604248046875, -0.126373291015625, -0.1126861572265625, -0.0989990234375, -0.0853118896484375, -0.071624755859375, -0.0579376220703125, -0.04425048828125, -0.0305633544921875, -0.016876220703125, -0.0031890869140625, 0.010498046875, 0.0241851806640625, 0.037872314453125, 0.0515594482421875, 0.06524658203125, 0.0789337158203125, 0.092620849609375, 0.1063079833984375, 0.1199951171875, 0.1336822509765625, 0.147369384765625, 0.1610565185546875, 0.17474365234375, 0.1884307861328125, 0.202117919921875, 0.2158050537109375, 0.2294921875, 0.2431793212890625, 0.256866455078125, 0.2705535888671875, 0.28424072265625, 0.2979278564453125, 0.311614990234375, 0.3253021240234375, 0.3389892578125, 0.3526763916015625, 0.366363525390625, 0.3800506591796875, 0.39373779296875, 0.4074249267578125, 0.421112060546875, 0.4347991943359375, 0.448486328125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 9.0, 10.0, 11.0, 18.0, 9.0, 17.0, 26.0, 32.0, 37.0, 36.0, 46.0, 72.0, 65.0, 77.0, 81.0, 56.0, 70.0, 63.0, 65.0, 41.0, 30.0, 34.0, 17.0, 21.0, 14.0, 9.0, 6.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0], "bins": [-12.656728744506836, -12.348825454711914, -12.040922164916992, -11.73301887512207, -11.425115585327148, -11.11721134185791, -10.809308052062988, -10.501404762268066, -10.193501472473145, -9.885598182678223, -9.5776948928833, -9.269791603088379, -8.96188735961914, -8.653984069824219, -8.346080780029297, -8.038177490234375, -7.730274200439453, -7.422370910644531, -7.114467620849609, -6.806563854217529, -6.498660564422607, -6.1907572746276855, -5.8828535079956055, -5.574950218200684, -5.267046928405762, -4.95914363861084, -4.651240348815918, -4.343336582183838, -4.035433292388916, -3.727530002593994, -3.419626474380493, -3.111722946166992, -2.8038196563720703, -2.4959163665771484, -2.1880128383636475, -1.880109429359436, -1.5722060203552246, -1.2643026113510132, -0.9563992023468018, -0.6484956741333008, -0.3405923843383789, -0.03268897533416748, 0.27521443367004395, 0.5831178426742554, 0.8910212516784668, 1.1989246606826782, 1.5068280696868896, 1.8147315979003906, 2.1226348876953125, 2.4305381774902344, 2.7384417057037354, 3.0463452339172363, 3.354248523712158, 3.66215181350708, 3.970055341720581, 4.277958869934082, 4.585862159729004, 4.893765449523926, 5.201668739318848, 5.509572505950928, 5.81747579574585, 6.1253790855407715, 6.433282852172852, 6.741186141967773, 7.049089431762695]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 2.0, 9.0, 11.0, 7.0, 16.0, 11.0, 24.0, 13.0, 18.0, 23.0, 22.0, 26.0, 36.0, 28.0, 34.0, 39.0, 37.0, 32.0, 39.0, 37.0, 41.0, 42.0, 45.0, 29.0, 31.0, 34.0, 31.0, 22.0, 34.0, 37.0, 23.0, 22.0, 21.0, 17.0, 17.0, 12.0, 7.0, 9.0, 13.0, 7.0, 9.0, 10.0, 7.0, 3.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.384467124938965, -4.258650779724121, -4.132833957672119, -4.007017612457275, -3.8812012672424316, -3.755384683609009, -3.629568099975586, -3.503751754760742, -3.3779351711273193, -3.2521185874938965, -3.1263022422790527, -3.00048565864563, -2.874669075012207, -2.7488527297973633, -2.6230361461639404, -2.4972195625305176, -2.371403217315674, -2.245586633682251, -2.1197702884674072, -1.9939537048339844, -1.868137240409851, -1.7423207759857178, -1.616504192352295, -1.4906877279281616, -1.3648712635040283, -1.239054799079895, -1.1132383346557617, -0.9874217510223389, -0.8616052865982056, -0.7357888221740723, -0.6099722981452942, -0.4841557741165161, -0.3583395481109619, -0.23252305388450623, -0.10670655965805054, 0.01910993456840515, 0.14492642879486084, 0.27074289321899414, 0.3965594172477722, 0.5223759412765503, 0.6481924057006836, 0.7740088701248169, 0.899825394153595, 1.025641918182373, 1.1514583826065063, 1.2772748470306396, 1.4030914306640625, 1.5289078950881958, 1.654724359512329, 1.7805408239364624, 1.9063572883605957, 2.0321738719940186, 2.1579904556274414, 2.283806800842285, 2.409623384475708, 2.535439968109131, 2.6612563133239746, 2.7870728969573975, 2.912889242172241, 3.038705825805664, 3.164522171020508, 3.2903387546539307, 3.4161553382873535, 3.5419716835021973, 3.66778826713562]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 11.0, 15.0, 11.0, 21.0, 18.0, 22.0, 42.0, 69.0, 99.0, 127.0, 182.0, 274.0, 440.0, 730.0, 1149.0, 1832.0, 3218.0, 5539.0, 9712.0, 17707.0, 32747.0, 61296.0, 112500.0, 181892.0, 217543.0, 172442.0, 104329.0, 56317.0, 29875.0, 16401.0, 8879.0, 5155.0, 2995.0, 1785.0, 1137.0, 684.0, 434.0, 283.0, 191.0, 136.0, 98.0, 69.0, 38.0, 30.0, 16.0, 16.0, 20.0, 9.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0], "bins": [-7.48828125, -7.27081298828125, -7.0533447265625, -6.83587646484375, -6.618408203125, -6.40093994140625, -6.1834716796875, -5.96600341796875, -5.74853515625, -5.53106689453125, -5.3135986328125, -5.09613037109375, -4.878662109375, -4.66119384765625, -4.4437255859375, -4.22625732421875, -4.0087890625, -3.79132080078125, -3.5738525390625, -3.35638427734375, -3.138916015625, -2.92144775390625, -2.7039794921875, -2.48651123046875, -2.26904296875, -2.05157470703125, -1.8341064453125, -1.61663818359375, -1.399169921875, -1.18170166015625, -0.9642333984375, -0.74676513671875, -0.529296875, -0.31182861328125, -0.0943603515625, 0.12310791015625, 0.340576171875, 0.55804443359375, 0.7755126953125, 0.99298095703125, 1.21044921875, 1.42791748046875, 1.6453857421875, 1.86285400390625, 2.080322265625, 2.29779052734375, 2.5152587890625, 2.73272705078125, 2.9501953125, 3.16766357421875, 3.3851318359375, 3.60260009765625, 3.820068359375, 4.03753662109375, 4.2550048828125, 4.47247314453125, 4.68994140625, 4.90740966796875, 5.1248779296875, 5.34234619140625, 5.559814453125, 5.77728271484375, 5.9947509765625, 6.21221923828125, 6.4296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 5.0, 2.0, 14.0, 10.0, 14.0, 5.0, 13.0, 16.0, 16.0, 16.0, 23.0, 20.0, 28.0, 34.0, 40.0, 25.0, 38.0, 48.0, 32.0, 38.0, 27.0, 41.0, 58.0, 45.0, 40.0, 29.0, 33.0, 27.0, 31.0, 25.0, 26.0, 26.0, 23.0, 18.0, 17.0, 12.0, 13.0, 10.0, 10.0, 10.0, 7.0, 4.0, 9.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-4.51953125, -4.38494873046875, -4.2503662109375, -4.11578369140625, -3.981201171875, -3.84661865234375, -3.7120361328125, -3.57745361328125, -3.44287109375, -3.30828857421875, -3.1737060546875, -3.03912353515625, -2.904541015625, -2.76995849609375, -2.6353759765625, -2.50079345703125, -2.3662109375, -2.23162841796875, -2.0970458984375, -1.96246337890625, -1.827880859375, -1.69329833984375, -1.5587158203125, -1.42413330078125, -1.28955078125, -1.15496826171875, -1.0203857421875, -0.88580322265625, -0.751220703125, -0.61663818359375, -0.4820556640625, -0.34747314453125, -0.212890625, -0.07830810546875, 0.0562744140625, 0.19085693359375, 0.325439453125, 0.46002197265625, 0.5946044921875, 0.72918701171875, 0.86376953125, 0.99835205078125, 1.1329345703125, 1.26751708984375, 1.402099609375, 1.53668212890625, 1.6712646484375, 1.80584716796875, 1.9404296875, 2.07501220703125, 2.2095947265625, 2.34417724609375, 2.478759765625, 2.61334228515625, 2.7479248046875, 2.88250732421875, 3.01708984375, 3.15167236328125, 3.2862548828125, 3.42083740234375, 3.555419921875, 3.69000244140625, 3.8245849609375, 3.95916748046875, 4.09375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 12.0, 17.0, 20.0, 28.0, 54.0, 53.0, 101.0, 132.0, 203.0, 319.0, 407.0, 618.0, 943.0, 1450.0, 2221.0, 3636.0, 5480.0, 9202.0, 15529.0, 26537.0, 45928.0, 76792.0, 122350.0, 169987.0, 181741.0, 145271.0, 96411.0, 58185.0, 34263.0, 19837.0, 11582.0, 7046.0, 4319.0, 2644.0, 1729.0, 1093.0, 827.0, 514.0, 349.0, 206.0, 154.0, 113.0, 80.0, 61.0, 25.0, 30.0, 24.0, 8.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.49609375, -5.31427001953125, -5.1324462890625, -4.95062255859375, -4.768798828125, -4.58697509765625, -4.4051513671875, -4.22332763671875, -4.04150390625, -3.85968017578125, -3.6778564453125, -3.49603271484375, -3.314208984375, -3.13238525390625, -2.9505615234375, -2.76873779296875, -2.5869140625, -2.40509033203125, -2.2232666015625, -2.04144287109375, -1.859619140625, -1.67779541015625, -1.4959716796875, -1.31414794921875, -1.13232421875, -0.95050048828125, -0.7686767578125, -0.58685302734375, -0.405029296875, -0.22320556640625, -0.0413818359375, 0.14044189453125, 0.322265625, 0.50408935546875, 0.6859130859375, 0.86773681640625, 1.049560546875, 1.23138427734375, 1.4132080078125, 1.59503173828125, 1.77685546875, 1.95867919921875, 2.1405029296875, 2.32232666015625, 2.504150390625, 2.68597412109375, 2.8677978515625, 3.04962158203125, 3.2314453125, 3.41326904296875, 3.5950927734375, 3.77691650390625, 3.958740234375, 4.14056396484375, 4.3223876953125, 4.50421142578125, 4.68603515625, 4.86785888671875, 5.0496826171875, 5.23150634765625, 5.413330078125, 5.59515380859375, 5.7769775390625, 5.95880126953125, 6.140625]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 3.0, 9.0, 7.0, 7.0, 6.0, 9.0, 7.0, 9.0, 16.0, 20.0, 23.0, 22.0, 25.0, 35.0, 26.0, 26.0, 37.0, 32.0, 35.0, 34.0, 29.0, 59.0, 40.0, 41.0, 34.0, 39.0, 34.0, 41.0, 28.0, 34.0, 29.0, 33.0, 29.0, 29.0, 18.0, 13.0, 10.0, 14.0, 10.0, 7.0, 10.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.34765625, -2.26690673828125, -2.1861572265625, -2.10540771484375, -2.024658203125, -1.94390869140625, -1.8631591796875, -1.78240966796875, -1.70166015625, -1.62091064453125, -1.5401611328125, -1.45941162109375, -1.378662109375, -1.29791259765625, -1.2171630859375, -1.13641357421875, -1.0556640625, -0.97491455078125, -0.8941650390625, -0.81341552734375, -0.732666015625, -0.65191650390625, -0.5711669921875, -0.49041748046875, -0.40966796875, -0.32891845703125, -0.2481689453125, -0.16741943359375, -0.086669921875, -0.00592041015625, 0.0748291015625, 0.15557861328125, 0.236328125, 0.31707763671875, 0.3978271484375, 0.47857666015625, 0.559326171875, 0.64007568359375, 0.7208251953125, 0.80157470703125, 0.88232421875, 0.96307373046875, 1.0438232421875, 1.12457275390625, 1.205322265625, 1.28607177734375, 1.3668212890625, 1.44757080078125, 1.5283203125, 1.60906982421875, 1.6898193359375, 1.77056884765625, 1.851318359375, 1.93206787109375, 2.0128173828125, 2.09356689453125, 2.17431640625, 2.25506591796875, 2.3358154296875, 2.41656494140625, 2.497314453125, 2.57806396484375, 2.6588134765625, 2.73956298828125, 2.8203125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 12.0, 18.0, 16.0, 31.0, 31.0, 62.0, 104.0, 128.0, 180.0, 218.0, 335.0, 477.0, 713.0, 1105.0, 1482.0, 2263.0, 3413.0, 5010.0, 7714.0, 12043.0, 18731.0, 29897.0, 49589.0, 82370.0, 131998.0, 182262.0, 179995.0, 128458.0, 80063.0, 48022.0, 29280.0, 18070.0, 11425.0, 7586.0, 4986.0, 3438.0, 2168.0, 1538.0, 1006.0, 679.0, 459.0, 352.0, 249.0, 165.0, 115.0, 76.0, 62.0, 43.0, 24.0, 25.0, 21.0, 13.0, 6.0, 9.0, 8.0, 1.0, 3.0], "bins": [-2.8203125, -2.734771728515625, -2.64923095703125, -2.563690185546875, -2.4781494140625, -2.392608642578125, -2.30706787109375, -2.221527099609375, -2.135986328125, -2.050445556640625, -1.96490478515625, -1.879364013671875, -1.7938232421875, -1.708282470703125, -1.62274169921875, -1.537200927734375, -1.45166015625, -1.366119384765625, -1.28057861328125, -1.195037841796875, -1.1094970703125, -1.023956298828125, -0.93841552734375, -0.852874755859375, -0.767333984375, -0.681793212890625, -0.59625244140625, -0.510711669921875, -0.4251708984375, -0.339630126953125, -0.25408935546875, -0.168548583984375, -0.0830078125, 0.002532958984375, 0.08807373046875, 0.173614501953125, 0.2591552734375, 0.344696044921875, 0.43023681640625, 0.515777587890625, 0.601318359375, 0.686859130859375, 0.77239990234375, 0.857940673828125, 0.9434814453125, 1.029022216796875, 1.11456298828125, 1.200103759765625, 1.28564453125, 1.371185302734375, 1.45672607421875, 1.542266845703125, 1.6278076171875, 1.713348388671875, 1.79888916015625, 1.884429931640625, 1.969970703125, 2.055511474609375, 2.14105224609375, 2.226593017578125, 2.3121337890625, 2.397674560546875, 2.48321533203125, 2.568756103515625, 2.654296875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 18.0, 7.0, 12.0, 14.0, 35.0, 55.0, 72.0, 92.0, 133.0, 151.0, 131.0, 106.0, 44.0, 53.0, 22.0, 18.0, 12.0, 8.0, 4.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007038116455078125, -0.000684000551700592, -0.0006641894578933716, -0.0006443783640861511, -0.0006245672702789307, -0.0006047561764717102, -0.0005849450826644897, -0.0005651339888572693, -0.0005453228950500488, -0.0005255118012428284, -0.0005057007074356079, -0.00048588961362838745, -0.000466078519821167, -0.00044626742601394653, -0.0004264563322067261, -0.0004066452383995056, -0.00038683414459228516, -0.0003670230507850647, -0.00034721195697784424, -0.0003274008631706238, -0.0003075897693634033, -0.00028777867555618286, -0.0002679675817489624, -0.00024815648794174194, -0.00022834539413452148, -0.00020853430032730103, -0.00018872320652008057, -0.0001689121127128601, -0.00014910101890563965, -0.0001292899250984192, -0.00010947883129119873, -8.966773748397827e-05, -6.985664367675781e-05, -5.0045549869537354e-05, -3.0234456062316895e-05, -1.0423362255096436e-05, 9.387731552124023e-06, 2.9198825359344482e-05, 4.900991916656494e-05, 6.88210129737854e-05, 8.863210678100586e-05, 0.00010844320058822632, 0.00012825429439544678, 0.00014806538820266724, 0.0001678764820098877, 0.00018768757581710815, 0.0002074986696243286, 0.00022730976343154907, 0.00024712085723876953, 0.00026693195104599, 0.00028674304485321045, 0.0003065541386604309, 0.00032636523246765137, 0.0003461763262748718, 0.0003659874200820923, 0.00038579851388931274, 0.0004056096076965332, 0.00042542070150375366, 0.0004452317953109741, 0.0004650428891181946, 0.00048485398292541504, 0.0005046650767326355, 0.000524476170539856, 0.0005442872643470764, 0.0005640983581542969]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 11.0, 23.0, 38.0, 45.0, 77.0, 128.0, 220.0, 300.0, 488.0, 805.0, 1349.0, 2166.0, 3529.0, 5783.0, 9777.0, 16467.0, 28049.0, 48774.0, 84367.0, 137972.0, 190378.0, 187617.0, 134591.0, 81597.0, 47261.0, 27275.0, 15814.0, 9243.0, 5574.0, 3465.0, 2075.0, 1234.0, 780.0, 474.0, 319.0, 186.0, 87.0, 78.0, 50.0, 29.0, 19.0, 15.0, 10.0, 6.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.48046875, -2.39483642578125, -2.3092041015625, -2.22357177734375, -2.137939453125, -2.05230712890625, -1.9666748046875, -1.88104248046875, -1.79541015625, -1.70977783203125, -1.6241455078125, -1.53851318359375, -1.452880859375, -1.36724853515625, -1.2816162109375, -1.19598388671875, -1.1103515625, -1.02471923828125, -0.9390869140625, -0.85345458984375, -0.767822265625, -0.68218994140625, -0.5965576171875, -0.51092529296875, -0.42529296875, -0.33966064453125, -0.2540283203125, -0.16839599609375, -0.082763671875, 0.00286865234375, 0.0885009765625, 0.17413330078125, 0.259765625, 0.34539794921875, 0.4310302734375, 0.51666259765625, 0.602294921875, 0.68792724609375, 0.7735595703125, 0.85919189453125, 0.94482421875, 1.03045654296875, 1.1160888671875, 1.20172119140625, 1.287353515625, 1.37298583984375, 1.4586181640625, 1.54425048828125, 1.6298828125, 1.71551513671875, 1.8011474609375, 1.88677978515625, 1.972412109375, 2.05804443359375, 2.1436767578125, 2.22930908203125, 2.31494140625, 2.40057373046875, 2.4862060546875, 2.57183837890625, 2.657470703125, 2.74310302734375, 2.8287353515625, 2.91436767578125, 3.0]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 7.0, 11.0, 7.0, 12.0, 21.0, 22.0, 36.0, 32.0, 37.0, 40.0, 46.0, 63.0, 74.0, 91.0, 79.0, 74.0, 44.0, 48.0, 37.0, 40.0, 37.0, 30.0, 23.0, 18.0, 17.0, 15.0, 8.0, 5.0, 8.0, 3.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.900390625, -0.869384765625, -0.83837890625, -0.807373046875, -0.7763671875, -0.745361328125, -0.71435546875, -0.683349609375, -0.65234375, -0.621337890625, -0.59033203125, -0.559326171875, -0.5283203125, -0.497314453125, -0.46630859375, -0.435302734375, -0.404296875, -0.373291015625, -0.34228515625, -0.311279296875, -0.2802734375, -0.249267578125, -0.21826171875, -0.187255859375, -0.15625, -0.125244140625, -0.09423828125, -0.063232421875, -0.0322265625, -0.001220703125, 0.02978515625, 0.060791015625, 0.091796875, 0.122802734375, 0.15380859375, 0.184814453125, 0.2158203125, 0.246826171875, 0.27783203125, 0.308837890625, 0.33984375, 0.370849609375, 0.40185546875, 0.432861328125, 0.4638671875, 0.494873046875, 0.52587890625, 0.556884765625, 0.587890625, 0.618896484375, 0.64990234375, 0.680908203125, 0.7119140625, 0.742919921875, 0.77392578125, 0.804931640625, 0.8359375, 0.866943359375, 0.89794921875, 0.928955078125, 0.9599609375, 0.990966796875, 1.02197265625, 1.052978515625, 1.083984375]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 18.0, 10.0, 9.0, 14.0, 28.0, 39.0, 28.0, 37.0, 39.0, 65.0, 71.0, 69.0, 82.0, 74.0, 63.0, 65.0, 54.0, 52.0, 41.0, 25.0, 18.0, 17.0, 13.0, 15.0, 10.0, 5.0, 8.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.7656831741333, -10.46187686920166, -10.158071517944336, -9.854265213012695, -9.550458908081055, -9.24665355682373, -8.94284725189209, -8.639041900634766, -8.335235595703125, -8.031429290771484, -7.727623462677002, -7.4238176345825195, -7.120011806488037, -6.816205978393555, -6.512399673461914, -6.208593845367432, -5.904787540435791, -5.600981712341309, -5.297175407409668, -4.9933695793151855, -4.689563751220703, -4.3857574462890625, -4.08195161819458, -3.7781457901000977, -3.474339723587036, -3.1705336570739746, -2.866727828979492, -2.5629217624664307, -2.259115695953369, -1.9553098678588867, -1.6515038013458252, -1.3476979732513428, -1.0438919067382812, -0.7400859594345093, -0.43627995252609253, -0.13247394561767578, 0.1713320016860962, 0.47513794898986816, 0.7789440155029297, 1.082749843597412, 1.3865559101104736, 1.6903618574142456, 1.9941678047180176, 2.297973871231079, 2.6017799377441406, 2.905585765838623, 3.2093918323516846, 3.513197660446167, 3.8170037269592285, 4.120809555053711, 4.424615859985352, 4.728421688079834, 5.032227516174316, 5.336033821105957, 5.6398396492004395, 5.943645477294922, 6.2474517822265625, 6.551257610321045, 6.8550639152526855, 7.158869743347168, 7.46267557144165, 7.766481399536133, 8.070287704467773, 8.374094009399414, 8.677899360656738]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 7.0, 4.0, 5.0, 9.0, 6.0, 12.0, 13.0, 22.0, 18.0, 24.0, 21.0, 22.0, 15.0, 25.0, 23.0, 36.0, 31.0, 43.0, 35.0, 40.0, 35.0, 38.0, 44.0, 36.0, 36.0, 28.0, 55.0, 37.0, 29.0, 33.0, 27.0, 31.0, 25.0, 16.0, 21.0, 24.0, 14.0, 11.0, 12.0, 13.0, 9.0, 3.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.349158763885498, -4.21394157409668, -4.078723907470703, -3.9435067176818848, -3.8082895278930664, -3.673072099685669, -3.5378546714782715, -3.402637481689453, -3.2674200534820557, -3.132202625274658, -2.99698543548584, -2.8617680072784424, -2.726550579071045, -2.5913333892822266, -2.456115961074829, -2.3208985328674316, -2.1856813430786133, -2.050463914871216, -1.9152467250823975, -1.780029296875, -1.644811987876892, -1.5095946788787842, -1.3743772506713867, -1.2391599416732788, -1.103942632675171, -0.968725323677063, -0.8335079550743103, -0.6982905864715576, -0.5630732774734497, -0.4278559684753418, -0.2926385998725891, -0.15742123126983643, -0.02220439910888672, 0.11301293969154358, 0.24823027849197388, 0.3834476172924042, 0.5186649560928345, 0.6538822650909424, 0.7890996336936951, 0.9243170022964478, 1.0595343112945557, 1.1947516202926636, 1.3299689292907715, 1.465186357498169, 1.6004036664962769, 1.7356209754943848, 1.8708384037017822, 2.0060558319091797, 2.141273021697998, 2.2764904499053955, 2.411707639694214, 2.5469250679016113, 2.6821422576904297, 2.817359685897827, 2.9525771141052246, 3.087794303894043, 3.2230117321014404, 3.358229160308838, 3.4934463500976562, 3.6286637783050537, 3.763881206512451, 3.8990983963012695, 4.034315586090088, 4.1695332527160645, 4.304750442504883]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 6.0, 13.0, 22.0, 28.0, 50.0, 72.0, 105.0, 121.0, 202.0, 337.0, 521.0, 879.0, 1443.0, 2490.0, 4282.0, 7928.0, 15558.0, 33908.0, 81267.0, 228561.0, 728995.0, 1550161.0, 1013859.0, 325197.0, 109554.0, 44286.0, 20467.0, 10206.0, 5425.0, 3163.0, 1871.0, 1117.0, 735.0, 464.0, 286.0, 197.0, 146.0, 99.0, 91.0, 42.0, 38.0, 22.0, 17.0, 14.0, 7.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.4453125, -10.1153564453125, -9.785400390625, -9.4554443359375, -9.12548828125, -8.7955322265625, -8.465576171875, -8.1356201171875, -7.8056640625, -7.4757080078125, -7.145751953125, -6.8157958984375, -6.48583984375, -6.1558837890625, -5.825927734375, -5.4959716796875, -5.166015625, -4.8360595703125, -4.506103515625, -4.1761474609375, -3.84619140625, -3.5162353515625, -3.186279296875, -2.8563232421875, -2.5263671875, -2.1964111328125, -1.866455078125, -1.5364990234375, -1.20654296875, -0.8765869140625, -0.546630859375, -0.2166748046875, 0.11328125, 0.4432373046875, 0.773193359375, 1.1031494140625, 1.43310546875, 1.7630615234375, 2.093017578125, 2.4229736328125, 2.7529296875, 3.0828857421875, 3.412841796875, 3.7427978515625, 4.07275390625, 4.4027099609375, 4.732666015625, 5.0626220703125, 5.392578125, 5.7225341796875, 6.052490234375, 6.3824462890625, 6.71240234375, 7.0423583984375, 7.372314453125, 7.7022705078125, 8.0322265625, 8.3621826171875, 8.692138671875, 9.0220947265625, 9.35205078125, 9.6820068359375, 10.011962890625, 10.3419189453125, 10.671875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 7.0, 4.0, 10.0, 7.0, 7.0, 11.0, 20.0, 12.0, 17.0, 28.0, 15.0, 32.0, 29.0, 27.0, 32.0, 38.0, 26.0, 36.0, 30.0, 40.0, 40.0, 41.0, 33.0, 52.0, 46.0, 37.0, 35.0, 23.0, 24.0, 33.0, 33.0, 26.0, 23.0, 13.0, 24.0, 22.0, 9.0, 13.0, 1.0, 10.0, 10.0, 7.0, 2.0, 5.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.04296875, -2.93548583984375, -2.8280029296875, -2.72052001953125, -2.613037109375, -2.50555419921875, -2.3980712890625, -2.29058837890625, -2.18310546875, -2.07562255859375, -1.9681396484375, -1.86065673828125, -1.753173828125, -1.64569091796875, -1.5382080078125, -1.43072509765625, -1.3232421875, -1.21575927734375, -1.1082763671875, -1.00079345703125, -0.893310546875, -0.78582763671875, -0.6783447265625, -0.57086181640625, -0.46337890625, -0.35589599609375, -0.2484130859375, -0.14093017578125, -0.033447265625, 0.07403564453125, 0.1815185546875, 0.28900146484375, 0.396484375, 0.50396728515625, 0.6114501953125, 0.71893310546875, 0.826416015625, 0.93389892578125, 1.0413818359375, 1.14886474609375, 1.25634765625, 1.36383056640625, 1.4713134765625, 1.57879638671875, 1.686279296875, 1.79376220703125, 1.9012451171875, 2.00872802734375, 2.1162109375, 2.22369384765625, 2.3311767578125, 2.43865966796875, 2.546142578125, 2.65362548828125, 2.7611083984375, 2.86859130859375, 2.97607421875, 3.08355712890625, 3.1910400390625, 3.29852294921875, 3.406005859375, 3.51348876953125, 3.6209716796875, 3.72845458984375, 3.8359375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 7.0, 10.0, 10.0, 15.0, 18.0, 38.0, 41.0, 86.0, 121.0, 223.0, 353.0, 601.0, 1019.0, 1739.0, 3123.0, 6080.0, 12285.0, 26432.0, 62563.0, 165223.0, 493509.0, 1354968.0, 1321622.0, 473941.0, 159240.0, 60519.0, 25646.0, 11702.0, 5966.0, 3082.0, 1656.0, 1001.0, 519.0, 326.0, 188.0, 147.0, 91.0, 50.0, 45.0, 30.0, 15.0, 10.0, 7.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.2750244140625, -10.885986328125, -10.4969482421875, -10.10791015625, -9.7188720703125, -9.329833984375, -8.9407958984375, -8.5517578125, -8.1627197265625, -7.773681640625, -7.3846435546875, -6.99560546875, -6.6065673828125, -6.217529296875, -5.8284912109375, -5.439453125, -5.0504150390625, -4.661376953125, -4.2723388671875, -3.88330078125, -3.4942626953125, -3.105224609375, -2.7161865234375, -2.3271484375, -1.9381103515625, -1.549072265625, -1.1600341796875, -0.77099609375, -0.3819580078125, 0.007080078125, 0.3961181640625, 0.78515625, 1.1741943359375, 1.563232421875, 1.9522705078125, 2.34130859375, 2.7303466796875, 3.119384765625, 3.5084228515625, 3.8974609375, 4.2864990234375, 4.675537109375, 5.0645751953125, 5.45361328125, 5.8426513671875, 6.231689453125, 6.6207275390625, 7.009765625, 7.3988037109375, 7.787841796875, 8.1768798828125, 8.56591796875, 8.9549560546875, 9.343994140625, 9.7330322265625, 10.1220703125, 10.5111083984375, 10.900146484375, 11.2891845703125, 11.67822265625, 12.0672607421875, 12.456298828125, 12.8453369140625, 13.234375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 8.0, 9.0, 17.0, 26.0, 33.0, 52.0, 66.0, 102.0, 150.0, 165.0, 212.0, 326.0, 372.0, 373.0, 401.0, 349.0, 298.0, 294.0, 218.0, 156.0, 105.0, 87.0, 60.0, 43.0, 31.0, 32.0, 11.0, 14.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.53125, -3.428070068359375, -3.32489013671875, -3.221710205078125, -3.1185302734375, -3.015350341796875, -2.91217041015625, -2.808990478515625, -2.705810546875, -2.602630615234375, -2.49945068359375, -2.396270751953125, -2.2930908203125, -2.189910888671875, -2.08673095703125, -1.983551025390625, -1.88037109375, -1.777191162109375, -1.67401123046875, -1.570831298828125, -1.4676513671875, -1.364471435546875, -1.26129150390625, -1.158111572265625, -1.054931640625, -0.951751708984375, -0.84857177734375, -0.745391845703125, -0.6422119140625, -0.539031982421875, -0.43585205078125, -0.332672119140625, -0.2294921875, -0.126312255859375, -0.02313232421875, 0.080047607421875, 0.1832275390625, 0.286407470703125, 0.38958740234375, 0.492767333984375, 0.595947265625, 0.699127197265625, 0.80230712890625, 0.905487060546875, 1.0086669921875, 1.111846923828125, 1.21502685546875, 1.318206787109375, 1.42138671875, 1.524566650390625, 1.62774658203125, 1.730926513671875, 1.8341064453125, 1.937286376953125, 2.04046630859375, 2.143646240234375, 2.246826171875, 2.350006103515625, 2.45318603515625, 2.556365966796875, 2.6595458984375, 2.762725830078125, 2.86590576171875, 2.969085693359375, 3.072265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 7.0, 6.0, 4.0, 7.0, 14.0, 11.0, 20.0, 23.0, 23.0, 28.0, 37.0, 46.0, 56.0, 62.0, 73.0, 72.0, 58.0, 61.0, 58.0, 51.0, 59.0, 44.0, 33.0, 27.0, 24.0, 19.0, 14.0, 9.0, 7.0, 13.0, 7.0, 4.0, 9.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-11.04246711730957, -10.743955612182617, -10.445443153381348, -10.146930694580078, -9.848419189453125, -9.549907684326172, -9.251395225524902, -8.952882766723633, -8.65437126159668, -8.355859756469727, -8.057347297668457, -7.758835315704346, -7.460323333740234, -7.161811351776123, -6.863299369812012, -6.5647873878479, -6.266275405883789, -5.967763423919678, -5.669251441955566, -5.370739459991455, -5.072227478027344, -4.773715496063232, -4.475203514099121, -4.17669153213501, -3.8781795501708984, -3.579667568206787, -3.281155586242676, -2.9826436042785645, -2.684131622314453, -2.385619640350342, -2.0871076583862305, -1.7885956764221191, -1.4900836944580078, -1.1915717124938965, -0.8930597305297852, -0.5945477485656738, -0.2960357666015625, 0.002476215362548828, 0.30098819732666016, 0.5995001792907715, 0.8980121612548828, 1.1965241432189941, 1.4950361251831055, 1.7935481071472168, 2.092060089111328, 2.3905720710754395, 2.689084053039551, 2.987596035003662, 3.2861080169677734, 3.5846199989318848, 3.883131980895996, 4.181643962860107, 4.480155944824219, 4.77866792678833, 5.077179908752441, 5.375691890716553, 5.674203872680664, 5.972715854644775, 6.271227836608887, 6.569739818572998, 6.868251800537109, 7.166763782501221, 7.465275764465332, 7.763787746429443, 8.062299728393555]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 7.0, 5.0, 5.0, 8.0, 17.0, 12.0, 16.0, 10.0, 21.0, 26.0, 28.0, 22.0, 27.0, 27.0, 25.0, 33.0, 31.0, 31.0, 45.0, 33.0, 49.0, 41.0, 34.0, 32.0, 30.0, 35.0, 37.0, 31.0, 31.0, 35.0, 22.0, 29.0, 26.0, 12.0, 19.0, 9.0, 7.0, 12.0, 14.0, 11.0, 11.0, 6.0, 8.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.12053108215332, -3.9783573150634766, -3.836183786392212, -3.6940102577209473, -3.5518364906311035, -3.4096627235412598, -3.267489194869995, -3.1253156661987305, -2.9831418991088867, -2.840968132019043, -2.6987946033477783, -2.5566210746765137, -2.41444730758667, -2.272273540496826, -2.1301000118255615, -1.9879263639450073, -1.8457527160644531, -1.703579068183899, -1.5614054203033447, -1.4192317724227905, -1.2770581245422363, -1.1348844766616821, -0.9927108287811279, -0.8505371809005737, -0.7083635330200195, -0.5661898851394653, -0.42401623725891113, -0.28184258937835693, -0.13966894149780273, 0.002504706382751465, 0.14467835426330566, 0.28685200214385986, 0.42902517318725586, 0.5711988210678101, 0.7133724689483643, 0.8555461168289185, 0.9977197647094727, 1.1398934125900269, 1.282067060470581, 1.4242407083511353, 1.5664143562316895, 1.7085880041122437, 1.8507616519927979, 1.992935299873352, 2.1351089477539062, 2.27728271484375, 2.4194562435150146, 2.5616297721862793, 2.703803539276123, 2.845977306365967, 2.9881508350372314, 3.130324363708496, 3.27249813079834, 3.4146718978881836, 3.5568454265594482, 3.699018955230713, 3.8411927223205566, 3.9833664894104004, 4.125539779663086, 4.26771354675293, 4.409887313842773, 4.552061080932617, 4.694234848022461, 4.8364081382751465, 4.97858190536499]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 3.0, 9.0, 7.0, 18.0, 24.0, 36.0, 53.0, 83.0, 89.0, 139.0, 192.0, 267.0, 380.0, 532.0, 758.0, 1022.0, 1411.0, 2089.0, 3173.0, 5040.0, 8890.0, 18373.0, 44581.0, 125231.0, 305888.0, 310496.0, 129825.0, 46363.0, 18870.0, 9142.0, 5138.0, 3155.0, 2136.0, 1454.0, 1000.0, 800.0, 534.0, 394.0, 293.0, 199.0, 141.0, 88.0, 86.0, 50.0, 35.0, 18.0, 17.0, 11.0, 9.0, 7.0, 4.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.7572021484375, -7.498779296875, -7.2403564453125, -6.98193359375, -6.7235107421875, -6.465087890625, -6.2066650390625, -5.9482421875, -5.6898193359375, -5.431396484375, -5.1729736328125, -4.91455078125, -4.6561279296875, -4.397705078125, -4.1392822265625, -3.880859375, -3.6224365234375, -3.364013671875, -3.1055908203125, -2.84716796875, -2.5887451171875, -2.330322265625, -2.0718994140625, -1.8134765625, -1.5550537109375, -1.296630859375, -1.0382080078125, -0.77978515625, -0.5213623046875, -0.262939453125, -0.0045166015625, 0.25390625, 0.5123291015625, 0.770751953125, 1.0291748046875, 1.28759765625, 1.5460205078125, 1.804443359375, 2.0628662109375, 2.3212890625, 2.5797119140625, 2.838134765625, 3.0965576171875, 3.35498046875, 3.6134033203125, 3.871826171875, 4.1302490234375, 4.388671875, 4.6470947265625, 4.905517578125, 5.1639404296875, 5.42236328125, 5.6807861328125, 5.939208984375, 6.1976318359375, 6.4560546875, 6.7144775390625, 6.972900390625, 7.2313232421875, 7.48974609375, 7.7481689453125, 8.006591796875, 8.2650146484375, 8.5234375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 8.0, 8.0, 11.0, 17.0, 11.0, 23.0, 9.0, 19.0, 17.0, 20.0, 19.0, 29.0, 27.0, 36.0, 27.0, 38.0, 43.0, 31.0, 43.0, 34.0, 41.0, 36.0, 43.0, 39.0, 32.0, 38.0, 30.0, 32.0, 21.0, 20.0, 21.0, 21.0, 22.0, 18.0, 12.0, 13.0, 6.0, 14.0, 8.0, 8.0, 11.0, 8.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.46875, -4.31982421875, -4.1708984375, -4.02197265625, -3.873046875, -3.72412109375, -3.5751953125, -3.42626953125, -3.27734375, -3.12841796875, -2.9794921875, -2.83056640625, -2.681640625, -2.53271484375, -2.3837890625, -2.23486328125, -2.0859375, -1.93701171875, -1.7880859375, -1.63916015625, -1.490234375, -1.34130859375, -1.1923828125, -1.04345703125, -0.89453125, -0.74560546875, -0.5966796875, -0.44775390625, -0.298828125, -0.14990234375, -0.0009765625, 0.14794921875, 0.296875, 0.44580078125, 0.5947265625, 0.74365234375, 0.892578125, 1.04150390625, 1.1904296875, 1.33935546875, 1.48828125, 1.63720703125, 1.7861328125, 1.93505859375, 2.083984375, 2.23291015625, 2.3818359375, 2.53076171875, 2.6796875, 2.82861328125, 2.9775390625, 3.12646484375, 3.275390625, 3.42431640625, 3.5732421875, 3.72216796875, 3.87109375, 4.02001953125, 4.1689453125, 4.31787109375, 4.466796875, 4.61572265625, 4.7646484375, 4.91357421875, 5.0625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 6.0, 5.0, 5.0, 1.0, 10.0, 5.0, 15.0, 16.0, 13.0, 25.0, 40.0, 41.0, 43.0, 84.0, 92.0, 152.0, 189.0, 214.0, 339.0, 502.0, 666.0, 1054.0, 1596.0, 2529.0, 4470.0, 9387.0, 27697.0, 142486.0, 592533.0, 204035.0, 35816.0, 11126.0, 4987.0, 2817.0, 1754.0, 1123.0, 757.0, 572.0, 352.0, 232.0, 200.0, 139.0, 98.0, 74.0, 54.0, 54.0, 46.0, 29.0, 19.0, 19.0, 14.0, 3.0, 9.0, 4.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.7109375, -15.1973876953125, -14.683837890625, -14.1702880859375, -13.65673828125, -13.1431884765625, -12.629638671875, -12.1160888671875, -11.6025390625, -11.0889892578125, -10.575439453125, -10.0618896484375, -9.54833984375, -9.0347900390625, -8.521240234375, -8.0076904296875, -7.494140625, -6.9805908203125, -6.467041015625, -5.9534912109375, -5.43994140625, -4.9263916015625, -4.412841796875, -3.8992919921875, -3.3857421875, -2.8721923828125, -2.358642578125, -1.8450927734375, -1.33154296875, -0.8179931640625, -0.304443359375, 0.2091064453125, 0.72265625, 1.2362060546875, 1.749755859375, 2.2633056640625, 2.77685546875, 3.2904052734375, 3.803955078125, 4.3175048828125, 4.8310546875, 5.3446044921875, 5.858154296875, 6.3717041015625, 6.88525390625, 7.3988037109375, 7.912353515625, 8.4259033203125, 8.939453125, 9.4530029296875, 9.966552734375, 10.4801025390625, 10.99365234375, 11.5072021484375, 12.020751953125, 12.5343017578125, 13.0478515625, 13.5614013671875, 14.074951171875, 14.5885009765625, 15.10205078125, 15.6156005859375, 16.129150390625, 16.6427001953125, 17.15625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 4.0, 8.0, 4.0, 9.0, 13.0, 8.0, 13.0, 20.0, 21.0, 19.0, 24.0, 24.0, 34.0, 43.0, 41.0, 38.0, 37.0, 43.0, 42.0, 41.0, 63.0, 46.0, 50.0, 41.0, 44.0, 21.0, 26.0, 31.0, 28.0, 33.0, 28.0, 13.0, 17.0, 13.0, 15.0, 11.0, 8.0, 7.0, 8.0, 3.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.05029296875, -2.9404296875, -2.83056640625, -2.720703125, -2.61083984375, -2.5009765625, -2.39111328125, -2.28125, -2.17138671875, -2.0615234375, -1.95166015625, -1.841796875, -1.73193359375, -1.6220703125, -1.51220703125, -1.40234375, -1.29248046875, -1.1826171875, -1.07275390625, -0.962890625, -0.85302734375, -0.7431640625, -0.63330078125, -0.5234375, -0.41357421875, -0.3037109375, -0.19384765625, -0.083984375, 0.02587890625, 0.1357421875, 0.24560546875, 0.35546875, 0.46533203125, 0.5751953125, 0.68505859375, 0.794921875, 0.90478515625, 1.0146484375, 1.12451171875, 1.234375, 1.34423828125, 1.4541015625, 1.56396484375, 1.673828125, 1.78369140625, 1.8935546875, 2.00341796875, 2.11328125, 2.22314453125, 2.3330078125, 2.44287109375, 2.552734375, 2.66259765625, 2.7724609375, 2.88232421875, 2.9921875, 3.10205078125, 3.2119140625, 3.32177734375, 3.431640625, 3.54150390625, 3.6513671875, 3.76123046875, 3.87109375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 6.0, 20.0, 24.0, 27.0, 50.0, 66.0, 115.0, 143.0, 223.0, 368.0, 623.0, 945.0, 1765.0, 3283.0, 7119.0, 21467.0, 132031.0, 684311.0, 156224.0, 23970.0, 7701.0, 3448.0, 1857.0, 1013.0, 654.0, 402.0, 226.0, 153.0, 96.0, 71.0, 46.0, 37.0, 17.0, 9.0, 9.0, 12.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.875, -8.5843505859375, -8.293701171875, -8.0030517578125, -7.71240234375, -7.4217529296875, -7.131103515625, -6.8404541015625, -6.5498046875, -6.2591552734375, -5.968505859375, -5.6778564453125, -5.38720703125, -5.0965576171875, -4.805908203125, -4.5152587890625, -4.224609375, -3.9339599609375, -3.643310546875, -3.3526611328125, -3.06201171875, -2.7713623046875, -2.480712890625, -2.1900634765625, -1.8994140625, -1.6087646484375, -1.318115234375, -1.0274658203125, -0.73681640625, -0.4461669921875, -0.155517578125, 0.1351318359375, 0.42578125, 0.7164306640625, 1.007080078125, 1.2977294921875, 1.58837890625, 1.8790283203125, 2.169677734375, 2.4603271484375, 2.7509765625, 3.0416259765625, 3.332275390625, 3.6229248046875, 3.91357421875, 4.2042236328125, 4.494873046875, 4.7855224609375, 5.076171875, 5.3668212890625, 5.657470703125, 5.9481201171875, 6.23876953125, 6.5294189453125, 6.820068359375, 7.1107177734375, 7.4013671875, 7.6920166015625, 7.982666015625, 8.2733154296875, 8.56396484375, 8.8546142578125, 9.145263671875, 9.4359130859375, 9.7265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 7.0, 19.0, 33.0, 33.0, 96.0, 184.0, 197.0, 180.0, 100.0, 55.0, 24.0, 19.0, 11.0, 8.0, 4.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003955364227294922, -0.0003840737044811249, -0.00037261098623275757, -0.00036114826798439026, -0.00034968554973602295, -0.00033822283148765564, -0.00032676011323928833, -0.000315297394990921, -0.0003038346767425537, -0.0002923719584941864, -0.0002809092402458191, -0.0002694465219974518, -0.00025798380374908447, -0.00024652108550071716, -0.00023505836725234985, -0.00022359564900398254, -0.00021213293075561523, -0.00020067021250724792, -0.00018920749425888062, -0.0001777447760105133, -0.000166282057762146, -0.0001548193395137787, -0.00014335662126541138, -0.00013189390301704407, -0.00012043118476867676, -0.00010896846652030945, -9.750574827194214e-05, -8.604303002357483e-05, -7.458031177520752e-05, -6.311759352684021e-05, -5.16548752784729e-05, -4.019215703010559e-05, -2.872943878173828e-05, -1.726672053337097e-05, -5.804002285003662e-06, 5.6587159633636475e-06, 1.7121434211730957e-05, 2.8584152460098267e-05, 4.0046870708465576e-05, 5.1509588956832886e-05, 6.29723072052002e-05, 7.44350254535675e-05, 8.589774370193481e-05, 9.736046195030212e-05, 0.00010882318019866943, 0.00012028589844703674, 0.00013174861669540405, 0.00014321133494377136, 0.00015467405319213867, 0.00016613677144050598, 0.0001775994896888733, 0.0001890622079372406, 0.0002005249261856079, 0.00021198764443397522, 0.00022345036268234253, 0.00023491308093070984, 0.00024637579917907715, 0.00025783851742744446, 0.00026930123567581177, 0.0002807639539241791, 0.0002922266721725464, 0.0003036893904209137, 0.000315152108669281, 0.0003266148269176483, 0.0003380775451660156]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 8.0, 10.0, 23.0, 24.0, 26.0, 50.0, 76.0, 118.0, 136.0, 196.0, 242.0, 355.0, 520.0, 679.0, 989.0, 1353.0, 1937.0, 2724.0, 4121.0, 6652.0, 12024.0, 30582.0, 112937.0, 389828.0, 338368.0, 89586.0, 25482.0, 10583.0, 5998.0, 3940.0, 2586.0, 1783.0, 1318.0, 945.0, 686.0, 453.0, 336.0, 240.0, 171.0, 142.0, 94.0, 73.0, 58.0, 34.0, 25.0, 8.0, 11.0, 10.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.078125, -4.90838623046875, -4.7386474609375, -4.56890869140625, -4.399169921875, -4.22943115234375, -4.0596923828125, -3.88995361328125, -3.72021484375, -3.55047607421875, -3.3807373046875, -3.21099853515625, -3.041259765625, -2.87152099609375, -2.7017822265625, -2.53204345703125, -2.3623046875, -2.19256591796875, -2.0228271484375, -1.85308837890625, -1.683349609375, -1.51361083984375, -1.3438720703125, -1.17413330078125, -1.00439453125, -0.83465576171875, -0.6649169921875, -0.49517822265625, -0.325439453125, -0.15570068359375, 0.0140380859375, 0.18377685546875, 0.353515625, 0.52325439453125, 0.6929931640625, 0.86273193359375, 1.032470703125, 1.20220947265625, 1.3719482421875, 1.54168701171875, 1.71142578125, 1.88116455078125, 2.0509033203125, 2.22064208984375, 2.390380859375, 2.56011962890625, 2.7298583984375, 2.89959716796875, 3.0693359375, 3.23907470703125, 3.4088134765625, 3.57855224609375, 3.748291015625, 3.91802978515625, 4.0877685546875, 4.25750732421875, 4.42724609375, 4.59698486328125, 4.7667236328125, 4.93646240234375, 5.106201171875, 5.27593994140625, 5.4456787109375, 5.61541748046875, 5.78515625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 8.0, 12.0, 34.0, 51.0, 98.0, 182.0, 218.0, 168.0, 109.0, 47.0, 26.0, 10.0, 5.0, 1.0, 8.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.470703125, -2.39874267578125, -2.3267822265625, -2.25482177734375, -2.182861328125, -2.11090087890625, -2.0389404296875, -1.96697998046875, -1.89501953125, -1.82305908203125, -1.7510986328125, -1.67913818359375, -1.607177734375, -1.53521728515625, -1.4632568359375, -1.39129638671875, -1.3193359375, -1.24737548828125, -1.1754150390625, -1.10345458984375, -1.031494140625, -0.95953369140625, -0.8875732421875, -0.81561279296875, -0.74365234375, -0.67169189453125, -0.5997314453125, -0.52777099609375, -0.455810546875, -0.38385009765625, -0.3118896484375, -0.23992919921875, -0.16796875, -0.09600830078125, -0.0240478515625, 0.04791259765625, 0.119873046875, 0.19183349609375, 0.2637939453125, 0.33575439453125, 0.40771484375, 0.47967529296875, 0.5516357421875, 0.62359619140625, 0.695556640625, 0.76751708984375, 0.8394775390625, 0.91143798828125, 0.9833984375, 1.05535888671875, 1.1273193359375, 1.19927978515625, 1.271240234375, 1.34320068359375, 1.4151611328125, 1.48712158203125, 1.55908203125, 1.63104248046875, 1.7030029296875, 1.77496337890625, 1.846923828125, 1.91888427734375, 1.9908447265625, 2.06280517578125, 2.134765625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 8.0, 7.0, 9.0, 11.0, 11.0, 16.0, 21.0, 31.0, 35.0, 47.0, 33.0, 62.0, 72.0, 61.0, 65.0, 65.0, 62.0, 63.0, 51.0, 52.0, 43.0, 28.0, 31.0, 22.0, 16.0, 16.0, 13.0, 6.0, 11.0, 8.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.459746360778809, -11.157273292541504, -10.8548002243042, -10.552327156066895, -10.24985408782959, -9.947381019592285, -9.64490795135498, -9.34243392944336, -9.039960861206055, -8.73748779296875, -8.435014724731445, -8.13254165649414, -7.830068588256836, -7.527595520019531, -7.225121974945068, -6.922648906707764, -6.620176315307617, -6.3177032470703125, -6.015230178833008, -5.712757110595703, -5.410284042358398, -5.107810974121094, -4.805337429046631, -4.502864360809326, -4.2003912925720215, -3.897918224334717, -3.595445156097412, -3.2929718494415283, -2.9904987812042236, -2.688025712966919, -2.385552406311035, -2.0830793380737305, -1.7806062698364258, -1.478133201599121, -1.1756600141525269, -0.8731868863105774, -0.5707137584686279, -0.26824069023132324, 0.034232497215270996, 0.33670568466186523, 0.6391787528991699, 0.9416518807411194, 1.2441250085830688, 1.546598196029663, 1.8490712642669678, 2.1515443325042725, 2.4540176391601562, 2.756490707397461, 3.0589637756347656, 3.3614368438720703, 3.663909912109375, 3.966383218765259, 4.268856048583984, 4.571329116821289, 4.873802661895752, 5.176275730133057, 5.478748798370361, 5.781221866607666, 6.083694934844971, 6.386168003082275, 6.688641548156738, 6.991114616394043, 7.293587684631348, 7.596060752868652, 7.898533821105957]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 3.0, 4.0, 5.0, 8.0, 8.0, 7.0, 10.0, 13.0, 10.0, 10.0, 16.0, 19.0, 22.0, 11.0, 20.0, 31.0, 20.0, 31.0, 28.0, 33.0, 34.0, 40.0, 35.0, 36.0, 41.0, 39.0, 37.0, 32.0, 38.0, 36.0, 35.0, 35.0, 29.0, 29.0, 27.0, 22.0, 28.0, 19.0, 4.0, 14.0, 17.0, 10.0, 12.0, 10.0, 6.0, 13.0, 5.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.127529144287109, -3.9859135150909424, -3.8442978858947754, -3.7026822566986084, -3.5610666275024414, -3.4194507598876953, -3.2778351306915283, -3.1362195014953613, -2.9946038722991943, -2.8529882431030273, -2.7113726139068604, -2.5697569847106934, -2.4281411170959473, -2.2865257263183594, -2.1449098587036133, -2.0032942295074463, -1.8616786003112793, -1.7200629711151123, -1.5784473419189453, -1.4368315935134888, -1.2952159643173218, -1.1536003351211548, -1.0119845867156982, -0.8703689575195312, -0.7287533283233643, -0.5871376991271973, -0.4455220103263855, -0.3039063513278961, -0.16229069232940674, -0.020675063133239746, 0.12094062566757202, 0.2625563144683838, 0.4041719436645508, 0.5457875728607178, 0.6874032616615295, 0.8290189504623413, 0.9706345796585083, 1.1122502088546753, 1.2538659572601318, 1.3954815864562988, 1.5370972156524658, 1.6787128448486328, 1.8203284740447998, 1.9619442224502563, 2.103559970855713, 2.245175361633301, 2.386791229248047, 2.528406858444214, 2.670022487640381, 2.811638116836548, 2.953253746032715, 3.094869375228882, 3.236485004425049, 3.378100872039795, 3.519716501235962, 3.661332130432129, 3.802947759628296, 3.944563388824463, 4.086179256439209, 4.227794647216797, 4.369410514831543, 4.511025905609131, 4.652641773223877, 4.794257164001465, 4.935873031616211]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 7.0, 5.0, 5.0, 9.0, 15.0, 28.0, 34.0, 43.0, 68.0, 110.0, 153.0, 204.0, 324.0, 438.0, 688.0, 1030.0, 1446.0, 2189.0, 3354.0, 4971.0, 7623.0, 11518.0, 17342.0, 25651.0, 39182.0, 56587.0, 79743.0, 105166.0, 124651.0, 131070.0, 118931.0, 95638.0, 70821.0, 49390.0, 33494.0, 22409.0, 15019.0, 9668.0, 6517.0, 4328.0, 2851.0, 1927.0, 1265.0, 851.0, 599.0, 370.0, 263.0, 169.0, 127.0, 95.0, 59.0, 45.0, 26.0, 17.0, 11.0, 5.0, 9.0, 2.0, 2.0, 6.0, 3.0], "bins": [-3.70703125, -3.592315673828125, -3.47760009765625, -3.362884521484375, -3.2481689453125, -3.133453369140625, -3.01873779296875, -2.904022216796875, -2.789306640625, -2.674591064453125, -2.55987548828125, -2.445159912109375, -2.3304443359375, -2.215728759765625, -2.10101318359375, -1.986297607421875, -1.87158203125, -1.756866455078125, -1.64215087890625, -1.527435302734375, -1.4127197265625, -1.298004150390625, -1.18328857421875, -1.068572998046875, -0.953857421875, -0.839141845703125, -0.72442626953125, -0.609710693359375, -0.4949951171875, -0.380279541015625, -0.26556396484375, -0.150848388671875, -0.0361328125, 0.078582763671875, 0.19329833984375, 0.308013916015625, 0.4227294921875, 0.537445068359375, 0.65216064453125, 0.766876220703125, 0.881591796875, 0.996307373046875, 1.11102294921875, 1.225738525390625, 1.3404541015625, 1.455169677734375, 1.56988525390625, 1.684600830078125, 1.79931640625, 1.914031982421875, 2.02874755859375, 2.143463134765625, 2.2581787109375, 2.372894287109375, 2.48760986328125, 2.602325439453125, 2.717041015625, 2.831756591796875, 2.94647216796875, 3.061187744140625, 3.1759033203125, 3.290618896484375, 3.40533447265625, 3.520050048828125, 3.634765625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 6.0, 6.0, 5.0, 10.0, 10.0, 11.0, 6.0, 17.0, 15.0, 17.0, 18.0, 24.0, 24.0, 35.0, 29.0, 22.0, 25.0, 38.0, 31.0, 33.0, 35.0, 33.0, 42.0, 45.0, 39.0, 37.0, 30.0, 36.0, 33.0, 33.0, 30.0, 25.0, 30.0, 20.0, 21.0, 23.0, 14.0, 11.0, 10.0, 15.0, 15.0, 12.0, 4.0, 2.0, 6.0, 5.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.703125, -4.5562744140625, -4.409423828125, -4.2625732421875, -4.11572265625, -3.9688720703125, -3.822021484375, -3.6751708984375, -3.5283203125, -3.3814697265625, -3.234619140625, -3.0877685546875, -2.94091796875, -2.7940673828125, -2.647216796875, -2.5003662109375, -2.353515625, -2.2066650390625, -2.059814453125, -1.9129638671875, -1.76611328125, -1.6192626953125, -1.472412109375, -1.3255615234375, -1.1787109375, -1.0318603515625, -0.885009765625, -0.7381591796875, -0.59130859375, -0.4444580078125, -0.297607421875, -0.1507568359375, -0.00390625, 0.1429443359375, 0.289794921875, 0.4366455078125, 0.58349609375, 0.7303466796875, 0.877197265625, 1.0240478515625, 1.1708984375, 1.3177490234375, 1.464599609375, 1.6114501953125, 1.75830078125, 1.9051513671875, 2.052001953125, 2.1988525390625, 2.345703125, 2.4925537109375, 2.639404296875, 2.7862548828125, 2.93310546875, 3.0799560546875, 3.226806640625, 3.3736572265625, 3.5205078125, 3.6673583984375, 3.814208984375, 3.9610595703125, 4.10791015625, 4.2547607421875, 4.401611328125, 4.5484619140625, 4.6953125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 15.0, 17.0, 19.0, 24.0, 38.0, 68.0, 104.0, 178.0, 249.0, 397.0, 636.0, 1032.0, 1641.0, 2582.0, 4343.0, 7181.0, 11866.0, 19511.0, 32107.0, 51225.0, 77341.0, 110496.0, 139200.0, 149424.0, 135652.0, 105425.0, 73314.0, 47862.0, 29982.0, 18180.0, 11211.0, 6717.0, 3943.0, 2491.0, 1477.0, 994.0, 588.0, 389.0, 233.0, 137.0, 91.0, 51.0, 35.0, 29.0, 25.0, 10.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.07421875, -3.944580078125, -3.81494140625, -3.685302734375, -3.5556640625, -3.426025390625, -3.29638671875, -3.166748046875, -3.037109375, -2.907470703125, -2.77783203125, -2.648193359375, -2.5185546875, -2.388916015625, -2.25927734375, -2.129638671875, -2.0, -1.870361328125, -1.74072265625, -1.611083984375, -1.4814453125, -1.351806640625, -1.22216796875, -1.092529296875, -0.962890625, -0.833251953125, -0.70361328125, -0.573974609375, -0.4443359375, -0.314697265625, -0.18505859375, -0.055419921875, 0.07421875, 0.203857421875, 0.33349609375, 0.463134765625, 0.5927734375, 0.722412109375, 0.85205078125, 0.981689453125, 1.111328125, 1.240966796875, 1.37060546875, 1.500244140625, 1.6298828125, 1.759521484375, 1.88916015625, 2.018798828125, 2.1484375, 2.278076171875, 2.40771484375, 2.537353515625, 2.6669921875, 2.796630859375, 2.92626953125, 3.055908203125, 3.185546875, 3.315185546875, 3.44482421875, 3.574462890625, 3.7041015625, 3.833740234375, 3.96337890625, 4.093017578125, 4.22265625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 10.0, 6.0, 7.0, 7.0, 6.0, 8.0, 14.0, 11.0, 16.0, 20.0, 19.0, 16.0, 26.0, 31.0, 25.0, 38.0, 43.0, 26.0, 37.0, 43.0, 35.0, 31.0, 45.0, 37.0, 39.0, 37.0, 44.0, 41.0, 27.0, 34.0, 27.0, 27.0, 23.0, 25.0, 16.0, 20.0, 18.0, 9.0, 13.0, 13.0, 5.0, 8.0, 2.0, 3.0, 8.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.81121826171875, -2.7181396484375, -2.62506103515625, -2.531982421875, -2.43890380859375, -2.3458251953125, -2.25274658203125, -2.15966796875, -2.06658935546875, -1.9735107421875, -1.88043212890625, -1.787353515625, -1.69427490234375, -1.6011962890625, -1.50811767578125, -1.4150390625, -1.32196044921875, -1.2288818359375, -1.13580322265625, -1.042724609375, -0.94964599609375, -0.8565673828125, -0.76348876953125, -0.67041015625, -0.57733154296875, -0.4842529296875, -0.39117431640625, -0.298095703125, -0.20501708984375, -0.1119384765625, -0.01885986328125, 0.07421875, 0.16729736328125, 0.2603759765625, 0.35345458984375, 0.446533203125, 0.53961181640625, 0.6326904296875, 0.72576904296875, 0.81884765625, 0.91192626953125, 1.0050048828125, 1.09808349609375, 1.191162109375, 1.28424072265625, 1.3773193359375, 1.47039794921875, 1.5634765625, 1.65655517578125, 1.7496337890625, 1.84271240234375, 1.935791015625, 2.02886962890625, 2.1219482421875, 2.21502685546875, 2.30810546875, 2.40118408203125, 2.4942626953125, 2.58734130859375, 2.680419921875, 2.77349853515625, 2.8665771484375, 2.95965576171875, 3.052734375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 7.0, 11.0, 30.0, 47.0, 52.0, 92.0, 111.0, 178.0, 249.0, 396.0, 575.0, 713.0, 1153.0, 1653.0, 2634.0, 3936.0, 6247.0, 9623.0, 15302.0, 24329.0, 37628.0, 59204.0, 87422.0, 120513.0, 145552.0, 146154.0, 123147.0, 91426.0, 60774.0, 39585.0, 25228.0, 15828.0, 9931.0, 6338.0, 4145.0, 2764.0, 1816.0, 1295.0, 770.0, 513.0, 363.0, 239.0, 186.0, 130.0, 73.0, 60.0, 36.0, 23.0, 18.0, 18.0, 10.0, 8.0, 4.0, 4.0, 6.0], "bins": [-1.8779296875, -1.8227691650390625, -1.767608642578125, -1.7124481201171875, -1.65728759765625, -1.6021270751953125, -1.546966552734375, -1.4918060302734375, -1.4366455078125, -1.3814849853515625, -1.326324462890625, -1.2711639404296875, -1.21600341796875, -1.1608428955078125, -1.105682373046875, -1.0505218505859375, -0.995361328125, -0.9402008056640625, -0.885040283203125, -0.8298797607421875, -0.77471923828125, -0.7195587158203125, -0.664398193359375, -0.6092376708984375, -0.5540771484375, -0.4989166259765625, -0.443756103515625, -0.3885955810546875, -0.33343505859375, -0.2782745361328125, -0.223114013671875, -0.1679534912109375, -0.11279296875, -0.0576324462890625, -0.002471923828125, 0.0526885986328125, 0.10784912109375, 0.1630096435546875, 0.218170166015625, 0.2733306884765625, 0.3284912109375, 0.3836517333984375, 0.438812255859375, 0.4939727783203125, 0.54913330078125, 0.6042938232421875, 0.659454345703125, 0.7146148681640625, 0.769775390625, 0.8249359130859375, 0.880096435546875, 0.9352569580078125, 0.99041748046875, 1.0455780029296875, 1.100738525390625, 1.1558990478515625, 1.2110595703125, 1.2662200927734375, 1.321380615234375, 1.3765411376953125, 1.43170166015625, 1.4868621826171875, 1.542022705078125, 1.5971832275390625, 1.65234375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 3.0, 7.0, 7.0, 4.0, 13.0, 16.0, 17.0, 20.0, 27.0, 38.0, 59.0, 43.0, 64.0, 60.0, 69.0, 59.0, 69.0, 72.0, 67.0, 63.0, 45.0, 31.0, 40.0, 24.0, 22.0, 14.0, 15.0, 4.0, 4.0, 7.0, 1.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002636909484863281, -0.0002558566629886627, -0.0002480223774909973, -0.0002401880919933319, -0.0002323538064956665, -0.0002245195209980011, -0.0002166852355003357, -0.0002088509500026703, -0.00020101666450500488, -0.00019318237900733948, -0.00018534809350967407, -0.00017751380801200867, -0.00016967952251434326, -0.00016184523701667786, -0.00015401095151901245, -0.00014617666602134705, -0.00013834238052368164, -0.00013050809502601624, -0.00012267380952835083, -0.00011483952403068542, -0.00010700523853302002, -9.917095303535461e-05, -9.133666753768921e-05, -8.35023820400238e-05, -7.56680965423584e-05, -6.783381104469299e-05, -5.999952554702759e-05, -5.216524004936218e-05, -4.433095455169678e-05, -3.649666905403137e-05, -2.8662383556365967e-05, -2.082809805870056e-05, -1.2993812561035156e-05, -5.159527063369751e-06, 2.6747584342956543e-06, 1.050904393196106e-05, 1.8343329429626465e-05, 2.617761492729187e-05, 3.4011900424957275e-05, 4.184618592262268e-05, 4.9680471420288086e-05, 5.751475691795349e-05, 6.53490424156189e-05, 7.31833279132843e-05, 8.101761341094971e-05, 8.885189890861511e-05, 9.668618440628052e-05, 0.00010452046990394592, 0.00011235475540161133, 0.00012018904089927673, 0.00012802332639694214, 0.00013585761189460754, 0.00014369189739227295, 0.00015152618288993835, 0.00015936046838760376, 0.00016719475388526917, 0.00017502903938293457, 0.00018286332488059998, 0.00019069761037826538, 0.00019853189587593079, 0.0002063661813735962, 0.0002142004668712616, 0.000222034752368927, 0.0002298690378665924, 0.0002377033233642578]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 8.0, 5.0, 15.0, 22.0, 28.0, 48.0, 77.0, 110.0, 167.0, 247.0, 427.0, 686.0, 1109.0, 1801.0, 3073.0, 5190.0, 8687.0, 14677.0, 25126.0, 42016.0, 68137.0, 104042.0, 140922.0, 161970.0, 151190.0, 116499.0, 79629.0, 49198.0, 29907.0, 17594.0, 10302.0, 6296.0, 3647.0, 2201.0, 1321.0, 806.0, 546.0, 307.0, 165.0, 145.0, 68.0, 57.0, 39.0, 20.0, 12.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.109375, -2.046722412109375, -1.98406982421875, -1.921417236328125, -1.8587646484375, -1.796112060546875, -1.73345947265625, -1.670806884765625, -1.608154296875, -1.545501708984375, -1.48284912109375, -1.420196533203125, -1.3575439453125, -1.294891357421875, -1.23223876953125, -1.169586181640625, -1.10693359375, -1.044281005859375, -0.98162841796875, -0.918975830078125, -0.8563232421875, -0.793670654296875, -0.73101806640625, -0.668365478515625, -0.605712890625, -0.543060302734375, -0.48040771484375, -0.417755126953125, -0.3551025390625, -0.292449951171875, -0.22979736328125, -0.167144775390625, -0.1044921875, -0.041839599609375, 0.02081298828125, 0.083465576171875, 0.1461181640625, 0.208770751953125, 0.27142333984375, 0.334075927734375, 0.396728515625, 0.459381103515625, 0.52203369140625, 0.584686279296875, 0.6473388671875, 0.709991455078125, 0.77264404296875, 0.835296630859375, 0.89794921875, 0.960601806640625, 1.02325439453125, 1.085906982421875, 1.1485595703125, 1.211212158203125, 1.27386474609375, 1.336517333984375, 1.399169921875, 1.461822509765625, 1.52447509765625, 1.587127685546875, 1.6497802734375, 1.712432861328125, 1.77508544921875, 1.837738037109375, 1.900390625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 7.0, 7.0, 10.0, 7.0, 10.0, 15.0, 17.0, 16.0, 29.0, 33.0, 28.0, 34.0, 48.0, 37.0, 48.0, 42.0, 56.0, 52.0, 44.0, 42.0, 52.0, 44.0, 27.0, 37.0, 45.0, 32.0, 38.0, 20.0, 18.0, 18.0, 20.0, 7.0, 13.0, 14.0, 6.0, 3.0, 5.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.6943359375, -0.6751480102539062, -0.6559600830078125, -0.6367721557617188, -0.617584228515625, -0.5983963012695312, -0.5792083740234375, -0.5600204467773438, -0.54083251953125, -0.5216445922851562, -0.5024566650390625, -0.48326873779296875, -0.464080810546875, -0.44489288330078125, -0.4257049560546875, -0.40651702880859375, -0.3873291015625, -0.36814117431640625, -0.3489532470703125, -0.32976531982421875, -0.310577392578125, -0.29138946533203125, -0.2722015380859375, -0.25301361083984375, -0.23382568359375, -0.21463775634765625, -0.1954498291015625, -0.17626190185546875, -0.157073974609375, -0.13788604736328125, -0.1186981201171875, -0.09951019287109375, -0.080322265625, -0.06113433837890625, -0.0419464111328125, -0.02275848388671875, -0.003570556640625, 0.01561737060546875, 0.0348052978515625, 0.05399322509765625, 0.07318115234375, 0.09236907958984375, 0.1115570068359375, 0.13074493408203125, 0.149932861328125, 0.16912078857421875, 0.1883087158203125, 0.20749664306640625, 0.2266845703125, 0.24587249755859375, 0.2650604248046875, 0.28424835205078125, 0.303436279296875, 0.32262420654296875, 0.3418121337890625, 0.36100006103515625, 0.38018798828125, 0.39937591552734375, 0.4185638427734375, 0.43775177001953125, 0.456939697265625, 0.47612762451171875, 0.4953155517578125, 0.5145034790039062, 0.53369140625]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 3.0, 10.0, 10.0, 11.0, 12.0, 14.0, 26.0, 20.0, 29.0, 38.0, 32.0, 63.0, 67.0, 60.0, 62.0, 67.0, 55.0, 56.0, 62.0, 71.0, 45.0, 27.0, 31.0, 26.0, 21.0, 16.0, 10.0, 10.0, 13.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.933524131774902, -10.64033031463623, -10.347137451171875, -10.053943634033203, -9.760749816894531, -9.46755599975586, -9.174363136291504, -8.881169319152832, -8.58797550201416, -8.294781684875488, -8.001588821411133, -7.708395004272461, -7.415201187133789, -7.122007846832275, -6.828814506530762, -6.53562068939209, -6.242427349090576, -5.9492340087890625, -5.656040191650391, -5.362846851348877, -5.069653034210205, -4.776459693908691, -4.4832658767700195, -4.190072536468506, -3.896878957748413, -3.6036853790283203, -3.3104918003082275, -3.0172982215881348, -2.724104881286621, -2.430911064147949, -2.1377177238464355, -1.8445241451263428, -1.5513310432434082, -1.2581374645233154, -0.9649439454078674, -0.6717504262924194, -0.37855684757232666, -0.08536326885223389, 0.20783019065856934, 0.5010237693786621, 0.7942173480987549, 1.0874109268188477, 1.3806045055389404, 1.6737979650497437, 1.9669915437698364, 2.2601852416992188, 2.5533785820007324, 2.846572160720825, 3.139765739440918, 3.4329593181610107, 3.7261528968811035, 4.019346237182617, 4.312540054321289, 4.605733394622803, 4.898926734924316, 5.192120552062988, 5.48531436920166, 5.778507709503174, 6.071701526641846, 6.364894866943359, 6.658088684082031, 6.951282024383545, 7.244475364685059, 7.5376691818237305, 7.830862522125244]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 3.0, 12.0, 3.0, 13.0, 11.0, 13.0, 8.0, 19.0, 17.0, 18.0, 24.0, 22.0, 30.0, 36.0, 34.0, 28.0, 35.0, 51.0, 38.0, 35.0, 29.0, 38.0, 42.0, 42.0, 41.0, 42.0, 40.0, 22.0, 36.0, 33.0, 29.0, 26.0, 22.0, 23.0, 18.0, 6.0, 8.0, 9.0, 9.0, 10.0, 4.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.408603191375732, -5.249632358551025, -5.09066104888916, -4.931690216064453, -4.772719383239746, -4.613748550415039, -4.454777717590332, -4.295806407928467, -4.13683557510376, -3.9778647422790527, -3.8188936710357666, -3.6599225997924805, -3.5009517669677734, -3.3419809341430664, -3.1830098628997803, -3.024038791656494, -2.865067958831787, -2.70609712600708, -2.547126054763794, -2.388154983520508, -2.229184150695801, -2.0702133178710938, -1.9112422466278076, -1.752271294593811, -1.5933003425598145, -1.4343293905258179, -1.2753584384918213, -1.1163874864578247, -0.9574165344238281, -0.7984455823898315, -0.639474630355835, -0.4805036783218384, -0.321533203125, -0.16256225109100342, -0.003591299057006836, 0.15537965297698975, 0.31435060501098633, 0.4733215570449829, 0.6322925090789795, 0.7912634611129761, 0.9502344131469727, 1.1092053651809692, 1.2681763172149658, 1.4271472692489624, 1.586118221282959, 1.7450891733169556, 1.9040601253509521, 2.0630311965942383, 2.2220020294189453, 2.3809728622436523, 2.5399439334869385, 2.6989150047302246, 2.8578858375549316, 3.0168566703796387, 3.175827741622925, 3.334798812866211, 3.493769645690918, 3.652740478515625, 3.811711549758911, 3.9706826210021973, 4.129653453826904, 4.288624286651611, 4.447595596313477, 4.606566429138184, 4.765537261962891]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 13.0, 18.0, 37.0, 33.0, 61.0, 116.0, 118.0, 189.0, 314.0, 563.0, 882.0, 1405.0, 2255.0, 3640.0, 6071.0, 10707.0, 19694.0, 39324.0, 90347.0, 246382.0, 751592.0, 1497428.0, 984171.0, 327544.0, 112261.0, 46598.0, 22578.0, 11909.0, 6853.0, 4117.0, 2552.0, 1548.0, 999.0, 678.0, 429.0, 274.0, 174.0, 106.0, 105.0, 53.0, 31.0, 22.0, 21.0, 17.0, 11.0, 16.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.1171875, -9.7637939453125, -9.410400390625, -9.0570068359375, -8.70361328125, -8.3502197265625, -7.996826171875, -7.6434326171875, -7.2900390625, -6.9366455078125, -6.583251953125, -6.2298583984375, -5.87646484375, -5.5230712890625, -5.169677734375, -4.8162841796875, -4.462890625, -4.1094970703125, -3.756103515625, -3.4027099609375, -3.04931640625, -2.6959228515625, -2.342529296875, -1.9891357421875, -1.6357421875, -1.2823486328125, -0.928955078125, -0.5755615234375, -0.22216796875, 0.1312255859375, 0.484619140625, 0.8380126953125, 1.19140625, 1.5447998046875, 1.898193359375, 2.2515869140625, 2.60498046875, 2.9583740234375, 3.311767578125, 3.6651611328125, 4.0185546875, 4.3719482421875, 4.725341796875, 5.0787353515625, 5.43212890625, 5.7855224609375, 6.138916015625, 6.4923095703125, 6.845703125, 7.1990966796875, 7.552490234375, 7.9058837890625, 8.25927734375, 8.6126708984375, 8.966064453125, 9.3194580078125, 9.6728515625, 10.0262451171875, 10.379638671875, 10.7330322265625, 11.08642578125, 11.4398193359375, 11.793212890625, 12.1466064453125, 12.5]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 3.0, 5.0, 9.0, 3.0, 12.0, 11.0, 12.0, 13.0, 14.0, 15.0, 15.0, 26.0, 25.0, 35.0, 25.0, 38.0, 35.0, 40.0, 34.0, 46.0, 47.0, 39.0, 42.0, 31.0, 49.0, 48.0, 31.0, 42.0, 30.0, 38.0, 24.0, 34.0, 24.0, 21.0, 13.0, 14.0, 11.0, 12.0, 8.0, 5.0, 11.0, 1.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.26092529296875, -4.1273193359375, -3.99371337890625, -3.860107421875, -3.72650146484375, -3.5928955078125, -3.45928955078125, -3.32568359375, -3.19207763671875, -3.0584716796875, -2.92486572265625, -2.791259765625, -2.65765380859375, -2.5240478515625, -2.39044189453125, -2.2568359375, -2.12322998046875, -1.9896240234375, -1.85601806640625, -1.722412109375, -1.58880615234375, -1.4552001953125, -1.32159423828125, -1.18798828125, -1.05438232421875, -0.9207763671875, -0.78717041015625, -0.653564453125, -0.51995849609375, -0.3863525390625, -0.25274658203125, -0.119140625, 0.01446533203125, 0.1480712890625, 0.28167724609375, 0.415283203125, 0.54888916015625, 0.6824951171875, 0.81610107421875, 0.94970703125, 1.08331298828125, 1.2169189453125, 1.35052490234375, 1.484130859375, 1.61773681640625, 1.7513427734375, 1.88494873046875, 2.0185546875, 2.15216064453125, 2.2857666015625, 2.41937255859375, 2.552978515625, 2.68658447265625, 2.8201904296875, 2.95379638671875, 3.08740234375, 3.22100830078125, 3.3546142578125, 3.48822021484375, 3.621826171875, 3.75543212890625, 3.8890380859375, 4.02264404296875, 4.15625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 12.0, 10.0, 26.0, 27.0, 53.0, 74.0, 121.0, 185.0, 262.0, 461.0, 690.0, 1039.0, 1716.0, 2824.0, 4546.0, 8021.0, 13887.0, 25936.0, 51784.0, 108748.0, 246948.0, 591001.0, 1194175.0, 1066500.0, 483913.0, 203333.0, 91398.0, 44162.0, 22620.0, 12365.0, 6885.0, 4017.0, 2503.0, 1430.0, 938.0, 562.0, 390.0, 235.0, 161.0, 104.0, 72.0, 46.0, 38.0, 19.0, 21.0, 15.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.8671875, -10.5263671875, -10.185546875, -9.8447265625, -9.50390625, -9.1630859375, -8.822265625, -8.4814453125, -8.140625, -7.7998046875, -7.458984375, -7.1181640625, -6.77734375, -6.4365234375, -6.095703125, -5.7548828125, -5.4140625, -5.0732421875, -4.732421875, -4.3916015625, -4.05078125, -3.7099609375, -3.369140625, -3.0283203125, -2.6875, -2.3466796875, -2.005859375, -1.6650390625, -1.32421875, -0.9833984375, -0.642578125, -0.3017578125, 0.0390625, 0.3798828125, 0.720703125, 1.0615234375, 1.40234375, 1.7431640625, 2.083984375, 2.4248046875, 2.765625, 3.1064453125, 3.447265625, 3.7880859375, 4.12890625, 4.4697265625, 4.810546875, 5.1513671875, 5.4921875, 5.8330078125, 6.173828125, 6.5146484375, 6.85546875, 7.1962890625, 7.537109375, 7.8779296875, 8.21875, 8.5595703125, 8.900390625, 9.2412109375, 9.58203125, 9.9228515625, 10.263671875, 10.6044921875, 10.9453125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 5.0, 7.0, 11.0, 15.0, 14.0, 24.0, 38.0, 28.0, 55.0, 60.0, 90.0, 127.0, 148.0, 206.0, 253.0, 313.0, 374.0, 400.0, 368.0, 345.0, 241.0, 213.0, 161.0, 130.0, 113.0, 91.0, 53.0, 41.0, 34.0, 25.0, 22.0, 14.0, 12.0, 12.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.041015625, -2.930755615234375, -2.82049560546875, -2.710235595703125, -2.5999755859375, -2.489715576171875, -2.37945556640625, -2.269195556640625, -2.158935546875, -2.048675537109375, -1.93841552734375, -1.828155517578125, -1.7178955078125, -1.607635498046875, -1.49737548828125, -1.387115478515625, -1.27685546875, -1.166595458984375, -1.05633544921875, -0.946075439453125, -0.8358154296875, -0.725555419921875, -0.61529541015625, -0.505035400390625, -0.394775390625, -0.284515380859375, -0.17425537109375, -0.063995361328125, 0.0462646484375, 0.156524658203125, 0.26678466796875, 0.377044677734375, 0.4873046875, 0.597564697265625, 0.70782470703125, 0.818084716796875, 0.9283447265625, 1.038604736328125, 1.14886474609375, 1.259124755859375, 1.369384765625, 1.479644775390625, 1.58990478515625, 1.700164794921875, 1.8104248046875, 1.920684814453125, 2.03094482421875, 2.141204833984375, 2.25146484375, 2.361724853515625, 2.47198486328125, 2.582244873046875, 2.6925048828125, 2.802764892578125, 2.91302490234375, 3.023284912109375, 3.133544921875, 3.243804931640625, 3.35406494140625, 3.464324951171875, 3.5745849609375, 3.684844970703125, 3.79510498046875, 3.905364990234375, 4.015625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 9.0, 8.0, 14.0, 11.0, 17.0, 19.0, 22.0, 19.0, 33.0, 25.0, 46.0, 48.0, 49.0, 73.0, 76.0, 70.0, 75.0, 58.0, 51.0, 36.0, 41.0, 38.0, 36.0, 27.0, 12.0, 13.0, 8.0, 12.0, 7.0, 8.0, 7.0, 1.0, 4.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.345856666564941, -10.03372859954834, -9.721600532531738, -9.409473419189453, -9.097345352172852, -8.78521728515625, -8.473089218139648, -8.160961151123047, -7.8488335609436035, -7.536705493927002, -7.224577903747559, -6.912449836730957, -6.6003217697143555, -6.288194179534912, -5.9760661125183105, -5.663938522338867, -5.351810455322266, -5.039682388305664, -4.727554798126221, -4.415426731109619, -4.103299140930176, -3.791171073913574, -3.4790430068969727, -3.16691517829895, -2.8547873497009277, -2.5426595211029053, -2.230531692504883, -1.9184036254882812, -1.6062757968902588, -1.2941479682922363, -0.9820200204849243, -0.6698920726776123, -0.35776424407958984, -0.04563635587692261, 0.26649153232574463, 0.5786194205284119, 0.8907473087310791, 1.2028751373291016, 1.5150030851364136, 1.8271310329437256, 2.139258861541748, 2.4513866901397705, 2.763514518737793, 3.0756425857543945, 3.387770414352417, 3.6998982429504395, 4.012026309967041, 4.324153900146484, 4.636281967163086, 4.9484100341796875, 5.260537624359131, 5.572665691375732, 5.884793281555176, 6.196921348571777, 6.509049415588379, 6.8211774826049805, 7.133305072784424, 7.445433139801025, 7.757560729980469, 8.06968879699707, 8.381816864013672, 8.693944931030273, 9.006072044372559, 9.31820011138916, 9.630328178405762]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 16.0, 10.0, 13.0, 18.0, 10.0, 17.0, 15.0, 13.0, 20.0, 26.0, 22.0, 32.0, 25.0, 34.0, 34.0, 28.0, 42.0, 40.0, 34.0, 45.0, 34.0, 48.0, 28.0, 48.0, 40.0, 35.0, 32.0, 30.0, 19.0, 21.0, 19.0, 21.0, 19.0, 16.0, 14.0, 12.0, 15.0, 8.0, 9.0, 8.0, 7.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.479977607727051, -5.306244373321533, -5.132511615753174, -4.958778381347656, -4.785045146942139, -4.611311912536621, -4.437579154968262, -4.263845920562744, -4.090112686157227, -3.916379690170288, -3.7426464557647705, -3.568913459777832, -3.3951802253723145, -3.221447229385376, -3.0477142333984375, -2.87398099899292, -2.7002482414245605, -2.526515245437622, -2.3527820110321045, -2.179049015045166, -2.0053157806396484, -1.83158278465271, -1.6578497886657715, -1.4841166734695435, -1.3103835582733154, -1.1366504430770874, -0.9629173874855042, -0.7891843318939209, -0.6154512166976929, -0.44171810150146484, -0.26798510551452637, -0.09425199031829834, 0.07948160171508789, 0.25321468710899353, 0.42694777250289917, 0.6006808280944824, 0.7744139432907104, 0.9481470584869385, 1.121880054473877, 1.295613169670105, 1.469346284866333, 1.643079400062561, 1.816812515258789, 1.9905455112457275, 2.164278507232666, 2.3380117416381836, 2.511744737625122, 2.6854777336120605, 2.859210968017578, 3.0329439640045166, 3.206677198410034, 3.3804101943969727, 3.5541434288024902, 3.7278764247894287, 3.901609420776367, 4.075342655181885, 4.249075889587402, 4.42280912399292, 4.596541881561279, 4.770275115966797, 4.9440083503723145, 5.117741584777832, 5.291474342346191, 5.465207576751709, 5.638940334320068]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 16.0, 15.0, 31.0, 42.0, 67.0, 120.0, 147.0, 259.0, 445.0, 738.0, 1150.0, 2044.0, 3514.0, 6123.0, 10372.0, 17987.0, 31081.0, 52445.0, 86317.0, 134149.0, 177135.0, 176225.0, 134019.0, 86701.0, 52809.0, 31274.0, 17988.0, 10578.0, 6063.0, 3568.0, 2057.0, 1225.0, 690.0, 448.0, 270.0, 190.0, 99.0, 58.0, 33.0, 19.0, 17.0, 14.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.046875, -3.9278564453125, -3.808837890625, -3.6898193359375, -3.57080078125, -3.4517822265625, -3.332763671875, -3.2137451171875, -3.0947265625, -2.9757080078125, -2.856689453125, -2.7376708984375, -2.61865234375, -2.4996337890625, -2.380615234375, -2.2615966796875, -2.142578125, -2.0235595703125, -1.904541015625, -1.7855224609375, -1.66650390625, -1.5474853515625, -1.428466796875, -1.3094482421875, -1.1904296875, -1.0714111328125, -0.952392578125, -0.8333740234375, -0.71435546875, -0.5953369140625, -0.476318359375, -0.3572998046875, -0.23828125, -0.1192626953125, -0.000244140625, 0.1187744140625, 0.23779296875, 0.3568115234375, 0.475830078125, 0.5948486328125, 0.7138671875, 0.8328857421875, 0.951904296875, 1.0709228515625, 1.18994140625, 1.3089599609375, 1.427978515625, 1.5469970703125, 1.666015625, 1.7850341796875, 1.904052734375, 2.0230712890625, 2.14208984375, 2.2611083984375, 2.380126953125, 2.4991455078125, 2.6181640625, 2.7371826171875, 2.856201171875, 2.9752197265625, 3.09423828125, 3.2132568359375, 3.332275390625, 3.4512939453125, 3.5703125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 9.0, 11.0, 16.0, 12.0, 15.0, 11.0, 23.0, 11.0, 35.0, 25.0, 18.0, 43.0, 32.0, 24.0, 34.0, 34.0, 37.0, 43.0, 33.0, 52.0, 46.0, 44.0, 28.0, 36.0, 23.0, 34.0, 32.0, 23.0, 18.0, 24.0, 20.0, 26.0, 17.0, 11.0, 13.0, 11.0, 10.0, 10.0, 12.0, 7.0, 7.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.09979248046875, -4.9183349609375, -4.73687744140625, -4.555419921875, -4.37396240234375, -4.1925048828125, -4.01104736328125, -3.82958984375, -3.64813232421875, -3.4666748046875, -3.28521728515625, -3.103759765625, -2.92230224609375, -2.7408447265625, -2.55938720703125, -2.3779296875, -2.19647216796875, -2.0150146484375, -1.83355712890625, -1.652099609375, -1.47064208984375, -1.2891845703125, -1.10772705078125, -0.92626953125, -0.74481201171875, -0.5633544921875, -0.38189697265625, -0.200439453125, -0.01898193359375, 0.1624755859375, 0.34393310546875, 0.525390625, 0.70684814453125, 0.8883056640625, 1.06976318359375, 1.251220703125, 1.43267822265625, 1.6141357421875, 1.79559326171875, 1.97705078125, 2.15850830078125, 2.3399658203125, 2.52142333984375, 2.702880859375, 2.88433837890625, 3.0657958984375, 3.24725341796875, 3.4287109375, 3.61016845703125, 3.7916259765625, 3.97308349609375, 4.154541015625, 4.33599853515625, 4.5174560546875, 4.69891357421875, 4.88037109375, 5.06182861328125, 5.2432861328125, 5.42474365234375, 5.606201171875, 5.78765869140625, 5.9691162109375, 6.15057373046875, 6.33203125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 11.0, 15.0, 21.0, 36.0, 38.0, 70.0, 112.0, 178.0, 265.0, 427.0, 604.0, 949.0, 1600.0, 2631.0, 4382.0, 7313.0, 12974.0, 23337.0, 41742.0, 77648.0, 137468.0, 209967.0, 210230.0, 139154.0, 78778.0, 42981.0, 23291.0, 13285.0, 7447.0, 4474.0, 2687.0, 1628.0, 1030.0, 626.0, 389.0, 249.0, 163.0, 112.0, 77.0, 42.0, 37.0, 29.0, 15.0, 10.0, 10.0, 8.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.94140625, -4.78704833984375, -4.6326904296875, -4.47833251953125, -4.323974609375, -4.16961669921875, -4.0152587890625, -3.86090087890625, -3.70654296875, -3.55218505859375, -3.3978271484375, -3.24346923828125, -3.089111328125, -2.93475341796875, -2.7803955078125, -2.62603759765625, -2.4716796875, -2.31732177734375, -2.1629638671875, -2.00860595703125, -1.854248046875, -1.69989013671875, -1.5455322265625, -1.39117431640625, -1.23681640625, -1.08245849609375, -0.9281005859375, -0.77374267578125, -0.619384765625, -0.46502685546875, -0.3106689453125, -0.15631103515625, -0.001953125, 0.15240478515625, 0.3067626953125, 0.46112060546875, 0.615478515625, 0.76983642578125, 0.9241943359375, 1.07855224609375, 1.23291015625, 1.38726806640625, 1.5416259765625, 1.69598388671875, 1.850341796875, 2.00469970703125, 2.1590576171875, 2.31341552734375, 2.4677734375, 2.62213134765625, 2.7764892578125, 2.93084716796875, 3.085205078125, 3.23956298828125, 3.3939208984375, 3.54827880859375, 3.70263671875, 3.85699462890625, 4.0113525390625, 4.16571044921875, 4.320068359375, 4.47442626953125, 4.6287841796875, 4.78314208984375, 4.9375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 7.0, 11.0, 8.0, 12.0, 9.0, 10.0, 12.0, 22.0, 20.0, 22.0, 25.0, 31.0, 33.0, 36.0, 41.0, 45.0, 32.0, 42.0, 39.0, 40.0, 43.0, 47.0, 36.0, 46.0, 45.0, 46.0, 30.0, 36.0, 25.0, 18.0, 21.0, 25.0, 18.0, 9.0, 12.0, 8.0, 12.0, 4.0, 14.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.745025634765625, -3.62286376953125, -3.500701904296875, -3.3785400390625, -3.256378173828125, -3.13421630859375, -3.012054443359375, -2.889892578125, -2.767730712890625, -2.64556884765625, -2.523406982421875, -2.4012451171875, -2.279083251953125, -2.15692138671875, -2.034759521484375, -1.91259765625, -1.790435791015625, -1.66827392578125, -1.546112060546875, -1.4239501953125, -1.301788330078125, -1.17962646484375, -1.057464599609375, -0.935302734375, -0.813140869140625, -0.69097900390625, -0.568817138671875, -0.4466552734375, -0.324493408203125, -0.20233154296875, -0.080169677734375, 0.0419921875, 0.164154052734375, 0.28631591796875, 0.408477783203125, 0.5306396484375, 0.652801513671875, 0.77496337890625, 0.897125244140625, 1.019287109375, 1.141448974609375, 1.26361083984375, 1.385772705078125, 1.5079345703125, 1.630096435546875, 1.75225830078125, 1.874420166015625, 1.99658203125, 2.118743896484375, 2.24090576171875, 2.363067626953125, 2.4852294921875, 2.607391357421875, 2.72955322265625, 2.851715087890625, 2.973876953125, 3.096038818359375, 3.21820068359375, 3.340362548828125, 3.4625244140625, 3.584686279296875, 3.70684814453125, 3.829010009765625, 3.951171875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 10.0, 20.0, 38.0, 49.0, 81.0, 89.0, 170.0, 227.0, 365.0, 559.0, 820.0, 1254.0, 1958.0, 3056.0, 4839.0, 7966.0, 13242.0, 22948.0, 40494.0, 73302.0, 129858.0, 204706.0, 213723.0, 141353.0, 80276.0, 44559.0, 25002.0, 14552.0, 8499.0, 5196.0, 3254.0, 2019.0, 1349.0, 869.0, 625.0, 380.0, 266.0, 184.0, 128.0, 87.0, 54.0, 39.0, 30.0, 15.0, 10.0, 6.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.453125, -2.37896728515625, -2.3048095703125, -2.23065185546875, -2.156494140625, -2.08233642578125, -2.0081787109375, -1.93402099609375, -1.85986328125, -1.78570556640625, -1.7115478515625, -1.63739013671875, -1.563232421875, -1.48907470703125, -1.4149169921875, -1.34075927734375, -1.2666015625, -1.19244384765625, -1.1182861328125, -1.04412841796875, -0.969970703125, -0.89581298828125, -0.8216552734375, -0.74749755859375, -0.67333984375, -0.59918212890625, -0.5250244140625, -0.45086669921875, -0.376708984375, -0.30255126953125, -0.2283935546875, -0.15423583984375, -0.080078125, -0.00592041015625, 0.0682373046875, 0.14239501953125, 0.216552734375, 0.29071044921875, 0.3648681640625, 0.43902587890625, 0.51318359375, 0.58734130859375, 0.6614990234375, 0.73565673828125, 0.809814453125, 0.88397216796875, 0.9581298828125, 1.03228759765625, 1.1064453125, 1.18060302734375, 1.2547607421875, 1.32891845703125, 1.403076171875, 1.47723388671875, 1.5513916015625, 1.62554931640625, 1.69970703125, 1.77386474609375, 1.8480224609375, 1.92218017578125, 1.996337890625, 2.07049560546875, 2.1446533203125, 2.21881103515625, 2.29296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 13.0, 6.0, 17.0, 15.0, 24.0, 24.0, 21.0, 36.0, 50.0, 61.0, 85.0, 67.0, 73.0, 73.0, 79.0, 59.0, 57.0, 60.0, 33.0, 30.0, 25.0, 19.0, 11.0, 8.0, 10.0, 5.0, 5.0, 8.0, 0.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0001475811004638672, -0.0001432131975889206, -0.000138845294713974, -0.0001344773918390274, -0.0001301094889640808, -0.00012574158608913422, -0.00012137368321418762, -0.00011700578033924103, -0.00011263787746429443, -0.00010826997458934784, -0.00010390207171440125, -9.953416883945465e-05, -9.516626596450806e-05, -9.079836308956146e-05, -8.643046021461487e-05, -8.206255733966827e-05, -7.769465446472168e-05, -7.332675158977509e-05, -6.895884871482849e-05, -6.45909458398819e-05, -6.02230429649353e-05, -5.585514008998871e-05, -5.1487237215042114e-05, -4.711933434009552e-05, -4.2751431465148926e-05, -3.838352859020233e-05, -3.401562571525574e-05, -2.9647722840309143e-05, -2.527981996536255e-05, -2.0911917090415955e-05, -1.654401421546936e-05, -1.2176111340522766e-05, -7.808208465576172e-06, -3.4403055906295776e-06, 9.275972843170166e-07, 5.295500159263611e-06, 9.663403034210205e-06, 1.40313059091568e-05, 1.8399208784103394e-05, 2.2767111659049988e-05, 2.7135014533996582e-05, 3.1502917408943176e-05, 3.587082028388977e-05, 4.0238723158836365e-05, 4.460662603378296e-05, 4.897452890872955e-05, 5.334243178367615e-05, 5.771033465862274e-05, 6.207823753356934e-05, 6.644614040851593e-05, 7.081404328346252e-05, 7.518194615840912e-05, 7.954984903335571e-05, 8.391775190830231e-05, 8.82856547832489e-05, 9.26535576581955e-05, 9.702146053314209e-05, 0.00010138936340808868, 0.00010575726628303528, 0.00011012516915798187, 0.00011449307203292847, 0.00011886097490787506, 0.00012322887778282166, 0.00012759678065776825, 0.00013196468353271484]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 13.0, 23.0, 21.0, 32.0, 56.0, 69.0, 105.0, 157.0, 204.0, 345.0, 483.0, 763.0, 1212.0, 1733.0, 2771.0, 4331.0, 6666.0, 10490.0, 16912.0, 27407.0, 44394.0, 70788.0, 107968.0, 148045.0, 167108.0, 146026.0, 106197.0, 68996.0, 43177.0, 26685.0, 16377.0, 10436.0, 6620.0, 4003.0, 2713.0, 1826.0, 1124.0, 750.0, 490.0, 333.0, 217.0, 157.0, 118.0, 77.0, 47.0, 20.0, 22.0, 20.0, 10.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.982421875, -1.91943359375, -1.8564453125, -1.79345703125, -1.73046875, -1.66748046875, -1.6044921875, -1.54150390625, -1.478515625, -1.41552734375, -1.3525390625, -1.28955078125, -1.2265625, -1.16357421875, -1.1005859375, -1.03759765625, -0.974609375, -0.91162109375, -0.8486328125, -0.78564453125, -0.72265625, -0.65966796875, -0.5966796875, -0.53369140625, -0.470703125, -0.40771484375, -0.3447265625, -0.28173828125, -0.21875, -0.15576171875, -0.0927734375, -0.02978515625, 0.033203125, 0.09619140625, 0.1591796875, 0.22216796875, 0.28515625, 0.34814453125, 0.4111328125, 0.47412109375, 0.537109375, 0.60009765625, 0.6630859375, 0.72607421875, 0.7890625, 0.85205078125, 0.9150390625, 0.97802734375, 1.041015625, 1.10400390625, 1.1669921875, 1.22998046875, 1.29296875, 1.35595703125, 1.4189453125, 1.48193359375, 1.544921875, 1.60791015625, 1.6708984375, 1.73388671875, 1.796875, 1.85986328125, 1.9228515625, 1.98583984375, 2.048828125]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 6.0, 7.0, 8.0, 7.0, 6.0, 16.0, 16.0, 14.0, 18.0, 18.0, 34.0, 29.0, 28.0, 37.0, 52.0, 46.0, 49.0, 47.0, 55.0, 48.0, 41.0, 53.0, 41.0, 49.0, 30.0, 41.0, 29.0, 29.0, 21.0, 23.0, 14.0, 15.0, 15.0, 17.0, 5.0, 13.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6630859375, -0.6432113647460938, -0.6233367919921875, -0.6034622192382812, -0.583587646484375, -0.5637130737304688, -0.5438385009765625, -0.5239639282226562, -0.50408935546875, -0.48421478271484375, -0.4643402099609375, -0.44446563720703125, -0.424591064453125, -0.40471649169921875, -0.3848419189453125, -0.36496734619140625, -0.3450927734375, -0.32521820068359375, -0.3053436279296875, -0.28546905517578125, -0.265594482421875, -0.24571990966796875, -0.2258453369140625, -0.20597076416015625, -0.18609619140625, -0.16622161865234375, -0.1463470458984375, -0.12647247314453125, -0.106597900390625, -0.08672332763671875, -0.0668487548828125, -0.04697418212890625, -0.027099609375, -0.00722503662109375, 0.0126495361328125, 0.03252410888671875, 0.052398681640625, 0.07227325439453125, 0.0921478271484375, 0.11202239990234375, 0.13189697265625, 0.15177154541015625, 0.1716461181640625, 0.19152069091796875, 0.211395263671875, 0.23126983642578125, 0.2511444091796875, 0.27101898193359375, 0.2908935546875, 0.31076812744140625, 0.3306427001953125, 0.35051727294921875, 0.370391845703125, 0.39026641845703125, 0.4101409912109375, 0.43001556396484375, 0.44989013671875, 0.46976470947265625, 0.4896392822265625, 0.5095138549804688, 0.529388427734375, 0.5492630004882812, 0.5691375732421875, 0.5890121459960938, 0.60888671875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 0.0, 4.0, 5.0, 6.0, 8.0, 8.0, 15.0, 13.0, 16.0, 23.0, 28.0, 28.0, 31.0, 43.0, 61.0, 48.0, 78.0, 77.0, 78.0, 71.0, 57.0, 47.0, 48.0, 38.0, 42.0, 30.0, 13.0, 9.0, 14.0, 10.0, 13.0, 8.0, 5.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.154535293579102, -10.825577735900879, -10.496620178222656, -10.16766357421875, -9.838706016540527, -9.509748458862305, -9.180790901184082, -8.85183334350586, -8.522875785827637, -8.193918228149414, -7.86496114730835, -7.536003589630127, -7.207046031951904, -6.87808895111084, -6.549131393432617, -6.2201738357543945, -5.89121675491333, -5.562259197235107, -5.233302116394043, -4.90434455871582, -4.575387001037598, -4.246429443359375, -3.9174723625183105, -3.588514804840088, -3.2595574855804443, -2.930600166320801, -2.601642608642578, -2.2726852893829346, -1.9437278509140015, -1.6147704124450684, -1.2858130931854248, -0.9568555355072021, -0.6278982162475586, -0.2989408075809479, 0.030016601085662842, 0.35897397994995117, 0.6879314184188843, 1.0168888568878174, 1.345846176147461, 1.6748037338256836, 2.003761053085327, 2.3327183723449707, 2.6616759300231934, 2.990633249282837, 3.3195905685424805, 3.648548126220703, 3.9775054454803467, 4.306463241577148, 4.635420322418213, 4.9643778800964355, 5.2933349609375, 5.622292518615723, 5.951250076293945, 6.280207633972168, 6.609164714813232, 6.938122272491455, 7.2670793533325195, 7.596036911010742, 7.924993991851807, 8.253952026367188, 8.582908630371094, 8.911866188049316, 9.240823745727539, 9.569781303405762, 9.898738861083984]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 5.0, 12.0, 13.0, 13.0, 15.0, 14.0, 12.0, 16.0, 14.0, 22.0, 22.0, 22.0, 23.0, 27.0, 36.0, 32.0, 32.0, 27.0, 48.0, 37.0, 31.0, 60.0, 38.0, 30.0, 39.0, 45.0, 41.0, 40.0, 23.0, 22.0, 24.0, 19.0, 21.0, 19.0, 22.0, 13.0, 13.0, 16.0, 10.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.661330223083496, -5.485322952270508, -5.3093156814575195, -5.133308410644531, -4.957301139831543, -4.781293869018555, -4.605286598205566, -4.429279327392578, -4.25327205657959, -4.077264785766602, -3.9012575149536133, -3.725250244140625, -3.5492429733276367, -3.3732357025146484, -3.19722843170166, -3.021221160888672, -2.8452138900756836, -2.6692066192626953, -2.493199348449707, -2.3171920776367188, -2.1411848068237305, -1.9651775360107422, -1.789170265197754, -1.6131629943847656, -1.4371557235717773, -1.261148452758789, -1.0851411819458008, -0.9091339111328125, -0.7331266403198242, -0.5571193695068359, -0.38111209869384766, -0.20510482788085938, -0.02909708023071289, 0.1469101905822754, 0.32291746139526367, 0.49892473220825195, 0.6749320030212402, 0.8509392738342285, 1.0269465446472168, 1.202953815460205, 1.3789610862731934, 1.5549683570861816, 1.73097562789917, 1.9069828987121582, 2.0829901695251465, 2.2589974403381348, 2.435004711151123, 2.6110119819641113, 2.7870192527770996, 2.963026523590088, 3.139033794403076, 3.3150410652160645, 3.4910483360290527, 3.667055606842041, 3.8430628776550293, 4.019070148468018, 4.195077419281006, 4.371084690093994, 4.547091960906982, 4.723099231719971, 4.899106502532959, 5.075113773345947, 5.2511210441589355, 5.427128314971924, 5.603135585784912]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 13.0, 20.0, 33.0, 42.0, 63.0, 110.0, 150.0, 257.0, 386.0, 612.0, 984.0, 1487.0, 2194.0, 3343.0, 5342.0, 8465.0, 13044.0, 20142.0, 30653.0, 46831.0, 69623.0, 97470.0, 126392.0, 142349.0, 134910.0, 108950.0, 78992.0, 54270.0, 35474.0, 23397.0, 15097.0, 9811.0, 6286.0, 4050.0, 2644.0, 1674.0, 1100.0, 667.0, 458.0, 266.0, 193.0, 118.0, 68.0, 53.0, 24.0, 12.0, 5.0, 9.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.2578125, -4.1190185546875, -3.980224609375, -3.8414306640625, -3.70263671875, -3.5638427734375, -3.425048828125, -3.2862548828125, -3.1474609375, -3.0086669921875, -2.869873046875, -2.7310791015625, -2.59228515625, -2.4534912109375, -2.314697265625, -2.1759033203125, -2.037109375, -1.8983154296875, -1.759521484375, -1.6207275390625, -1.48193359375, -1.3431396484375, -1.204345703125, -1.0655517578125, -0.9267578125, -0.7879638671875, -0.649169921875, -0.5103759765625, -0.37158203125, -0.2327880859375, -0.093994140625, 0.0447998046875, 0.18359375, 0.3223876953125, 0.461181640625, 0.5999755859375, 0.73876953125, 0.8775634765625, 1.016357421875, 1.1551513671875, 1.2939453125, 1.4327392578125, 1.571533203125, 1.7103271484375, 1.84912109375, 1.9879150390625, 2.126708984375, 2.2655029296875, 2.404296875, 2.5430908203125, 2.681884765625, 2.8206787109375, 2.95947265625, 3.0982666015625, 3.237060546875, 3.3758544921875, 3.5146484375, 3.6534423828125, 3.792236328125, 3.9310302734375, 4.06982421875, 4.2086181640625, 4.347412109375, 4.4862060546875, 4.625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 9.0, 7.0, 8.0, 7.0, 10.0, 15.0, 8.0, 15.0, 23.0, 14.0, 19.0, 21.0, 19.0, 20.0, 37.0, 33.0, 31.0, 27.0, 33.0, 32.0, 40.0, 48.0, 34.0, 38.0, 33.0, 53.0, 31.0, 32.0, 36.0, 38.0, 23.0, 20.0, 15.0, 24.0, 23.0, 13.0, 15.0, 11.0, 14.0, 15.0, 7.0, 9.0, 6.0, 8.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.046875, -4.87652587890625, -4.7061767578125, -4.53582763671875, -4.365478515625, -4.19512939453125, -4.0247802734375, -3.85443115234375, -3.68408203125, -3.51373291015625, -3.3433837890625, -3.17303466796875, -3.002685546875, -2.83233642578125, -2.6619873046875, -2.49163818359375, -2.3212890625, -2.15093994140625, -1.9805908203125, -1.81024169921875, -1.639892578125, -1.46954345703125, -1.2991943359375, -1.12884521484375, -0.95849609375, -0.78814697265625, -0.6177978515625, -0.44744873046875, -0.277099609375, -0.10675048828125, 0.0635986328125, 0.23394775390625, 0.404296875, 0.57464599609375, 0.7449951171875, 0.91534423828125, 1.085693359375, 1.25604248046875, 1.4263916015625, 1.59674072265625, 1.76708984375, 1.93743896484375, 2.1077880859375, 2.27813720703125, 2.448486328125, 2.61883544921875, 2.7891845703125, 2.95953369140625, 3.1298828125, 3.30023193359375, 3.4705810546875, 3.64093017578125, 3.811279296875, 3.98162841796875, 4.1519775390625, 4.32232666015625, 4.49267578125, 4.66302490234375, 4.8333740234375, 5.00372314453125, 5.174072265625, 5.34442138671875, 5.5147705078125, 5.68511962890625, 5.85546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 12.0, 23.0, 38.0, 67.0, 89.0, 115.0, 231.0, 371.0, 531.0, 864.0, 1388.0, 2183.0, 3487.0, 5403.0, 8731.0, 13523.0, 21290.0, 32855.0, 49945.0, 74786.0, 103393.0, 131296.0, 143577.0, 132396.0, 104670.0, 73978.0, 50963.0, 33706.0, 21409.0, 13684.0, 8710.0, 5373.0, 3447.0, 2189.0, 1336.0, 893.0, 622.0, 346.0, 232.0, 151.0, 87.0, 65.0, 37.0, 19.0, 18.0, 11.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.45245361328125, -4.3111572265625, -4.16986083984375, -4.028564453125, -3.88726806640625, -3.7459716796875, -3.60467529296875, -3.46337890625, -3.32208251953125, -3.1807861328125, -3.03948974609375, -2.898193359375, -2.75689697265625, -2.6156005859375, -2.47430419921875, -2.3330078125, -2.19171142578125, -2.0504150390625, -1.90911865234375, -1.767822265625, -1.62652587890625, -1.4852294921875, -1.34393310546875, -1.20263671875, -1.06134033203125, -0.9200439453125, -0.77874755859375, -0.637451171875, -0.49615478515625, -0.3548583984375, -0.21356201171875, -0.072265625, 0.06903076171875, 0.2103271484375, 0.35162353515625, 0.492919921875, 0.63421630859375, 0.7755126953125, 0.91680908203125, 1.05810546875, 1.19940185546875, 1.3406982421875, 1.48199462890625, 1.623291015625, 1.76458740234375, 1.9058837890625, 2.04718017578125, 2.1884765625, 2.32977294921875, 2.4710693359375, 2.61236572265625, 2.753662109375, 2.89495849609375, 3.0362548828125, 3.17755126953125, 3.31884765625, 3.46014404296875, 3.6014404296875, 3.74273681640625, 3.884033203125, 4.02532958984375, 4.1666259765625, 4.30792236328125, 4.44921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 3.0, 7.0, 6.0, 8.0, 9.0, 12.0, 12.0, 19.0, 13.0, 15.0, 21.0, 16.0, 29.0, 23.0, 20.0, 42.0, 31.0, 35.0, 33.0, 31.0, 43.0, 53.0, 31.0, 33.0, 38.0, 43.0, 27.0, 33.0, 31.0, 24.0, 27.0, 33.0, 23.0, 17.0, 20.0, 24.0, 19.0, 18.0, 12.0, 10.0, 8.0, 10.0, 9.0, 8.0, 2.0, 2.0, 7.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.2421875, -3.137054443359375, -3.03192138671875, -2.926788330078125, -2.8216552734375, -2.716522216796875, -2.61138916015625, -2.506256103515625, -2.401123046875, -2.295989990234375, -2.19085693359375, -2.085723876953125, -1.9805908203125, -1.875457763671875, -1.77032470703125, -1.665191650390625, -1.56005859375, -1.454925537109375, -1.34979248046875, -1.244659423828125, -1.1395263671875, -1.034393310546875, -0.92926025390625, -0.824127197265625, -0.718994140625, -0.613861083984375, -0.50872802734375, -0.403594970703125, -0.2984619140625, -0.193328857421875, -0.08819580078125, 0.016937255859375, 0.1220703125, 0.227203369140625, 0.33233642578125, 0.437469482421875, 0.5426025390625, 0.647735595703125, 0.75286865234375, 0.858001708984375, 0.963134765625, 1.068267822265625, 1.17340087890625, 1.278533935546875, 1.3836669921875, 1.488800048828125, 1.59393310546875, 1.699066162109375, 1.80419921875, 1.909332275390625, 2.01446533203125, 2.119598388671875, 2.2247314453125, 2.329864501953125, 2.43499755859375, 2.540130615234375, 2.645263671875, 2.750396728515625, 2.85552978515625, 2.960662841796875, 3.0657958984375, 3.170928955078125, 3.27606201171875, 3.381195068359375, 3.486328125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 10.0, 16.0, 27.0, 47.0, 35.0, 64.0, 83.0, 112.0, 182.0, 246.0, 391.0, 539.0, 835.0, 1368.0, 2175.0, 3511.0, 6294.0, 11263.0, 20364.0, 38186.0, 72501.0, 131440.0, 200931.0, 214501.0, 153695.0, 87559.0, 45847.0, 24414.0, 13142.0, 7338.0, 4280.0, 2547.0, 1617.0, 972.0, 625.0, 449.0, 275.0, 186.0, 132.0, 91.0, 54.0, 58.0, 41.0, 26.0, 24.0, 19.0, 10.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.0703125, -2.968475341796875, -2.86663818359375, -2.764801025390625, -2.6629638671875, -2.561126708984375, -2.45928955078125, -2.357452392578125, -2.255615234375, -2.153778076171875, -2.05194091796875, -1.950103759765625, -1.8482666015625, -1.746429443359375, -1.64459228515625, -1.542755126953125, -1.44091796875, -1.339080810546875, -1.23724365234375, -1.135406494140625, -1.0335693359375, -0.931732177734375, -0.82989501953125, -0.728057861328125, -0.626220703125, -0.524383544921875, -0.42254638671875, -0.320709228515625, -0.2188720703125, -0.117034912109375, -0.01519775390625, 0.086639404296875, 0.1884765625, 0.290313720703125, 0.39215087890625, 0.493988037109375, 0.5958251953125, 0.697662353515625, 0.79949951171875, 0.901336669921875, 1.003173828125, 1.105010986328125, 1.20684814453125, 1.308685302734375, 1.4105224609375, 1.512359619140625, 1.61419677734375, 1.716033935546875, 1.81787109375, 1.919708251953125, 2.02154541015625, 2.123382568359375, 2.2252197265625, 2.327056884765625, 2.42889404296875, 2.530731201171875, 2.632568359375, 2.734405517578125, 2.83624267578125, 2.938079833984375, 3.0399169921875, 3.141754150390625, 3.24359130859375, 3.345428466796875, 3.447265625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 3.0, 8.0, 4.0, 6.0, 13.0, 17.0, 23.0, 38.0, 60.0, 68.0, 70.0, 112.0, 103.0, 87.0, 89.0, 66.0, 49.0, 48.0, 33.0, 23.0, 22.0, 13.0, 8.0, 7.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003898143768310547, -0.00037750229239463806, -0.00036519020795822144, -0.0003528781235218048, -0.0003405660390853882, -0.00032825395464897156, -0.00031594187021255493, -0.0003036297857761383, -0.0002913177013397217, -0.00027900561690330505, -0.00026669353246688843, -0.0002543814480304718, -0.00024206936359405518, -0.00022975727915763855, -0.00021744519472122192, -0.0002051331102848053, -0.00019282102584838867, -0.00018050894141197205, -0.00016819685697555542, -0.0001558847725391388, -0.00014357268810272217, -0.00013126060366630554, -0.00011894851922988892, -0.00010663643479347229, -9.432435035705566e-05, -8.201226592063904e-05, -6.970018148422241e-05, -5.7388097047805786e-05, -4.507601261138916e-05, -3.2763928174972534e-05, -2.0451843738555908e-05, -8.139759302139282e-06, 4.172325134277344e-06, 1.648440957069397e-05, 2.8796494007110596e-05, 4.110857844352722e-05, 5.342066287994385e-05, 6.573274731636047e-05, 7.80448317527771e-05, 9.035691618919373e-05, 0.00010266900062561035, 0.00011498108506202698, 0.0001272931694984436, 0.00013960525393486023, 0.00015191733837127686, 0.00016422942280769348, 0.0001765415072441101, 0.00018885359168052673, 0.00020116567611694336, 0.00021347776055335999, 0.0002257898449897766, 0.00023810192942619324, 0.00025041401386260986, 0.0002627260982990265, 0.0002750381827354431, 0.00028735026717185974, 0.00029966235160827637, 0.000311974436044693, 0.0003242865204811096, 0.00033659860491752625, 0.00034891068935394287, 0.0003612227737903595, 0.0003735348582267761, 0.00038584694266319275, 0.0003981590270996094]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 10.0, 14.0, 16.0, 20.0, 32.0, 50.0, 85.0, 107.0, 151.0, 264.0, 381.0, 683.0, 1155.0, 2018.0, 3522.0, 6627.0, 12635.0, 25277.0, 52854.0, 108263.0, 195558.0, 247764.0, 188146.0, 102492.0, 49739.0, 23909.0, 12146.0, 6366.0, 3471.0, 1915.0, 1078.0, 640.0, 447.0, 247.0, 159.0, 100.0, 66.0, 40.0, 36.0, 24.0, 9.0, 11.0, 10.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.65234375, -3.5362548828125, -3.420166015625, -3.3040771484375, -3.18798828125, -3.0718994140625, -2.955810546875, -2.8397216796875, -2.7236328125, -2.6075439453125, -2.491455078125, -2.3753662109375, -2.25927734375, -2.1431884765625, -2.027099609375, -1.9110107421875, -1.794921875, -1.6788330078125, -1.562744140625, -1.4466552734375, -1.33056640625, -1.2144775390625, -1.098388671875, -0.9822998046875, -0.8662109375, -0.7501220703125, -0.634033203125, -0.5179443359375, -0.40185546875, -0.2857666015625, -0.169677734375, -0.0535888671875, 0.0625, 0.1785888671875, 0.294677734375, 0.4107666015625, 0.52685546875, 0.6429443359375, 0.759033203125, 0.8751220703125, 0.9912109375, 1.1072998046875, 1.223388671875, 1.3394775390625, 1.45556640625, 1.5716552734375, 1.687744140625, 1.8038330078125, 1.919921875, 2.0360107421875, 2.152099609375, 2.2681884765625, 2.38427734375, 2.5003662109375, 2.616455078125, 2.7325439453125, 2.8486328125, 2.9647216796875, 3.080810546875, 3.1968994140625, 3.31298828125, 3.4290771484375, 3.545166015625, 3.6612548828125, 3.77734375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 6.0, 13.0, 19.0, 16.0, 19.0, 25.0, 24.0, 30.0, 33.0, 46.0, 40.0, 41.0, 72.0, 61.0, 46.0, 63.0, 50.0, 57.0, 46.0, 47.0, 44.0, 28.0, 31.0, 22.0, 22.0, 14.0, 14.0, 8.0, 13.0, 11.0, 7.0, 11.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.0771484375, -1.0475082397460938, -1.0178680419921875, -0.9882278442382812, -0.958587646484375, -0.9289474487304688, -0.8993072509765625, -0.8696670532226562, -0.84002685546875, -0.8103866577148438, -0.7807464599609375, -0.7511062622070312, -0.721466064453125, -0.6918258666992188, -0.6621856689453125, -0.6325454711914062, -0.6029052734375, -0.5732650756835938, -0.5436248779296875, -0.5139846801757812, -0.484344482421875, -0.45470428466796875, -0.4250640869140625, -0.39542388916015625, -0.36578369140625, -0.33614349365234375, -0.3065032958984375, -0.27686309814453125, -0.247222900390625, -0.21758270263671875, -0.1879425048828125, -0.15830230712890625, -0.128662109375, -0.09902191162109375, -0.0693817138671875, -0.03974151611328125, -0.010101318359375, 0.01953887939453125, 0.0491790771484375, 0.07881927490234375, 0.10845947265625, 0.13809967041015625, 0.1677398681640625, 0.19738006591796875, 0.227020263671875, 0.25666046142578125, 0.2863006591796875, 0.31594085693359375, 0.3455810546875, 0.37522125244140625, 0.4048614501953125, 0.43450164794921875, 0.464141845703125, 0.49378204345703125, 0.5234222412109375, 0.5530624389648438, 0.58270263671875, 0.6123428344726562, 0.6419830322265625, 0.6716232299804688, 0.701263427734375, 0.7309036254882812, 0.7605438232421875, 0.7901840209960938, 0.81982421875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 2.0, 4.0, 7.0, 6.0, 9.0, 6.0, 14.0, 9.0, 24.0, 18.0, 32.0, 27.0, 35.0, 58.0, 49.0, 62.0, 72.0, 82.0, 66.0, 61.0, 64.0, 61.0, 24.0, 44.0, 44.0, 25.0, 23.0, 5.0, 13.0, 7.0, 8.0, 9.0, 5.0, 9.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.37326717376709, -11.045008659362793, -10.716750144958496, -10.388492584228516, -10.060234069824219, -9.731975555419922, -9.403717041015625, -9.075458526611328, -8.747200012207031, -8.418941497802734, -8.090682983398438, -7.762424945831299, -7.43416690826416, -7.105908393859863, -6.777649879455566, -6.4493913650512695, -6.121133804321289, -5.792875289916992, -5.4646172523498535, -5.136358737945557, -4.808100700378418, -4.479842185974121, -4.151583671569824, -3.8233253955841064, -3.4950671195983887, -3.166808843612671, -2.838550567626953, -2.5102920532226562, -2.1820337772369385, -1.8537755012512207, -1.5255171060562134, -1.197258710861206, -0.8690013885498047, -0.5407430529594421, -0.2124847173690796, 0.11577361822128296, 0.4440319538116455, 0.7722902297973633, 1.1005486249923706, 1.428807020187378, 1.7570652961730957, 2.0853235721588135, 2.4135818481445312, 2.741840362548828, 3.070098638534546, 3.3983569145202637, 3.7266154289245605, 4.054873466491699, 4.383131980895996, 4.711390495300293, 5.039648532867432, 5.3679070472717285, 5.696165084838867, 6.024423599243164, 6.352682113647461, 6.680940628051758, 7.0091986656188965, 7.337457180023193, 7.665715217590332, 7.993973731994629, 8.322232246398926, 8.650489807128906, 8.978748321533203, 9.3070068359375, 9.635265350341797]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 10.0, 4.0, 8.0, 8.0, 10.0, 12.0, 9.0, 12.0, 12.0, 19.0, 20.0, 18.0, 15.0, 24.0, 30.0, 25.0, 37.0, 24.0, 35.0, 37.0, 40.0, 40.0, 40.0, 35.0, 35.0, 35.0, 42.0, 40.0, 41.0, 45.0, 21.0, 30.0, 24.0, 21.0, 26.0, 19.0, 11.0, 15.0, 12.0, 16.0, 7.0, 3.0, 11.0, 5.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.67939567565918, -5.50309419631958, -5.326793193817139, -5.150491714477539, -4.9741902351379395, -4.79788875579834, -4.621587753295898, -4.445286273956299, -4.268984794616699, -4.0926833152771, -3.916382074356079, -3.7400808334350586, -3.563779354095459, -3.3874781131744385, -3.211176872253418, -3.0348753929138184, -2.858574390411377, -2.6822731494903564, -2.505971670150757, -2.3296704292297363, -2.1533689498901367, -1.9770677089691162, -1.8007664680480957, -1.6244651079177856, -1.4481637477874756, -1.2718623876571655, -1.0955610275268555, -0.919259786605835, -0.7429584264755249, -0.5666570663452148, -0.39035582542419434, -0.21405446529388428, -0.03775310516357422, 0.13854822516441345, 0.3148495554924011, 0.4911508560180664, 0.6674522161483765, 0.8437535762786865, 1.020054817199707, 1.196356177330017, 1.3726575374603271, 1.5489588975906372, 1.7252602577209473, 1.9015614986419678, 2.0778627395629883, 2.254164218902588, 2.4304654598236084, 2.606766700744629, 2.7830681800842285, 2.959369421005249, 3.1356709003448486, 3.311972141265869, 3.4882736206054688, 3.6645748615264893, 3.8408761024475098, 4.017177581787109, 4.193478584289551, 4.36978006362915, 4.546081066131592, 4.722382545471191, 4.898684024810791, 5.074985504150391, 5.251286506652832, 5.427587985992432, 5.603889465332031]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 12.0, 9.0, 11.0, 29.0, 42.0, 43.0, 76.0, 91.0, 150.0, 247.0, 369.0, 557.0, 819.0, 1304.0, 2036.0, 3098.0, 5045.0, 8459.0, 14896.0, 27026.0, 53871.0, 116996.0, 293198.0, 744650.0, 1292684.0, 949199.0, 387407.0, 149580.0, 65542.0, 32251.0, 17502.0, 10216.0, 6113.0, 3877.0, 2329.0, 1547.0, 1042.0, 695.0, 452.0, 277.0, 173.0, 131.0, 74.0, 55.0, 41.0, 23.0, 12.0, 12.0, 9.0, 2.0, 2.0, 4.0], "bins": [-12.625, -12.280517578125, -11.93603515625, -11.591552734375, -11.2470703125, -10.902587890625, -10.55810546875, -10.213623046875, -9.869140625, -9.524658203125, -9.18017578125, -8.835693359375, -8.4912109375, -8.146728515625, -7.80224609375, -7.457763671875, -7.11328125, -6.768798828125, -6.42431640625, -6.079833984375, -5.7353515625, -5.390869140625, -5.04638671875, -4.701904296875, -4.357421875, -4.012939453125, -3.66845703125, -3.323974609375, -2.9794921875, -2.635009765625, -2.29052734375, -1.946044921875, -1.6015625, -1.257080078125, -0.91259765625, -0.568115234375, -0.2236328125, 0.120849609375, 0.46533203125, 0.809814453125, 1.154296875, 1.498779296875, 1.84326171875, 2.187744140625, 2.5322265625, 2.876708984375, 3.22119140625, 3.565673828125, 3.91015625, 4.254638671875, 4.59912109375, 4.943603515625, 5.2880859375, 5.632568359375, 5.97705078125, 6.321533203125, 6.666015625, 7.010498046875, 7.35498046875, 7.699462890625, 8.0439453125, 8.388427734375, 8.73291015625, 9.077392578125, 9.421875]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 5.0, 9.0, 13.0, 17.0, 11.0, 14.0, 12.0, 27.0, 20.0, 20.0, 29.0, 25.0, 25.0, 29.0, 35.0, 28.0, 38.0, 35.0, 31.0, 53.0, 37.0, 43.0, 46.0, 33.0, 49.0, 28.0, 30.0, 33.0, 22.0, 27.0, 20.0, 23.0, 21.0, 19.0, 14.0, 16.0, 8.0, 8.0, 6.0, 9.0, 1.0, 5.0, 3.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-4.4765625, -4.3323974609375, -4.188232421875, -4.0440673828125, -3.89990234375, -3.7557373046875, -3.611572265625, -3.4674072265625, -3.3232421875, -3.1790771484375, -3.034912109375, -2.8907470703125, -2.74658203125, -2.6024169921875, -2.458251953125, -2.3140869140625, -2.169921875, -2.0257568359375, -1.881591796875, -1.7374267578125, -1.59326171875, -1.4490966796875, -1.304931640625, -1.1607666015625, -1.0166015625, -0.8724365234375, -0.728271484375, -0.5841064453125, -0.43994140625, -0.2957763671875, -0.151611328125, -0.0074462890625, 0.13671875, 0.2808837890625, 0.425048828125, 0.5692138671875, 0.71337890625, 0.8575439453125, 1.001708984375, 1.1458740234375, 1.2900390625, 1.4342041015625, 1.578369140625, 1.7225341796875, 1.86669921875, 2.0108642578125, 2.155029296875, 2.2991943359375, 2.443359375, 2.5875244140625, 2.731689453125, 2.8758544921875, 3.02001953125, 3.1641845703125, 3.308349609375, 3.4525146484375, 3.5966796875, 3.7408447265625, 3.885009765625, 4.0291748046875, 4.17333984375, 4.3175048828125, 4.461669921875, 4.6058349609375, 4.75]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 7.0, 12.0, 18.0, 27.0, 24.0, 35.0, 63.0, 89.0, 111.0, 187.0, 226.0, 381.0, 536.0, 829.0, 1264.0, 2028.0, 3029.0, 5076.0, 8529.0, 14741.0, 27617.0, 52366.0, 106600.0, 234118.0, 547070.0, 1110847.0, 1096581.0, 532716.0, 228337.0, 104277.0, 51657.0, 27303.0, 14966.0, 8713.0, 5055.0, 3149.0, 1998.0, 1243.0, 828.0, 520.0, 367.0, 222.0, 159.0, 115.0, 74.0, 54.0, 29.0, 32.0, 13.0, 13.0, 15.0, 6.0, 3.0, 4.0, 2.0, 3.0], "bins": [-13.296875, -12.9056396484375, -12.514404296875, -12.1231689453125, -11.73193359375, -11.3406982421875, -10.949462890625, -10.5582275390625, -10.1669921875, -9.7757568359375, -9.384521484375, -8.9932861328125, -8.60205078125, -8.2108154296875, -7.819580078125, -7.4283447265625, -7.037109375, -6.6458740234375, -6.254638671875, -5.8634033203125, -5.47216796875, -5.0809326171875, -4.689697265625, -4.2984619140625, -3.9072265625, -3.5159912109375, -3.124755859375, -2.7335205078125, -2.34228515625, -1.9510498046875, -1.559814453125, -1.1685791015625, -0.77734375, -0.3861083984375, 0.005126953125, 0.3963623046875, 0.78759765625, 1.1788330078125, 1.570068359375, 1.9613037109375, 2.3525390625, 2.7437744140625, 3.135009765625, 3.5262451171875, 3.91748046875, 4.3087158203125, 4.699951171875, 5.0911865234375, 5.482421875, 5.8736572265625, 6.264892578125, 6.6561279296875, 7.04736328125, 7.4385986328125, 7.829833984375, 8.2210693359375, 8.6123046875, 9.0035400390625, 9.394775390625, 9.7860107421875, 10.17724609375, 10.5684814453125, 10.959716796875, 11.3509521484375, 11.7421875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 13.0, 13.0, 19.0, 27.0, 20.0, 45.0, 26.0, 66.0, 90.0, 128.0, 128.0, 180.0, 218.0, 268.0, 327.0, 354.0, 349.0, 339.0, 302.0, 248.0, 198.0, 127.0, 124.0, 95.0, 79.0, 66.0, 42.0, 45.0, 34.0, 21.0, 21.0, 9.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.23828125, -4.11419677734375, -3.9901123046875, -3.86602783203125, -3.741943359375, -3.61785888671875, -3.4937744140625, -3.36968994140625, -3.24560546875, -3.12152099609375, -2.9974365234375, -2.87335205078125, -2.749267578125, -2.62518310546875, -2.5010986328125, -2.37701416015625, -2.2529296875, -2.12884521484375, -2.0047607421875, -1.88067626953125, -1.756591796875, -1.63250732421875, -1.5084228515625, -1.38433837890625, -1.26025390625, -1.13616943359375, -1.0120849609375, -0.88800048828125, -0.763916015625, -0.63983154296875, -0.5157470703125, -0.39166259765625, -0.267578125, -0.14349365234375, -0.0194091796875, 0.10467529296875, 0.228759765625, 0.35284423828125, 0.4769287109375, 0.60101318359375, 0.72509765625, 0.84918212890625, 0.9732666015625, 1.09735107421875, 1.221435546875, 1.34552001953125, 1.4696044921875, 1.59368896484375, 1.7177734375, 1.84185791015625, 1.9659423828125, 2.09002685546875, 2.214111328125, 2.33819580078125, 2.4622802734375, 2.58636474609375, 2.71044921875, 2.83453369140625, 2.9586181640625, 3.08270263671875, 3.206787109375, 3.33087158203125, 3.4549560546875, 3.57904052734375, 3.703125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 5.0, 12.0, 6.0, 18.0, 15.0, 16.0, 17.0, 16.0, 26.0, 28.0, 31.0, 49.0, 55.0, 37.0, 62.0, 59.0, 37.0, 76.0, 60.0, 48.0, 47.0, 44.0, 44.0, 31.0, 26.0, 21.0, 20.0, 11.0, 21.0, 18.0, 9.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.486200332641602, -9.154423713684082, -8.822648048400879, -8.49087142944336, -8.159095764160156, -7.827319145202637, -7.495542526245117, -7.163766384124756, -6.8319902420043945, -6.500214099884033, -6.168437957763672, -5.836661338806152, -5.504885196685791, -5.17310905456543, -4.84133243560791, -4.509556293487549, -4.1777801513671875, -3.846004009246826, -3.5142276287078857, -3.1824512481689453, -2.850675106048584, -2.5188989639282227, -2.1871225833892822, -1.8553462028503418, -1.5235700607299805, -1.1917937994003296, -0.8600175380706787, -0.5282412767410278, -0.19646501541137695, 0.13531124591827393, 0.4670875072479248, 0.7988638877868652, 1.1306400299072266, 1.4624162912368774, 1.7941925525665283, 2.1259689331054688, 2.45774507522583, 2.7895212173461914, 3.121297597885132, 3.4530739784240723, 3.7848501205444336, 4.116626262664795, 4.448402404785156, 4.780179023742676, 5.111955165863037, 5.443731307983398, 5.775507926940918, 6.107284069061279, 6.439060211181641, 6.770836353302002, 7.102612495422363, 7.434389114379883, 7.766165256500244, 8.097941398620605, 8.429718017578125, 8.761493682861328, 9.093270301818848, 9.425046920776367, 9.75682258605957, 10.08859920501709, 10.42037582397461, 10.752151489257812, 11.083928108215332, 11.415704727172852, 11.747480392456055]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 10.0, 13.0, 14.0, 14.0, 16.0, 22.0, 17.0, 19.0, 32.0, 31.0, 33.0, 34.0, 26.0, 37.0, 29.0, 34.0, 39.0, 39.0, 47.0, 44.0, 46.0, 41.0, 47.0, 38.0, 36.0, 19.0, 28.0, 31.0, 30.0, 22.0, 16.0, 14.0, 14.0, 8.0, 12.0, 8.0, 7.0, 9.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.198548316955566, -6.969392776489258, -6.740237236022949, -6.511082172393799, -6.28192663192749, -6.052771091461182, -5.823616027832031, -5.594460487365723, -5.365304946899414, -5.1361494064331055, -4.906993865966797, -4.6778388023376465, -4.448683261871338, -4.219527721405029, -3.9903724193573, -3.7612171173095703, -3.5320615768432617, -3.302906036376953, -3.0737507343292236, -2.844595432281494, -2.6154398918151855, -2.386284351348877, -2.1571290493011475, -1.9279736280441284, -1.6988182067871094, -1.4696627855300903, -1.2405073642730713, -1.0113519430160522, -0.7821965217590332, -0.5530411005020142, -0.3238856792449951, -0.09473025798797607, 0.13442468643188477, 0.3635801076889038, 0.5927355289459229, 0.8218909502029419, 1.051046371459961, 1.28020179271698, 1.509357213973999, 1.738512635231018, 1.967668056488037, 2.1968235969543457, 2.425978899002075, 2.6551342010498047, 2.8842897415161133, 3.113445281982422, 3.3426005840301514, 3.571755886077881, 3.8009114265441895, 4.030066967010498, 4.259222030639648, 4.488377571105957, 4.717533111572266, 4.946688652038574, 5.175844192504883, 5.404999256134033, 5.634154796600342, 5.86331033706665, 6.092465400695801, 6.321620941162109, 6.550776481628418, 6.779932022094727, 7.009087562561035, 7.2382426261901855, 7.467398166656494]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 8.0, 6.0, 21.0, 32.0, 32.0, 62.0, 68.0, 113.0, 208.0, 276.0, 434.0, 589.0, 1045.0, 1734.0, 2793.0, 4591.0, 8211.0, 14313.0, 25149.0, 44627.0, 77981.0, 127663.0, 179877.0, 190331.0, 147955.0, 93529.0, 54496.0, 30833.0, 17200.0, 9867.0, 5598.0, 3476.0, 1990.0, 1241.0, 793.0, 485.0, 299.0, 206.0, 124.0, 92.0, 63.0, 42.0, 36.0, 22.0, 22.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-5.2578125, -5.10833740234375, -4.9588623046875, -4.80938720703125, -4.659912109375, -4.51043701171875, -4.3609619140625, -4.21148681640625, -4.06201171875, -3.91253662109375, -3.7630615234375, -3.61358642578125, -3.464111328125, -3.31463623046875, -3.1651611328125, -3.01568603515625, -2.8662109375, -2.71673583984375, -2.5672607421875, -2.41778564453125, -2.268310546875, -2.11883544921875, -1.9693603515625, -1.81988525390625, -1.67041015625, -1.52093505859375, -1.3714599609375, -1.22198486328125, -1.072509765625, -0.92303466796875, -0.7735595703125, -0.62408447265625, -0.474609375, -0.32513427734375, -0.1756591796875, -0.02618408203125, 0.123291015625, 0.27276611328125, 0.4222412109375, 0.57171630859375, 0.72119140625, 0.87066650390625, 1.0201416015625, 1.16961669921875, 1.319091796875, 1.46856689453125, 1.6180419921875, 1.76751708984375, 1.9169921875, 2.06646728515625, 2.2159423828125, 2.36541748046875, 2.514892578125, 2.66436767578125, 2.8138427734375, 2.96331787109375, 3.11279296875, 3.26226806640625, 3.4117431640625, 3.56121826171875, 3.710693359375, 3.86016845703125, 4.0096435546875, 4.15911865234375, 4.30859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 10.0, 5.0, 7.0, 26.0, 14.0, 10.0, 12.0, 12.0, 27.0, 27.0, 29.0, 26.0, 31.0, 37.0, 28.0, 35.0, 37.0, 39.0, 48.0, 53.0, 53.0, 50.0, 39.0, 42.0, 43.0, 36.0, 31.0, 29.0, 22.0, 27.0, 21.0, 14.0, 8.0, 13.0, 9.0, 11.0, 9.0, 6.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.1953125, -7.940185546875, -7.68505859375, -7.429931640625, -7.1748046875, -6.919677734375, -6.66455078125, -6.409423828125, -6.154296875, -5.899169921875, -5.64404296875, -5.388916015625, -5.1337890625, -4.878662109375, -4.62353515625, -4.368408203125, -4.11328125, -3.858154296875, -3.60302734375, -3.347900390625, -3.0927734375, -2.837646484375, -2.58251953125, -2.327392578125, -2.072265625, -1.817138671875, -1.56201171875, -1.306884765625, -1.0517578125, -0.796630859375, -0.54150390625, -0.286376953125, -0.03125, 0.223876953125, 0.47900390625, 0.734130859375, 0.9892578125, 1.244384765625, 1.49951171875, 1.754638671875, 2.009765625, 2.264892578125, 2.52001953125, 2.775146484375, 3.0302734375, 3.285400390625, 3.54052734375, 3.795654296875, 4.05078125, 4.305908203125, 4.56103515625, 4.816162109375, 5.0712890625, 5.326416015625, 5.58154296875, 5.836669921875, 6.091796875, 6.346923828125, 6.60205078125, 6.857177734375, 7.1123046875, 7.367431640625, 7.62255859375, 7.877685546875, 8.1328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 9.0, 20.0, 14.0, 17.0, 37.0, 39.0, 46.0, 56.0, 95.0, 123.0, 188.0, 261.0, 363.0, 572.0, 951.0, 1510.0, 2701.0, 4618.0, 8478.0, 16346.0, 31865.0, 65511.0, 131410.0, 231353.0, 248519.0, 149994.0, 75488.0, 36665.0, 18596.0, 9557.0, 5395.0, 2976.0, 1711.0, 1030.0, 645.0, 398.0, 252.0, 197.0, 149.0, 103.0, 60.0, 55.0, 37.0, 35.0, 29.0, 17.0, 12.0, 11.0, 11.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.15625, -6.933349609375, -6.71044921875, -6.487548828125, -6.2646484375, -6.041748046875, -5.81884765625, -5.595947265625, -5.373046875, -5.150146484375, -4.92724609375, -4.704345703125, -4.4814453125, -4.258544921875, -4.03564453125, -3.812744140625, -3.58984375, -3.366943359375, -3.14404296875, -2.921142578125, -2.6982421875, -2.475341796875, -2.25244140625, -2.029541015625, -1.806640625, -1.583740234375, -1.36083984375, -1.137939453125, -0.9150390625, -0.692138671875, -0.46923828125, -0.246337890625, -0.0234375, 0.199462890625, 0.42236328125, 0.645263671875, 0.8681640625, 1.091064453125, 1.31396484375, 1.536865234375, 1.759765625, 1.982666015625, 2.20556640625, 2.428466796875, 2.6513671875, 2.874267578125, 3.09716796875, 3.320068359375, 3.54296875, 3.765869140625, 3.98876953125, 4.211669921875, 4.4345703125, 4.657470703125, 4.88037109375, 5.103271484375, 5.326171875, 5.549072265625, 5.77197265625, 5.994873046875, 6.2177734375, 6.440673828125, 6.66357421875, 6.886474609375, 7.109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 4.0, 13.0, 16.0, 17.0, 17.0, 13.0, 18.0, 32.0, 18.0, 35.0, 14.0, 21.0, 25.0, 35.0, 42.0, 40.0, 35.0, 38.0, 35.0, 36.0, 39.0, 46.0, 36.0, 32.0, 34.0, 35.0, 27.0, 28.0, 25.0, 22.0, 23.0, 19.0, 20.0, 15.0, 11.0, 13.0, 7.0, 9.0, 6.0, 8.0, 6.0, 2.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.6015625, -4.467315673828125, -4.33306884765625, -4.198822021484375, -4.0645751953125, -3.930328369140625, -3.79608154296875, -3.661834716796875, -3.527587890625, -3.393341064453125, -3.25909423828125, -3.124847412109375, -2.9906005859375, -2.856353759765625, -2.72210693359375, -2.587860107421875, -2.45361328125, -2.319366455078125, -2.18511962890625, -2.050872802734375, -1.9166259765625, -1.782379150390625, -1.64813232421875, -1.513885498046875, -1.379638671875, -1.245391845703125, -1.11114501953125, -0.976898193359375, -0.8426513671875, -0.708404541015625, -0.57415771484375, -0.439910888671875, -0.3056640625, -0.171417236328125, -0.03717041015625, 0.097076416015625, 0.2313232421875, 0.365570068359375, 0.49981689453125, 0.634063720703125, 0.768310546875, 0.902557373046875, 1.03680419921875, 1.171051025390625, 1.3052978515625, 1.439544677734375, 1.57379150390625, 1.708038330078125, 1.84228515625, 1.976531982421875, 2.11077880859375, 2.245025634765625, 2.3792724609375, 2.513519287109375, 2.64776611328125, 2.782012939453125, 2.916259765625, 3.050506591796875, 3.18475341796875, 3.319000244140625, 3.4532470703125, 3.587493896484375, 3.72174072265625, 3.855987548828125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 8.0, 8.0, 7.0, 9.0, 10.0, 17.0, 23.0, 44.0, 57.0, 78.0, 125.0, 177.0, 280.0, 427.0, 678.0, 1090.0, 1817.0, 3046.0, 5211.0, 9546.0, 16949.0, 32367.0, 62700.0, 122547.0, 220672.0, 248455.0, 153177.0, 79302.0, 40969.0, 21417.0, 11371.0, 6390.0, 3699.0, 2219.0, 1372.0, 839.0, 510.0, 319.0, 188.0, 139.0, 103.0, 60.0, 41.0, 21.0, 23.0, 18.0, 21.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.73046875, -3.621307373046875, -3.51214599609375, -3.402984619140625, -3.2938232421875, -3.184661865234375, -3.07550048828125, -2.966339111328125, -2.857177734375, -2.748016357421875, -2.63885498046875, -2.529693603515625, -2.4205322265625, -2.311370849609375, -2.20220947265625, -2.093048095703125, -1.98388671875, -1.874725341796875, -1.76556396484375, -1.656402587890625, -1.5472412109375, -1.438079833984375, -1.32891845703125, -1.219757080078125, -1.110595703125, -1.001434326171875, -0.89227294921875, -0.783111572265625, -0.6739501953125, -0.564788818359375, -0.45562744140625, -0.346466064453125, -0.2373046875, -0.128143310546875, -0.01898193359375, 0.090179443359375, 0.1993408203125, 0.308502197265625, 0.41766357421875, 0.526824951171875, 0.635986328125, 0.745147705078125, 0.85430908203125, 0.963470458984375, 1.0726318359375, 1.181793212890625, 1.29095458984375, 1.400115966796875, 1.50927734375, 1.618438720703125, 1.72760009765625, 1.836761474609375, 1.9459228515625, 2.055084228515625, 2.16424560546875, 2.273406982421875, 2.382568359375, 2.491729736328125, 2.60089111328125, 2.710052490234375, 2.8192138671875, 2.928375244140625, 3.03753662109375, 3.146697998046875, 3.255859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 8.0, 8.0, 10.0, 12.0, 16.0, 33.0, 35.0, 35.0, 44.0, 55.0, 52.0, 58.0, 65.0, 83.0, 73.0, 62.0, 56.0, 55.0, 44.0, 42.0, 30.0, 21.0, 20.0, 17.0, 10.0, 8.0, 11.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00012493133544921875, -0.0001205839216709137, -0.00011623650789260864, -0.00011188909411430359, -0.00010754168033599854, -0.00010319426655769348, -9.884685277938843e-05, -9.449943900108337e-05, -9.015202522277832e-05, -8.580461144447327e-05, -8.145719766616821e-05, -7.710978388786316e-05, -7.27623701095581e-05, -6.841495633125305e-05, -6.4067542552948e-05, -5.9720128774642944e-05, -5.537271499633789e-05, -5.102530121803284e-05, -4.667788743972778e-05, -4.233047366142273e-05, -3.7983059883117676e-05, -3.363564610481262e-05, -2.928823232650757e-05, -2.4940818548202515e-05, -2.059340476989746e-05, -1.6245990991592407e-05, -1.1898577213287354e-05, -7.5511634349823e-06, -3.203749656677246e-06, 1.1436641216278076e-06, 5.491077899932861e-06, 9.838491678237915e-06, 1.4185905456542969e-05, 1.8533319234848022e-05, 2.2880733013153076e-05, 2.722814679145813e-05, 3.1575560569763184e-05, 3.592297434806824e-05, 4.027038812637329e-05, 4.4617801904678345e-05, 4.89652156829834e-05, 5.331262946128845e-05, 5.7660043239593506e-05, 6.200745701789856e-05, 6.635487079620361e-05, 7.070228457450867e-05, 7.504969835281372e-05, 7.939711213111877e-05, 8.374452590942383e-05, 8.809193968772888e-05, 9.243935346603394e-05, 9.678676724433899e-05, 0.00010113418102264404, 0.0001054815948009491, 0.00010982900857925415, 0.0001141764223575592, 0.00011852383613586426, 0.0001228712499141693, 0.00012721866369247437, 0.00013156607747077942, 0.00013591349124908447, 0.00014026090502738953, 0.00014460831880569458, 0.00014895573258399963, 0.0001533031463623047]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 6.0, 19.0, 22.0, 35.0, 52.0, 77.0, 114.0, 159.0, 286.0, 486.0, 724.0, 1149.0, 1899.0, 3117.0, 5362.0, 9315.0, 16303.0, 29239.0, 51874.0, 90397.0, 145421.0, 193430.0, 184344.0, 131232.0, 79227.0, 45101.0, 25065.0, 14092.0, 8015.0, 4701.0, 2799.0, 1711.0, 1024.0, 626.0, 411.0, 269.0, 148.0, 90.0, 70.0, 44.0, 32.0, 27.0, 11.0, 8.0, 7.0, 7.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.337890625, -3.236358642578125, -3.13482666015625, -3.033294677734375, -2.9317626953125, -2.830230712890625, -2.72869873046875, -2.627166748046875, -2.525634765625, -2.424102783203125, -2.32257080078125, -2.221038818359375, -2.1195068359375, -2.017974853515625, -1.91644287109375, -1.814910888671875, -1.71337890625, -1.611846923828125, -1.51031494140625, -1.408782958984375, -1.3072509765625, -1.205718994140625, -1.10418701171875, -1.002655029296875, -0.901123046875, -0.799591064453125, -0.69805908203125, -0.596527099609375, -0.4949951171875, -0.393463134765625, -0.29193115234375, -0.190399169921875, -0.0888671875, 0.012664794921875, 0.11419677734375, 0.215728759765625, 0.3172607421875, 0.418792724609375, 0.52032470703125, 0.621856689453125, 0.723388671875, 0.824920654296875, 0.92645263671875, 1.027984619140625, 1.1295166015625, 1.231048583984375, 1.33258056640625, 1.434112548828125, 1.53564453125, 1.637176513671875, 1.73870849609375, 1.840240478515625, 1.9417724609375, 2.043304443359375, 2.14483642578125, 2.246368408203125, 2.347900390625, 2.449432373046875, 2.55096435546875, 2.652496337890625, 2.7540283203125, 2.855560302734375, 2.95709228515625, 3.058624267578125, 3.16015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 5.0, 8.0, 9.0, 8.0, 18.0, 20.0, 22.0, 25.0, 34.0, 37.0, 52.0, 64.0, 51.0, 72.0, 60.0, 67.0, 67.0, 55.0, 56.0, 47.0, 49.0, 32.0, 22.0, 31.0, 24.0, 16.0, 14.0, 6.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.227447509765625, -1.19122314453125, -1.154998779296875, -1.1187744140625, -1.082550048828125, -1.04632568359375, -1.010101318359375, -0.973876953125, -0.937652587890625, -0.90142822265625, -0.865203857421875, -0.8289794921875, -0.792755126953125, -0.75653076171875, -0.720306396484375, -0.68408203125, -0.647857666015625, -0.61163330078125, -0.575408935546875, -0.5391845703125, -0.502960205078125, -0.46673583984375, -0.430511474609375, -0.394287109375, -0.358062744140625, -0.32183837890625, -0.285614013671875, -0.2493896484375, -0.213165283203125, -0.17694091796875, -0.140716552734375, -0.1044921875, -0.068267822265625, -0.03204345703125, 0.004180908203125, 0.0404052734375, 0.076629638671875, 0.11285400390625, 0.149078369140625, 0.185302734375, 0.221527099609375, 0.25775146484375, 0.293975830078125, 0.3302001953125, 0.366424560546875, 0.40264892578125, 0.438873291015625, 0.47509765625, 0.511322021484375, 0.54754638671875, 0.583770751953125, 0.6199951171875, 0.656219482421875, 0.69244384765625, 0.728668212890625, 0.764892578125, 0.801116943359375, 0.83734130859375, 0.873565673828125, 0.9097900390625, 0.946014404296875, 0.98223876953125, 1.018463134765625, 1.0546875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 9.0, 9.0, 21.0, 15.0, 15.0, 16.0, 28.0, 32.0, 28.0, 49.0, 38.0, 50.0, 55.0, 55.0, 48.0, 66.0, 57.0, 43.0, 45.0, 41.0, 40.0, 36.0, 28.0, 28.0, 24.0, 21.0, 14.0, 16.0, 5.0, 7.0, 6.0, 5.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.05610179901123, -8.740498542785645, -8.424895286560059, -8.109292984008789, -7.793689727783203, -7.478086471557617, -7.162483215332031, -6.8468804359436035, -6.531277656555176, -6.21567440032959, -5.900071620941162, -5.584468364715576, -5.268865585327148, -4.9532623291015625, -4.637659072875977, -4.322056293487549, -4.006453037261963, -3.690850019454956, -3.375247001647949, -3.0596437454223633, -2.7440409660339355, -2.4284377098083496, -2.1128346920013428, -1.797231674194336, -1.481628656387329, -1.1660256385803223, -0.8504225611686707, -0.534819483757019, -0.2192164659500122, 0.09638655185699463, 0.411989688873291, 0.7275927066802979, 1.0431957244873047, 1.3587987422943115, 1.6744017601013184, 1.9900048971176147, 2.305607795715332, 2.621211051940918, 2.936814069747925, 3.2524170875549316, 3.5680201053619385, 3.8836231231689453, 4.199226379394531, 4.514829158782959, 4.830432415008545, 5.146035194396973, 5.461638450622559, 5.7772417068481445, 6.092844486236572, 6.408447742462158, 6.724050521850586, 7.039653778076172, 7.3552565574646, 7.6708598136901855, 7.986462593078613, 8.3020658493042, 8.617669105529785, 8.933272361755371, 9.248875617980957, 9.564477920532227, 9.880081176757812, 10.195684432983398, 10.511287689208984, 10.82689094543457, 11.14249324798584]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 2.0, 6.0, 13.0, 13.0, 16.0, 11.0, 14.0, 22.0, 16.0, 23.0, 29.0, 30.0, 33.0, 31.0, 33.0, 33.0, 31.0, 33.0, 43.0, 39.0, 41.0, 51.0, 49.0, 44.0, 35.0, 47.0, 29.0, 19.0, 30.0, 30.0, 36.0, 13.0, 23.0, 12.0, 16.0, 8.0, 11.0, 7.0, 8.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.210147380828857, -6.9790754318237305, -6.748003959655762, -6.516932487487793, -6.285860538482666, -6.054788589477539, -5.82371711730957, -5.592645645141602, -5.361573696136475, -5.130501747131348, -4.899430274963379, -4.66835880279541, -4.437286853790283, -4.206214904785156, -3.9751434326171875, -3.7440717220306396, -3.513000011444092, -3.281928300857544, -3.050856590270996, -2.8197848796844482, -2.5887131690979004, -2.3576414585113525, -2.1265697479248047, -1.8954980373382568, -1.664426326751709, -1.4333546161651611, -1.2022829055786133, -0.9712111949920654, -0.7401394844055176, -0.5090677738189697, -0.2779960632324219, -0.04692435264587402, 0.18414783477783203, 0.4152195453643799, 0.6462912559509277, 0.8773629665374756, 1.1084346771240234, 1.3395063877105713, 1.5705780982971191, 1.801649808883667, 2.032721519470215, 2.2637932300567627, 2.4948649406433105, 2.7259366512298584, 2.9570083618164062, 3.188080072402954, 3.419151782989502, 3.65022349357605, 3.8812952041625977, 4.112366676330566, 4.343438625335693, 4.57451057434082, 4.805582046508789, 5.036653518676758, 5.267725467681885, 5.498797416687012, 5.7298688888549805, 5.960940361022949, 6.192012310028076, 6.423084259033203, 6.654155731201172, 6.885227203369141, 7.116299152374268, 7.3473711013793945, 7.578442573547363]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 4.0, 3.0, 9.0, 24.0, 17.0, 36.0, 56.0, 105.0, 169.0, 330.0, 564.0, 1005.0, 2005.0, 3911.0, 7597.0, 15072.0, 31676.0, 64713.0, 127206.0, 206703.0, 232631.0, 169970.0, 93575.0, 46545.0, 22105.0, 10837.0, 5559.0, 2779.0, 1516.0, 806.0, 443.0, 244.0, 124.0, 99.0, 44.0, 31.0, 21.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.921875, -6.6583251953125, -6.394775390625, -6.1312255859375, -5.86767578125, -5.6041259765625, -5.340576171875, -5.0770263671875, -4.8134765625, -4.5499267578125, -4.286376953125, -4.0228271484375, -3.75927734375, -3.4957275390625, -3.232177734375, -2.9686279296875, -2.705078125, -2.4415283203125, -2.177978515625, -1.9144287109375, -1.65087890625, -1.3873291015625, -1.123779296875, -0.8602294921875, -0.5966796875, -0.3331298828125, -0.069580078125, 0.1939697265625, 0.45751953125, 0.7210693359375, 0.984619140625, 1.2481689453125, 1.51171875, 1.7752685546875, 2.038818359375, 2.3023681640625, 2.56591796875, 2.8294677734375, 3.093017578125, 3.3565673828125, 3.6201171875, 3.8836669921875, 4.147216796875, 4.4107666015625, 4.67431640625, 4.9378662109375, 5.201416015625, 5.4649658203125, 5.728515625, 5.9920654296875, 6.255615234375, 6.5191650390625, 6.78271484375, 7.0462646484375, 7.309814453125, 7.5733642578125, 7.8369140625, 8.1004638671875, 8.364013671875, 8.6275634765625, 8.89111328125, 9.1546630859375, 9.418212890625, 9.6817626953125, 9.9453125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 5.0, 8.0, 11.0, 7.0, 18.0, 17.0, 19.0, 24.0, 15.0, 31.0, 31.0, 18.0, 28.0, 36.0, 42.0, 36.0, 46.0, 38.0, 43.0, 53.0, 54.0, 48.0, 42.0, 37.0, 39.0, 30.0, 24.0, 24.0, 24.0, 27.0, 24.0, 24.0, 11.0, 16.0, 10.0, 10.0, 7.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.59765625, -7.34710693359375, -7.0965576171875, -6.84600830078125, -6.595458984375, -6.34490966796875, -6.0943603515625, -5.84381103515625, -5.59326171875, -5.34271240234375, -5.0921630859375, -4.84161376953125, -4.591064453125, -4.34051513671875, -4.0899658203125, -3.83941650390625, -3.5888671875, -3.33831787109375, -3.0877685546875, -2.83721923828125, -2.586669921875, -2.33612060546875, -2.0855712890625, -1.83502197265625, -1.58447265625, -1.33392333984375, -1.0833740234375, -0.83282470703125, -0.582275390625, -0.33172607421875, -0.0811767578125, 0.16937255859375, 0.419921875, 0.67047119140625, 0.9210205078125, 1.17156982421875, 1.422119140625, 1.67266845703125, 1.9232177734375, 2.17376708984375, 2.42431640625, 2.67486572265625, 2.9254150390625, 3.17596435546875, 3.426513671875, 3.67706298828125, 3.9276123046875, 4.17816162109375, 4.4287109375, 4.67926025390625, 4.9298095703125, 5.18035888671875, 5.430908203125, 5.68145751953125, 5.9320068359375, 6.18255615234375, 6.43310546875, 6.68365478515625, 6.9342041015625, 7.18475341796875, 7.435302734375, 7.68585205078125, 7.9364013671875, 8.18695068359375, 8.4375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 4.0, 3.0, 6.0, 13.0, 14.0, 22.0, 34.0, 44.0, 81.0, 98.0, 137.0, 231.0, 358.0, 560.0, 968.0, 1459.0, 2523.0, 4014.0, 6702.0, 11298.0, 19352.0, 33318.0, 56498.0, 92931.0, 138653.0, 174447.0, 169328.0, 129091.0, 83509.0, 50601.0, 29591.0, 17160.0, 10137.0, 6045.0, 3574.0, 2108.0, 1345.0, 802.0, 524.0, 319.0, 225.0, 144.0, 82.0, 58.0, 40.0, 27.0, 21.0, 11.0, 21.0, 11.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.7734375, -6.56103515625, -6.3486328125, -6.13623046875, -5.923828125, -5.71142578125, -5.4990234375, -5.28662109375, -5.07421875, -4.86181640625, -4.6494140625, -4.43701171875, -4.224609375, -4.01220703125, -3.7998046875, -3.58740234375, -3.375, -3.16259765625, -2.9501953125, -2.73779296875, -2.525390625, -2.31298828125, -2.1005859375, -1.88818359375, -1.67578125, -1.46337890625, -1.2509765625, -1.03857421875, -0.826171875, -0.61376953125, -0.4013671875, -0.18896484375, 0.0234375, 0.23583984375, 0.4482421875, 0.66064453125, 0.873046875, 1.08544921875, 1.2978515625, 1.51025390625, 1.72265625, 1.93505859375, 2.1474609375, 2.35986328125, 2.572265625, 2.78466796875, 2.9970703125, 3.20947265625, 3.421875, 3.63427734375, 3.8466796875, 4.05908203125, 4.271484375, 4.48388671875, 4.6962890625, 4.90869140625, 5.12109375, 5.33349609375, 5.5458984375, 5.75830078125, 5.970703125, 6.18310546875, 6.3955078125, 6.60791015625, 6.8203125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 7.0, 2.0, 5.0, 6.0, 3.0, 9.0, 8.0, 14.0, 21.0, 16.0, 18.0, 23.0, 32.0, 26.0, 27.0, 39.0, 29.0, 53.0, 40.0, 33.0, 41.0, 39.0, 47.0, 38.0, 29.0, 39.0, 31.0, 23.0, 45.0, 30.0, 35.0, 31.0, 18.0, 16.0, 19.0, 19.0, 11.0, 10.0, 6.0, 15.0, 8.0, 12.0, 9.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.3956298828125, -4.252197265625, -4.1087646484375, -3.96533203125, -3.8218994140625, -3.678466796875, -3.5350341796875, -3.3916015625, -3.2481689453125, -3.104736328125, -2.9613037109375, -2.81787109375, -2.6744384765625, -2.531005859375, -2.3875732421875, -2.244140625, -2.1007080078125, -1.957275390625, -1.8138427734375, -1.67041015625, -1.5269775390625, -1.383544921875, -1.2401123046875, -1.0966796875, -0.9532470703125, -0.809814453125, -0.6663818359375, -0.52294921875, -0.3795166015625, -0.236083984375, -0.0926513671875, 0.05078125, 0.1942138671875, 0.337646484375, 0.4810791015625, 0.62451171875, 0.7679443359375, 0.911376953125, 1.0548095703125, 1.1982421875, 1.3416748046875, 1.485107421875, 1.6285400390625, 1.77197265625, 1.9154052734375, 2.058837890625, 2.2022705078125, 2.345703125, 2.4891357421875, 2.632568359375, 2.7760009765625, 2.91943359375, 3.0628662109375, 3.206298828125, 3.3497314453125, 3.4931640625, 3.6365966796875, 3.780029296875, 3.9234619140625, 4.06689453125, 4.2103271484375, 4.353759765625, 4.4971923828125, 4.640625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 7.0, 4.0, 4.0, 5.0, 7.0, 13.0, 12.0, 31.0, 26.0, 50.0, 60.0, 83.0, 113.0, 167.0, 258.0, 379.0, 548.0, 811.0, 1280.0, 1971.0, 3337.0, 5505.0, 9772.0, 19004.0, 38982.0, 87020.0, 191503.0, 286352.0, 210703.0, 99177.0, 43729.0, 20898.0, 10908.0, 6093.0, 3490.0, 2131.0, 1357.0, 944.0, 569.0, 387.0, 274.0, 168.0, 130.0, 85.0, 75.0, 55.0, 30.0, 21.0, 9.0, 13.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.1953125, -5.03582763671875, -4.8763427734375, -4.71685791015625, -4.557373046875, -4.39788818359375, -4.2384033203125, -4.07891845703125, -3.91943359375, -3.75994873046875, -3.6004638671875, -3.44097900390625, -3.281494140625, -3.12200927734375, -2.9625244140625, -2.80303955078125, -2.6435546875, -2.48406982421875, -2.3245849609375, -2.16510009765625, -2.005615234375, -1.84613037109375, -1.6866455078125, -1.52716064453125, -1.36767578125, -1.20819091796875, -1.0487060546875, -0.88922119140625, -0.729736328125, -0.57025146484375, -0.4107666015625, -0.25128173828125, -0.091796875, 0.06768798828125, 0.2271728515625, 0.38665771484375, 0.546142578125, 0.70562744140625, 0.8651123046875, 1.02459716796875, 1.18408203125, 1.34356689453125, 1.5030517578125, 1.66253662109375, 1.822021484375, 1.98150634765625, 2.1409912109375, 2.30047607421875, 2.4599609375, 2.61944580078125, 2.7789306640625, 2.93841552734375, 3.097900390625, 3.25738525390625, 3.4168701171875, 3.57635498046875, 3.73583984375, 3.89532470703125, 4.0548095703125, 4.21429443359375, 4.373779296875, 4.53326416015625, 4.6927490234375, 4.85223388671875, 5.01171875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 3.0, 2.0, 4.0, 8.0, 7.0, 7.0, 7.0, 12.0, 17.0, 22.0, 28.0, 36.0, 33.0, 47.0, 58.0, 61.0, 65.0, 70.0, 64.0, 59.0, 61.0, 57.0, 44.0, 37.0, 39.0, 31.0, 24.0, 19.0, 21.0, 11.0, 9.0, 1.0, 8.0, 1.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0003387928009033203, -0.00032854825258255005, -0.0003183037042617798, -0.0003080591559410095, -0.00029781460762023926, -0.000287570059299469, -0.00027732551097869873, -0.00026708096265792847, -0.0002568364143371582, -0.00024659186601638794, -0.00023634731769561768, -0.0002261027693748474, -0.00021585822105407715, -0.00020561367273330688, -0.00019536912441253662, -0.00018512457609176636, -0.0001748800277709961, -0.00016463547945022583, -0.00015439093112945557, -0.0001441463828086853, -0.00013390183448791504, -0.00012365728616714478, -0.00011341273784637451, -0.00010316818952560425, -9.292364120483398e-05, -8.267909288406372e-05, -7.243454456329346e-05, -6.21899962425232e-05, -5.194544792175293e-05, -4.1700899600982666e-05, -3.14563512802124e-05, -2.121180295944214e-05, -1.0967254638671875e-05, -7.227063179016113e-07, 9.521842002868652e-06, 1.9766390323638916e-05, 3.001093864440918e-05, 4.025548696517944e-05, 5.050003528594971e-05, 6.074458360671997e-05, 7.098913192749023e-05, 8.12336802482605e-05, 9.147822856903076e-05, 0.00010172277688980103, 0.00011196732521057129, 0.00012221187353134155, 0.00013245642185211182, 0.00014270097017288208, 0.00015294551849365234, 0.0001631900668144226, 0.00017343461513519287, 0.00018367916345596313, 0.0001939237117767334, 0.00020416826009750366, 0.00021441280841827393, 0.0002246573567390442, 0.00023490190505981445, 0.0002451464533805847, 0.000255391001701355, 0.00026563555002212524, 0.0002758800983428955, 0.00028612464666366577, 0.00029636919498443604, 0.0003066137433052063, 0.00031685829162597656]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 4.0, 8.0, 16.0, 22.0, 24.0, 36.0, 52.0, 81.0, 108.0, 163.0, 247.0, 301.0, 498.0, 723.0, 1080.0, 1798.0, 2714.0, 4536.0, 7689.0, 13659.0, 25332.0, 49265.0, 96965.0, 181538.0, 244365.0, 193236.0, 106384.0, 54132.0, 27323.0, 14729.0, 8386.0, 4750.0, 2976.0, 1783.0, 1236.0, 772.0, 541.0, 341.0, 208.0, 163.0, 106.0, 74.0, 69.0, 32.0, 19.0, 24.0, 13.0, 7.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0], "bins": [-4.61328125, -4.47161865234375, -4.3299560546875, -4.18829345703125, -4.046630859375, -3.90496826171875, -3.7633056640625, -3.62164306640625, -3.47998046875, -3.33831787109375, -3.1966552734375, -3.05499267578125, -2.913330078125, -2.77166748046875, -2.6300048828125, -2.48834228515625, -2.3466796875, -2.20501708984375, -2.0633544921875, -1.92169189453125, -1.780029296875, -1.63836669921875, -1.4967041015625, -1.35504150390625, -1.21337890625, -1.07171630859375, -0.9300537109375, -0.78839111328125, -0.646728515625, -0.50506591796875, -0.3634033203125, -0.22174072265625, -0.080078125, 0.06158447265625, 0.2032470703125, 0.34490966796875, 0.486572265625, 0.62823486328125, 0.7698974609375, 0.91156005859375, 1.05322265625, 1.19488525390625, 1.3365478515625, 1.47821044921875, 1.619873046875, 1.76153564453125, 1.9031982421875, 2.04486083984375, 2.1865234375, 2.32818603515625, 2.4698486328125, 2.61151123046875, 2.753173828125, 2.89483642578125, 3.0364990234375, 3.17816162109375, 3.31982421875, 3.46148681640625, 3.6031494140625, 3.74481201171875, 3.886474609375, 4.02813720703125, 4.1697998046875, 4.31146240234375, 4.453125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 8.0, 4.0, 8.0, 7.0, 9.0, 24.0, 17.0, 27.0, 17.0, 25.0, 33.0, 40.0, 45.0, 37.0, 70.0, 73.0, 64.0, 72.0, 68.0, 62.0, 68.0, 42.0, 33.0, 19.0, 28.0, 21.0, 14.0, 13.0, 7.0, 12.0, 8.0, 3.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.36328125, -1.3202362060546875, -1.277191162109375, -1.2341461181640625, -1.19110107421875, -1.1480560302734375, -1.105010986328125, -1.0619659423828125, -1.0189208984375, -0.9758758544921875, -0.932830810546875, -0.8897857666015625, -0.84674072265625, -0.8036956787109375, -0.760650634765625, -0.7176055908203125, -0.674560546875, -0.6315155029296875, -0.588470458984375, -0.5454254150390625, -0.50238037109375, -0.4593353271484375, -0.416290283203125, -0.3732452392578125, -0.3302001953125, -0.2871551513671875, -0.244110107421875, -0.2010650634765625, -0.15802001953125, -0.1149749755859375, -0.071929931640625, -0.0288848876953125, 0.01416015625, 0.0572052001953125, 0.100250244140625, 0.1432952880859375, 0.18634033203125, 0.2293853759765625, 0.272430419921875, 0.3154754638671875, 0.3585205078125, 0.4015655517578125, 0.444610595703125, 0.4876556396484375, 0.53070068359375, 0.5737457275390625, 0.616790771484375, 0.6598358154296875, 0.702880859375, 0.7459259033203125, 0.788970947265625, 0.8320159912109375, 0.87506103515625, 0.9181060791015625, 0.961151123046875, 1.0041961669921875, 1.0472412109375, 1.0902862548828125, 1.133331298828125, 1.1763763427734375, 1.21942138671875, 1.2624664306640625, 1.305511474609375, 1.3485565185546875, 1.3916015625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 3.0, 0.0, 4.0, 9.0, 3.0, 11.0, 11.0, 10.0, 13.0, 15.0, 21.0, 23.0, 28.0, 25.0, 28.0, 34.0, 49.0, 50.0, 49.0, 65.0, 52.0, 56.0, 54.0, 42.0, 39.0, 50.0, 37.0, 29.0, 33.0, 34.0, 30.0, 19.0, 15.0, 9.0, 6.0, 9.0, 6.0, 6.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.812718391418457, -8.497692108154297, -8.182665824890137, -7.867639541625977, -7.552613258361816, -7.237586975097656, -6.922560691833496, -6.607534408569336, -6.292508125305176, -5.977481842041016, -5.6624555587768555, -5.347429275512695, -5.032402992248535, -4.717376708984375, -4.402350425720215, -4.087324142456055, -3.7722978591918945, -3.4572715759277344, -3.142245292663574, -2.827219009399414, -2.512192726135254, -2.1971664428710938, -1.8821401596069336, -1.5671138763427734, -1.2520875930786133, -0.9370613098144531, -0.622035026550293, -0.3070087432861328, 0.008017539978027344, 0.3230438232421875, 0.6380701065063477, 0.9530963897705078, 1.2681236267089844, 1.5831499099731445, 1.8981761932373047, 2.213202476501465, 2.528228759765625, 2.843255043029785, 3.1582813262939453, 3.4733076095581055, 3.7883338928222656, 4.103360176086426, 4.418386459350586, 4.733412742614746, 5.048439025878906, 5.363465309143066, 5.678491592407227, 5.993517875671387, 6.308544158935547, 6.623570442199707, 6.938596725463867, 7.253623008728027, 7.5686492919921875, 7.883675575256348, 8.198701858520508, 8.513728141784668, 8.828754425048828, 9.143780708312988, 9.458806991577148, 9.773833274841309, 10.088859558105469, 10.403885841369629, 10.718912124633789, 11.03393840789795, 11.34896469116211]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 11.0, 10.0, 14.0, 23.0, 23.0, 18.0, 27.0, 28.0, 24.0, 31.0, 29.0, 48.0, 50.0, 52.0, 49.0, 42.0, 38.0, 39.0, 43.0, 43.0, 44.0, 41.0, 32.0, 31.0, 42.0, 24.0, 21.0, 23.0, 18.0, 20.0, 4.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.13933277130127, -7.876277923583984, -7.613223075866699, -7.350168704986572, -7.087113857269287, -6.824059009552002, -6.561004638671875, -6.29794979095459, -6.034894943237305, -5.7718400955200195, -5.508785247802734, -5.245730876922607, -4.982676029205322, -4.719621181488037, -4.45656681060791, -4.193511962890625, -3.93045711517334, -3.6674022674560547, -3.4043476581573486, -3.1412930488586426, -2.8782382011413574, -2.6151833534240723, -2.352128744125366, -2.08907413482666, -1.826019287109375, -1.5629645586013794, -1.2999098300933838, -1.0368551015853882, -0.7738003730773926, -0.510745644569397, -0.24769091606140137, 0.015363812446594238, 0.27841949462890625, 0.5414742231369019, 0.8045289516448975, 1.067583680152893, 1.3306384086608887, 1.5936931371688843, 1.8567478656768799, 2.119802474975586, 2.382857322692871, 2.6459121704101562, 2.9089667797088623, 3.1720213890075684, 3.4350762367248535, 3.6981310844421387, 3.9611856937408447, 4.224240303039551, 4.487295150756836, 4.750349998474121, 5.013404846191406, 5.276459217071533, 5.539514064788818, 5.8025689125061035, 6.0656232833862305, 6.328678131103516, 6.591732978820801, 6.854787826538086, 7.117842674255371, 7.380897045135498, 7.643951892852783, 7.907006740570068, 8.170061111450195, 8.43311595916748, 8.696170806884766]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 1.0, 3.0, 5.0, 10.0, 6.0, 7.0, 20.0, 22.0, 45.0, 62.0, 127.0, 151.0, 256.0, 434.0, 671.0, 1229.0, 2209.0, 4037.0, 7154.0, 13747.0, 27297.0, 59933.0, 151908.0, 448550.0, 1195962.0, 1364902.0, 584118.0, 188774.0, 72139.0, 32356.0, 16665.0, 8758.0, 5070.0, 2939.0, 1717.0, 1098.0, 668.0, 413.0, 285.0, 173.0, 123.0, 84.0, 57.0, 28.0, 19.0, 17.0, 9.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.015625, -15.531982421875, -15.04833984375, -14.564697265625, -14.0810546875, -13.597412109375, -13.11376953125, -12.630126953125, -12.146484375, -11.662841796875, -11.17919921875, -10.695556640625, -10.2119140625, -9.728271484375, -9.24462890625, -8.760986328125, -8.27734375, -7.793701171875, -7.31005859375, -6.826416015625, -6.3427734375, -5.859130859375, -5.37548828125, -4.891845703125, -4.408203125, -3.924560546875, -3.44091796875, -2.957275390625, -2.4736328125, -1.989990234375, -1.50634765625, -1.022705078125, -0.5390625, -0.055419921875, 0.42822265625, 0.911865234375, 1.3955078125, 1.879150390625, 2.36279296875, 2.846435546875, 3.330078125, 3.813720703125, 4.29736328125, 4.781005859375, 5.2646484375, 5.748291015625, 6.23193359375, 6.715576171875, 7.19921875, 7.682861328125, 8.16650390625, 8.650146484375, 9.1337890625, 9.617431640625, 10.10107421875, 10.584716796875, 11.068359375, 11.552001953125, 12.03564453125, 12.519287109375, 13.0029296875, 13.486572265625, 13.97021484375, 14.453857421875, 14.9375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 4.0, 5.0, 5.0, 6.0, 8.0, 9.0, 13.0, 23.0, 24.0, 21.0, 24.0, 29.0, 29.0, 44.0, 45.0, 54.0, 48.0, 39.0, 52.0, 45.0, 48.0, 53.0, 46.0, 43.0, 41.0, 46.0, 34.0, 30.0, 29.0, 12.0, 16.0, 18.0, 18.0, 9.0, 11.0, 5.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.67578125, -7.42974853515625, -7.1837158203125, -6.93768310546875, -6.691650390625, -6.44561767578125, -6.1995849609375, -5.95355224609375, -5.70751953125, -5.46148681640625, -5.2154541015625, -4.96942138671875, -4.723388671875, -4.47735595703125, -4.2313232421875, -3.98529052734375, -3.7392578125, -3.49322509765625, -3.2471923828125, -3.00115966796875, -2.755126953125, -2.50909423828125, -2.2630615234375, -2.01702880859375, -1.77099609375, -1.52496337890625, -1.2789306640625, -1.03289794921875, -0.786865234375, -0.54083251953125, -0.2947998046875, -0.04876708984375, 0.197265625, 0.44329833984375, 0.6893310546875, 0.93536376953125, 1.181396484375, 1.42742919921875, 1.6734619140625, 1.91949462890625, 2.16552734375, 2.41156005859375, 2.6575927734375, 2.90362548828125, 3.149658203125, 3.39569091796875, 3.6417236328125, 3.88775634765625, 4.1337890625, 4.37982177734375, 4.6258544921875, 4.87188720703125, 5.117919921875, 5.36395263671875, 5.6099853515625, 5.85601806640625, 6.10205078125, 6.34808349609375, 6.5941162109375, 6.84014892578125, 7.086181640625, 7.33221435546875, 7.5782470703125, 7.82427978515625, 8.0703125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 13.0, 9.0, 18.0, 37.0, 57.0, 88.0, 101.0, 164.0, 244.0, 313.0, 475.0, 701.0, 1009.0, 1557.0, 2349.0, 3740.0, 5912.0, 10222.0, 17796.0, 32862.0, 63802.0, 133609.0, 297608.0, 690730.0, 1209598.0, 930700.0, 420163.0, 183667.0, 85985.0, 43592.0, 23552.0, 13200.0, 7715.0, 4711.0, 2772.0, 1792.0, 1126.0, 806.0, 468.0, 384.0, 199.0, 153.0, 92.0, 64.0, 52.0, 32.0, 18.0, 7.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -15.9498291015625, -15.462158203125, -14.9744873046875, -14.48681640625, -13.9991455078125, -13.511474609375, -13.0238037109375, -12.5361328125, -12.0484619140625, -11.560791015625, -11.0731201171875, -10.58544921875, -10.0977783203125, -9.610107421875, -9.1224365234375, -8.634765625, -8.1470947265625, -7.659423828125, -7.1717529296875, -6.68408203125, -6.1964111328125, -5.708740234375, -5.2210693359375, -4.7333984375, -4.2457275390625, -3.758056640625, -3.2703857421875, -2.78271484375, -2.2950439453125, -1.807373046875, -1.3197021484375, -0.83203125, -0.3443603515625, 0.143310546875, 0.6309814453125, 1.11865234375, 1.6063232421875, 2.093994140625, 2.5816650390625, 3.0693359375, 3.5570068359375, 4.044677734375, 4.5323486328125, 5.02001953125, 5.5076904296875, 5.995361328125, 6.4830322265625, 6.970703125, 7.4583740234375, 7.946044921875, 8.4337158203125, 8.92138671875, 9.4090576171875, 9.896728515625, 10.3843994140625, 10.8720703125, 11.3597412109375, 11.847412109375, 12.3350830078125, 12.82275390625, 13.3104248046875, 13.798095703125, 14.2857666015625, 14.7734375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 10.0, 6.0, 8.0, 9.0, 9.0, 13.0, 17.0, 28.0, 22.0, 45.0, 57.0, 77.0, 100.0, 133.0, 157.0, 216.0, 230.0, 326.0, 328.0, 365.0, 351.0, 289.0, 275.0, 237.0, 183.0, 142.0, 85.0, 75.0, 74.0, 58.0, 41.0, 32.0, 22.0, 11.0, 16.0, 7.0, 6.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.39453125, -5.228759765625, -5.06298828125, -4.897216796875, -4.7314453125, -4.565673828125, -4.39990234375, -4.234130859375, -4.068359375, -3.902587890625, -3.73681640625, -3.571044921875, -3.4052734375, -3.239501953125, -3.07373046875, -2.907958984375, -2.7421875, -2.576416015625, -2.41064453125, -2.244873046875, -2.0791015625, -1.913330078125, -1.74755859375, -1.581787109375, -1.416015625, -1.250244140625, -1.08447265625, -0.918701171875, -0.7529296875, -0.587158203125, -0.42138671875, -0.255615234375, -0.08984375, 0.075927734375, 0.24169921875, 0.407470703125, 0.5732421875, 0.739013671875, 0.90478515625, 1.070556640625, 1.236328125, 1.402099609375, 1.56787109375, 1.733642578125, 1.8994140625, 2.065185546875, 2.23095703125, 2.396728515625, 2.5625, 2.728271484375, 2.89404296875, 3.059814453125, 3.2255859375, 3.391357421875, 3.55712890625, 3.722900390625, 3.888671875, 4.054443359375, 4.22021484375, 4.385986328125, 4.5517578125, 4.717529296875, 4.88330078125, 5.049072265625, 5.21484375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 11.0, 7.0, 15.0, 14.0, 16.0, 16.0, 23.0, 26.0, 36.0, 39.0, 43.0, 42.0, 51.0, 51.0, 64.0, 60.0, 58.0, 59.0, 57.0, 44.0, 38.0, 42.0, 34.0, 32.0, 21.0, 21.0, 9.0, 8.0, 7.0, 9.0, 9.0, 8.0, 2.0, 3.0, 0.0, 6.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.505025863647461, -13.072253227233887, -12.639480590820312, -12.206708908081055, -11.77393627166748, -11.341163635253906, -10.908391952514648, -10.475619316101074, -10.0428466796875, -9.610074043273926, -9.177301406860352, -8.744529724121094, -8.31175708770752, -7.878984451293945, -7.446212291717529, -7.013440132141113, -6.580667495727539, -6.147894859313965, -5.715122699737549, -5.282350540161133, -4.849577903747559, -4.416805267333984, -3.9840331077575684, -3.5512607097625732, -3.118488311767578, -2.685715913772583, -2.252943515777588, -1.8201711177825928, -1.3873987197875977, -0.9546263217926025, -0.5218539237976074, -0.0890815258026123, 0.3436908721923828, 0.7764632701873779, 1.209235668182373, 1.6420080661773682, 2.0747804641723633, 2.5075528621673584, 2.9403252601623535, 3.3730976581573486, 3.8058700561523438, 4.238642692565918, 4.671414852142334, 5.10418701171875, 5.536959648132324, 5.969732284545898, 6.4025044441223145, 6.8352766036987305, 7.268049240112305, 7.700821876525879, 8.133594512939453, 8.566366195678711, 8.999138832092285, 9.43191146850586, 9.864683151245117, 10.297455787658691, 10.730228424072266, 11.16300106048584, 11.595773696899414, 12.028545379638672, 12.461318016052246, 12.89409065246582, 13.326862335205078, 13.759634971618652, 14.192407608032227]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 3.0, 5.0, 14.0, 13.0, 15.0, 15.0, 19.0, 17.0, 21.0, 27.0, 32.0, 30.0, 23.0, 32.0, 34.0, 35.0, 48.0, 29.0, 44.0, 42.0, 30.0, 31.0, 36.0, 38.0, 27.0, 33.0, 34.0, 32.0, 28.0, 23.0, 23.0, 11.0, 19.0, 19.0, 9.0, 23.0, 8.0, 5.0, 9.0, 5.0, 9.0, 5.0, 5.0, 6.0, 4.0, 0.0, 6.0, 4.0, 0.0, 2.0, 2.0], "bins": [-8.791692733764648, -8.5216064453125, -8.251520156860352, -7.981433868408203, -7.711347579956055, -7.441261291503906, -7.171175003051758, -6.901088714599609, -6.631002426147461, -6.3609161376953125, -6.090829849243164, -5.820743560791016, -5.550657272338867, -5.280570983886719, -5.01048469543457, -4.740398406982422, -4.470311641693115, -4.200225353240967, -3.9301390647888184, -3.66005277633667, -3.3899664878845215, -3.119880199432373, -2.8497936725616455, -2.579707384109497, -2.3096210956573486, -2.0395348072052, -1.7694485187530518, -1.4993621110916138, -1.2292758226394653, -0.9591895341873169, -0.6891031265258789, -0.41901683807373047, -0.14893054962158203, 0.1211557686328888, 0.3912420868873596, 0.6613284349441528, 0.9314147233963013, 1.2015010118484497, 1.4715874195098877, 1.7416737079620361, 2.0117599964141846, 2.281846284866333, 2.5519325733184814, 2.822019100189209, 3.0921053886413574, 3.362191677093506, 3.6322779655456543, 3.9023642539978027, 4.172450542449951, 4.4425368309021, 4.712623119354248, 4.9827094078063965, 5.252795696258545, 5.522881984710693, 5.79296875, 6.063055038452148, 6.333141326904297, 6.603227615356445, 6.873313903808594, 7.143400192260742, 7.413486480712891, 7.683572769165039, 7.9536590576171875, 8.223745346069336, 8.493831634521484]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 8.0, 6.0, 7.0, 21.0, 19.0, 26.0, 46.0, 69.0, 102.0, 189.0, 298.0, 438.0, 695.0, 1187.0, 1889.0, 3117.0, 5473.0, 9293.0, 16448.0, 29581.0, 53431.0, 96775.0, 158554.0, 206855.0, 185128.0, 121294.0, 69542.0, 38013.0, 21101.0, 11923.0, 6781.0, 4012.0, 2414.0, 1481.0, 831.0, 567.0, 283.0, 239.0, 156.0, 80.0, 62.0, 41.0, 33.0, 14.0, 12.0, 8.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7734375, -6.55987548828125, -6.3463134765625, -6.13275146484375, -5.919189453125, -5.70562744140625, -5.4920654296875, -5.27850341796875, -5.06494140625, -4.85137939453125, -4.6378173828125, -4.42425537109375, -4.210693359375, -3.99713134765625, -3.7835693359375, -3.57000732421875, -3.3564453125, -3.14288330078125, -2.9293212890625, -2.71575927734375, -2.502197265625, -2.28863525390625, -2.0750732421875, -1.86151123046875, -1.64794921875, -1.43438720703125, -1.2208251953125, -1.00726318359375, -0.793701171875, -0.58013916015625, -0.3665771484375, -0.15301513671875, 0.060546875, 0.27410888671875, 0.4876708984375, 0.70123291015625, 0.914794921875, 1.12835693359375, 1.3419189453125, 1.55548095703125, 1.76904296875, 1.98260498046875, 2.1961669921875, 2.40972900390625, 2.623291015625, 2.83685302734375, 3.0504150390625, 3.26397705078125, 3.4775390625, 3.69110107421875, 3.9046630859375, 4.11822509765625, 4.331787109375, 4.54534912109375, 4.7589111328125, 4.97247314453125, 5.18603515625, 5.39959716796875, 5.6131591796875, 5.82672119140625, 6.040283203125, 6.25384521484375, 6.4674072265625, 6.68096923828125, 6.89453125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 4.0, 10.0, 13.0, 10.0, 15.0, 13.0, 13.0, 23.0, 14.0, 19.0, 31.0, 29.0, 38.0, 31.0, 37.0, 39.0, 45.0, 44.0, 41.0, 40.0, 33.0, 34.0, 27.0, 35.0, 38.0, 41.0, 35.0, 32.0, 20.0, 40.0, 20.0, 20.0, 11.0, 17.0, 11.0, 9.0, 10.0, 6.0, 9.0, 8.0, 9.0, 6.0, 1.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.71875, -9.4139404296875, -9.109130859375, -8.8043212890625, -8.49951171875, -8.1947021484375, -7.889892578125, -7.5850830078125, -7.2802734375, -6.9754638671875, -6.670654296875, -6.3658447265625, -6.06103515625, -5.7562255859375, -5.451416015625, -5.1466064453125, -4.841796875, -4.5369873046875, -4.232177734375, -3.9273681640625, -3.62255859375, -3.3177490234375, -3.012939453125, -2.7081298828125, -2.4033203125, -2.0985107421875, -1.793701171875, -1.4888916015625, -1.18408203125, -0.8792724609375, -0.574462890625, -0.2696533203125, 0.03515625, 0.3399658203125, 0.644775390625, 0.9495849609375, 1.25439453125, 1.5592041015625, 1.864013671875, 2.1688232421875, 2.4736328125, 2.7784423828125, 3.083251953125, 3.3880615234375, 3.69287109375, 3.9976806640625, 4.302490234375, 4.6072998046875, 4.912109375, 5.2169189453125, 5.521728515625, 5.8265380859375, 6.13134765625, 6.4361572265625, 6.740966796875, 7.0457763671875, 7.3505859375, 7.6553955078125, 7.960205078125, 8.2650146484375, 8.56982421875, 8.8746337890625, 9.179443359375, 9.4842529296875, 9.7890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 9.0, 6.0, 4.0, 6.0, 13.0, 12.0, 31.0, 32.0, 34.0, 48.0, 64.0, 96.0, 140.0, 181.0, 247.0, 379.0, 584.0, 964.0, 1577.0, 2516.0, 4678.0, 8228.0, 15501.0, 30273.0, 62328.0, 128811.0, 240660.0, 258420.0, 146871.0, 71727.0, 34804.0, 17473.0, 9197.0, 4988.0, 2943.0, 1603.0, 1016.0, 657.0, 402.0, 314.0, 206.0, 144.0, 90.0, 79.0, 54.0, 26.0, 30.0, 22.0, 22.0, 16.0, 16.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 4.0], "bins": [-10.40625, -10.091796875, -9.77734375, -9.462890625, -9.1484375, -8.833984375, -8.51953125, -8.205078125, -7.890625, -7.576171875, -7.26171875, -6.947265625, -6.6328125, -6.318359375, -6.00390625, -5.689453125, -5.375, -5.060546875, -4.74609375, -4.431640625, -4.1171875, -3.802734375, -3.48828125, -3.173828125, -2.859375, -2.544921875, -2.23046875, -1.916015625, -1.6015625, -1.287109375, -0.97265625, -0.658203125, -0.34375, -0.029296875, 0.28515625, 0.599609375, 0.9140625, 1.228515625, 1.54296875, 1.857421875, 2.171875, 2.486328125, 2.80078125, 3.115234375, 3.4296875, 3.744140625, 4.05859375, 4.373046875, 4.6875, 5.001953125, 5.31640625, 5.630859375, 5.9453125, 6.259765625, 6.57421875, 6.888671875, 7.203125, 7.517578125, 7.83203125, 8.146484375, 8.4609375, 8.775390625, 9.08984375, 9.404296875, 9.71875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 7.0, 12.0, 7.0, 12.0, 15.0, 21.0, 28.0, 26.0, 20.0, 31.0, 30.0, 39.0, 40.0, 35.0, 31.0, 40.0, 59.0, 42.0, 32.0, 30.0, 46.0, 46.0, 40.0, 46.0, 31.0, 36.0, 30.0, 26.0, 22.0, 15.0, 20.0, 15.0, 13.0, 12.0, 12.0, 7.0, 1.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59375, -6.38909912109375, -6.1844482421875, -5.97979736328125, -5.775146484375, -5.57049560546875, -5.3658447265625, -5.16119384765625, -4.95654296875, -4.75189208984375, -4.5472412109375, -4.34259033203125, -4.137939453125, -3.93328857421875, -3.7286376953125, -3.52398681640625, -3.3193359375, -3.11468505859375, -2.9100341796875, -2.70538330078125, -2.500732421875, -2.29608154296875, -2.0914306640625, -1.88677978515625, -1.68212890625, -1.47747802734375, -1.2728271484375, -1.06817626953125, -0.863525390625, -0.65887451171875, -0.4542236328125, -0.24957275390625, -0.044921875, 0.15972900390625, 0.3643798828125, 0.56903076171875, 0.773681640625, 0.97833251953125, 1.1829833984375, 1.38763427734375, 1.59228515625, 1.79693603515625, 2.0015869140625, 2.20623779296875, 2.410888671875, 2.61553955078125, 2.8201904296875, 3.02484130859375, 3.2294921875, 3.43414306640625, 3.6387939453125, 3.84344482421875, 4.048095703125, 4.25274658203125, 4.4573974609375, 4.66204833984375, 4.86669921875, 5.07135009765625, 5.2760009765625, 5.48065185546875, 5.685302734375, 5.88995361328125, 6.0946044921875, 6.29925537109375, 6.50390625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 10.0, 8.0, 7.0, 12.0, 12.0, 29.0, 34.0, 34.0, 55.0, 74.0, 91.0, 110.0, 176.0, 268.0, 346.0, 581.0, 950.0, 1629.0, 2787.0, 5104.0, 10293.0, 21673.0, 50364.0, 123416.0, 282383.0, 303397.0, 139513.0, 56412.0, 24291.0, 11143.0, 5544.0, 3018.0, 1694.0, 1034.0, 616.0, 429.0, 313.0, 190.0, 120.0, 97.0, 73.0, 52.0, 49.0, 27.0, 18.0, 11.0, 19.0, 12.0, 7.0, 6.0, 5.0, 6.0, 3.0, 5.0, 1.0, 3.0, 1.0], "bins": [-6.6484375, -6.44110107421875, -6.2337646484375, -6.02642822265625, -5.819091796875, -5.61175537109375, -5.4044189453125, -5.19708251953125, -4.98974609375, -4.78240966796875, -4.5750732421875, -4.36773681640625, -4.160400390625, -3.95306396484375, -3.7457275390625, -3.53839111328125, -3.3310546875, -3.12371826171875, -2.9163818359375, -2.70904541015625, -2.501708984375, -2.29437255859375, -2.0870361328125, -1.87969970703125, -1.67236328125, -1.46502685546875, -1.2576904296875, -1.05035400390625, -0.843017578125, -0.63568115234375, -0.4283447265625, -0.22100830078125, -0.013671875, 0.19366455078125, 0.4010009765625, 0.60833740234375, 0.815673828125, 1.02301025390625, 1.2303466796875, 1.43768310546875, 1.64501953125, 1.85235595703125, 2.0596923828125, 2.26702880859375, 2.474365234375, 2.68170166015625, 2.8890380859375, 3.09637451171875, 3.3037109375, 3.51104736328125, 3.7183837890625, 3.92572021484375, 4.133056640625, 4.34039306640625, 4.5477294921875, 4.75506591796875, 4.96240234375, 5.16973876953125, 5.3770751953125, 5.58441162109375, 5.791748046875, 5.99908447265625, 6.2064208984375, 6.41375732421875, 6.62109375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 8.0, 7.0, 10.0, 14.0, 16.0, 18.0, 20.0, 28.0, 20.0, 23.0, 33.0, 41.0, 35.0, 48.0, 50.0, 56.0, 65.0, 51.0, 53.0, 49.0, 57.0, 48.0, 33.0, 34.0, 32.0, 22.0, 26.0, 23.0, 16.0, 9.0, 11.0, 8.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.00017261505126953125, -0.00016780942678451538, -0.0001630038022994995, -0.00015819817781448364, -0.00015339255332946777, -0.0001485869288444519, -0.00014378130435943604, -0.00013897567987442017, -0.0001341700553894043, -0.00012936443090438843, -0.00012455880641937256, -0.00011975318193435669, -0.00011494755744934082, -0.00011014193296432495, -0.00010533630847930908, -0.00010053068399429321, -9.572505950927734e-05, -9.091943502426147e-05, -8.61138105392456e-05, -8.130818605422974e-05, -7.650256156921387e-05, -7.1696937084198e-05, -6.689131259918213e-05, -6.208568811416626e-05, -5.728006362915039e-05, -5.247443914413452e-05, -4.766881465911865e-05, -4.286319017410278e-05, -3.8057565689086914e-05, -3.3251941204071045e-05, -2.8446316719055176e-05, -2.3640692234039307e-05, -1.8835067749023438e-05, -1.4029443264007568e-05, -9.2238187789917e-06, -4.41819429397583e-06, 3.8743019104003906e-07, 5.193054676055908e-06, 9.998679161071777e-06, 1.4804303646087646e-05, 1.9609928131103516e-05, 2.4415552616119385e-05, 2.9221177101135254e-05, 3.402680158615112e-05, 3.883242607116699e-05, 4.363805055618286e-05, 4.844367504119873e-05, 5.32492995262146e-05, 5.805492401123047e-05, 6.286054849624634e-05, 6.766617298126221e-05, 7.247179746627808e-05, 7.727742195129395e-05, 8.208304643630981e-05, 8.688867092132568e-05, 9.169429540634155e-05, 9.649991989135742e-05, 0.00010130554437637329, 0.00010611116886138916, 0.00011091679334640503, 0.0001157224178314209, 0.00012052804231643677, 0.00012533366680145264, 0.0001301392912864685, 0.00013494491577148438]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 15.0, 14.0, 18.0, 19.0, 37.0, 51.0, 83.0, 115.0, 136.0, 248.0, 374.0, 619.0, 1010.0, 1706.0, 3085.0, 5742.0, 11783.0, 27077.0, 72871.0, 212819.0, 366810.0, 216069.0, 74723.0, 27765.0, 12125.0, 5713.0, 2972.0, 1647.0, 988.0, 692.0, 390.0, 249.0, 169.0, 125.0, 117.0, 55.0, 32.0, 14.0, 17.0, 18.0, 11.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.508544921875, -8.22021484375, -7.931884765625, -7.6435546875, -7.355224609375, -7.06689453125, -6.778564453125, -6.490234375, -6.201904296875, -5.91357421875, -5.625244140625, -5.3369140625, -5.048583984375, -4.76025390625, -4.471923828125, -4.18359375, -3.895263671875, -3.60693359375, -3.318603515625, -3.0302734375, -2.741943359375, -2.45361328125, -2.165283203125, -1.876953125, -1.588623046875, -1.30029296875, -1.011962890625, -0.7236328125, -0.435302734375, -0.14697265625, 0.141357421875, 0.4296875, 0.718017578125, 1.00634765625, 1.294677734375, 1.5830078125, 1.871337890625, 2.15966796875, 2.447998046875, 2.736328125, 3.024658203125, 3.31298828125, 3.601318359375, 3.8896484375, 4.177978515625, 4.46630859375, 4.754638671875, 5.04296875, 5.331298828125, 5.61962890625, 5.907958984375, 6.1962890625, 6.484619140625, 6.77294921875, 7.061279296875, 7.349609375, 7.637939453125, 7.92626953125, 8.214599609375, 8.5029296875, 8.791259765625, 9.07958984375, 9.367919921875, 9.65625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 9.0, 13.0, 9.0, 21.0, 19.0, 27.0, 57.0, 57.0, 80.0, 114.0, 118.0, 124.0, 94.0, 72.0, 52.0, 30.0, 34.0, 24.0, 11.0, 6.0, 10.0, 5.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.9014892578125, -2.812744140625, -2.7239990234375, -2.63525390625, -2.5465087890625, -2.457763671875, -2.3690185546875, -2.2802734375, -2.1915283203125, -2.102783203125, -2.0140380859375, -1.92529296875, -1.8365478515625, -1.747802734375, -1.6590576171875, -1.5703125, -1.4815673828125, -1.392822265625, -1.3040771484375, -1.21533203125, -1.1265869140625, -1.037841796875, -0.9490966796875, -0.8603515625, -0.7716064453125, -0.682861328125, -0.5941162109375, -0.50537109375, -0.4166259765625, -0.327880859375, -0.2391357421875, -0.150390625, -0.0616455078125, 0.027099609375, 0.1158447265625, 0.20458984375, 0.2933349609375, 0.382080078125, 0.4708251953125, 0.5595703125, 0.6483154296875, 0.737060546875, 0.8258056640625, 0.91455078125, 1.0032958984375, 1.092041015625, 1.1807861328125, 1.26953125, 1.3582763671875, 1.447021484375, 1.5357666015625, 1.62451171875, 1.7132568359375, 1.802001953125, 1.8907470703125, 1.9794921875, 2.0682373046875, 2.156982421875, 2.2457275390625, 2.33447265625, 2.4232177734375, 2.511962890625, 2.6007080078125, 2.689453125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 5.0, 1.0, 5.0, 4.0, 11.0, 5.0, 16.0, 13.0, 15.0, 18.0, 25.0, 25.0, 31.0, 37.0, 45.0, 44.0, 50.0, 49.0, 57.0, 70.0, 67.0, 63.0, 51.0, 50.0, 38.0, 44.0, 27.0, 22.0, 24.0, 14.0, 12.0, 10.0, 7.0, 10.0, 10.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.514822006225586, -13.080727577209473, -12.64663314819336, -12.212539672851562, -11.77844524383545, -11.344350814819336, -10.910256385803223, -10.47616195678711, -10.042068481445312, -9.6079740524292, -9.173879623413086, -8.739786148071289, -8.305691719055176, -7.8715972900390625, -7.437502861022949, -7.003408432006836, -6.569314002990723, -6.135219573974609, -5.701125621795654, -5.267031192779541, -4.832937240600586, -4.398842811584473, -3.9647483825683594, -3.530654191970825, -3.096560001373291, -2.662465810775757, -2.2283716201782227, -1.7942771911621094, -1.3601830005645752, -0.926088809967041, -0.49199438095092773, -0.057900190353393555, 0.3761940002441406, 0.8102882504463196, 1.2443825006484985, 1.6784768104553223, 2.1125710010528564, 2.5466651916503906, 2.980759620666504, 3.414853811264038, 3.8489480018615723, 4.2830424308776855, 4.717136383056641, 5.151230812072754, 5.585325241088867, 6.019419193267822, 6.4535136222839355, 6.887607574462891, 7.321702003479004, 7.755796432495117, 8.18989086151123, 8.623985290527344, 9.05807876586914, 9.492173194885254, 9.926267623901367, 10.36036205291748, 10.794456481933594, 11.228550910949707, 11.66264533996582, 12.096738815307617, 12.53083324432373, 12.964927673339844, 13.399022102355957, 13.83311653137207, 14.267210006713867]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 5.0, 3.0, 8.0, 5.0, 11.0, 10.0, 14.0, 13.0, 15.0, 16.0, 25.0, 20.0, 35.0, 20.0, 27.0, 42.0, 36.0, 25.0, 35.0, 33.0, 50.0, 42.0, 40.0, 40.0, 32.0, 38.0, 31.0, 41.0, 29.0, 34.0, 38.0, 23.0, 13.0, 18.0, 16.0, 22.0, 14.0, 13.0, 14.0, 8.0, 7.0, 9.0, 4.0, 4.0, 4.0, 9.0, 0.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.146806716918945, -8.863174438476562, -8.579541206359863, -8.295907974243164, -8.012275695800781, -7.72864294052124, -7.445010185241699, -7.161377429962158, -6.877744674682617, -6.594111919403076, -6.310479164123535, -6.026846408843994, -5.743213653564453, -5.459580898284912, -5.175948143005371, -4.89231538772583, -4.608682632446289, -4.325049877166748, -4.041417121887207, -3.757784366607666, -3.474151611328125, -3.190518856048584, -2.906886100769043, -2.623253345489502, -2.339620590209961, -2.05598783493042, -1.772355079650879, -1.488722324371338, -1.2050895690917969, -0.9214568138122559, -0.6378240585327148, -0.35419130325317383, -0.0705575942993164, 0.2130751609802246, 0.4967079162597656, 0.7803406715393066, 1.0639734268188477, 1.3476061820983887, 1.6312389373779297, 1.9148716926574707, 2.1985044479370117, 2.4821372032165527, 2.7657699584960938, 3.0494027137756348, 3.333035469055176, 3.616668224334717, 3.900300979614258, 4.183933734893799, 4.46756649017334, 4.751199245452881, 5.034832000732422, 5.318464756011963, 5.602097511291504, 5.885730266571045, 6.169363021850586, 6.452995777130127, 6.736628532409668, 7.020261287689209, 7.30389404296875, 7.587526798248291, 7.871159553527832, 8.154792785644531, 8.438425064086914, 8.722057342529297, 9.005690574645996]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 15.0, 15.0, 25.0, 43.0, 65.0, 87.0, 127.0, 173.0, 274.0, 410.0, 624.0, 974.0, 1459.0, 2191.0, 3377.0, 5238.0, 7843.0, 12107.0, 19007.0, 28643.0, 43483.0, 64706.0, 92470.0, 120543.0, 139617.0, 136293.0, 113941.0, 84257.0, 58649.0, 38938.0, 25488.0, 16544.0, 10798.0, 7031.0, 4468.0, 2899.0, 1918.0, 1294.0, 847.0, 569.0, 381.0, 252.0, 164.0, 112.0, 69.0, 42.0, 29.0, 21.0, 14.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44140625, -5.25286865234375, -5.0643310546875, -4.87579345703125, -4.687255859375, -4.49871826171875, -4.3101806640625, -4.12164306640625, -3.93310546875, -3.74456787109375, -3.5560302734375, -3.36749267578125, -3.178955078125, -2.99041748046875, -2.8018798828125, -2.61334228515625, -2.4248046875, -2.23626708984375, -2.0477294921875, -1.85919189453125, -1.670654296875, -1.48211669921875, -1.2935791015625, -1.10504150390625, -0.91650390625, -0.72796630859375, -0.5394287109375, -0.35089111328125, -0.162353515625, 0.02618408203125, 0.2147216796875, 0.40325927734375, 0.591796875, 0.78033447265625, 0.9688720703125, 1.15740966796875, 1.345947265625, 1.53448486328125, 1.7230224609375, 1.91156005859375, 2.10009765625, 2.28863525390625, 2.4771728515625, 2.66571044921875, 2.854248046875, 3.04278564453125, 3.2313232421875, 3.41986083984375, 3.6083984375, 3.79693603515625, 3.9854736328125, 4.17401123046875, 4.362548828125, 4.55108642578125, 4.7396240234375, 4.92816162109375, 5.11669921875, 5.30523681640625, 5.4937744140625, 5.68231201171875, 5.870849609375, 6.05938720703125, 6.2479248046875, 6.43646240234375, 6.625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 5.0, 10.0, 10.0, 11.0, 19.0, 20.0, 19.0, 26.0, 30.0, 30.0, 30.0, 35.0, 41.0, 36.0, 32.0, 58.0, 40.0, 34.0, 40.0, 46.0, 44.0, 37.0, 29.0, 40.0, 31.0, 29.0, 26.0, 18.0, 23.0, 16.0, 17.0, 22.0, 13.0, 11.0, 6.0, 6.0, 9.0, 9.0, 5.0, 5.0, 6.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.03125, -9.7147216796875, -9.398193359375, -9.0816650390625, -8.76513671875, -8.4486083984375, -8.132080078125, -7.8155517578125, -7.4990234375, -7.1824951171875, -6.865966796875, -6.5494384765625, -6.23291015625, -5.9163818359375, -5.599853515625, -5.2833251953125, -4.966796875, -4.6502685546875, -4.333740234375, -4.0172119140625, -3.70068359375, -3.3841552734375, -3.067626953125, -2.7510986328125, -2.4345703125, -2.1180419921875, -1.801513671875, -1.4849853515625, -1.16845703125, -0.8519287109375, -0.535400390625, -0.2188720703125, 0.09765625, 0.4141845703125, 0.730712890625, 1.0472412109375, 1.36376953125, 1.6802978515625, 1.996826171875, 2.3133544921875, 2.6298828125, 2.9464111328125, 3.262939453125, 3.5794677734375, 3.89599609375, 4.2125244140625, 4.529052734375, 4.8455810546875, 5.162109375, 5.4786376953125, 5.795166015625, 6.1116943359375, 6.42822265625, 6.7447509765625, 7.061279296875, 7.3778076171875, 7.6943359375, 8.0108642578125, 8.327392578125, 8.6439208984375, 8.96044921875, 9.2769775390625, 9.593505859375, 9.9100341796875, 10.2265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 13.0, 17.0, 25.0, 38.0, 75.0, 132.0, 191.0, 381.0, 597.0, 1033.0, 1862.0, 3121.0, 5561.0, 9568.0, 17015.0, 30269.0, 53946.0, 92723.0, 147744.0, 190629.0, 180388.0, 130309.0, 79685.0, 45023.0, 24971.0, 14168.0, 8144.0, 4516.0, 2615.0, 1521.0, 906.0, 563.0, 324.0, 191.0, 110.0, 67.0, 33.0, 26.0, 16.0, 10.0, 9.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-9.9609375, -9.6666259765625, -9.372314453125, -9.0780029296875, -8.78369140625, -8.4893798828125, -8.195068359375, -7.9007568359375, -7.6064453125, -7.3121337890625, -7.017822265625, -6.7235107421875, -6.42919921875, -6.1348876953125, -5.840576171875, -5.5462646484375, -5.251953125, -4.9576416015625, -4.663330078125, -4.3690185546875, -4.07470703125, -3.7803955078125, -3.486083984375, -3.1917724609375, -2.8974609375, -2.6031494140625, -2.308837890625, -2.0145263671875, -1.72021484375, -1.4259033203125, -1.131591796875, -0.8372802734375, -0.54296875, -0.2486572265625, 0.045654296875, 0.3399658203125, 0.63427734375, 0.9285888671875, 1.222900390625, 1.5172119140625, 1.8115234375, 2.1058349609375, 2.400146484375, 2.6944580078125, 2.98876953125, 3.2830810546875, 3.577392578125, 3.8717041015625, 4.166015625, 4.4603271484375, 4.754638671875, 5.0489501953125, 5.34326171875, 5.6375732421875, 5.931884765625, 6.2261962890625, 6.5205078125, 6.8148193359375, 7.109130859375, 7.4034423828125, 7.69775390625, 7.9920654296875, 8.286376953125, 8.5806884765625, 8.875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 2.0, 4.0, 8.0, 7.0, 9.0, 15.0, 9.0, 12.0, 15.0, 25.0, 18.0, 25.0, 29.0, 35.0, 28.0, 26.0, 38.0, 36.0, 40.0, 36.0, 44.0, 34.0, 28.0, 33.0, 44.0, 22.0, 26.0, 35.0, 32.0, 31.0, 31.0, 30.0, 25.0, 16.0, 15.0, 16.0, 16.0, 26.0, 13.0, 10.0, 9.0, 6.0, 5.0, 10.0, 3.0, 6.0, 9.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.95703125, -5.76678466796875, -5.5765380859375, -5.38629150390625, -5.196044921875, -5.00579833984375, -4.8155517578125, -4.62530517578125, -4.43505859375, -4.24481201171875, -4.0545654296875, -3.86431884765625, -3.674072265625, -3.48382568359375, -3.2935791015625, -3.10333251953125, -2.9130859375, -2.72283935546875, -2.5325927734375, -2.34234619140625, -2.152099609375, -1.96185302734375, -1.7716064453125, -1.58135986328125, -1.39111328125, -1.20086669921875, -1.0106201171875, -0.82037353515625, -0.630126953125, -0.43988037109375, -0.2496337890625, -0.05938720703125, 0.130859375, 0.32110595703125, 0.5113525390625, 0.70159912109375, 0.891845703125, 1.08209228515625, 1.2723388671875, 1.46258544921875, 1.65283203125, 1.84307861328125, 2.0333251953125, 2.22357177734375, 2.413818359375, 2.60406494140625, 2.7943115234375, 2.98455810546875, 3.1748046875, 3.36505126953125, 3.5552978515625, 3.74554443359375, 3.935791015625, 4.12603759765625, 4.3162841796875, 4.50653076171875, 4.69677734375, 4.88702392578125, 5.0772705078125, 5.26751708984375, 5.457763671875, 5.64801025390625, 5.8382568359375, 6.02850341796875, 6.21875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 7.0, 18.0, 25.0, 42.0, 47.0, 72.0, 114.0, 153.0, 247.0, 311.0, 526.0, 772.0, 1265.0, 2185.0, 3851.0, 7373.0, 15542.0, 36164.0, 101053.0, 269714.0, 348051.0, 160152.0, 55947.0, 22346.0, 10221.0, 5146.0, 2789.0, 1598.0, 995.0, 609.0, 391.0, 250.0, 185.0, 120.0, 87.0, 56.0, 30.0, 36.0, 25.0, 10.0, 8.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.453125, -8.182373046875, -7.91162109375, -7.640869140625, -7.3701171875, -7.099365234375, -6.82861328125, -6.557861328125, -6.287109375, -6.016357421875, -5.74560546875, -5.474853515625, -5.2041015625, -4.933349609375, -4.66259765625, -4.391845703125, -4.12109375, -3.850341796875, -3.57958984375, -3.308837890625, -3.0380859375, -2.767333984375, -2.49658203125, -2.225830078125, -1.955078125, -1.684326171875, -1.41357421875, -1.142822265625, -0.8720703125, -0.601318359375, -0.33056640625, -0.059814453125, 0.2109375, 0.481689453125, 0.75244140625, 1.023193359375, 1.2939453125, 1.564697265625, 1.83544921875, 2.106201171875, 2.376953125, 2.647705078125, 2.91845703125, 3.189208984375, 3.4599609375, 3.730712890625, 4.00146484375, 4.272216796875, 4.54296875, 4.813720703125, 5.08447265625, 5.355224609375, 5.6259765625, 5.896728515625, 6.16748046875, 6.438232421875, 6.708984375, 6.979736328125, 7.25048828125, 7.521240234375, 7.7919921875, 8.062744140625, 8.33349609375, 8.604248046875, 8.875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 17.0, 12.0, 21.0, 25.0, 34.0, 50.0, 90.0, 118.0, 124.0, 115.0, 116.0, 88.0, 49.0, 32.0, 30.0, 16.0, 16.0, 11.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007653236389160156, -0.0007405653595924377, -0.0007158070802688599, -0.000691048800945282, -0.0006662905216217041, -0.0006415322422981262, -0.0006167739629745483, -0.0005920156836509705, -0.0005672574043273926, -0.0005424991250038147, -0.0005177408456802368, -0.0004929825663566589, -0.00046822428703308105, -0.0004434660077095032, -0.0004187077283859253, -0.0003939494490623474, -0.00036919116973876953, -0.00034443289041519165, -0.00031967461109161377, -0.0002949163317680359, -0.000270158052444458, -0.0002453997731208801, -0.00022064149379730225, -0.00019588321447372437, -0.00017112493515014648, -0.0001463666558265686, -0.00012160837650299072, -9.685009717941284e-05, -7.209181785583496e-05, -4.733353853225708e-05, -2.25752592086792e-05, 2.1830201148986816e-06, 2.6941299438476562e-05, 5.169957876205444e-05, 7.645785808563232e-05, 0.0001012161374092102, 0.00012597441673278809, 0.00015073269605636597, 0.00017549097537994385, 0.00020024925470352173, 0.0002250075340270996, 0.0002497658133506775, 0.00027452409267425537, 0.00029928237199783325, 0.00032404065132141113, 0.000348798930644989, 0.0003735572099685669, 0.0003983154892921448, 0.00042307376861572266, 0.00044783204793930054, 0.0004725903272628784, 0.0004973486065864563, 0.0005221068859100342, 0.0005468651652336121, 0.0005716234445571899, 0.0005963817238807678, 0.0006211400032043457, 0.0006458982825279236, 0.0006706565618515015, 0.0006954148411750793, 0.0007201731204986572, 0.0007449313998222351, 0.000769689679145813, 0.0007944479584693909, 0.0008192062377929688]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 7.0, 11.0, 18.0, 26.0, 31.0, 60.0, 94.0, 125.0, 206.0, 298.0, 395.0, 679.0, 1077.0, 1760.0, 3181.0, 6028.0, 12517.0, 29267.0, 75806.0, 202995.0, 351994.0, 219326.0, 82774.0, 31636.0, 13526.0, 6441.0, 3226.0, 1924.0, 1114.0, 670.0, 451.0, 302.0, 190.0, 119.0, 79.0, 65.0, 41.0, 31.0, 13.0, 19.0, 8.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.390625, -9.1187744140625, -8.846923828125, -8.5750732421875, -8.30322265625, -8.0313720703125, -7.759521484375, -7.4876708984375, -7.2158203125, -6.9439697265625, -6.672119140625, -6.4002685546875, -6.12841796875, -5.8565673828125, -5.584716796875, -5.3128662109375, -5.041015625, -4.7691650390625, -4.497314453125, -4.2254638671875, -3.95361328125, -3.6817626953125, -3.409912109375, -3.1380615234375, -2.8662109375, -2.5943603515625, -2.322509765625, -2.0506591796875, -1.77880859375, -1.5069580078125, -1.235107421875, -0.9632568359375, -0.69140625, -0.4195556640625, -0.147705078125, 0.1241455078125, 0.39599609375, 0.6678466796875, 0.939697265625, 1.2115478515625, 1.4833984375, 1.7552490234375, 2.027099609375, 2.2989501953125, 2.57080078125, 2.8426513671875, 3.114501953125, 3.3863525390625, 3.658203125, 3.9300537109375, 4.201904296875, 4.4737548828125, 4.74560546875, 5.0174560546875, 5.289306640625, 5.5611572265625, 5.8330078125, 6.1048583984375, 6.376708984375, 6.6485595703125, 6.92041015625, 7.1922607421875, 7.464111328125, 7.7359619140625, 8.0078125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 9.0, 9.0, 10.0, 18.0, 19.0, 18.0, 32.0, 37.0, 41.0, 67.0, 50.0, 72.0, 73.0, 78.0, 75.0, 67.0, 61.0, 41.0, 47.0, 40.0, 23.0, 21.0, 18.0, 9.0, 10.0, 11.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.462890625, -2.398406982421875, -2.33392333984375, -2.269439697265625, -2.2049560546875, -2.140472412109375, -2.07598876953125, -2.011505126953125, -1.947021484375, -1.882537841796875, -1.81805419921875, -1.753570556640625, -1.6890869140625, -1.624603271484375, -1.56011962890625, -1.495635986328125, -1.43115234375, -1.366668701171875, -1.30218505859375, -1.237701416015625, -1.1732177734375, -1.108734130859375, -1.04425048828125, -0.979766845703125, -0.915283203125, -0.850799560546875, -0.78631591796875, -0.721832275390625, -0.6573486328125, -0.592864990234375, -0.52838134765625, -0.463897705078125, -0.3994140625, -0.334930419921875, -0.27044677734375, -0.205963134765625, -0.1414794921875, -0.076995849609375, -0.01251220703125, 0.051971435546875, 0.116455078125, 0.180938720703125, 0.24542236328125, 0.309906005859375, 0.3743896484375, 0.438873291015625, 0.50335693359375, 0.567840576171875, 0.63232421875, 0.696807861328125, 0.76129150390625, 0.825775146484375, 0.8902587890625, 0.954742431640625, 1.01922607421875, 1.083709716796875, 1.148193359375, 1.212677001953125, 1.27716064453125, 1.341644287109375, 1.4061279296875, 1.470611572265625, 1.53509521484375, 1.599578857421875, 1.6640625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 7.0, 2.0, 5.0, 6.0, 10.0, 10.0, 12.0, 16.0, 16.0, 22.0, 21.0, 32.0, 37.0, 34.0, 47.0, 51.0, 52.0, 52.0, 65.0, 63.0, 78.0, 44.0, 54.0, 41.0, 41.0, 25.0, 26.0, 26.0, 27.0, 14.0, 16.0, 7.0, 8.0, 7.0, 8.0, 3.0, 2.0, 0.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.086257934570312, -12.643107414245605, -12.199956893920898, -11.756806373596191, -11.313655853271484, -10.870505332946777, -10.42735481262207, -9.984204292297363, -9.541053771972656, -9.09790325164795, -8.654752731323242, -8.211602210998535, -7.768451690673828, -7.325301170349121, -6.882150650024414, -6.439000129699707, -5.995849609375, -5.552699089050293, -5.109548568725586, -4.666398048400879, -4.223247528076172, -3.780097007751465, -3.336946487426758, -2.893795967102051, -2.4506454467773438, -2.0074949264526367, -1.5643444061279297, -1.1211938858032227, -0.6780433654785156, -0.2348928451538086, 0.20825767517089844, 0.6514081954956055, 1.094557762145996, 1.5377082824707031, 1.9808588027954102, 2.424009323120117, 2.867159843444824, 3.3103103637695312, 3.7534608840942383, 4.196611404418945, 4.639761924743652, 5.082912445068359, 5.526062965393066, 5.969213485717773, 6.4123640060424805, 6.8555145263671875, 7.2986650466918945, 7.741815567016602, 8.184966087341309, 8.628116607666016, 9.071267127990723, 9.51441764831543, 9.957568168640137, 10.400718688964844, 10.84386920928955, 11.287019729614258, 11.730170249938965, 12.173320770263672, 12.616471290588379, 13.059621810913086, 13.502772331237793, 13.9459228515625, 14.389073371887207, 14.832223892211914, 15.275374412536621]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 9.0, 3.0, 7.0, 21.0, 15.0, 25.0, 19.0, 24.0, 25.0, 41.0, 29.0, 41.0, 32.0, 55.0, 45.0, 49.0, 32.0, 39.0, 51.0, 50.0, 35.0, 43.0, 48.0, 33.0, 43.0, 24.0, 32.0, 13.0, 19.0, 15.0, 12.0, 12.0, 8.0, 11.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.65682315826416, -12.281082153320312, -11.905341148376465, -11.529600143432617, -11.153858184814453, -10.778117179870605, -10.402376174926758, -10.02663516998291, -9.650894165039062, -9.275153160095215, -8.899412155151367, -8.523670196533203, -8.147929191589355, -7.772188186645508, -7.39644718170166, -7.0207061767578125, -6.644964218139648, -6.269223213195801, -5.893481731414795, -5.517740726470947, -5.141999244689941, -4.766258239746094, -4.390517234802246, -4.014776229858398, -3.6390347480773926, -3.263293504714966, -2.887552261352539, -2.5118112564086914, -2.1360700130462646, -1.760328769683838, -1.3845877647399902, -1.0088465213775635, -0.6331043243408203, -0.25736314058303833, 0.11837804317474365, 0.49411916732788086, 0.8698604106903076, 1.2456016540527344, 1.621342658996582, 1.9970839023590088, 2.3728251457214355, 2.7485663890838623, 3.124307632446289, 3.5000486373901367, 3.8757898807525635, 4.25153112411499, 4.627272129058838, 5.003013610839844, 5.378754615783691, 5.754495620727539, 6.130237102508545, 6.505978107452393, 6.881719589233398, 7.257460594177246, 7.633201599121094, 8.008942604064941, 8.384683609008789, 8.760424613952637, 9.136165618896484, 9.511907577514648, 9.887648582458496, 10.263389587402344, 10.639130592346191, 11.014871597290039, 11.390613555908203]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 7.0, 7.0, 20.0, 13.0, 26.0, 35.0, 69.0, 75.0, 108.0, 156.0, 223.0, 359.0, 501.0, 733.0, 1151.0, 1707.0, 2626.0, 4039.0, 6490.0, 10663.0, 18439.0, 33750.0, 66281.0, 143043.0, 334182.0, 749652.0, 1158185.0, 897343.0, 420239.0, 174362.0, 78084.0, 38573.0, 20735.0, 11954.0, 7218.0, 4491.0, 2901.0, 1890.0, 1270.0, 839.0, 524.0, 416.0, 275.0, 191.0, 137.0, 93.0, 70.0, 48.0, 32.0, 21.0, 15.0, 3.0, 6.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-13.5703125, -13.0963134765625, -12.622314453125, -12.1483154296875, -11.67431640625, -11.2003173828125, -10.726318359375, -10.2523193359375, -9.7783203125, -9.3043212890625, -8.830322265625, -8.3563232421875, -7.88232421875, -7.4083251953125, -6.934326171875, -6.4603271484375, -5.986328125, -5.5123291015625, -5.038330078125, -4.5643310546875, -4.09033203125, -3.6163330078125, -3.142333984375, -2.6683349609375, -2.1943359375, -1.7203369140625, -1.246337890625, -0.7723388671875, -0.29833984375, 0.1756591796875, 0.649658203125, 1.1236572265625, 1.59765625, 2.0716552734375, 2.545654296875, 3.0196533203125, 3.49365234375, 3.9676513671875, 4.441650390625, 4.9156494140625, 5.3896484375, 5.8636474609375, 6.337646484375, 6.8116455078125, 7.28564453125, 7.7596435546875, 8.233642578125, 8.7076416015625, 9.181640625, 9.6556396484375, 10.129638671875, 10.6036376953125, 11.07763671875, 11.5516357421875, 12.025634765625, 12.4996337890625, 12.9736328125, 13.4476318359375, 13.921630859375, 14.3956298828125, 14.86962890625, 15.3436279296875, 15.817626953125, 16.2916259765625, 16.765625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 9.0, 6.0, 9.0, 11.0, 13.0, 10.0, 19.0, 21.0, 24.0, 25.0, 27.0, 28.0, 41.0, 39.0, 39.0, 49.0, 55.0, 51.0, 33.0, 50.0, 45.0, 40.0, 42.0, 55.0, 40.0, 34.0, 37.0, 25.0, 28.0, 13.0, 23.0, 14.0, 4.0, 8.0, 9.0, 12.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-11.6796875, -11.3319091796875, -10.984130859375, -10.6363525390625, -10.28857421875, -9.9407958984375, -9.593017578125, -9.2452392578125, -8.8974609375, -8.5496826171875, -8.201904296875, -7.8541259765625, -7.50634765625, -7.1585693359375, -6.810791015625, -6.4630126953125, -6.115234375, -5.7674560546875, -5.419677734375, -5.0718994140625, -4.72412109375, -4.3763427734375, -4.028564453125, -3.6807861328125, -3.3330078125, -2.9852294921875, -2.637451171875, -2.2896728515625, -1.94189453125, -1.5941162109375, -1.246337890625, -0.8985595703125, -0.55078125, -0.2030029296875, 0.144775390625, 0.4925537109375, 0.84033203125, 1.1881103515625, 1.535888671875, 1.8836669921875, 2.2314453125, 2.5792236328125, 2.927001953125, 3.2747802734375, 3.62255859375, 3.9703369140625, 4.318115234375, 4.6658935546875, 5.013671875, 5.3614501953125, 5.709228515625, 6.0570068359375, 6.40478515625, 6.7525634765625, 7.100341796875, 7.4481201171875, 7.7958984375, 8.1436767578125, 8.491455078125, 8.8392333984375, 9.18701171875, 9.5347900390625, 9.882568359375, 10.2303466796875, 10.578125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 5.0, 16.0, 15.0, 31.0, 35.0, 67.0, 98.0, 127.0, 165.0, 269.0, 403.0, 614.0, 953.0, 1457.0, 2453.0, 4071.0, 7080.0, 12801.0, 23705.0, 46657.0, 94696.0, 204468.0, 465855.0, 993135.0, 1173884.0, 632060.0, 276198.0, 124382.0, 60476.0, 30525.0, 16015.0, 8810.0, 5020.0, 2877.0, 1744.0, 1088.0, 692.0, 463.0, 285.0, 195.0, 123.0, 87.0, 57.0, 37.0, 32.0, 16.0, 13.0, 12.0, 3.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0], "bins": [-21.890625, -21.23095703125, -20.5712890625, -19.91162109375, -19.251953125, -18.59228515625, -17.9326171875, -17.27294921875, -16.61328125, -15.95361328125, -15.2939453125, -14.63427734375, -13.974609375, -13.31494140625, -12.6552734375, -11.99560546875, -11.3359375, -10.67626953125, -10.0166015625, -9.35693359375, -8.697265625, -8.03759765625, -7.3779296875, -6.71826171875, -6.05859375, -5.39892578125, -4.7392578125, -4.07958984375, -3.419921875, -2.76025390625, -2.1005859375, -1.44091796875, -0.78125, -0.12158203125, 0.5380859375, 1.19775390625, 1.857421875, 2.51708984375, 3.1767578125, 3.83642578125, 4.49609375, 5.15576171875, 5.8154296875, 6.47509765625, 7.134765625, 7.79443359375, 8.4541015625, 9.11376953125, 9.7734375, 10.43310546875, 11.0927734375, 11.75244140625, 12.412109375, 13.07177734375, 13.7314453125, 14.39111328125, 15.05078125, 15.71044921875, 16.3701171875, 17.02978515625, 17.689453125, 18.34912109375, 19.0087890625, 19.66845703125, 20.328125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 4.0, 11.0, 6.0, 9.0, 18.0, 25.0, 29.0, 34.0, 62.0, 54.0, 80.0, 130.0, 135.0, 223.0, 239.0, 279.0, 346.0, 405.0, 393.0, 306.0, 313.0, 202.0, 198.0, 127.0, 119.0, 77.0, 70.0, 50.0, 40.0, 22.0, 16.0, 19.0, 10.0, 3.0, 5.0, 3.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8515625, -7.61297607421875, -7.3743896484375, -7.13580322265625, -6.897216796875, -6.65863037109375, -6.4200439453125, -6.18145751953125, -5.94287109375, -5.70428466796875, -5.4656982421875, -5.22711181640625, -4.988525390625, -4.74993896484375, -4.5113525390625, -4.27276611328125, -4.0341796875, -3.79559326171875, -3.5570068359375, -3.31842041015625, -3.079833984375, -2.84124755859375, -2.6026611328125, -2.36407470703125, -2.12548828125, -1.88690185546875, -1.6483154296875, -1.40972900390625, -1.171142578125, -0.93255615234375, -0.6939697265625, -0.45538330078125, -0.216796875, 0.02178955078125, 0.2603759765625, 0.49896240234375, 0.737548828125, 0.97613525390625, 1.2147216796875, 1.45330810546875, 1.69189453125, 1.93048095703125, 2.1690673828125, 2.40765380859375, 2.646240234375, 2.88482666015625, 3.1234130859375, 3.36199951171875, 3.6005859375, 3.83917236328125, 4.0777587890625, 4.31634521484375, 4.554931640625, 4.79351806640625, 5.0321044921875, 5.27069091796875, 5.50927734375, 5.74786376953125, 5.9864501953125, 6.22503662109375, 6.463623046875, 6.70220947265625, 6.9407958984375, 7.17938232421875, 7.41796875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 9.0, 4.0, 4.0, 8.0, 8.0, 9.0, 15.0, 20.0, 37.0, 24.0, 33.0, 48.0, 50.0, 57.0, 65.0, 74.0, 75.0, 72.0, 56.0, 49.0, 48.0, 41.0, 39.0, 26.0, 28.0, 21.0, 12.0, 12.0, 8.0, 8.0, 10.0, 9.0, 5.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.54970359802246, -18.924062728881836, -18.29842185974121, -17.672780990600586, -17.04714012145996, -16.421499252319336, -15.795857429504395, -15.17021656036377, -14.544575691223145, -13.91893482208252, -13.293293952941895, -12.66765308380127, -12.042011260986328, -11.416370391845703, -10.790729522705078, -10.165088653564453, -9.539447784423828, -8.913806915283203, -8.288166046142578, -7.662524700164795, -7.03688383102417, -6.411242961883545, -5.785601615905762, -5.159960746765137, -4.534319877624512, -3.9086790084838867, -3.2830379009246826, -2.6573967933654785, -2.0317559242248535, -1.4061150550842285, -0.7804739475250244, -0.1548328399658203, 0.4708080291748047, 1.0964490175247192, 1.7220900058746338, 2.347731113433838, 2.973371982574463, 3.599012851715088, 4.224654197692871, 4.850295066833496, 5.475935935974121, 6.101576805114746, 6.727217674255371, 7.352859020233154, 7.978499889373779, 8.604141235351562, 9.229782104492188, 9.855422973632812, 10.481063842773438, 11.106704711914062, 11.732345581054688, 12.357986450195312, 12.983627319335938, 13.609268188476562, 14.234910011291504, 14.860550880432129, 15.486191749572754, 16.111833572387695, 16.73747444152832, 17.363115310668945, 17.98875617980957, 18.614397048950195, 19.24003791809082, 19.865678787231445, 20.49131965637207]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 4.0, 13.0, 10.0, 16.0, 16.0, 12.0, 22.0, 24.0, 22.0, 21.0, 16.0, 26.0, 33.0, 33.0, 45.0, 34.0, 42.0, 49.0, 41.0, 35.0, 41.0, 39.0, 36.0, 36.0, 34.0, 43.0, 32.0, 30.0, 27.0, 21.0, 19.0, 17.0, 16.0, 13.0, 15.0, 12.0, 12.0, 3.0, 9.0, 5.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-14.454890251159668, -14.022396087646484, -13.589900970458984, -13.1574068069458, -12.724912643432617, -12.292417526245117, -11.859923362731934, -11.42742919921875, -10.99493408203125, -10.562439918518066, -10.129944801330566, -9.697450637817383, -9.264955520629883, -8.8324613571167, -8.399967193603516, -7.967472553253174, -7.534977912902832, -7.10248327255249, -6.669988632202148, -6.237494468688965, -5.804999828338623, -5.372505187988281, -4.940011024475098, -4.507516384124756, -4.075021743774414, -3.6425271034240723, -3.2100327014923096, -2.777538299560547, -2.345043659210205, -1.9125490188598633, -1.4800546169281006, -1.047560214996338, -0.6150665283203125, -0.18257200717926025, 0.249922513961792, 0.6824170351028442, 1.1149115562438965, 1.5474061965942383, 1.979900598526001, 2.4123950004577637, 2.8448896408081055, 3.2773842811584473, 3.70987868309021, 4.142373085021973, 4.5748677253723145, 5.007362365722656, 5.43985652923584, 5.872351169586182, 6.304845809936523, 6.737340450286865, 7.169835090637207, 7.602329254150391, 8.03482437133789, 8.467318534851074, 8.899812698364258, 9.332307815551758, 9.764801979064941, 10.197296142578125, 10.629791259765625, 11.062285423278809, 11.494779586791992, 11.927274703979492, 12.359768867492676, 12.79226303100586, 13.22475814819336]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 10.0, 14.0, 17.0, 18.0, 46.0, 67.0, 82.0, 126.0, 209.0, 276.0, 460.0, 667.0, 967.0, 1505.0, 2176.0, 3413.0, 5318.0, 8133.0, 12668.0, 20426.0, 32313.0, 51070.0, 79372.0, 115531.0, 151552.0, 159634.0, 134614.0, 95601.0, 62899.0, 39889.0, 25028.0, 15755.0, 10040.0, 6515.0, 4104.0, 2782.0, 1742.0, 1168.0, 721.0, 509.0, 375.0, 240.0, 173.0, 110.0, 66.0, 56.0, 40.0, 21.0, 13.0, 12.0, 4.0, 1.0, 5.0, 3.0, 0.0, 2.0], "bins": [-7.52734375, -7.30084228515625, -7.0743408203125, -6.84783935546875, -6.621337890625, -6.39483642578125, -6.1683349609375, -5.94183349609375, -5.71533203125, -5.48883056640625, -5.2623291015625, -5.03582763671875, -4.809326171875, -4.58282470703125, -4.3563232421875, -4.12982177734375, -3.9033203125, -3.67681884765625, -3.4503173828125, -3.22381591796875, -2.997314453125, -2.77081298828125, -2.5443115234375, -2.31781005859375, -2.09130859375, -1.86480712890625, -1.6383056640625, -1.41180419921875, -1.185302734375, -0.95880126953125, -0.7322998046875, -0.50579833984375, -0.279296875, -0.05279541015625, 0.1737060546875, 0.40020751953125, 0.626708984375, 0.85321044921875, 1.0797119140625, 1.30621337890625, 1.53271484375, 1.75921630859375, 1.9857177734375, 2.21221923828125, 2.438720703125, 2.66522216796875, 2.8917236328125, 3.11822509765625, 3.3447265625, 3.57122802734375, 3.7977294921875, 4.02423095703125, 4.250732421875, 4.47723388671875, 4.7037353515625, 4.93023681640625, 5.15673828125, 5.38323974609375, 5.6097412109375, 5.83624267578125, 6.062744140625, 6.28924560546875, 6.5157470703125, 6.74224853515625, 6.96875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 16.0, 15.0, 18.0, 12.0, 23.0, 18.0, 19.0, 23.0, 34.0, 28.0, 43.0, 40.0, 39.0, 52.0, 48.0, 49.0, 43.0, 38.0, 50.0, 37.0, 35.0, 42.0, 47.0, 35.0, 27.0, 16.0, 15.0, 17.0, 15.0, 15.0, 9.0, 11.0, 7.0, 6.0, 5.0, 9.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.03125, -15.5465087890625, -15.061767578125, -14.5770263671875, -14.09228515625, -13.6075439453125, -13.122802734375, -12.6380615234375, -12.1533203125, -11.6685791015625, -11.183837890625, -10.6990966796875, -10.21435546875, -9.7296142578125, -9.244873046875, -8.7601318359375, -8.275390625, -7.7906494140625, -7.305908203125, -6.8211669921875, -6.33642578125, -5.8516845703125, -5.366943359375, -4.8822021484375, -4.3974609375, -3.9127197265625, -3.427978515625, -2.9432373046875, -2.45849609375, -1.9737548828125, -1.489013671875, -1.0042724609375, -0.51953125, -0.0347900390625, 0.449951171875, 0.9346923828125, 1.41943359375, 1.9041748046875, 2.388916015625, 2.8736572265625, 3.3583984375, 3.8431396484375, 4.327880859375, 4.8126220703125, 5.29736328125, 5.7821044921875, 6.266845703125, 6.7515869140625, 7.236328125, 7.7210693359375, 8.205810546875, 8.6905517578125, 9.17529296875, 9.6600341796875, 10.144775390625, 10.6295166015625, 11.1142578125, 11.5989990234375, 12.083740234375, 12.5684814453125, 13.05322265625, 13.5379638671875, 14.022705078125, 14.5074462890625, 14.9921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 9.0, 11.0, 14.0, 25.0, 33.0, 46.0, 47.0, 77.0, 144.0, 182.0, 312.0, 425.0, 675.0, 1106.0, 1707.0, 2828.0, 4599.0, 7883.0, 13275.0, 23857.0, 42759.0, 80434.0, 144145.0, 220783.0, 210084.0, 130665.0, 71851.0, 39051.0, 21249.0, 12129.0, 7078.0, 4140.0, 2500.0, 1509.0, 1022.0, 635.0, 422.0, 274.0, 159.0, 134.0, 74.0, 61.0, 44.0, 21.0, 18.0, 19.0, 6.0, 12.0, 4.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9921875, -10.6365966796875, -10.281005859375, -9.9254150390625, -9.56982421875, -9.2142333984375, -8.858642578125, -8.5030517578125, -8.1474609375, -7.7918701171875, -7.436279296875, -7.0806884765625, -6.72509765625, -6.3695068359375, -6.013916015625, -5.6583251953125, -5.302734375, -4.9471435546875, -4.591552734375, -4.2359619140625, -3.88037109375, -3.5247802734375, -3.169189453125, -2.8135986328125, -2.4580078125, -2.1024169921875, -1.746826171875, -1.3912353515625, -1.03564453125, -0.6800537109375, -0.324462890625, 0.0311279296875, 0.38671875, 0.7423095703125, 1.097900390625, 1.4534912109375, 1.80908203125, 2.1646728515625, 2.520263671875, 2.8758544921875, 3.2314453125, 3.5870361328125, 3.942626953125, 4.2982177734375, 4.65380859375, 5.0093994140625, 5.364990234375, 5.7205810546875, 6.076171875, 6.4317626953125, 6.787353515625, 7.1429443359375, 7.49853515625, 7.8541259765625, 8.209716796875, 8.5653076171875, 8.9208984375, 9.2764892578125, 9.632080078125, 9.9876708984375, 10.34326171875, 10.6988525390625, 11.054443359375, 11.4100341796875, 11.765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 9.0, 16.0, 8.0, 15.0, 19.0, 19.0, 30.0, 18.0, 26.0, 25.0, 39.0, 33.0, 41.0, 34.0, 55.0, 37.0, 43.0, 34.0, 36.0, 41.0, 35.0, 34.0, 22.0, 38.0, 35.0, 26.0, 28.0, 26.0, 19.0, 23.0, 22.0, 12.0, 8.0, 12.0, 4.0, 15.0, 6.0, 5.0, 5.0, 6.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-8.96875, -8.69921875, -8.4296875, -8.16015625, -7.890625, -7.62109375, -7.3515625, -7.08203125, -6.8125, -6.54296875, -6.2734375, -6.00390625, -5.734375, -5.46484375, -5.1953125, -4.92578125, -4.65625, -4.38671875, -4.1171875, -3.84765625, -3.578125, -3.30859375, -3.0390625, -2.76953125, -2.5, -2.23046875, -1.9609375, -1.69140625, -1.421875, -1.15234375, -0.8828125, -0.61328125, -0.34375, -0.07421875, 0.1953125, 0.46484375, 0.734375, 1.00390625, 1.2734375, 1.54296875, 1.8125, 2.08203125, 2.3515625, 2.62109375, 2.890625, 3.16015625, 3.4296875, 3.69921875, 3.96875, 4.23828125, 4.5078125, 4.77734375, 5.046875, 5.31640625, 5.5859375, 5.85546875, 6.125, 6.39453125, 6.6640625, 6.93359375, 7.203125, 7.47265625, 7.7421875, 8.01171875, 8.28125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 13.0, 13.0, 17.0, 33.0, 34.0, 59.0, 66.0, 104.0, 146.0, 257.0, 340.0, 451.0, 678.0, 1037.0, 1600.0, 2529.0, 4036.0, 6971.0, 12043.0, 21767.0, 40679.0, 78992.0, 150446.0, 243885.0, 217658.0, 123784.0, 63770.0, 33556.0, 17646.0, 10176.0, 5809.0, 3540.0, 2174.0, 1406.0, 876.0, 639.0, 388.0, 265.0, 207.0, 134.0, 107.0, 60.0, 54.0, 30.0, 22.0, 13.0, 16.0, 5.0, 12.0, 3.0, 6.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.953125, -6.74139404296875, -6.5296630859375, -6.31793212890625, -6.106201171875, -5.89447021484375, -5.6827392578125, -5.47100830078125, -5.25927734375, -5.04754638671875, -4.8358154296875, -4.62408447265625, -4.412353515625, -4.20062255859375, -3.9888916015625, -3.77716064453125, -3.5654296875, -3.35369873046875, -3.1419677734375, -2.93023681640625, -2.718505859375, -2.50677490234375, -2.2950439453125, -2.08331298828125, -1.87158203125, -1.65985107421875, -1.4481201171875, -1.23638916015625, -1.024658203125, -0.81292724609375, -0.6011962890625, -0.38946533203125, -0.177734375, 0.03399658203125, 0.2457275390625, 0.45745849609375, 0.669189453125, 0.88092041015625, 1.0926513671875, 1.30438232421875, 1.51611328125, 1.72784423828125, 1.9395751953125, 2.15130615234375, 2.363037109375, 2.57476806640625, 2.7864990234375, 2.99822998046875, 3.2099609375, 3.42169189453125, 3.6334228515625, 3.84515380859375, 4.056884765625, 4.26861572265625, 4.4803466796875, 4.69207763671875, 4.90380859375, 5.11553955078125, 5.3272705078125, 5.53900146484375, 5.750732421875, 5.96246337890625, 6.1741943359375, 6.38592529296875, 6.59765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 5.0, 4.0, 11.0, 17.0, 7.0, 10.0, 17.0, 24.0, 33.0, 32.0, 33.0, 37.0, 50.0, 54.0, 44.0, 59.0, 60.0, 56.0, 59.0, 61.0, 47.0, 45.0, 40.0, 34.0, 19.0, 19.0, 20.0, 10.0, 15.0, 14.0, 13.0, 7.0, 7.0, 2.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0002243518829345703, -0.00021751224994659424, -0.00021067261695861816, -0.0002038329839706421, -0.00019699335098266602, -0.00019015371799468994, -0.00018331408500671387, -0.0001764744520187378, -0.00016963481903076172, -0.00016279518604278564, -0.00015595555305480957, -0.0001491159200668335, -0.00014227628707885742, -0.00013543665409088135, -0.00012859702110290527, -0.0001217573881149292, -0.00011491775512695312, -0.00010807812213897705, -0.00010123848915100098, -9.43988561630249e-05, -8.755922317504883e-05, -8.071959018707275e-05, -7.387995719909668e-05, -6.70403242111206e-05, -6.020069122314453e-05, -5.336105823516846e-05, -4.652142524719238e-05, -3.968179225921631e-05, -3.2842159271240234e-05, -2.600252628326416e-05, -1.9162893295288086e-05, -1.2323260307312012e-05, -5.4836273193359375e-06, 1.3560056686401367e-06, 8.195638656616211e-06, 1.5035271644592285e-05, 2.187490463256836e-05, 2.8714537620544434e-05, 3.555417060852051e-05, 4.239380359649658e-05, 4.9233436584472656e-05, 5.607306957244873e-05, 6.29127025604248e-05, 6.975233554840088e-05, 7.659196853637695e-05, 8.343160152435303e-05, 9.02712345123291e-05, 9.711086750030518e-05, 0.00010395050048828125, 0.00011079013347625732, 0.0001176297664642334, 0.00012446939945220947, 0.00013130903244018555, 0.00013814866542816162, 0.0001449882984161377, 0.00015182793140411377, 0.00015866756439208984, 0.00016550719738006592, 0.000172346830368042, 0.00017918646335601807, 0.00018602609634399414, 0.00019286572933197021, 0.0001997053623199463, 0.00020654499530792236, 0.00021338462829589844]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 15.0, 9.0, 11.0, 34.0, 46.0, 75.0, 116.0, 223.0, 334.0, 650.0, 1080.0, 1917.0, 3294.0, 5566.0, 10149.0, 19165.0, 37444.0, 74901.0, 148175.0, 237738.0, 228995.0, 136605.0, 68599.0, 34107.0, 17607.0, 9359.0, 5094.0, 3046.0, 1697.0, 1034.0, 580.0, 374.0, 185.0, 123.0, 81.0, 41.0, 31.0, 24.0, 10.0, 10.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8291015625, -7.548828125, -7.2685546875, -6.98828125, -6.7080078125, -6.427734375, -6.1474609375, -5.8671875, -5.5869140625, -5.306640625, -5.0263671875, -4.74609375, -4.4658203125, -4.185546875, -3.9052734375, -3.625, -3.3447265625, -3.064453125, -2.7841796875, -2.50390625, -2.2236328125, -1.943359375, -1.6630859375, -1.3828125, -1.1025390625, -0.822265625, -0.5419921875, -0.26171875, 0.0185546875, 0.298828125, 0.5791015625, 0.859375, 1.1396484375, 1.419921875, 1.7001953125, 1.98046875, 2.2607421875, 2.541015625, 2.8212890625, 3.1015625, 3.3818359375, 3.662109375, 3.9423828125, 4.22265625, 4.5029296875, 4.783203125, 5.0634765625, 5.34375, 5.6240234375, 5.904296875, 6.1845703125, 6.46484375, 6.7451171875, 7.025390625, 7.3056640625, 7.5859375, 7.8662109375, 8.146484375, 8.4267578125, 8.70703125, 8.9873046875, 9.267578125, 9.5478515625, 9.828125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 8.0, 7.0, 11.0, 18.0, 19.0, 19.0, 26.0, 36.0, 37.0, 47.0, 62.0, 50.0, 61.0, 62.0, 60.0, 61.0, 64.0, 54.0, 44.0, 42.0, 36.0, 25.0, 29.0, 15.0, 20.0, 17.0, 15.0, 9.0, 9.0, 12.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.068359375, -1.98846435546875, -1.9085693359375, -1.82867431640625, -1.748779296875, -1.66888427734375, -1.5889892578125, -1.50909423828125, -1.42919921875, -1.34930419921875, -1.2694091796875, -1.18951416015625, -1.109619140625, -1.02972412109375, -0.9498291015625, -0.86993408203125, -0.7900390625, -0.71014404296875, -0.6302490234375, -0.55035400390625, -0.470458984375, -0.39056396484375, -0.3106689453125, -0.23077392578125, -0.15087890625, -0.07098388671875, 0.0089111328125, 0.08880615234375, 0.168701171875, 0.24859619140625, 0.3284912109375, 0.40838623046875, 0.48828125, 0.56817626953125, 0.6480712890625, 0.72796630859375, 0.807861328125, 0.88775634765625, 0.9676513671875, 1.04754638671875, 1.12744140625, 1.20733642578125, 1.2872314453125, 1.36712646484375, 1.447021484375, 1.52691650390625, 1.6068115234375, 1.68670654296875, 1.7666015625, 1.84649658203125, 1.9263916015625, 2.00628662109375, 2.086181640625, 2.16607666015625, 2.2459716796875, 2.32586669921875, 2.40576171875, 2.48565673828125, 2.5655517578125, 2.64544677734375, 2.725341796875, 2.80523681640625, 2.8851318359375, 2.96502685546875, 3.044921875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 7.0, 5.0, 5.0, 7.0, 9.0, 11.0, 18.0, 21.0, 23.0, 30.0, 41.0, 39.0, 50.0, 53.0, 70.0, 69.0, 78.0, 71.0, 62.0, 45.0, 51.0, 37.0, 38.0, 27.0, 33.0, 20.0, 11.0, 11.0, 8.0, 8.0, 9.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.962488174438477, -18.337907791137695, -17.713327407836914, -17.088748931884766, -16.464168548583984, -15.839588165283203, -15.215007781982422, -14.590428352355957, -13.965848922729492, -13.341268539428711, -12.716689109802246, -12.092108726501465, -11.467529296875, -10.842948913574219, -10.218368530273438, -9.593789100646973, -8.969208717346191, -8.34462833404541, -7.720048904418945, -7.095468521118164, -6.470889091491699, -5.846308708190918, -5.221728801727295, -4.597148895263672, -3.972568988800049, -3.347989082336426, -2.7234091758728027, -2.0988290309906006, -1.4742491245269775, -0.8496692180633545, -0.22508907318115234, 0.3994908332824707, 1.0240707397460938, 1.6486506462097168, 2.27323055267334, 2.897810697555542, 3.522390604019165, 4.146970748901367, 4.77155065536499, 5.396130561828613, 6.020710468292236, 6.645290374755859, 7.269870281219482, 7.8944501876831055, 8.519030570983887, 9.143610000610352, 9.768190383911133, 10.392770767211914, 11.017350196838379, 11.64193058013916, 12.266510009765625, 12.891090393066406, 13.515669822692871, 14.140250205993652, 14.764829635620117, 15.389410018920898, 16.01399040222168, 16.63857078552246, 17.263151168823242, 17.88772964477539, 18.512310028076172, 19.136890411376953, 19.761470794677734, 20.386051177978516, 21.010629653930664]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 3.0, 4.0, 4.0, 10.0, 14.0, 21.0, 11.0, 10.0, 25.0, 19.0, 22.0, 26.0, 19.0, 30.0, 35.0, 37.0, 35.0, 41.0, 42.0, 43.0, 45.0, 41.0, 41.0, 39.0, 41.0, 41.0, 32.0, 33.0, 44.0, 27.0, 21.0, 16.0, 19.0, 15.0, 17.0, 13.0, 11.0, 7.0, 13.0, 8.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.69821548461914, -14.253523826599121, -13.808832168579102, -13.364140510559082, -12.919448852539062, -12.47475814819336, -12.03006649017334, -11.58537483215332, -11.1406831741333, -10.695991516113281, -10.251299858093262, -9.806608200073242, -9.361917495727539, -8.917224884033203, -8.4725341796875, -8.02784252166748, -7.583150863647461, -7.138459205627441, -6.693767547607422, -6.2490763664245605, -5.804384708404541, -5.3596930503845215, -4.91500186920166, -4.470310211181641, -4.025618553161621, -3.5809268951416016, -3.136235475540161, -2.6915440559387207, -2.246852397918701, -1.8021607398986816, -1.3574693202972412, -0.9127779006958008, -0.46808624267578125, -0.02339470386505127, 0.4212968349456787, 0.8659883737564087, 1.3106799125671387, 1.7553715705871582, 2.2000629901885986, 2.644754409790039, 3.0894460678100586, 3.534137725830078, 3.9788291454315186, 4.423520565032959, 4.8682122230529785, 5.312903881072998, 5.757595062255859, 6.202286720275879, 6.646978378295898, 7.091670036315918, 7.5363616943359375, 7.981052875518799, 8.425745010375977, 8.87043571472168, 9.3151273727417, 9.759819030761719, 10.204510688781738, 10.649202346801758, 11.093894004821777, 11.538585662841797, 11.9832763671875, 12.427968978881836, 12.872659683227539, 13.317351341247559, 13.762042999267578]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 7.0, 13.0, 17.0, 19.0, 27.0, 48.0, 56.0, 106.0, 135.0, 178.0, 314.0, 480.0, 746.0, 1161.0, 2018.0, 3659.0, 6816.0, 14140.0, 30482.0, 68437.0, 151969.0, 262596.0, 251308.0, 136856.0, 61753.0, 27493.0, 12817.0, 6577.0, 3393.0, 1933.0, 1105.0, 598.0, 431.0, 286.0, 186.0, 110.0, 70.0, 66.0, 36.0, 38.0, 23.0, 15.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.1875, -15.646728515625, -15.10595703125, -14.565185546875, -14.0244140625, -13.483642578125, -12.94287109375, -12.402099609375, -11.861328125, -11.320556640625, -10.77978515625, -10.239013671875, -9.6982421875, -9.157470703125, -8.61669921875, -8.075927734375, -7.53515625, -6.994384765625, -6.45361328125, -5.912841796875, -5.3720703125, -4.831298828125, -4.29052734375, -3.749755859375, -3.208984375, -2.668212890625, -2.12744140625, -1.586669921875, -1.0458984375, -0.505126953125, 0.03564453125, 0.576416015625, 1.1171875, 1.657958984375, 2.19873046875, 2.739501953125, 3.2802734375, 3.821044921875, 4.36181640625, 4.902587890625, 5.443359375, 5.984130859375, 6.52490234375, 7.065673828125, 7.6064453125, 8.147216796875, 8.68798828125, 9.228759765625, 9.76953125, 10.310302734375, 10.85107421875, 11.391845703125, 11.9326171875, 12.473388671875, 13.01416015625, 13.554931640625, 14.095703125, 14.636474609375, 15.17724609375, 15.718017578125, 16.2587890625, 16.799560546875, 17.34033203125, 17.881103515625, 18.421875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 4.0, 17.0, 11.0, 18.0, 17.0, 14.0, 19.0, 18.0, 32.0, 33.0, 33.0, 44.0, 64.0, 48.0, 51.0, 52.0, 48.0, 41.0, 46.0, 47.0, 40.0, 48.0, 35.0, 39.0, 36.0, 16.0, 15.0, 23.0, 13.0, 17.0, 6.0, 4.0, 12.0, 9.0, 3.0, 4.0, 3.0, 6.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.126708984375, -16.59716796875, -16.067626953125, -15.5380859375, -15.008544921875, -14.47900390625, -13.949462890625, -13.419921875, -12.890380859375, -12.36083984375, -11.831298828125, -11.3017578125, -10.772216796875, -10.24267578125, -9.713134765625, -9.18359375, -8.654052734375, -8.12451171875, -7.594970703125, -7.0654296875, -6.535888671875, -6.00634765625, -5.476806640625, -4.947265625, -4.417724609375, -3.88818359375, -3.358642578125, -2.8291015625, -2.299560546875, -1.77001953125, -1.240478515625, -0.7109375, -0.181396484375, 0.34814453125, 0.877685546875, 1.4072265625, 1.936767578125, 2.46630859375, 2.995849609375, 3.525390625, 4.054931640625, 4.58447265625, 5.114013671875, 5.6435546875, 6.173095703125, 6.70263671875, 7.232177734375, 7.76171875, 8.291259765625, 8.82080078125, 9.350341796875, 9.8798828125, 10.409423828125, 10.93896484375, 11.468505859375, 11.998046875, 12.527587890625, 13.05712890625, 13.586669921875, 14.1162109375, 14.645751953125, 15.17529296875, 15.704833984375, 16.234375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 10.0, 8.0, 13.0, 17.0, 21.0, 41.0, 47.0, 53.0, 90.0, 127.0, 220.0, 277.0, 380.0, 624.0, 903.0, 1403.0, 2253.0, 3641.0, 6101.0, 10755.0, 19021.0, 35761.0, 71014.0, 136522.0, 219324.0, 226600.0, 147096.0, 77666.0, 39164.0, 20789.0, 11413.0, 6471.0, 3862.0, 2360.0, 1510.0, 1013.0, 615.0, 418.0, 274.0, 217.0, 137.0, 81.0, 70.0, 48.0, 40.0, 16.0, 20.0, 10.0, 9.0, 10.0, 8.0, 3.0, 4.0, 3.0, 3.0], "bins": [-18.828125, -18.275390625, -17.72265625, -17.169921875, -16.6171875, -16.064453125, -15.51171875, -14.958984375, -14.40625, -13.853515625, -13.30078125, -12.748046875, -12.1953125, -11.642578125, -11.08984375, -10.537109375, -9.984375, -9.431640625, -8.87890625, -8.326171875, -7.7734375, -7.220703125, -6.66796875, -6.115234375, -5.5625, -5.009765625, -4.45703125, -3.904296875, -3.3515625, -2.798828125, -2.24609375, -1.693359375, -1.140625, -0.587890625, -0.03515625, 0.517578125, 1.0703125, 1.623046875, 2.17578125, 2.728515625, 3.28125, 3.833984375, 4.38671875, 4.939453125, 5.4921875, 6.044921875, 6.59765625, 7.150390625, 7.703125, 8.255859375, 8.80859375, 9.361328125, 9.9140625, 10.466796875, 11.01953125, 11.572265625, 12.125, 12.677734375, 13.23046875, 13.783203125, 14.3359375, 14.888671875, 15.44140625, 15.994140625, 16.546875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 9.0, 7.0, 11.0, 8.0, 9.0, 8.0, 11.0, 13.0, 21.0, 22.0, 25.0, 24.0, 26.0, 25.0, 31.0, 32.0, 41.0, 31.0, 30.0, 35.0, 29.0, 34.0, 45.0, 39.0, 44.0, 30.0, 38.0, 36.0, 37.0, 34.0, 25.0, 23.0, 32.0, 24.0, 19.0, 13.0, 10.0, 16.0, 13.0, 7.0, 6.0, 7.0, 6.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.0390625, -9.7431640625, -9.447265625, -9.1513671875, -8.85546875, -8.5595703125, -8.263671875, -7.9677734375, -7.671875, -7.3759765625, -7.080078125, -6.7841796875, -6.48828125, -6.1923828125, -5.896484375, -5.6005859375, -5.3046875, -5.0087890625, -4.712890625, -4.4169921875, -4.12109375, -3.8251953125, -3.529296875, -3.2333984375, -2.9375, -2.6416015625, -2.345703125, -2.0498046875, -1.75390625, -1.4580078125, -1.162109375, -0.8662109375, -0.5703125, -0.2744140625, 0.021484375, 0.3173828125, 0.61328125, 0.9091796875, 1.205078125, 1.5009765625, 1.796875, 2.0927734375, 2.388671875, 2.6845703125, 2.98046875, 3.2763671875, 3.572265625, 3.8681640625, 4.1640625, 4.4599609375, 4.755859375, 5.0517578125, 5.34765625, 5.6435546875, 5.939453125, 6.2353515625, 6.53125, 6.8271484375, 7.123046875, 7.4189453125, 7.71484375, 8.0107421875, 8.306640625, 8.6025390625, 8.8984375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 14.0, 25.0, 20.0, 47.0, 61.0, 90.0, 114.0, 181.0, 235.0, 396.0, 596.0, 937.0, 1483.0, 2326.0, 3754.0, 6389.0, 10913.0, 19380.0, 37119.0, 76333.0, 157989.0, 261921.0, 226403.0, 118904.0, 56606.0, 28750.0, 15186.0, 8611.0, 4996.0, 3120.0, 2035.0, 1229.0, 814.0, 524.0, 355.0, 255.0, 156.0, 96.0, 54.0, 40.0, 28.0, 22.0, 12.0, 11.0, 5.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.5234375, -10.1925048828125, -9.861572265625, -9.5306396484375, -9.19970703125, -8.8687744140625, -8.537841796875, -8.2069091796875, -7.8759765625, -7.5450439453125, -7.214111328125, -6.8831787109375, -6.55224609375, -6.2213134765625, -5.890380859375, -5.5594482421875, -5.228515625, -4.8975830078125, -4.566650390625, -4.2357177734375, -3.90478515625, -3.5738525390625, -3.242919921875, -2.9119873046875, -2.5810546875, -2.2501220703125, -1.919189453125, -1.5882568359375, -1.25732421875, -0.9263916015625, -0.595458984375, -0.2645263671875, 0.06640625, 0.3973388671875, 0.728271484375, 1.0592041015625, 1.39013671875, 1.7210693359375, 2.052001953125, 2.3829345703125, 2.7138671875, 3.0447998046875, 3.375732421875, 3.7066650390625, 4.03759765625, 4.3685302734375, 4.699462890625, 5.0303955078125, 5.361328125, 5.6922607421875, 6.023193359375, 6.3541259765625, 6.68505859375, 7.0159912109375, 7.346923828125, 7.6778564453125, 8.0087890625, 8.3397216796875, 8.670654296875, 9.0015869140625, 9.33251953125, 9.6634521484375, 9.994384765625, 10.3253173828125, 10.65625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 2.0, 4.0, 4.0, 2.0, 2.0, 8.0, 10.0, 14.0, 14.0, 21.0, 17.0, 33.0, 35.0, 37.0, 79.0, 73.0, 111.0, 93.0, 94.0, 80.0, 54.0, 52.0, 36.0, 29.0, 18.0, 14.0, 15.0, 14.0, 8.0, 6.0, 6.0, 1.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.0012760162353515625, -0.0012428909540176392, -0.0012097656726837158, -0.0011766403913497925, -0.0011435151100158691, -0.0011103898286819458, -0.0010772645473480225, -0.0010441392660140991, -0.0010110139846801758, -0.0009778887033462524, -0.0009447634220123291, -0.0009116381406784058, -0.0008785128593444824, -0.0008453875780105591, -0.0008122622966766357, -0.0007791370153427124, -0.0007460117340087891, -0.0007128864526748657, -0.0006797611713409424, -0.000646635890007019, -0.0006135106086730957, -0.0005803853273391724, -0.000547260046005249, -0.0005141347646713257, -0.00048100948333740234, -0.000447884202003479, -0.00041475892066955566, -0.0003816336393356323, -0.000348508358001709, -0.00031538307666778564, -0.0002822577953338623, -0.00024913251399993896, -0.00021600723266601562, -0.00018288195133209229, -0.00014975666999816895, -0.0001166313886642456, -8.350610733032227e-05, -5.0380825996398926e-05, -1.7255544662475586e-05, 1.5869736671447754e-05, 4.8995018005371094e-05, 8.212029933929443e-05, 0.00011524558067321777, 0.0001483708620071411, 0.00018149614334106445, 0.0002146214246749878, 0.00024774670600891113, 0.00028087198734283447, 0.0003139972686767578, 0.00034712255001068115, 0.0003802478313446045, 0.00041337311267852783, 0.00044649839401245117, 0.0004796236753463745, 0.0005127489566802979, 0.0005458742380142212, 0.0005789995193481445, 0.0006121248006820679, 0.0006452500820159912, 0.0006783753633499146, 0.0007115006446838379, 0.0007446259260177612, 0.0007777512073516846, 0.0008108764886856079, 0.0008440017700195312]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 3.0, 3.0, 11.0, 11.0, 16.0, 25.0, 43.0, 50.0, 149.0, 192.0, 375.0, 676.0, 1346.0, 2469.0, 5059.0, 10371.0, 23639.0, 56381.0, 143660.0, 312854.0, 283986.0, 121088.0, 47484.0, 20201.0, 9307.0, 4442.0, 2234.0, 1090.0, 586.0, 336.0, 178.0, 93.0, 60.0, 54.0, 27.0, 17.0, 10.0, 8.0, 7.0, 9.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.5804443359375, -12.145263671875, -11.7100830078125, -11.27490234375, -10.8397216796875, -10.404541015625, -9.9693603515625, -9.5341796875, -9.0989990234375, -8.663818359375, -8.2286376953125, -7.79345703125, -7.3582763671875, -6.923095703125, -6.4879150390625, -6.052734375, -5.6175537109375, -5.182373046875, -4.7471923828125, -4.31201171875, -3.8768310546875, -3.441650390625, -3.0064697265625, -2.5712890625, -2.1361083984375, -1.700927734375, -1.2657470703125, -0.83056640625, -0.3953857421875, 0.039794921875, 0.4749755859375, 0.91015625, 1.3453369140625, 1.780517578125, 2.2156982421875, 2.65087890625, 3.0860595703125, 3.521240234375, 3.9564208984375, 4.3916015625, 4.8267822265625, 5.261962890625, 5.6971435546875, 6.13232421875, 6.5675048828125, 7.002685546875, 7.4378662109375, 7.873046875, 8.3082275390625, 8.743408203125, 9.1785888671875, 9.61376953125, 10.0489501953125, 10.484130859375, 10.9193115234375, 11.3544921875, 11.7896728515625, 12.224853515625, 12.6600341796875, 13.09521484375, 13.5303955078125, 13.965576171875, 14.4007568359375, 14.8359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 6.0, 6.0, 9.0, 14.0, 9.0, 23.0, 20.0, 25.0, 30.0, 33.0, 35.0, 50.0, 58.0, 55.0, 56.0, 50.0, 55.0, 38.0, 53.0, 51.0, 38.0, 47.0, 41.0, 33.0, 27.0, 23.0, 20.0, 11.0, 13.0, 19.0, 8.0, 5.0, 11.0, 3.0, 3.0, 6.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.05078125, -1.979644775390625, -1.90850830078125, -1.837371826171875, -1.7662353515625, -1.695098876953125, -1.62396240234375, -1.552825927734375, -1.481689453125, -1.410552978515625, -1.33941650390625, -1.268280029296875, -1.1971435546875, -1.126007080078125, -1.05487060546875, -0.983734130859375, -0.91259765625, -0.841461181640625, -0.77032470703125, -0.699188232421875, -0.6280517578125, -0.556915283203125, -0.48577880859375, -0.414642333984375, -0.343505859375, -0.272369384765625, -0.20123291015625, -0.130096435546875, -0.0589599609375, 0.012176513671875, 0.08331298828125, 0.154449462890625, 0.2255859375, 0.296722412109375, 0.36785888671875, 0.438995361328125, 0.5101318359375, 0.581268310546875, 0.65240478515625, 0.723541259765625, 0.794677734375, 0.865814208984375, 0.93695068359375, 1.008087158203125, 1.0792236328125, 1.150360107421875, 1.22149658203125, 1.292633056640625, 1.36376953125, 1.434906005859375, 1.50604248046875, 1.577178955078125, 1.6483154296875, 1.719451904296875, 1.79058837890625, 1.861724853515625, 1.932861328125, 2.003997802734375, 2.07513427734375, 2.146270751953125, 2.2174072265625, 2.288543701171875, 2.35968017578125, 2.430816650390625, 2.501953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 4.0, 6.0, 3.0, 2.0, 5.0, 3.0, 4.0, 6.0, 14.0, 5.0, 18.0, 14.0, 11.0, 15.0, 29.0, 29.0, 37.0, 39.0, 67.0, 69.0, 65.0, 59.0, 56.0, 51.0, 58.0, 50.0, 47.0, 40.0, 37.0, 39.0, 26.0, 19.0, 17.0, 11.0, 7.0, 11.0, 5.0, 8.0, 6.0, 3.0, 5.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.010011672973633, -18.402679443359375, -17.795345306396484, -17.188013076782227, -16.58068084716797, -15.973347663879395, -15.36601448059082, -14.758682250976562, -14.151349067687988, -13.544015884399414, -12.936683654785156, -12.329350471496582, -11.722017288208008, -11.11468505859375, -10.507351875305176, -9.900018692016602, -9.292686462402344, -8.68535327911377, -8.078021049499512, -7.4706878662109375, -6.8633551597595215, -6.2560224533081055, -5.648689270019531, -5.041356563568115, -4.434023857116699, -3.826691150665283, -3.219358205795288, -2.612025260925293, -2.004692554473877, -1.397359848022461, -0.7900269031524658, -0.1826939582824707, 0.4246368408203125, 1.031969666481018, 1.6393024921417236, 2.2466354370117188, 2.8539681434631348, 3.461300849914551, 4.068634033203125, 4.675966739654541, 5.283299446105957, 5.890632152557373, 6.497964859008789, 7.105298042297363, 7.712630748748779, 8.319963455200195, 8.92729663848877, 9.534629821777344, 10.141962051391602, 10.749295234680176, 11.356627464294434, 11.963960647583008, 12.571292877197266, 13.17862606048584, 13.785959243774414, 14.393291473388672, 15.000624656677246, 15.60795783996582, 16.215290069580078, 16.822622299194336, 17.429956436157227, 18.037288665771484, 18.644620895385742, 19.251955032348633, 19.85928726196289]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 10.0, 8.0, 18.0, 19.0, 20.0, 12.0, 21.0, 20.0, 30.0, 25.0, 23.0, 35.0, 46.0, 50.0, 41.0, 40.0, 49.0, 50.0, 49.0, 41.0, 36.0, 43.0, 37.0, 36.0, 36.0, 28.0, 25.0, 22.0, 23.0, 17.0, 18.0, 14.0, 11.0, 11.0, 9.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-18.90999984741211, -18.345932006835938, -17.7818660736084, -17.217798233032227, -16.653732299804688, -16.089664459228516, -15.525596618652344, -14.961529731750488, -14.397462844848633, -13.833395957946777, -13.269329071044922, -12.70526123046875, -12.141194343566895, -11.577127456665039, -11.013059616088867, -10.448992729187012, -9.884925842285156, -9.3208589553833, -8.756792068481445, -8.192724227905273, -7.628657341003418, -7.0645904541015625, -6.500523090362549, -5.936455726623535, -5.37238883972168, -4.808321952819824, -4.2442545890808105, -3.680187463760376, -3.1161203384399414, -2.552053213119507, -1.9879860877990723, -1.4239189624786377, -0.8598537445068359, -0.29578661918640137, 0.2682805061340332, 0.8323476314544678, 1.3964147567749023, 1.960481882095337, 2.5245490074157715, 3.088616132736206, 3.6526832580566406, 4.216750144958496, 4.78081750869751, 5.344884872436523, 5.908951759338379, 6.473018646240234, 7.037086009979248, 7.601153373718262, 8.165220260620117, 8.729287147521973, 9.293354034423828, 9.857421875, 10.421488761901855, 10.985555648803711, 11.549623489379883, 12.113690376281738, 12.677757263183594, 13.24182415008545, 13.805891036987305, 14.369958877563477, 14.934025764465332, 15.498092651367188, 16.06216049194336, 16.6262264251709, 17.19029426574707]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 12.0, 20.0, 19.0, 36.0, 65.0, 90.0, 110.0, 217.0, 297.0, 529.0, 855.0, 1286.0, 2330.0, 4130.0, 7473.0, 14364.0, 29628.0, 67494.0, 178879.0, 511646.0, 1194216.0, 1266170.0, 570786.0, 199934.0, 75704.0, 33069.0, 15899.0, 8128.0, 4505.0, 2550.0, 1509.0, 872.0, 553.0, 339.0, 214.0, 121.0, 85.0, 52.0, 25.0, 20.0, 16.0, 4.0, 8.0, 7.0, 3.0, 9.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.3125, -27.5048828125, -26.697265625, -25.8896484375, -25.08203125, -24.2744140625, -23.466796875, -22.6591796875, -21.8515625, -21.0439453125, -20.236328125, -19.4287109375, -18.62109375, -17.8134765625, -17.005859375, -16.1982421875, -15.390625, -14.5830078125, -13.775390625, -12.9677734375, -12.16015625, -11.3525390625, -10.544921875, -9.7373046875, -8.9296875, -8.1220703125, -7.314453125, -6.5068359375, -5.69921875, -4.8916015625, -4.083984375, -3.2763671875, -2.46875, -1.6611328125, -0.853515625, -0.0458984375, 0.76171875, 1.5693359375, 2.376953125, 3.1845703125, 3.9921875, 4.7998046875, 5.607421875, 6.4150390625, 7.22265625, 8.0302734375, 8.837890625, 9.6455078125, 10.453125, 11.2607421875, 12.068359375, 12.8759765625, 13.68359375, 14.4912109375, 15.298828125, 16.1064453125, 16.9140625, 17.7216796875, 18.529296875, 19.3369140625, 20.14453125, 20.9521484375, 21.759765625, 22.5673828125, 23.375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 5.0, 11.0, 11.0, 15.0, 17.0, 15.0, 9.0, 21.0, 17.0, 26.0, 23.0, 29.0, 31.0, 42.0, 54.0, 44.0, 38.0, 46.0, 49.0, 36.0, 29.0, 44.0, 44.0, 40.0, 40.0, 29.0, 28.0, 29.0, 28.0, 21.0, 19.0, 15.0, 14.0, 11.0, 14.0, 10.0, 15.0, 7.0, 6.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.171875, -16.653076171875, -16.13427734375, -15.615478515625, -15.0966796875, -14.577880859375, -14.05908203125, -13.540283203125, -13.021484375, -12.502685546875, -11.98388671875, -11.465087890625, -10.9462890625, -10.427490234375, -9.90869140625, -9.389892578125, -8.87109375, -8.352294921875, -7.83349609375, -7.314697265625, -6.7958984375, -6.277099609375, -5.75830078125, -5.239501953125, -4.720703125, -4.201904296875, -3.68310546875, -3.164306640625, -2.6455078125, -2.126708984375, -1.60791015625, -1.089111328125, -0.5703125, -0.051513671875, 0.46728515625, 0.986083984375, 1.5048828125, 2.023681640625, 2.54248046875, 3.061279296875, 3.580078125, 4.098876953125, 4.61767578125, 5.136474609375, 5.6552734375, 6.174072265625, 6.69287109375, 7.211669921875, 7.73046875, 8.249267578125, 8.76806640625, 9.286865234375, 9.8056640625, 10.324462890625, 10.84326171875, 11.362060546875, 11.880859375, 12.399658203125, 12.91845703125, 13.437255859375, 13.9560546875, 14.474853515625, 14.99365234375, 15.512451171875, 16.03125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 11.0, 14.0, 6.0, 19.0, 35.0, 37.0, 61.0, 97.0, 121.0, 190.0, 283.0, 432.0, 634.0, 1035.0, 1638.0, 2463.0, 4036.0, 6465.0, 10369.0, 17493.0, 29766.0, 52881.0, 98563.0, 189743.0, 380010.0, 738514.0, 1056046.0, 769899.0, 398419.0, 198999.0, 103164.0, 55308.0, 30888.0, 18199.0, 10549.0, 6546.0, 4070.0, 2562.0, 1657.0, 1008.0, 691.0, 425.0, 314.0, 184.0, 133.0, 110.0, 71.0, 44.0, 21.0, 19.0, 9.0, 12.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0], "bins": [-26.171875, -25.367431640625, -24.56298828125, -23.758544921875, -22.9541015625, -22.149658203125, -21.34521484375, -20.540771484375, -19.736328125, -18.931884765625, -18.12744140625, -17.322998046875, -16.5185546875, -15.714111328125, -14.90966796875, -14.105224609375, -13.30078125, -12.496337890625, -11.69189453125, -10.887451171875, -10.0830078125, -9.278564453125, -8.47412109375, -7.669677734375, -6.865234375, -6.060791015625, -5.25634765625, -4.451904296875, -3.6474609375, -2.843017578125, -2.03857421875, -1.234130859375, -0.4296875, 0.374755859375, 1.17919921875, 1.983642578125, 2.7880859375, 3.592529296875, 4.39697265625, 5.201416015625, 6.005859375, 6.810302734375, 7.61474609375, 8.419189453125, 9.2236328125, 10.028076171875, 10.83251953125, 11.636962890625, 12.44140625, 13.245849609375, 14.05029296875, 14.854736328125, 15.6591796875, 16.463623046875, 17.26806640625, 18.072509765625, 18.876953125, 19.681396484375, 20.48583984375, 21.290283203125, 22.0947265625, 22.899169921875, 23.70361328125, 24.508056640625, 25.3125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 4.0, 3.0, 3.0, 9.0, 5.0, 9.0, 12.0, 17.0, 18.0, 37.0, 34.0, 45.0, 54.0, 64.0, 87.0, 98.0, 149.0, 163.0, 217.0, 215.0, 235.0, 314.0, 311.0, 287.0, 307.0, 248.0, 215.0, 182.0, 141.0, 136.0, 96.0, 86.0, 59.0, 48.0, 32.0, 33.0, 23.0, 15.0, 10.0, 13.0, 9.0, 8.0, 10.0, 6.0, 2.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-10.5, -10.2086181640625, -9.917236328125, -9.6258544921875, -9.33447265625, -9.0430908203125, -8.751708984375, -8.4603271484375, -8.1689453125, -7.8775634765625, -7.586181640625, -7.2947998046875, -7.00341796875, -6.7120361328125, -6.420654296875, -6.1292724609375, -5.837890625, -5.5465087890625, -5.255126953125, -4.9637451171875, -4.67236328125, -4.3809814453125, -4.089599609375, -3.7982177734375, -3.5068359375, -3.2154541015625, -2.924072265625, -2.6326904296875, -2.34130859375, -2.0499267578125, -1.758544921875, -1.4671630859375, -1.17578125, -0.8843994140625, -0.593017578125, -0.3016357421875, -0.01025390625, 0.2811279296875, 0.572509765625, 0.8638916015625, 1.1552734375, 1.4466552734375, 1.738037109375, 2.0294189453125, 2.32080078125, 2.6121826171875, 2.903564453125, 3.1949462890625, 3.486328125, 3.7777099609375, 4.069091796875, 4.3604736328125, 4.65185546875, 4.9432373046875, 5.234619140625, 5.5260009765625, 5.8173828125, 6.1087646484375, 6.400146484375, 6.6915283203125, 6.98291015625, 7.2742919921875, 7.565673828125, 7.8570556640625, 8.1484375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 3.0, 7.0, 9.0, 7.0, 11.0, 25.0, 15.0, 20.0, 30.0, 36.0, 36.0, 56.0, 80.0, 61.0, 68.0, 72.0, 64.0, 77.0, 52.0, 52.0, 36.0, 35.0, 32.0, 31.0, 14.0, 15.0, 9.0, 8.0, 10.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.50762176513672, -31.463815689086914, -30.420007705688477, -29.376201629638672, -28.332393646240234, -27.28858757019043, -26.244781494140625, -25.200973510742188, -24.157167434692383, -23.113361358642578, -22.06955337524414, -21.025747299194336, -19.98194122314453, -18.938133239746094, -17.89432716369629, -16.850521087646484, -15.806713104248047, -14.762906074523926, -13.719099044799805, -12.67529296875, -11.631485939025879, -10.587678909301758, -9.543872833251953, -8.500065803527832, -7.456258773803711, -6.41245174407959, -5.368645191192627, -4.324838638305664, -3.281031608581543, -2.237224578857422, -1.193418025970459, -0.1496114730834961, 0.8941993713378906, 1.9380061626434326, 2.9818129539489746, 4.0256195068359375, 5.069426536560059, 6.11323356628418, 7.157040119171143, 8.200846672058105, 9.244653701782227, 10.288460731506348, 11.332267761230469, 12.376073837280273, 13.419880867004395, 14.463687896728516, 15.50749397277832, 16.551300048828125, 17.595108032226562, 18.638914108276367, 19.682722091674805, 20.72652816772461, 21.770336151123047, 22.81414222717285, 23.857948303222656, 24.901756286621094, 25.9455623626709, 26.989368438720703, 28.03317642211914, 29.076982498168945, 30.12078857421875, 31.164596557617188, 32.208404541015625, 33.2522087097168, 34.296016693115234]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 5.0, 17.0, 17.0, 19.0, 21.0, 20.0, 16.0, 21.0, 23.0, 38.0, 32.0, 36.0, 44.0, 42.0, 46.0, 49.0, 48.0, 41.0, 38.0, 37.0, 40.0, 38.0, 41.0, 26.0, 41.0, 30.0, 16.0, 32.0, 18.0, 22.0, 16.0, 10.0, 8.0, 5.0, 7.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.939693450927734, -24.156044006347656, -23.372394561767578, -22.5887451171875, -21.805095672607422, -21.02144432067871, -20.237794876098633, -19.454145431518555, -18.670495986938477, -17.8868465423584, -17.10319709777832, -16.319547653198242, -15.535897254943848, -14.75224781036377, -13.968597412109375, -13.184947967529297, -12.401298522949219, -11.61764907836914, -10.833999633789062, -10.050349235534668, -9.26669979095459, -8.483050346374512, -7.699400424957275, -6.915750503540039, -6.132101058959961, -5.348451614379883, -4.5648016929626465, -3.7811520099639893, -2.997502326965332, -2.213852643966675, -1.4302029609680176, -0.6465530395507812, 0.13709640502929688, 0.9207460880279541, 1.7043957710266113, 2.4880454540252686, 3.271695137023926, 4.055344581604004, 4.83899450302124, 5.622644424438477, 6.406293869018555, 7.189943313598633, 7.973593235015869, 8.757243156433105, 9.540892601013184, 10.324542045593262, 11.108192443847656, 11.891841888427734, 12.675491333007812, 13.45914077758789, 14.242790222167969, 15.026440620422363, 15.810090065002441, 16.593740463256836, 17.377389907836914, 18.161039352416992, 18.94468879699707, 19.72833824157715, 20.511987686157227, 21.295637130737305, 22.079288482666016, 22.862937927246094, 23.646587371826172, 24.43023681640625, 25.213886260986328]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 9.0, 13.0, 13.0, 12.0, 23.0, 42.0, 56.0, 78.0, 128.0, 202.0, 276.0, 441.0, 613.0, 1028.0, 1613.0, 2652.0, 4136.0, 6612.0, 10984.0, 18313.0, 30577.0, 51825.0, 87858.0, 139209.0, 186864.0, 179607.0, 128482.0, 79708.0, 46687.0, 27668.0, 16726.0, 9925.0, 6046.0, 3600.0, 2278.0, 1521.0, 923.0, 610.0, 389.0, 260.0, 177.0, 130.0, 99.0, 55.0, 29.0, 27.0, 15.0, 6.0, 3.0, 11.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4296875, -11.059814453125, -10.68994140625, -10.320068359375, -9.9501953125, -9.580322265625, -9.21044921875, -8.840576171875, -8.470703125, -8.100830078125, -7.73095703125, -7.361083984375, -6.9912109375, -6.621337890625, -6.25146484375, -5.881591796875, -5.51171875, -5.141845703125, -4.77197265625, -4.402099609375, -4.0322265625, -3.662353515625, -3.29248046875, -2.922607421875, -2.552734375, -2.182861328125, -1.81298828125, -1.443115234375, -1.0732421875, -0.703369140625, -0.33349609375, 0.036376953125, 0.40625, 0.776123046875, 1.14599609375, 1.515869140625, 1.8857421875, 2.255615234375, 2.62548828125, 2.995361328125, 3.365234375, 3.735107421875, 4.10498046875, 4.474853515625, 4.8447265625, 5.214599609375, 5.58447265625, 5.954345703125, 6.32421875, 6.694091796875, 7.06396484375, 7.433837890625, 7.8037109375, 8.173583984375, 8.54345703125, 8.913330078125, 9.283203125, 9.653076171875, 10.02294921875, 10.392822265625, 10.7626953125, 11.132568359375, 11.50244140625, 11.872314453125, 12.2421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 11.0, 8.0, 11.0, 17.0, 20.0, 13.0, 27.0, 26.0, 35.0, 34.0, 39.0, 38.0, 43.0, 46.0, 51.0, 64.0, 43.0, 46.0, 42.0, 42.0, 45.0, 43.0, 37.0, 31.0, 30.0, 17.0, 33.0, 23.0, 17.0, 12.0, 10.0, 8.0, 1.0, 5.0, 3.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.125, -28.220458984375, -27.31591796875, -26.411376953125, -25.5068359375, -24.602294921875, -23.69775390625, -22.793212890625, -21.888671875, -20.984130859375, -20.07958984375, -19.175048828125, -18.2705078125, -17.365966796875, -16.46142578125, -15.556884765625, -14.65234375, -13.747802734375, -12.84326171875, -11.938720703125, -11.0341796875, -10.129638671875, -9.22509765625, -8.320556640625, -7.416015625, -6.511474609375, -5.60693359375, -4.702392578125, -3.7978515625, -2.893310546875, -1.98876953125, -1.084228515625, -0.1796875, 0.724853515625, 1.62939453125, 2.533935546875, 3.4384765625, 4.343017578125, 5.24755859375, 6.152099609375, 7.056640625, 7.961181640625, 8.86572265625, 9.770263671875, 10.6748046875, 11.579345703125, 12.48388671875, 13.388427734375, 14.29296875, 15.197509765625, 16.10205078125, 17.006591796875, 17.9111328125, 18.815673828125, 19.72021484375, 20.624755859375, 21.529296875, 22.433837890625, 23.33837890625, 24.242919921875, 25.1474609375, 26.052001953125, 26.95654296875, 27.861083984375, 28.765625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 9.0, 15.0, 7.0, 16.0, 32.0, 22.0, 60.0, 95.0, 128.0, 217.0, 308.0, 481.0, 684.0, 1146.0, 1839.0, 2800.0, 4432.0, 7055.0, 11607.0, 18797.0, 30932.0, 52191.0, 86029.0, 138033.0, 190299.0, 181350.0, 123964.0, 77087.0, 46241.0, 27820.0, 16875.0, 10348.0, 6460.0, 3979.0, 2537.0, 1662.0, 1004.0, 708.0, 464.0, 277.0, 199.0, 122.0, 88.0, 46.0, 43.0, 13.0, 11.0, 7.0, 9.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.40625, -11.976806640625, -11.54736328125, -11.117919921875, -10.6884765625, -10.259033203125, -9.82958984375, -9.400146484375, -8.970703125, -8.541259765625, -8.11181640625, -7.682373046875, -7.2529296875, -6.823486328125, -6.39404296875, -5.964599609375, -5.53515625, -5.105712890625, -4.67626953125, -4.246826171875, -3.8173828125, -3.387939453125, -2.95849609375, -2.529052734375, -2.099609375, -1.670166015625, -1.24072265625, -0.811279296875, -0.3818359375, 0.047607421875, 0.47705078125, 0.906494140625, 1.3359375, 1.765380859375, 2.19482421875, 2.624267578125, 3.0537109375, 3.483154296875, 3.91259765625, 4.342041015625, 4.771484375, 5.200927734375, 5.63037109375, 6.059814453125, 6.4892578125, 6.918701171875, 7.34814453125, 7.777587890625, 8.20703125, 8.636474609375, 9.06591796875, 9.495361328125, 9.9248046875, 10.354248046875, 10.78369140625, 11.213134765625, 11.642578125, 12.072021484375, 12.50146484375, 12.930908203125, 13.3603515625, 13.789794921875, 14.21923828125, 14.648681640625, 15.078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 12.0, 9.0, 7.0, 8.0, 15.0, 13.0, 10.0, 14.0, 22.0, 16.0, 23.0, 18.0, 35.0, 43.0, 29.0, 35.0, 32.0, 39.0, 49.0, 35.0, 44.0, 31.0, 39.0, 35.0, 44.0, 41.0, 28.0, 30.0, 32.0, 20.0, 33.0, 18.0, 19.0, 17.0, 14.0, 17.0, 10.0, 6.0, 11.0, 9.0, 8.0, 8.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8828125, -12.45703125, -12.03125, -11.60546875, -11.1796875, -10.75390625, -10.328125, -9.90234375, -9.4765625, -9.05078125, -8.625, -8.19921875, -7.7734375, -7.34765625, -6.921875, -6.49609375, -6.0703125, -5.64453125, -5.21875, -4.79296875, -4.3671875, -3.94140625, -3.515625, -3.08984375, -2.6640625, -2.23828125, -1.8125, -1.38671875, -0.9609375, -0.53515625, -0.109375, 0.31640625, 0.7421875, 1.16796875, 1.59375, 2.01953125, 2.4453125, 2.87109375, 3.296875, 3.72265625, 4.1484375, 4.57421875, 5.0, 5.42578125, 5.8515625, 6.27734375, 6.703125, 7.12890625, 7.5546875, 7.98046875, 8.40625, 8.83203125, 9.2578125, 9.68359375, 10.109375, 10.53515625, 10.9609375, 11.38671875, 11.8125, 12.23828125, 12.6640625, 13.08984375, 13.515625, 13.94140625, 14.3671875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 12.0, 12.0, 21.0, 25.0, 34.0, 50.0, 61.0, 94.0, 183.0, 241.0, 347.0, 491.0, 816.0, 1286.0, 1961.0, 3228.0, 5137.0, 8720.0, 14963.0, 25925.0, 45220.0, 82037.0, 144422.0, 218299.0, 202728.0, 126528.0, 70935.0, 39343.0, 22209.0, 12907.0, 7579.0, 4533.0, 2961.0, 1847.0, 1140.0, 740.0, 514.0, 299.0, 221.0, 176.0, 100.0, 63.0, 51.0, 29.0, 21.0, 22.0, 9.0, 0.0, 9.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-7.1875, -6.9547119140625, -6.721923828125, -6.4891357421875, -6.25634765625, -6.0235595703125, -5.790771484375, -5.5579833984375, -5.3251953125, -5.0924072265625, -4.859619140625, -4.6268310546875, -4.39404296875, -4.1612548828125, -3.928466796875, -3.6956787109375, -3.462890625, -3.2301025390625, -2.997314453125, -2.7645263671875, -2.53173828125, -2.2989501953125, -2.066162109375, -1.8333740234375, -1.6005859375, -1.3677978515625, -1.135009765625, -0.9022216796875, -0.66943359375, -0.4366455078125, -0.203857421875, 0.0289306640625, 0.26171875, 0.4945068359375, 0.727294921875, 0.9600830078125, 1.19287109375, 1.4256591796875, 1.658447265625, 1.8912353515625, 2.1240234375, 2.3568115234375, 2.589599609375, 2.8223876953125, 3.05517578125, 3.2879638671875, 3.520751953125, 3.7535400390625, 3.986328125, 4.2191162109375, 4.451904296875, 4.6846923828125, 4.91748046875, 5.1502685546875, 5.383056640625, 5.6158447265625, 5.8486328125, 6.0814208984375, 6.314208984375, 6.5469970703125, 6.77978515625, 7.0125732421875, 7.245361328125, 7.4781494140625, 7.7109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 4.0, 5.0, 8.0, 7.0, 11.0, 9.0, 9.0, 16.0, 17.0, 17.0, 20.0, 26.0, 28.0, 37.0, 35.0, 48.0, 46.0, 45.0, 46.0, 60.0, 60.0, 44.0, 57.0, 35.0, 48.0, 41.0, 20.0, 24.0, 29.0, 31.0, 19.0, 19.0, 21.0, 16.0, 9.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00023603439331054688, -0.0002270713448524475, -0.00021810829639434814, -0.00020914524793624878, -0.00020018219947814941, -0.00019121915102005005, -0.00018225610256195068, -0.00017329305410385132, -0.00016433000564575195, -0.0001553669571876526, -0.00014640390872955322, -0.00013744086027145386, -0.0001284778118133545, -0.00011951476335525513, -0.00011055171489715576, -0.0001015886664390564, -9.262561798095703e-05, -8.366256952285767e-05, -7.46995210647583e-05, -6.573647260665894e-05, -5.677342414855957e-05, -4.7810375690460205e-05, -3.884732723236084e-05, -2.9884278774261475e-05, -2.092123031616211e-05, -1.1958181858062744e-05, -2.995133399963379e-06, 5.967915058135986e-06, 1.4930963516235352e-05, 2.3894011974334717e-05, 3.285706043243408e-05, 4.182010889053345e-05, 5.078315734863281e-05, 5.974620580673218e-05, 6.870925426483154e-05, 7.767230272293091e-05, 8.663535118103027e-05, 9.559839963912964e-05, 0.000104561448097229, 0.00011352449655532837, 0.00012248754501342773, 0.0001314505934715271, 0.00014041364192962646, 0.00014937669038772583, 0.0001583397388458252, 0.00016730278730392456, 0.00017626583576202393, 0.0001852288842201233, 0.00019419193267822266, 0.00020315498113632202, 0.0002121180295944214, 0.00022108107805252075, 0.00023004412651062012, 0.00023900717496871948, 0.00024797022342681885, 0.0002569332718849182, 0.0002658963203430176, 0.00027485936880111694, 0.0002838224172592163, 0.0002927854657173157, 0.00030174851417541504, 0.0003107115626335144, 0.00031967461109161377, 0.00032863765954971313, 0.0003376007080078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 14.0, 12.0, 18.0, 26.0, 20.0, 35.0, 47.0, 73.0, 89.0, 133.0, 190.0, 259.0, 391.0, 599.0, 966.0, 1513.0, 2695.0, 4784.0, 8878.0, 17392.0, 33713.0, 66818.0, 127241.0, 211496.0, 233087.0, 160009.0, 86267.0, 43468.0, 22223.0, 11331.0, 6016.0, 3265.0, 2003.0, 1206.0, 697.0, 487.0, 312.0, 236.0, 152.0, 114.0, 69.0, 51.0, 39.0, 38.0, 26.0, 15.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-9.8359375, -9.5303955078125, -9.224853515625, -8.9193115234375, -8.61376953125, -8.3082275390625, -8.002685546875, -7.6971435546875, -7.3916015625, -7.0860595703125, -6.780517578125, -6.4749755859375, -6.16943359375, -5.8638916015625, -5.558349609375, -5.2528076171875, -4.947265625, -4.6417236328125, -4.336181640625, -4.0306396484375, -3.72509765625, -3.4195556640625, -3.114013671875, -2.8084716796875, -2.5029296875, -2.1973876953125, -1.891845703125, -1.5863037109375, -1.28076171875, -0.9752197265625, -0.669677734375, -0.3641357421875, -0.05859375, 0.2469482421875, 0.552490234375, 0.8580322265625, 1.16357421875, 1.4691162109375, 1.774658203125, 2.0802001953125, 2.3857421875, 2.6912841796875, 2.996826171875, 3.3023681640625, 3.60791015625, 3.9134521484375, 4.218994140625, 4.5245361328125, 4.830078125, 5.1356201171875, 5.441162109375, 5.7467041015625, 6.05224609375, 6.3577880859375, 6.663330078125, 6.9688720703125, 7.2744140625, 7.5799560546875, 7.885498046875, 8.1910400390625, 8.49658203125, 8.8021240234375, 9.107666015625, 9.4132080078125, 9.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 3.0, 8.0, 15.0, 8.0, 19.0, 22.0, 19.0, 31.0, 33.0, 52.0, 66.0, 57.0, 80.0, 72.0, 62.0, 86.0, 62.0, 69.0, 57.0, 36.0, 43.0, 23.0, 19.0, 17.0, 11.0, 7.0, 3.0, 3.0, 4.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.923828125, -3.800445556640625, -3.67706298828125, -3.553680419921875, -3.4302978515625, -3.306915283203125, -3.18353271484375, -3.060150146484375, -2.936767578125, -2.813385009765625, -2.69000244140625, -2.566619873046875, -2.4432373046875, -2.319854736328125, -2.19647216796875, -2.073089599609375, -1.94970703125, -1.826324462890625, -1.70294189453125, -1.579559326171875, -1.4561767578125, -1.332794189453125, -1.20941162109375, -1.086029052734375, -0.962646484375, -0.839263916015625, -0.71588134765625, -0.592498779296875, -0.4691162109375, -0.345733642578125, -0.22235107421875, -0.098968505859375, 0.0244140625, 0.147796630859375, 0.27117919921875, 0.394561767578125, 0.5179443359375, 0.641326904296875, 0.76470947265625, 0.888092041015625, 1.011474609375, 1.134857177734375, 1.25823974609375, 1.381622314453125, 1.5050048828125, 1.628387451171875, 1.75177001953125, 1.875152587890625, 1.99853515625, 2.121917724609375, 2.24530029296875, 2.368682861328125, 2.4920654296875, 2.615447998046875, 2.73883056640625, 2.862213134765625, 2.985595703125, 3.108978271484375, 3.23236083984375, 3.355743408203125, 3.4791259765625, 3.602508544921875, 3.72589111328125, 3.849273681640625, 3.97265625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 8.0, 6.0, 7.0, 8.0, 5.0, 13.0, 18.0, 24.0, 17.0, 28.0, 30.0, 34.0, 58.0, 66.0, 70.0, 68.0, 74.0, 68.0, 75.0, 46.0, 43.0, 47.0, 38.0, 33.0, 30.0, 20.0, 14.0, 15.0, 7.0, 7.0, 3.0, 5.0, 2.0, 0.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.53426742553711, -30.496740341186523, -29.459213256835938, -28.421688079833984, -27.3841609954834, -26.346633911132812, -25.309106826782227, -24.27157974243164, -23.234054565429688, -22.1965274810791, -21.159000396728516, -20.121475219726562, -19.083948135375977, -18.04642105102539, -17.008893966674805, -15.971366882324219, -14.933839797973633, -13.896312713623047, -12.858786582946777, -11.821259498596191, -10.783733367919922, -9.746206283569336, -8.70867919921875, -7.671152591705322, -6.6336259841918945, -5.596099376678467, -4.558572769165039, -3.521045684814453, -2.4835190773010254, -1.4459924697875977, -0.4084653854370117, 0.629061222076416, 1.6665878295898438, 2.7041144371032715, 3.7416412830352783, 4.779168128967285, 5.816694736480713, 6.854221343994141, 7.891748428344727, 8.929275512695312, 9.966801643371582, 11.004328727722168, 12.041854858398438, 13.079381942749023, 14.11690902709961, 15.154435157775879, 16.19196319580078, 17.229488372802734, 18.26701545715332, 19.304542541503906, 20.342069625854492, 21.379596710205078, 22.41712188720703, 23.454648971557617, 24.492176055908203, 25.52970314025879, 26.567230224609375, 27.60475730895996, 28.642284393310547, 29.6798095703125, 30.717336654663086, 31.754863739013672, 32.792388916015625, 33.829917907714844, 34.8674430847168]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 9.0, 6.0, 10.0, 17.0, 12.0, 19.0, 22.0, 17.0, 22.0, 24.0, 31.0, 34.0, 32.0, 48.0, 36.0, 48.0, 45.0, 47.0, 43.0, 50.0, 37.0, 25.0, 54.0, 40.0, 29.0, 33.0, 34.0, 30.0, 23.0, 21.0, 19.0, 20.0, 13.0, 8.0, 6.0, 6.0, 1.0, 6.0, 8.0, 5.0, 5.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.265186309814453, -25.455320358276367, -24.64545249938965, -23.835586547851562, -23.025718688964844, -22.215852737426758, -21.405986785888672, -20.596118927001953, -19.786251068115234, -18.97638511657715, -18.16651725769043, -17.356651306152344, -16.546783447265625, -15.736917495727539, -14.927050590515137, -14.117183685302734, -13.307317733764648, -12.497450828552246, -11.687583923339844, -10.877717971801758, -10.067850112915039, -9.257984161376953, -8.44811725616455, -7.638250350952148, -6.828383445739746, -6.018516540527344, -5.208649635314941, -4.398783206939697, -3.588916301727295, -2.7790493965148926, -1.9691829681396484, -1.159316062927246, -0.34944725036621094, 0.46041953563690186, 1.2702863216400146, 2.080152988433838, 2.8900198936462402, 3.6998867988586426, 4.509753227233887, 5.319620132446289, 6.129487037658691, 6.939353942871094, 7.749220848083496, 8.559087753295898, 9.368953704833984, 10.178821563720703, 10.988687515258789, 11.798554420471191, 12.608421325683594, 13.418288230895996, 14.228155136108398, 15.038021087646484, 15.847888946533203, 16.65775489807129, 17.467620849609375, 18.277488708496094, 19.087356567382812, 19.8972225189209, 20.707090377807617, 21.516956329345703, 22.326824188232422, 23.136690139770508, 23.946556091308594, 24.756423950195312, 25.5662899017334]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 8.0, 11.0, 6.0, 14.0, 17.0, 46.0, 75.0, 82.0, 123.0, 155.0, 265.0, 383.0, 542.0, 783.0, 1200.0, 1807.0, 2804.0, 4257.0, 6522.0, 10252.0, 16132.0, 25962.0, 42001.0, 66221.0, 99806.0, 137473.0, 159742.0, 148430.0, 114410.0, 76260.0, 48794.0, 30474.0, 19125.0, 12002.0, 7686.0, 4975.0, 3219.0, 2188.0, 1404.0, 950.0, 614.0, 445.0, 281.0, 184.0, 139.0, 95.0, 62.0, 45.0, 30.0, 19.0, 17.0, 6.0, 12.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.28125, -12.8482666015625, -12.415283203125, -11.9822998046875, -11.54931640625, -11.1163330078125, -10.683349609375, -10.2503662109375, -9.8173828125, -9.3843994140625, -8.951416015625, -8.5184326171875, -8.08544921875, -7.6524658203125, -7.219482421875, -6.7864990234375, -6.353515625, -5.9205322265625, -5.487548828125, -5.0545654296875, -4.62158203125, -4.1885986328125, -3.755615234375, -3.3226318359375, -2.8896484375, -2.4566650390625, -2.023681640625, -1.5906982421875, -1.15771484375, -0.7247314453125, -0.291748046875, 0.1412353515625, 0.57421875, 1.0072021484375, 1.440185546875, 1.8731689453125, 2.30615234375, 2.7391357421875, 3.172119140625, 3.6051025390625, 4.0380859375, 4.4710693359375, 4.904052734375, 5.3370361328125, 5.77001953125, 6.2030029296875, 6.635986328125, 7.0689697265625, 7.501953125, 7.9349365234375, 8.367919921875, 8.8009033203125, 9.23388671875, 9.6668701171875, 10.099853515625, 10.5328369140625, 10.9658203125, 11.3988037109375, 11.831787109375, 12.2647705078125, 12.69775390625, 13.1307373046875, 13.563720703125, 13.9967041015625, 14.4296875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 1.0, 11.0, 9.0, 18.0, 12.0, 24.0, 14.0, 20.0, 10.0, 25.0, 31.0, 37.0, 32.0, 37.0, 32.0, 47.0, 51.0, 34.0, 42.0, 45.0, 53.0, 35.0, 38.0, 51.0, 39.0, 23.0, 39.0, 34.0, 25.0, 16.0, 23.0, 19.0, 16.0, 10.0, 10.0, 4.0, 0.0, 4.0, 0.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.609375, -25.796142578125, -24.98291015625, -24.169677734375, -23.3564453125, -22.543212890625, -21.72998046875, -20.916748046875, -20.103515625, -19.290283203125, -18.47705078125, -17.663818359375, -16.8505859375, -16.037353515625, -15.22412109375, -14.410888671875, -13.59765625, -12.784423828125, -11.97119140625, -11.157958984375, -10.3447265625, -9.531494140625, -8.71826171875, -7.905029296875, -7.091796875, -6.278564453125, -5.46533203125, -4.652099609375, -3.8388671875, -3.025634765625, -2.21240234375, -1.399169921875, -0.5859375, 0.227294921875, 1.04052734375, 1.853759765625, 2.6669921875, 3.480224609375, 4.29345703125, 5.106689453125, 5.919921875, 6.733154296875, 7.54638671875, 8.359619140625, 9.1728515625, 9.986083984375, 10.79931640625, 11.612548828125, 12.42578125, 13.239013671875, 14.05224609375, 14.865478515625, 15.6787109375, 16.491943359375, 17.30517578125, 18.118408203125, 18.931640625, 19.744873046875, 20.55810546875, 21.371337890625, 22.1845703125, 22.997802734375, 23.81103515625, 24.624267578125, 25.4375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 15.0, 17.0, 32.0, 38.0, 65.0, 85.0, 162.0, 210.0, 321.0, 452.0, 736.0, 1086.0, 1661.0, 2532.0, 3972.0, 6493.0, 10435.0, 17102.0, 30064.0, 52919.0, 94874.0, 169773.0, 233563.0, 181432.0, 102643.0, 57358.0, 31881.0, 18644.0, 11256.0, 6724.0, 4260.0, 2658.0, 1699.0, 1129.0, 760.0, 532.0, 307.0, 224.0, 119.0, 116.0, 74.0, 38.0, 24.0, 24.0, 12.0, 8.0, 12.0, 5.0, 0.0, 4.0, 1.0, 1.0], "bins": [-36.53125, -35.474365234375, -34.41748046875, -33.360595703125, -32.3037109375, -31.246826171875, -30.18994140625, -29.133056640625, -28.076171875, -27.019287109375, -25.96240234375, -24.905517578125, -23.8486328125, -22.791748046875, -21.73486328125, -20.677978515625, -19.62109375, -18.564208984375, -17.50732421875, -16.450439453125, -15.3935546875, -14.336669921875, -13.27978515625, -12.222900390625, -11.166015625, -10.109130859375, -9.05224609375, -7.995361328125, -6.9384765625, -5.881591796875, -4.82470703125, -3.767822265625, -2.7109375, -1.654052734375, -0.59716796875, 0.459716796875, 1.5166015625, 2.573486328125, 3.63037109375, 4.687255859375, 5.744140625, 6.801025390625, 7.85791015625, 8.914794921875, 9.9716796875, 11.028564453125, 12.08544921875, 13.142333984375, 14.19921875, 15.256103515625, 16.31298828125, 17.369873046875, 18.4267578125, 19.483642578125, 20.54052734375, 21.597412109375, 22.654296875, 23.711181640625, 24.76806640625, 25.824951171875, 26.8818359375, 27.938720703125, 28.99560546875, 30.052490234375, 31.109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 5.0, 9.0, 5.0, 12.0, 7.0, 12.0, 10.0, 14.0, 20.0, 27.0, 20.0, 28.0, 29.0, 28.0, 28.0, 33.0, 34.0, 40.0, 45.0, 40.0, 49.0, 44.0, 36.0, 28.0, 33.0, 36.0, 35.0, 23.0, 30.0, 36.0, 18.0, 31.0, 27.0, 24.0, 15.0, 20.0, 13.0, 14.0, 11.0, 4.0, 9.0, 8.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.8125, -15.275146484375, -14.73779296875, -14.200439453125, -13.6630859375, -13.125732421875, -12.58837890625, -12.051025390625, -11.513671875, -10.976318359375, -10.43896484375, -9.901611328125, -9.3642578125, -8.826904296875, -8.28955078125, -7.752197265625, -7.21484375, -6.677490234375, -6.14013671875, -5.602783203125, -5.0654296875, -4.528076171875, -3.99072265625, -3.453369140625, -2.916015625, -2.378662109375, -1.84130859375, -1.303955078125, -0.7666015625, -0.229248046875, 0.30810546875, 0.845458984375, 1.3828125, 1.920166015625, 2.45751953125, 2.994873046875, 3.5322265625, 4.069580078125, 4.60693359375, 5.144287109375, 5.681640625, 6.218994140625, 6.75634765625, 7.293701171875, 7.8310546875, 8.368408203125, 8.90576171875, 9.443115234375, 9.98046875, 10.517822265625, 11.05517578125, 11.592529296875, 12.1298828125, 12.667236328125, 13.20458984375, 13.741943359375, 14.279296875, 14.816650390625, 15.35400390625, 15.891357421875, 16.4287109375, 16.966064453125, 17.50341796875, 18.040771484375, 18.578125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 13.0, 13.0, 16.0, 28.0, 32.0, 48.0, 67.0, 95.0, 137.0, 163.0, 229.0, 362.0, 514.0, 688.0, 1064.0, 1703.0, 2686.0, 4555.0, 8108.0, 14859.0, 28900.0, 57057.0, 114363.0, 202018.0, 242986.0, 174850.0, 93367.0, 46312.0, 23369.0, 12244.0, 6769.0, 3881.0, 2431.0, 1460.0, 992.0, 647.0, 466.0, 314.0, 213.0, 162.0, 106.0, 89.0, 56.0, 27.0, 31.0, 19.0, 12.0, 13.0, 5.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.3515625, -13.8453369140625, -13.339111328125, -12.8328857421875, -12.32666015625, -11.8204345703125, -11.314208984375, -10.8079833984375, -10.3017578125, -9.7955322265625, -9.289306640625, -8.7830810546875, -8.27685546875, -7.7706298828125, -7.264404296875, -6.7581787109375, -6.251953125, -5.7457275390625, -5.239501953125, -4.7332763671875, -4.22705078125, -3.7208251953125, -3.214599609375, -2.7083740234375, -2.2021484375, -1.6959228515625, -1.189697265625, -0.6834716796875, -0.17724609375, 0.3289794921875, 0.835205078125, 1.3414306640625, 1.84765625, 2.3538818359375, 2.860107421875, 3.3663330078125, 3.87255859375, 4.3787841796875, 4.885009765625, 5.3912353515625, 5.8974609375, 6.4036865234375, 6.909912109375, 7.4161376953125, 7.92236328125, 8.4285888671875, 8.934814453125, 9.4410400390625, 9.947265625, 10.4534912109375, 10.959716796875, 11.4659423828125, 11.97216796875, 12.4783935546875, 12.984619140625, 13.4908447265625, 13.9970703125, 14.5032958984375, 15.009521484375, 15.5157470703125, 16.02197265625, 16.5281982421875, 17.034423828125, 17.5406494140625, 18.046875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 7.0, 6.0, 7.0, 5.0, 17.0, 25.0, 24.0, 14.0, 25.0, 38.0, 59.0, 62.0, 54.0, 72.0, 78.0, 65.0, 71.0, 57.0, 54.0, 51.0, 37.0, 37.0, 31.0, 15.0, 18.0, 18.0, 15.0, 9.0, 8.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0013484954833984375, -0.001299530267715454, -0.0012505650520324707, -0.0012015998363494873, -0.001152634620666504, -0.0011036694049835205, -0.0010547041893005371, -0.0010057389736175537, -0.0009567737579345703, -0.0009078085422515869, -0.0008588433265686035, -0.0008098781108856201, -0.0007609128952026367, -0.0007119476795196533, -0.0006629824638366699, -0.0006140172481536865, -0.0005650520324707031, -0.0005160868167877197, -0.00046712160110473633, -0.00041815638542175293, -0.00036919116973876953, -0.00032022595405578613, -0.00027126073837280273, -0.00022229552268981934, -0.00017333030700683594, -0.00012436509132385254, -7.539987564086914e-05, -2.6434659957885742e-05, 2.2530555725097656e-05, 7.149577140808105e-05, 0.00012046098709106445, 0.00016942620277404785, 0.00021839141845703125, 0.00026735663414001465, 0.00031632184982299805, 0.00036528706550598145, 0.00041425228118896484, 0.00046321749687194824, 0.0005121827125549316, 0.000561147928237915, 0.0006101131439208984, 0.0006590783596038818, 0.0007080435752868652, 0.0007570087909698486, 0.000805974006652832, 0.0008549392223358154, 0.0009039044380187988, 0.0009528696537017822, 0.0010018348693847656, 0.001050800085067749, 0.0010997653007507324, 0.0011487305164337158, 0.0011976957321166992, 0.0012466609477996826, 0.001295626163482666, 0.0013445913791656494, 0.0013935565948486328, 0.0014425218105316162, 0.0014914870262145996, 0.001540452241897583, 0.0015894174575805664, 0.0016383826732635498, 0.0016873478889465332, 0.0017363131046295166, 0.0017852783203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 13.0, 12.0, 15.0, 23.0, 35.0, 59.0, 45.0, 86.0, 96.0, 121.0, 170.0, 239.0, 327.0, 506.0, 718.0, 1110.0, 1778.0, 3141.0, 5592.0, 10346.0, 20496.0, 44722.0, 99143.0, 200609.0, 277222.0, 197100.0, 96468.0, 43878.0, 20377.0, 10379.0, 5390.0, 3022.0, 1774.0, 1159.0, 713.0, 421.0, 313.0, 256.0, 156.0, 113.0, 105.0, 78.0, 59.0, 36.0, 46.0, 22.0, 16.0, 10.0, 16.0, 10.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.6416015625, -16.095703125, -15.5498046875, -15.00390625, -14.4580078125, -13.912109375, -13.3662109375, -12.8203125, -12.2744140625, -11.728515625, -11.1826171875, -10.63671875, -10.0908203125, -9.544921875, -8.9990234375, -8.453125, -7.9072265625, -7.361328125, -6.8154296875, -6.26953125, -5.7236328125, -5.177734375, -4.6318359375, -4.0859375, -3.5400390625, -2.994140625, -2.4482421875, -1.90234375, -1.3564453125, -0.810546875, -0.2646484375, 0.28125, 0.8271484375, 1.373046875, 1.9189453125, 2.46484375, 3.0107421875, 3.556640625, 4.1025390625, 4.6484375, 5.1943359375, 5.740234375, 6.2861328125, 6.83203125, 7.3779296875, 7.923828125, 8.4697265625, 9.015625, 9.5615234375, 10.107421875, 10.6533203125, 11.19921875, 11.7451171875, 12.291015625, 12.8369140625, 13.3828125, 13.9287109375, 14.474609375, 15.0205078125, 15.56640625, 16.1123046875, 16.658203125, 17.2041015625, 17.75]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 9.0, 15.0, 19.0, 16.0, 23.0, 42.0, 49.0, 51.0, 66.0, 68.0, 101.0, 85.0, 83.0, 60.0, 75.0, 58.0, 48.0, 32.0, 27.0, 19.0, 12.0, 11.0, 10.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.65460205078125, -4.5006103515625, -4.34661865234375, -4.192626953125, -4.03863525390625, -3.8846435546875, -3.73065185546875, -3.57666015625, -3.42266845703125, -3.2686767578125, -3.11468505859375, -2.960693359375, -2.80670166015625, -2.6527099609375, -2.49871826171875, -2.3447265625, -2.19073486328125, -2.0367431640625, -1.88275146484375, -1.728759765625, -1.57476806640625, -1.4207763671875, -1.26678466796875, -1.11279296875, -0.95880126953125, -0.8048095703125, -0.65081787109375, -0.496826171875, -0.34283447265625, -0.1888427734375, -0.03485107421875, 0.119140625, 0.27313232421875, 0.4271240234375, 0.58111572265625, 0.735107421875, 0.88909912109375, 1.0430908203125, 1.19708251953125, 1.35107421875, 1.50506591796875, 1.6590576171875, 1.81304931640625, 1.967041015625, 2.12103271484375, 2.2750244140625, 2.42901611328125, 2.5830078125, 2.73699951171875, 2.8909912109375, 3.04498291015625, 3.198974609375, 3.35296630859375, 3.5069580078125, 3.66094970703125, 3.81494140625, 3.96893310546875, 4.1229248046875, 4.27691650390625, 4.430908203125, 4.58489990234375, 4.7388916015625, 4.89288330078125, 5.046875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 6.0, 9.0, 1.0, 8.0, 5.0, 9.0, 22.0, 26.0, 30.0, 34.0, 44.0, 50.0, 58.0, 72.0, 66.0, 75.0, 79.0, 71.0, 46.0, 50.0, 52.0, 36.0, 29.0, 30.0, 15.0, 18.0, 14.0, 12.0, 6.0, 7.0, 5.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.58736038208008, -31.37037467956543, -30.15338897705078, -28.936403274536133, -27.719417572021484, -26.50243377685547, -25.28544807434082, -24.068462371826172, -22.851476669311523, -21.634490966796875, -20.417505264282227, -19.200519561767578, -17.983535766601562, -16.76654815673828, -15.549564361572266, -14.332578659057617, -13.115592956542969, -11.89860725402832, -10.681621551513672, -9.46463680267334, -8.247651100158691, -7.030665397644043, -5.813680171966553, -4.5966949462890625, -3.379709243774414, -2.1627237796783447, -0.9457383155822754, 0.27124714851379395, 1.4882326126098633, 2.7052183151245117, 3.922203540802002, 5.139188766479492, 6.356174468994141, 7.573160171508789, 8.790145874023438, 10.00713062286377, 11.224116325378418, 12.441102027893066, 13.658086776733398, 14.875072479248047, 16.092058181762695, 17.309043884277344, 18.526029586791992, 19.74301528930664, 20.959999084472656, 22.176986694335938, 23.393970489501953, 24.6109561920166, 25.82794189453125, 27.0449275970459, 28.261913299560547, 29.478899002075195, 30.695884704589844, 31.91286849975586, 33.12985610961914, 34.346839904785156, 35.56382751464844, 36.78081130981445, 37.997798919677734, 39.21478271484375, 40.43177032470703, 41.64875411987305, 42.86574172973633, 44.082725524902344, 45.29970932006836]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 6.0, 6.0, 12.0, 13.0, 17.0, 19.0, 25.0, 31.0, 24.0, 35.0, 38.0, 29.0, 35.0, 30.0, 40.0, 49.0, 48.0, 46.0, 46.0, 46.0, 39.0, 45.0, 30.0, 30.0, 30.0, 41.0, 35.0, 28.0, 21.0, 21.0, 16.0, 6.0, 9.0, 14.0, 8.0, 5.0, 2.0, 5.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.42322540283203, -31.32977867126465, -30.236331939697266, -29.142885208129883, -28.0494384765625, -26.955991744995117, -25.862545013427734, -24.76909828186035, -23.67565155029297, -22.582204818725586, -21.488758087158203, -20.39531135559082, -19.301864624023438, -18.208417892456055, -17.114971160888672, -16.02152442932129, -14.928077697753906, -13.834630966186523, -12.74118423461914, -11.647737503051758, -10.554290771484375, -9.460844039916992, -8.36739730834961, -7.273950576782227, -6.180503845214844, -5.087057113647461, -3.993610382080078, -2.9001636505126953, -1.8067169189453125, -0.7132701873779297, 0.3801765441894531, 1.473623275756836, 2.567066192626953, 3.660512924194336, 4.753959655761719, 5.847406387329102, 6.940853118896484, 8.034299850463867, 9.12774658203125, 10.221193313598633, 11.314640045166016, 12.408086776733398, 13.501533508300781, 14.594980239868164, 15.688426971435547, 16.78187370300293, 17.875320434570312, 18.968767166137695, 20.062213897705078, 21.15566062927246, 22.249107360839844, 23.342554092407227, 24.43600082397461, 25.529447555541992, 26.622894287109375, 27.716341018676758, 28.80978775024414, 29.903234481811523, 30.996681213378906, 32.090126037597656, 33.18357467651367, 34.27702331542969, 35.37046813964844, 36.46391296386719, 37.5573616027832]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 6.0, 9.0, 4.0, 19.0, 12.0, 17.0, 23.0, 37.0, 36.0, 47.0, 72.0, 71.0, 100.0, 101.0, 127.0, 166.0, 187.0, 262.0, 372.0, 714.0, 1443.0, 3717.0, 493522.0, 16476.0, 3085.0, 1301.0, 646.0, 382.0, 273.0, 211.0, 161.0, 138.0, 104.0, 93.0, 66.0, 53.0, 56.0, 32.0, 27.0, 22.0, 13.0, 10.0, 10.0, 11.0, 3.0, 5.0, 6.0, 2.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-404.01214599609375, -390.50897216796875, -377.00579833984375, -363.5026550292969, -349.9994812011719, -336.4963073730469, -322.9931640625, -309.489990234375, -295.98681640625, -282.483642578125, -268.98046875, -255.47732543945312, -241.97415161132812, -228.47097778320312, -214.9678192138672, -201.46466064453125, -187.96148681640625, -174.45831298828125, -160.9551544189453, -147.45199584960938, -133.94882202148438, -120.4456558227539, -106.94248962402344, -93.43932342529297, -79.9361572265625, -66.43299102783203, -52.92982482910156, -39.426658630371094, -25.923492431640625, -12.420326232910156, 1.0828399658203125, 14.586006164550781, 28.089141845703125, 41.592308044433594, 55.09547424316406, 68.59864044189453, 82.101806640625, 95.60497283935547, 109.10813903808594, 122.6113052368164, 136.11447143554688, 149.61764526367188, 163.1208038330078, 176.62396240234375, 190.12713623046875, 203.63031005859375, 217.1334686279297, 230.63662719726562, 244.13980102539062, 257.6429748535156, 271.1461181640625, 284.6492919921875, 298.1524658203125, 311.6556396484375, 325.1588134765625, 338.6619567871094, 352.1651306152344, 365.6683044433594, 379.17144775390625, 392.67462158203125, 406.17779541015625, 419.68096923828125, 433.18414306640625, 446.6872863769531, 460.1904602050781]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 5.0, 8.0, 5.0, 12.0, 18.0, 10.0, 19.0, 24.0, 33.0, 28.0, 34.0, 29.0, 34.0, 38.0, 33.0, 37.0, 45.0, 56.0, 1067.0, 51.0, 49.0, 33.0, 39.0, 42.0, 24.0, 29.0, 43.0, 32.0, 32.0, 18.0, 22.0, 14.0, 6.0, 10.0, 12.0, 10.0, 2.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1043.31787109375, -1008.0817260742188, -972.8455810546875, -937.6094360351562, -902.373291015625, -867.1371459960938, -831.9010009765625, -796.664794921875, -761.4287109375, -726.1925659179688, -690.9564208984375, -655.7202758789062, -620.484130859375, -585.2479858398438, -550.0118408203125, -514.775634765625, -479.53948974609375, -444.3033447265625, -409.06719970703125, -373.8310546875, -338.59490966796875, -303.3587646484375, -268.1225891113281, -232.88644409179688, -197.65029907226562, -162.41415405273438, -127.1780014038086, -91.94184875488281, -56.70570373535156, -21.469558715820312, 13.7666015625, 49.00274658203125, 84.2388916015625, 119.47503662109375, 154.711181640625, 189.9473419189453, 225.18348693847656, 260.41961669921875, 295.6557922363281, 330.8919372558594, 366.1280822753906, 401.3642272949219, 436.6003723144531, 471.8365478515625, 507.07269287109375, 542.308837890625, 577.5449829101562, 612.7811279296875, 648.0172729492188, 683.25341796875, 718.4895629882812, 753.7257080078125, 788.9618530273438, 824.197998046875, 859.4342041015625, 894.6702880859375, 929.906494140625, 965.1426391601562, 1000.3787841796875, 1035.614990234375, 1070.85107421875, 1106.0872802734375, 1141.3233642578125, 1176.5595703125, 1211.795654296875]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 7.0, 8.0, 7.0, 8.0, 12.0, 17.0, 18.0, 19.0, 42.0, 42.0, 64.0, 96.0, 113.0, 185.0, 243.0, 339.0, 493.0, 678.0, 884.0, 1184.0, 1562.0, 2085.0, 3210.0, 9003.0, 31201316.0, 15442.0, 8018.0, 6085.0, 1687.0, 635.0, 489.0, 165.0, 96.0, 62.0, 50.0, 41.0, 35.0, 17.0, 16.0, 8.0, 6.0, 13.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-1371.5205078125, -1338.51171875, -1305.5029296875, -1272.4942626953125, -1239.4854736328125, -1206.4766845703125, -1173.4678955078125, -1140.4591064453125, -1107.450439453125, -1074.441650390625, -1041.432861328125, -1008.4241333007812, -975.4154052734375, -942.4066162109375, -909.3978271484375, -876.3890380859375, -843.3802490234375, -810.3714599609375, -777.3627319335938, -744.3539428710938, -711.34521484375, -678.33642578125, -645.32763671875, -612.31884765625, -579.3101196289062, -546.3013305664062, -513.2926025390625, -480.2838134765625, -447.2750549316406, -414.26629638671875, -381.25750732421875, -348.2487487792969, -315.239990234375, -282.2312316894531, -249.2224578857422, -216.21368408203125, -183.20492553710938, -150.1961669921875, -117.18739318847656, -84.17861938476562, -51.16986083984375, -18.161094665527344, 14.847671508789062, 47.85643768310547, 80.86520385742188, 113.87396240234375, 146.8827362060547, 179.89151000976562, 212.9002685546875, 245.90902709960938, 278.91778564453125, 311.92657470703125, 344.9353332519531, 377.944091796875, 410.952880859375, 443.9616394042969, 476.97039794921875, 509.9791564941406, 542.9879150390625, 575.9967041015625, 609.0054931640625, 642.0142211914062, 675.0230102539062, 708.03173828125, 741.04052734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 13.0, 9.0, 7.0, 20.0, 31.0, 29.0, 75.0, 109.0, 234.0, 426.0, 772.0, 1685.0, 3703.0, 8947.0, 23004.0, 63762.0, 200705.0, 726139.0, 3053758.0, 1639213.0, 387557.0, 115909.0, 39638.0, 14573.0, 6070.0, 2545.0, 1189.0, 550.0, 278.0, 199.0, 101.0, 69.0, 41.0, 16.0, 14.0, 15.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.1875, -86.6865234375, -83.185546875, -79.6845703125, -76.18359375, -72.6826171875, -69.181640625, -65.6806640625, -62.1796875, -58.6787109375, -55.177734375, -51.6767578125, -48.17578125, -44.6748046875, -41.173828125, -37.6728515625, -34.171875, -30.6708984375, -27.169921875, -23.6689453125, -20.16796875, -16.6669921875, -13.166015625, -9.6650390625, -6.1640625, -2.6630859375, 0.837890625, 4.3388671875, 7.83984375, 11.3408203125, 14.841796875, 18.3427734375, 21.84375, 25.3447265625, 28.845703125, 32.3466796875, 35.84765625, 39.3486328125, 42.849609375, 46.3505859375, 49.8515625, 53.3525390625, 56.853515625, 60.3544921875, 63.85546875, 67.3564453125, 70.857421875, 74.3583984375, 77.859375, 81.3603515625, 84.861328125, 88.3623046875, 91.86328125, 95.3642578125, 98.865234375, 102.3662109375, 105.8671875, 109.3681640625, 112.869140625, 116.3701171875, 119.87109375, 123.3720703125, 126.873046875, 130.3740234375, 133.875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 2.0, 4.0, 5.0, 6.0, 6.0, 4.0, 7.0, 8.0, 15.0, 24.0, 29.0, 20.0, 35.0, 38.0, 56.0, 66.0, 92.0, 95.0, 132.0, 176.0, 191.0, 189.0, 148.0, 132.0, 120.0, 101.0, 62.0, 46.0, 51.0, 31.0, 23.0, 28.0, 19.0, 15.0, 13.0, 6.0, 9.0, 3.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.171875, -23.369873046875, -22.56787109375, -21.765869140625, -20.9638671875, -20.161865234375, -19.35986328125, -18.557861328125, -17.755859375, -16.953857421875, -16.15185546875, -15.349853515625, -14.5478515625, -13.745849609375, -12.94384765625, -12.141845703125, -11.33984375, -10.537841796875, -9.73583984375, -8.933837890625, -8.1318359375, -7.329833984375, -6.52783203125, -5.725830078125, -4.923828125, -4.121826171875, -3.31982421875, -2.517822265625, -1.7158203125, -0.913818359375, -0.11181640625, 0.690185546875, 1.4921875, 2.294189453125, 3.09619140625, 3.898193359375, 4.7001953125, 5.502197265625, 6.30419921875, 7.106201171875, 7.908203125, 8.710205078125, 9.51220703125, 10.314208984375, 11.1162109375, 11.918212890625, 12.72021484375, 13.522216796875, 14.32421875, 15.126220703125, 15.92822265625, 16.730224609375, 17.5322265625, 18.334228515625, 19.13623046875, 19.938232421875, 20.740234375, 21.542236328125, 22.34423828125, 23.146240234375, 23.9482421875, 24.750244140625, 25.55224609375, 26.354248046875, 27.15625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 7.0, 8.0, 6.0, 12.0, 24.0, 44.0, 52.0, 78.0, 138.0, 191.0, 320.0, 464.0, 753.0, 1340.0, 2004.0, 3222.0, 5019.0, 8261.0, 13129.0, 21224.0, 34615.0, 56763.0, 92063.0, 149966.0, 248307.0, 432166.0, 867601.0, 1720361.0, 1244374.0, 582665.0, 318611.0, 188738.0, 114555.0, 70511.0, 43978.0, 26800.0, 16232.0, 10026.0, 6263.0, 3926.0, 2403.0, 1514.0, 985.0, 642.0, 394.0, 257.0, 164.0, 93.0, 73.0, 43.0, 24.0, 17.0, 5.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.296875, -24.4736328125, -23.650390625, -22.8271484375, -22.00390625, -21.1806640625, -20.357421875, -19.5341796875, -18.7109375, -17.8876953125, -17.064453125, -16.2412109375, -15.41796875, -14.5947265625, -13.771484375, -12.9482421875, -12.125, -11.3017578125, -10.478515625, -9.6552734375, -8.83203125, -8.0087890625, -7.185546875, -6.3623046875, -5.5390625, -4.7158203125, -3.892578125, -3.0693359375, -2.24609375, -1.4228515625, -0.599609375, 0.2236328125, 1.046875, 1.8701171875, 2.693359375, 3.5166015625, 4.33984375, 5.1630859375, 5.986328125, 6.8095703125, 7.6328125, 8.4560546875, 9.279296875, 10.1025390625, 10.92578125, 11.7490234375, 12.572265625, 13.3955078125, 14.21875, 15.0419921875, 15.865234375, 16.6884765625, 17.51171875, 18.3349609375, 19.158203125, 19.9814453125, 20.8046875, 21.6279296875, 22.451171875, 23.2744140625, 24.09765625, 24.9208984375, 25.744140625, 26.5673828125, 27.390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 3.0, 7.0, 3.0, 5.0, 11.0, 7.0, 5.0, 10.0, 15.0, 24.0, 19.0, 31.0, 31.0, 30.0, 61.0, 62.0, 80.0, 96.0, 153.0, 201.0, 213.0, 223.0, 159.0, 119.0, 95.0, 68.0, 49.0, 43.0, 34.0, 32.0, 14.0, 20.0, 17.0, 18.0, 18.0, 10.0, 11.0, 6.0, 6.0, 7.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.484375, -30.496337890625, -29.50830078125, -28.520263671875, -27.5322265625, -26.544189453125, -25.55615234375, -24.568115234375, -23.580078125, -22.592041015625, -21.60400390625, -20.615966796875, -19.6279296875, -18.639892578125, -17.65185546875, -16.663818359375, -15.67578125, -14.687744140625, -13.69970703125, -12.711669921875, -11.7236328125, -10.735595703125, -9.74755859375, -8.759521484375, -7.771484375, -6.783447265625, -5.79541015625, -4.807373046875, -3.8193359375, -2.831298828125, -1.84326171875, -0.855224609375, 0.1328125, 1.120849609375, 2.10888671875, 3.096923828125, 4.0849609375, 5.072998046875, 6.06103515625, 7.049072265625, 8.037109375, 9.025146484375, 10.01318359375, 11.001220703125, 11.9892578125, 12.977294921875, 13.96533203125, 14.953369140625, 15.94140625, 16.929443359375, 17.91748046875, 18.905517578125, 19.8935546875, 20.881591796875, 21.86962890625, 22.857666015625, 23.845703125, 24.833740234375, 25.82177734375, 26.809814453125, 27.7978515625, 28.785888671875, 29.77392578125, 30.761962890625, 31.75]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 9.0, 19.0, 23.0, 31.0, 50.0, 90.0, 88.0, 160.0, 222.0, 412.0, 571.0, 964.0, 1767.0, 3330.0, 6068.0, 13239.0, 28929.0, 71104.0, 308014.0, 5654121.0, 120422.0, 43559.0, 19016.0, 9193.0, 4389.0, 2221.0, 1335.0, 852.0, 499.0, 270.0, 161.0, 95.0, 62.0, 44.0, 38.0, 22.0, 9.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-96.25, -92.841796875, -89.43359375, -86.025390625, -82.6171875, -79.208984375, -75.80078125, -72.392578125, -68.984375, -65.576171875, -62.16796875, -58.759765625, -55.3515625, -51.943359375, -48.53515625, -45.126953125, -41.71875, -38.310546875, -34.90234375, -31.494140625, -28.0859375, -24.677734375, -21.26953125, -17.861328125, -14.453125, -11.044921875, -7.63671875, -4.228515625, -0.8203125, 2.587890625, 5.99609375, 9.404296875, 12.8125, 16.220703125, 19.62890625, 23.037109375, 26.4453125, 29.853515625, 33.26171875, 36.669921875, 40.078125, 43.486328125, 46.89453125, 50.302734375, 53.7109375, 57.119140625, 60.52734375, 63.935546875, 67.34375, 70.751953125, 74.16015625, 77.568359375, 80.9765625, 84.384765625, 87.79296875, 91.201171875, 94.609375, 98.017578125, 101.42578125, 104.833984375, 108.2421875, 111.650390625, 115.05859375, 118.466796875, 121.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 16.0, 15.0, 20.0, 13.0, 19.0, 29.0, 40.0, 47.0, 52.0, 74.0, 126.0, 280.0, 480.0, 290.0, 137.0, 79.0, 59.0, 40.0, 43.0, 35.0, 21.0, 27.0, 12.0, 9.0, 18.0, 7.0, 8.0, 6.0, 4.0, 9.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.6875, -61.462890625, -59.23828125, -57.013671875, -54.7890625, -52.564453125, -50.33984375, -48.115234375, -45.890625, -43.666015625, -41.44140625, -39.216796875, -36.9921875, -34.767578125, -32.54296875, -30.318359375, -28.09375, -25.869140625, -23.64453125, -21.419921875, -19.1953125, -16.970703125, -14.74609375, -12.521484375, -10.296875, -8.072265625, -5.84765625, -3.623046875, -1.3984375, 0.826171875, 3.05078125, 5.275390625, 7.5, 9.724609375, 11.94921875, 14.173828125, 16.3984375, 18.623046875, 20.84765625, 23.072265625, 25.296875, 27.521484375, 29.74609375, 31.970703125, 34.1953125, 36.419921875, 38.64453125, 40.869140625, 43.09375, 45.318359375, 47.54296875, 49.767578125, 51.9921875, 54.216796875, 56.44140625, 58.666015625, 60.890625, 63.115234375, 65.33984375, 67.564453125, 69.7890625, 72.013671875, 74.23828125, 76.462890625, 78.6875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 7.0, 8.0, 5.0, 5.0, 9.0, 14.0, 21.0, 32.0, 25.0, 35.0, 47.0, 69.0, 118.0, 208.0, 113.0, 71.0, 47.0, 38.0, 22.0, 30.0, 17.0, 19.0, 8.0, 8.0, 9.0, 7.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2328.625, -2272.683349609375, -2216.741943359375, -2160.80029296875, -2104.858642578125, -2048.917236328125, -1992.9755859375, -1937.033935546875, -1881.0924072265625, -1825.15087890625, -1769.209228515625, -1713.2677001953125, -1657.326171875, -1601.384521484375, -1545.4429931640625, -1489.50146484375, -1433.559814453125, -1377.6182861328125, -1321.6766357421875, -1265.735107421875, -1209.7935791015625, -1153.8519287109375, -1097.910400390625, -1041.96875, -986.02734375, -930.0857543945312, -874.1442260742188, -818.20263671875, -762.2610473632812, -706.3194580078125, -650.3779296875, -594.4363403320312, -538.4947509765625, -482.5531921386719, -426.6116027832031, -370.6700439453125, -314.72845458984375, -258.7868957519531, -202.8453369140625, -146.90374755859375, -90.96218872070312, -35.0206184387207, 20.92095184326172, 76.86251831054688, 132.80409240722656, 188.74566650390625, 244.68722534179688, 300.6288146972656, 356.57037353515625, 412.5119323730469, 468.4535217285156, 524.3950805664062, 580.336669921875, 636.2781982421875, 692.2197875976562, 748.161376953125, 804.1029052734375, 860.0444946289062, 915.9860229492188, 971.9276123046875, 1027.869140625, 1083.810791015625, 1139.7523193359375, 1195.69384765625, 1251.635498046875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 4.0, 10.0, 8.0, 8.0, 8.0, 14.0, 10.0, 17.0, 13.0, 18.0, 17.0, 22.0, 19.0, 24.0, 32.0, 45.0, 85.0, 137.0, 135.0, 67.0, 45.0, 26.0, 33.0, 28.0, 16.0, 14.0, 19.0, 17.0, 7.0, 17.0, 13.0, 12.0, 11.0, 12.0, 4.0, 3.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1619.1690673828125, -1568.353759765625, -1517.53857421875, -1466.723388671875, -1415.9080810546875, -1365.0927734375, -1314.277587890625, -1263.46240234375, -1212.6470947265625, -1161.831787109375, -1111.0166015625, -1060.201416015625, -1009.3861083984375, -958.5708618164062, -907.755615234375, -856.9403686523438, -806.1251220703125, -755.3098754882812, -704.49462890625, -653.6793823242188, -602.8641357421875, -552.0488891601562, -501.233642578125, -450.41839599609375, -399.6031494140625, -348.78790283203125, -297.97265625, -247.15740966796875, -196.3421630859375, -145.52691650390625, -94.711669921875, -43.89642333984375, 6.9188232421875, 57.73406982421875, 108.54931640625, 159.36456298828125, 210.1798095703125, 260.99505615234375, 311.810302734375, 362.62554931640625, 413.4407958984375, 464.25604248046875, 515.0712890625, 565.8865356445312, 616.7017822265625, 667.5170288085938, 718.332275390625, 769.1475219726562, 819.9627685546875, 870.7780151367188, 921.59326171875, 972.4085083007812, 1023.2237548828125, 1074.0390625, 1124.854248046875, 1175.66943359375, 1226.4847412109375, 1277.300048828125, 1328.115234375, 1378.930419921875, 1429.7457275390625, 1480.56103515625, 1531.376220703125, 1582.19140625, 1633.0067138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 5.0, 7.0, 20.0, 25.0, 39.0, 34.0, 78.0, 78.0, 106.0, 177.0, 246.0, 354.0, 511.0, 707.0, 1070.0, 1549.0, 2381.0, 3852.0, 6641.0, 12263.0, 25934.0, 65140.0, 236079.0, 2929813.0, 701064.0, 123147.0, 41711.0, 18442.0, 9344.0, 5062.0, 3001.0, 1877.0, 1201.0, 811.0, 503.0, 355.0, 203.0, 137.0, 110.0, 69.0, 37.0, 29.0, 27.0, 7.0, 10.0, 6.0, 6.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-17.5625, -17.057373046875, -16.55224609375, -16.047119140625, -15.5419921875, -15.036865234375, -14.53173828125, -14.026611328125, -13.521484375, -13.016357421875, -12.51123046875, -12.006103515625, -11.5009765625, -10.995849609375, -10.49072265625, -9.985595703125, -9.48046875, -8.975341796875, -8.47021484375, -7.965087890625, -7.4599609375, -6.954833984375, -6.44970703125, -5.944580078125, -5.439453125, -4.934326171875, -4.42919921875, -3.924072265625, -3.4189453125, -2.913818359375, -2.40869140625, -1.903564453125, -1.3984375, -0.893310546875, -0.38818359375, 0.116943359375, 0.6220703125, 1.127197265625, 1.63232421875, 2.137451171875, 2.642578125, 3.147705078125, 3.65283203125, 4.157958984375, 4.6630859375, 5.168212890625, 5.67333984375, 6.178466796875, 6.68359375, 7.188720703125, 7.69384765625, 8.198974609375, 8.7041015625, 9.209228515625, 9.71435546875, 10.219482421875, 10.724609375, 11.229736328125, 11.73486328125, 12.239990234375, 12.7451171875, 13.250244140625, 13.75537109375, 14.260498046875, 14.765625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 5.0, 9.0, 10.0, 13.0, 16.0, 21.0, 41.0, 44.0, 61.0, 97.0, 150.0, 176.0, 97.0, 74.0, 57.0, 21.0, 28.0, 19.0, 11.0, 9.0, 5.0, 9.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8369140625, -1.7829742431640625, -1.729034423828125, -1.6750946044921875, -1.62115478515625, -1.5672149658203125, -1.513275146484375, -1.4593353271484375, -1.4053955078125, -1.3514556884765625, -1.297515869140625, -1.2435760498046875, -1.18963623046875, -1.1356964111328125, -1.081756591796875, -1.0278167724609375, -0.973876953125, -0.9199371337890625, -0.865997314453125, -0.8120574951171875, -0.75811767578125, -0.7041778564453125, -0.650238037109375, -0.5962982177734375, -0.5423583984375, -0.4884185791015625, -0.434478759765625, -0.3805389404296875, -0.32659912109375, -0.2726593017578125, -0.218719482421875, -0.1647796630859375, -0.11083984375, -0.0569000244140625, -0.002960205078125, 0.0509796142578125, 0.10491943359375, 0.1588592529296875, 0.212799072265625, 0.2667388916015625, 0.3206787109375, 0.3746185302734375, 0.428558349609375, 0.4824981689453125, 0.53643798828125, 0.5903778076171875, 0.644317626953125, 0.6982574462890625, 0.752197265625, 0.8061370849609375, 0.860076904296875, 0.9140167236328125, 0.96795654296875, 1.0218963623046875, 1.075836181640625, 1.1297760009765625, 1.1837158203125, 1.2376556396484375, 1.291595458984375, 1.3455352783203125, 1.39947509765625, 1.4534149169921875, 1.507354736328125, 1.5612945556640625, 1.615234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 14.0, 13.0, 26.0, 44.0, 48.0, 97.0, 138.0, 215.0, 343.0, 621.0, 1085.0, 2132.0, 4519.0, 10977.0, 31461.0, 105320.0, 438597.0, 2344403.0, 972435.0, 198463.0, 52880.0, 17168.0, 6699.0, 3009.0, 1451.0, 807.0, 482.0, 256.0, 199.0, 110.0, 72.0, 60.0, 35.0, 29.0, 19.0, 7.0, 15.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.328125, -17.784912109375, -17.24169921875, -16.698486328125, -16.1552734375, -15.612060546875, -15.06884765625, -14.525634765625, -13.982421875, -13.439208984375, -12.89599609375, -12.352783203125, -11.8095703125, -11.266357421875, -10.72314453125, -10.179931640625, -9.63671875, -9.093505859375, -8.55029296875, -8.007080078125, -7.4638671875, -6.920654296875, -6.37744140625, -5.834228515625, -5.291015625, -4.747802734375, -4.20458984375, -3.661376953125, -3.1181640625, -2.574951171875, -2.03173828125, -1.488525390625, -0.9453125, -0.402099609375, 0.14111328125, 0.684326171875, 1.2275390625, 1.770751953125, 2.31396484375, 2.857177734375, 3.400390625, 3.943603515625, 4.48681640625, 5.030029296875, 5.5732421875, 6.116455078125, 6.65966796875, 7.202880859375, 7.74609375, 8.289306640625, 8.83251953125, 9.375732421875, 9.9189453125, 10.462158203125, 11.00537109375, 11.548583984375, 12.091796875, 12.635009765625, 13.17822265625, 13.721435546875, 14.2646484375, 14.807861328125, 15.35107421875, 15.894287109375, 16.4375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 12.0, 10.0, 15.0, 15.0, 25.0, 28.0, 39.0, 45.0, 53.0, 78.0, 84.0, 103.0, 152.0, 201.0, 226.0, 350.0, 538.0, 614.0, 371.0, 257.0, 194.0, 141.0, 120.0, 85.0, 73.0, 51.0, 47.0, 37.0, 29.0, 18.0, 17.0, 8.0, 9.0, 6.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.9371337890625, -3.792236328125, -3.6473388671875, -3.50244140625, -3.3575439453125, -3.212646484375, -3.0677490234375, -2.9228515625, -2.7779541015625, -2.633056640625, -2.4881591796875, -2.34326171875, -2.1983642578125, -2.053466796875, -1.9085693359375, -1.763671875, -1.6187744140625, -1.473876953125, -1.3289794921875, -1.18408203125, -1.0391845703125, -0.894287109375, -0.7493896484375, -0.6044921875, -0.4595947265625, -0.314697265625, -0.1697998046875, -0.02490234375, 0.1199951171875, 0.264892578125, 0.4097900390625, 0.5546875, 0.6995849609375, 0.844482421875, 0.9893798828125, 1.13427734375, 1.2791748046875, 1.424072265625, 1.5689697265625, 1.7138671875, 1.8587646484375, 2.003662109375, 2.1485595703125, 2.29345703125, 2.4383544921875, 2.583251953125, 2.7281494140625, 2.873046875, 3.0179443359375, 3.162841796875, 3.3077392578125, 3.45263671875, 3.5975341796875, 3.742431640625, 3.8873291015625, 4.0322265625, 4.1771240234375, 4.322021484375, 4.4669189453125, 4.61181640625, 4.7567138671875, 4.901611328125, 5.0465087890625, 5.19140625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 5.0, 10.0, 15.0, 19.0, 24.0, 45.0, 80.0, 108.0, 173.0, 163.0, 126.0, 92.0, 45.0, 30.0, 16.0, 11.0, 8.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.42622375488281, -55.24839782714844, -53.07057189941406, -50.89274978637695, -48.71492385864258, -46.5370979309082, -44.359275817871094, -42.18144989013672, -40.003623962402344, -37.82579803466797, -35.647972106933594, -33.470149993896484, -31.29232406616211, -29.114498138427734, -26.936674118041992, -24.75885009765625, -22.581024169921875, -20.4031982421875, -18.225374221801758, -16.047550201416016, -13.86972427368164, -11.691899299621582, -9.514074325561523, -7.336249351501465, -5.158424377441406, -2.9805994033813477, -0.8027744293212891, 1.3750505447387695, 3.552875518798828, 5.730700492858887, 7.908525466918945, 10.086350440979004, 12.264175415039062, 14.442000389099121, 16.61982536315918, 18.797649383544922, 20.975475311279297, 23.153301239013672, 25.331125259399414, 27.508949279785156, 29.68677520751953, 31.864601135253906, 34.04242706298828, 36.22024917602539, 38.398075103759766, 40.57590103149414, 42.75372314453125, 44.931549072265625, 47.109375, 49.287200927734375, 51.46502685546875, 53.64284896850586, 55.820674896240234, 57.99850082397461, 60.17632293701172, 62.354148864746094, 64.53197479248047, 66.70980072021484, 68.88762664794922, 71.0654525756836, 73.24327087402344, 75.42109680175781, 77.59892272949219, 79.77674865722656, 81.95457458496094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 21.0, 8.0, 10.0, 23.0, 13.0, 37.0, 31.0, 32.0, 35.0, 42.0, 28.0, 45.0, 39.0, 52.0, 54.0, 62.0, 62.0, 52.0, 43.0, 25.0, 45.0, 38.0, 23.0, 25.0, 29.0, 21.0, 25.0, 17.0, 14.0, 7.0, 5.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.19241714477539, -30.18705940246582, -29.18170166015625, -28.17634391784668, -27.17098617553711, -26.165630340576172, -25.1602725982666, -24.15491485595703, -23.14955711364746, -22.14419937133789, -21.13884162902832, -20.13348388671875, -19.128128051757812, -18.12276840209961, -17.117412567138672, -16.1120548248291, -15.106697082519531, -14.101339340209961, -13.09598159790039, -12.090624809265137, -11.085267066955566, -10.079909324645996, -9.074552536010742, -8.069194793701172, -7.063837051391602, -6.058479309082031, -5.053122043609619, -4.047764778137207, -3.0424070358276367, -2.0370492935180664, -1.0316920280456543, -0.026334762573242188, 0.9790267944335938, 1.984384298324585, 2.989741802215576, 3.9950993061065674, 5.000456809997559, 6.005814552307129, 7.011171817779541, 8.016529083251953, 9.021886825561523, 10.027244567871094, 11.032602310180664, 12.037959098815918, 13.043316841125488, 14.048674583435059, 15.054031372070312, 16.059389114379883, 17.064746856689453, 18.070104598999023, 19.075462341308594, 20.080820083618164, 21.086177825927734, 22.091533660888672, 23.096891403198242, 24.102249145507812, 25.107606887817383, 26.112964630126953, 27.118322372436523, 28.123680114746094, 29.12903594970703, 30.134395599365234, 31.139751434326172, 32.145111083984375, 33.15046691894531]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 11.0, 10.0, 12.0, 11.0, 21.0, 25.0, 47.0, 59.0, 80.0, 140.0, 228.0, 275.0, 408.0, 633.0, 1043.0, 1718.0, 3112.0, 5529.0, 11378.0, 25982.0, 71632.0, 276606.0, 461411.0, 117017.0, 38520.0, 15531.0, 7439.0, 3851.0, 2249.0, 1268.0, 845.0, 472.0, 289.0, 214.0, 154.0, 92.0, 55.0, 47.0, 53.0, 18.0, 16.0, 15.0, 10.0, 7.0, 8.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.58349609375, -9.2763671875, -8.96923828125, -8.662109375, -8.35498046875, -8.0478515625, -7.74072265625, -7.43359375, -7.12646484375, -6.8193359375, -6.51220703125, -6.205078125, -5.89794921875, -5.5908203125, -5.28369140625, -4.9765625, -4.66943359375, -4.3623046875, -4.05517578125, -3.748046875, -3.44091796875, -3.1337890625, -2.82666015625, -2.51953125, -2.21240234375, -1.9052734375, -1.59814453125, -1.291015625, -0.98388671875, -0.6767578125, -0.36962890625, -0.0625, 0.24462890625, 0.5517578125, 0.85888671875, 1.166015625, 1.47314453125, 1.7802734375, 2.08740234375, 2.39453125, 2.70166015625, 3.0087890625, 3.31591796875, 3.623046875, 3.93017578125, 4.2373046875, 4.54443359375, 4.8515625, 5.15869140625, 5.4658203125, 5.77294921875, 6.080078125, 6.38720703125, 6.6943359375, 7.00146484375, 7.30859375, 7.61572265625, 7.9228515625, 8.22998046875, 8.537109375, 8.84423828125, 9.1513671875, 9.45849609375, 9.765625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 1.0, 10.0, 10.0, 10.0, 14.0, 26.0, 36.0, 37.0, 63.0, 70.0, 84.0, 112.0, 84.0, 86.0, 74.0, 68.0, 54.0, 42.0, 30.0, 18.0, 16.0, 15.0, 10.0, 3.0, 9.0, 0.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.76739501953125, -1.7027587890625, -1.63812255859375, -1.573486328125, -1.50885009765625, -1.4442138671875, -1.37957763671875, -1.31494140625, -1.25030517578125, -1.1856689453125, -1.12103271484375, -1.056396484375, -0.99176025390625, -0.9271240234375, -0.86248779296875, -0.7978515625, -0.73321533203125, -0.6685791015625, -0.60394287109375, -0.539306640625, -0.47467041015625, -0.4100341796875, -0.34539794921875, -0.28076171875, -0.21612548828125, -0.1514892578125, -0.08685302734375, -0.022216796875, 0.04241943359375, 0.1070556640625, 0.17169189453125, 0.236328125, 0.30096435546875, 0.3656005859375, 0.43023681640625, 0.494873046875, 0.55950927734375, 0.6241455078125, 0.68878173828125, 0.75341796875, 0.81805419921875, 0.8826904296875, 0.94732666015625, 1.011962890625, 1.07659912109375, 1.1412353515625, 1.20587158203125, 1.2705078125, 1.33514404296875, 1.3997802734375, 1.46441650390625, 1.529052734375, 1.59368896484375, 1.6583251953125, 1.72296142578125, 1.78759765625, 1.85223388671875, 1.9168701171875, 1.98150634765625, 2.046142578125, 2.11077880859375, 2.1754150390625, 2.24005126953125, 2.3046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 4.0, 4.0, 5.0, 8.0, 17.0, 23.0, 20.0, 37.0, 59.0, 57.0, 85.0, 112.0, 144.0, 229.0, 303.0, 442.0, 713.0, 1075.0, 1694.0, 2705.0, 4583.0, 7969.0, 14973.0, 30149.0, 67757.0, 177061.0, 389585.0, 201773.0, 75674.0, 33261.0, 16278.0, 8875.0, 4912.0, 2779.0, 1787.0, 1120.0, 642.0, 483.0, 335.0, 239.0, 168.0, 99.0, 101.0, 58.0, 40.0, 21.0, 25.0, 27.0, 11.0, 7.0, 8.0, 4.0, 10.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.46875, -6.24993896484375, -6.0311279296875, -5.81231689453125, -5.593505859375, -5.37469482421875, -5.1558837890625, -4.93707275390625, -4.71826171875, -4.49945068359375, -4.2806396484375, -4.06182861328125, -3.843017578125, -3.62420654296875, -3.4053955078125, -3.18658447265625, -2.9677734375, -2.74896240234375, -2.5301513671875, -2.31134033203125, -2.092529296875, -1.87371826171875, -1.6549072265625, -1.43609619140625, -1.21728515625, -0.99847412109375, -0.7796630859375, -0.56085205078125, -0.342041015625, -0.12322998046875, 0.0955810546875, 0.31439208984375, 0.533203125, 0.75201416015625, 0.9708251953125, 1.18963623046875, 1.408447265625, 1.62725830078125, 1.8460693359375, 2.06488037109375, 2.28369140625, 2.50250244140625, 2.7213134765625, 2.94012451171875, 3.158935546875, 3.37774658203125, 3.5965576171875, 3.81536865234375, 4.0341796875, 4.25299072265625, 4.4718017578125, 4.69061279296875, 4.909423828125, 5.12823486328125, 5.3470458984375, 5.56585693359375, 5.78466796875, 6.00347900390625, 6.2222900390625, 6.44110107421875, 6.659912109375, 6.87872314453125, 7.0975341796875, 7.31634521484375, 7.53515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 0.0, 6.0, 3.0, 8.0, 6.0, 11.0, 9.0, 11.0, 13.0, 11.0, 14.0, 14.0, 25.0, 22.0, 30.0, 42.0, 28.0, 27.0, 25.0, 34.0, 24.0, 33.0, 47.0, 36.0, 33.0, 48.0, 41.0, 34.0, 37.0, 30.0, 29.0, 22.0, 33.0, 28.0, 28.0, 19.0, 17.0, 25.0, 16.0, 12.0, 11.0, 7.0, 9.0, 13.0, 6.0, 5.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0], "bins": [-7.91796875, -7.69134521484375, -7.4647216796875, -7.23809814453125, -7.011474609375, -6.78485107421875, -6.5582275390625, -6.33160400390625, -6.10498046875, -5.87835693359375, -5.6517333984375, -5.42510986328125, -5.198486328125, -4.97186279296875, -4.7452392578125, -4.51861572265625, -4.2919921875, -4.06536865234375, -3.8387451171875, -3.61212158203125, -3.385498046875, -3.15887451171875, -2.9322509765625, -2.70562744140625, -2.47900390625, -2.25238037109375, -2.0257568359375, -1.79913330078125, -1.572509765625, -1.34588623046875, -1.1192626953125, -0.89263916015625, -0.666015625, -0.43939208984375, -0.2127685546875, 0.01385498046875, 0.240478515625, 0.46710205078125, 0.6937255859375, 0.92034912109375, 1.14697265625, 1.37359619140625, 1.6002197265625, 1.82684326171875, 2.053466796875, 2.28009033203125, 2.5067138671875, 2.73333740234375, 2.9599609375, 3.18658447265625, 3.4132080078125, 3.63983154296875, 3.866455078125, 4.09307861328125, 4.3197021484375, 4.54632568359375, 4.77294921875, 4.99957275390625, 5.2261962890625, 5.45281982421875, 5.679443359375, 5.90606689453125, 6.1326904296875, 6.35931396484375, 6.5859375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 6.0, 3.0, 6.0, 10.0, 15.0, 28.0, 31.0, 58.0, 61.0, 88.0, 167.0, 292.0, 463.0, 1048.0, 2095.0, 5136.0, 14398.0, 54598.0, 312991.0, 521729.0, 99501.0, 22681.0, 7328.0, 2980.0, 1318.0, 654.0, 327.0, 201.0, 107.0, 63.0, 54.0, 39.0, 27.0, 20.0, 9.0, 7.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.44921875, -7.2247314453125, -7.000244140625, -6.7757568359375, -6.55126953125, -6.3267822265625, -6.102294921875, -5.8778076171875, -5.6533203125, -5.4288330078125, -5.204345703125, -4.9798583984375, -4.75537109375, -4.5308837890625, -4.306396484375, -4.0819091796875, -3.857421875, -3.6329345703125, -3.408447265625, -3.1839599609375, -2.95947265625, -2.7349853515625, -2.510498046875, -2.2860107421875, -2.0615234375, -1.8370361328125, -1.612548828125, -1.3880615234375, -1.16357421875, -0.9390869140625, -0.714599609375, -0.4901123046875, -0.265625, -0.0411376953125, 0.183349609375, 0.4078369140625, 0.63232421875, 0.8568115234375, 1.081298828125, 1.3057861328125, 1.5302734375, 1.7547607421875, 1.979248046875, 2.2037353515625, 2.42822265625, 2.6527099609375, 2.877197265625, 3.1016845703125, 3.326171875, 3.5506591796875, 3.775146484375, 3.9996337890625, 4.22412109375, 4.4486083984375, 4.673095703125, 4.8975830078125, 5.1220703125, 5.3465576171875, 5.571044921875, 5.7955322265625, 6.02001953125, 6.2445068359375, 6.468994140625, 6.6934814453125, 6.91796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 8.0, 12.0, 19.0, 23.0, 38.0, 55.0, 64.0, 80.0, 75.0, 92.0, 108.0, 85.0, 81.0, 54.0, 43.0, 33.0, 30.0, 32.0, 16.0, 7.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00022423267364501953, -0.00021628104150295258, -0.00020832940936088562, -0.00020037777721881866, -0.0001924261450767517, -0.00018447451293468475, -0.0001765228807926178, -0.00016857124865055084, -0.0001606196165084839, -0.00015266798436641693, -0.00014471635222434998, -0.00013676472008228302, -0.00012881308794021606, -0.00012086145579814911, -0.00011290982365608215, -0.0001049581915140152, -9.700655937194824e-05, -8.905492722988129e-05, -8.110329508781433e-05, -7.315166294574738e-05, -6.520003080368042e-05, -5.7248398661613464e-05, -4.929676651954651e-05, -4.134513437747955e-05, -3.33935022354126e-05, -2.5441870093345642e-05, -1.7490237951278687e-05, -9.538605809211731e-06, -1.5869736671447754e-06, 6.36465847492218e-06, 1.4316290616989136e-05, 2.226792275905609e-05, 3.0219554901123047e-05, 3.817118704319e-05, 4.612281918525696e-05, 5.4074451327323914e-05, 6.202608346939087e-05, 6.997771561145782e-05, 7.792934775352478e-05, 8.588097989559174e-05, 9.383261203765869e-05, 0.00010178424417972565, 0.0001097358763217926, 0.00011768750846385956, 0.00012563914060592651, 0.00013359077274799347, 0.00014154240489006042, 0.00014949403703212738, 0.00015744566917419434, 0.0001653973013162613, 0.00017334893345832825, 0.0001813005656003952, 0.00018925219774246216, 0.00019720382988452911, 0.00020515546202659607, 0.00021310709416866302, 0.00022105872631072998, 0.00022901035845279694, 0.0002369619905948639, 0.00024491362273693085, 0.0002528652548789978, 0.00026081688702106476, 0.0002687685191631317, 0.00027672015130519867, 0.0002846717834472656]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 10.0, 24.0, 25.0, 48.0, 57.0, 121.0, 147.0, 229.0, 365.0, 532.0, 987.0, 1644.0, 3209.0, 6415.0, 13728.0, 33311.0, 93881.0, 286383.0, 383614.0, 140831.0, 46946.0, 18566.0, 8256.0, 4147.0, 2099.0, 1189.0, 671.0, 397.0, 236.0, 162.0, 110.0, 75.0, 40.0, 28.0, 23.0, 12.0, 6.0, 6.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.45855712890625, -4.3155517578125, -4.17254638671875, -4.029541015625, -3.88653564453125, -3.7435302734375, -3.60052490234375, -3.45751953125, -3.31451416015625, -3.1715087890625, -3.02850341796875, -2.885498046875, -2.74249267578125, -2.5994873046875, -2.45648193359375, -2.3134765625, -2.17047119140625, -2.0274658203125, -1.88446044921875, -1.741455078125, -1.59844970703125, -1.4554443359375, -1.31243896484375, -1.16943359375, -1.02642822265625, -0.8834228515625, -0.74041748046875, -0.597412109375, -0.45440673828125, -0.3114013671875, -0.16839599609375, -0.025390625, 0.11761474609375, 0.2606201171875, 0.40362548828125, 0.546630859375, 0.68963623046875, 0.8326416015625, 0.97564697265625, 1.11865234375, 1.26165771484375, 1.4046630859375, 1.54766845703125, 1.690673828125, 1.83367919921875, 1.9766845703125, 2.11968994140625, 2.2626953125, 2.40570068359375, 2.5487060546875, 2.69171142578125, 2.834716796875, 2.97772216796875, 3.1207275390625, 3.26373291015625, 3.40673828125, 3.54974365234375, 3.6927490234375, 3.83575439453125, 3.978759765625, 4.12176513671875, 4.2647705078125, 4.40777587890625, 4.55078125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 3.0, 5.0, 6.0, 10.0, 12.0, 20.0, 19.0, 31.0, 30.0, 30.0, 43.0, 39.0, 49.0, 60.0, 49.0, 60.0, 63.0, 65.0, 54.0, 50.0, 42.0, 46.0, 39.0, 30.0, 27.0, 23.0, 13.0, 22.0, 13.0, 9.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.895782470703125, -2.78570556640625, -2.675628662109375, -2.5655517578125, -2.455474853515625, -2.34539794921875, -2.235321044921875, -2.125244140625, -2.015167236328125, -1.90509033203125, -1.795013427734375, -1.6849365234375, -1.574859619140625, -1.46478271484375, -1.354705810546875, -1.24462890625, -1.134552001953125, -1.02447509765625, -0.914398193359375, -0.8043212890625, -0.694244384765625, -0.58416748046875, -0.474090576171875, -0.364013671875, -0.253936767578125, -0.14385986328125, -0.033782958984375, 0.0762939453125, 0.186370849609375, 0.29644775390625, 0.406524658203125, 0.5166015625, 0.626678466796875, 0.73675537109375, 0.846832275390625, 0.9569091796875, 1.066986083984375, 1.17706298828125, 1.287139892578125, 1.397216796875, 1.507293701171875, 1.61737060546875, 1.727447509765625, 1.8375244140625, 1.947601318359375, 2.05767822265625, 2.167755126953125, 2.27783203125, 2.387908935546875, 2.49798583984375, 2.608062744140625, 2.7181396484375, 2.828216552734375, 2.93829345703125, 3.048370361328125, 3.158447265625, 3.268524169921875, 3.37860107421875, 3.488677978515625, 3.5987548828125, 3.708831787109375, 3.81890869140625, 3.928985595703125, 4.0390625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 25.0, 80.0, 148.0, 236.0, 219.0, 110.0, 51.0, 35.0, 22.0, 13.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.54007720947266, -60.87861633300781, -57.21715545654297, -53.555694580078125, -49.89423370361328, -46.23277282714844, -42.571311950683594, -38.90985107421875, -35.248390197753906, -31.586929321289062, -27.92546844482422, -24.264007568359375, -20.60254669189453, -16.941085815429688, -13.279624938964844, -9.6181640625, -5.956703186035156, -2.2952423095703125, 1.3662185668945312, 5.027679443359375, 8.689140319824219, 12.350601196289062, 16.012062072753906, 19.67352294921875, 23.334983825683594, 26.996444702148438, 30.65790557861328, 34.319366455078125, 37.98082733154297, 41.64228820800781, 45.303749084472656, 48.9652099609375, 52.62666320800781, 56.288124084472656, 59.9495849609375, 63.611045837402344, 67.27250671386719, 70.93396759033203, 74.59542846679688, 78.25688934326172, 81.91835021972656, 85.5798110961914, 89.24127197265625, 92.9027328491211, 96.56419372558594, 100.22565460205078, 103.88711547851562, 107.54857635498047, 111.21003723144531, 114.87149810791016, 118.532958984375, 122.19441986083984, 125.85588073730469, 129.517333984375, 133.17880249023438, 136.84027099609375, 140.50172424316406, 144.16317749023438, 147.82464599609375, 151.48611450195312, 155.14756774902344, 158.80902099609375, 162.47048950195312, 166.1319580078125, 169.7934112548828]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 8.0, 6.0, 16.0, 13.0, 24.0, 57.0, 73.0, 118.0, 158.0, 152.0, 117.0, 96.0, 38.0, 34.0, 16.0, 14.0, 7.0, 9.0, 5.0, 5.0, 3.0, 7.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.6510467529297, -145.63816833496094, -140.62530517578125, -135.6124267578125, -130.5995635986328, -125.58668518066406, -120.57381439208984, -115.56094360351562, -110.5480728149414, -105.53520202636719, -100.52233123779297, -95.50946044921875, -90.49658203125, -85.48371887207031, -80.47084045410156, -75.45796966552734, -70.44509887695312, -65.4322280883789, -60.41935729980469, -55.4064826965332, -50.393611907958984, -45.380741119384766, -40.36786651611328, -35.35499572753906, -30.342124938964844, -25.329254150390625, -20.316381454467773, -15.303509712219238, -10.290637969970703, -5.277767181396484, -0.2648944854736328, 4.747978210449219, 9.760833740234375, 14.77370548248291, 19.786577224731445, 24.799449920654297, 29.812320709228516, 34.825191497802734, 39.83806610107422, 44.85093688964844, 49.863807678222656, 54.876678466796875, 59.889549255371094, 64.90242004394531, 69.91529846191406, 74.92816162109375, 79.9410400390625, 84.95391082763672, 89.96678161621094, 94.97965240478516, 99.99252319335938, 105.0053939819336, 110.01826477050781, 115.03114318847656, 120.04401397705078, 125.056884765625, 130.06976318359375, 135.0826416015625, 140.0955047607422, 145.10838317871094, 150.12124633789062, 155.13412475585938, 160.14698791503906, 165.1598663330078, 170.1727294921875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 10.0, 7.0, 13.0, 13.0, 19.0, 18.0, 45.0, 48.0, 78.0, 118.0, 160.0, 264.0, 466.0, 796.0, 1350.0, 2708.0, 6093.0, 15899.0, 56108.0, 471244.0, 3477828.0, 117590.0, 26413.0, 9147.0, 3760.0, 1825.0, 944.0, 467.0, 271.0, 192.0, 114.0, 79.0, 57.0, 35.0, 18.0, 21.0, 14.0, 12.0, 8.0, 7.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.1875, -30.1884765625, -29.189453125, -28.1904296875, -27.19140625, -26.1923828125, -25.193359375, -24.1943359375, -23.1953125, -22.1962890625, -21.197265625, -20.1982421875, -19.19921875, -18.2001953125, -17.201171875, -16.2021484375, -15.203125, -14.2041015625, -13.205078125, -12.2060546875, -11.20703125, -10.2080078125, -9.208984375, -8.2099609375, -7.2109375, -6.2119140625, -5.212890625, -4.2138671875, -3.21484375, -2.2158203125, -1.216796875, -0.2177734375, 0.78125, 1.7802734375, 2.779296875, 3.7783203125, 4.77734375, 5.7763671875, 6.775390625, 7.7744140625, 8.7734375, 9.7724609375, 10.771484375, 11.7705078125, 12.76953125, 13.7685546875, 14.767578125, 15.7666015625, 16.765625, 17.7646484375, 18.763671875, 19.7626953125, 20.76171875, 21.7607421875, 22.759765625, 23.7587890625, 24.7578125, 25.7568359375, 26.755859375, 27.7548828125, 28.75390625, 29.7529296875, 30.751953125, 31.7509765625, 32.75]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 10.0, 3.0, 8.0, 15.0, 18.0, 26.0, 40.0, 54.0, 65.0, 79.0, 103.0, 84.0, 102.0, 78.0, 75.0, 59.0, 39.0, 31.0, 31.0, 20.0, 19.0, 8.0, 7.0, 5.0, 4.0, 3.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2109375, -2.139251708984375, -2.06756591796875, -1.995880126953125, -1.9241943359375, -1.852508544921875, -1.78082275390625, -1.709136962890625, -1.637451171875, -1.565765380859375, -1.49407958984375, -1.422393798828125, -1.3507080078125, -1.279022216796875, -1.20733642578125, -1.135650634765625, -1.06396484375, -0.992279052734375, -0.92059326171875, -0.848907470703125, -0.7772216796875, -0.705535888671875, -0.63385009765625, -0.562164306640625, -0.490478515625, -0.418792724609375, -0.34710693359375, -0.275421142578125, -0.2037353515625, -0.132049560546875, -0.06036376953125, 0.011322021484375, 0.0830078125, 0.154693603515625, 0.22637939453125, 0.298065185546875, 0.3697509765625, 0.441436767578125, 0.51312255859375, 0.584808349609375, 0.656494140625, 0.728179931640625, 0.79986572265625, 0.871551513671875, 0.9432373046875, 1.014923095703125, 1.08660888671875, 1.158294677734375, 1.22998046875, 1.301666259765625, 1.37335205078125, 1.445037841796875, 1.5167236328125, 1.588409423828125, 1.66009521484375, 1.731781005859375, 1.803466796875, 1.875152587890625, 1.94683837890625, 2.018524169921875, 2.0902099609375, 2.161895751953125, 2.23358154296875, 2.305267333984375, 2.376953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 12.0, 19.0, 22.0, 31.0, 49.0, 61.0, 104.0, 180.0, 286.0, 581.0, 1125.0, 2374.0, 5587.0, 15007.0, 50451.0, 254989.0, 3187679.0, 556573.0, 83745.0, 21907.0, 7410.0, 3076.0, 1384.0, 706.0, 342.0, 188.0, 122.0, 84.0, 41.0, 33.0, 27.0, 20.0, 14.0, 6.0, 12.0, 8.0, 0.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.4375, -31.474365234375, -30.51123046875, -29.548095703125, -28.5849609375, -27.621826171875, -26.65869140625, -25.695556640625, -24.732421875, -23.769287109375, -22.80615234375, -21.843017578125, -20.8798828125, -19.916748046875, -18.95361328125, -17.990478515625, -17.02734375, -16.064208984375, -15.10107421875, -14.137939453125, -13.1748046875, -12.211669921875, -11.24853515625, -10.285400390625, -9.322265625, -8.359130859375, -7.39599609375, -6.432861328125, -5.4697265625, -4.506591796875, -3.54345703125, -2.580322265625, -1.6171875, -0.654052734375, 0.30908203125, 1.272216796875, 2.2353515625, 3.198486328125, 4.16162109375, 5.124755859375, 6.087890625, 7.051025390625, 8.01416015625, 8.977294921875, 9.9404296875, 10.903564453125, 11.86669921875, 12.829833984375, 13.79296875, 14.756103515625, 15.71923828125, 16.682373046875, 17.6455078125, 18.608642578125, 19.57177734375, 20.534912109375, 21.498046875, 22.461181640625, 23.42431640625, 24.387451171875, 25.3505859375, 26.313720703125, 27.27685546875, 28.239990234375, 29.203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 4.0, 6.0, 5.0, 13.0, 14.0, 28.0, 35.0, 34.0, 56.0, 101.0, 153.0, 274.0, 754.0, 1588.0, 429.0, 223.0, 123.0, 78.0, 39.0, 36.0, 25.0, 12.0, 11.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.109375, -6.937103271484375, -6.76483154296875, -6.592559814453125, -6.4202880859375, -6.248016357421875, -6.07574462890625, -5.903472900390625, -5.731201171875, -5.558929443359375, -5.38665771484375, -5.214385986328125, -5.0421142578125, -4.869842529296875, -4.69757080078125, -4.525299072265625, -4.35302734375, -4.180755615234375, -4.00848388671875, -3.836212158203125, -3.6639404296875, -3.491668701171875, -3.31939697265625, -3.147125244140625, -2.974853515625, -2.802581787109375, -2.63031005859375, -2.458038330078125, -2.2857666015625, -2.113494873046875, -1.94122314453125, -1.768951416015625, -1.5966796875, -1.424407958984375, -1.25213623046875, -1.079864501953125, -0.9075927734375, -0.735321044921875, -0.56304931640625, -0.390777587890625, -0.218505859375, -0.046234130859375, 0.12603759765625, 0.298309326171875, 0.4705810546875, 0.642852783203125, 0.81512451171875, 0.987396240234375, 1.15966796875, 1.331939697265625, 1.50421142578125, 1.676483154296875, 1.8487548828125, 2.021026611328125, 2.19329833984375, 2.365570068359375, 2.537841796875, 2.710113525390625, 2.88238525390625, 3.054656982421875, 3.2269287109375, 3.399200439453125, 3.57147216796875, 3.743743896484375, 3.916015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 8.0, 15.0, 15.0, 27.0, 50.0, 82.0, 130.0, 175.0, 188.0, 155.0, 76.0, 41.0, 12.0, 14.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-59.660587310791016, -58.139892578125, -56.61920166015625, -55.098506927490234, -53.57781219482422, -52.05712127685547, -50.53642654418945, -49.01573181152344, -47.49504089355469, -45.97434616088867, -44.45365524291992, -42.932960510253906, -41.412269592285156, -39.89157485961914, -38.370880126953125, -36.850189208984375, -35.32949447631836, -33.808799743652344, -32.288108825683594, -30.767414093017578, -29.246721267700195, -27.726028442382812, -26.205333709716797, -24.684640884399414, -23.16394805908203, -21.64325523376465, -20.122562408447266, -18.60186767578125, -17.081174850463867, -15.560482025146484, -14.039788246154785, -12.519094467163086, -10.998405456542969, -9.477712631225586, -7.957018852233887, -6.436325550079346, -4.915632247924805, -3.3949389457702637, -1.8742456436157227, -0.35355186462402344, 1.1671409606933594, 2.6878342628479004, 4.208527565002441, 5.729220867156982, 7.249914169311523, 8.770606994628906, 10.291300773620605, 11.811994552612305, 13.332687377929688, 14.85338020324707, 16.374073028564453, 17.89476776123047, 19.41546058654785, 20.936153411865234, 22.45684814453125, 23.977540969848633, 25.498233795166016, 27.0189266204834, 28.53961944580078, 30.060314178466797, 31.58100700378418, 33.10169982910156, 34.62239456176758, 36.143089294433594, 37.663780212402344]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 2.0, 3.0, 6.0, 10.0, 6.0, 9.0, 10.0, 11.0, 20.0, 20.0, 31.0, 35.0, 27.0, 32.0, 32.0, 36.0, 44.0, 50.0, 51.0, 38.0, 51.0, 56.0, 54.0, 38.0, 40.0, 29.0, 34.0, 27.0, 35.0, 26.0, 16.0, 26.0, 14.0, 16.0, 14.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-18.467355728149414, -17.914037704467773, -17.360721588134766, -16.807403564453125, -16.254085540771484, -15.700767517089844, -15.14745044708252, -14.594133377075195, -14.040815353393555, -13.487497329711914, -12.93418025970459, -12.380863189697266, -11.827545166015625, -11.274227142333984, -10.72091007232666, -10.167593002319336, -9.614274978637695, -9.060956954956055, -8.50763988494873, -7.954322338104248, -7.401004791259766, -6.847687244415283, -6.294369697570801, -5.741052150726318, -5.187734603881836, -4.6344170570373535, -4.081099510192871, -3.5277819633483887, -2.9744644165039062, -2.421146869659424, -1.8678293228149414, -1.314511775970459, -0.7611923217773438, -0.20787477493286133, 0.3454427719116211, 0.8987603187561035, 1.452077865600586, 2.0053954124450684, 2.558712959289551, 3.112030506134033, 3.6653480529785156, 4.218665599822998, 4.7719831466674805, 5.325300693511963, 5.878618240356445, 6.431935787200928, 6.98525333404541, 7.538570880889893, 8.091888427734375, 8.645206451416016, 9.19852352142334, 9.751840591430664, 10.305158615112305, 10.858476638793945, 11.41179370880127, 11.965110778808594, 12.518428802490234, 13.071746826171875, 13.6250638961792, 14.178380966186523, 14.731698989868164, 15.285017013549805, 15.838334083557129, 16.391651153564453, 16.944969177246094]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 6.0, 0.0, 2.0, 5.0, 4.0, 7.0, 7.0, 13.0, 21.0, 30.0, 37.0, 69.0, 117.0, 214.0, 342.0, 581.0, 992.0, 1794.0, 3718.0, 7377.0, 16585.0, 43383.0, 143941.0, 489449.0, 234747.0, 63120.0, 22464.0, 9783.0, 4570.0, 2190.0, 1226.0, 705.0, 403.0, 250.0, 132.0, 85.0, 60.0, 49.0, 32.0, 14.0, 15.0, 5.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9765625, -12.4505615234375, -11.924560546875, -11.3985595703125, -10.87255859375, -10.3465576171875, -9.820556640625, -9.2945556640625, -8.7685546875, -8.2425537109375, -7.716552734375, -7.1905517578125, -6.66455078125, -6.1385498046875, -5.612548828125, -5.0865478515625, -4.560546875, -4.0345458984375, -3.508544921875, -2.9825439453125, -2.45654296875, -1.9305419921875, -1.404541015625, -0.8785400390625, -0.3525390625, 0.1734619140625, 0.699462890625, 1.2254638671875, 1.75146484375, 2.2774658203125, 2.803466796875, 3.3294677734375, 3.85546875, 4.3814697265625, 4.907470703125, 5.4334716796875, 5.95947265625, 6.4854736328125, 7.011474609375, 7.5374755859375, 8.0634765625, 8.5894775390625, 9.115478515625, 9.6414794921875, 10.16748046875, 10.6934814453125, 11.219482421875, 11.7454833984375, 12.271484375, 12.7974853515625, 13.323486328125, 13.8494873046875, 14.37548828125, 14.9014892578125, 15.427490234375, 15.9534912109375, 16.4794921875, 17.0054931640625, 17.531494140625, 18.0574951171875, 18.58349609375, 19.1094970703125, 19.635498046875, 20.1614990234375, 20.6875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 6.0, 7.0, 11.0, 10.0, 13.0, 28.0, 19.0, 25.0, 45.0, 33.0, 47.0, 46.0, 62.0, 69.0, 65.0, 60.0, 62.0, 59.0, 58.0, 51.0, 48.0, 43.0, 23.0, 18.0, 20.0, 14.0, 13.0, 9.0, 12.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.072265625, -2.0162353515625, -1.960205078125, -1.9041748046875, -1.84814453125, -1.7921142578125, -1.736083984375, -1.6800537109375, -1.6240234375, -1.5679931640625, -1.511962890625, -1.4559326171875, -1.39990234375, -1.3438720703125, -1.287841796875, -1.2318115234375, -1.17578125, -1.1197509765625, -1.063720703125, -1.0076904296875, -0.95166015625, -0.8956298828125, -0.839599609375, -0.7835693359375, -0.7275390625, -0.6715087890625, -0.615478515625, -0.5594482421875, -0.50341796875, -0.4473876953125, -0.391357421875, -0.3353271484375, -0.279296875, -0.2232666015625, -0.167236328125, -0.1112060546875, -0.05517578125, 0.0008544921875, 0.056884765625, 0.1129150390625, 0.1689453125, 0.2249755859375, 0.281005859375, 0.3370361328125, 0.39306640625, 0.4490966796875, 0.505126953125, 0.5611572265625, 0.6171875, 0.6732177734375, 0.729248046875, 0.7852783203125, 0.84130859375, 0.8973388671875, 0.953369140625, 1.0093994140625, 1.0654296875, 1.1214599609375, 1.177490234375, 1.2335205078125, 1.28955078125, 1.3455810546875, 1.401611328125, 1.4576416015625, 1.513671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 14.0, 11.0, 18.0, 21.0, 30.0, 43.0, 80.0, 87.0, 146.0, 221.0, 365.0, 600.0, 924.0, 1488.0, 2620.0, 4918.0, 10007.0, 22181.0, 59369.0, 202276.0, 455043.0, 189213.0, 57022.0, 21353.0, 9437.0, 4638.0, 2537.0, 1553.0, 844.0, 515.0, 351.0, 218.0, 138.0, 78.0, 57.0, 47.0, 25.0, 15.0, 11.0, 13.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-12.53125, -12.1568603515625, -11.782470703125, -11.4080810546875, -11.03369140625, -10.6593017578125, -10.284912109375, -9.9105224609375, -9.5361328125, -9.1617431640625, -8.787353515625, -8.4129638671875, -8.03857421875, -7.6641845703125, -7.289794921875, -6.9154052734375, -6.541015625, -6.1666259765625, -5.792236328125, -5.4178466796875, -5.04345703125, -4.6690673828125, -4.294677734375, -3.9202880859375, -3.5458984375, -3.1715087890625, -2.797119140625, -2.4227294921875, -2.04833984375, -1.6739501953125, -1.299560546875, -0.9251708984375, -0.55078125, -0.1763916015625, 0.197998046875, 0.5723876953125, 0.94677734375, 1.3211669921875, 1.695556640625, 2.0699462890625, 2.4443359375, 2.8187255859375, 3.193115234375, 3.5675048828125, 3.94189453125, 4.3162841796875, 4.690673828125, 5.0650634765625, 5.439453125, 5.8138427734375, 6.188232421875, 6.5626220703125, 6.93701171875, 7.3114013671875, 7.685791015625, 8.0601806640625, 8.4345703125, 8.8089599609375, 9.183349609375, 9.5577392578125, 9.93212890625, 10.3065185546875, 10.680908203125, 11.0552978515625, 11.4296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 2.0, 4.0, 1.0, 6.0, 7.0, 14.0, 16.0, 14.0, 22.0, 30.0, 48.0, 41.0, 45.0, 40.0, 53.0, 54.0, 51.0, 66.0, 56.0, 55.0, 63.0, 54.0, 53.0, 46.0, 26.0, 21.0, 24.0, 20.0, 18.0, 17.0, 9.0, 9.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.1328125, -9.862548828125, -9.59228515625, -9.322021484375, -9.0517578125, -8.781494140625, -8.51123046875, -8.240966796875, -7.970703125, -7.700439453125, -7.43017578125, -7.159912109375, -6.8896484375, -6.619384765625, -6.34912109375, -6.078857421875, -5.80859375, -5.538330078125, -5.26806640625, -4.997802734375, -4.7275390625, -4.457275390625, -4.18701171875, -3.916748046875, -3.646484375, -3.376220703125, -3.10595703125, -2.835693359375, -2.5654296875, -2.295166015625, -2.02490234375, -1.754638671875, -1.484375, -1.214111328125, -0.94384765625, -0.673583984375, -0.4033203125, -0.133056640625, 0.13720703125, 0.407470703125, 0.677734375, 0.947998046875, 1.21826171875, 1.488525390625, 1.7587890625, 2.029052734375, 2.29931640625, 2.569580078125, 2.83984375, 3.110107421875, 3.38037109375, 3.650634765625, 3.9208984375, 4.191162109375, 4.46142578125, 4.731689453125, 5.001953125, 5.272216796875, 5.54248046875, 5.812744140625, 6.0830078125, 6.353271484375, 6.62353515625, 6.893798828125, 7.1640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 2.0, 8.0, 14.0, 23.0, 37.0, 60.0, 86.0, 123.0, 217.0, 377.0, 711.0, 1263.0, 2367.0, 4990.0, 11385.0, 27607.0, 74068.0, 196933.0, 352563.0, 229610.0, 88357.0, 32985.0, 13117.0, 5726.0, 2712.0, 1402.0, 754.0, 422.0, 252.0, 157.0, 70.0, 53.0, 30.0, 23.0, 14.0, 13.0, 6.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -7.01629638671875, -6.7708740234375, -6.52545166015625, -6.280029296875, -6.03460693359375, -5.7891845703125, -5.54376220703125, -5.29833984375, -5.05291748046875, -4.8074951171875, -4.56207275390625, -4.316650390625, -4.07122802734375, -3.8258056640625, -3.58038330078125, -3.3349609375, -3.08953857421875, -2.8441162109375, -2.59869384765625, -2.353271484375, -2.10784912109375, -1.8624267578125, -1.61700439453125, -1.37158203125, -1.12615966796875, -0.8807373046875, -0.63531494140625, -0.389892578125, -0.14447021484375, 0.1009521484375, 0.34637451171875, 0.591796875, 0.83721923828125, 1.0826416015625, 1.32806396484375, 1.573486328125, 1.81890869140625, 2.0643310546875, 2.30975341796875, 2.55517578125, 2.80059814453125, 3.0460205078125, 3.29144287109375, 3.536865234375, 3.78228759765625, 4.0277099609375, 4.27313232421875, 4.5185546875, 4.76397705078125, 5.0093994140625, 5.25482177734375, 5.500244140625, 5.74566650390625, 5.9910888671875, 6.23651123046875, 6.48193359375, 6.72735595703125, 6.9727783203125, 7.21820068359375, 7.463623046875, 7.70904541015625, 7.9544677734375, 8.19989013671875, 8.4453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 5.0, 6.0, 11.0, 21.0, 74.0, 198.0, 309.0, 205.0, 80.0, 30.0, 18.0, 6.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.0011673569679260254, -0.0011216402053833008, -0.0010759234428405762, -0.0010302066802978516, -0.000984489917755127, -0.0009387731552124023, -0.0008930563926696777, -0.0008473396301269531, -0.0008016228675842285, -0.0007559061050415039, -0.0007101893424987793, -0.0006644725799560547, -0.0006187558174133301, -0.0005730390548706055, -0.0005273222923278809, -0.00048160552978515625, -0.00043588876724243164, -0.00039017200469970703, -0.0003444552421569824, -0.0002987384796142578, -0.0002530217170715332, -0.0002073049545288086, -0.00016158819198608398, -0.00011587142944335938, -7.015466690063477e-05, -2.4437904357910156e-05, 2.1278858184814453e-05, 6.699562072753906e-05, 0.00011271238327026367, 0.00015842914581298828, 0.0002041459083557129, 0.0002498626708984375, 0.0002955794334411621, 0.0003412961959838867, 0.00038701295852661133, 0.00043272972106933594, 0.00047844648361206055, 0.0005241632461547852, 0.0005698800086975098, 0.0006155967712402344, 0.000661313533782959, 0.0007070302963256836, 0.0007527470588684082, 0.0007984638214111328, 0.0008441805839538574, 0.000889897346496582, 0.0009356141090393066, 0.0009813308715820312, 0.0010270476341247559, 0.0010727643966674805, 0.001118481159210205, 0.0011641979217529297, 0.0012099146842956543, 0.001255631446838379, 0.0013013482093811035, 0.0013470649719238281, 0.0013927817344665527, 0.0014384984970092773, 0.001484215259552002, 0.0015299320220947266, 0.0015756487846374512, 0.0016213655471801758, 0.0016670823097229004, 0.001712799072265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 12.0, 13.0, 20.0, 31.0, 51.0, 87.0, 120.0, 205.0, 284.0, 461.0, 766.0, 1247.0, 2154.0, 3804.0, 6874.0, 12385.0, 23831.0, 45650.0, 89813.0, 165758.0, 239203.0, 205694.0, 119685.0, 61897.0, 31526.0, 16363.0, 9000.0, 4815.0, 2716.0, 1636.0, 898.0, 618.0, 313.0, 204.0, 141.0, 88.0, 76.0, 47.0, 27.0, 8.0, 12.0, 12.0, 7.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.0396728515625, -5.860595703125, -5.6815185546875, -5.50244140625, -5.3233642578125, -5.144287109375, -4.9652099609375, -4.7861328125, -4.6070556640625, -4.427978515625, -4.2489013671875, -4.06982421875, -3.8907470703125, -3.711669921875, -3.5325927734375, -3.353515625, -3.1744384765625, -2.995361328125, -2.8162841796875, -2.63720703125, -2.4581298828125, -2.279052734375, -2.0999755859375, -1.9208984375, -1.7418212890625, -1.562744140625, -1.3836669921875, -1.20458984375, -1.0255126953125, -0.846435546875, -0.6673583984375, -0.48828125, -0.3092041015625, -0.130126953125, 0.0489501953125, 0.22802734375, 0.4071044921875, 0.586181640625, 0.7652587890625, 0.9443359375, 1.1234130859375, 1.302490234375, 1.4815673828125, 1.66064453125, 1.8397216796875, 2.018798828125, 2.1978759765625, 2.376953125, 2.5560302734375, 2.735107421875, 2.9141845703125, 3.09326171875, 3.2723388671875, 3.451416015625, 3.6304931640625, 3.8095703125, 3.9886474609375, 4.167724609375, 4.3468017578125, 4.52587890625, 4.7049560546875, 4.884033203125, 5.0631103515625, 5.2421875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 6.0, 9.0, 12.0, 15.0, 18.0, 24.0, 22.0, 23.0, 30.0, 30.0, 38.0, 34.0, 39.0, 48.0, 51.0, 62.0, 57.0, 47.0, 50.0, 30.0, 57.0, 42.0, 34.0, 32.0, 24.0, 21.0, 20.0, 23.0, 12.0, 8.0, 12.0, 12.0, 9.0, 10.0, 3.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.328125, -3.21588134765625, -3.1036376953125, -2.99139404296875, -2.879150390625, -2.76690673828125, -2.6546630859375, -2.54241943359375, -2.43017578125, -2.31793212890625, -2.2056884765625, -2.09344482421875, -1.981201171875, -1.86895751953125, -1.7567138671875, -1.64447021484375, -1.5322265625, -1.41998291015625, -1.3077392578125, -1.19549560546875, -1.083251953125, -0.97100830078125, -0.8587646484375, -0.74652099609375, -0.63427734375, -0.52203369140625, -0.4097900390625, -0.29754638671875, -0.185302734375, -0.07305908203125, 0.0391845703125, 0.15142822265625, 0.263671875, 0.37591552734375, 0.4881591796875, 0.60040283203125, 0.712646484375, 0.82489013671875, 0.9371337890625, 1.04937744140625, 1.16162109375, 1.27386474609375, 1.3861083984375, 1.49835205078125, 1.610595703125, 1.72283935546875, 1.8350830078125, 1.94732666015625, 2.0595703125, 2.17181396484375, 2.2840576171875, 2.39630126953125, 2.508544921875, 2.62078857421875, 2.7330322265625, 2.84527587890625, 2.95751953125, 3.06976318359375, 3.1820068359375, 3.29425048828125, 3.406494140625, 3.51873779296875, 3.6309814453125, 3.74322509765625, 3.85546875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 9.0, 10.0, 19.0, 40.0, 74.0, 132.0, 177.0, 184.0, 162.0, 83.0, 46.0, 39.0, 13.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.42327117919922, -79.64752197265625, -75.87176513671875, -72.09601593017578, -68.32025909423828, -64.54450988769531, -60.76875686645508, -56.993003845214844, -53.21725082397461, -49.441497802734375, -45.66574478149414, -41.889991760253906, -38.11424255371094, -34.33848571777344, -30.56273651123047, -26.786983489990234, -23.01123046875, -19.235477447509766, -15.459725379943848, -11.68397331237793, -7.908220291137695, -4.132467269897461, -0.3567161560058594, 3.419036865234375, 7.194789886474609, 10.970542907714844, 14.746294975280762, 18.52204704284668, 22.297800064086914, 26.07355308532715, 29.84930419921875, 33.625057220458984, 37.40080261230469, 41.17655563354492, 44.952308654785156, 48.728057861328125, 52.503814697265625, 56.279563903808594, 60.05531692504883, 63.83106994628906, 67.60682678222656, 71.38257598876953, 75.15833282470703, 78.93408203125, 82.7098388671875, 86.48558807373047, 90.26133728027344, 94.03709411621094, 97.8128433227539, 101.58859252929688, 105.36434936523438, 109.14009857177734, 112.91585540771484, 116.69160461425781, 120.46736145019531, 124.24311065673828, 128.01885986328125, 131.79461669921875, 135.5703582763672, 139.3461151123047, 143.1218719482422, 146.8976287841797, 150.67337036132812, 154.44912719726562, 158.22488403320312]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 3.0, 7.0, 7.0, 7.0, 11.0, 13.0, 12.0, 8.0, 17.0, 30.0, 28.0, 22.0, 39.0, 46.0, 49.0, 48.0, 62.0, 51.0, 58.0, 48.0, 72.0, 53.0, 43.0, 38.0, 48.0, 39.0, 23.0, 16.0, 28.0, 17.0, 6.0, 7.0, 4.0, 13.0, 5.0, 5.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.52190399169922, -38.87868118286133, -37.23545837402344, -35.59223556518555, -33.949012756347656, -32.305789947509766, -30.662567138671875, -29.019344329833984, -27.376121520996094, -25.732898712158203, -24.089675903320312, -22.446453094482422, -20.80323028564453, -19.16000747680664, -17.51678466796875, -15.873560905456543, -14.230337142944336, -12.587114334106445, -10.943891525268555, -9.300668716430664, -7.657445430755615, -6.014222145080566, -4.370999336242676, -2.727776527404785, -1.0845537185668945, 0.5586692094802856, 2.201892137527466, 3.8451151847839355, 5.488337993621826, 7.131561279296875, 8.774784088134766, 10.418006896972656, 12.061229705810547, 13.704452514648438, 15.347675323486328, 16.99089813232422, 18.63412094116211, 20.27734375, 21.92056655883789, 23.56378936767578, 25.207012176513672, 26.850234985351562, 28.493457794189453, 30.136680603027344, 31.779903411865234, 33.423126220703125, 35.066349029541016, 36.709571838378906, 38.35279846191406, 39.99602127075195, 41.639244079589844, 43.282466888427734, 44.925689697265625, 46.568912506103516, 48.212135314941406, 49.8553581237793, 51.49858093261719, 53.14180374145508, 54.78502655029297, 56.42824935913086, 58.07147216796875, 59.71469497680664, 61.35791778564453, 63.00114059448242, 64.64436340332031]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 4.0, 6.0, 10.0, 14.0, 18.0, 20.0, 31.0, 46.0, 75.0, 108.0, 142.0, 199.0, 329.0, 458.0, 800.0, 1232.0, 2023.0, 3800.0, 6735.0, 13480.0, 29224.0, 81754.0, 488442.0, 3310888.0, 166854.0, 46612.0, 19180.0, 9536.0, 4914.0, 2913.0, 1668.0, 957.0, 652.0, 382.0, 263.0, 153.0, 111.0, 84.0, 52.0, 35.0, 26.0, 12.0, 17.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.21826171875, -32.1552734375, -31.09228515625, -30.029296875, -28.96630859375, -27.9033203125, -26.84033203125, -25.77734375, -24.71435546875, -23.6513671875, -22.58837890625, -21.525390625, -20.46240234375, -19.3994140625, -18.33642578125, -17.2734375, -16.21044921875, -15.1474609375, -14.08447265625, -13.021484375, -11.95849609375, -10.8955078125, -9.83251953125, -8.76953125, -7.70654296875, -6.6435546875, -5.58056640625, -4.517578125, -3.45458984375, -2.3916015625, -1.32861328125, -0.265625, 0.79736328125, 1.8603515625, 2.92333984375, 3.986328125, 5.04931640625, 6.1123046875, 7.17529296875, 8.23828125, 9.30126953125, 10.3642578125, 11.42724609375, 12.490234375, 13.55322265625, 14.6162109375, 15.67919921875, 16.7421875, 17.80517578125, 18.8681640625, 19.93115234375, 20.994140625, 22.05712890625, 23.1201171875, 24.18310546875, 25.24609375, 26.30908203125, 27.3720703125, 28.43505859375, 29.498046875, 30.56103515625, 31.6240234375, 32.68701171875, 33.75]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 13.0, 19.0, 14.0, 28.0, 30.0, 29.0, 38.0, 47.0, 47.0, 45.0, 44.0, 54.0, 68.0, 62.0, 54.0, 52.0, 49.0, 53.0, 38.0, 33.0, 27.0, 19.0, 26.0, 20.0, 20.0, 10.0, 16.0, 6.0, 3.0, 8.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8251953125, -1.77301025390625, -1.7208251953125, -1.66864013671875, -1.616455078125, -1.56427001953125, -1.5120849609375, -1.45989990234375, -1.40771484375, -1.35552978515625, -1.3033447265625, -1.25115966796875, -1.198974609375, -1.14678955078125, -1.0946044921875, -1.04241943359375, -0.990234375, -0.93804931640625, -0.8858642578125, -0.83367919921875, -0.781494140625, -0.72930908203125, -0.6771240234375, -0.62493896484375, -0.57275390625, -0.52056884765625, -0.4683837890625, -0.41619873046875, -0.364013671875, -0.31182861328125, -0.2596435546875, -0.20745849609375, -0.1552734375, -0.10308837890625, -0.0509033203125, 0.00128173828125, 0.053466796875, 0.10565185546875, 0.1578369140625, 0.21002197265625, 0.26220703125, 0.31439208984375, 0.3665771484375, 0.41876220703125, 0.470947265625, 0.52313232421875, 0.5753173828125, 0.62750244140625, 0.6796875, 0.73187255859375, 0.7840576171875, 0.83624267578125, 0.888427734375, 0.94061279296875, 0.9927978515625, 1.04498291015625, 1.09716796875, 1.14935302734375, 1.2015380859375, 1.25372314453125, 1.305908203125, 1.35809326171875, 1.4102783203125, 1.46246337890625, 1.5146484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 5.0, 12.0, 22.0, 34.0, 44.0, 63.0, 139.0, 197.0, 445.0, 1306.0, 7954.0, 182478.0, 3928227.0, 67171.0, 4383.0, 892.0, 369.0, 205.0, 111.0, 84.0, 44.0, 33.0, 19.0, 11.0, 11.0, 10.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.875, -111.212890625, -107.55078125, -103.888671875, -100.2265625, -96.564453125, -92.90234375, -89.240234375, -85.578125, -81.916015625, -78.25390625, -74.591796875, -70.9296875, -67.267578125, -63.60546875, -59.943359375, -56.28125, -52.619140625, -48.95703125, -45.294921875, -41.6328125, -37.970703125, -34.30859375, -30.646484375, -26.984375, -23.322265625, -19.66015625, -15.998046875, -12.3359375, -8.673828125, -5.01171875, -1.349609375, 2.3125, 5.974609375, 9.63671875, 13.298828125, 16.9609375, 20.623046875, 24.28515625, 27.947265625, 31.609375, 35.271484375, 38.93359375, 42.595703125, 46.2578125, 49.919921875, 53.58203125, 57.244140625, 60.90625, 64.568359375, 68.23046875, 71.892578125, 75.5546875, 79.216796875, 82.87890625, 86.541015625, 90.203125, 93.865234375, 97.52734375, 101.189453125, 104.8515625, 108.513671875, 112.17578125, 115.837890625, 119.5]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 7.0, 11.0, 14.0, 27.0, 37.0, 43.0, 66.0, 102.0, 150.0, 266.0, 588.0, 1662.0, 514.0, 205.0, 120.0, 81.0, 51.0, 41.0, 31.0, 18.0, 10.0, 5.0, 8.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.94140625, -6.7203369140625, -6.499267578125, -6.2781982421875, -6.05712890625, -5.8360595703125, -5.614990234375, -5.3939208984375, -5.1728515625, -4.9517822265625, -4.730712890625, -4.5096435546875, -4.28857421875, -4.0675048828125, -3.846435546875, -3.6253662109375, -3.404296875, -3.1832275390625, -2.962158203125, -2.7410888671875, -2.52001953125, -2.2989501953125, -2.077880859375, -1.8568115234375, -1.6357421875, -1.4146728515625, -1.193603515625, -0.9725341796875, -0.75146484375, -0.5303955078125, -0.309326171875, -0.0882568359375, 0.1328125, 0.3538818359375, 0.574951171875, 0.7960205078125, 1.01708984375, 1.2381591796875, 1.459228515625, 1.6802978515625, 1.9013671875, 2.1224365234375, 2.343505859375, 2.5645751953125, 2.78564453125, 3.0067138671875, 3.227783203125, 3.4488525390625, 3.669921875, 3.8909912109375, 4.112060546875, 4.3331298828125, 4.55419921875, 4.7752685546875, 4.996337890625, 5.2174072265625, 5.4384765625, 5.6595458984375, 5.880615234375, 6.1016845703125, 6.32275390625, 6.5438232421875, 6.764892578125, 6.9859619140625, 7.20703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 12.0, 8.0, 19.0, 43.0, 90.0, 188.0, 234.0, 200.0, 124.0, 46.0, 22.0, 9.0, 7.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.22520446777344, -51.134368896484375, -48.04352951049805, -44.952693939208984, -41.861854553222656, -38.771018981933594, -35.68018341064453, -32.5893440246582, -29.498506546020508, -26.407669067382812, -23.316831588745117, -20.225994110107422, -17.13515853881836, -14.044320106506348, -10.953483581542969, -7.862646102905273, -4.771808624267578, -1.680971384048462, 1.4098658561706543, 4.500702857971191, 7.591540336608887, 10.682377815246582, 13.773214340209961, 16.864051818847656, 19.95488929748535, 23.045726776123047, 26.136564254760742, 29.227401733398438, 32.3182373046875, 35.40907669067383, 38.49991226196289, 41.59075164794922, 44.68158721923828, 47.772422790527344, 50.86326217651367, 53.954097747802734, 57.04493713378906, 60.135772705078125, 63.22660827636719, 66.31744384765625, 69.40828704833984, 72.4991226196289, 75.58995819091797, 78.68080139160156, 81.77163696289062, 84.86247253417969, 87.95330810546875, 91.04414367675781, 94.13497924804688, 97.22581481933594, 100.316650390625, 103.4074935913086, 106.49832916259766, 109.58916473388672, 112.68000030517578, 115.77084350585938, 118.86167907714844, 121.9525146484375, 125.04335021972656, 128.13418579101562, 131.2250213623047, 134.3158721923828, 137.40670776367188, 140.49754333496094, 143.58837890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 12.0, 9.0, 10.0, 17.0, 4.0, 17.0, 23.0, 22.0, 30.0, 24.0, 14.0, 26.0, 38.0, 35.0, 41.0, 44.0, 39.0, 31.0, 41.0, 47.0, 46.0, 43.0, 36.0, 50.0, 25.0, 28.0, 39.0, 27.0, 24.0, 21.0, 24.0, 11.0, 13.0, 12.0, 10.0, 14.0, 3.0, 7.0, 10.0, 6.0, 3.0, 3.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-23.066146850585938, -22.335039138793945, -21.603933334350586, -20.872825622558594, -20.1417179107666, -19.41061019897461, -18.67950439453125, -17.948396682739258, -17.217288970947266, -16.486181259155273, -15.755074501037598, -15.023967742919922, -14.29286003112793, -13.561753273010254, -12.830646514892578, -12.099538803100586, -11.36843204498291, -10.637325286865234, -9.906217575073242, -9.175110816955566, -8.444003105163574, -7.712896347045898, -6.9817891120910645, -6.2506818771362305, -5.5195746421813965, -4.7884674072265625, -4.0573601722717285, -3.3262531757354736, -2.5951459407806396, -1.8640387058258057, -1.1329317092895508, -0.4018244743347168, 0.3292827606201172, 1.0603899955749512, 1.7914971113204956, 2.52260422706604, 3.253711462020874, 3.984818696975708, 4.715925693511963, 5.447032928466797, 6.178140163421631, 6.909247398376465, 7.640354633331299, 8.371461868286133, 9.102568626403809, 9.8336763381958, 10.564783096313477, 11.295890808105469, 12.026997566223145, 12.75810432434082, 13.489212036132812, 14.220318794250488, 14.95142650604248, 15.682533264160156, 16.41364097595215, 17.14474868774414, 17.8758544921875, 18.606962203979492, 19.33806800842285, 20.069175720214844, 20.800283432006836, 21.531391143798828, 22.262496948242188, 22.99360466003418, 23.724712371826172]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 12.0, 17.0, 20.0, 37.0, 67.0, 104.0, 142.0, 224.0, 350.0, 594.0, 1084.0, 1725.0, 2996.0, 5154.0, 8856.0, 15782.0, 28929.0, 53930.0, 96805.0, 162865.0, 218943.0, 187057.0, 117063.0, 65204.0, 35829.0, 19462.0, 10729.0, 5910.0, 3506.0, 2036.0, 1219.0, 742.0, 445.0, 262.0, 171.0, 110.0, 74.0, 43.0, 21.0, 10.0, 11.0, 5.0, 4.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.6484375, -15.197021484375, -14.74560546875, -14.294189453125, -13.8427734375, -13.391357421875, -12.93994140625, -12.488525390625, -12.037109375, -11.585693359375, -11.13427734375, -10.682861328125, -10.2314453125, -9.780029296875, -9.32861328125, -8.877197265625, -8.42578125, -7.974365234375, -7.52294921875, -7.071533203125, -6.6201171875, -6.168701171875, -5.71728515625, -5.265869140625, -4.814453125, -4.363037109375, -3.91162109375, -3.460205078125, -3.0087890625, -2.557373046875, -2.10595703125, -1.654541015625, -1.203125, -0.751708984375, -0.30029296875, 0.151123046875, 0.6025390625, 1.053955078125, 1.50537109375, 1.956787109375, 2.408203125, 2.859619140625, 3.31103515625, 3.762451171875, 4.2138671875, 4.665283203125, 5.11669921875, 5.568115234375, 6.01953125, 6.470947265625, 6.92236328125, 7.373779296875, 7.8251953125, 8.276611328125, 8.72802734375, 9.179443359375, 9.630859375, 10.082275390625, 10.53369140625, 10.985107421875, 11.4365234375, 11.887939453125, 12.33935546875, 12.790771484375, 13.2421875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 7.0, 2.0, 1.0, 7.0, 7.0, 3.0, 10.0, 14.0, 9.0, 18.0, 18.0, 14.0, 24.0, 15.0, 29.0, 32.0, 30.0, 49.0, 54.0, 34.0, 41.0, 43.0, 44.0, 47.0, 42.0, 45.0, 43.0, 29.0, 35.0, 32.0, 38.0, 25.0, 20.0, 15.0, 17.0, 17.0, 17.0, 10.0, 19.0, 6.0, 15.0, 2.0, 4.0, 12.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5400390625, -1.492034912109375, -1.44403076171875, -1.396026611328125, -1.3480224609375, -1.300018310546875, -1.25201416015625, -1.204010009765625, -1.156005859375, -1.108001708984375, -1.05999755859375, -1.011993408203125, -0.9639892578125, -0.915985107421875, -0.86798095703125, -0.819976806640625, -0.77197265625, -0.723968505859375, -0.67596435546875, -0.627960205078125, -0.5799560546875, -0.531951904296875, -0.48394775390625, -0.435943603515625, -0.387939453125, -0.339935302734375, -0.29193115234375, -0.243927001953125, -0.1959228515625, -0.147918701171875, -0.09991455078125, -0.051910400390625, -0.00390625, 0.044097900390625, 0.09210205078125, 0.140106201171875, 0.1881103515625, 0.236114501953125, 0.28411865234375, 0.332122802734375, 0.380126953125, 0.428131103515625, 0.47613525390625, 0.524139404296875, 0.5721435546875, 0.620147705078125, 0.66815185546875, 0.716156005859375, 0.76416015625, 0.812164306640625, 0.86016845703125, 0.908172607421875, 0.9561767578125, 1.004180908203125, 1.05218505859375, 1.100189208984375, 1.148193359375, 1.196197509765625, 1.24420166015625, 1.292205810546875, 1.3402099609375, 1.388214111328125, 1.43621826171875, 1.484222412109375, 1.5322265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 13.0, 9.0, 25.0, 26.0, 31.0, 52.0, 78.0, 108.0, 190.0, 325.0, 514.0, 807.0, 1641.0, 3499.0, 8495.0, 24167.0, 75261.0, 232823.0, 403234.0, 199656.0, 63270.0, 20281.0, 7342.0, 3080.0, 1541.0, 810.0, 479.0, 313.0, 173.0, 107.0, 70.0, 45.0, 35.0, 17.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.6875, -30.710205078125, -29.73291015625, -28.755615234375, -27.7783203125, -26.801025390625, -25.82373046875, -24.846435546875, -23.869140625, -22.891845703125, -21.91455078125, -20.937255859375, -19.9599609375, -18.982666015625, -18.00537109375, -17.028076171875, -16.05078125, -15.073486328125, -14.09619140625, -13.118896484375, -12.1416015625, -11.164306640625, -10.18701171875, -9.209716796875, -8.232421875, -7.255126953125, -6.27783203125, -5.300537109375, -4.3232421875, -3.345947265625, -2.36865234375, -1.391357421875, -0.4140625, 0.563232421875, 1.54052734375, 2.517822265625, 3.4951171875, 4.472412109375, 5.44970703125, 6.427001953125, 7.404296875, 8.381591796875, 9.35888671875, 10.336181640625, 11.3134765625, 12.290771484375, 13.26806640625, 14.245361328125, 15.22265625, 16.199951171875, 17.17724609375, 18.154541015625, 19.1318359375, 20.109130859375, 21.08642578125, 22.063720703125, 23.041015625, 24.018310546875, 24.99560546875, 25.972900390625, 26.9501953125, 27.927490234375, 28.90478515625, 29.882080078125, 30.859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 11.0, 18.0, 20.0, 27.0, 38.0, 49.0, 46.0, 59.0, 70.0, 82.0, 65.0, 85.0, 64.0, 68.0, 55.0, 55.0, 40.0, 40.0, 27.0, 22.0, 18.0, 14.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.8125, -18.18701171875, -17.5615234375, -16.93603515625, -16.310546875, -15.68505859375, -15.0595703125, -14.43408203125, -13.80859375, -13.18310546875, -12.5576171875, -11.93212890625, -11.306640625, -10.68115234375, -10.0556640625, -9.43017578125, -8.8046875, -8.17919921875, -7.5537109375, -6.92822265625, -6.302734375, -5.67724609375, -5.0517578125, -4.42626953125, -3.80078125, -3.17529296875, -2.5498046875, -1.92431640625, -1.298828125, -0.67333984375, -0.0478515625, 0.57763671875, 1.203125, 1.82861328125, 2.4541015625, 3.07958984375, 3.705078125, 4.33056640625, 4.9560546875, 5.58154296875, 6.20703125, 6.83251953125, 7.4580078125, 8.08349609375, 8.708984375, 9.33447265625, 9.9599609375, 10.58544921875, 11.2109375, 11.83642578125, 12.4619140625, 13.08740234375, 13.712890625, 14.33837890625, 14.9638671875, 15.58935546875, 16.21484375, 16.84033203125, 17.4658203125, 18.09130859375, 18.716796875, 19.34228515625, 19.9677734375, 20.59326171875, 21.21875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 14.0, 12.0, 20.0, 16.0, 38.0, 33.0, 83.0, 124.0, 187.0, 278.0, 491.0, 859.0, 1856.0, 3937.0, 9444.0, 25298.0, 74021.0, 218931.0, 379034.0, 217448.0, 74145.0, 25079.0, 9184.0, 3871.0, 1800.0, 949.0, 524.0, 290.0, 205.0, 119.0, 71.0, 59.0, 42.0, 35.0, 11.0, 12.0, 5.0, 6.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.65625, -16.12744140625, -15.5986328125, -15.06982421875, -14.541015625, -14.01220703125, -13.4833984375, -12.95458984375, -12.42578125, -11.89697265625, -11.3681640625, -10.83935546875, -10.310546875, -9.78173828125, -9.2529296875, -8.72412109375, -8.1953125, -7.66650390625, -7.1376953125, -6.60888671875, -6.080078125, -5.55126953125, -5.0224609375, -4.49365234375, -3.96484375, -3.43603515625, -2.9072265625, -2.37841796875, -1.849609375, -1.32080078125, -0.7919921875, -0.26318359375, 0.265625, 0.79443359375, 1.3232421875, 1.85205078125, 2.380859375, 2.90966796875, 3.4384765625, 3.96728515625, 4.49609375, 5.02490234375, 5.5537109375, 6.08251953125, 6.611328125, 7.14013671875, 7.6689453125, 8.19775390625, 8.7265625, 9.25537109375, 9.7841796875, 10.31298828125, 10.841796875, 11.37060546875, 11.8994140625, 12.42822265625, 12.95703125, 13.48583984375, 14.0146484375, 14.54345703125, 15.072265625, 15.60107421875, 16.1298828125, 16.65869140625, 17.1875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 8.0, 10.0, 34.0, 40.0, 39.0, 72.0, 102.0, 152.0, 120.0, 122.0, 84.0, 64.0, 43.0, 35.0, 14.0, 21.0, 11.0, 8.0, 7.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004604339599609375, -0.004487335681915283, -0.004370331764221191, -0.0042533278465271, -0.004136323928833008, -0.004019320011138916, -0.0039023160934448242, -0.0037853121757507324, -0.0036683082580566406, -0.003551304340362549, -0.003434300422668457, -0.0033172965049743652, -0.0032002925872802734, -0.0030832886695861816, -0.00296628475189209, -0.002849280834197998, -0.0027322769165039062, -0.0026152729988098145, -0.0024982690811157227, -0.002381265163421631, -0.002264261245727539, -0.0021472573280334473, -0.0020302534103393555, -0.0019132494926452637, -0.0017962455749511719, -0.00167924165725708, -0.0015622377395629883, -0.0014452338218688965, -0.0013282299041748047, -0.0012112259864807129, -0.001094222068786621, -0.0009772181510925293, -0.0008602142333984375, -0.0007432103157043457, -0.0006262063980102539, -0.0005092024803161621, -0.0003921985626220703, -0.0002751946449279785, -0.00015819072723388672, -4.118680953979492e-05, 7.581710815429688e-05, 0.00019282102584838867, 0.00030982494354248047, 0.00042682886123657227, 0.0005438327789306641, 0.0006608366966247559, 0.0007778406143188477, 0.0008948445320129395, 0.0010118484497070312, 0.001128852367401123, 0.0012458562850952148, 0.0013628602027893066, 0.0014798641204833984, 0.0015968680381774902, 0.001713871955871582, 0.0018308758735656738, 0.0019478797912597656, 0.0020648837089538574, 0.0021818876266479492, 0.002298891544342041, 0.002415895462036133, 0.0025328993797302246, 0.0026499032974243164, 0.002766907215118408, 0.0028839111328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 9.0, 9.0, 13.0, 18.0, 34.0, 23.0, 49.0, 72.0, 86.0, 123.0, 176.0, 247.0, 344.0, 531.0, 767.0, 1283.0, 2135.0, 3608.0, 6810.0, 13818.0, 28667.0, 63754.0, 139317.0, 249084.0, 257339.0, 149538.0, 68744.0, 30492.0, 14445.0, 7050.0, 3876.0, 2145.0, 1290.0, 828.0, 579.0, 383.0, 260.0, 194.0, 104.0, 87.0, 74.0, 36.0, 34.0, 19.0, 13.0, 17.0, 11.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.0234375, -9.6898193359375, -9.356201171875, -9.0225830078125, -8.68896484375, -8.3553466796875, -8.021728515625, -7.6881103515625, -7.3544921875, -7.0208740234375, -6.687255859375, -6.3536376953125, -6.02001953125, -5.6864013671875, -5.352783203125, -5.0191650390625, -4.685546875, -4.3519287109375, -4.018310546875, -3.6846923828125, -3.35107421875, -3.0174560546875, -2.683837890625, -2.3502197265625, -2.0166015625, -1.6829833984375, -1.349365234375, -1.0157470703125, -0.68212890625, -0.3485107421875, -0.014892578125, 0.3187255859375, 0.65234375, 0.9859619140625, 1.319580078125, 1.6531982421875, 1.98681640625, 2.3204345703125, 2.654052734375, 2.9876708984375, 3.3212890625, 3.6549072265625, 3.988525390625, 4.3221435546875, 4.65576171875, 4.9893798828125, 5.322998046875, 5.6566162109375, 5.990234375, 6.3238525390625, 6.657470703125, 6.9910888671875, 7.32470703125, 7.6583251953125, 7.991943359375, 8.3255615234375, 8.6591796875, 8.9927978515625, 9.326416015625, 9.6600341796875, 9.99365234375, 10.3272705078125, 10.660888671875, 10.9945068359375, 11.328125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 4.0, 7.0, 13.0, 5.0, 14.0, 18.0, 21.0, 14.0, 24.0, 18.0, 18.0, 28.0, 46.0, 30.0, 41.0, 50.0, 45.0, 41.0, 51.0, 65.0, 38.0, 56.0, 47.0, 39.0, 45.0, 31.0, 31.0, 16.0, 21.0, 23.0, 17.0, 13.0, 8.0, 15.0, 2.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.8521728515625, -4.669189453125, -4.4862060546875, -4.30322265625, -4.1202392578125, -3.937255859375, -3.7542724609375, -3.5712890625, -3.3883056640625, -3.205322265625, -3.0223388671875, -2.83935546875, -2.6563720703125, -2.473388671875, -2.2904052734375, -2.107421875, -1.9244384765625, -1.741455078125, -1.5584716796875, -1.37548828125, -1.1925048828125, -1.009521484375, -0.8265380859375, -0.6435546875, -0.4605712890625, -0.277587890625, -0.0946044921875, 0.08837890625, 0.2713623046875, 0.454345703125, 0.6373291015625, 0.8203125, 1.0032958984375, 1.186279296875, 1.3692626953125, 1.55224609375, 1.7352294921875, 1.918212890625, 2.1011962890625, 2.2841796875, 2.4671630859375, 2.650146484375, 2.8331298828125, 3.01611328125, 3.1990966796875, 3.382080078125, 3.5650634765625, 3.748046875, 3.9310302734375, 4.114013671875, 4.2969970703125, 4.47998046875, 4.6629638671875, 4.845947265625, 5.0289306640625, 5.2119140625, 5.3948974609375, 5.577880859375, 5.7608642578125, 5.94384765625, 6.1268310546875, 6.309814453125, 6.4927978515625, 6.67578125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 11.0, 27.0, 69.0, 144.0, 272.0, 259.0, 138.0, 54.0, 18.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-427.16729736328125, -414.5718994140625, -401.97650146484375, -389.381103515625, -376.7857360839844, -364.1903381347656, -351.5949401855469, -338.9995422363281, -326.4041748046875, -313.80877685546875, -301.21337890625, -288.61798095703125, -276.0226135253906, -263.4272155761719, -250.83181762695312, -238.23641967773438, -225.64102172851562, -213.04562377929688, -200.4502410888672, -187.85484313964844, -175.25946044921875, -162.6640625, -150.06866455078125, -137.4732666015625, -124.87788391113281, -112.2824935913086, -99.68710327148438, -87.09170532226562, -74.4963150024414, -61.90092468261719, -49.30552673339844, -36.71013641357422, -24.11474609375, -11.519353866577148, 1.0760383605957031, 13.671432495117188, 26.266822814941406, 38.862213134765625, 51.457611083984375, 64.0530014038086, 76.64839172363281, 89.24378204345703, 101.83917236328125, 114.4345703125, 127.02996063232422, 139.62535095214844, 152.2207489013672, 164.81613159179688, 177.41152954101562, 190.00692749023438, 202.60231018066406, 215.1977081298828, 227.7930908203125, 240.38848876953125, 252.98388671875, 265.57928466796875, 278.1746826171875, 290.77008056640625, 303.365478515625, 315.96087646484375, 328.5562438964844, 341.1516418457031, 353.7470397949219, 366.3424377441406, 378.93780517578125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 13.0, 13.0, 16.0, 25.0, 21.0, 44.0, 45.0, 49.0, 54.0, 64.0, 58.0, 65.0, 64.0, 69.0, 66.0, 47.0, 51.0, 41.0, 44.0, 26.0, 32.0, 22.0, 20.0, 16.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.555908203125, -130.48863220214844, -126.42134857177734, -122.35407257080078, -118.28678894042969, -114.21951293945312, -110.15223693847656, -106.0849609375, -102.0176773071289, -97.95040130615234, -93.88311767578125, -89.81584167480469, -85.74856567382812, -81.68128204345703, -77.61400604248047, -73.54672241210938, -69.47944641113281, -65.41217041015625, -61.344886779785156, -57.277610778808594, -53.210330963134766, -49.14305114746094, -45.075775146484375, -41.00849533081055, -36.94121551513672, -32.87393569946289, -28.806657791137695, -24.7393798828125, -20.672100067138672, -16.604820251464844, -12.537542343139648, -8.470264434814453, -4.4029998779296875, -0.3357210159301758, 3.731557846069336, 7.798836708068848, 11.86611557006836, 15.933395385742188, 20.000673294067383, 24.067951202392578, 28.135231018066406, 32.202510833740234, 36.26979064941406, 40.337066650390625, 44.40434646606445, 48.47162628173828, 52.538902282714844, 56.60618209838867, 60.6734619140625, 64.74073791503906, 68.80802154541016, 72.87529754638672, 76.94258117675781, 81.00985717773438, 85.07713317871094, 89.1444091796875, 93.2116928100586, 97.27896881103516, 101.34625244140625, 105.41352844238281, 109.48080444335938, 113.54808807373047, 117.61536407470703, 121.68264770507812, 125.74992370605469]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 12.0, 10.0, 12.0, 32.0, 47.0, 99.0, 180.0, 481.0, 1439.0, 6955.0, 76253.0, 3970709.0, 127289.0, 8815.0, 1250.0, 348.0, 139.0, 62.0, 51.0, 36.0, 25.0, 13.0, 13.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.5, -131.72265625, -126.9453125, -122.16796875, -117.390625, -112.61328125, -107.8359375, -103.05859375, -98.28125, -93.50390625, -88.7265625, -83.94921875, -79.171875, -74.39453125, -69.6171875, -64.83984375, -60.0625, -55.28515625, -50.5078125, -45.73046875, -40.953125, -36.17578125, -31.3984375, -26.62109375, -21.84375, -17.06640625, -12.2890625, -7.51171875, -2.734375, 2.04296875, 6.8203125, 11.59765625, 16.375, 21.15234375, 25.9296875, 30.70703125, 35.484375, 40.26171875, 45.0390625, 49.81640625, 54.59375, 59.37109375, 64.1484375, 68.92578125, 73.703125, 78.48046875, 83.2578125, 88.03515625, 92.8125, 97.58984375, 102.3671875, 107.14453125, 111.921875, 116.69921875, 121.4765625, 126.25390625, 131.03125, 135.80859375, 140.5859375, 145.36328125, 150.140625, 154.91796875, 159.6953125, 164.47265625, 169.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 9.0, 10.0, 12.0, 25.0, 37.0, 40.0, 44.0, 68.0, 77.0, 87.0, 96.0, 85.0, 82.0, 63.0, 62.0, 48.0, 40.0, 33.0, 30.0, 18.0, 14.0, 8.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.67657470703125, -3.5445556640625, -3.41253662109375, -3.280517578125, -3.14849853515625, -3.0164794921875, -2.88446044921875, -2.75244140625, -2.62042236328125, -2.4884033203125, -2.35638427734375, -2.224365234375, -2.09234619140625, -1.9603271484375, -1.82830810546875, -1.6962890625, -1.56427001953125, -1.4322509765625, -1.30023193359375, -1.168212890625, -1.03619384765625, -0.9041748046875, -0.77215576171875, -0.64013671875, -0.50811767578125, -0.3760986328125, -0.24407958984375, -0.112060546875, 0.01995849609375, 0.1519775390625, 0.28399658203125, 0.416015625, 0.54803466796875, 0.6800537109375, 0.81207275390625, 0.944091796875, 1.07611083984375, 1.2081298828125, 1.34014892578125, 1.47216796875, 1.60418701171875, 1.7362060546875, 1.86822509765625, 2.000244140625, 2.13226318359375, 2.2642822265625, 2.39630126953125, 2.5283203125, 2.66033935546875, 2.7923583984375, 2.92437744140625, 3.056396484375, 3.18841552734375, 3.3204345703125, 3.45245361328125, 3.58447265625, 3.71649169921875, 3.8485107421875, 3.98052978515625, 4.112548828125, 4.24456787109375, 4.3765869140625, 4.50860595703125, 4.640625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 13.0, 9.0, 11.0, 12.0, 16.0, 23.0, 20.0, 25.0, 28.0, 36.0, 49.0, 136.0, 552.0, 4381.0, 67460.0, 3744152.0, 361376.0, 14098.0, 1282.0, 222.0, 66.0, 38.0, 55.0, 31.0, 32.0, 29.0, 27.0, 26.0, 15.0, 18.0, 11.0, 7.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-156.75, -152.103515625, -147.45703125, -142.810546875, -138.1640625, -133.517578125, -128.87109375, -124.224609375, -119.578125, -114.931640625, -110.28515625, -105.638671875, -100.9921875, -96.345703125, -91.69921875, -87.052734375, -82.40625, -77.759765625, -73.11328125, -68.466796875, -63.8203125, -59.173828125, -54.52734375, -49.880859375, -45.234375, -40.587890625, -35.94140625, -31.294921875, -26.6484375, -22.001953125, -17.35546875, -12.708984375, -8.0625, -3.416015625, 1.23046875, 5.876953125, 10.5234375, 15.169921875, 19.81640625, 24.462890625, 29.109375, 33.755859375, 38.40234375, 43.048828125, 47.6953125, 52.341796875, 56.98828125, 61.634765625, 66.28125, 70.927734375, 75.57421875, 80.220703125, 84.8671875, 89.513671875, 94.16015625, 98.806640625, 103.453125, 108.099609375, 112.74609375, 117.392578125, 122.0390625, 126.685546875, 131.33203125, 135.978515625, 140.625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 12.0, 23.0, 56.0, 64.0, 132.0, 212.0, 574.0, 2013.0, 523.0, 209.0, 110.0, 43.0, 44.0, 31.0, 12.0, 9.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.736083984375, -9.14404296875, -8.552001953125, -7.9599609375, -7.367919921875, -6.77587890625, -6.183837890625, -5.591796875, -4.999755859375, -4.40771484375, -3.815673828125, -3.2236328125, -2.631591796875, -2.03955078125, -1.447509765625, -0.85546875, -0.263427734375, 0.32861328125, 0.920654296875, 1.5126953125, 2.104736328125, 2.69677734375, 3.288818359375, 3.880859375, 4.472900390625, 5.06494140625, 5.656982421875, 6.2490234375, 6.841064453125, 7.43310546875, 8.025146484375, 8.6171875, 9.209228515625, 9.80126953125, 10.393310546875, 10.9853515625, 11.577392578125, 12.16943359375, 12.761474609375, 13.353515625, 13.945556640625, 14.53759765625, 15.129638671875, 15.7216796875, 16.313720703125, 16.90576171875, 17.497802734375, 18.08984375, 18.681884765625, 19.27392578125, 19.865966796875, 20.4580078125, 21.050048828125, 21.64208984375, 22.234130859375, 22.826171875, 23.418212890625, 24.01025390625, 24.602294921875, 25.1943359375, 25.786376953125, 26.37841796875, 26.970458984375, 27.5625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 13.0, 20.0, 29.0, 47.0, 100.0, 117.0, 142.0, 151.0, 113.0, 76.0, 59.0, 41.0, 29.0, 15.0, 15.0, 7.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.46695709228516, -120.31245422363281, -117.15795135498047, -114.00344848632812, -110.84893798828125, -107.6944351196289, -104.53993225097656, -101.38542938232422, -98.23092651367188, -95.07642364501953, -91.92192077636719, -88.76741790771484, -85.6129150390625, -82.45840454101562, -79.30390167236328, -76.14939880371094, -72.9948959350586, -69.84039306640625, -66.6858901977539, -63.5313835144043, -60.37688064575195, -57.22237777709961, -54.06787109375, -50.913368225097656, -47.75886535644531, -44.60436248779297, -41.449859619140625, -38.295352935791016, -35.14085006713867, -31.986347198486328, -28.83184242248535, -25.677337646484375, -22.5228271484375, -19.368324279785156, -16.21381950378418, -13.05931568145752, -9.90481185913086, -6.750308036804199, -3.595804214477539, -0.4412994384765625, 2.7132034301757812, 5.867707252502441, 9.022211074829102, 12.176714897155762, 15.331218719482422, 18.485721588134766, 21.640226364135742, 24.79473114013672, 27.949234008789062, 31.103736877441406, 34.25823974609375, 37.41274642944336, 40.5672492980957, 43.72175216674805, 46.876258850097656, 50.03076171875, 53.185264587402344, 56.33976745605469, 59.49427032470703, 62.64877700805664, 65.80328369140625, 68.9577865600586, 72.11228942871094, 75.26679229736328, 78.42129516601562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 9.0, 5.0, 8.0, 9.0, 9.0, 5.0, 10.0, 15.0, 16.0, 19.0, 28.0, 19.0, 23.0, 34.0, 37.0, 44.0, 42.0, 45.0, 42.0, 47.0, 55.0, 28.0, 53.0, 51.0, 48.0, 39.0, 28.0, 39.0, 30.0, 33.0, 28.0, 20.0, 22.0, 16.0, 12.0, 9.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.714412689208984, -34.186805725097656, -32.659202575683594, -31.131595611572266, -29.603988647460938, -28.07638168334961, -26.548776626586914, -25.02117156982422, -23.49356460571289, -21.965957641601562, -20.438352584838867, -18.910747528076172, -17.383140563964844, -15.855534553527832, -14.32792854309082, -12.800322532653809, -11.272716522216797, -9.745110511779785, -8.217504501342773, -6.689898490905762, -5.16229248046875, -3.6346864700317383, -2.1070804595947266, -0.5794744491577148, 0.9481315612792969, 2.4757375717163086, 4.00334358215332, 5.530949592590332, 7.058555603027344, 8.586161613464355, 10.113767623901367, 11.641373634338379, 13.168983459472656, 14.696589469909668, 16.22419548034668, 17.751800537109375, 19.279407501220703, 20.80701446533203, 22.334619522094727, 23.862224578857422, 25.38983154296875, 26.917438507080078, 28.445043563842773, 29.97264862060547, 31.500255584716797, 33.027862548828125, 34.55546569824219, 36.083072662353516, 37.610679626464844, 39.13828659057617, 40.6658935546875, 42.19349670410156, 43.72110366821289, 45.24871063232422, 46.77631378173828, 48.30392074584961, 49.83152770996094, 51.359134674072266, 52.886741638183594, 54.414344787597656, 55.941951751708984, 57.46955871582031, 58.997161865234375, 60.5247688293457, 62.05237579345703]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 0.0, 7.0, 11.0, 14.0, 20.0, 21.0, 38.0, 54.0, 73.0, 133.0, 198.0, 350.0, 598.0, 1120.0, 2281.0, 6813.0, 26029.0, 115669.0, 412450.0, 358553.0, 92721.0, 21259.0, 5575.0, 2135.0, 976.0, 535.0, 354.0, 214.0, 129.0, 97.0, 40.0, 31.0, 17.0, 14.0, 9.0, 9.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.59375, -36.24755859375, -34.9013671875, -33.55517578125, -32.208984375, -30.86279296875, -29.5166015625, -28.17041015625, -26.82421875, -25.47802734375, -24.1318359375, -22.78564453125, -21.439453125, -20.09326171875, -18.7470703125, -17.40087890625, -16.0546875, -14.70849609375, -13.3623046875, -12.01611328125, -10.669921875, -9.32373046875, -7.9775390625, -6.63134765625, -5.28515625, -3.93896484375, -2.5927734375, -1.24658203125, 0.099609375, 1.44580078125, 2.7919921875, 4.13818359375, 5.484375, 6.83056640625, 8.1767578125, 9.52294921875, 10.869140625, 12.21533203125, 13.5615234375, 14.90771484375, 16.25390625, 17.60009765625, 18.9462890625, 20.29248046875, 21.638671875, 22.98486328125, 24.3310546875, 25.67724609375, 27.0234375, 28.36962890625, 29.7158203125, 31.06201171875, 32.408203125, 33.75439453125, 35.1005859375, 36.44677734375, 37.79296875, 39.13916015625, 40.4853515625, 41.83154296875, 43.177734375, 44.52392578125, 45.8701171875, 47.21630859375, 48.5625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 13.0, 14.0, 39.0, 51.0, 38.0, 61.0, 82.0, 95.0, 102.0, 99.0, 100.0, 85.0, 71.0, 49.0, 33.0, 20.0, 20.0, 7.0, 10.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66015625, -4.4727783203125, -4.285400390625, -4.0980224609375, -3.91064453125, -3.7232666015625, -3.535888671875, -3.3485107421875, -3.1611328125, -2.9737548828125, -2.786376953125, -2.5989990234375, -2.41162109375, -2.2242431640625, -2.036865234375, -1.8494873046875, -1.662109375, -1.4747314453125, -1.287353515625, -1.0999755859375, -0.91259765625, -0.7252197265625, -0.537841796875, -0.3504638671875, -0.1630859375, 0.0242919921875, 0.211669921875, 0.3990478515625, 0.58642578125, 0.7738037109375, 0.961181640625, 1.1485595703125, 1.3359375, 1.5233154296875, 1.710693359375, 1.8980712890625, 2.08544921875, 2.2728271484375, 2.460205078125, 2.6475830078125, 2.8349609375, 3.0223388671875, 3.209716796875, 3.3970947265625, 3.58447265625, 3.7718505859375, 3.959228515625, 4.1466064453125, 4.333984375, 4.5213623046875, 4.708740234375, 4.8961181640625, 5.08349609375, 5.2708740234375, 5.458251953125, 5.6456298828125, 5.8330078125, 6.0203857421875, 6.207763671875, 6.3951416015625, 6.58251953125, 6.7698974609375, 6.957275390625, 7.1446533203125, 7.33203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 0.0, 2.0, 9.0, 3.0, 12.0, 15.0, 22.0, 29.0, 44.0, 67.0, 98.0, 139.0, 209.0, 291.0, 502.0, 790.0, 1401.0, 2626.0, 5472.0, 14019.0, 39389.0, 117435.0, 314786.0, 343478.0, 134266.0, 44846.0, 15603.0, 6251.0, 2835.0, 1519.0, 850.0, 532.0, 324.0, 220.0, 145.0, 101.0, 79.0, 42.0, 33.0, 28.0, 18.0, 5.0, 4.0, 1.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-32.21875, -31.2138671875, -30.208984375, -29.2041015625, -28.19921875, -27.1943359375, -26.189453125, -25.1845703125, -24.1796875, -23.1748046875, -22.169921875, -21.1650390625, -20.16015625, -19.1552734375, -18.150390625, -17.1455078125, -16.140625, -15.1357421875, -14.130859375, -13.1259765625, -12.12109375, -11.1162109375, -10.111328125, -9.1064453125, -8.1015625, -7.0966796875, -6.091796875, -5.0869140625, -4.08203125, -3.0771484375, -2.072265625, -1.0673828125, -0.0625, 0.9423828125, 1.947265625, 2.9521484375, 3.95703125, 4.9619140625, 5.966796875, 6.9716796875, 7.9765625, 8.9814453125, 9.986328125, 10.9912109375, 11.99609375, 13.0009765625, 14.005859375, 15.0107421875, 16.015625, 17.0205078125, 18.025390625, 19.0302734375, 20.03515625, 21.0400390625, 22.044921875, 23.0498046875, 24.0546875, 25.0595703125, 26.064453125, 27.0693359375, 28.07421875, 29.0791015625, 30.083984375, 31.0888671875, 32.09375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 9.0, 13.0, 17.0, 12.0, 24.0, 23.0, 25.0, 31.0, 40.0, 30.0, 49.0, 46.0, 54.0, 53.0, 60.0, 51.0, 60.0, 57.0, 47.0, 50.0, 45.0, 36.0, 22.0, 32.0, 13.0, 25.0, 17.0, 14.0, 9.0, 6.0, 13.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-24.0625, -23.43017578125, -22.7978515625, -22.16552734375, -21.533203125, -20.90087890625, -20.2685546875, -19.63623046875, -19.00390625, -18.37158203125, -17.7392578125, -17.10693359375, -16.474609375, -15.84228515625, -15.2099609375, -14.57763671875, -13.9453125, -13.31298828125, -12.6806640625, -12.04833984375, -11.416015625, -10.78369140625, -10.1513671875, -9.51904296875, -8.88671875, -8.25439453125, -7.6220703125, -6.98974609375, -6.357421875, -5.72509765625, -5.0927734375, -4.46044921875, -3.828125, -3.19580078125, -2.5634765625, -1.93115234375, -1.298828125, -0.66650390625, -0.0341796875, 0.59814453125, 1.23046875, 1.86279296875, 2.4951171875, 3.12744140625, 3.759765625, 4.39208984375, 5.0244140625, 5.65673828125, 6.2890625, 6.92138671875, 7.5537109375, 8.18603515625, 8.818359375, 9.45068359375, 10.0830078125, 10.71533203125, 11.34765625, 11.97998046875, 12.6123046875, 13.24462890625, 13.876953125, 14.50927734375, 15.1416015625, 15.77392578125, 16.40625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 9.0, 18.0, 17.0, 44.0, 64.0, 72.0, 122.0, 207.0, 321.0, 640.0, 1251.0, 2720.0, 7366.0, 23512.0, 89251.0, 322218.0, 411540.0, 137128.0, 34826.0, 10267.0, 3602.0, 1506.0, 786.0, 399.0, 217.0, 132.0, 91.0, 56.0, 36.0, 35.0, 19.0, 17.0, 13.0, 13.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.424072265625, -15.87939453125, -15.334716796875, -14.7900390625, -14.245361328125, -13.70068359375, -13.156005859375, -12.611328125, -12.066650390625, -11.52197265625, -10.977294921875, -10.4326171875, -9.887939453125, -9.34326171875, -8.798583984375, -8.25390625, -7.709228515625, -7.16455078125, -6.619873046875, -6.0751953125, -5.530517578125, -4.98583984375, -4.441162109375, -3.896484375, -3.351806640625, -2.80712890625, -2.262451171875, -1.7177734375, -1.173095703125, -0.62841796875, -0.083740234375, 0.4609375, 1.005615234375, 1.55029296875, 2.094970703125, 2.6396484375, 3.184326171875, 3.72900390625, 4.273681640625, 4.818359375, 5.363037109375, 5.90771484375, 6.452392578125, 6.9970703125, 7.541748046875, 8.08642578125, 8.631103515625, 9.17578125, 9.720458984375, 10.26513671875, 10.809814453125, 11.3544921875, 11.899169921875, 12.44384765625, 12.988525390625, 13.533203125, 14.077880859375, 14.62255859375, 15.167236328125, 15.7119140625, 16.256591796875, 16.80126953125, 17.345947265625, 17.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 6.0, 7.0, 8.0, 4.0, 10.0, 16.0, 18.0, 14.0, 13.0, 35.0, 33.0, 40.0, 39.0, 52.0, 46.0, 67.0, 59.0, 86.0, 78.0, 82.0, 50.0, 41.0, 39.0, 31.0, 25.0, 17.0, 10.0, 15.0, 12.0, 7.0, 11.0, 4.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0020580291748046875, -0.001995474100112915, -0.0019329190254211426, -0.0018703639507293701, -0.0018078088760375977, -0.0017452538013458252, -0.0016826987266540527, -0.0016201436519622803, -0.0015575885772705078, -0.0014950335025787354, -0.0014324784278869629, -0.0013699233531951904, -0.001307368278503418, -0.0012448132038116455, -0.001182258129119873, -0.0011197030544281006, -0.0010571479797363281, -0.0009945929050445557, -0.0009320378303527832, -0.0008694827556610107, -0.0008069276809692383, -0.0007443726062774658, -0.0006818175315856934, -0.0006192624568939209, -0.0005567073822021484, -0.000494152307510376, -0.0004315972328186035, -0.00036904215812683105, -0.0003064870834350586, -0.00024393200874328613, -0.00018137693405151367, -0.00011882185935974121, -5.626678466796875e-05, 6.288290023803711e-06, 6.884336471557617e-05, 0.00013139843940734863, 0.0001939535140991211, 0.00025650858879089355, 0.000319063663482666, 0.0003816187381744385, 0.00044417381286621094, 0.0005067288875579834, 0.0005692839622497559, 0.0006318390369415283, 0.0006943941116333008, 0.0007569491863250732, 0.0008195042610168457, 0.0008820593357086182, 0.0009446144104003906, 0.001007169485092163, 0.0010697245597839355, 0.001132279634475708, 0.0011948347091674805, 0.001257389783859253, 0.0013199448585510254, 0.0013824999332427979, 0.0014450550079345703, 0.0015076100826263428, 0.0015701651573181152, 0.0016327202320098877, 0.0016952753067016602, 0.0017578303813934326, 0.001820385456085205, 0.0018829405307769775, 0.00194549560546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 10.0, 11.0, 20.0, 24.0, 41.0, 58.0, 85.0, 136.0, 208.0, 352.0, 687.0, 1147.0, 2331.0, 5052.0, 13489.0, 47413.0, 200489.0, 464920.0, 231066.0, 54722.0, 15231.0, 5555.0, 2452.0, 1274.0, 674.0, 427.0, 239.0, 137.0, 81.0, 52.0, 44.0, 27.0, 31.0, 6.0, 9.0, 13.0, 3.0, 3.0, 5.0, 1.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.515625, -15.956787109375, -15.39794921875, -14.839111328125, -14.2802734375, -13.721435546875, -13.16259765625, -12.603759765625, -12.044921875, -11.486083984375, -10.92724609375, -10.368408203125, -9.8095703125, -9.250732421875, -8.69189453125, -8.133056640625, -7.57421875, -7.015380859375, -6.45654296875, -5.897705078125, -5.3388671875, -4.780029296875, -4.22119140625, -3.662353515625, -3.103515625, -2.544677734375, -1.98583984375, -1.427001953125, -0.8681640625, -0.309326171875, 0.24951171875, 0.808349609375, 1.3671875, 1.926025390625, 2.48486328125, 3.043701171875, 3.6025390625, 4.161376953125, 4.72021484375, 5.279052734375, 5.837890625, 6.396728515625, 6.95556640625, 7.514404296875, 8.0732421875, 8.632080078125, 9.19091796875, 9.749755859375, 10.30859375, 10.867431640625, 11.42626953125, 11.985107421875, 12.5439453125, 13.102783203125, 13.66162109375, 14.220458984375, 14.779296875, 15.338134765625, 15.89697265625, 16.455810546875, 17.0146484375, 17.573486328125, 18.13232421875, 18.691162109375, 19.25]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 8.0, 9.0, 5.0, 9.0, 19.0, 14.0, 31.0, 48.0, 60.0, 59.0, 68.0, 59.0, 78.0, 92.0, 70.0, 71.0, 65.0, 55.0, 45.0, 35.0, 28.0, 14.0, 17.0, 12.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0859375, -8.786376953125, -8.48681640625, -8.187255859375, -7.8876953125, -7.588134765625, -7.28857421875, -6.989013671875, -6.689453125, -6.389892578125, -6.09033203125, -5.790771484375, -5.4912109375, -5.191650390625, -4.89208984375, -4.592529296875, -4.29296875, -3.993408203125, -3.69384765625, -3.394287109375, -3.0947265625, -2.795166015625, -2.49560546875, -2.196044921875, -1.896484375, -1.596923828125, -1.29736328125, -0.997802734375, -0.6982421875, -0.398681640625, -0.09912109375, 0.200439453125, 0.5, 0.799560546875, 1.09912109375, 1.398681640625, 1.6982421875, 1.997802734375, 2.29736328125, 2.596923828125, 2.896484375, 3.196044921875, 3.49560546875, 3.795166015625, 4.0947265625, 4.394287109375, 4.69384765625, 4.993408203125, 5.29296875, 5.592529296875, 5.89208984375, 6.191650390625, 6.4912109375, 6.790771484375, 7.09033203125, 7.389892578125, 7.689453125, 7.989013671875, 8.28857421875, 8.588134765625, 8.8876953125, 9.187255859375, 9.48681640625, 9.786376953125, 10.0859375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 10.0, 12.0, 27.0, 55.0, 107.0, 162.0, 210.0, 193.0, 111.0, 56.0, 34.0, 17.0, 5.0, 8.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.885498046875, -176.25062561035156, -165.61575317382812, -154.9808807373047, -144.34600830078125, -133.7111358642578, -123.07625579833984, -112.4413833618164, -101.80651092529297, -91.17163848876953, -80.5367660522461, -69.90188598632812, -59.26701736450195, -48.632144927978516, -37.99726867675781, -27.362396240234375, -16.727523803710938, -6.092650413513184, 4.54222297668457, 15.17709732055664, 25.811969757080078, 36.446842193603516, 47.08171844482422, 57.716590881347656, 68.3514633178711, 78.98633575439453, 89.62120819091797, 100.25608825683594, 110.89096069335938, 121.52583312988281, 132.16070556640625, 142.7955780029297, 153.43045043945312, 164.06532287597656, 174.7001953125, 185.33506774902344, 195.96994018554688, 206.6048126220703, 217.23968505859375, 227.87457275390625, 238.50942993164062, 249.14430236816406, 259.7791748046875, 270.4140625, 281.0489196777344, 291.6838073730469, 302.31866455078125, 312.95355224609375, 323.58843994140625, 334.22332763671875, 344.8581848144531, 355.4930725097656, 366.1279296875, 376.7628173828125, 387.3976745605469, 398.0325622558594, 408.66741943359375, 419.30230712890625, 429.9371643066406, 440.5720520019531, 451.2069091796875, 461.841796875, 472.4766540527344, 483.1115417480469, 493.74639892578125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 17.0, 3.0, 29.0, 20.0, 29.0, 34.0, 39.0, 45.0, 44.0, 48.0, 59.0, 53.0, 49.0, 55.0, 54.0, 54.0, 41.0, 57.0, 39.0, 41.0, 33.0, 16.0, 28.0, 18.0, 15.0, 12.0, 13.0, 12.0, 2.0, 5.0, 4.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-119.51838684082031, -115.35527038574219, -111.19215393066406, -107.0290298461914, -102.86591339111328, -98.70279693603516, -94.5396728515625, -90.37655639648438, -86.21343994140625, -82.05032348632812, -77.88720703125, -73.72408294677734, -69.56096649169922, -65.3978500366211, -61.2347297668457, -57.07160949707031, -52.90849304199219, -48.74537658691406, -44.58225631713867, -40.41913604736328, -36.256019592285156, -32.09290313720703, -27.92978286743164, -23.766664505004883, -19.603546142578125, -15.440427780151367, -11.27730941772461, -7.114191055297852, -2.9510726928710938, 1.212045669555664, 5.375164031982422, 9.53828239440918, 13.701416015625, 17.864534378051758, 22.027652740478516, 26.190771102905273, 30.35388946533203, 34.517005920410156, 38.68012619018555, 42.84324645996094, 47.00636291503906, 51.16947937011719, 55.33259963989258, 59.49571990966797, 63.658836364746094, 67.82195281982422, 71.98507690429688, 76.148193359375, 80.31130981445312, 84.47442626953125, 88.63754272460938, 92.80066680908203, 96.96378326416016, 101.12689971923828, 105.29002380371094, 109.45314025878906, 113.61625671386719, 117.77937316894531, 121.94248962402344, 126.1056137084961, 130.26873779296875, 134.43185424804688, 138.594970703125, 142.75808715820312, 146.92120361328125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 8.0, 11.0, 24.0, 23.0, 46.0, 52.0, 110.0, 203.0, 428.0, 1064.0, 3593.0, 15309.0, 137801.0, 3907742.0, 108975.0, 13411.0, 3329.0, 1153.0, 449.0, 225.0, 123.0, 74.0, 38.0, 22.0, 25.0, 9.0, 10.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.0625, -81.96484375, -78.8671875, -75.76953125, -72.671875, -69.57421875, -66.4765625, -63.37890625, -60.28125, -57.18359375, -54.0859375, -50.98828125, -47.890625, -44.79296875, -41.6953125, -38.59765625, -35.5, -32.40234375, -29.3046875, -26.20703125, -23.109375, -20.01171875, -16.9140625, -13.81640625, -10.71875, -7.62109375, -4.5234375, -1.42578125, 1.671875, 4.76953125, 7.8671875, 10.96484375, 14.0625, 17.16015625, 20.2578125, 23.35546875, 26.453125, 29.55078125, 32.6484375, 35.74609375, 38.84375, 41.94140625, 45.0390625, 48.13671875, 51.234375, 54.33203125, 57.4296875, 60.52734375, 63.625, 66.72265625, 69.8203125, 72.91796875, 76.015625, 79.11328125, 82.2109375, 85.30859375, 88.40625, 91.50390625, 94.6015625, 97.69921875, 100.796875, 103.89453125, 106.9921875, 110.08984375, 113.1875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 5.0, 8.0, 7.0, 15.0, 17.0, 25.0, 30.0, 36.0, 51.0, 55.0, 65.0, 69.0, 72.0, 77.0, 72.0, 75.0, 65.0, 61.0, 43.0, 28.0, 22.0, 23.0, 24.0, 16.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.3175048828125, -4.166259765625, -4.0150146484375, -3.86376953125, -3.7125244140625, -3.561279296875, -3.4100341796875, -3.2587890625, -3.1075439453125, -2.956298828125, -2.8050537109375, -2.65380859375, -2.5025634765625, -2.351318359375, -2.2000732421875, -2.048828125, -1.8975830078125, -1.746337890625, -1.5950927734375, -1.44384765625, -1.2926025390625, -1.141357421875, -0.9901123046875, -0.8388671875, -0.6876220703125, -0.536376953125, -0.3851318359375, -0.23388671875, -0.0826416015625, 0.068603515625, 0.2198486328125, 0.37109375, 0.5223388671875, 0.673583984375, 0.8248291015625, 0.97607421875, 1.1273193359375, 1.278564453125, 1.4298095703125, 1.5810546875, 1.7322998046875, 1.883544921875, 2.0347900390625, 2.18603515625, 2.3372802734375, 2.488525390625, 2.6397705078125, 2.791015625, 2.9422607421875, 3.093505859375, 3.2447509765625, 3.39599609375, 3.5472412109375, 3.698486328125, 3.8497314453125, 4.0009765625, 4.1522216796875, 4.303466796875, 4.4547119140625, 4.60595703125, 4.7572021484375, 4.908447265625, 5.0596923828125, 5.2109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 7.0, 5.0, 14.0, 19.0, 37.0, 54.0, 103.0, 172.0, 329.0, 457.0, 883.0, 1630.0, 3178.0, 6516.0, 15089.0, 38031.0, 113521.0, 530275.0, 3046151.0, 305567.0, 80771.0, 28791.0, 11805.0, 5391.0, 2699.0, 1250.0, 661.0, 330.0, 214.0, 133.0, 74.0, 48.0, 35.0, 31.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -35.87158203125, -34.6494140625, -33.42724609375, -32.205078125, -30.98291015625, -29.7607421875, -28.53857421875, -27.31640625, -26.09423828125, -24.8720703125, -23.64990234375, -22.427734375, -21.20556640625, -19.9833984375, -18.76123046875, -17.5390625, -16.31689453125, -15.0947265625, -13.87255859375, -12.650390625, -11.42822265625, -10.2060546875, -8.98388671875, -7.76171875, -6.53955078125, -5.3173828125, -4.09521484375, -2.873046875, -1.65087890625, -0.4287109375, 0.79345703125, 2.015625, 3.23779296875, 4.4599609375, 5.68212890625, 6.904296875, 8.12646484375, 9.3486328125, 10.57080078125, 11.79296875, 13.01513671875, 14.2373046875, 15.45947265625, 16.681640625, 17.90380859375, 19.1259765625, 20.34814453125, 21.5703125, 22.79248046875, 24.0146484375, 25.23681640625, 26.458984375, 27.68115234375, 28.9033203125, 30.12548828125, 31.34765625, 32.56982421875, 33.7919921875, 35.01416015625, 36.236328125, 37.45849609375, 38.6806640625, 39.90283203125, 41.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 1.0, 4.0, 6.0, 4.0, 5.0, 12.0, 8.0, 14.0, 17.0, 9.0, 26.0, 23.0, 47.0, 63.0, 70.0, 105.0, 164.0, 265.0, 536.0, 1418.0, 467.0, 234.0, 154.0, 89.0, 70.0, 61.0, 43.0, 28.0, 30.0, 26.0, 16.0, 10.0, 8.0, 13.0, 2.0, 11.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.768310546875, -8.49755859375, -8.226806640625, -7.9560546875, -7.685302734375, -7.41455078125, -7.143798828125, -6.873046875, -6.602294921875, -6.33154296875, -6.060791015625, -5.7900390625, -5.519287109375, -5.24853515625, -4.977783203125, -4.70703125, -4.436279296875, -4.16552734375, -3.894775390625, -3.6240234375, -3.353271484375, -3.08251953125, -2.811767578125, -2.541015625, -2.270263671875, -1.99951171875, -1.728759765625, -1.4580078125, -1.187255859375, -0.91650390625, -0.645751953125, -0.375, -0.104248046875, 0.16650390625, 0.437255859375, 0.7080078125, 0.978759765625, 1.24951171875, 1.520263671875, 1.791015625, 2.061767578125, 2.33251953125, 2.603271484375, 2.8740234375, 3.144775390625, 3.41552734375, 3.686279296875, 3.95703125, 4.227783203125, 4.49853515625, 4.769287109375, 5.0400390625, 5.310791015625, 5.58154296875, 5.852294921875, 6.123046875, 6.393798828125, 6.66455078125, 6.935302734375, 7.2060546875, 7.476806640625, 7.74755859375, 8.018310546875, 8.2890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 22.0, 60.0, 135.0, 209.0, 264.0, 170.0, 84.0, 34.0, 16.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.54171752929688, -81.52543640136719, -76.50914764404297, -71.49285888671875, -66.47657775878906, -61.46029281616211, -56.444007873535156, -51.4277229309082, -46.41143798828125, -41.3951530456543, -36.378868103027344, -31.36258316040039, -26.346298217773438, -21.330013275146484, -16.31372833251953, -11.297443389892578, -6.281158447265625, -1.2648735046386719, 3.7514114379882812, 8.767696380615234, 13.783981323242188, 18.80026626586914, 23.816551208496094, 28.832836151123047, 33.84912109375, 38.86540603637695, 43.881690979003906, 48.89797592163086, 53.91426086425781, 58.930545806884766, 63.94683074951172, 68.96311950683594, 73.97940063476562, 78.99568176269531, 84.01197052001953, 89.02825927734375, 94.04454040527344, 99.06082153320312, 104.07711029052734, 109.09339904785156, 114.10968017578125, 119.12596130371094, 124.14225006103516, 129.15853881835938, 134.17481994628906, 139.19110107421875, 144.2073974609375, 149.2236785888672, 154.23995971679688, 159.25624084472656, 164.27252197265625, 169.288818359375, 174.3050994873047, 179.32138061523438, 184.33767700195312, 189.3539581298828, 194.3702392578125, 199.3865203857422, 204.40280151367188, 209.41909790039062, 214.4353790283203, 219.45166015625, 224.46795654296875, 229.48423767089844, 234.50051879882812]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 14.0, 19.0, 20.0, 25.0, 32.0, 48.0, 60.0, 50.0, 68.0, 92.0, 65.0, 79.0, 76.0, 65.0, 59.0, 43.0, 33.0, 44.0, 27.0, 23.0, 23.0, 13.0, 9.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.23870849609375, -65.3755874633789, -63.51247024536133, -61.649349212646484, -59.786231994628906, -57.92311096191406, -56.05998992919922, -54.19687271118164, -52.33375549316406, -50.47063446044922, -48.60751724243164, -46.7443962097168, -44.88127899169922, -43.018157958984375, -41.15503692626953, -39.29191970825195, -37.42879867553711, -35.565677642822266, -33.70256042480469, -31.839439392089844, -29.976322174072266, -28.113201141357422, -26.25008201599121, -24.386962890625, -22.52384376525879, -20.660724639892578, -18.797605514526367, -16.934486389160156, -15.071366310119629, -13.208247184753418, -11.34512710571289, -9.48200798034668, -7.618892669677734, -5.755773544311523, -3.8926539421081543, -2.029534339904785, -0.16641521453857422, 1.6967039108276367, 3.559823989868164, 5.422943115234375, 7.286062240600586, 9.149181365966797, 11.012300491333008, 12.875420570373535, 14.738539695739746, 16.60165786743164, 18.464778900146484, 20.327898025512695, 22.191017150878906, 24.054136276245117, 25.917255401611328, 27.780376434326172, 29.64349365234375, 31.506614685058594, 33.36973571777344, 35.232852935791016, 37.095970153808594, 38.95909118652344, 40.822208404541016, 42.68532943725586, 44.54844665527344, 46.41156768798828, 48.274688720703125, 50.1378059387207, 52.00092697143555]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 13.0, 13.0, 15.0, 17.0, 26.0, 37.0, 38.0, 58.0, 82.0, 104.0, 135.0, 181.0, 243.0, 344.0, 564.0, 914.0, 1489.0, 2695.0, 5072.0, 10056.0, 21461.0, 46913.0, 101321.0, 199707.0, 286178.0, 190358.0, 96027.0, 43877.0, 19955.0, 9427.0, 4618.0, 2572.0, 1363.0, 829.0, 538.0, 378.0, 228.0, 170.0, 139.0, 102.0, 76.0, 46.0, 47.0, 38.0, 26.0, 13.0, 9.0, 18.0, 7.0, 8.0, 5.0, 4.0, 3.0, 2.0, 4.0, 1.0], "bins": [-20.5, -19.868408203125, -19.23681640625, -18.605224609375, -17.9736328125, -17.342041015625, -16.71044921875, -16.078857421875, -15.447265625, -14.815673828125, -14.18408203125, -13.552490234375, -12.9208984375, -12.289306640625, -11.65771484375, -11.026123046875, -10.39453125, -9.762939453125, -9.13134765625, -8.499755859375, -7.8681640625, -7.236572265625, -6.60498046875, -5.973388671875, -5.341796875, -4.710205078125, -4.07861328125, -3.447021484375, -2.8154296875, -2.183837890625, -1.55224609375, -0.920654296875, -0.2890625, 0.342529296875, 0.97412109375, 1.605712890625, 2.2373046875, 2.868896484375, 3.50048828125, 4.132080078125, 4.763671875, 5.395263671875, 6.02685546875, 6.658447265625, 7.2900390625, 7.921630859375, 8.55322265625, 9.184814453125, 9.81640625, 10.447998046875, 11.07958984375, 11.711181640625, 12.3427734375, 12.974365234375, 13.60595703125, 14.237548828125, 14.869140625, 15.500732421875, 16.13232421875, 16.763916015625, 17.3955078125, 18.027099609375, 18.65869140625, 19.290283203125, 19.921875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 15.0, 28.0, 27.0, 43.0, 42.0, 55.0, 67.0, 70.0, 74.0, 96.0, 72.0, 64.0, 70.0, 59.0, 35.0, 36.0, 38.0, 21.0, 23.0, 14.0, 18.0, 4.0, 4.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19140625, -5.0279541015625, -4.864501953125, -4.7010498046875, -4.53759765625, -4.3741455078125, -4.210693359375, -4.0472412109375, -3.8837890625, -3.7203369140625, -3.556884765625, -3.3934326171875, -3.22998046875, -3.0665283203125, -2.903076171875, -2.7396240234375, -2.576171875, -2.4127197265625, -2.249267578125, -2.0858154296875, -1.92236328125, -1.7589111328125, -1.595458984375, -1.4320068359375, -1.2685546875, -1.1051025390625, -0.941650390625, -0.7781982421875, -0.61474609375, -0.4512939453125, -0.287841796875, -0.1243896484375, 0.0390625, 0.2025146484375, 0.365966796875, 0.5294189453125, 0.69287109375, 0.8563232421875, 1.019775390625, 1.1832275390625, 1.3466796875, 1.5101318359375, 1.673583984375, 1.8370361328125, 2.00048828125, 2.1639404296875, 2.327392578125, 2.4908447265625, 2.654296875, 2.8177490234375, 2.981201171875, 3.1446533203125, 3.30810546875, 3.4715576171875, 3.635009765625, 3.7984619140625, 3.9619140625, 4.1253662109375, 4.288818359375, 4.4522705078125, 4.61572265625, 4.7791748046875, 4.942626953125, 5.1060791015625, 5.26953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 8.0, 13.0, 29.0, 34.0, 57.0, 60.0, 113.0, 135.0, 197.0, 253.0, 416.0, 601.0, 896.0, 1613.0, 2972.0, 6121.0, 13124.0, 30050.0, 71331.0, 158260.0, 279541.0, 249938.0, 129447.0, 56811.0, 24427.0, 10730.0, 4966.0, 2461.0, 1387.0, 832.0, 528.0, 368.0, 244.0, 156.0, 109.0, 77.0, 65.0, 47.0, 42.0, 21.0, 17.0, 13.0, 10.0, 7.0, 3.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.765625, -18.1767578125, -17.587890625, -16.9990234375, -16.41015625, -15.8212890625, -15.232421875, -14.6435546875, -14.0546875, -13.4658203125, -12.876953125, -12.2880859375, -11.69921875, -11.1103515625, -10.521484375, -9.9326171875, -9.34375, -8.7548828125, -8.166015625, -7.5771484375, -6.98828125, -6.3994140625, -5.810546875, -5.2216796875, -4.6328125, -4.0439453125, -3.455078125, -2.8662109375, -2.27734375, -1.6884765625, -1.099609375, -0.5107421875, 0.078125, 0.6669921875, 1.255859375, 1.8447265625, 2.43359375, 3.0224609375, 3.611328125, 4.2001953125, 4.7890625, 5.3779296875, 5.966796875, 6.5556640625, 7.14453125, 7.7333984375, 8.322265625, 8.9111328125, 9.5, 10.0888671875, 10.677734375, 11.2666015625, 11.85546875, 12.4443359375, 13.033203125, 13.6220703125, 14.2109375, 14.7998046875, 15.388671875, 15.9775390625, 16.56640625, 17.1552734375, 17.744140625, 18.3330078125, 18.921875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 7.0, 6.0, 8.0, 7.0, 22.0, 17.0, 24.0, 16.0, 22.0, 22.0, 35.0, 38.0, 46.0, 45.0, 45.0, 40.0, 50.0, 41.0, 49.0, 58.0, 44.0, 46.0, 29.0, 38.0, 33.0, 32.0, 30.0, 33.0, 24.0, 19.0, 14.0, 20.0, 7.0, 15.0, 4.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.53125, -14.99658203125, -14.4619140625, -13.92724609375, -13.392578125, -12.85791015625, -12.3232421875, -11.78857421875, -11.25390625, -10.71923828125, -10.1845703125, -9.64990234375, -9.115234375, -8.58056640625, -8.0458984375, -7.51123046875, -6.9765625, -6.44189453125, -5.9072265625, -5.37255859375, -4.837890625, -4.30322265625, -3.7685546875, -3.23388671875, -2.69921875, -2.16455078125, -1.6298828125, -1.09521484375, -0.560546875, -0.02587890625, 0.5087890625, 1.04345703125, 1.578125, 2.11279296875, 2.6474609375, 3.18212890625, 3.716796875, 4.25146484375, 4.7861328125, 5.32080078125, 5.85546875, 6.39013671875, 6.9248046875, 7.45947265625, 7.994140625, 8.52880859375, 9.0634765625, 9.59814453125, 10.1328125, 10.66748046875, 11.2021484375, 11.73681640625, 12.271484375, 12.80615234375, 13.3408203125, 13.87548828125, 14.41015625, 14.94482421875, 15.4794921875, 16.01416015625, 16.548828125, 17.08349609375, 17.6181640625, 18.15283203125, 18.6875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 6.0, 7.0, 15.0, 21.0, 40.0, 57.0, 67.0, 107.0, 245.0, 458.0, 1163.0, 2909.0, 9510.0, 47438.0, 350587.0, 528351.0, 85903.0, 14736.0, 4054.0, 1526.0, 629.0, 327.0, 157.0, 69.0, 48.0, 32.0, 26.0, 12.0, 7.0, 10.0, 7.0, 11.0, 6.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.482666015625, -16.90283203125, -16.322998046875, -15.7431640625, -15.163330078125, -14.58349609375, -14.003662109375, -13.423828125, -12.843994140625, -12.26416015625, -11.684326171875, -11.1044921875, -10.524658203125, -9.94482421875, -9.364990234375, -8.78515625, -8.205322265625, -7.62548828125, -7.045654296875, -6.4658203125, -5.885986328125, -5.30615234375, -4.726318359375, -4.146484375, -3.566650390625, -2.98681640625, -2.406982421875, -1.8271484375, -1.247314453125, -0.66748046875, -0.087646484375, 0.4921875, 1.072021484375, 1.65185546875, 2.231689453125, 2.8115234375, 3.391357421875, 3.97119140625, 4.551025390625, 5.130859375, 5.710693359375, 6.29052734375, 6.870361328125, 7.4501953125, 8.030029296875, 8.60986328125, 9.189697265625, 9.76953125, 10.349365234375, 10.92919921875, 11.509033203125, 12.0888671875, 12.668701171875, 13.24853515625, 13.828369140625, 14.408203125, 14.988037109375, 15.56787109375, 16.147705078125, 16.7275390625, 17.307373046875, 17.88720703125, 18.467041015625, 19.046875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 7.0, 7.0, 11.0, 4.0, 9.0, 13.0, 13.0, 21.0, 28.0, 44.0, 49.0, 51.0, 63.0, 79.0, 107.0, 103.0, 73.0, 63.0, 54.0, 39.0, 32.0, 29.0, 18.0, 14.0, 16.0, 12.0, 9.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0017108917236328125, -0.0016517043113708496, -0.0015925168991088867, -0.0015333294868469238, -0.001474142074584961, -0.001414954662322998, -0.0013557672500610352, -0.0012965798377990723, -0.0012373924255371094, -0.0011782050132751465, -0.0011190176010131836, -0.0010598301887512207, -0.0010006427764892578, -0.0009414553642272949, -0.000882267951965332, -0.0008230805397033691, -0.0007638931274414062, -0.0007047057151794434, -0.0006455183029174805, -0.0005863308906555176, -0.0005271434783935547, -0.0004679560661315918, -0.0004087686538696289, -0.000349581241607666, -0.0002903938293457031, -0.00023120641708374023, -0.00017201900482177734, -0.00011283159255981445, -5.364418029785156e-05, 5.543231964111328e-06, 6.473064422607422e-05, 0.0001239180564880371, 0.00018310546875, 0.0002422928810119629, 0.0003014802932739258, 0.00036066770553588867, 0.00041985511779785156, 0.00047904253005981445, 0.0005382299423217773, 0.0005974173545837402, 0.0006566047668457031, 0.000715792179107666, 0.0007749795913696289, 0.0008341670036315918, 0.0008933544158935547, 0.0009525418281555176, 0.0010117292404174805, 0.0010709166526794434, 0.0011301040649414062, 0.0011892914772033691, 0.001248478889465332, 0.001307666301727295, 0.0013668537139892578, 0.0014260411262512207, 0.0014852285385131836, 0.0015444159507751465, 0.0016036033630371094, 0.0016627907752990723, 0.0017219781875610352, 0.001781165599822998, 0.001840353012084961, 0.0018995404243469238, 0.0019587278366088867, 0.0020179152488708496, 0.0020771026611328125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 15.0, 6.0, 20.0, 21.0, 23.0, 36.0, 36.0, 64.0, 104.0, 149.0, 235.0, 427.0, 806.0, 1484.0, 2888.0, 6755.0, 18289.0, 63914.0, 266934.0, 466526.0, 158107.0, 39449.0, 12386.0, 4857.0, 2191.0, 1178.0, 635.0, 357.0, 218.0, 122.0, 102.0, 60.0, 40.0, 24.0, 13.0, 16.0, 7.0, 14.0, 6.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.578125, -12.1632080078125, -11.748291015625, -11.3333740234375, -10.91845703125, -10.5035400390625, -10.088623046875, -9.6737060546875, -9.2587890625, -8.8438720703125, -8.428955078125, -8.0140380859375, -7.59912109375, -7.1842041015625, -6.769287109375, -6.3543701171875, -5.939453125, -5.5245361328125, -5.109619140625, -4.6947021484375, -4.27978515625, -3.8648681640625, -3.449951171875, -3.0350341796875, -2.6201171875, -2.2052001953125, -1.790283203125, -1.3753662109375, -0.96044921875, -0.5455322265625, -0.130615234375, 0.2843017578125, 0.69921875, 1.1141357421875, 1.529052734375, 1.9439697265625, 2.35888671875, 2.7738037109375, 3.188720703125, 3.6036376953125, 4.0185546875, 4.4334716796875, 4.848388671875, 5.2633056640625, 5.67822265625, 6.0931396484375, 6.508056640625, 6.9229736328125, 7.337890625, 7.7528076171875, 8.167724609375, 8.5826416015625, 8.99755859375, 9.4124755859375, 9.827392578125, 10.2423095703125, 10.6572265625, 11.0721435546875, 11.487060546875, 11.9019775390625, 12.31689453125, 12.7318115234375, 13.146728515625, 13.5616455078125, 13.9765625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 3.0, 6.0, 6.0, 11.0, 9.0, 14.0, 22.0, 18.0, 33.0, 29.0, 41.0, 41.0, 65.0, 60.0, 69.0, 60.0, 78.0, 79.0, 63.0, 58.0, 41.0, 34.0, 36.0, 27.0, 19.0, 21.0, 9.0, 12.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.73828125, -6.49761962890625, -6.2569580078125, -6.01629638671875, -5.775634765625, -5.53497314453125, -5.2943115234375, -5.05364990234375, -4.81298828125, -4.57232666015625, -4.3316650390625, -4.09100341796875, -3.850341796875, -3.60968017578125, -3.3690185546875, -3.12835693359375, -2.8876953125, -2.64703369140625, -2.4063720703125, -2.16571044921875, -1.925048828125, -1.68438720703125, -1.4437255859375, -1.20306396484375, -0.96240234375, -0.72174072265625, -0.4810791015625, -0.24041748046875, 0.000244140625, 0.24090576171875, 0.4815673828125, 0.72222900390625, 0.962890625, 1.20355224609375, 1.4442138671875, 1.68487548828125, 1.925537109375, 2.16619873046875, 2.4068603515625, 2.64752197265625, 2.88818359375, 3.12884521484375, 3.3695068359375, 3.61016845703125, 3.850830078125, 4.09149169921875, 4.3321533203125, 4.57281494140625, 4.8134765625, 5.05413818359375, 5.2947998046875, 5.53546142578125, 5.776123046875, 6.01678466796875, 6.2574462890625, 6.49810791015625, 6.73876953125, 6.97943115234375, 7.2200927734375, 7.46075439453125, 7.701416015625, 7.94207763671875, 8.1827392578125, 8.42340087890625, 8.6640625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 5.0, 12.0, 10.0, 10.0, 18.0, 43.0, 43.0, 70.0, 84.0, 84.0, 103.0, 102.0, 91.0, 92.0, 64.0, 44.0, 30.0, 29.0, 20.0, 12.0, 11.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.47711181640625, -120.33177947998047, -116.18644714355469, -112.0411148071289, -107.89578247070312, -103.75045776367188, -99.6051254272461, -95.45979309082031, -91.31446075439453, -87.16912841796875, -83.02379608154297, -78.87846374511719, -74.73313903808594, -70.58779907226562, -66.44247436523438, -62.297142028808594, -58.15180969238281, -54.00647735595703, -49.86114501953125, -45.715816497802734, -41.57048416137695, -37.42515182495117, -33.279823303222656, -29.134490966796875, -24.989158630371094, -20.843826293945312, -16.698495864868164, -12.5531644821167, -8.407833099365234, -4.262500762939453, -0.11717033386230469, 4.028160095214844, 8.173477172851562, 12.318808555603027, 16.464139938354492, 20.60947036743164, 24.754802703857422, 28.900135040283203, 33.04546356201172, 37.1907958984375, 41.33612823486328, 45.48146057128906, 49.626792907714844, 53.77212142944336, 57.91745376586914, 62.06278610229492, 66.20811462402344, 70.35344696044922, 74.498779296875, 78.64411163330078, 82.78944396972656, 86.93477630615234, 91.08010864257812, 95.22543334960938, 99.37076568603516, 103.51609802246094, 107.66143035888672, 111.8067626953125, 115.95209503173828, 120.09742736816406, 124.24275207519531, 128.38809204101562, 132.53341674804688, 136.67874145507812, 140.82408142089844]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 8.0, 5.0, 3.0, 14.0, 13.0, 14.0, 9.0, 16.0, 31.0, 30.0, 21.0, 34.0, 37.0, 37.0, 42.0, 48.0, 51.0, 51.0, 58.0, 42.0, 53.0, 40.0, 41.0, 45.0, 34.0, 31.0, 37.0, 28.0, 13.0, 21.0, 24.0, 15.0, 6.0, 12.0, 10.0, 6.0, 4.0, 8.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-94.22860717773438, -90.94551849365234, -87.66242980957031, -84.37934875488281, -81.09626007080078, -77.81317138671875, -74.53008270263672, -71.24699401855469, -67.96390533447266, -64.68081665039062, -61.39773178100586, -58.11464309692383, -54.8315544128418, -51.54846954345703, -48.265380859375, -44.98229217529297, -41.6992073059082, -38.41611862182617, -35.133033752441406, -31.849945068359375, -28.566856384277344, -25.283769607543945, -22.000682830810547, -18.717594146728516, -15.434507369995117, -12.151419639587402, -8.868331909179688, -5.585245132446289, -2.302157402038574, 0.9809303283691406, 4.264017105102539, 7.54710578918457, 10.830192565917969, 14.113280296325684, 17.3963680267334, 20.679454803466797, 23.962543487548828, 27.245630264282227, 30.528717041015625, 33.811805725097656, 37.09489440917969, 40.37798309326172, 43.661067962646484, 46.944156646728516, 50.22724533081055, 53.51033020019531, 56.793418884277344, 60.076507568359375, 63.35959243774414, 66.6426773071289, 69.92576599121094, 73.20885467529297, 76.491943359375, 79.77503204345703, 83.05812072753906, 86.34120178222656, 89.6242904663086, 92.90737915039062, 96.19046783447266, 99.47355651855469, 102.75663757324219, 106.03972625732422, 109.32281494140625, 112.60590362548828, 115.88899230957031]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 7.0, 8.0, 5.0, 11.0, 10.0, 4.0, 13.0, 19.0, 42.0, 33.0, 60.0, 99.0, 143.0, 213.0, 314.0, 585.0, 1115.0, 2302.0, 5548.0, 16638.0, 71620.0, 3475166.0, 552518.0, 46316.0, 12308.0, 4650.0, 2044.0, 1076.0, 540.0, 305.0, 190.0, 121.0, 85.0, 53.0, 30.0, 23.0, 21.0, 11.0, 11.0, 17.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.6318359375, -37.138671875, -35.6455078125, -34.15234375, -32.6591796875, -31.166015625, -29.6728515625, -28.1796875, -26.6865234375, -25.193359375, -23.7001953125, -22.20703125, -20.7138671875, -19.220703125, -17.7275390625, -16.234375, -14.7412109375, -13.248046875, -11.7548828125, -10.26171875, -8.7685546875, -7.275390625, -5.7822265625, -4.2890625, -2.7958984375, -1.302734375, 0.1904296875, 1.68359375, 3.1767578125, 4.669921875, 6.1630859375, 7.65625, 9.1494140625, 10.642578125, 12.1357421875, 13.62890625, 15.1220703125, 16.615234375, 18.1083984375, 19.6015625, 21.0947265625, 22.587890625, 24.0810546875, 25.57421875, 27.0673828125, 28.560546875, 30.0537109375, 31.546875, 33.0400390625, 34.533203125, 36.0263671875, 37.51953125, 39.0126953125, 40.505859375, 41.9990234375, 43.4921875, 44.9853515625, 46.478515625, 47.9716796875, 49.46484375, 50.9580078125, 52.451171875, 53.9443359375, 55.4375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 1.0, 9.0, 9.0, 11.0, 17.0, 20.0, 27.0, 44.0, 56.0, 60.0, 73.0, 90.0, 62.0, 70.0, 77.0, 69.0, 51.0, 45.0, 44.0, 45.0, 29.0, 15.0, 21.0, 11.0, 12.0, 7.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.8773193359375, -4.711669921875, -4.5460205078125, -4.38037109375, -4.2147216796875, -4.049072265625, -3.8834228515625, -3.7177734375, -3.5521240234375, -3.386474609375, -3.2208251953125, -3.05517578125, -2.8895263671875, -2.723876953125, -2.5582275390625, -2.392578125, -2.2269287109375, -2.061279296875, -1.8956298828125, -1.72998046875, -1.5643310546875, -1.398681640625, -1.2330322265625, -1.0673828125, -0.9017333984375, -0.736083984375, -0.5704345703125, -0.40478515625, -0.2391357421875, -0.073486328125, 0.0921630859375, 0.2578125, 0.4234619140625, 0.589111328125, 0.7547607421875, 0.92041015625, 1.0860595703125, 1.251708984375, 1.4173583984375, 1.5830078125, 1.7486572265625, 1.914306640625, 2.0799560546875, 2.24560546875, 2.4112548828125, 2.576904296875, 2.7425537109375, 2.908203125, 3.0738525390625, 3.239501953125, 3.4051513671875, 3.57080078125, 3.7364501953125, 3.902099609375, 4.0677490234375, 4.2333984375, 4.3990478515625, 4.564697265625, 4.7303466796875, 4.89599609375, 5.0616455078125, 5.227294921875, 5.3929443359375, 5.55859375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 0.0, 2.0, 7.0, 11.0, 23.0, 30.0, 33.0, 44.0, 61.0, 107.0, 176.0, 339.0, 506.0, 863.0, 1643.0, 3231.0, 6451.0, 14048.0, 34225.0, 100022.0, 471700.0, 3146935.0, 288502.0, 74990.0, 27364.0, 11418.0, 5328.0, 2717.0, 1436.0, 788.0, 477.0, 250.0, 162.0, 132.0, 78.0, 59.0, 42.0, 20.0, 20.0, 11.0, 7.0, 6.0, 7.0, 7.0, 4.0, 2.0, 0.0, 1.0], "bins": [-30.984375, -30.1552734375, -29.326171875, -28.4970703125, -27.66796875, -26.8388671875, -26.009765625, -25.1806640625, -24.3515625, -23.5224609375, -22.693359375, -21.8642578125, -21.03515625, -20.2060546875, -19.376953125, -18.5478515625, -17.71875, -16.8896484375, -16.060546875, -15.2314453125, -14.40234375, -13.5732421875, -12.744140625, -11.9150390625, -11.0859375, -10.2568359375, -9.427734375, -8.5986328125, -7.76953125, -6.9404296875, -6.111328125, -5.2822265625, -4.453125, -3.6240234375, -2.794921875, -1.9658203125, -1.13671875, -0.3076171875, 0.521484375, 1.3505859375, 2.1796875, 3.0087890625, 3.837890625, 4.6669921875, 5.49609375, 6.3251953125, 7.154296875, 7.9833984375, 8.8125, 9.6416015625, 10.470703125, 11.2998046875, 12.12890625, 12.9580078125, 13.787109375, 14.6162109375, 15.4453125, 16.2744140625, 17.103515625, 17.9326171875, 18.76171875, 19.5908203125, 20.419921875, 21.2490234375, 22.078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 10.0, 12.0, 20.0, 24.0, 39.0, 37.0, 88.0, 112.0, 185.0, 315.0, 1382.0, 978.0, 301.0, 174.0, 110.0, 68.0, 54.0, 25.0, 20.0, 22.0, 17.0, 11.0, 11.0, 7.0, 4.0, 9.0, 1.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.05596923828125, -6.8033447265625, -6.55072021484375, -6.298095703125, -6.04547119140625, -5.7928466796875, -5.54022216796875, -5.28759765625, -5.03497314453125, -4.7823486328125, -4.52972412109375, -4.277099609375, -4.02447509765625, -3.7718505859375, -3.51922607421875, -3.2666015625, -3.01397705078125, -2.7613525390625, -2.50872802734375, -2.256103515625, -2.00347900390625, -1.7508544921875, -1.49822998046875, -1.24560546875, -0.99298095703125, -0.7403564453125, -0.48773193359375, -0.235107421875, 0.01751708984375, 0.2701416015625, 0.52276611328125, 0.775390625, 1.02801513671875, 1.2806396484375, 1.53326416015625, 1.785888671875, 2.03851318359375, 2.2911376953125, 2.54376220703125, 2.79638671875, 3.04901123046875, 3.3016357421875, 3.55426025390625, 3.806884765625, 4.05950927734375, 4.3121337890625, 4.56475830078125, 4.8173828125, 5.07000732421875, 5.3226318359375, 5.57525634765625, 5.827880859375, 6.08050537109375, 6.3331298828125, 6.58575439453125, 6.83837890625, 7.09100341796875, 7.3436279296875, 7.59625244140625, 7.848876953125, 8.10150146484375, 8.3541259765625, 8.60675048828125, 8.859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 12.0, 5.0, 28.0, 28.0, 56.0, 76.0, 112.0, 109.0, 115.0, 128.0, 96.0, 85.0, 59.0, 27.0, 24.0, 12.0, 10.0, 10.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.83511734008789, -33.99361038208008, -32.152103424072266, -30.31059455871582, -28.469085693359375, -26.627578735351562, -24.78607177734375, -22.944564819335938, -21.103055953979492, -19.26154899597168, -17.420040130615234, -15.578533172607422, -13.737025260925293, -11.895517349243164, -10.054010391235352, -8.212502479553223, -6.370994567871094, -4.529486656188965, -2.687979221343994, -0.8464717864990234, 0.9950361251831055, 2.8365440368652344, 4.678050994873047, 6.519558906555176, 8.361066818237305, 10.202574729919434, 12.044082641601562, 13.885589599609375, 15.727097511291504, 17.568605422973633, 19.410112380981445, 21.25162124633789, 23.09313201904297, 24.93463897705078, 26.776147842407227, 28.61765480041504, 30.459163665771484, 32.3006706237793, 34.14217758178711, 35.98368453979492, 37.8251953125, 39.66670227050781, 41.508209228515625, 43.34971618652344, 45.191226959228516, 47.03273391723633, 48.87424087524414, 50.71574783325195, 52.557254791259766, 54.39876174926758, 56.24026870727539, 58.08177947998047, 59.92328643798828, 61.764793395996094, 63.606300354003906, 65.44780731201172, 67.28931427001953, 69.13082122802734, 70.97232818603516, 72.81383514404297, 74.65534210205078, 76.49685668945312, 78.33836364746094, 80.17987060546875, 82.02137756347656]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 4.0, 4.0, 10.0, 6.0, 14.0, 6.0, 14.0, 11.0, 15.0, 16.0, 36.0, 38.0, 43.0, 39.0, 34.0, 58.0, 38.0, 41.0, 45.0, 53.0, 53.0, 54.0, 44.0, 59.0, 38.0, 35.0, 31.0, 37.0, 20.0, 18.0, 12.0, 22.0, 19.0, 8.0, 8.0, 3.0, 10.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-36.840904235839844, -35.8980598449707, -34.95521926879883, -34.01237487792969, -33.06953430175781, -32.12668991088867, -31.183849334716797, -30.241004943847656, -29.29816436767578, -28.355321884155273, -27.412479400634766, -26.469636917114258, -25.52679443359375, -24.583951950073242, -23.641109466552734, -22.698265075683594, -21.755422592163086, -20.812580108642578, -19.86973762512207, -18.926895141601562, -17.984052658081055, -17.041210174560547, -16.098365783691406, -15.155524253845215, -14.212681770324707, -13.2698392868042, -12.326996803283691, -11.384153366088867, -10.44131088256836, -9.498468399047852, -8.555625915527344, -7.612783432006836, -6.669939041137695, -5.7270965576171875, -4.78425407409668, -3.8414111137390137, -2.898568630218506, -1.955726146697998, -1.012883186340332, -0.07004070281982422, 0.8728017807006836, 1.815644383430481, 2.7584869861602783, 3.7013297080993652, 4.644172191619873, 5.587014675140381, 6.529857635498047, 7.472700119018555, 8.415542602539062, 9.35838508605957, 10.301227569580078, 11.244070053100586, 12.186912536621094, 13.129755020141602, 14.072598457336426, 15.015440940856934, 15.958283424377441, 16.901126861572266, 17.843969345092773, 18.78681182861328, 19.72965431213379, 20.672496795654297, 21.615339279174805, 22.558181762695312, 23.50102424621582]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 2.0, 8.0, 8.0, 11.0, 19.0, 22.0, 30.0, 51.0, 59.0, 92.0, 135.0, 223.0, 317.0, 487.0, 751.0, 1401.0, 2471.0, 4996.0, 10674.0, 24586.0, 58850.0, 141440.0, 300591.0, 280009.0, 127075.0, 52382.0, 22069.0, 9457.0, 4658.0, 2252.0, 1287.0, 731.0, 468.0, 286.0, 205.0, 132.0, 92.0, 69.0, 47.0, 32.0, 24.0, 13.0, 15.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.90625, -23.180419921875, -22.45458984375, -21.728759765625, -21.0029296875, -20.277099609375, -19.55126953125, -18.825439453125, -18.099609375, -17.373779296875, -16.64794921875, -15.922119140625, -15.1962890625, -14.470458984375, -13.74462890625, -13.018798828125, -12.29296875, -11.567138671875, -10.84130859375, -10.115478515625, -9.3896484375, -8.663818359375, -7.93798828125, -7.212158203125, -6.486328125, -5.760498046875, -5.03466796875, -4.308837890625, -3.5830078125, -2.857177734375, -2.13134765625, -1.405517578125, -0.6796875, 0.046142578125, 0.77197265625, 1.497802734375, 2.2236328125, 2.949462890625, 3.67529296875, 4.401123046875, 5.126953125, 5.852783203125, 6.57861328125, 7.304443359375, 8.0302734375, 8.756103515625, 9.48193359375, 10.207763671875, 10.93359375, 11.659423828125, 12.38525390625, 13.111083984375, 13.8369140625, 14.562744140625, 15.28857421875, 16.014404296875, 16.740234375, 17.466064453125, 18.19189453125, 18.917724609375, 19.6435546875, 20.369384765625, 21.09521484375, 21.821044921875, 22.546875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 12.0, 17.0, 17.0, 24.0, 40.0, 21.0, 59.0, 61.0, 70.0, 81.0, 75.0, 54.0, 68.0, 55.0, 67.0, 51.0, 44.0, 33.0, 31.0, 31.0, 14.0, 14.0, 15.0, 12.0, 10.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1328125, -4.9700927734375, -4.807373046875, -4.6446533203125, -4.48193359375, -4.3192138671875, -4.156494140625, -3.9937744140625, -3.8310546875, -3.6683349609375, -3.505615234375, -3.3428955078125, -3.18017578125, -3.0174560546875, -2.854736328125, -2.6920166015625, -2.529296875, -2.3665771484375, -2.203857421875, -2.0411376953125, -1.87841796875, -1.7156982421875, -1.552978515625, -1.3902587890625, -1.2275390625, -1.0648193359375, -0.902099609375, -0.7393798828125, -0.57666015625, -0.4139404296875, -0.251220703125, -0.0885009765625, 0.07421875, 0.2369384765625, 0.399658203125, 0.5623779296875, 0.72509765625, 0.8878173828125, 1.050537109375, 1.2132568359375, 1.3759765625, 1.5386962890625, 1.701416015625, 1.8641357421875, 2.02685546875, 2.1895751953125, 2.352294921875, 2.5150146484375, 2.677734375, 2.8404541015625, 3.003173828125, 3.1658935546875, 3.32861328125, 3.4913330078125, 3.654052734375, 3.8167724609375, 3.9794921875, 4.1422119140625, 4.304931640625, 4.4676513671875, 4.63037109375, 4.7930908203125, 4.955810546875, 5.1185302734375, 5.28125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 8.0, 14.0, 22.0, 18.0, 38.0, 53.0, 72.0, 96.0, 141.0, 198.0, 318.0, 469.0, 789.0, 1337.0, 2389.0, 4856.0, 10308.0, 24429.0, 61241.0, 147093.0, 304224.0, 273295.0, 126709.0, 51149.0, 20719.0, 9015.0, 4173.0, 2103.0, 1197.0, 699.0, 442.0, 307.0, 187.0, 143.0, 95.0, 62.0, 42.0, 31.0, 20.0, 24.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.735107421875, -17.14208984375, -16.549072265625, -15.9560546875, -15.363037109375, -14.77001953125, -14.177001953125, -13.583984375, -12.990966796875, -12.39794921875, -11.804931640625, -11.2119140625, -10.618896484375, -10.02587890625, -9.432861328125, -8.83984375, -8.246826171875, -7.65380859375, -7.060791015625, -6.4677734375, -5.874755859375, -5.28173828125, -4.688720703125, -4.095703125, -3.502685546875, -2.90966796875, -2.316650390625, -1.7236328125, -1.130615234375, -0.53759765625, 0.055419921875, 0.6484375, 1.241455078125, 1.83447265625, 2.427490234375, 3.0205078125, 3.613525390625, 4.20654296875, 4.799560546875, 5.392578125, 5.985595703125, 6.57861328125, 7.171630859375, 7.7646484375, 8.357666015625, 8.95068359375, 9.543701171875, 10.13671875, 10.729736328125, 11.32275390625, 11.915771484375, 12.5087890625, 13.101806640625, 13.69482421875, 14.287841796875, 14.880859375, 15.473876953125, 16.06689453125, 16.659912109375, 17.2529296875, 17.845947265625, 18.43896484375, 19.031982421875, 19.625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 7.0, 7.0, 11.0, 9.0, 9.0, 14.0, 15.0, 19.0, 19.0, 22.0, 37.0, 32.0, 26.0, 27.0, 36.0, 29.0, 43.0, 39.0, 43.0, 50.0, 51.0, 38.0, 41.0, 45.0, 38.0, 42.0, 38.0, 28.0, 28.0, 24.0, 14.0, 22.0, 11.0, 18.0, 18.0, 8.0, 2.0, 7.0, 7.0, 2.0, 6.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0], "bins": [-16.421875, -15.94873046875, -15.4755859375, -15.00244140625, -14.529296875, -14.05615234375, -13.5830078125, -13.10986328125, -12.63671875, -12.16357421875, -11.6904296875, -11.21728515625, -10.744140625, -10.27099609375, -9.7978515625, -9.32470703125, -8.8515625, -8.37841796875, -7.9052734375, -7.43212890625, -6.958984375, -6.48583984375, -6.0126953125, -5.53955078125, -5.06640625, -4.59326171875, -4.1201171875, -3.64697265625, -3.173828125, -2.70068359375, -2.2275390625, -1.75439453125, -1.28125, -0.80810546875, -0.3349609375, 0.13818359375, 0.611328125, 1.08447265625, 1.5576171875, 2.03076171875, 2.50390625, 2.97705078125, 3.4501953125, 3.92333984375, 4.396484375, 4.86962890625, 5.3427734375, 5.81591796875, 6.2890625, 6.76220703125, 7.2353515625, 7.70849609375, 8.181640625, 8.65478515625, 9.1279296875, 9.60107421875, 10.07421875, 10.54736328125, 11.0205078125, 11.49365234375, 11.966796875, 12.43994140625, 12.9130859375, 13.38623046875, 13.859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 3.0, 4.0, 9.0, 17.0, 18.0, 38.0, 44.0, 58.0, 99.0, 204.0, 298.0, 467.0, 810.0, 1376.0, 3029.0, 8293.0, 31383.0, 198509.0, 629443.0, 137775.0, 24161.0, 6653.0, 2695.0, 1303.0, 767.0, 460.0, 224.0, 137.0, 86.0, 64.0, 42.0, 23.0, 26.0, 6.0, 11.0, 4.0, 3.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.15625, -15.625, -15.09375, -14.5625, -14.03125, -13.5, -12.96875, -12.4375, -11.90625, -11.375, -10.84375, -10.3125, -9.78125, -9.25, -8.71875, -8.1875, -7.65625, -7.125, -6.59375, -6.0625, -5.53125, -5.0, -4.46875, -3.9375, -3.40625, -2.875, -2.34375, -1.8125, -1.28125, -0.75, -0.21875, 0.3125, 0.84375, 1.375, 1.90625, 2.4375, 2.96875, 3.5, 4.03125, 4.5625, 5.09375, 5.625, 6.15625, 6.6875, 7.21875, 7.75, 8.28125, 8.8125, 9.34375, 9.875, 10.40625, 10.9375, 11.46875, 12.0, 12.53125, 13.0625, 13.59375, 14.125, 14.65625, 15.1875, 15.71875, 16.25, 16.78125, 17.3125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 4.0, 13.0, 9.0, 14.0, 18.0, 28.0, 43.0, 68.0, 105.0, 191.0, 180.0, 117.0, 67.0, 41.0, 29.0, 21.0, 10.0, 12.0, 7.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0033512115478515625, -0.003243178129196167, -0.0031351447105407715, -0.003027111291885376, -0.0029190778732299805, -0.002811044454574585, -0.0027030110359191895, -0.002594977617263794, -0.0024869441986083984, -0.002378910779953003, -0.0022708773612976074, -0.002162843942642212, -0.0020548105239868164, -0.001946777105331421, -0.0018387436866760254, -0.0017307102680206299, -0.0016226768493652344, -0.0015146434307098389, -0.0014066100120544434, -0.0012985765933990479, -0.0011905431747436523, -0.0010825097560882568, -0.0009744763374328613, -0.0008664429187774658, -0.0007584095001220703, -0.0006503760814666748, -0.0005423426628112793, -0.0004343092441558838, -0.0003262758255004883, -0.00021824240684509277, -0.00011020898818969727, -2.175569534301758e-06, 0.00010585784912109375, 0.00021389126777648926, 0.00032192468643188477, 0.0004299581050872803, 0.0005379915237426758, 0.0006460249423980713, 0.0007540583610534668, 0.0008620917797088623, 0.0009701251983642578, 0.0010781586170196533, 0.0011861920356750488, 0.0012942254543304443, 0.0014022588729858398, 0.0015102922916412354, 0.0016183257102966309, 0.0017263591289520264, 0.0018343925476074219, 0.0019424259662628174, 0.002050459384918213, 0.0021584928035736084, 0.002266526222229004, 0.0023745596408843994, 0.002482593059539795, 0.0025906264781951904, 0.002698659896850586, 0.0028066933155059814, 0.002914726734161377, 0.0030227601528167725, 0.003130793571472168, 0.0032388269901275635, 0.003346860408782959, 0.0034548938274383545, 0.00356292724609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 11.0, 7.0, 10.0, 12.0, 22.0, 31.0, 44.0, 62.0, 118.0, 150.0, 282.0, 396.0, 669.0, 1213.0, 2298.0, 5171.0, 15093.0, 64844.0, 435639.0, 432483.0, 64470.0, 15022.0, 5200.0, 2343.0, 1173.0, 665.0, 399.0, 261.0, 154.0, 95.0, 54.0, 49.0, 25.0, 25.0, 15.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.703125, -15.196533203125, -14.68994140625, -14.183349609375, -13.6767578125, -13.170166015625, -12.66357421875, -12.156982421875, -11.650390625, -11.143798828125, -10.63720703125, -10.130615234375, -9.6240234375, -9.117431640625, -8.61083984375, -8.104248046875, -7.59765625, -7.091064453125, -6.58447265625, -6.077880859375, -5.5712890625, -5.064697265625, -4.55810546875, -4.051513671875, -3.544921875, -3.038330078125, -2.53173828125, -2.025146484375, -1.5185546875, -1.011962890625, -0.50537109375, 0.001220703125, 0.5078125, 1.014404296875, 1.52099609375, 2.027587890625, 2.5341796875, 3.040771484375, 3.54736328125, 4.053955078125, 4.560546875, 5.067138671875, 5.57373046875, 6.080322265625, 6.5869140625, 7.093505859375, 7.60009765625, 8.106689453125, 8.61328125, 9.119873046875, 9.62646484375, 10.133056640625, 10.6396484375, 11.146240234375, 11.65283203125, 12.159423828125, 12.666015625, 13.172607421875, 13.67919921875, 14.185791015625, 14.6923828125, 15.198974609375, 15.70556640625, 16.212158203125, 16.71875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 7.0, 13.0, 23.0, 38.0, 52.0, 76.0, 101.0, 124.0, 136.0, 136.0, 85.0, 65.0, 43.0, 29.0, 20.0, 11.0, 6.0, 7.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.4609375, -13.079345703125, -12.69775390625, -12.316162109375, -11.9345703125, -11.552978515625, -11.17138671875, -10.789794921875, -10.408203125, -10.026611328125, -9.64501953125, -9.263427734375, -8.8818359375, -8.500244140625, -8.11865234375, -7.737060546875, -7.35546875, -6.973876953125, -6.59228515625, -6.210693359375, -5.8291015625, -5.447509765625, -5.06591796875, -4.684326171875, -4.302734375, -3.921142578125, -3.53955078125, -3.157958984375, -2.7763671875, -2.394775390625, -2.01318359375, -1.631591796875, -1.25, -0.868408203125, -0.48681640625, -0.105224609375, 0.2763671875, 0.657958984375, 1.03955078125, 1.421142578125, 1.802734375, 2.184326171875, 2.56591796875, 2.947509765625, 3.3291015625, 3.710693359375, 4.09228515625, 4.473876953125, 4.85546875, 5.237060546875, 5.61865234375, 6.000244140625, 6.3818359375, 6.763427734375, 7.14501953125, 7.526611328125, 7.908203125, 8.289794921875, 8.67138671875, 9.052978515625, 9.4345703125, 9.816162109375, 10.19775390625, 10.579345703125, 10.9609375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 12.0, 11.0, 23.0, 28.0, 45.0, 66.0, 92.0, 123.0, 119.0, 131.0, 107.0, 81.0, 51.0, 42.0, 26.0, 16.0, 11.0, 8.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-198.13973999023438, -192.74169921875, -187.34364318847656, -181.9456024169922, -176.5475616455078, -171.14952087402344, -165.75146484375, -160.35342407226562, -154.95538330078125, -149.55734252929688, -144.15928649902344, -138.76124572753906, -133.3632049560547, -127.96515655517578, -122.56710815429688, -117.1690673828125, -111.7710189819336, -106.37297058105469, -100.97492980957031, -95.5768814086914, -90.17884063720703, -84.78079223632812, -79.38275146484375, -73.98470306396484, -68.58665466308594, -63.1886100769043, -57.790565490722656, -52.39251708984375, -46.994476318359375, -41.59642791748047, -36.19838333129883, -30.800338745117188, -25.402297973632812, -20.004253387451172, -14.606207847595215, -9.208162307739258, -3.810117721557617, 1.5879268646240234, 6.985973358154297, 12.384017944335938, 17.782062530517578, 23.18010711669922, 28.57815170288086, 33.9761962890625, 39.374244689941406, 44.77228546142578, 50.17033386230469, 55.56837844848633, 60.96642303466797, 66.36447143554688, 71.76251220703125, 77.16056060791016, 82.55860137939453, 87.95664978027344, 93.35469055175781, 98.75273895263672, 104.15078735351562, 109.54883575439453, 114.9468765258789, 120.34492492675781, 125.74296569824219, 131.14100646972656, 136.5390625, 141.93710327148438, 147.33514404296875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 7.0, 8.0, 21.0, 7.0, 16.0, 13.0, 35.0, 33.0, 37.0, 22.0, 34.0, 38.0, 52.0, 43.0, 56.0, 53.0, 65.0, 45.0, 59.0, 42.0, 47.0, 45.0, 35.0, 23.0, 29.0, 9.0, 23.0, 13.0, 12.0, 7.0, 14.0, 8.0, 5.0, 7.0, 6.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.4470443725586, -98.230712890625, -95.0143814086914, -91.79804992675781, -88.58171081542969, -85.3653793334961, -82.1490478515625, -78.9327163696289, -75.71638488769531, -72.50005340576172, -69.28372192382812, -66.0673828125, -62.851051330566406, -59.63471984863281, -56.41838836669922, -53.202056884765625, -49.9857177734375, -46.769386291503906, -43.55305099487305, -40.33671951293945, -37.120384216308594, -33.904052734375, -30.687721252441406, -27.47138786315918, -24.255054473876953, -21.038721084594727, -17.8223876953125, -14.606056213378906, -11.38972282409668, -8.173389434814453, -4.957057952880859, -1.7407245635986328, 1.475616455078125, 4.691949367523193, 7.908282279968262, 11.124614715576172, 14.340948104858398, 17.557281494140625, 20.77361297607422, 23.989946365356445, 27.206279754638672, 30.4226131439209, 33.638946533203125, 36.85527801513672, 40.07160949707031, 43.28794479370117, 46.504276275634766, 49.720611572265625, 52.93694305419922, 56.15327453613281, 59.36960983276367, 62.585941314697266, 65.80227661132812, 69.01860809326172, 72.23493957519531, 75.4512710571289, 78.6676025390625, 81.8839340209961, 85.10026550292969, 88.31660461425781, 91.5329360961914, 94.749267578125, 97.9655990600586, 101.18193054199219, 104.39826965332031]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 10.0, 4.0, 10.0, 13.0, 12.0, 14.0, 18.0, 29.0, 37.0, 44.0, 63.0, 93.0, 129.0, 221.0, 299.0, 435.0, 660.0, 1148.0, 2045.0, 3834.0, 7857.0, 17940.0, 47756.0, 173206.0, 3038014.0, 733124.0, 105489.0, 33577.0, 13795.0, 6339.0, 3333.0, 1795.0, 1047.0, 666.0, 421.0, 267.0, 182.0, 130.0, 59.0, 46.0, 35.0, 23.0, 21.0, 10.0, 14.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-29.84375, -28.90625, -27.96875, -27.03125, -26.09375, -25.15625, -24.21875, -23.28125, -22.34375, -21.40625, -20.46875, -19.53125, -18.59375, -17.65625, -16.71875, -15.78125, -14.84375, -13.90625, -12.96875, -12.03125, -11.09375, -10.15625, -9.21875, -8.28125, -7.34375, -6.40625, -5.46875, -4.53125, -3.59375, -2.65625, -1.71875, -0.78125, 0.15625, 1.09375, 2.03125, 2.96875, 3.90625, 4.84375, 5.78125, 6.71875, 7.65625, 8.59375, 9.53125, 10.46875, 11.40625, 12.34375, 13.28125, 14.21875, 15.15625, 16.09375, 17.03125, 17.96875, 18.90625, 19.84375, 20.78125, 21.71875, 22.65625, 23.59375, 24.53125, 25.46875, 26.40625, 27.34375, 28.28125, 29.21875, 30.15625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 9.0, 10.0, 21.0, 22.0, 17.0, 47.0, 42.0, 47.0, 69.0, 76.0, 89.0, 69.0, 59.0, 71.0, 76.0, 53.0, 54.0, 32.0, 29.0, 29.0, 14.0, 19.0, 20.0, 9.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5859375, -5.416748046875, -5.24755859375, -5.078369140625, -4.9091796875, -4.739990234375, -4.57080078125, -4.401611328125, -4.232421875, -4.063232421875, -3.89404296875, -3.724853515625, -3.5556640625, -3.386474609375, -3.21728515625, -3.048095703125, -2.87890625, -2.709716796875, -2.54052734375, -2.371337890625, -2.2021484375, -2.032958984375, -1.86376953125, -1.694580078125, -1.525390625, -1.356201171875, -1.18701171875, -1.017822265625, -0.8486328125, -0.679443359375, -0.51025390625, -0.341064453125, -0.171875, -0.002685546875, 0.16650390625, 0.335693359375, 0.5048828125, 0.674072265625, 0.84326171875, 1.012451171875, 1.181640625, 1.350830078125, 1.52001953125, 1.689208984375, 1.8583984375, 2.027587890625, 2.19677734375, 2.365966796875, 2.53515625, 2.704345703125, 2.87353515625, 3.042724609375, 3.2119140625, 3.381103515625, 3.55029296875, 3.719482421875, 3.888671875, 4.057861328125, 4.22705078125, 4.396240234375, 4.5654296875, 4.734619140625, 4.90380859375, 5.072998046875, 5.2421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 12.0, 16.0, 21.0, 20.0, 44.0, 40.0, 75.0, 76.0, 133.0, 170.0, 278.0, 428.0, 653.0, 1124.0, 1963.0, 3839.0, 8004.0, 21220.0, 76875.0, 461134.0, 3209685.0, 318436.0, 59836.0, 16731.0, 6383.0, 3042.0, 1562.0, 922.0, 522.0, 315.0, 224.0, 132.0, 80.0, 78.0, 53.0, 41.0, 29.0, 23.0, 8.0, 13.0, 8.0, 7.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-32.59375, -31.55615234375, -30.5185546875, -29.48095703125, -28.443359375, -27.40576171875, -26.3681640625, -25.33056640625, -24.29296875, -23.25537109375, -22.2177734375, -21.18017578125, -20.142578125, -19.10498046875, -18.0673828125, -17.02978515625, -15.9921875, -14.95458984375, -13.9169921875, -12.87939453125, -11.841796875, -10.80419921875, -9.7666015625, -8.72900390625, -7.69140625, -6.65380859375, -5.6162109375, -4.57861328125, -3.541015625, -2.50341796875, -1.4658203125, -0.42822265625, 0.609375, 1.64697265625, 2.6845703125, 3.72216796875, 4.759765625, 5.79736328125, 6.8349609375, 7.87255859375, 8.91015625, 9.94775390625, 10.9853515625, 12.02294921875, 13.060546875, 14.09814453125, 15.1357421875, 16.17333984375, 17.2109375, 18.24853515625, 19.2861328125, 20.32373046875, 21.361328125, 22.39892578125, 23.4365234375, 24.47412109375, 25.51171875, 26.54931640625, 27.5869140625, 28.62451171875, 29.662109375, 30.69970703125, 31.7373046875, 32.77490234375, 33.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 10.0, 1.0, 7.0, 10.0, 15.0, 13.0, 22.0, 35.0, 52.0, 75.0, 130.0, 221.0, 406.0, 1390.0, 780.0, 355.0, 199.0, 120.0, 82.0, 50.0, 27.0, 15.0, 20.0, 12.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -16.0599365234375, -15.635498046875, -15.2110595703125, -14.78662109375, -14.3621826171875, -13.937744140625, -13.5133056640625, -13.0888671875, -12.6644287109375, -12.239990234375, -11.8155517578125, -11.39111328125, -10.9666748046875, -10.542236328125, -10.1177978515625, -9.693359375, -9.2689208984375, -8.844482421875, -8.4200439453125, -7.99560546875, -7.5711669921875, -7.146728515625, -6.7222900390625, -6.2978515625, -5.8734130859375, -5.448974609375, -5.0245361328125, -4.60009765625, -4.1756591796875, -3.751220703125, -3.3267822265625, -2.90234375, -2.4779052734375, -2.053466796875, -1.6290283203125, -1.20458984375, -0.7801513671875, -0.355712890625, 0.0687255859375, 0.4931640625, 0.9176025390625, 1.342041015625, 1.7664794921875, 2.19091796875, 2.6153564453125, 3.039794921875, 3.4642333984375, 3.888671875, 4.3131103515625, 4.737548828125, 5.1619873046875, 5.58642578125, 6.0108642578125, 6.435302734375, 6.8597412109375, 7.2841796875, 7.7086181640625, 8.133056640625, 8.5574951171875, 8.98193359375, 9.4063720703125, 9.830810546875, 10.2552490234375, 10.6796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 30.0, 48.0, 106.0, 160.0, 213.0, 205.0, 117.0, 63.0, 22.0, 11.0, 4.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.431396484375, -203.17308044433594, -197.9147491455078, -192.65643310546875, -187.3981170654297, -182.13978576660156, -176.8814697265625, -171.62313842773438, -166.3648223876953, -161.10650634765625, -155.84817504882812, -150.58985900878906, -145.33154296875, -140.07321166992188, -134.8148956298828, -129.55657958984375, -124.29825592041016, -119.03993225097656, -113.7816162109375, -108.5232925415039, -103.26496887207031, -98.00665283203125, -92.74832916259766, -87.49000549316406, -82.231689453125, -76.9733657836914, -71.71504974365234, -66.45672607421875, -61.198402404785156, -55.94008255004883, -50.6817626953125, -45.423439025878906, -40.16511535644531, -34.906795501708984, -29.64847183227539, -24.390151977539062, -19.1318302154541, -13.87350845336914, -8.615188598632812, -3.3568649291992188, 1.9014549255371094, 7.159776210784912, 12.418097496032715, 17.67641830444336, 22.93474006652832, 28.19306182861328, 33.45138168334961, 38.7097053527832, 43.96802520751953, 49.22634506225586, 54.48466873168945, 59.74298858642578, 65.00131225585938, 70.25962829589844, 75.51795196533203, 80.77627563476562, 86.03459167480469, 91.29291534423828, 96.55123138427734, 101.80955505371094, 107.06787872314453, 112.32620239257812, 117.58451843261719, 122.84284210205078, 128.10116577148438]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 11.0, 8.0, 22.0, 31.0, 20.0, 39.0, 33.0, 69.0, 49.0, 57.0, 79.0, 68.0, 78.0, 76.0, 55.0, 64.0, 48.0, 42.0, 33.0, 29.0, 24.0, 18.0, 12.0, 14.0, 10.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.65126037597656, -60.55528259277344, -58.45930480957031, -56.36332702636719, -54.26734924316406, -52.17137145996094, -50.07539749145508, -47.97941970825195, -45.88344192504883, -43.7874641418457, -41.69148635864258, -39.59550857543945, -37.499534606933594, -35.40355682373047, -33.307579040527344, -31.21160125732422, -29.115623474121094, -27.01964569091797, -24.923667907714844, -22.82769203186035, -20.731714248657227, -18.6357364654541, -16.53976058959961, -14.443782806396484, -12.34780502319336, -10.251827239990234, -8.155850410461426, -6.059873104095459, -3.963895797729492, -1.8679180145263672, 0.2280588150024414, 2.32403564453125, 4.420013427734375, 6.515990734100342, 8.611968040466309, 10.707944869995117, 12.803922653198242, 14.899900436401367, 16.99587631225586, 19.091854095458984, 21.18783187866211, 23.283809661865234, 25.37978744506836, 27.47576332092285, 29.571741104125977, 31.6677188873291, 33.763694763183594, 35.85967254638672, 37.955650329589844, 40.05162811279297, 42.147605895996094, 44.24358367919922, 46.339561462402344, 48.43553924560547, 50.53151321411133, 52.62749099731445, 54.72346878051758, 56.8194465637207, 58.91542434692383, 61.01140213012695, 63.10737609863281, 65.20335388183594, 67.29933166503906, 69.39530944824219, 71.49128723144531]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 3.0, 9.0, 20.0, 24.0, 28.0, 42.0, 71.0, 94.0, 142.0, 251.0, 344.0, 655.0, 1171.0, 2523.0, 7051.0, 24578.0, 111913.0, 524481.0, 293358.0, 59086.0, 14142.0, 4418.0, 1783.0, 953.0, 499.0, 280.0, 208.0, 120.0, 81.0, 67.0, 41.0, 30.0, 19.0, 16.0, 8.0, 6.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-48.28125, -46.8525390625, -45.423828125, -43.9951171875, -42.56640625, -41.1376953125, -39.708984375, -38.2802734375, -36.8515625, -35.4228515625, -33.994140625, -32.5654296875, -31.13671875, -29.7080078125, -28.279296875, -26.8505859375, -25.421875, -23.9931640625, -22.564453125, -21.1357421875, -19.70703125, -18.2783203125, -16.849609375, -15.4208984375, -13.9921875, -12.5634765625, -11.134765625, -9.7060546875, -8.27734375, -6.8486328125, -5.419921875, -3.9912109375, -2.5625, -1.1337890625, 0.294921875, 1.7236328125, 3.15234375, 4.5810546875, 6.009765625, 7.4384765625, 8.8671875, 10.2958984375, 11.724609375, 13.1533203125, 14.58203125, 16.0107421875, 17.439453125, 18.8681640625, 20.296875, 21.7255859375, 23.154296875, 24.5830078125, 26.01171875, 27.4404296875, 28.869140625, 30.2978515625, 31.7265625, 33.1552734375, 34.583984375, 36.0126953125, 37.44140625, 38.8701171875, 40.298828125, 41.7275390625, 43.15625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 11.0, 15.0, 26.0, 40.0, 49.0, 57.0, 100.0, 87.0, 82.0, 96.0, 92.0, 83.0, 71.0, 46.0, 42.0, 30.0, 24.0, 14.0, 15.0, 9.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.69140625, -6.47125244140625, -6.2510986328125, -6.03094482421875, -5.810791015625, -5.59063720703125, -5.3704833984375, -5.15032958984375, -4.93017578125, -4.71002197265625, -4.4898681640625, -4.26971435546875, -4.049560546875, -3.82940673828125, -3.6092529296875, -3.38909912109375, -3.1689453125, -2.94879150390625, -2.7286376953125, -2.50848388671875, -2.288330078125, -2.06817626953125, -1.8480224609375, -1.62786865234375, -1.40771484375, -1.18756103515625, -0.9674072265625, -0.74725341796875, -0.527099609375, -0.30694580078125, -0.0867919921875, 0.13336181640625, 0.353515625, 0.57366943359375, 0.7938232421875, 1.01397705078125, 1.234130859375, 1.45428466796875, 1.6744384765625, 1.89459228515625, 2.11474609375, 2.33489990234375, 2.5550537109375, 2.77520751953125, 2.995361328125, 3.21551513671875, 3.4356689453125, 3.65582275390625, 3.8759765625, 4.09613037109375, 4.3162841796875, 4.53643798828125, 4.756591796875, 4.97674560546875, 5.1968994140625, 5.41705322265625, 5.63720703125, 5.85736083984375, 6.0775146484375, 6.29766845703125, 6.517822265625, 6.73797607421875, 6.9581298828125, 7.17828369140625, 7.3984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 7.0, 11.0, 10.0, 12.0, 32.0, 38.0, 48.0, 67.0, 104.0, 185.0, 300.0, 424.0, 651.0, 1159.0, 2022.0, 3847.0, 7384.0, 15230.0, 32365.0, 69815.0, 153651.0, 302494.0, 245451.0, 113301.0, 51742.0, 23988.0, 11410.0, 5582.0, 2917.0, 1582.0, 1010.0, 598.0, 354.0, 241.0, 161.0, 124.0, 68.0, 54.0, 35.0, 35.0, 18.0, 8.0, 9.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.71875, -15.2396240234375, -14.760498046875, -14.2813720703125, -13.80224609375, -13.3231201171875, -12.843994140625, -12.3648681640625, -11.8857421875, -11.4066162109375, -10.927490234375, -10.4483642578125, -9.96923828125, -9.4901123046875, -9.010986328125, -8.5318603515625, -8.052734375, -7.5736083984375, -7.094482421875, -6.6153564453125, -6.13623046875, -5.6571044921875, -5.177978515625, -4.6988525390625, -4.2197265625, -3.7406005859375, -3.261474609375, -2.7823486328125, -2.30322265625, -1.8240966796875, -1.344970703125, -0.8658447265625, -0.38671875, 0.0924072265625, 0.571533203125, 1.0506591796875, 1.52978515625, 2.0089111328125, 2.488037109375, 2.9671630859375, 3.4462890625, 3.9254150390625, 4.404541015625, 4.8836669921875, 5.36279296875, 5.8419189453125, 6.321044921875, 6.8001708984375, 7.279296875, 7.7584228515625, 8.237548828125, 8.7166748046875, 9.19580078125, 9.6749267578125, 10.154052734375, 10.6331787109375, 11.1123046875, 11.5914306640625, 12.070556640625, 12.5496826171875, 13.02880859375, 13.5079345703125, 13.987060546875, 14.4661865234375, 14.9453125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 6.0, 4.0, 8.0, 6.0, 10.0, 11.0, 9.0, 12.0, 16.0, 21.0, 21.0, 22.0, 21.0, 38.0, 33.0, 34.0, 30.0, 48.0, 43.0, 43.0, 43.0, 51.0, 50.0, 37.0, 40.0, 38.0, 41.0, 41.0, 34.0, 25.0, 32.0, 20.0, 21.0, 11.0, 15.0, 13.0, 14.0, 7.0, 7.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -14.06201171875, -13.6083984375, -13.15478515625, -12.701171875, -12.24755859375, -11.7939453125, -11.34033203125, -10.88671875, -10.43310546875, -9.9794921875, -9.52587890625, -9.072265625, -8.61865234375, -8.1650390625, -7.71142578125, -7.2578125, -6.80419921875, -6.3505859375, -5.89697265625, -5.443359375, -4.98974609375, -4.5361328125, -4.08251953125, -3.62890625, -3.17529296875, -2.7216796875, -2.26806640625, -1.814453125, -1.36083984375, -0.9072265625, -0.45361328125, 0.0, 0.45361328125, 0.9072265625, 1.36083984375, 1.814453125, 2.26806640625, 2.7216796875, 3.17529296875, 3.62890625, 4.08251953125, 4.5361328125, 4.98974609375, 5.443359375, 5.89697265625, 6.3505859375, 6.80419921875, 7.2578125, 7.71142578125, 8.1650390625, 8.61865234375, 9.072265625, 9.52587890625, 9.9794921875, 10.43310546875, 10.88671875, 11.34033203125, 11.7939453125, 12.24755859375, 12.701171875, 13.15478515625, 13.6083984375, 14.06201171875, 14.515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 14.0, 10.0, 24.0, 48.0, 65.0, 111.0, 205.0, 427.0, 892.0, 1941.0, 4491.0, 12763.0, 45392.0, 203443.0, 520645.0, 193895.0, 43523.0, 12510.0, 4543.0, 1777.0, 876.0, 400.0, 212.0, 115.0, 71.0, 51.0, 21.0, 19.0, 14.0, 14.0, 10.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.953125, -11.5477294921875, -11.142333984375, -10.7369384765625, -10.33154296875, -9.9261474609375, -9.520751953125, -9.1153564453125, -8.7099609375, -8.3045654296875, -7.899169921875, -7.4937744140625, -7.08837890625, -6.6829833984375, -6.277587890625, -5.8721923828125, -5.466796875, -5.0614013671875, -4.656005859375, -4.2506103515625, -3.84521484375, -3.4398193359375, -3.034423828125, -2.6290283203125, -2.2236328125, -1.8182373046875, -1.412841796875, -1.0074462890625, -0.60205078125, -0.1966552734375, 0.208740234375, 0.6141357421875, 1.01953125, 1.4249267578125, 1.830322265625, 2.2357177734375, 2.64111328125, 3.0465087890625, 3.451904296875, 3.8572998046875, 4.2626953125, 4.6680908203125, 5.073486328125, 5.4788818359375, 5.88427734375, 6.2896728515625, 6.695068359375, 7.1004638671875, 7.505859375, 7.9112548828125, 8.316650390625, 8.7220458984375, 9.12744140625, 9.5328369140625, 9.938232421875, 10.3436279296875, 10.7490234375, 11.1544189453125, 11.559814453125, 11.9652099609375, 12.37060546875, 12.7760009765625, 13.181396484375, 13.5867919921875, 13.9921875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 15.0, 18.0, 26.0, 35.0, 36.0, 72.0, 127.0, 211.0, 166.0, 95.0, 55.0, 33.0, 29.0, 15.0, 16.0, 9.0, 8.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002529144287109375, -0.002443850040435791, -0.002358555793762207, -0.002273261547088623, -0.002187967300415039, -0.002102673053741455, -0.002017378807067871, -0.0019320845603942871, -0.0018467903137207031, -0.0017614960670471191, -0.0016762018203735352, -0.0015909075736999512, -0.0015056133270263672, -0.0014203190803527832, -0.0013350248336791992, -0.0012497305870056152, -0.0011644363403320312, -0.0010791420936584473, -0.0009938478469848633, -0.0009085536003112793, -0.0008232593536376953, -0.0007379651069641113, -0.0006526708602905273, -0.0005673766136169434, -0.0004820823669433594, -0.0003967881202697754, -0.0003114938735961914, -0.00022619962692260742, -0.00014090538024902344, -5.561113357543945e-05, 2.968311309814453e-05, 0.00011497735977172852, 0.0002002716064453125, 0.0002855658531188965, 0.00037086009979248047, 0.00045615434646606445, 0.0005414485931396484, 0.0006267428398132324, 0.0007120370864868164, 0.0007973313331604004, 0.0008826255798339844, 0.0009679198265075684, 0.0010532140731811523, 0.0011385083198547363, 0.0012238025665283203, 0.0013090968132019043, 0.0013943910598754883, 0.0014796853065490723, 0.0015649795532226562, 0.0016502737998962402, 0.0017355680465698242, 0.0018208622932434082, 0.0019061565399169922, 0.001991450786590576, 0.00207674503326416, 0.002162039279937744, 0.002247333526611328, 0.002332627773284912, 0.002417922019958496, 0.00250321626663208, 0.002588510513305664, 0.002673804759979248, 0.002759099006652832, 0.002844393253326416, 0.0029296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 6.0, 9.0, 10.0, 17.0, 13.0, 20.0, 46.0, 53.0, 91.0, 145.0, 201.0, 393.0, 619.0, 1229.0, 2293.0, 4611.0, 10630.0, 29044.0, 97214.0, 341769.0, 385209.0, 118163.0, 33976.0, 12108.0, 5159.0, 2480.0, 1212.0, 701.0, 438.0, 249.0, 152.0, 88.0, 78.0, 48.0, 15.0, 16.0, 14.0, 11.0, 7.0, 8.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.109375, -10.7734375, -10.4375, -10.1015625, -9.765625, -9.4296875, -9.09375, -8.7578125, -8.421875, -8.0859375, -7.75, -7.4140625, -7.078125, -6.7421875, -6.40625, -6.0703125, -5.734375, -5.3984375, -5.0625, -4.7265625, -4.390625, -4.0546875, -3.71875, -3.3828125, -3.046875, -2.7109375, -2.375, -2.0390625, -1.703125, -1.3671875, -1.03125, -0.6953125, -0.359375, -0.0234375, 0.3125, 0.6484375, 0.984375, 1.3203125, 1.65625, 1.9921875, 2.328125, 2.6640625, 3.0, 3.3359375, 3.671875, 4.0078125, 4.34375, 4.6796875, 5.015625, 5.3515625, 5.6875, 6.0234375, 6.359375, 6.6953125, 7.03125, 7.3671875, 7.703125, 8.0390625, 8.375, 8.7109375, 9.046875, 9.3828125, 9.71875, 10.0546875, 10.390625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 11.0, 20.0, 25.0, 18.0, 38.0, 33.0, 63.0, 82.0, 84.0, 90.0, 113.0, 92.0, 81.0, 59.0, 41.0, 27.0, 21.0, 23.0, 17.0, 10.0, 12.0, 3.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.4921875, -11.20684814453125, -10.9215087890625, -10.63616943359375, -10.350830078125, -10.06549072265625, -9.7801513671875, -9.49481201171875, -9.20947265625, -8.92413330078125, -8.6387939453125, -8.35345458984375, -8.068115234375, -7.78277587890625, -7.4974365234375, -7.21209716796875, -6.9267578125, -6.64141845703125, -6.3560791015625, -6.07073974609375, -5.785400390625, -5.50006103515625, -5.2147216796875, -4.92938232421875, -4.64404296875, -4.35870361328125, -4.0733642578125, -3.78802490234375, -3.502685546875, -3.21734619140625, -2.9320068359375, -2.64666748046875, -2.361328125, -2.07598876953125, -1.7906494140625, -1.50531005859375, -1.219970703125, -0.93463134765625, -0.6492919921875, -0.36395263671875, -0.07861328125, 0.20672607421875, 0.4920654296875, 0.77740478515625, 1.062744140625, 1.34808349609375, 1.6334228515625, 1.91876220703125, 2.2041015625, 2.48944091796875, 2.7747802734375, 3.06011962890625, 3.345458984375, 3.63079833984375, 3.9161376953125, 4.20147705078125, 4.48681640625, 4.77215576171875, 5.0574951171875, 5.34283447265625, 5.628173828125, 5.91351318359375, 6.1988525390625, 6.48419189453125, 6.76953125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 3.0, 10.0, 13.0, 22.0, 31.0, 34.0, 61.0, 72.0, 87.0, 118.0, 129.0, 102.0, 93.0, 64.0, 63.0, 19.0, 31.0, 20.0, 16.0, 2.0, 6.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-170.14627075195312, -165.8067169189453, -161.46717834472656, -157.12762451171875, -152.78807067871094, -148.4485321044922, -144.10897827148438, -139.76942443847656, -135.4298858642578, -131.09033203125, -126.75078582763672, -122.41123962402344, -118.07169342041016, -113.73214721679688, -109.39259338378906, -105.05304718017578, -100.71349334716797, -96.37394714355469, -92.03439331054688, -87.6948471069336, -83.35530090332031, -79.0157470703125, -74.67620086669922, -70.33665466308594, -65.99710083007812, -61.65755081176758, -57.3180046081543, -52.97845458984375, -48.63890838623047, -44.29935836791992, -39.959808349609375, -35.620262145996094, -31.280723571777344, -26.94117546081543, -22.601627349853516, -18.26207733154297, -13.922529220581055, -9.58298110961914, -5.243431091308594, -0.9038829803466797, 3.4356651306152344, 7.775213718414307, 12.114762306213379, 16.45431137084961, 20.793859481811523, 25.133407592773438, 29.472957611083984, 33.81250762939453, 38.15205383300781, 42.49160385131836, 46.83115005493164, 51.17070007324219, 55.51024627685547, 59.849796295166016, 64.18934631347656, 68.52889251708984, 72.86843872070312, 77.2079849243164, 81.54753875732422, 85.8870849609375, 90.22663116455078, 94.56617736816406, 98.90573120117188, 103.24527740478516, 107.58483123779297]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 8.0, 8.0, 19.0, 21.0, 26.0, 25.0, 37.0, 28.0, 45.0, 51.0, 52.0, 54.0, 48.0, 64.0, 45.0, 50.0, 55.0, 34.0, 43.0, 48.0, 35.0, 29.0, 17.0, 26.0, 24.0, 17.0, 19.0, 14.0, 12.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.37962341308594, -102.38147735595703, -99.3833236694336, -96.38517761230469, -93.38702392578125, -90.38887786865234, -87.39073181152344, -84.392578125, -81.39442443847656, -78.39627838134766, -75.39812469482422, -72.39997863769531, -69.40182495117188, -66.40367889404297, -63.4055290222168, -60.407379150390625, -57.40923309326172, -54.41108322143555, -51.412933349609375, -48.41478729248047, -45.41663360595703, -42.418487548828125, -39.42033767700195, -36.42218780517578, -33.42403793334961, -30.425888061523438, -27.427738189697266, -24.429590225219727, -21.431440353393555, -18.433290481567383, -15.435142517089844, -12.436992645263672, -9.438850402832031, -6.440701007843018, -3.442551612854004, -0.44440269470214844, 2.5537471771240234, 5.551897048950195, 8.550045013427734, 11.548194885253906, 14.546344757080078, 17.54449462890625, 20.542644500732422, 23.54079246520996, 26.538942337036133, 29.537092208862305, 32.535240173339844, 35.533390045166016, 38.53153991699219, 41.52968978881836, 44.52783966064453, 47.52598571777344, 50.524139404296875, 53.52228546142578, 56.52043533325195, 59.518585205078125, 62.5167350769043, 65.51488494873047, 68.51303100585938, 71.51118469238281, 74.50933074951172, 77.50748443603516, 80.50563049316406, 83.5037841796875, 86.5019302368164]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 6.0, 5.0, 9.0, 14.0, 12.0, 27.0, 21.0, 36.0, 58.0, 74.0, 143.0, 240.0, 483.0, 1014.0, 2345.0, 7194.0, 38033.0, 3350046.0, 754917.0, 29646.0, 6160.0, 2021.0, 892.0, 412.0, 198.0, 109.0, 62.0, 38.0, 19.0, 13.0, 15.0, 7.0, 3.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.8125, -80.685546875, -78.55859375, -76.431640625, -74.3046875, -72.177734375, -70.05078125, -67.923828125, -65.796875, -63.669921875, -61.54296875, -59.416015625, -57.2890625, -55.162109375, -53.03515625, -50.908203125, -48.78125, -46.654296875, -44.52734375, -42.400390625, -40.2734375, -38.146484375, -36.01953125, -33.892578125, -31.765625, -29.638671875, -27.51171875, -25.384765625, -23.2578125, -21.130859375, -19.00390625, -16.876953125, -14.75, -12.623046875, -10.49609375, -8.369140625, -6.2421875, -4.115234375, -1.98828125, 0.138671875, 2.265625, 4.392578125, 6.51953125, 8.646484375, 10.7734375, 12.900390625, 15.02734375, 17.154296875, 19.28125, 21.408203125, 23.53515625, 25.662109375, 27.7890625, 29.916015625, 32.04296875, 34.169921875, 36.296875, 38.423828125, 40.55078125, 42.677734375, 44.8046875, 46.931640625, 49.05859375, 51.185546875, 53.3125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 11.0, 21.0, 30.0, 39.0, 56.0, 59.0, 72.0, 86.0, 96.0, 82.0, 74.0, 82.0, 63.0, 60.0, 48.0, 36.0, 28.0, 18.0, 13.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.375, -6.156982421875, -5.93896484375, -5.720947265625, -5.5029296875, -5.284912109375, -5.06689453125, -4.848876953125, -4.630859375, -4.412841796875, -4.19482421875, -3.976806640625, -3.7587890625, -3.540771484375, -3.32275390625, -3.104736328125, -2.88671875, -2.668701171875, -2.45068359375, -2.232666015625, -2.0146484375, -1.796630859375, -1.57861328125, -1.360595703125, -1.142578125, -0.924560546875, -0.70654296875, -0.488525390625, -0.2705078125, -0.052490234375, 0.16552734375, 0.383544921875, 0.6015625, 0.819580078125, 1.03759765625, 1.255615234375, 1.4736328125, 1.691650390625, 1.90966796875, 2.127685546875, 2.345703125, 2.563720703125, 2.78173828125, 2.999755859375, 3.2177734375, 3.435791015625, 3.65380859375, 3.871826171875, 4.08984375, 4.307861328125, 4.52587890625, 4.743896484375, 4.9619140625, 5.179931640625, 5.39794921875, 5.615966796875, 5.833984375, 6.052001953125, 6.27001953125, 6.488037109375, 6.7060546875, 6.924072265625, 7.14208984375, 7.360107421875, 7.578125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 6.0, 7.0, 11.0, 8.0, 12.0, 14.0, 27.0, 31.0, 39.0, 54.0, 68.0, 117.0, 197.0, 347.0, 682.0, 1475.0, 3465.0, 10260.0, 37203.0, 190282.0, 3229945.0, 610808.0, 79842.0, 19075.0, 5847.0, 2347.0, 966.0, 443.0, 273.0, 144.0, 75.0, 47.0, 45.0, 21.0, 18.0, 19.0, 10.0, 11.0, 5.0, 11.0, 9.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.875, -32.871337890625, -31.86767578125, -30.864013671875, -29.8603515625, -28.856689453125, -27.85302734375, -26.849365234375, -25.845703125, -24.842041015625, -23.83837890625, -22.834716796875, -21.8310546875, -20.827392578125, -19.82373046875, -18.820068359375, -17.81640625, -16.812744140625, -15.80908203125, -14.805419921875, -13.8017578125, -12.798095703125, -11.79443359375, -10.790771484375, -9.787109375, -8.783447265625, -7.77978515625, -6.776123046875, -5.7724609375, -4.768798828125, -3.76513671875, -2.761474609375, -1.7578125, -0.754150390625, 0.24951171875, 1.253173828125, 2.2568359375, 3.260498046875, 4.26416015625, 5.267822265625, 6.271484375, 7.275146484375, 8.27880859375, 9.282470703125, 10.2861328125, 11.289794921875, 12.29345703125, 13.297119140625, 14.30078125, 15.304443359375, 16.30810546875, 17.311767578125, 18.3154296875, 19.319091796875, 20.32275390625, 21.326416015625, 22.330078125, 23.333740234375, 24.33740234375, 25.341064453125, 26.3447265625, 27.348388671875, 28.35205078125, 29.355712890625, 30.359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 12.0, 12.0, 22.0, 29.0, 45.0, 58.0, 108.0, 154.0, 342.0, 1020.0, 1357.0, 392.0, 191.0, 125.0, 62.0, 47.0, 28.0, 17.0, 14.0, 8.0, 6.0, 3.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.4140625, -13.0616455078125, -12.709228515625, -12.3568115234375, -12.00439453125, -11.6519775390625, -11.299560546875, -10.9471435546875, -10.5947265625, -10.2423095703125, -9.889892578125, -9.5374755859375, -9.18505859375, -8.8326416015625, -8.480224609375, -8.1278076171875, -7.775390625, -7.4229736328125, -7.070556640625, -6.7181396484375, -6.36572265625, -6.0133056640625, -5.660888671875, -5.3084716796875, -4.9560546875, -4.6036376953125, -4.251220703125, -3.8988037109375, -3.54638671875, -3.1939697265625, -2.841552734375, -2.4891357421875, -2.13671875, -1.7843017578125, -1.431884765625, -1.0794677734375, -0.72705078125, -0.3746337890625, -0.022216796875, 0.3302001953125, 0.6826171875, 1.0350341796875, 1.387451171875, 1.7398681640625, 2.09228515625, 2.4447021484375, 2.797119140625, 3.1495361328125, 3.501953125, 3.8543701171875, 4.206787109375, 4.5592041015625, 4.91162109375, 5.2640380859375, 5.616455078125, 5.9688720703125, 6.3212890625, 6.6737060546875, 7.026123046875, 7.3785400390625, 7.73095703125, 8.0833740234375, 8.435791015625, 8.7882080078125, 9.140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 15.0, 26.0, 47.0, 74.0, 85.0, 113.0, 109.0, 139.0, 114.0, 92.0, 67.0, 46.0, 22.0, 16.0, 9.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.94747543334961, -52.6427116394043, -50.337947845458984, -48.03318405151367, -45.72842025756836, -43.42365646362305, -41.11888885498047, -38.814125061035156, -36.509361267089844, -34.20459747314453, -31.89983367919922, -29.595069885253906, -27.290306091308594, -24.98554229736328, -22.680776596069336, -20.376012802124023, -18.071250915527344, -15.766487121582031, -13.461723327636719, -11.15695858001709, -8.852194786071777, -6.547430992126465, -4.242666244506836, -1.9379024505615234, 0.36686134338378906, 2.6716253757476807, 4.976389408111572, 7.281153678894043, 9.585917472839355, 11.890681266784668, 14.195446014404297, 16.50020980834961, 18.804977416992188, 21.1097412109375, 23.414505004882812, 25.719268798828125, 28.024032592773438, 30.32879638671875, 32.63356018066406, 34.938323974609375, 37.24308776855469, 39.5478515625, 41.85261535644531, 44.157379150390625, 46.46214294433594, 48.76690673828125, 51.07167053222656, 53.376434326171875, 55.68120193481445, 57.985965728759766, 60.29072952270508, 62.59549331665039, 64.90026092529297, 67.20502471923828, 69.5097885131836, 71.8145523071289, 74.11931610107422, 76.42407989501953, 78.72884368896484, 81.03360748291016, 83.33837127685547, 85.64313507080078, 87.9478988647461, 90.2526626586914, 92.55742645263672]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 4.0, 8.0, 7.0, 7.0, 12.0, 7.0, 18.0, 17.0, 22.0, 24.0, 29.0, 32.0, 34.0, 39.0, 38.0, 47.0, 44.0, 46.0, 49.0, 49.0, 45.0, 61.0, 47.0, 36.0, 33.0, 36.0, 29.0, 27.0, 29.0, 27.0, 13.0, 11.0, 18.0, 17.0, 12.0, 10.0, 2.0, 6.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.967315673828125, -27.91663360595703, -26.865951538085938, -25.815269470214844, -24.76458740234375, -23.713905334472656, -22.66322135925293, -21.612539291381836, -20.561857223510742, -19.51117515563965, -18.460493087768555, -17.40981101989746, -16.359127044677734, -15.308445930480957, -14.257762908935547, -13.207080841064453, -12.15639877319336, -11.105716705322266, -10.055034637451172, -9.004351615905762, -7.953669548034668, -6.902987480163574, -5.852304935455322, -4.80162239074707, -3.7509403228759766, -2.7002580165863037, -1.6495757102966309, -0.598893404006958, 0.45178890228271484, 1.5024709701538086, 2.5531535148620605, 3.6038360595703125, 4.654518127441406, 5.7052001953125, 6.755882740020752, 7.806565284729004, 8.857247352600098, 9.907929420471191, 10.958612442016602, 12.009294509887695, 13.059976577758789, 14.110658645629883, 15.161340713500977, 16.21202278137207, 17.262706756591797, 18.31338882446289, 19.364070892333984, 20.414752960205078, 21.465435028076172, 22.516117095947266, 23.56679916381836, 24.617481231689453, 25.668163299560547, 26.71884536743164, 27.769529342651367, 28.82021141052246, 29.870893478393555, 30.92157554626465, 31.972257614135742, 33.02294158935547, 34.07362365722656, 35.124305725097656, 36.17498779296875, 37.225669860839844, 38.27635192871094]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 13.0, 19.0, 30.0, 45.0, 82.0, 131.0, 230.0, 436.0, 819.0, 1665.0, 4472.0, 16688.0, 92402.0, 567229.0, 303889.0, 45137.0, 9726.0, 2923.0, 1204.0, 586.0, 286.0, 186.0, 119.0, 69.0, 45.0, 39.0, 21.0, 17.0, 7.0, 4.0, 5.0, 6.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.84375, -54.087890625, -52.33203125, -50.576171875, -48.8203125, -47.064453125, -45.30859375, -43.552734375, -41.796875, -40.041015625, -38.28515625, -36.529296875, -34.7734375, -33.017578125, -31.26171875, -29.505859375, -27.75, -25.994140625, -24.23828125, -22.482421875, -20.7265625, -18.970703125, -17.21484375, -15.458984375, -13.703125, -11.947265625, -10.19140625, -8.435546875, -6.6796875, -4.923828125, -3.16796875, -1.412109375, 0.34375, 2.099609375, 3.85546875, 5.611328125, 7.3671875, 9.123046875, 10.87890625, 12.634765625, 14.390625, 16.146484375, 17.90234375, 19.658203125, 21.4140625, 23.169921875, 24.92578125, 26.681640625, 28.4375, 30.193359375, 31.94921875, 33.705078125, 35.4609375, 37.216796875, 38.97265625, 40.728515625, 42.484375, 44.240234375, 45.99609375, 47.751953125, 49.5078125, 51.263671875, 53.01953125, 54.775390625, 56.53125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 7.0, 9.0, 24.0, 32.0, 42.0, 56.0, 52.0, 61.0, 98.0, 97.0, 77.0, 77.0, 73.0, 65.0, 60.0, 55.0, 36.0, 28.0, 15.0, 17.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.30877685546875, -6.0863037109375, -5.86383056640625, -5.641357421875, -5.41888427734375, -5.1964111328125, -4.97393798828125, -4.75146484375, -4.52899169921875, -4.3065185546875, -4.08404541015625, -3.861572265625, -3.63909912109375, -3.4166259765625, -3.19415283203125, -2.9716796875, -2.74920654296875, -2.5267333984375, -2.30426025390625, -2.081787109375, -1.85931396484375, -1.6368408203125, -1.41436767578125, -1.19189453125, -0.96942138671875, -0.7469482421875, -0.52447509765625, -0.302001953125, -0.07952880859375, 0.1429443359375, 0.36541748046875, 0.587890625, 0.81036376953125, 1.0328369140625, 1.25531005859375, 1.477783203125, 1.70025634765625, 1.9227294921875, 2.14520263671875, 2.36767578125, 2.59014892578125, 2.8126220703125, 3.03509521484375, 3.257568359375, 3.48004150390625, 3.7025146484375, 3.92498779296875, 4.1474609375, 4.36993408203125, 4.5924072265625, 4.81488037109375, 5.037353515625, 5.25982666015625, 5.4822998046875, 5.70477294921875, 5.92724609375, 6.14971923828125, 6.3721923828125, 6.59466552734375, 6.817138671875, 7.03961181640625, 7.2620849609375, 7.48455810546875, 7.70703125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 2.0, 3.0, 6.0, 14.0, 14.0, 19.0, 29.0, 43.0, 45.0, 88.0, 137.0, 228.0, 287.0, 477.0, 801.0, 1371.0, 2475.0, 5649.0, 13253.0, 34679.0, 94487.0, 274778.0, 385228.0, 146603.0, 52258.0, 19579.0, 8040.0, 3534.0, 1744.0, 998.0, 565.0, 332.0, 270.0, 162.0, 114.0, 73.0, 53.0, 39.0, 19.0, 18.0, 16.0, 7.0, 6.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.6875, -21.071533203125, -20.45556640625, -19.839599609375, -19.2236328125, -18.607666015625, -17.99169921875, -17.375732421875, -16.759765625, -16.143798828125, -15.52783203125, -14.911865234375, -14.2958984375, -13.679931640625, -13.06396484375, -12.447998046875, -11.83203125, -11.216064453125, -10.60009765625, -9.984130859375, -9.3681640625, -8.752197265625, -8.13623046875, -7.520263671875, -6.904296875, -6.288330078125, -5.67236328125, -5.056396484375, -4.4404296875, -3.824462890625, -3.20849609375, -2.592529296875, -1.9765625, -1.360595703125, -0.74462890625, -0.128662109375, 0.4873046875, 1.103271484375, 1.71923828125, 2.335205078125, 2.951171875, 3.567138671875, 4.18310546875, 4.799072265625, 5.4150390625, 6.031005859375, 6.64697265625, 7.262939453125, 7.87890625, 8.494873046875, 9.11083984375, 9.726806640625, 10.3427734375, 10.958740234375, 11.57470703125, 12.190673828125, 12.806640625, 13.422607421875, 14.03857421875, 14.654541015625, 15.2705078125, 15.886474609375, 16.50244140625, 17.118408203125, 17.734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 7.0, 9.0, 16.0, 11.0, 14.0, 23.0, 23.0, 24.0, 37.0, 36.0, 33.0, 42.0, 41.0, 39.0, 38.0, 50.0, 43.0, 54.0, 38.0, 38.0, 42.0, 55.0, 31.0, 36.0, 31.0, 37.0, 18.0, 15.0, 17.0, 16.0, 8.0, 11.0, 13.0, 6.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.171875, -14.7061767578125, -14.240478515625, -13.7747802734375, -13.30908203125, -12.8433837890625, -12.377685546875, -11.9119873046875, -11.4462890625, -10.9805908203125, -10.514892578125, -10.0491943359375, -9.58349609375, -9.1177978515625, -8.652099609375, -8.1864013671875, -7.720703125, -7.2550048828125, -6.789306640625, -6.3236083984375, -5.85791015625, -5.3922119140625, -4.926513671875, -4.4608154296875, -3.9951171875, -3.5294189453125, -3.063720703125, -2.5980224609375, -2.13232421875, -1.6666259765625, -1.200927734375, -0.7352294921875, -0.26953125, 0.1961669921875, 0.661865234375, 1.1275634765625, 1.59326171875, 2.0589599609375, 2.524658203125, 2.9903564453125, 3.4560546875, 3.9217529296875, 4.387451171875, 4.8531494140625, 5.31884765625, 5.7845458984375, 6.250244140625, 6.7159423828125, 7.181640625, 7.6473388671875, 8.113037109375, 8.5787353515625, 9.04443359375, 9.5101318359375, 9.975830078125, 10.4415283203125, 10.9072265625, 11.3729248046875, 11.838623046875, 12.3043212890625, 12.77001953125, 13.2357177734375, 13.701416015625, 14.1671142578125, 14.6328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 17.0, 8.0, 31.0, 44.0, 68.0, 114.0, 198.0, 325.0, 575.0, 1126.0, 2251.0, 4822.0, 11031.0, 26163.0, 67438.0, 184246.0, 377725.0, 231651.0, 83989.0, 32084.0, 13184.0, 5686.0, 2723.0, 1351.0, 707.0, 400.0, 231.0, 123.0, 100.0, 52.0, 32.0, 15.0, 12.0, 10.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.3125, -8.049560546875, -7.78662109375, -7.523681640625, -7.2607421875, -6.997802734375, -6.73486328125, -6.471923828125, -6.208984375, -5.946044921875, -5.68310546875, -5.420166015625, -5.1572265625, -4.894287109375, -4.63134765625, -4.368408203125, -4.10546875, -3.842529296875, -3.57958984375, -3.316650390625, -3.0537109375, -2.790771484375, -2.52783203125, -2.264892578125, -2.001953125, -1.739013671875, -1.47607421875, -1.213134765625, -0.9501953125, -0.687255859375, -0.42431640625, -0.161376953125, 0.1015625, 0.364501953125, 0.62744140625, 0.890380859375, 1.1533203125, 1.416259765625, 1.67919921875, 1.942138671875, 2.205078125, 2.468017578125, 2.73095703125, 2.993896484375, 3.2568359375, 3.519775390625, 3.78271484375, 4.045654296875, 4.30859375, 4.571533203125, 4.83447265625, 5.097412109375, 5.3603515625, 5.623291015625, 5.88623046875, 6.149169921875, 6.412109375, 6.675048828125, 6.93798828125, 7.200927734375, 7.4638671875, 7.726806640625, 7.98974609375, 8.252685546875, 8.515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 8.0, 8.0, 6.0, 11.0, 8.0, 11.0, 23.0, 21.0, 30.0, 44.0, 48.0, 74.0, 104.0, 113.0, 108.0, 92.0, 57.0, 26.0, 40.0, 26.0, 26.0, 19.0, 19.0, 3.0, 15.0, 8.0, 10.0, 8.0, 2.0, 2.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001834869384765625, -0.0017755329608917236, -0.0017161965370178223, -0.001656860113143921, -0.0015975236892700195, -0.0015381872653961182, -0.0014788508415222168, -0.0014195144176483154, -0.001360177993774414, -0.0013008415699005127, -0.0012415051460266113, -0.00118216872215271, -0.0011228322982788086, -0.0010634958744049072, -0.0010041594505310059, -0.0009448230266571045, -0.0008854866027832031, -0.0008261501789093018, -0.0007668137550354004, -0.000707477331161499, -0.0006481409072875977, -0.0005888044834136963, -0.0005294680595397949, -0.00047013163566589355, -0.0004107952117919922, -0.0003514587879180908, -0.00029212236404418945, -0.00023278594017028809, -0.00017344951629638672, -0.00011411309242248535, -5.4776668548583984e-05, 4.559755325317383e-06, 6.389617919921875e-05, 0.00012323260307312012, 0.00018256902694702148, 0.00024190545082092285, 0.0003012418746948242, 0.0003605782985687256, 0.00041991472244262695, 0.0004792511463165283, 0.0005385875701904297, 0.0005979239940643311, 0.0006572604179382324, 0.0007165968418121338, 0.0007759332656860352, 0.0008352696895599365, 0.0008946061134338379, 0.0009539425373077393, 0.0010132789611816406, 0.001072615385055542, 0.0011319518089294434, 0.0011912882328033447, 0.001250624656677246, 0.0013099610805511475, 0.0013692975044250488, 0.0014286339282989502, 0.0014879703521728516, 0.001547306776046753, 0.0016066431999206543, 0.0016659796237945557, 0.001725316047668457, 0.0017846524715423584, 0.0018439888954162598, 0.0019033253192901611, 0.0019626617431640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 9.0, 19.0, 28.0, 36.0, 51.0, 88.0, 143.0, 240.0, 425.0, 784.0, 1666.0, 3846.0, 10448.0, 34081.0, 131925.0, 465155.0, 296204.0, 71667.0, 19805.0, 6646.0, 2674.0, 1198.0, 599.0, 328.0, 167.0, 110.0, 63.0, 45.0, 33.0, 21.0, 13.0, 12.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.261962890625, -7.91455078125, -7.567138671875, -7.2197265625, -6.872314453125, -6.52490234375, -6.177490234375, -5.830078125, -5.482666015625, -5.13525390625, -4.787841796875, -4.4404296875, -4.093017578125, -3.74560546875, -3.398193359375, -3.05078125, -2.703369140625, -2.35595703125, -2.008544921875, -1.6611328125, -1.313720703125, -0.96630859375, -0.618896484375, -0.271484375, 0.075927734375, 0.42333984375, 0.770751953125, 1.1181640625, 1.465576171875, 1.81298828125, 2.160400390625, 2.5078125, 2.855224609375, 3.20263671875, 3.550048828125, 3.8974609375, 4.244873046875, 4.59228515625, 4.939697265625, 5.287109375, 5.634521484375, 5.98193359375, 6.329345703125, 6.6767578125, 7.024169921875, 7.37158203125, 7.718994140625, 8.06640625, 8.413818359375, 8.76123046875, 9.108642578125, 9.4560546875, 9.803466796875, 10.15087890625, 10.498291015625, 10.845703125, 11.193115234375, 11.54052734375, 11.887939453125, 12.2353515625, 12.582763671875, 12.93017578125, 13.277587890625, 13.625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 6.0, 4.0, 8.0, 15.0, 13.0, 17.0, 30.0, 46.0, 42.0, 46.0, 94.0, 91.0, 91.0, 97.0, 93.0, 54.0, 66.0, 50.0, 27.0, 22.0, 18.0, 18.0, 17.0, 9.0, 10.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.7120361328125, -6.470947265625, -6.2298583984375, -5.98876953125, -5.7476806640625, -5.506591796875, -5.2655029296875, -5.0244140625, -4.7833251953125, -4.542236328125, -4.3011474609375, -4.06005859375, -3.8189697265625, -3.577880859375, -3.3367919921875, -3.095703125, -2.8546142578125, -2.613525390625, -2.3724365234375, -2.13134765625, -1.8902587890625, -1.649169921875, -1.4080810546875, -1.1669921875, -0.9259033203125, -0.684814453125, -0.4437255859375, -0.20263671875, 0.0384521484375, 0.279541015625, 0.5206298828125, 0.76171875, 1.0028076171875, 1.243896484375, 1.4849853515625, 1.72607421875, 1.9671630859375, 2.208251953125, 2.4493408203125, 2.6904296875, 2.9315185546875, 3.172607421875, 3.4136962890625, 3.65478515625, 3.8958740234375, 4.136962890625, 4.3780517578125, 4.619140625, 4.8602294921875, 5.101318359375, 5.3424072265625, 5.58349609375, 5.8245849609375, 6.065673828125, 6.3067626953125, 6.5478515625, 6.7889404296875, 7.030029296875, 7.2711181640625, 7.51220703125, 7.7532958984375, 7.994384765625, 8.2354736328125, 8.4765625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 7.0, 13.0, 15.0, 22.0, 37.0, 48.0, 59.0, 79.0, 94.0, 82.0, 95.0, 84.0, 85.0, 69.0, 56.0, 51.0, 27.0, 24.0, 21.0, 10.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.95167541503906, -109.37156677246094, -105.79145812988281, -102.21135711669922, -98.6312484741211, -95.05113983154297, -91.47103881835938, -87.89093017578125, -84.31082153320312, -80.730712890625, -77.15060424804688, -73.57050323486328, -69.99039459228516, -66.41028594970703, -62.83018112182617, -59.25007629394531, -55.66996765136719, -52.08985900878906, -48.5097541809082, -44.929649353027344, -41.34954071044922, -37.769432067871094, -34.189327239990234, -30.609220504760742, -27.02911376953125, -23.449007034301758, -19.868900299072266, -16.288793563842773, -12.708686828613281, -9.128580093383789, -5.548473358154297, -1.9683666229248047, 1.6117401123046875, 5.19184684753418, 8.771953582763672, 12.352060317993164, 15.932167053222656, 19.51227378845215, 23.09238052368164, 26.672487258911133, 30.252593994140625, 33.83270263671875, 37.41280746459961, 40.99291229248047, 44.573020935058594, 48.15312957763672, 51.73323440551758, 55.31333923339844, 58.89344787597656, 62.47355651855469, 66.05366516113281, 69.6337661743164, 73.21387481689453, 76.79398345947266, 80.37408447265625, 83.95419311523438, 87.5343017578125, 91.11441040039062, 94.69451904296875, 98.27462005615234, 101.85472869873047, 105.4348373413086, 109.01493835449219, 112.59504699707031, 116.17515563964844]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 3.0, 1.0, 5.0, 4.0, 12.0, 12.0, 9.0, 10.0, 6.0, 17.0, 21.0, 22.0, 29.0, 30.0, 38.0, 32.0, 32.0, 45.0, 50.0, 51.0, 36.0, 53.0, 35.0, 46.0, 49.0, 38.0, 35.0, 34.0, 24.0, 35.0, 26.0, 30.0, 22.0, 18.0, 17.0, 11.0, 12.0, 9.0, 10.0, 8.0, 12.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-80.69986724853516, -78.16695404052734, -75.63404083251953, -73.10112762451172, -70.5682144165039, -68.0353012084961, -65.50238800048828, -62.969478607177734, -60.43656539916992, -57.90365219116211, -55.3707389831543, -52.837825775146484, -50.30491638183594, -47.772003173828125, -45.23908996582031, -42.7061767578125, -40.17326354980469, -37.640350341796875, -35.10743713378906, -32.57452392578125, -30.04161262512207, -27.508699417114258, -24.975788116455078, -22.442874908447266, -19.909961700439453, -17.37704849243164, -14.844136238098145, -12.311223983764648, -9.778310775756836, -7.245397567749023, -4.712485313415527, -2.1795730590820312, 0.35333251953125, 2.8862452507019043, 5.419157981872559, 7.952070713043213, 10.484983444213867, 13.01789665222168, 15.550808906555176, 18.083721160888672, 20.616634368896484, 23.149547576904297, 25.68246078491211, 28.21537208557129, 30.7482852935791, 33.28119659423828, 35.814109802246094, 38.347023010253906, 40.87993621826172, 43.41284942626953, 45.945762634277344, 48.478675842285156, 51.01158905029297, 53.54450225830078, 56.07741165161133, 58.61032485961914, 61.14323806762695, 63.676151275634766, 66.20906066894531, 68.74197387695312, 71.27488708496094, 73.80780029296875, 76.34071350097656, 78.87362670898438, 81.40653991699219]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 14.0, 15.0, 13.0, 24.0, 37.0, 35.0, 66.0, 98.0, 183.0, 263.0, 489.0, 955.0, 2316.0, 7108.0, 35534.0, 625491.0, 3447203.0, 58876.0, 10271.0, 2996.0, 1142.0, 462.0, 266.0, 151.0, 97.0, 58.0, 32.0, 31.0, 12.0, 8.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-79.125, -77.04931640625, -74.9736328125, -72.89794921875, -70.822265625, -68.74658203125, -66.6708984375, -64.59521484375, -62.51953125, -60.44384765625, -58.3681640625, -56.29248046875, -54.216796875, -52.14111328125, -50.0654296875, -47.98974609375, -45.9140625, -43.83837890625, -41.7626953125, -39.68701171875, -37.611328125, -35.53564453125, -33.4599609375, -31.38427734375, -29.30859375, -27.23291015625, -25.1572265625, -23.08154296875, -21.005859375, -18.93017578125, -16.8544921875, -14.77880859375, -12.703125, -10.62744140625, -8.5517578125, -6.47607421875, -4.400390625, -2.32470703125, -0.2490234375, 1.82666015625, 3.90234375, 5.97802734375, 8.0537109375, 10.12939453125, 12.205078125, 14.28076171875, 16.3564453125, 18.43212890625, 20.5078125, 22.58349609375, 24.6591796875, 26.73486328125, 28.810546875, 30.88623046875, 32.9619140625, 35.03759765625, 37.11328125, 39.18896484375, 41.2646484375, 43.34033203125, 45.416015625, 47.49169921875, 49.5673828125, 51.64306640625, 53.71875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 14.0, 22.0, 32.0, 40.0, 54.0, 45.0, 69.0, 89.0, 88.0, 77.0, 85.0, 76.0, 68.0, 62.0, 47.0, 30.0, 22.0, 26.0, 14.0, 12.0, 9.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.2451171875, -6.025390625, -5.8056640625, -5.5859375, -5.3662109375, -5.146484375, -4.9267578125, -4.70703125, -4.4873046875, -4.267578125, -4.0478515625, -3.828125, -3.6083984375, -3.388671875, -3.1689453125, -2.94921875, -2.7294921875, -2.509765625, -2.2900390625, -2.0703125, -1.8505859375, -1.630859375, -1.4111328125, -1.19140625, -0.9716796875, -0.751953125, -0.5322265625, -0.3125, -0.0927734375, 0.126953125, 0.3466796875, 0.56640625, 0.7861328125, 1.005859375, 1.2255859375, 1.4453125, 1.6650390625, 1.884765625, 2.1044921875, 2.32421875, 2.5439453125, 2.763671875, 2.9833984375, 3.203125, 3.4228515625, 3.642578125, 3.8623046875, 4.08203125, 4.3017578125, 4.521484375, 4.7412109375, 4.9609375, 5.1806640625, 5.400390625, 5.6201171875, 5.83984375, 6.0595703125, 6.279296875, 6.4990234375, 6.71875, 6.9384765625, 7.158203125, 7.3779296875, 7.59765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 5.0, 11.0, 15.0, 21.0, 18.0, 29.0, 33.0, 42.0, 57.0, 67.0, 103.0, 125.0, 212.0, 377.0, 815.0, 1847.0, 5395.0, 20291.0, 107753.0, 2051027.0, 1871753.0, 105220.0, 19908.0, 5440.0, 1837.0, 801.0, 327.0, 219.0, 135.0, 108.0, 75.0, 46.0, 37.0, 30.0, 31.0, 22.0, 16.0, 11.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-43.5, -42.29150390625, -41.0830078125, -39.87451171875, -38.666015625, -37.45751953125, -36.2490234375, -35.04052734375, -33.83203125, -32.62353515625, -31.4150390625, -30.20654296875, -28.998046875, -27.78955078125, -26.5810546875, -25.37255859375, -24.1640625, -22.95556640625, -21.7470703125, -20.53857421875, -19.330078125, -18.12158203125, -16.9130859375, -15.70458984375, -14.49609375, -13.28759765625, -12.0791015625, -10.87060546875, -9.662109375, -8.45361328125, -7.2451171875, -6.03662109375, -4.828125, -3.61962890625, -2.4111328125, -1.20263671875, 0.005859375, 1.21435546875, 2.4228515625, 3.63134765625, 4.83984375, 6.04833984375, 7.2568359375, 8.46533203125, 9.673828125, 10.88232421875, 12.0908203125, 13.29931640625, 14.5078125, 15.71630859375, 16.9248046875, 18.13330078125, 19.341796875, 20.55029296875, 21.7587890625, 22.96728515625, 24.17578125, 25.38427734375, 26.5927734375, 27.80126953125, 29.009765625, 30.21826171875, 31.4267578125, 32.63525390625, 33.84375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 4.0, 3.0, 5.0, 9.0, 13.0, 19.0, 20.0, 32.0, 52.0, 66.0, 108.0, 169.0, 275.0, 644.0, 1451.0, 506.0, 235.0, 146.0, 93.0, 75.0, 47.0, 32.0, 17.0, 15.0, 15.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.703125, -14.3099365234375, -13.916748046875, -13.5235595703125, -13.13037109375, -12.7371826171875, -12.343994140625, -11.9508056640625, -11.5576171875, -11.1644287109375, -10.771240234375, -10.3780517578125, -9.98486328125, -9.5916748046875, -9.198486328125, -8.8052978515625, -8.412109375, -8.0189208984375, -7.625732421875, -7.2325439453125, -6.83935546875, -6.4461669921875, -6.052978515625, -5.6597900390625, -5.2666015625, -4.8734130859375, -4.480224609375, -4.0870361328125, -3.69384765625, -3.3006591796875, -2.907470703125, -2.5142822265625, -2.12109375, -1.7279052734375, -1.334716796875, -0.9415283203125, -0.54833984375, -0.1551513671875, 0.238037109375, 0.6312255859375, 1.0244140625, 1.4176025390625, 1.810791015625, 2.2039794921875, 2.59716796875, 2.9903564453125, 3.383544921875, 3.7767333984375, 4.169921875, 4.5631103515625, 4.956298828125, 5.3494873046875, 5.74267578125, 6.1358642578125, 6.529052734375, 6.9222412109375, 7.3154296875, 7.7086181640625, 8.101806640625, 8.4949951171875, 8.88818359375, 9.2813720703125, 9.674560546875, 10.0677490234375, 10.4609375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 9.0, 18.0, 23.0, 55.0, 63.0, 103.0, 127.0, 141.0, 144.0, 94.0, 81.0, 54.0, 36.0, 21.0, 16.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.6307144165039, -72.41205596923828, -69.19338989257812, -65.9747314453125, -62.756072998046875, -59.53741455078125, -56.31875228881836, -53.10009002685547, -49.881431579589844, -46.66277313232422, -43.44411087036133, -40.22544860839844, -37.00679016113281, -33.78813171386719, -30.569469451904297, -27.35080909729004, -24.13214874267578, -20.913488388061523, -17.694828033447266, -14.476167678833008, -11.25750732421875, -8.038846969604492, -4.820186614990234, -1.6015262603759766, 1.6171340942382812, 4.835794448852539, 8.054454803466797, 11.273115158081055, 14.491775512695312, 17.71043586730957, 20.929096221923828, 24.147756576538086, 27.366409301757812, 30.58506965637207, 33.80373001098633, 37.02239227294922, 40.241050720214844, 43.45970916748047, 46.67837142944336, 49.89703369140625, 53.115692138671875, 56.3343505859375, 59.55301284790039, 62.77167510986328, 65.9903335571289, 69.20899200439453, 72.42765808105469, 75.64631652832031, 78.86497497558594, 82.08363342285156, 85.30229187011719, 88.52095794677734, 91.73961639404297, 94.9582748413086, 98.17694091796875, 101.39559936523438, 104.6142578125, 107.83291625976562, 111.05157470703125, 114.2702407836914, 117.48889923095703, 120.70755767822266, 123.92622375488281, 127.14488220214844, 130.36354064941406]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 7.0, 15.0, 12.0, 15.0, 16.0, 24.0, 21.0, 21.0, 29.0, 34.0, 49.0, 41.0, 29.0, 44.0, 49.0, 47.0, 47.0, 59.0, 46.0, 36.0, 48.0, 45.0, 42.0, 25.0, 31.0, 32.0, 23.0, 18.0, 18.0, 11.0, 12.0, 6.0, 7.0, 11.0, 4.0, 5.0, 4.0, 0.0, 4.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.44134521484375, -35.189483642578125, -33.9376220703125, -32.685760498046875, -31.433900833129883, -30.182039260864258, -28.930179595947266, -27.67831802368164, -26.426456451416016, -25.17459487915039, -23.922733306884766, -22.670873641967773, -21.41901206970215, -20.167150497436523, -18.91529083251953, -17.663429260253906, -16.41156768798828, -15.159706115722656, -13.907845497131348, -12.655984878540039, -11.404123306274414, -10.152261734008789, -8.90040111541748, -7.648540496826172, -6.396678924560547, -5.14481782913208, -3.8929567337036133, -2.6410956382751465, -1.3892345428466797, -0.1373734474182129, 1.114487648010254, 2.3663482666015625, 3.618213653564453, 4.87007474899292, 6.121935844421387, 7.3737969398498535, 8.62565803527832, 9.877519607543945, 11.129380226135254, 12.381240844726562, 13.633102416992188, 14.884963989257812, 16.136825561523438, 17.38868522644043, 18.640546798706055, 19.89240837097168, 21.144268035888672, 22.396129608154297, 23.647991180419922, 24.899852752685547, 26.151714324951172, 27.403573989868164, 28.65543556213379, 29.907297134399414, 31.159156799316406, 32.41101837158203, 33.662879943847656, 34.91474151611328, 36.166603088378906, 37.41846466064453, 38.670326232910156, 39.922183990478516, 41.17404556274414, 42.425907135009766, 43.67776870727539]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 3.0, 4.0, 9.0, 9.0, 16.0, 26.0, 28.0, 37.0, 59.0, 80.0, 118.0, 182.0, 288.0, 538.0, 996.0, 2247.0, 5494.0, 17155.0, 70767.0, 503696.0, 367332.0, 56012.0, 14366.0, 4823.0, 1978.0, 952.0, 507.0, 286.0, 176.0, 119.0, 76.0, 39.0, 41.0, 27.0, 16.0, 13.0, 8.0, 3.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-50.15625, -48.72021484375, -47.2841796875, -45.84814453125, -44.412109375, -42.97607421875, -41.5400390625, -40.10400390625, -38.66796875, -37.23193359375, -35.7958984375, -34.35986328125, -32.923828125, -31.48779296875, -30.0517578125, -28.61572265625, -27.1796875, -25.74365234375, -24.3076171875, -22.87158203125, -21.435546875, -19.99951171875, -18.5634765625, -17.12744140625, -15.69140625, -14.25537109375, -12.8193359375, -11.38330078125, -9.947265625, -8.51123046875, -7.0751953125, -5.63916015625, -4.203125, -2.76708984375, -1.3310546875, 0.10498046875, 1.541015625, 2.97705078125, 4.4130859375, 5.84912109375, 7.28515625, 8.72119140625, 10.1572265625, 11.59326171875, 13.029296875, 14.46533203125, 15.9013671875, 17.33740234375, 18.7734375, 20.20947265625, 21.6455078125, 23.08154296875, 24.517578125, 25.95361328125, 27.3896484375, 28.82568359375, 30.26171875, 31.69775390625, 33.1337890625, 34.56982421875, 36.005859375, 37.44189453125, 38.8779296875, 40.31396484375, 41.75]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 10.0, 8.0, 17.0, 29.0, 27.0, 31.0, 57.0, 50.0, 77.0, 91.0, 76.0, 93.0, 72.0, 68.0, 68.0, 57.0, 42.0, 40.0, 31.0, 17.0, 10.0, 19.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3153076171875, -6.091552734375, -5.8677978515625, -5.64404296875, -5.4202880859375, -5.196533203125, -4.9727783203125, -4.7490234375, -4.5252685546875, -4.301513671875, -4.0777587890625, -3.85400390625, -3.6302490234375, -3.406494140625, -3.1827392578125, -2.958984375, -2.7352294921875, -2.511474609375, -2.2877197265625, -2.06396484375, -1.8402099609375, -1.616455078125, -1.3927001953125, -1.1689453125, -0.9451904296875, -0.721435546875, -0.4976806640625, -0.27392578125, -0.0501708984375, 0.173583984375, 0.3973388671875, 0.62109375, 0.8448486328125, 1.068603515625, 1.2923583984375, 1.51611328125, 1.7398681640625, 1.963623046875, 2.1873779296875, 2.4111328125, 2.6348876953125, 2.858642578125, 3.0823974609375, 3.30615234375, 3.5299072265625, 3.753662109375, 3.9774169921875, 4.201171875, 4.4249267578125, 4.648681640625, 4.8724365234375, 5.09619140625, 5.3199462890625, 5.543701171875, 5.7674560546875, 5.9912109375, 6.2149658203125, 6.438720703125, 6.6624755859375, 6.88623046875, 7.1099853515625, 7.333740234375, 7.5574951171875, 7.78125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 8.0, 8.0, 8.0, 17.0, 5.0, 20.0, 24.0, 35.0, 49.0, 75.0, 101.0, 140.0, 190.0, 256.0, 464.0, 769.0, 1342.0, 2880.0, 6741.0, 17057.0, 48185.0, 152633.0, 491289.0, 222039.0, 65555.0, 22603.0, 8378.0, 3460.0, 1698.0, 878.0, 504.0, 372.0, 216.0, 146.0, 113.0, 87.0, 54.0, 40.0, 40.0, 30.0, 10.0, 13.0, 9.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.515625, -20.8564453125, -20.197265625, -19.5380859375, -18.87890625, -18.2197265625, -17.560546875, -16.9013671875, -16.2421875, -15.5830078125, -14.923828125, -14.2646484375, -13.60546875, -12.9462890625, -12.287109375, -11.6279296875, -10.96875, -10.3095703125, -9.650390625, -8.9912109375, -8.33203125, -7.6728515625, -7.013671875, -6.3544921875, -5.6953125, -5.0361328125, -4.376953125, -3.7177734375, -3.05859375, -2.3994140625, -1.740234375, -1.0810546875, -0.421875, 0.2373046875, 0.896484375, 1.5556640625, 2.21484375, 2.8740234375, 3.533203125, 4.1923828125, 4.8515625, 5.5107421875, 6.169921875, 6.8291015625, 7.48828125, 8.1474609375, 8.806640625, 9.4658203125, 10.125, 10.7841796875, 11.443359375, 12.1025390625, 12.76171875, 13.4208984375, 14.080078125, 14.7392578125, 15.3984375, 16.0576171875, 16.716796875, 17.3759765625, 18.03515625, 18.6943359375, 19.353515625, 20.0126953125, 20.671875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 6.0, 8.0, 8.0, 8.0, 11.0, 13.0, 20.0, 22.0, 21.0, 16.0, 28.0, 34.0, 39.0, 32.0, 53.0, 49.0, 40.0, 40.0, 45.0, 36.0, 54.0, 50.0, 34.0, 36.0, 50.0, 36.0, 28.0, 15.0, 28.0, 25.0, 18.0, 20.0, 18.0, 11.0, 12.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-16.6875, -16.1927490234375, -15.697998046875, -15.2032470703125, -14.70849609375, -14.2137451171875, -13.718994140625, -13.2242431640625, -12.7294921875, -12.2347412109375, -11.739990234375, -11.2452392578125, -10.75048828125, -10.2557373046875, -9.760986328125, -9.2662353515625, -8.771484375, -8.2767333984375, -7.781982421875, -7.2872314453125, -6.79248046875, -6.2977294921875, -5.802978515625, -5.3082275390625, -4.8134765625, -4.3187255859375, -3.823974609375, -3.3292236328125, -2.83447265625, -2.3397216796875, -1.844970703125, -1.3502197265625, -0.85546875, -0.3607177734375, 0.134033203125, 0.6287841796875, 1.12353515625, 1.6182861328125, 2.113037109375, 2.6077880859375, 3.1025390625, 3.5972900390625, 4.092041015625, 4.5867919921875, 5.08154296875, 5.5762939453125, 6.071044921875, 6.5657958984375, 7.060546875, 7.5552978515625, 8.050048828125, 8.5447998046875, 9.03955078125, 9.5343017578125, 10.029052734375, 10.5238037109375, 11.0185546875, 11.5133056640625, 12.008056640625, 12.5028076171875, 12.99755859375, 13.4923095703125, 13.987060546875, 14.4818115234375, 14.9765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 4.0, 13.0, 22.0, 40.0, 52.0, 128.0, 243.0, 880.0, 4858.0, 137969.0, 888389.0, 13596.0, 1610.0, 411.0, 148.0, 77.0, 54.0, 18.0, 18.0, 9.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.0, -38.67578125, -37.3515625, -36.02734375, -34.703125, -33.37890625, -32.0546875, -30.73046875, -29.40625, -28.08203125, -26.7578125, -25.43359375, -24.109375, -22.78515625, -21.4609375, -20.13671875, -18.8125, -17.48828125, -16.1640625, -14.83984375, -13.515625, -12.19140625, -10.8671875, -9.54296875, -8.21875, -6.89453125, -5.5703125, -4.24609375, -2.921875, -1.59765625, -0.2734375, 1.05078125, 2.375, 3.69921875, 5.0234375, 6.34765625, 7.671875, 8.99609375, 10.3203125, 11.64453125, 12.96875, 14.29296875, 15.6171875, 16.94140625, 18.265625, 19.58984375, 20.9140625, 22.23828125, 23.5625, 24.88671875, 26.2109375, 27.53515625, 28.859375, 30.18359375, 31.5078125, 32.83203125, 34.15625, 35.48046875, 36.8046875, 38.12890625, 39.453125, 40.77734375, 42.1015625, 43.42578125, 44.75]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 9.0, 2.0, 9.0, 15.0, 14.0, 23.0, 26.0, 42.0, 57.0, 188.0, 291.0, 154.0, 41.0, 40.0, 23.0, 17.0, 12.0, 10.0, 8.0, 2.0, 2.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026874542236328125, -0.002589315176010132, -0.002491176128387451, -0.0023930370807647705, -0.00229489803314209, -0.002196758985519409, -0.0020986199378967285, -0.002000480890274048, -0.0019023418426513672, -0.0018042027950286865, -0.0017060637474060059, -0.0016079246997833252, -0.0015097856521606445, -0.0014116466045379639, -0.0013135075569152832, -0.0012153685092926025, -0.0011172294616699219, -0.0010190904140472412, -0.0009209513664245605, -0.0008228123188018799, -0.0007246732711791992, -0.0006265342235565186, -0.0005283951759338379, -0.0004302561283111572, -0.00033211708068847656, -0.0002339780330657959, -0.00013583898544311523, -3.769993782043457e-05, 6.0439109802246094e-05, 0.00015857815742492676, 0.0002567172050476074, 0.0003548562526702881, 0.00045299530029296875, 0.0005511343479156494, 0.0006492733955383301, 0.0007474124431610107, 0.0008455514907836914, 0.0009436905384063721, 0.0010418295860290527, 0.0011399686336517334, 0.001238107681274414, 0.0013362467288970947, 0.0014343857765197754, 0.001532524824142456, 0.0016306638717651367, 0.0017288029193878174, 0.001826941967010498, 0.0019250810146331787, 0.0020232200622558594, 0.00212135910987854, 0.0022194981575012207, 0.0023176372051239014, 0.002415776252746582, 0.0025139153003692627, 0.0026120543479919434, 0.002710193395614624, 0.0028083324432373047, 0.0029064714908599854, 0.003004610538482666, 0.0031027495861053467, 0.0032008886337280273, 0.003299027681350708, 0.0033971667289733887, 0.0034953057765960693, 0.00359344482421875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 7.0, 7.0, 10.0, 12.0, 17.0, 22.0, 23.0, 33.0, 35.0, 59.0, 98.0, 124.0, 195.0, 339.0, 497.0, 791.0, 1407.0, 2589.0, 5371.0, 13662.0, 50592.0, 428704.0, 463779.0, 54019.0, 14073.0, 5622.0, 2700.0, 1408.0, 839.0, 500.0, 329.0, 212.0, 124.0, 85.0, 65.0, 46.0, 28.0, 24.0, 18.0, 12.0, 19.0, 9.0, 9.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.3671875, -11.968505859375, -11.56982421875, -11.171142578125, -10.7724609375, -10.373779296875, -9.97509765625, -9.576416015625, -9.177734375, -8.779052734375, -8.38037109375, -7.981689453125, -7.5830078125, -7.184326171875, -6.78564453125, -6.386962890625, -5.98828125, -5.589599609375, -5.19091796875, -4.792236328125, -4.3935546875, -3.994873046875, -3.59619140625, -3.197509765625, -2.798828125, -2.400146484375, -2.00146484375, -1.602783203125, -1.2041015625, -0.805419921875, -0.40673828125, -0.008056640625, 0.390625, 0.789306640625, 1.18798828125, 1.586669921875, 1.9853515625, 2.384033203125, 2.78271484375, 3.181396484375, 3.580078125, 3.978759765625, 4.37744140625, 4.776123046875, 5.1748046875, 5.573486328125, 5.97216796875, 6.370849609375, 6.76953125, 7.168212890625, 7.56689453125, 7.965576171875, 8.3642578125, 8.762939453125, 9.16162109375, 9.560302734375, 9.958984375, 10.357666015625, 10.75634765625, 11.155029296875, 11.5537109375, 11.952392578125, 12.35107421875, 12.749755859375, 13.1484375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 3.0, 5.0, 7.0, 10.0, 12.0, 13.0, 28.0, 47.0, 89.0, 144.0, 182.0, 155.0, 113.0, 59.0, 38.0, 24.0, 18.0, 10.0, 5.0, 10.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.40625, -12.0269775390625, -11.647705078125, -11.2684326171875, -10.88916015625, -10.5098876953125, -10.130615234375, -9.7513427734375, -9.3720703125, -8.9927978515625, -8.613525390625, -8.2342529296875, -7.85498046875, -7.4757080078125, -7.096435546875, -6.7171630859375, -6.337890625, -5.9586181640625, -5.579345703125, -5.2000732421875, -4.82080078125, -4.4415283203125, -4.062255859375, -3.6829833984375, -3.3037109375, -2.9244384765625, -2.545166015625, -2.1658935546875, -1.78662109375, -1.4073486328125, -1.028076171875, -0.6488037109375, -0.26953125, 0.1097412109375, 0.489013671875, 0.8682861328125, 1.24755859375, 1.6268310546875, 2.006103515625, 2.3853759765625, 2.7646484375, 3.1439208984375, 3.523193359375, 3.9024658203125, 4.28173828125, 4.6610107421875, 5.040283203125, 5.4195556640625, 5.798828125, 6.1781005859375, 6.557373046875, 6.9366455078125, 7.31591796875, 7.6951904296875, 8.074462890625, 8.4537353515625, 8.8330078125, 9.2122802734375, 9.591552734375, 9.9708251953125, 10.35009765625, 10.7293701171875, 11.108642578125, 11.4879150390625, 11.8671875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 8.0, 24.0, 32.0, 72.0, 93.0, 167.0, 178.0, 173.0, 118.0, 71.0, 40.0, 17.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-150.31546020507812, -142.99058532714844, -135.66571044921875, -128.3408203125, -121.01595306396484, -113.69107055664062, -106.36619567871094, -99.04132080078125, -91.71644592285156, -84.39157104492188, -77.06668853759766, -69.74181365966797, -62.41693878173828, -55.09206008911133, -47.767181396484375, -40.44230651855469, -33.11742401123047, -25.79254722595215, -18.467670440673828, -11.142791748046875, -3.8179149627685547, 3.5069618225097656, 10.831840515136719, 18.156715393066406, 25.48159408569336, 32.80647277832031, 40.13134765625, 47.45622634887695, 54.781105041503906, 62.105979919433594, 69.43086242675781, 76.7557373046875, 84.08061218261719, 91.40548706054688, 98.7303695678711, 106.05524444580078, 113.38011932373047, 120.70500183105469, 128.02987670898438, 135.35475158691406, 142.67962646484375, 150.00450134277344, 157.32937622070312, 164.65426635742188, 171.97914123535156, 179.30401611328125, 186.62889099121094, 193.95376586914062, 201.27865600585938, 208.60353088378906, 215.92840576171875, 223.2532958984375, 230.5781707763672, 237.90304565429688, 245.22792053222656, 252.55279541015625, 259.8776550292969, 267.2025451660156, 274.52740478515625, 281.852294921875, 289.1771545410156, 296.5020446777344, 303.826904296875, 311.15179443359375, 318.4766845703125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 7.0, 8.0, 10.0, 13.0, 18.0, 19.0, 10.0, 16.0, 23.0, 20.0, 32.0, 36.0, 40.0, 33.0, 35.0, 40.0, 39.0, 38.0, 41.0, 37.0, 35.0, 43.0, 38.0, 40.0, 37.0, 34.0, 29.0, 26.0, 27.0, 23.0, 17.0, 13.0, 24.0, 17.0, 15.0, 17.0, 11.0, 8.0, 3.0, 2.0, 8.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-80.02961730957031, -77.57621765136719, -75.12281036376953, -72.6694107055664, -70.21600341796875, -67.76260375976562, -65.3092041015625, -62.85580062866211, -60.40239715576172, -57.94899368286133, -55.49559020996094, -53.04219055175781, -50.58878707885742, -48.13538360595703, -45.681983947753906, -43.228580474853516, -40.775177001953125, -38.321773529052734, -35.868370056152344, -33.41497039794922, -30.961566925048828, -28.508163452148438, -26.05476188659668, -23.601360321044922, -21.14795684814453, -18.69455337524414, -16.241151809692383, -13.787749290466309, -11.334346771240234, -8.88094425201416, -6.427541732788086, -3.974140167236328, -1.5207366943359375, 0.9326658248901367, 3.386068344116211, 5.839470863342285, 8.29287338256836, 10.746275901794434, 13.199678421020508, 15.653079986572266, 18.106483459472656, 20.559886932373047, 23.013288497924805, 25.466690063476562, 27.920093536376953, 30.373497009277344, 32.82689666748047, 35.28030014038086, 37.73370361328125, 40.18710708618164, 42.64051055908203, 45.093910217285156, 47.54731369018555, 50.00071716308594, 52.45411682128906, 54.90752029418945, 57.360923767089844, 59.814327239990234, 62.267730712890625, 64.72113037109375, 67.17453002929688, 69.62793731689453, 72.08133697509766, 74.53474426269531, 76.98814392089844]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 1.0, 5.0, 6.0, 6.0, 11.0, 10.0, 12.0, 9.0, 11.0, 19.0, 26.0, 27.0, 33.0, 54.0, 72.0, 107.0, 177.0, 254.0, 354.0, 568.0, 1042.0, 2054.0, 4198.0, 10439.0, 33865.0, 211604.0, 3700480.0, 179090.0, 31305.0, 9918.0, 4037.0, 1904.0, 1009.0, 552.0, 335.0, 180.0, 144.0, 95.0, 60.0, 50.0, 36.0, 22.0, 16.0, 16.0, 16.0, 13.0, 12.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-53.5, -51.94775390625, -50.3955078125, -48.84326171875, -47.291015625, -45.73876953125, -44.1865234375, -42.63427734375, -41.08203125, -39.52978515625, -37.9775390625, -36.42529296875, -34.873046875, -33.32080078125, -31.7685546875, -30.21630859375, -28.6640625, -27.11181640625, -25.5595703125, -24.00732421875, -22.455078125, -20.90283203125, -19.3505859375, -17.79833984375, -16.24609375, -14.69384765625, -13.1416015625, -11.58935546875, -10.037109375, -8.48486328125, -6.9326171875, -5.38037109375, -3.828125, -2.27587890625, -0.7236328125, 0.82861328125, 2.380859375, 3.93310546875, 5.4853515625, 7.03759765625, 8.58984375, 10.14208984375, 11.6943359375, 13.24658203125, 14.798828125, 16.35107421875, 17.9033203125, 19.45556640625, 21.0078125, 22.56005859375, 24.1123046875, 25.66455078125, 27.216796875, 28.76904296875, 30.3212890625, 31.87353515625, 33.42578125, 34.97802734375, 36.5302734375, 38.08251953125, 39.634765625, 41.18701171875, 42.7392578125, 44.29150390625, 45.84375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 10.0, 14.0, 15.0, 20.0, 28.0, 31.0, 48.0, 58.0, 58.0, 72.0, 84.0, 80.0, 77.0, 66.0, 70.0, 59.0, 60.0, 39.0, 32.0, 16.0, 21.0, 18.0, 14.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3671875, -6.1451416015625, -5.923095703125, -5.7010498046875, -5.47900390625, -5.2569580078125, -5.034912109375, -4.8128662109375, -4.5908203125, -4.3687744140625, -4.146728515625, -3.9246826171875, -3.70263671875, -3.4805908203125, -3.258544921875, -3.0364990234375, -2.814453125, -2.5924072265625, -2.370361328125, -2.1483154296875, -1.92626953125, -1.7042236328125, -1.482177734375, -1.2601318359375, -1.0380859375, -0.8160400390625, -0.593994140625, -0.3719482421875, -0.14990234375, 0.0721435546875, 0.294189453125, 0.5162353515625, 0.73828125, 0.9603271484375, 1.182373046875, 1.4044189453125, 1.62646484375, 1.8485107421875, 2.070556640625, 2.2926025390625, 2.5146484375, 2.7366943359375, 2.958740234375, 3.1807861328125, 3.40283203125, 3.6248779296875, 3.846923828125, 4.0689697265625, 4.291015625, 4.5130615234375, 4.735107421875, 4.9571533203125, 5.17919921875, 5.4012451171875, 5.623291015625, 5.8453369140625, 6.0673828125, 6.2894287109375, 6.511474609375, 6.7335205078125, 6.95556640625, 7.1776123046875, 7.399658203125, 7.6217041015625, 7.84375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 12.0, 16.0, 21.0, 19.0, 38.0, 41.0, 75.0, 92.0, 133.0, 198.0, 348.0, 481.0, 812.0, 1296.0, 2405.0, 4291.0, 8080.0, 17318.0, 41866.0, 128503.0, 806137.0, 2844663.0, 228447.0, 62663.0, 23623.0, 10494.0, 5194.0, 2808.0, 1589.0, 993.0, 564.0, 359.0, 242.0, 130.0, 96.0, 63.0, 56.0, 29.0, 23.0, 11.0, 16.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.953125, -24.201416015625, -23.44970703125, -22.697998046875, -21.9462890625, -21.194580078125, -20.44287109375, -19.691162109375, -18.939453125, -18.187744140625, -17.43603515625, -16.684326171875, -15.9326171875, -15.180908203125, -14.42919921875, -13.677490234375, -12.92578125, -12.174072265625, -11.42236328125, -10.670654296875, -9.9189453125, -9.167236328125, -8.41552734375, -7.663818359375, -6.912109375, -6.160400390625, -5.40869140625, -4.656982421875, -3.9052734375, -3.153564453125, -2.40185546875, -1.650146484375, -0.8984375, -0.146728515625, 0.60498046875, 1.356689453125, 2.1083984375, 2.860107421875, 3.61181640625, 4.363525390625, 5.115234375, 5.866943359375, 6.61865234375, 7.370361328125, 8.1220703125, 8.873779296875, 9.62548828125, 10.377197265625, 11.12890625, 11.880615234375, 12.63232421875, 13.384033203125, 14.1357421875, 14.887451171875, 15.63916015625, 16.390869140625, 17.142578125, 17.894287109375, 18.64599609375, 19.397705078125, 20.1494140625, 20.901123046875, 21.65283203125, 22.404541015625, 23.15625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 10.0, 12.0, 8.0, 16.0, 14.0, 23.0, 31.0, 35.0, 61.0, 107.0, 192.0, 398.0, 1239.0, 1046.0, 341.0, 198.0, 101.0, 78.0, 45.0, 30.0, 22.0, 16.0, 12.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.59375, -13.2259521484375, -12.858154296875, -12.4903564453125, -12.12255859375, -11.7547607421875, -11.386962890625, -11.0191650390625, -10.6513671875, -10.2835693359375, -9.915771484375, -9.5479736328125, -9.18017578125, -8.8123779296875, -8.444580078125, -8.0767822265625, -7.708984375, -7.3411865234375, -6.973388671875, -6.6055908203125, -6.23779296875, -5.8699951171875, -5.502197265625, -5.1343994140625, -4.7666015625, -4.3988037109375, -4.031005859375, -3.6632080078125, -3.29541015625, -2.9276123046875, -2.559814453125, -2.1920166015625, -1.82421875, -1.4564208984375, -1.088623046875, -0.7208251953125, -0.35302734375, 0.0147705078125, 0.382568359375, 0.7503662109375, 1.1181640625, 1.4859619140625, 1.853759765625, 2.2215576171875, 2.58935546875, 2.9571533203125, 3.324951171875, 3.6927490234375, 4.060546875, 4.4283447265625, 4.796142578125, 5.1639404296875, 5.53173828125, 5.8995361328125, 6.267333984375, 6.6351318359375, 7.0029296875, 7.3707275390625, 7.738525390625, 8.1063232421875, 8.47412109375, 8.8419189453125, 9.209716796875, 9.5775146484375, 9.9453125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 9.0, 15.0, 16.0, 31.0, 51.0, 63.0, 97.0, 117.0, 120.0, 135.0, 93.0, 83.0, 59.0, 44.0, 19.0, 29.0, 7.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.90001678466797, -79.15853118896484, -76.41704559326172, -73.67555236816406, -70.93406677246094, -68.19258117675781, -65.45109558105469, -62.70960998535156, -59.96812057495117, -57.22663497924805, -54.485145568847656, -51.74365997314453, -49.002174377441406, -46.260684967041016, -43.51919937133789, -40.7777099609375, -38.036224365234375, -35.29473876953125, -32.55324935913086, -29.811763763427734, -27.070276260375977, -24.32878875732422, -21.587303161621094, -18.845815658569336, -16.104328155517578, -13.36284065246582, -10.621354103088379, -7.8798675537109375, -5.13838005065918, -2.396892547607422, 0.3445930480957031, 3.086080551147461, 5.827568054199219, 8.569055557250977, 11.310542106628418, 14.05202865600586, 16.793516159057617, 19.535003662109375, 22.2764892578125, 25.017976760864258, 27.759464263916016, 30.500951766967773, 33.24243927001953, 35.983924865722656, 38.72541046142578, 41.46689987182617, 44.2083854675293, 46.94987487792969, 49.69136047363281, 52.43284606933594, 55.17433547973633, 57.91582107543945, 60.657310485839844, 63.39879608154297, 66.1402816772461, 68.88176727294922, 71.62326049804688, 74.36474609375, 77.10623168945312, 79.84771728515625, 82.5892105102539, 85.33069610595703, 88.07218170166016, 90.81366729736328, 93.5551528930664]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 7.0, 8.0, 23.0, 21.0, 25.0, 17.0, 30.0, 34.0, 33.0, 33.0, 43.0, 53.0, 57.0, 51.0, 62.0, 43.0, 54.0, 46.0, 43.0, 46.0, 41.0, 34.0, 34.0, 20.0, 21.0, 22.0, 16.0, 14.0, 15.0, 9.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.453407287597656, -39.134368896484375, -37.81532669067383, -36.49628829956055, -35.177249908447266, -33.85820770263672, -32.53916931152344, -31.220130920410156, -29.901090621948242, -28.582050323486328, -27.263011932373047, -25.943971633911133, -24.62493133544922, -23.305892944335938, -21.986852645874023, -20.66781234741211, -19.348773956298828, -18.029733657836914, -16.710695266723633, -15.391654968261719, -14.072615623474121, -12.753576278686523, -11.43453598022461, -10.115496635437012, -8.796457290649414, -7.477417945861816, -6.1583781242370605, -4.839338302612305, -3.520298957824707, -2.2012596130371094, -0.8822197914123535, 0.43682003021240234, 1.755859375, 3.0748989582061768, 4.3939385414123535, 5.712978363037109, 7.032017707824707, 8.351057052612305, 9.670097351074219, 10.989136695861816, 12.308176040649414, 13.627215385437012, 14.94625473022461, 16.265295028686523, 17.584335327148438, 18.90337371826172, 20.222414016723633, 21.541454315185547, 22.860492706298828, 24.179533004760742, 25.498571395874023, 26.817611694335938, 28.13665008544922, 29.455690383911133, 30.774730682373047, 32.09376907348633, 33.412811279296875, 34.731849670410156, 36.0508918762207, 37.369930267333984, 38.688968658447266, 40.00801086425781, 41.327049255371094, 42.646087646484375, 43.965126037597656]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 4.0, 7.0, 5.0, 11.0, 21.0, 21.0, 35.0, 53.0, 83.0, 129.0, 243.0, 439.0, 854.0, 2059.0, 7410.0, 36752.0, 299200.0, 622431.0, 62044.0, 11588.0, 2895.0, 1060.0, 461.0, 313.0, 174.0, 88.0, 55.0, 39.0, 25.0, 17.0, 11.0, 11.0, 7.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.71875, -53.0166015625, -51.314453125, -49.6123046875, -47.91015625, -46.2080078125, -44.505859375, -42.8037109375, -41.1015625, -39.3994140625, -37.697265625, -35.9951171875, -34.29296875, -32.5908203125, -30.888671875, -29.1865234375, -27.484375, -25.7822265625, -24.080078125, -22.3779296875, -20.67578125, -18.9736328125, -17.271484375, -15.5693359375, -13.8671875, -12.1650390625, -10.462890625, -8.7607421875, -7.05859375, -5.3564453125, -3.654296875, -1.9521484375, -0.25, 1.4521484375, 3.154296875, 4.8564453125, 6.55859375, 8.2607421875, 9.962890625, 11.6650390625, 13.3671875, 15.0693359375, 16.771484375, 18.4736328125, 20.17578125, 21.8779296875, 23.580078125, 25.2822265625, 26.984375, 28.6865234375, 30.388671875, 32.0908203125, 33.79296875, 35.4951171875, 37.197265625, 38.8994140625, 40.6015625, 42.3037109375, 44.005859375, 45.7080078125, 47.41015625, 49.1123046875, 50.814453125, 52.5166015625, 54.21875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 13.0, 9.0, 32.0, 32.0, 45.0, 31.0, 53.0, 54.0, 66.0, 68.0, 75.0, 68.0, 61.0, 57.0, 67.0, 52.0, 58.0, 30.0, 38.0, 23.0, 13.0, 17.0, 16.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.453125, -6.23175048828125, -6.0103759765625, -5.78900146484375, -5.567626953125, -5.34625244140625, -5.1248779296875, -4.90350341796875, -4.68212890625, -4.46075439453125, -4.2393798828125, -4.01800537109375, -3.796630859375, -3.57525634765625, -3.3538818359375, -3.13250732421875, -2.9111328125, -2.68975830078125, -2.4683837890625, -2.24700927734375, -2.025634765625, -1.80426025390625, -1.5828857421875, -1.36151123046875, -1.14013671875, -0.91876220703125, -0.6973876953125, -0.47601318359375, -0.254638671875, -0.03326416015625, 0.1881103515625, 0.40948486328125, 0.630859375, 0.85223388671875, 1.0736083984375, 1.29498291015625, 1.516357421875, 1.73773193359375, 1.9591064453125, 2.18048095703125, 2.40185546875, 2.62322998046875, 2.8446044921875, 3.06597900390625, 3.287353515625, 3.50872802734375, 3.7301025390625, 3.95147705078125, 4.1728515625, 4.39422607421875, 4.6156005859375, 4.83697509765625, 5.058349609375, 5.27972412109375, 5.5010986328125, 5.72247314453125, 5.94384765625, 6.16522216796875, 6.3865966796875, 6.60797119140625, 6.829345703125, 7.05072021484375, 7.2720947265625, 7.49346923828125, 7.71484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 15.0, 21.0, 23.0, 24.0, 46.0, 91.0, 156.0, 226.0, 455.0, 853.0, 1937.0, 4635.0, 12262.0, 35784.0, 141052.0, 654659.0, 139948.0, 35693.0, 12267.0, 4619.0, 1865.0, 864.0, 429.0, 229.0, 130.0, 81.0, 57.0, 31.0, 15.0, 21.0, 6.0, 10.0, 12.0, 3.0, 1.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-27.859375, -26.974853515625, -26.09033203125, -25.205810546875, -24.3212890625, -23.436767578125, -22.55224609375, -21.667724609375, -20.783203125, -19.898681640625, -19.01416015625, -18.129638671875, -17.2451171875, -16.360595703125, -15.47607421875, -14.591552734375, -13.70703125, -12.822509765625, -11.93798828125, -11.053466796875, -10.1689453125, -9.284423828125, -8.39990234375, -7.515380859375, -6.630859375, -5.746337890625, -4.86181640625, -3.977294921875, -3.0927734375, -2.208251953125, -1.32373046875, -0.439208984375, 0.4453125, 1.329833984375, 2.21435546875, 3.098876953125, 3.9833984375, 4.867919921875, 5.75244140625, 6.636962890625, 7.521484375, 8.406005859375, 9.29052734375, 10.175048828125, 11.0595703125, 11.944091796875, 12.82861328125, 13.713134765625, 14.59765625, 15.482177734375, 16.36669921875, 17.251220703125, 18.1357421875, 19.020263671875, 19.90478515625, 20.789306640625, 21.673828125, 22.558349609375, 23.44287109375, 24.327392578125, 25.2119140625, 26.096435546875, 26.98095703125, 27.865478515625, 28.75]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 8.0, 8.0, 14.0, 17.0, 23.0, 43.0, 42.0, 51.0, 54.0, 61.0, 87.0, 86.0, 69.0, 84.0, 69.0, 50.0, 55.0, 42.0, 37.0, 19.0, 14.0, 20.0, 17.0, 7.0, 8.0, 10.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.140625, -29.181884765625, -28.22314453125, -27.264404296875, -26.3056640625, -25.346923828125, -24.38818359375, -23.429443359375, -22.470703125, -21.511962890625, -20.55322265625, -19.594482421875, -18.6357421875, -17.677001953125, -16.71826171875, -15.759521484375, -14.80078125, -13.842041015625, -12.88330078125, -11.924560546875, -10.9658203125, -10.007080078125, -9.04833984375, -8.089599609375, -7.130859375, -6.172119140625, -5.21337890625, -4.254638671875, -3.2958984375, -2.337158203125, -1.37841796875, -0.419677734375, 0.5390625, 1.497802734375, 2.45654296875, 3.415283203125, 4.3740234375, 5.332763671875, 6.29150390625, 7.250244140625, 8.208984375, 9.167724609375, 10.12646484375, 11.085205078125, 12.0439453125, 13.002685546875, 13.96142578125, 14.920166015625, 15.87890625, 16.837646484375, 17.79638671875, 18.755126953125, 19.7138671875, 20.672607421875, 21.63134765625, 22.590087890625, 23.548828125, 24.507568359375, 25.46630859375, 26.425048828125, 27.3837890625, 28.342529296875, 29.30126953125, 30.260009765625, 31.21875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 14.0, 10.0, 20.0, 20.0, 28.0, 39.0, 75.0, 129.0, 238.0, 503.0, 1056.0, 2567.0, 7512.0, 22328.0, 82802.0, 685063.0, 193280.0, 35062.0, 11045.0, 3885.0, 1424.0, 713.0, 294.0, 150.0, 97.0, 61.0, 35.0, 29.0, 16.0, 21.0, 15.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.12744140625, -10.6767578125, -10.22607421875, -9.775390625, -9.32470703125, -8.8740234375, -8.42333984375, -7.97265625, -7.52197265625, -7.0712890625, -6.62060546875, -6.169921875, -5.71923828125, -5.2685546875, -4.81787109375, -4.3671875, -3.91650390625, -3.4658203125, -3.01513671875, -2.564453125, -2.11376953125, -1.6630859375, -1.21240234375, -0.76171875, -0.31103515625, 0.1396484375, 0.59033203125, 1.041015625, 1.49169921875, 1.9423828125, 2.39306640625, 2.84375, 3.29443359375, 3.7451171875, 4.19580078125, 4.646484375, 5.09716796875, 5.5478515625, 5.99853515625, 6.44921875, 6.89990234375, 7.3505859375, 7.80126953125, 8.251953125, 8.70263671875, 9.1533203125, 9.60400390625, 10.0546875, 10.50537109375, 10.9560546875, 11.40673828125, 11.857421875, 12.30810546875, 12.7587890625, 13.20947265625, 13.66015625, 14.11083984375, 14.5615234375, 15.01220703125, 15.462890625, 15.91357421875, 16.3642578125, 16.81494140625, 17.265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 13.0, 16.0, 22.0, 29.0, 20.0, 52.0, 119.0, 301.0, 213.0, 67.0, 21.0, 11.0, 14.0, 15.0, 8.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002307891845703125, -0.0022275447845458984, -0.002147197723388672, -0.0020668506622314453, -0.0019865036010742188, -0.0019061565399169922, -0.0018258094787597656, -0.001745462417602539, -0.0016651153564453125, -0.001584768295288086, -0.0015044212341308594, -0.0014240741729736328, -0.0013437271118164062, -0.0012633800506591797, -0.0011830329895019531, -0.0011026859283447266, -0.0010223388671875, -0.0009419918060302734, -0.0008616447448730469, -0.0007812976837158203, -0.0007009506225585938, -0.0006206035614013672, -0.0005402565002441406, -0.00045990943908691406, -0.0003795623779296875, -0.00029921531677246094, -0.00021886825561523438, -0.0001385211944580078, -5.817413330078125e-05, 2.2172927856445312e-05, 0.00010251998901367188, 0.00018286705017089844, 0.000263214111328125, 0.00034356117248535156, 0.0004239082336425781, 0.0005042552947998047, 0.0005846023559570312, 0.0006649494171142578, 0.0007452964782714844, 0.0008256435394287109, 0.0009059906005859375, 0.000986337661743164, 0.0010666847229003906, 0.0011470317840576172, 0.0012273788452148438, 0.0013077259063720703, 0.0013880729675292969, 0.0014684200286865234, 0.00154876708984375, 0.0016291141510009766, 0.0017094612121582031, 0.0017898082733154297, 0.0018701553344726562, 0.0019505023956298828, 0.0020308494567871094, 0.002111196517944336, 0.0021915435791015625, 0.002271890640258789, 0.0023522377014160156, 0.002432584762573242, 0.0025129318237304688, 0.0025932788848876953, 0.002673625946044922, 0.0027539730072021484, 0.002834320068359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 21.0, 25.0, 30.0, 48.0, 54.0, 80.0, 139.0, 174.0, 332.0, 661.0, 1499.0, 4452.0, 15395.0, 56150.0, 615770.0, 298360.0, 38462.0, 10912.0, 3438.0, 1184.0, 557.0, 300.0, 163.0, 113.0, 60.0, 49.0, 32.0, 20.0, 16.0, 10.0, 13.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.484375, -14.982666015625, -14.48095703125, -13.979248046875, -13.4775390625, -12.975830078125, -12.47412109375, -11.972412109375, -11.470703125, -10.968994140625, -10.46728515625, -9.965576171875, -9.4638671875, -8.962158203125, -8.46044921875, -7.958740234375, -7.45703125, -6.955322265625, -6.45361328125, -5.951904296875, -5.4501953125, -4.948486328125, -4.44677734375, -3.945068359375, -3.443359375, -2.941650390625, -2.43994140625, -1.938232421875, -1.4365234375, -0.934814453125, -0.43310546875, 0.068603515625, 0.5703125, 1.072021484375, 1.57373046875, 2.075439453125, 2.5771484375, 3.078857421875, 3.58056640625, 4.082275390625, 4.583984375, 5.085693359375, 5.58740234375, 6.089111328125, 6.5908203125, 7.092529296875, 7.59423828125, 8.095947265625, 8.59765625, 9.099365234375, 9.60107421875, 10.102783203125, 10.6044921875, 11.106201171875, 11.60791015625, 12.109619140625, 12.611328125, 13.113037109375, 13.61474609375, 14.116455078125, 14.6181640625, 15.119873046875, 15.62158203125, 16.123291015625, 16.625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 4.0, 10.0, 9.0, 11.0, 15.0, 13.0, 17.0, 26.0, 50.0, 105.0, 186.0, 171.0, 119.0, 82.0, 54.0, 25.0, 24.0, 12.0, 13.0, 13.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.28125, -10.9346923828125, -10.588134765625, -10.2415771484375, -9.89501953125, -9.5484619140625, -9.201904296875, -8.8553466796875, -8.5087890625, -8.1622314453125, -7.815673828125, -7.4691162109375, -7.12255859375, -6.7760009765625, -6.429443359375, -6.0828857421875, -5.736328125, -5.3897705078125, -5.043212890625, -4.6966552734375, -4.35009765625, -4.0035400390625, -3.656982421875, -3.3104248046875, -2.9638671875, -2.6173095703125, -2.270751953125, -1.9241943359375, -1.57763671875, -1.2310791015625, -0.884521484375, -0.5379638671875, -0.19140625, 0.1551513671875, 0.501708984375, 0.8482666015625, 1.19482421875, 1.5413818359375, 1.887939453125, 2.2344970703125, 2.5810546875, 2.9276123046875, 3.274169921875, 3.6207275390625, 3.96728515625, 4.3138427734375, 4.660400390625, 5.0069580078125, 5.353515625, 5.7000732421875, 6.046630859375, 6.3931884765625, 6.73974609375, 7.0863037109375, 7.432861328125, 7.7794189453125, 8.1259765625, 8.4725341796875, 8.819091796875, 9.1656494140625, 9.51220703125, 9.8587646484375, 10.205322265625, 10.5518798828125, 10.8984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 5.0, 16.0, 34.0, 44.0, 83.0, 111.0, 133.0, 147.0, 145.0, 129.0, 76.0, 38.0, 20.0, 10.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.25495910644531, -88.2148208618164, -82.17469024658203, -76.13455200195312, -70.09442138671875, -64.05428314208984, -58.01414489746094, -51.9740104675293, -45.933876037597656, -39.893741607666016, -33.853607177734375, -27.81346893310547, -21.773334503173828, -15.733200073242188, -9.693061828613281, -3.6529273986816406, 2.38720703125, 8.427342414855957, 14.467477798461914, 20.507614135742188, 26.547748565673828, 32.58788299560547, 38.628021240234375, 44.668155670166016, 50.708290100097656, 56.7484245300293, 62.78855895996094, 68.82869720458984, 74.86883544921875, 80.90896606445312, 86.94910430908203, 92.98924255371094, 99.02938842773438, 105.06952667236328, 111.10965728759766, 117.14979553222656, 123.18992614746094, 129.23007202148438, 135.27020263671875, 141.31033325195312, 147.3504638671875, 153.39059448242188, 159.4307403564453, 165.4708709716797, 171.51100158691406, 177.5511474609375, 183.59127807617188, 189.63140869140625, 195.6715545654297, 201.71168518066406, 207.7518310546875, 213.79196166992188, 219.83209228515625, 225.87222290039062, 231.91236877441406, 237.95249938964844, 243.99264526367188, 250.03277587890625, 256.0729064941406, 262.113037109375, 268.1531982421875, 274.1933288574219, 280.23345947265625, 286.2735900878906, 292.313720703125]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 1.0, 8.0, 10.0, 8.0, 13.0, 11.0, 14.0, 21.0, 25.0, 18.0, 25.0, 24.0, 34.0, 31.0, 26.0, 37.0, 42.0, 45.0, 37.0, 46.0, 27.0, 44.0, 40.0, 41.0, 39.0, 33.0, 37.0, 31.0, 23.0, 29.0, 23.0, 24.0, 18.0, 16.0, 17.0, 16.0, 15.0, 16.0, 9.0, 7.0, 3.0, 8.0, 6.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-69.92535400390625, -67.42276000976562, -64.920166015625, -62.41757583618164, -59.91498565673828, -57.412391662597656, -54.90979766845703, -52.407203674316406, -49.90461349487305, -47.40201950073242, -44.89942932128906, -42.39683532714844, -39.89424133300781, -37.39165115356445, -34.88905715942383, -32.38646697998047, -29.883872985839844, -27.38128089904785, -24.87868881225586, -22.376094818115234, -19.873502731323242, -17.37091064453125, -14.868317604064941, -12.365724563598633, -9.86313247680664, -7.36053991317749, -4.85794734954834, -2.3553547859191895, 0.14723777770996094, 2.649829864501953, 5.152422904968262, 7.65501594543457, 10.157608032226562, 12.660200119018555, 15.162793159484863, 17.665386199951172, 20.167978286743164, 22.670570373535156, 25.17316436767578, 27.675756454467773, 30.178348541259766, 32.68094253540039, 35.18353271484375, 37.686126708984375, 40.188720703125, 42.69131088256836, 45.193904876708984, 47.696495056152344, 50.19908905029297, 52.701683044433594, 55.20427322387695, 57.70686721801758, 60.20945739746094, 62.71205139160156, 65.21464538574219, 67.71723937988281, 70.21983337402344, 72.72242736816406, 75.22502136230469, 77.72760772705078, 80.2302017211914, 82.73279571533203, 85.23538970947266, 87.73798370361328, 90.24057006835938]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 6.0, 13.0, 20.0, 19.0, 20.0, 38.0, 58.0, 72.0, 87.0, 134.0, 193.0, 289.0, 443.0, 753.0, 1471.0, 3081.0, 7278.0, 20886.0, 78184.0, 2598929.0, 1373696.0, 74863.0, 20074.0, 7047.0, 3170.0, 1446.0, 809.0, 407.0, 247.0, 171.0, 108.0, 74.0, 54.0, 36.0, 27.0, 16.0, 11.0, 12.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.3125, -58.48388671875, -56.6552734375, -54.82666015625, -52.998046875, -51.16943359375, -49.3408203125, -47.51220703125, -45.68359375, -43.85498046875, -42.0263671875, -40.19775390625, -38.369140625, -36.54052734375, -34.7119140625, -32.88330078125, -31.0546875, -29.22607421875, -27.3974609375, -25.56884765625, -23.740234375, -21.91162109375, -20.0830078125, -18.25439453125, -16.42578125, -14.59716796875, -12.7685546875, -10.93994140625, -9.111328125, -7.28271484375, -5.4541015625, -3.62548828125, -1.796875, 0.03173828125, 1.8603515625, 3.68896484375, 5.517578125, 7.34619140625, 9.1748046875, 11.00341796875, 12.83203125, 14.66064453125, 16.4892578125, 18.31787109375, 20.146484375, 21.97509765625, 23.8037109375, 25.63232421875, 27.4609375, 29.28955078125, 31.1181640625, 32.94677734375, 34.775390625, 36.60400390625, 38.4326171875, 40.26123046875, 42.08984375, 43.91845703125, 45.7470703125, 47.57568359375, 49.404296875, 51.23291015625, 53.0615234375, 54.89013671875, 56.71875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 16.0, 12.0, 25.0, 25.0, 30.0, 40.0, 45.0, 50.0, 56.0, 61.0, 65.0, 65.0, 65.0, 67.0, 62.0, 53.0, 58.0, 43.0, 38.0, 21.0, 27.0, 15.0, 18.0, 10.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.30078125, -6.08184814453125, -5.8629150390625, -5.64398193359375, -5.425048828125, -5.20611572265625, -4.9871826171875, -4.76824951171875, -4.54931640625, -4.33038330078125, -4.1114501953125, -3.89251708984375, -3.673583984375, -3.45465087890625, -3.2357177734375, -3.01678466796875, -2.7978515625, -2.57891845703125, -2.3599853515625, -2.14105224609375, -1.922119140625, -1.70318603515625, -1.4842529296875, -1.26531982421875, -1.04638671875, -0.82745361328125, -0.6085205078125, -0.38958740234375, -0.170654296875, 0.04827880859375, 0.2672119140625, 0.48614501953125, 0.705078125, 0.92401123046875, 1.1429443359375, 1.36187744140625, 1.580810546875, 1.79974365234375, 2.0186767578125, 2.23760986328125, 2.45654296875, 2.67547607421875, 2.8944091796875, 3.11334228515625, 3.332275390625, 3.55120849609375, 3.7701416015625, 3.98907470703125, 4.2080078125, 4.42694091796875, 4.6458740234375, 4.86480712890625, 5.083740234375, 5.30267333984375, 5.5216064453125, 5.74053955078125, 5.95947265625, 6.17840576171875, 6.3973388671875, 6.61627197265625, 6.835205078125, 7.05413818359375, 7.2730712890625, 7.49200439453125, 7.7109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 8.0, 4.0, 5.0, 4.0, 12.0, 13.0, 18.0, 20.0, 44.0, 50.0, 55.0, 87.0, 112.0, 172.0, 233.0, 341.0, 510.0, 861.0, 1468.0, 2629.0, 5180.0, 10668.0, 24235.0, 64335.0, 235996.0, 3121609.0, 553227.0, 106104.0, 36108.0, 14812.0, 6986.0, 3586.0, 1841.0, 1072.0, 610.0, 423.0, 243.0, 174.0, 120.0, 78.0, 51.0, 47.0, 39.0, 21.0, 17.0, 11.0, 14.0, 10.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-30.328125, -29.401123046875, -28.47412109375, -27.547119140625, -26.6201171875, -25.693115234375, -24.76611328125, -23.839111328125, -22.912109375, -21.985107421875, -21.05810546875, -20.131103515625, -19.2041015625, -18.277099609375, -17.35009765625, -16.423095703125, -15.49609375, -14.569091796875, -13.64208984375, -12.715087890625, -11.7880859375, -10.861083984375, -9.93408203125, -9.007080078125, -8.080078125, -7.153076171875, -6.22607421875, -5.299072265625, -4.3720703125, -3.445068359375, -2.51806640625, -1.591064453125, -0.6640625, 0.262939453125, 1.18994140625, 2.116943359375, 3.0439453125, 3.970947265625, 4.89794921875, 5.824951171875, 6.751953125, 7.678955078125, 8.60595703125, 9.532958984375, 10.4599609375, 11.386962890625, 12.31396484375, 13.240966796875, 14.16796875, 15.094970703125, 16.02197265625, 16.948974609375, 17.8759765625, 18.802978515625, 19.72998046875, 20.656982421875, 21.583984375, 22.510986328125, 23.43798828125, 24.364990234375, 25.2919921875, 26.218994140625, 27.14599609375, 28.072998046875, 29.0]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 9.0, 16.0, 22.0, 47.0, 45.0, 83.0, 157.0, 316.0, 1723.0, 982.0, 282.0, 145.0, 66.0, 42.0, 34.0, 21.0, 17.0, 10.0, 5.0, 9.0, 6.0, 1.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.34375, -21.79736328125, -21.2509765625, -20.70458984375, -20.158203125, -19.61181640625, -19.0654296875, -18.51904296875, -17.97265625, -17.42626953125, -16.8798828125, -16.33349609375, -15.787109375, -15.24072265625, -14.6943359375, -14.14794921875, -13.6015625, -13.05517578125, -12.5087890625, -11.96240234375, -11.416015625, -10.86962890625, -10.3232421875, -9.77685546875, -9.23046875, -8.68408203125, -8.1376953125, -7.59130859375, -7.044921875, -6.49853515625, -5.9521484375, -5.40576171875, -4.859375, -4.31298828125, -3.7666015625, -3.22021484375, -2.673828125, -2.12744140625, -1.5810546875, -1.03466796875, -0.48828125, 0.05810546875, 0.6044921875, 1.15087890625, 1.697265625, 2.24365234375, 2.7900390625, 3.33642578125, 3.8828125, 4.42919921875, 4.9755859375, 5.52197265625, 6.068359375, 6.61474609375, 7.1611328125, 7.70751953125, 8.25390625, 8.80029296875, 9.3466796875, 9.89306640625, 10.439453125, 10.98583984375, 11.5322265625, 12.07861328125, 12.625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 14.0, 46.0, 75.0, 153.0, 196.0, 241.0, 143.0, 71.0, 37.0, 14.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-230.5846405029297, -225.5850830078125, -220.58551025390625, -215.58595275878906, -210.58639526367188, -205.58682250976562, -200.58726501464844, -195.58770751953125, -190.588134765625, -185.5885772705078, -180.58900451660156, -175.58944702148438, -170.5898895263672, -165.59031677246094, -160.59075927734375, -155.5911865234375, -150.59164428710938, -145.5920867919922, -140.59251403808594, -135.59295654296875, -130.59339904785156, -125.59382629394531, -120.59426879882812, -115.5947036743164, -110.59513854980469, -105.59557342529297, -100.59601593017578, -95.59645080566406, -90.59688568115234, -85.59732055664062, -80.59776306152344, -75.59819793701172, -70.59862518310547, -65.59906005859375, -60.5994987487793, -55.599937438964844, -50.600372314453125, -45.60081100463867, -40.60124969482422, -35.6016845703125, -30.602123260498047, -25.60256004333496, -20.602996826171875, -15.603435516357422, -10.603872299194336, -5.60430908203125, -0.6047477722167969, 4.394817352294922, 9.394378662109375, 14.393941879272461, 19.393505096435547, 24.39306640625, 29.392629623413086, 34.39219284057617, 39.391754150390625, 44.391319274902344, 49.3908805847168, 54.39044189453125, 59.39000701904297, 64.38957214355469, 69.38912963867188, 74.3886947631836, 79.38825988769531, 84.3878173828125, 89.38738250732422]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 5.0, 12.0, 19.0, 23.0, 26.0, 37.0, 35.0, 37.0, 40.0, 37.0, 47.0, 56.0, 42.0, 57.0, 59.0, 71.0, 49.0, 45.0, 43.0, 41.0, 32.0, 42.0, 34.0, 24.0, 21.0, 15.0, 11.0, 9.0, 7.0, 7.0, 2.0, 2.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.89250564575195, -50.052852630615234, -48.213199615478516, -46.37354278564453, -44.53388977050781, -42.694236755371094, -40.854583740234375, -39.014930725097656, -37.17527770996094, -35.33562469482422, -33.4959716796875, -31.65631675720215, -29.816661834716797, -27.977008819580078, -26.13735580444336, -24.29770278930664, -22.458045959472656, -20.618392944335938, -18.778738021850586, -16.939085006713867, -15.099431037902832, -13.259777069091797, -11.420124053955078, -9.580470085144043, -7.740816116333008, -5.901162147521973, -4.061508655548096, -2.2218551635742188, -0.3822011947631836, 1.4574527740478516, 3.2971057891845703, 5.1367597579956055, 6.976417541503906, 8.816071510314941, 10.655725479125977, 12.495378494262695, 14.33503246307373, 16.174686431884766, 18.014339447021484, 19.853992462158203, 21.693647384643555, 23.533300399780273, 25.372955322265625, 27.212608337402344, 29.052261352539062, 30.891916275024414, 32.7315673828125, 34.571224212646484, 36.4108772277832, 38.25053024291992, 40.09018325805664, 41.929840087890625, 43.769493103027344, 45.60914611816406, 47.44879913330078, 49.2884521484375, 51.12810516357422, 52.96775817871094, 54.807411193847656, 56.647064208984375, 58.48672103881836, 60.32637405395508, 62.1660270690918, 64.00568389892578, 65.8453369140625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 17.0, 26.0, 39.0, 60.0, 90.0, 139.0, 219.0, 388.0, 697.0, 1468.0, 3676.0, 11004.0, 41872.0, 175244.0, 570900.0, 181550.0, 42741.0, 11454.0, 3754.0, 1504.0, 694.0, 382.0, 212.0, 144.0, 92.0, 58.0, 37.0, 27.0, 18.0, 15.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.25, -40.9091796875, -39.568359375, -38.2275390625, -36.88671875, -35.5458984375, -34.205078125, -32.8642578125, -31.5234375, -30.1826171875, -28.841796875, -27.5009765625, -26.16015625, -24.8193359375, -23.478515625, -22.1376953125, -20.796875, -19.4560546875, -18.115234375, -16.7744140625, -15.43359375, -14.0927734375, -12.751953125, -11.4111328125, -10.0703125, -8.7294921875, -7.388671875, -6.0478515625, -4.70703125, -3.3662109375, -2.025390625, -0.6845703125, 0.65625, 1.9970703125, 3.337890625, 4.6787109375, 6.01953125, 7.3603515625, 8.701171875, 10.0419921875, 11.3828125, 12.7236328125, 14.064453125, 15.4052734375, 16.74609375, 18.0869140625, 19.427734375, 20.7685546875, 22.109375, 23.4501953125, 24.791015625, 26.1318359375, 27.47265625, 28.8134765625, 30.154296875, 31.4951171875, 32.8359375, 34.1767578125, 35.517578125, 36.8583984375, 38.19921875, 39.5400390625, 40.880859375, 42.2216796875, 43.5625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 8.0, 11.0, 15.0, 28.0, 31.0, 34.0, 40.0, 50.0, 46.0, 47.0, 51.0, 57.0, 71.0, 53.0, 66.0, 62.0, 62.0, 43.0, 49.0, 36.0, 41.0, 26.0, 18.0, 20.0, 10.0, 6.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.8125, -6.578125, -6.34375, -6.109375, -5.875, -5.640625, -5.40625, -5.171875, -4.9375, -4.703125, -4.46875, -4.234375, -4.0, -3.765625, -3.53125, -3.296875, -3.0625, -2.828125, -2.59375, -2.359375, -2.125, -1.890625, -1.65625, -1.421875, -1.1875, -0.953125, -0.71875, -0.484375, -0.25, -0.015625, 0.21875, 0.453125, 0.6875, 0.921875, 1.15625, 1.390625, 1.625, 1.859375, 2.09375, 2.328125, 2.5625, 2.796875, 3.03125, 3.265625, 3.5, 3.734375, 3.96875, 4.203125, 4.4375, 4.671875, 4.90625, 5.140625, 5.375, 5.609375, 5.84375, 6.078125, 6.3125, 6.546875, 6.78125, 7.015625, 7.25, 7.484375, 7.71875, 7.953125, 8.1875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 7.0, 5.0, 16.0, 13.0, 18.0, 27.0, 29.0, 68.0, 81.0, 122.0, 143.0, 217.0, 309.0, 440.0, 750.0, 1407.0, 2930.0, 7551.0, 23520.0, 81335.0, 331784.0, 443985.0, 105917.0, 30546.0, 9769.0, 3513.0, 1612.0, 806.0, 498.0, 313.0, 228.0, 160.0, 139.0, 73.0, 74.0, 39.0, 40.0, 26.0, 14.0, 11.0, 11.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.421875, -22.6171875, -21.8125, -21.0078125, -20.203125, -19.3984375, -18.59375, -17.7890625, -16.984375, -16.1796875, -15.375, -14.5703125, -13.765625, -12.9609375, -12.15625, -11.3515625, -10.546875, -9.7421875, -8.9375, -8.1328125, -7.328125, -6.5234375, -5.71875, -4.9140625, -4.109375, -3.3046875, -2.5, -1.6953125, -0.890625, -0.0859375, 0.71875, 1.5234375, 2.328125, 3.1328125, 3.9375, 4.7421875, 5.546875, 6.3515625, 7.15625, 7.9609375, 8.765625, 9.5703125, 10.375, 11.1796875, 11.984375, 12.7890625, 13.59375, 14.3984375, 15.203125, 16.0078125, 16.8125, 17.6171875, 18.421875, 19.2265625, 20.03125, 20.8359375, 21.640625, 22.4453125, 23.25, 24.0546875, 24.859375, 25.6640625, 26.46875, 27.2734375, 28.078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 5.0, 2.0, 10.0, 4.0, 7.0, 15.0, 8.0, 14.0, 20.0, 18.0, 26.0, 27.0, 25.0, 37.0, 33.0, 32.0, 30.0, 40.0, 43.0, 38.0, 48.0, 61.0, 50.0, 46.0, 40.0, 49.0, 38.0, 33.0, 24.0, 26.0, 23.0, 28.0, 16.0, 24.0, 18.0, 5.0, 11.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.640625, -20.98828125, -20.3359375, -19.68359375, -19.03125, -18.37890625, -17.7265625, -17.07421875, -16.421875, -15.76953125, -15.1171875, -14.46484375, -13.8125, -13.16015625, -12.5078125, -11.85546875, -11.203125, -10.55078125, -9.8984375, -9.24609375, -8.59375, -7.94140625, -7.2890625, -6.63671875, -5.984375, -5.33203125, -4.6796875, -4.02734375, -3.375, -2.72265625, -2.0703125, -1.41796875, -0.765625, -0.11328125, 0.5390625, 1.19140625, 1.84375, 2.49609375, 3.1484375, 3.80078125, 4.453125, 5.10546875, 5.7578125, 6.41015625, 7.0625, 7.71484375, 8.3671875, 9.01953125, 9.671875, 10.32421875, 10.9765625, 11.62890625, 12.28125, 12.93359375, 13.5859375, 14.23828125, 14.890625, 15.54296875, 16.1953125, 16.84765625, 17.5, 18.15234375, 18.8046875, 19.45703125, 20.109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 14.0, 7.0, 21.0, 24.0, 41.0, 49.0, 92.0, 120.0, 233.0, 408.0, 665.0, 1271.0, 2684.0, 6003.0, 15796.0, 46962.0, 162076.0, 521630.0, 201526.0, 56899.0, 18840.0, 7015.0, 2951.0, 1426.0, 741.0, 430.0, 240.0, 145.0, 93.0, 55.0, 32.0, 20.0, 18.0, 10.0, 6.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.7529296875, -8.435546875, -8.1181640625, -7.80078125, -7.4833984375, -7.166015625, -6.8486328125, -6.53125, -6.2138671875, -5.896484375, -5.5791015625, -5.26171875, -4.9443359375, -4.626953125, -4.3095703125, -3.9921875, -3.6748046875, -3.357421875, -3.0400390625, -2.72265625, -2.4052734375, -2.087890625, -1.7705078125, -1.453125, -1.1357421875, -0.818359375, -0.5009765625, -0.18359375, 0.1337890625, 0.451171875, 0.7685546875, 1.0859375, 1.4033203125, 1.720703125, 2.0380859375, 2.35546875, 2.6728515625, 2.990234375, 3.3076171875, 3.625, 3.9423828125, 4.259765625, 4.5771484375, 4.89453125, 5.2119140625, 5.529296875, 5.8466796875, 6.1640625, 6.4814453125, 6.798828125, 7.1162109375, 7.43359375, 7.7509765625, 8.068359375, 8.3857421875, 8.703125, 9.0205078125, 9.337890625, 9.6552734375, 9.97265625, 10.2900390625, 10.607421875, 10.9248046875, 11.2421875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 8.0, 10.0, 10.0, 6.0, 19.0, 14.0, 15.0, 30.0, 40.0, 35.0, 49.0, 92.0, 140.0, 168.0, 100.0, 48.0, 38.0, 29.0, 28.0, 26.0, 17.0, 16.0, 10.0, 8.0, 4.0, 8.0, 10.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018281936645507812, -0.0017672628164291382, -0.0017063319683074951, -0.001645401120185852, -0.001584470272064209, -0.001523539423942566, -0.0014626085758209229, -0.0014016777276992798, -0.0013407468795776367, -0.0012798160314559937, -0.0012188851833343506, -0.0011579543352127075, -0.0010970234870910645, -0.0010360926389694214, -0.0009751617908477783, -0.0009142309427261353, -0.0008533000946044922, -0.0007923692464828491, -0.0007314383983612061, -0.000670507550239563, -0.0006095767021179199, -0.0005486458539962769, -0.0004877150058746338, -0.0004267841577529907, -0.00036585330963134766, -0.0003049224615097046, -0.00024399161338806152, -0.00018306076526641846, -0.0001221299171447754, -6.119906902313232e-05, -2.682209014892578e-07, 6.066262722015381e-05, 0.00012159347534179688, 0.00018252432346343994, 0.000243455171585083, 0.0003043860197067261, 0.00036531686782836914, 0.0004262477159500122, 0.0004871785640716553, 0.0005481094121932983, 0.0006090402603149414, 0.0006699711084365845, 0.0007309019565582275, 0.0007918328046798706, 0.0008527636528015137, 0.0009136945009231567, 0.0009746253490447998, 0.0010355561971664429, 0.001096487045288086, 0.001157417893409729, 0.001218348741531372, 0.0012792795896530151, 0.0013402104377746582, 0.0014011412858963013, 0.0014620721340179443, 0.0015230029821395874, 0.0015839338302612305, 0.0016448646783828735, 0.0017057955265045166, 0.0017667263746261597, 0.0018276572227478027, 0.0018885880708694458, 0.0019495189189910889, 0.002010449767112732, 0.002071380615234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 12.0, 16.0, 26.0, 35.0, 58.0, 122.0, 246.0, 583.0, 1631.0, 5149.0, 25797.0, 306857.0, 642657.0, 53339.0, 8197.0, 2286.0, 809.0, 358.0, 151.0, 78.0, 55.0, 25.0, 24.0, 9.0, 11.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-27.40625, -26.70654296875, -26.0068359375, -25.30712890625, -24.607421875, -23.90771484375, -23.2080078125, -22.50830078125, -21.80859375, -21.10888671875, -20.4091796875, -19.70947265625, -19.009765625, -18.31005859375, -17.6103515625, -16.91064453125, -16.2109375, -15.51123046875, -14.8115234375, -14.11181640625, -13.412109375, -12.71240234375, -12.0126953125, -11.31298828125, -10.61328125, -9.91357421875, -9.2138671875, -8.51416015625, -7.814453125, -7.11474609375, -6.4150390625, -5.71533203125, -5.015625, -4.31591796875, -3.6162109375, -2.91650390625, -2.216796875, -1.51708984375, -0.8173828125, -0.11767578125, 0.58203125, 1.28173828125, 1.9814453125, 2.68115234375, 3.380859375, 4.08056640625, 4.7802734375, 5.47998046875, 6.1796875, 6.87939453125, 7.5791015625, 8.27880859375, 8.978515625, 9.67822265625, 10.3779296875, 11.07763671875, 11.77734375, 12.47705078125, 13.1767578125, 13.87646484375, 14.576171875, 15.27587890625, 15.9755859375, 16.67529296875, 17.375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 6.0, 21.0, 13.0, 22.0, 24.0, 51.0, 79.0, 112.0, 119.0, 142.0, 139.0, 80.0, 56.0, 41.0, 31.0, 15.0, 12.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.859375, -19.3773193359375, -18.895263671875, -18.4132080078125, -17.93115234375, -17.4490966796875, -16.967041015625, -16.4849853515625, -16.0029296875, -15.5208740234375, -15.038818359375, -14.5567626953125, -14.07470703125, -13.5926513671875, -13.110595703125, -12.6285400390625, -12.146484375, -11.6644287109375, -11.182373046875, -10.7003173828125, -10.21826171875, -9.7362060546875, -9.254150390625, -8.7720947265625, -8.2900390625, -7.8079833984375, -7.325927734375, -6.8438720703125, -6.36181640625, -5.8797607421875, -5.397705078125, -4.9156494140625, -4.43359375, -3.9515380859375, -3.469482421875, -2.9874267578125, -2.50537109375, -2.0233154296875, -1.541259765625, -1.0592041015625, -0.5771484375, -0.0950927734375, 0.386962890625, 0.8690185546875, 1.35107421875, 1.8331298828125, 2.315185546875, 2.7972412109375, 3.279296875, 3.7613525390625, 4.243408203125, 4.7254638671875, 5.20751953125, 5.6895751953125, 6.171630859375, 6.6536865234375, 7.1357421875, 7.6177978515625, 8.099853515625, 8.5819091796875, 9.06396484375, 9.5460205078125, 10.028076171875, 10.5101318359375, 10.9921875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 19.0, 99.0, 272.0, 385.0, 185.0, 50.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.3323974609375, -154.78855895996094, -136.24472045898438, -117.70086669921875, -99.15702819824219, -80.61318969726562, -62.06934356689453, -43.52549743652344, -24.981658935546875, -6.437816619873047, 12.106025695800781, 30.64986801147461, 49.19371032714844, 67.737548828125, 86.2813949584961, 104.82524108886719, 123.36907958984375, 141.9129180908203, 160.45675659179688, 179.0006103515625, 197.54444885253906, 216.08828735351562, 234.63214111328125, 253.1759796142578, 271.7198181152344, 290.263671875, 308.8074951171875, 327.3513488769531, 345.89520263671875, 364.43902587890625, 382.9828796386719, 401.5267333984375, 420.07049560546875, 438.6143493652344, 457.1581726074219, 475.7020263671875, 494.245849609375, 512.7896728515625, 531.3335571289062, 549.8773803710938, 568.4212646484375, 586.965087890625, 605.5089721679688, 624.0527954101562, 642.5966186523438, 661.1405029296875, 679.684326171875, 698.2281494140625, 716.77197265625, 735.3157958984375, 753.8596801757812, 772.4035034179688, 790.9473266601562, 809.4912109375, 828.0350341796875, 846.578857421875, 865.1226806640625, 883.66650390625, 902.2103881835938, 920.7542114257812, 939.2980346679688, 957.8419189453125, 976.3857421875, 994.9295654296875, 1013.4734497070312]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 10.0, 7.0, 12.0, 10.0, 16.0, 20.0, 28.0, 26.0, 22.0, 25.0, 46.0, 37.0, 42.0, 40.0, 43.0, 42.0, 41.0, 50.0, 40.0, 47.0, 41.0, 38.0, 47.0, 42.0, 33.0, 30.0, 28.0, 18.0, 12.0, 20.0, 17.0, 13.0, 19.0, 9.0, 5.0, 10.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.46636962890625, -107.0630111694336, -103.65966033935547, -100.25630187988281, -96.85295104980469, -93.44959259033203, -90.0462417602539, -86.64288330078125, -83.23953247070312, -79.83617401123047, -76.43282318115234, -73.02946472167969, -69.62611389160156, -66.2227554321289, -62.81940460205078, -59.416046142578125, -56.012691497802734, -52.609336853027344, -49.20598220825195, -45.80262756347656, -42.39927291870117, -38.99591827392578, -35.592559814453125, -32.189208984375, -28.785852432250977, -25.382497787475586, -21.979143142700195, -18.575786590576172, -15.172432899475098, -11.76907730102539, -8.36572265625, -4.962368011474609, -1.5590133666992188, 1.844341516494751, 5.247696399688721, 8.65105152130127, 12.05440616607666, 15.457761764526367, 18.861116409301758, 22.26447105407715, 25.66782569885254, 29.07118034362793, 32.47453689575195, 35.877891540527344, 39.281246185302734, 42.684600830078125, 46.087955474853516, 49.491310119628906, 52.8946647644043, 56.29801940917969, 59.70137405395508, 63.10472869873047, 66.50808715820312, 69.91143798828125, 73.3147964477539, 76.71814727783203, 80.12150573730469, 83.52486419677734, 86.92821502685547, 90.33157348632812, 93.73492431640625, 97.1382827758789, 100.54163360595703, 103.94499206542969, 107.34834289550781]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 16.0, 22.0, 26.0, 47.0, 40.0, 63.0, 99.0, 113.0, 226.0, 283.0, 489.0, 873.0, 1705.0, 3690.0, 9825.0, 31905.0, 156006.0, 3355582.0, 536644.0, 67453.0, 17510.0, 6224.0, 2539.0, 1254.0, 625.0, 357.0, 234.0, 140.0, 91.0, 46.0, 43.0, 29.0, 19.0, 8.0, 8.0, 7.0, 5.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-61.3125, -59.64453125, -57.9765625, -56.30859375, -54.640625, -52.97265625, -51.3046875, -49.63671875, -47.96875, -46.30078125, -44.6328125, -42.96484375, -41.296875, -39.62890625, -37.9609375, -36.29296875, -34.625, -32.95703125, -31.2890625, -29.62109375, -27.953125, -26.28515625, -24.6171875, -22.94921875, -21.28125, -19.61328125, -17.9453125, -16.27734375, -14.609375, -12.94140625, -11.2734375, -9.60546875, -7.9375, -6.26953125, -4.6015625, -2.93359375, -1.265625, 0.40234375, 2.0703125, 3.73828125, 5.40625, 7.07421875, 8.7421875, 10.41015625, 12.078125, 13.74609375, 15.4140625, 17.08203125, 18.75, 20.41796875, 22.0859375, 23.75390625, 25.421875, 27.08984375, 28.7578125, 30.42578125, 32.09375, 33.76171875, 35.4296875, 37.09765625, 38.765625, 40.43359375, 42.1015625, 43.76953125, 45.4375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 9.0, 14.0, 16.0, 21.0, 23.0, 34.0, 43.0, 45.0, 51.0, 62.0, 46.0, 50.0, 60.0, 57.0, 66.0, 53.0, 77.0, 51.0, 48.0, 39.0, 30.0, 26.0, 26.0, 11.0, 10.0, 10.0, 3.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.67578125, -6.44586181640625, -6.2159423828125, -5.98602294921875, -5.756103515625, -5.52618408203125, -5.2962646484375, -5.06634521484375, -4.83642578125, -4.60650634765625, -4.3765869140625, -4.14666748046875, -3.916748046875, -3.68682861328125, -3.4569091796875, -3.22698974609375, -2.9970703125, -2.76715087890625, -2.5372314453125, -2.30731201171875, -2.077392578125, -1.84747314453125, -1.6175537109375, -1.38763427734375, -1.15771484375, -0.92779541015625, -0.6978759765625, -0.46795654296875, -0.238037109375, -0.00811767578125, 0.2218017578125, 0.45172119140625, 0.681640625, 0.91156005859375, 1.1414794921875, 1.37139892578125, 1.601318359375, 1.83123779296875, 2.0611572265625, 2.29107666015625, 2.52099609375, 2.75091552734375, 2.9808349609375, 3.21075439453125, 3.440673828125, 3.67059326171875, 3.9005126953125, 4.13043212890625, 4.3603515625, 4.59027099609375, 4.8201904296875, 5.05010986328125, 5.280029296875, 5.50994873046875, 5.7398681640625, 5.96978759765625, 6.19970703125, 6.42962646484375, 6.6595458984375, 6.88946533203125, 7.119384765625, 7.34930419921875, 7.5792236328125, 7.80914306640625, 8.0390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 7.0, 9.0, 14.0, 17.0, 30.0, 53.0, 59.0, 103.0, 145.0, 240.0, 331.0, 563.0, 1081.0, 2342.0, 5838.0, 18982.0, 84261.0, 629513.0, 3169822.0, 221557.0, 41242.0, 10627.0, 3719.0, 1598.0, 789.0, 504.0, 278.0, 184.0, 109.0, 77.0, 64.0, 25.0, 35.0, 19.0, 13.0, 7.0, 14.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-43.375, -42.109375, -40.84375, -39.578125, -38.3125, -37.046875, -35.78125, -34.515625, -33.25, -31.984375, -30.71875, -29.453125, -28.1875, -26.921875, -25.65625, -24.390625, -23.125, -21.859375, -20.59375, -19.328125, -18.0625, -16.796875, -15.53125, -14.265625, -13.0, -11.734375, -10.46875, -9.203125, -7.9375, -6.671875, -5.40625, -4.140625, -2.875, -1.609375, -0.34375, 0.921875, 2.1875, 3.453125, 4.71875, 5.984375, 7.25, 8.515625, 9.78125, 11.046875, 12.3125, 13.578125, 14.84375, 16.109375, 17.375, 18.640625, 19.90625, 21.171875, 22.4375, 23.703125, 24.96875, 26.234375, 27.5, 28.765625, 30.03125, 31.296875, 32.5625, 33.828125, 35.09375, 36.359375, 37.625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 9.0, 12.0, 12.0, 20.0, 24.0, 22.0, 50.0, 74.0, 114.0, 162.0, 313.0, 722.0, 1365.0, 485.0, 259.0, 125.0, 85.0, 73.0, 41.0, 26.0, 15.0, 18.0, 14.0, 8.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.625, -18.0968017578125, -17.568603515625, -17.0404052734375, -16.51220703125, -15.9840087890625, -15.455810546875, -14.9276123046875, -14.3994140625, -13.8712158203125, -13.343017578125, -12.8148193359375, -12.28662109375, -11.7584228515625, -11.230224609375, -10.7020263671875, -10.173828125, -9.6456298828125, -9.117431640625, -8.5892333984375, -8.06103515625, -7.5328369140625, -7.004638671875, -6.4764404296875, -5.9482421875, -5.4200439453125, -4.891845703125, -4.3636474609375, -3.83544921875, -3.3072509765625, -2.779052734375, -2.2508544921875, -1.72265625, -1.1944580078125, -0.666259765625, -0.1380615234375, 0.39013671875, 0.9183349609375, 1.446533203125, 1.9747314453125, 2.5029296875, 3.0311279296875, 3.559326171875, 4.0875244140625, 4.61572265625, 5.1439208984375, 5.672119140625, 6.2003173828125, 6.728515625, 7.2567138671875, 7.784912109375, 8.3131103515625, 8.84130859375, 9.3695068359375, 9.897705078125, 10.4259033203125, 10.9541015625, 11.4822998046875, 12.010498046875, 12.5386962890625, 13.06689453125, 13.5950927734375, 14.123291015625, 14.6514892578125, 15.1796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 15.0, 19.0, 30.0, 41.0, 65.0, 94.0, 98.0, 111.0, 121.0, 125.0, 87.0, 68.0, 47.0, 26.0, 26.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.21259307861328, -84.56591796875, -80.91924285888672, -77.27256774902344, -73.62589263916016, -69.97921752929688, -66.3325424194336, -62.68586730957031, -59.03919219970703, -55.39251708984375, -51.74584197998047, -48.09916687011719, -44.452491760253906, -40.805816650390625, -37.159141540527344, -33.51246643066406, -29.86579132080078, -26.2191162109375, -22.57244110107422, -18.925765991210938, -15.279090881347656, -11.632415771484375, -7.985740661621094, -4.3390655517578125, -0.6923904418945312, 2.95428466796875, 6.600959777832031, 10.247634887695312, 13.894309997558594, 17.540985107421875, 21.187660217285156, 24.834335327148438, 28.48101806640625, 32.12769317626953, 35.77436828613281, 39.421043395996094, 43.067718505859375, 46.714393615722656, 50.36106872558594, 54.00774383544922, 57.6544189453125, 61.30109405517578, 64.94776916503906, 68.59444427490234, 72.24111938476562, 75.8877944946289, 79.53446960449219, 83.18114471435547, 86.82781982421875, 90.47449493408203, 94.12117004394531, 97.7678451538086, 101.41452026367188, 105.06119537353516, 108.70787048339844, 112.35454559326172, 116.001220703125, 119.64789581298828, 123.29457092285156, 126.94124603271484, 130.58792114257812, 134.23458862304688, 137.8812713623047, 141.5279541015625, 145.17462158203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 11.0, 14.0, 15.0, 12.0, 22.0, 35.0, 19.0, 29.0, 46.0, 49.0, 46.0, 56.0, 57.0, 45.0, 53.0, 74.0, 51.0, 61.0, 59.0, 40.0, 39.0, 34.0, 31.0, 21.0, 17.0, 11.0, 15.0, 4.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.87149047851562, -70.60835266113281, -68.34522247314453, -66.08208465576172, -63.818946838378906, -61.55581283569336, -59.29267883300781, -57.029541015625, -54.76640701293945, -52.503273010253906, -50.240135192871094, -47.97700119018555, -45.7138671875, -43.45072937011719, -41.18759536743164, -38.924461364746094, -36.66132354736328, -34.398189544677734, -32.13505172729492, -29.871917724609375, -27.608781814575195, -25.345645904541016, -23.08251190185547, -20.81937599182129, -18.55624008178711, -16.29310417175293, -14.029969215393066, -11.766834259033203, -9.503698348999023, -7.240562438964844, -4.9774274826049805, -2.714292526245117, -0.4511566162109375, 1.811978816986084, 4.0751142501831055, 6.338249683380127, 8.601385116577148, 10.864521026611328, 13.127655982971191, 15.390790939331055, 17.653926849365234, 19.917062759399414, 22.180198669433594, 24.44333267211914, 26.70646858215332, 28.9696044921875, 31.232738494873047, 33.495872497558594, 35.759010314941406, 38.02214431762695, 40.285282135009766, 42.54841613769531, 44.811553955078125, 47.07468795776367, 49.33782196044922, 51.60095977783203, 53.86409378051758, 56.127227783203125, 58.39036560058594, 60.653499603271484, 62.91663360595703, 65.17977142333984, 67.44290924072266, 69.70603942871094, 71.96917724609375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 9.0, 15.0, 13.0, 24.0, 31.0, 32.0, 73.0, 101.0, 140.0, 216.0, 404.0, 780.0, 1578.0, 3671.0, 10028.0, 34147.0, 149603.0, 500407.0, 264418.0, 57745.0, 15580.0, 5145.0, 2054.0, 1021.0, 496.0, 286.0, 170.0, 103.0, 78.0, 57.0, 41.0, 18.0, 16.0, 6.0, 8.0, 7.0, 8.0, 3.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-42.96875, -41.72998046875, -40.4912109375, -39.25244140625, -38.013671875, -36.77490234375, -35.5361328125, -34.29736328125, -33.05859375, -31.81982421875, -30.5810546875, -29.34228515625, -28.103515625, -26.86474609375, -25.6259765625, -24.38720703125, -23.1484375, -21.90966796875, -20.6708984375, -19.43212890625, -18.193359375, -16.95458984375, -15.7158203125, -14.47705078125, -13.23828125, -11.99951171875, -10.7607421875, -9.52197265625, -8.283203125, -7.04443359375, -5.8056640625, -4.56689453125, -3.328125, -2.08935546875, -0.8505859375, 0.38818359375, 1.626953125, 2.86572265625, 4.1044921875, 5.34326171875, 6.58203125, 7.82080078125, 9.0595703125, 10.29833984375, 11.537109375, 12.77587890625, 14.0146484375, 15.25341796875, 16.4921875, 17.73095703125, 18.9697265625, 20.20849609375, 21.447265625, 22.68603515625, 23.9248046875, 25.16357421875, 26.40234375, 27.64111328125, 28.8798828125, 30.11865234375, 31.357421875, 32.59619140625, 33.8349609375, 35.07373046875, 36.3125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 6.0, 14.0, 12.0, 20.0, 18.0, 23.0, 31.0, 38.0, 40.0, 65.0, 55.0, 58.0, 54.0, 59.0, 60.0, 58.0, 74.0, 44.0, 52.0, 43.0, 30.0, 33.0, 26.0, 17.0, 20.0, 15.0, 10.0, 4.0, 1.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.51171875, -7.26812744140625, -7.0245361328125, -6.78094482421875, -6.537353515625, -6.29376220703125, -6.0501708984375, -5.80657958984375, -5.56298828125, -5.31939697265625, -5.0758056640625, -4.83221435546875, -4.588623046875, -4.34503173828125, -4.1014404296875, -3.85784912109375, -3.6142578125, -3.37066650390625, -3.1270751953125, -2.88348388671875, -2.639892578125, -2.39630126953125, -2.1527099609375, -1.90911865234375, -1.66552734375, -1.42193603515625, -1.1783447265625, -0.93475341796875, -0.691162109375, -0.44757080078125, -0.2039794921875, 0.03961181640625, 0.283203125, 0.52679443359375, 0.7703857421875, 1.01397705078125, 1.257568359375, 1.50115966796875, 1.7447509765625, 1.98834228515625, 2.23193359375, 2.47552490234375, 2.7191162109375, 2.96270751953125, 3.206298828125, 3.44989013671875, 3.6934814453125, 3.93707275390625, 4.1806640625, 4.42425537109375, 4.6678466796875, 4.91143798828125, 5.155029296875, 5.39862060546875, 5.6422119140625, 5.88580322265625, 6.12939453125, 6.37298583984375, 6.6165771484375, 6.86016845703125, 7.103759765625, 7.34735107421875, 7.5909423828125, 7.83453369140625, 8.078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 12.0, 11.0, 12.0, 21.0, 40.0, 47.0, 62.0, 92.0, 135.0, 181.0, 222.0, 330.0, 446.0, 720.0, 1324.0, 2410.0, 5119.0, 11597.0, 29056.0, 88491.0, 320924.0, 403258.0, 119398.0, 37474.0, 14088.0, 5949.0, 2934.0, 1522.0, 826.0, 535.0, 378.0, 290.0, 173.0, 128.0, 104.0, 65.0, 44.0, 46.0, 25.0, 12.0, 14.0, 11.0, 4.0, 5.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.734375, -23.987548828125, -23.24072265625, -22.493896484375, -21.7470703125, -21.000244140625, -20.25341796875, -19.506591796875, -18.759765625, -18.012939453125, -17.26611328125, -16.519287109375, -15.7724609375, -15.025634765625, -14.27880859375, -13.531982421875, -12.78515625, -12.038330078125, -11.29150390625, -10.544677734375, -9.7978515625, -9.051025390625, -8.30419921875, -7.557373046875, -6.810546875, -6.063720703125, -5.31689453125, -4.570068359375, -3.8232421875, -3.076416015625, -2.32958984375, -1.582763671875, -0.8359375, -0.089111328125, 0.65771484375, 1.404541015625, 2.1513671875, 2.898193359375, 3.64501953125, 4.391845703125, 5.138671875, 5.885498046875, 6.63232421875, 7.379150390625, 8.1259765625, 8.872802734375, 9.61962890625, 10.366455078125, 11.11328125, 11.860107421875, 12.60693359375, 13.353759765625, 14.1005859375, 14.847412109375, 15.59423828125, 16.341064453125, 17.087890625, 17.834716796875, 18.58154296875, 19.328369140625, 20.0751953125, 20.822021484375, 21.56884765625, 22.315673828125, 23.0625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 9.0, 9.0, 8.0, 16.0, 25.0, 19.0, 28.0, 26.0, 29.0, 38.0, 48.0, 34.0, 59.0, 40.0, 71.0, 61.0, 54.0, 50.0, 49.0, 41.0, 49.0, 33.0, 30.0, 28.0, 19.0, 24.0, 25.0, 11.0, 7.0, 10.0, 5.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.421875, -27.52490234375, -26.6279296875, -25.73095703125, -24.833984375, -23.93701171875, -23.0400390625, -22.14306640625, -21.24609375, -20.34912109375, -19.4521484375, -18.55517578125, -17.658203125, -16.76123046875, -15.8642578125, -14.96728515625, -14.0703125, -13.17333984375, -12.2763671875, -11.37939453125, -10.482421875, -9.58544921875, -8.6884765625, -7.79150390625, -6.89453125, -5.99755859375, -5.1005859375, -4.20361328125, -3.306640625, -2.40966796875, -1.5126953125, -0.61572265625, 0.28125, 1.17822265625, 2.0751953125, 2.97216796875, 3.869140625, 4.76611328125, 5.6630859375, 6.56005859375, 7.45703125, 8.35400390625, 9.2509765625, 10.14794921875, 11.044921875, 11.94189453125, 12.8388671875, 13.73583984375, 14.6328125, 15.52978515625, 16.4267578125, 17.32373046875, 18.220703125, 19.11767578125, 20.0146484375, 20.91162109375, 21.80859375, 22.70556640625, 23.6025390625, 24.49951171875, 25.396484375, 26.29345703125, 27.1904296875, 28.08740234375, 28.984375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 12.0, 11.0, 19.0, 47.0, 69.0, 109.0, 244.0, 612.0, 1733.0, 7103.0, 53215.0, 536627.0, 403379.0, 37301.0, 5558.0, 1487.0, 514.0, 231.0, 94.0, 64.0, 43.0, 25.0, 10.0, 16.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.765625, -19.165283203125, -18.56494140625, -17.964599609375, -17.3642578125, -16.763916015625, -16.16357421875, -15.563232421875, -14.962890625, -14.362548828125, -13.76220703125, -13.161865234375, -12.5615234375, -11.961181640625, -11.36083984375, -10.760498046875, -10.16015625, -9.559814453125, -8.95947265625, -8.359130859375, -7.7587890625, -7.158447265625, -6.55810546875, -5.957763671875, -5.357421875, -4.757080078125, -4.15673828125, -3.556396484375, -2.9560546875, -2.355712890625, -1.75537109375, -1.155029296875, -0.5546875, 0.045654296875, 0.64599609375, 1.246337890625, 1.8466796875, 2.447021484375, 3.04736328125, 3.647705078125, 4.248046875, 4.848388671875, 5.44873046875, 6.049072265625, 6.6494140625, 7.249755859375, 7.85009765625, 8.450439453125, 9.05078125, 9.651123046875, 10.25146484375, 10.851806640625, 11.4521484375, 12.052490234375, 12.65283203125, 13.253173828125, 13.853515625, 14.453857421875, 15.05419921875, 15.654541015625, 16.2548828125, 16.855224609375, 17.45556640625, 18.055908203125, 18.65625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 17.0, 10.0, 22.0, 31.0, 36.0, 43.0, 54.0, 94.0, 85.0, 113.0, 116.0, 97.0, 68.0, 48.0, 47.0, 22.0, 22.0, 14.0, 18.0, 8.0, 9.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00229644775390625, -0.0022340863943099976, -0.002171725034713745, -0.0021093636751174927, -0.0020470023155212402, -0.001984640955924988, -0.0019222795963287354, -0.001859918236732483, -0.0017975568771362305, -0.001735195517539978, -0.0016728341579437256, -0.0016104727983474731, -0.0015481114387512207, -0.0014857500791549683, -0.0014233887195587158, -0.0013610273599624634, -0.001298666000366211, -0.0012363046407699585, -0.001173943281173706, -0.0011115819215774536, -0.0010492205619812012, -0.0009868592023849487, -0.0009244978427886963, -0.0008621364831924438, -0.0007997751235961914, -0.000737413763999939, -0.0006750524044036865, -0.0006126910448074341, -0.0005503296852111816, -0.0004879683256149292, -0.00042560696601867676, -0.0003632456064224243, -0.0003008842468261719, -0.00023852288722991943, -0.000176161527633667, -0.00011380016803741455, -5.143880844116211e-05, 1.0922551155090332e-05, 7.328391075134277e-05, 0.00013564527034759521, 0.00019800662994384766, 0.0002603679895401001, 0.00032272934913635254, 0.000385090708732605, 0.0004474520683288574, 0.0005098134279251099, 0.0005721747875213623, 0.0006345361471176147, 0.0006968975067138672, 0.0007592588663101196, 0.0008216202259063721, 0.0008839815855026245, 0.000946342945098877, 0.0010087043046951294, 0.0010710656642913818, 0.0011334270238876343, 0.0011957883834838867, 0.0012581497430801392, 0.0013205111026763916, 0.001382872462272644, 0.0014452338218688965, 0.001507595181465149, 0.0015699565410614014, 0.0016323179006576538, 0.0016946792602539062]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 6.0, 15.0, 14.0, 32.0, 56.0, 107.0, 248.0, 603.0, 1883.0, 10689.0, 217064.0, 763655.0, 48082.0, 4312.0, 1037.0, 380.0, 188.0, 73.0, 45.0, 19.0, 19.0, 12.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.46875, -28.63330078125, -27.7978515625, -26.96240234375, -26.126953125, -25.29150390625, -24.4560546875, -23.62060546875, -22.78515625, -21.94970703125, -21.1142578125, -20.27880859375, -19.443359375, -18.60791015625, -17.7724609375, -16.93701171875, -16.1015625, -15.26611328125, -14.4306640625, -13.59521484375, -12.759765625, -11.92431640625, -11.0888671875, -10.25341796875, -9.41796875, -8.58251953125, -7.7470703125, -6.91162109375, -6.076171875, -5.24072265625, -4.4052734375, -3.56982421875, -2.734375, -1.89892578125, -1.0634765625, -0.22802734375, 0.607421875, 1.44287109375, 2.2783203125, 3.11376953125, 3.94921875, 4.78466796875, 5.6201171875, 6.45556640625, 7.291015625, 8.12646484375, 8.9619140625, 9.79736328125, 10.6328125, 11.46826171875, 12.3037109375, 13.13916015625, 13.974609375, 14.81005859375, 15.6455078125, 16.48095703125, 17.31640625, 18.15185546875, 18.9873046875, 19.82275390625, 20.658203125, 21.49365234375, 22.3291015625, 23.16455078125, 24.0]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 12.0, 20.0, 22.0, 36.0, 56.0, 75.0, 88.0, 121.0, 111.0, 121.0, 93.0, 77.0, 40.0, 35.0, 24.0, 21.0, 11.0, 4.0, 3.0, 1.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.015625, -18.542724609375, -18.06982421875, -17.596923828125, -17.1240234375, -16.651123046875, -16.17822265625, -15.705322265625, -15.232421875, -14.759521484375, -14.28662109375, -13.813720703125, -13.3408203125, -12.867919921875, -12.39501953125, -11.922119140625, -11.44921875, -10.976318359375, -10.50341796875, -10.030517578125, -9.5576171875, -9.084716796875, -8.61181640625, -8.138916015625, -7.666015625, -7.193115234375, -6.72021484375, -6.247314453125, -5.7744140625, -5.301513671875, -4.82861328125, -4.355712890625, -3.8828125, -3.409912109375, -2.93701171875, -2.464111328125, -1.9912109375, -1.518310546875, -1.04541015625, -0.572509765625, -0.099609375, 0.373291015625, 0.84619140625, 1.319091796875, 1.7919921875, 2.264892578125, 2.73779296875, 3.210693359375, 3.68359375, 4.156494140625, 4.62939453125, 5.102294921875, 5.5751953125, 6.048095703125, 6.52099609375, 6.993896484375, 7.466796875, 7.939697265625, 8.41259765625, 8.885498046875, 9.3583984375, 9.831298828125, 10.30419921875, 10.777099609375, 11.25]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 13.0, 8.0, 21.0, 26.0, 35.0, 53.0, 64.0, 88.0, 102.0, 102.0, 99.0, 105.0, 85.0, 67.0, 48.0, 22.0, 23.0, 16.0, 13.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.3284454345703, -229.6723175048828, -224.0161895751953, -218.3600616455078, -212.7039337158203, -207.0478057861328, -201.39166259765625, -195.73553466796875, -190.07940673828125, -184.42327880859375, -178.76715087890625, -173.11102294921875, -167.45489501953125, -161.79876708984375, -156.14263916015625, -150.48651123046875, -144.83038330078125, -139.17425537109375, -133.51812744140625, -127.86199951171875, -122.20587158203125, -116.54974365234375, -110.89360809326172, -105.23748016357422, -99.58135223388672, -93.92522430419922, -88.26909637451172, -82.61296081542969, -76.95683288574219, -71.30070495605469, -65.64457702636719, -59.98844909667969, -54.33232116699219, -48.67619323730469, -43.02006530761719, -37.36393356323242, -31.707805633544922, -26.051677703857422, -20.395545959472656, -14.739418029785156, -9.083290100097656, -3.42716121673584, 2.2289676666259766, 7.885097503662109, 13.54122543334961, 19.19735336303711, 24.853485107421875, 30.509613037109375, 36.165740966796875, 41.821868896484375, 47.477996826171875, 53.13412857055664, 58.79025650024414, 64.44638061523438, 70.1025161743164, 75.7586441040039, 81.4147720336914, 87.0708999633789, 92.7270278930664, 98.38316345214844, 104.03929138183594, 109.69541931152344, 115.35154724121094, 121.00767517089844, 126.66380310058594]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 8.0, 5.0, 5.0, 13.0, 13.0, 9.0, 10.0, 25.0, 18.0, 26.0, 30.0, 26.0, 34.0, 44.0, 34.0, 36.0, 39.0, 43.0, 52.0, 49.0, 40.0, 34.0, 46.0, 35.0, 46.0, 37.0, 33.0, 29.0, 39.0, 27.0, 18.0, 12.0, 10.0, 11.0, 14.0, 9.0, 13.0, 7.0, 7.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.31553649902344, -123.28887939453125, -119.2622299194336, -115.2355728149414, -111.20892333984375, -107.18226623535156, -103.15560913085938, -99.12895202636719, -95.10230255126953, -91.07564544677734, -87.04899597167969, -83.0223388671875, -78.99568176269531, -74.96903228759766, -70.94237518310547, -66.91572570800781, -62.889068603515625, -58.8624153137207, -54.83576202392578, -50.809104919433594, -46.78245162963867, -42.75579833984375, -38.72914123535156, -34.70248794555664, -30.67583465576172, -26.649181365966797, -22.622526168823242, -18.595870971679688, -14.569217681884766, -10.542564392089844, -6.515909194946289, -2.4892539978027344, 1.5373992919921875, 5.564053535461426, 9.590707778930664, 13.617362022399902, 17.64401626586914, 21.670669555664062, 25.697324752807617, 29.723979949951172, 33.750633239746094, 37.777286529541016, 41.80393981933594, 45.830596923828125, 49.85725021362305, 53.88390350341797, 57.910560607910156, 61.93721389770508, 65.9638671875, 69.99052429199219, 74.01717376708984, 78.04383087158203, 82.07048034667969, 86.09713745117188, 90.12379455566406, 94.15045166015625, 98.1771011352539, 102.2037582397461, 106.23040771484375, 110.25706481933594, 114.28372192382812, 118.31037139892578, 122.33702850341797, 126.36367797851562, 130.3903350830078]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 10.0, 11.0, 15.0, 16.0, 32.0, 35.0, 57.0, 58.0, 126.0, 147.0, 241.0, 415.0, 772.0, 1791.0, 4352.0, 13796.0, 106406.0, 4020231.0, 32475.0, 7768.0, 2773.0, 1191.0, 582.0, 332.0, 192.0, 129.0, 106.0, 68.0, 35.0, 27.0, 20.0, 21.0, 15.0, 11.0, 11.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-106.25, -103.611328125, -100.97265625, -98.333984375, -95.6953125, -93.056640625, -90.41796875, -87.779296875, -85.140625, -82.501953125, -79.86328125, -77.224609375, -74.5859375, -71.947265625, -69.30859375, -66.669921875, -64.03125, -61.392578125, -58.75390625, -56.115234375, -53.4765625, -50.837890625, -48.19921875, -45.560546875, -42.921875, -40.283203125, -37.64453125, -35.005859375, -32.3671875, -29.728515625, -27.08984375, -24.451171875, -21.8125, -19.173828125, -16.53515625, -13.896484375, -11.2578125, -8.619140625, -5.98046875, -3.341796875, -0.703125, 1.935546875, 4.57421875, 7.212890625, 9.8515625, 12.490234375, 15.12890625, 17.767578125, 20.40625, 23.044921875, 25.68359375, 28.322265625, 30.9609375, 33.599609375, 36.23828125, 38.876953125, 41.515625, 44.154296875, 46.79296875, 49.431640625, 52.0703125, 54.708984375, 57.34765625, 59.986328125, 62.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 2.0, 3.0, 7.0, 19.0, 10.0, 18.0, 24.0, 25.0, 28.0, 37.0, 44.0, 43.0, 41.0, 31.0, 49.0, 59.0, 49.0, 67.0, 55.0, 59.0, 55.0, 54.0, 41.0, 39.0, 39.0, 25.0, 13.0, 10.0, 10.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.1796875, -7.921142578125, -7.66259765625, -7.404052734375, -7.1455078125, -6.886962890625, -6.62841796875, -6.369873046875, -6.111328125, -5.852783203125, -5.59423828125, -5.335693359375, -5.0771484375, -4.818603515625, -4.56005859375, -4.301513671875, -4.04296875, -3.784423828125, -3.52587890625, -3.267333984375, -3.0087890625, -2.750244140625, -2.49169921875, -2.233154296875, -1.974609375, -1.716064453125, -1.45751953125, -1.198974609375, -0.9404296875, -0.681884765625, -0.42333984375, -0.164794921875, 0.09375, 0.352294921875, 0.61083984375, 0.869384765625, 1.1279296875, 1.386474609375, 1.64501953125, 1.903564453125, 2.162109375, 2.420654296875, 2.67919921875, 2.937744140625, 3.1962890625, 3.454833984375, 3.71337890625, 3.971923828125, 4.23046875, 4.489013671875, 4.74755859375, 5.006103515625, 5.2646484375, 5.523193359375, 5.78173828125, 6.040283203125, 6.298828125, 6.557373046875, 6.81591796875, 7.074462890625, 7.3330078125, 7.591552734375, 7.85009765625, 8.108642578125, 8.3671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 8.0, 15.0, 29.0, 47.0, 86.0, 144.0, 243.0, 398.0, 769.0, 1257.0, 2575.0, 5422.0, 13504.0, 50659.0, 3791144.0, 280432.0, 29681.0, 9546.0, 4070.0, 1945.0, 1044.0, 562.0, 302.0, 183.0, 83.0, 51.0, 39.0, 26.0, 15.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.75, -51.3916015625, -50.033203125, -48.6748046875, -47.31640625, -45.9580078125, -44.599609375, -43.2412109375, -41.8828125, -40.5244140625, -39.166015625, -37.8076171875, -36.44921875, -35.0908203125, -33.732421875, -32.3740234375, -31.015625, -29.6572265625, -28.298828125, -26.9404296875, -25.58203125, -24.2236328125, -22.865234375, -21.5068359375, -20.1484375, -18.7900390625, -17.431640625, -16.0732421875, -14.71484375, -13.3564453125, -11.998046875, -10.6396484375, -9.28125, -7.9228515625, -6.564453125, -5.2060546875, -3.84765625, -2.4892578125, -1.130859375, 0.2275390625, 1.5859375, 2.9443359375, 4.302734375, 5.6611328125, 7.01953125, 8.3779296875, 9.736328125, 11.0947265625, 12.453125, 13.8115234375, 15.169921875, 16.5283203125, 17.88671875, 19.2451171875, 20.603515625, 21.9619140625, 23.3203125, 24.6787109375, 26.037109375, 27.3955078125, 28.75390625, 30.1123046875, 31.470703125, 32.8291015625, 34.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 6.0, 17.0, 18.0, 23.0, 23.0, 63.0, 106.0, 260.0, 3008.0, 286.0, 96.0, 58.0, 18.0, 11.0, 12.0, 7.0, 6.0, 6.0, 7.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4140625, -7.2052001953125, -6.996337890625, -6.7874755859375, -6.57861328125, -6.3697509765625, -6.160888671875, -5.9520263671875, -5.7431640625, -5.5343017578125, -5.325439453125, -5.1165771484375, -4.90771484375, -4.6988525390625, -4.489990234375, -4.2811279296875, -4.072265625, -3.8634033203125, -3.654541015625, -3.4456787109375, -3.23681640625, -3.0279541015625, -2.819091796875, -2.6102294921875, -2.4013671875, -2.1925048828125, -1.983642578125, -1.7747802734375, -1.56591796875, -1.3570556640625, -1.148193359375, -0.9393310546875, -0.73046875, -0.5216064453125, -0.312744140625, -0.1038818359375, 0.10498046875, 0.3138427734375, 0.522705078125, 0.7315673828125, 0.9404296875, 1.1492919921875, 1.358154296875, 1.5670166015625, 1.77587890625, 1.9847412109375, 2.193603515625, 2.4024658203125, 2.611328125, 2.8201904296875, 3.029052734375, 3.2379150390625, 3.44677734375, 3.6556396484375, 3.864501953125, 4.0733642578125, 4.2822265625, 4.4910888671875, 4.699951171875, 4.9088134765625, 5.11767578125, 5.3265380859375, 5.535400390625, 5.7442626953125, 5.953125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 2.0, 4.0, 10.0, 14.0, 12.0, 21.0, 24.0, 40.0, 55.0, 70.0, 93.0, 104.0, 115.0, 112.0, 89.0, 79.0, 48.0, 41.0, 23.0, 15.0, 9.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.55391311645508, -39.42695999145508, -38.30000305175781, -37.17304992675781, -36.04609680175781, -34.91913986206055, -33.79218673706055, -32.66522979736328, -31.53827667236328, -30.41132164001465, -29.284366607666016, -28.157413482666016, -27.030458450317383, -25.90350341796875, -24.77655029296875, -23.649595260620117, -22.522640228271484, -21.39568519592285, -20.26873016357422, -19.14177703857422, -18.014822006225586, -16.887866973876953, -15.760912895202637, -14.63395881652832, -13.507003784179688, -12.380048751831055, -11.253094673156738, -10.126140594482422, -8.999185562133789, -7.8722310066223145, -6.74527645111084, -5.618321895599365, -4.491367340087891, -3.364412784576416, -2.2374582290649414, -1.1105036735534668, 0.016450881958007812, 1.1434054374694824, 2.270359992980957, 3.3973145484924316, 4.524269104003906, 5.651223659515381, 6.7781782150268555, 7.90513277053833, 9.032087326049805, 10.159042358398438, 11.285996437072754, 12.41295051574707, 13.539905548095703, 14.666860580444336, 15.793814659118652, 16.92076873779297, 18.0477237701416, 19.174678802490234, 20.301631927490234, 21.428586959838867, 22.5555419921875, 23.682497024536133, 24.809452056884766, 25.936405181884766, 27.0633602142334, 28.19031524658203, 29.31726837158203, 30.444223403930664, 31.571178436279297]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 19.0, 23.0, 21.0, 23.0, 12.0, 22.0, 32.0, 30.0, 31.0, 26.0, 33.0, 34.0, 38.0, 27.0, 41.0, 36.0, 35.0, 48.0, 37.0, 35.0, 43.0, 45.0, 38.0, 27.0, 39.0, 31.0, 30.0, 22.0, 23.0, 20.0, 10.0, 12.0, 10.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.270694732666016, -24.47759246826172, -23.684490203857422, -22.891387939453125, -22.098285675048828, -21.30518341064453, -20.512081146240234, -19.718978881835938, -18.92587661743164, -18.132774353027344, -17.339672088623047, -16.54656982421875, -15.753467559814453, -14.960365295410156, -14.167262077331543, -13.374159812927246, -12.581056594848633, -11.787954330444336, -10.994852066040039, -10.201749801635742, -9.408647537231445, -8.615545272827148, -7.822442054748535, -7.029339790344238, -6.236237525939941, -5.4431352615356445, -4.650032997131348, -3.8569302558898926, -3.0638279914855957, -2.270725727081299, -1.4776229858398438, -0.6845207214355469, 0.10858154296875, 0.9016839265823364, 1.6947863101959229, 2.487888813018799, 3.2809910774230957, 4.074093341827393, 4.867196083068848, 5.6602983474731445, 6.453400611877441, 7.246502876281738, 8.039605140686035, 8.832708358764648, 9.625810623168945, 10.418912887573242, 11.212015151977539, 12.005117416381836, 12.798219680786133, 13.59132194519043, 14.384424209594727, 15.177526473999023, 15.97062873840332, 16.763731002807617, 17.556835174560547, 18.349937438964844, 19.14303970336914, 19.936141967773438, 20.729244232177734, 21.52234649658203, 22.315448760986328, 23.108551025390625, 23.901653289794922, 24.69475555419922, 25.487857818603516]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 4.0, 6.0, 7.0, 4.0, 10.0, 12.0, 21.0, 35.0, 64.0, 69.0, 132.0, 179.0, 310.0, 595.0, 1216.0, 2852.0, 7145.0, 21009.0, 67947.0, 226928.0, 430164.0, 200170.0, 59791.0, 18445.0, 6373.0, 2520.0, 1167.0, 554.0, 321.0, 184.0, 103.0, 66.0, 58.0, 19.0, 22.0, 19.0, 12.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.71875, -29.77197265625, -28.8251953125, -27.87841796875, -26.931640625, -25.98486328125, -25.0380859375, -24.09130859375, -23.14453125, -22.19775390625, -21.2509765625, -20.30419921875, -19.357421875, -18.41064453125, -17.4638671875, -16.51708984375, -15.5703125, -14.62353515625, -13.6767578125, -12.72998046875, -11.783203125, -10.83642578125, -9.8896484375, -8.94287109375, -7.99609375, -7.04931640625, -6.1025390625, -5.15576171875, -4.208984375, -3.26220703125, -2.3154296875, -1.36865234375, -0.421875, 0.52490234375, 1.4716796875, 2.41845703125, 3.365234375, 4.31201171875, 5.2587890625, 6.20556640625, 7.15234375, 8.09912109375, 9.0458984375, 9.99267578125, 10.939453125, 11.88623046875, 12.8330078125, 13.77978515625, 14.7265625, 15.67333984375, 16.6201171875, 17.56689453125, 18.513671875, 19.46044921875, 20.4072265625, 21.35400390625, 22.30078125, 23.24755859375, 24.1943359375, 25.14111328125, 26.087890625, 27.03466796875, 27.9814453125, 28.92822265625, 29.875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 2.0, 5.0, 8.0, 8.0, 9.0, 16.0, 15.0, 12.0, 22.0, 19.0, 38.0, 29.0, 31.0, 31.0, 41.0, 52.0, 40.0, 47.0, 37.0, 48.0, 52.0, 35.0, 49.0, 47.0, 48.0, 36.0, 46.0, 42.0, 28.0, 22.0, 22.0, 19.0, 7.0, 9.0, 5.0, 4.0, 4.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.34326171875, -8.0693359375, -7.79541015625, -7.521484375, -7.24755859375, -6.9736328125, -6.69970703125, -6.42578125, -6.15185546875, -5.8779296875, -5.60400390625, -5.330078125, -5.05615234375, -4.7822265625, -4.50830078125, -4.234375, -3.96044921875, -3.6865234375, -3.41259765625, -3.138671875, -2.86474609375, -2.5908203125, -2.31689453125, -2.04296875, -1.76904296875, -1.4951171875, -1.22119140625, -0.947265625, -0.67333984375, -0.3994140625, -0.12548828125, 0.1484375, 0.42236328125, 0.6962890625, 0.97021484375, 1.244140625, 1.51806640625, 1.7919921875, 2.06591796875, 2.33984375, 2.61376953125, 2.8876953125, 3.16162109375, 3.435546875, 3.70947265625, 3.9833984375, 4.25732421875, 4.53125, 4.80517578125, 5.0791015625, 5.35302734375, 5.626953125, 5.90087890625, 6.1748046875, 6.44873046875, 6.72265625, 6.99658203125, 7.2705078125, 7.54443359375, 7.818359375, 8.09228515625, 8.3662109375, 8.64013671875, 8.9140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 14.0, 25.0, 55.0, 110.0, 209.0, 464.0, 977.0, 2512.0, 18545.0, 562776.0, 443551.0, 15174.0, 2362.0, 938.0, 446.0, 199.0, 87.0, 49.0, 22.0, 9.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.28125, -56.03662109375, -53.7919921875, -51.54736328125, -49.302734375, -47.05810546875, -44.8134765625, -42.56884765625, -40.32421875, -38.07958984375, -35.8349609375, -33.59033203125, -31.345703125, -29.10107421875, -26.8564453125, -24.61181640625, -22.3671875, -20.12255859375, -17.8779296875, -15.63330078125, -13.388671875, -11.14404296875, -8.8994140625, -6.65478515625, -4.41015625, -2.16552734375, 0.0791015625, 2.32373046875, 4.568359375, 6.81298828125, 9.0576171875, 11.30224609375, 13.546875, 15.79150390625, 18.0361328125, 20.28076171875, 22.525390625, 24.77001953125, 27.0146484375, 29.25927734375, 31.50390625, 33.74853515625, 35.9931640625, 38.23779296875, 40.482421875, 42.72705078125, 44.9716796875, 47.21630859375, 49.4609375, 51.70556640625, 53.9501953125, 56.19482421875, 58.439453125, 60.68408203125, 62.9287109375, 65.17333984375, 67.41796875, 69.66259765625, 71.9072265625, 74.15185546875, 76.396484375, 78.64111328125, 80.8857421875, 83.13037109375, 85.375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 10.0, 13.0, 30.0, 44.0, 60.0, 77.0, 101.0, 98.0, 114.0, 118.0, 112.0, 76.0, 52.0, 39.0, 30.0, 22.0, 9.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.625, -107.6796875, -104.734375, -101.7890625, -98.84375, -95.8984375, -92.953125, -90.0078125, -87.0625, -84.1171875, -81.171875, -78.2265625, -75.28125, -72.3359375, -69.390625, -66.4453125, -63.5, -60.5546875, -57.609375, -54.6640625, -51.71875, -48.7734375, -45.828125, -42.8828125, -39.9375, -36.9921875, -34.046875, -31.1015625, -28.15625, -25.2109375, -22.265625, -19.3203125, -16.375, -13.4296875, -10.484375, -7.5390625, -4.59375, -1.6484375, 1.296875, 4.2421875, 7.1875, 10.1328125, 13.078125, 16.0234375, 18.96875, 21.9140625, 24.859375, 27.8046875, 30.75, 33.6953125, 36.640625, 39.5859375, 42.53125, 45.4765625, 48.421875, 51.3671875, 54.3125, 57.2578125, 60.203125, 63.1484375, 66.09375, 69.0390625, 71.984375, 74.9296875, 77.875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 7.0, 9.0, 7.0, 15.0, 20.0, 44.0, 33.0, 62.0, 102.0, 148.0, 219.0, 473.0, 1057.0, 2538.0, 8309.0, 54343.0, 775019.0, 182709.0, 16536.0, 3967.0, 1442.0, 615.0, 348.0, 169.0, 121.0, 65.0, 52.0, 30.0, 26.0, 15.0, 16.0, 8.0, 8.0, 5.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.6875, -29.803466796875, -28.91943359375, -28.035400390625, -27.1513671875, -26.267333984375, -25.38330078125, -24.499267578125, -23.615234375, -22.731201171875, -21.84716796875, -20.963134765625, -20.0791015625, -19.195068359375, -18.31103515625, -17.427001953125, -16.54296875, -15.658935546875, -14.77490234375, -13.890869140625, -13.0068359375, -12.122802734375, -11.23876953125, -10.354736328125, -9.470703125, -8.586669921875, -7.70263671875, -6.818603515625, -5.9345703125, -5.050537109375, -4.16650390625, -3.282470703125, -2.3984375, -1.514404296875, -0.63037109375, 0.253662109375, 1.1376953125, 2.021728515625, 2.90576171875, 3.789794921875, 4.673828125, 5.557861328125, 6.44189453125, 7.325927734375, 8.2099609375, 9.093994140625, 9.97802734375, 10.862060546875, 11.74609375, 12.630126953125, 13.51416015625, 14.398193359375, 15.2822265625, 16.166259765625, 17.05029296875, 17.934326171875, 18.818359375, 19.702392578125, 20.58642578125, 21.470458984375, 22.3544921875, 23.238525390625, 24.12255859375, 25.006591796875, 25.890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 5.0, 6.0, 6.0, 7.0, 15.0, 24.0, 36.0, 64.0, 75.0, 118.0, 148.0, 126.0, 108.0, 87.0, 56.0, 32.0, 20.0, 19.0, 12.0, 8.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.003002166748046875, -0.0029165446758270264, -0.0028309226036071777, -0.002745300531387329, -0.0026596784591674805, -0.002574056386947632, -0.002488434314727783, -0.0024028122425079346, -0.002317190170288086, -0.0022315680980682373, -0.0021459460258483887, -0.00206032395362854, -0.0019747018814086914, -0.0018890798091888428, -0.0018034577369689941, -0.0017178356647491455, -0.0016322135925292969, -0.0015465915203094482, -0.0014609694480895996, -0.001375347375869751, -0.0012897253036499023, -0.0012041032314300537, -0.001118481159210205, -0.0010328590869903564, -0.0009472370147705078, -0.0008616149425506592, -0.0007759928703308105, -0.0006903707981109619, -0.0006047487258911133, -0.0005191266536712646, -0.000433504581451416, -0.0003478825092315674, -0.00026226043701171875, -0.00017663836479187012, -9.101629257202148e-05, -5.3942203521728516e-06, 8.022785186767578e-05, 0.00016584992408752441, 0.00025147199630737305, 0.0003370940685272217, 0.0004227161407470703, 0.0005083382129669189, 0.0005939602851867676, 0.0006795823574066162, 0.0007652044296264648, 0.0008508265018463135, 0.0009364485740661621, 0.0010220706462860107, 0.0011076927185058594, 0.001193314790725708, 0.0012789368629455566, 0.0013645589351654053, 0.001450181007385254, 0.0015358030796051025, 0.0016214251518249512, 0.0017070472240447998, 0.0017926692962646484, 0.001878291368484497, 0.0019639134407043457, 0.0020495355129241943, 0.002135157585144043, 0.0022207796573638916, 0.0023064017295837402, 0.002392023801803589, 0.0024776458740234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 3.0, 9.0, 7.0, 14.0, 13.0, 24.0, 44.0, 68.0, 116.0, 214.0, 567.0, 1869.0, 8555.0, 154911.0, 852601.0, 24143.0, 3608.0, 1005.0, 352.0, 162.0, 89.0, 46.0, 32.0, 25.0, 20.0, 18.0, 6.0, 6.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -43.267578125, -42.00390625, -40.740234375, -39.4765625, -38.212890625, -36.94921875, -35.685546875, -34.421875, -33.158203125, -31.89453125, -30.630859375, -29.3671875, -28.103515625, -26.83984375, -25.576171875, -24.3125, -23.048828125, -21.78515625, -20.521484375, -19.2578125, -17.994140625, -16.73046875, -15.466796875, -14.203125, -12.939453125, -11.67578125, -10.412109375, -9.1484375, -7.884765625, -6.62109375, -5.357421875, -4.09375, -2.830078125, -1.56640625, -0.302734375, 0.9609375, 2.224609375, 3.48828125, 4.751953125, 6.015625, 7.279296875, 8.54296875, 9.806640625, 11.0703125, 12.333984375, 13.59765625, 14.861328125, 16.125, 17.388671875, 18.65234375, 19.916015625, 21.1796875, 22.443359375, 23.70703125, 24.970703125, 26.234375, 27.498046875, 28.76171875, 30.025390625, 31.2890625, 32.552734375, 33.81640625, 35.080078125, 36.34375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 25.0, 57.0, 129.0, 272.0, 260.0, 129.0, 51.0, 25.0, 18.0, 10.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.78125, -27.34130859375, -25.9013671875, -24.46142578125, -23.021484375, -21.58154296875, -20.1416015625, -18.70166015625, -17.26171875, -15.82177734375, -14.3818359375, -12.94189453125, -11.501953125, -10.06201171875, -8.6220703125, -7.18212890625, -5.7421875, -4.30224609375, -2.8623046875, -1.42236328125, 0.017578125, 1.45751953125, 2.8974609375, 4.33740234375, 5.77734375, 7.21728515625, 8.6572265625, 10.09716796875, 11.537109375, 12.97705078125, 14.4169921875, 15.85693359375, 17.296875, 18.73681640625, 20.1767578125, 21.61669921875, 23.056640625, 24.49658203125, 25.9365234375, 27.37646484375, 28.81640625, 30.25634765625, 31.6962890625, 33.13623046875, 34.576171875, 36.01611328125, 37.4560546875, 38.89599609375, 40.3359375, 41.77587890625, 43.2158203125, 44.65576171875, 46.095703125, 47.53564453125, 48.9755859375, 50.41552734375, 51.85546875, 53.29541015625, 54.7353515625, 56.17529296875, 57.615234375, 59.05517578125, 60.4951171875, 61.93505859375, 63.375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 12.0, 26.0, 39.0, 64.0, 79.0, 141.0, 136.0, 135.0, 111.0, 79.0, 63.0, 46.0, 28.0, 16.0, 9.0, 5.0, 5.0, 3.0], "bins": [-508.4969787597656, -498.9168395996094, -489.33673095703125, -479.756591796875, -470.17645263671875, -460.5963439941406, -451.0162048339844, -441.43609619140625, -431.85595703125, -422.27581787109375, -412.6957092285156, -403.1155700683594, -393.53546142578125, -383.955322265625, -374.37518310546875, -364.7950439453125, -355.2149353027344, -345.6347961425781, -336.0546875, -326.47454833984375, -316.8944091796875, -307.3143005371094, -297.7341613769531, -288.154052734375, -278.57391357421875, -268.9937744140625, -259.4136657714844, -249.83352661132812, -240.25340270996094, -230.67327880859375, -221.0931396484375, -211.5130157470703, -201.93287658691406, -192.35275268554688, -182.77261352539062, -173.19248962402344, -163.61236572265625, -154.03224182128906, -144.45211791992188, -134.87197875976562, -125.29185485839844, -115.71173095703125, -106.13159942626953, -96.55146789550781, -86.97134399414062, -77.39122009277344, -67.81108856201172, -58.23095703125, -48.65083312988281, -39.07070541381836, -29.490577697753906, -19.910449981689453, -10.330322265625, -0.7501945495605469, 8.829933166503906, 18.410064697265625, 27.990188598632812, 37.570316314697266, 47.15044403076172, 56.73057174682617, 66.31069946289062, 75.89082336425781, 85.47095489501953, 95.05108642578125, 104.63121032714844]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 11.0, 6.0, 14.0, 22.0, 25.0, 18.0, 22.0, 28.0, 31.0, 44.0, 33.0, 41.0, 48.0, 48.0, 48.0, 56.0, 48.0, 48.0, 46.0, 40.0, 47.0, 34.0, 42.0, 28.0, 26.0, 24.0, 21.0, 20.0, 20.0, 14.0, 12.0, 7.0, 7.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-222.62237548828125, -215.91629028320312, -209.210205078125, -202.50411987304688, -195.7980499267578, -189.0919647216797, -182.38587951660156, -175.67979431152344, -168.97372436523438, -162.26763916015625, -155.56155395507812, -148.85546875, -142.14939880371094, -135.4433135986328, -128.7372283935547, -122.03114318847656, -115.32505798339844, -108.61897277832031, -101.91289520263672, -95.2068099975586, -88.500732421875, -81.79464721679688, -75.08856201171875, -68.38247680664062, -61.67639923095703, -54.97031784057617, -48.26423645019531, -41.55815124511719, -34.85206985473633, -28.14598846435547, -21.439903259277344, -14.733821868896484, -8.027740478515625, -1.3216581344604492, 5.384424209594727, 12.090507507324219, 18.796588897705078, 25.502670288085938, 32.20875549316406, 38.91483688354492, 45.62091827392578, 52.32699966430664, 59.0330810546875, 65.73916625976562, 72.44525146484375, 79.15132904052734, 85.85741424560547, 92.56349182128906, 99.26957702636719, 105.97566223144531, 112.6817398071289, 119.38782501220703, 126.09390258789062, 132.79998779296875, 139.50607299804688, 146.212158203125, 152.91824340820312, 159.62432861328125, 166.33041381835938, 173.0364990234375, 179.74256896972656, 186.4486541748047, 193.1547393798828, 199.86082458496094, 206.56689453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 7.0, 9.0, 6.0, 12.0, 19.0, 31.0, 48.0, 51.0, 87.0, 109.0, 187.0, 348.0, 595.0, 1204.0, 2508.0, 6710.0, 25521.0, 3249366.0, 870753.0, 24844.0, 6616.0, 2555.0, 1210.0, 574.0, 321.0, 204.0, 123.0, 77.0, 45.0, 43.0, 32.0, 15.0, 20.0, 12.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-75.8125, -73.76318359375, -71.7138671875, -69.66455078125, -67.615234375, -65.56591796875, -63.5166015625, -61.46728515625, -59.41796875, -57.36865234375, -55.3193359375, -53.27001953125, -51.220703125, -49.17138671875, -47.1220703125, -45.07275390625, -43.0234375, -40.97412109375, -38.9248046875, -36.87548828125, -34.826171875, -32.77685546875, -30.7275390625, -28.67822265625, -26.62890625, -24.57958984375, -22.5302734375, -20.48095703125, -18.431640625, -16.38232421875, -14.3330078125, -12.28369140625, -10.234375, -8.18505859375, -6.1357421875, -4.08642578125, -2.037109375, 0.01220703125, 2.0615234375, 4.11083984375, 6.16015625, 8.20947265625, 10.2587890625, 12.30810546875, 14.357421875, 16.40673828125, 18.4560546875, 20.50537109375, 22.5546875, 24.60400390625, 26.6533203125, 28.70263671875, 30.751953125, 32.80126953125, 34.8505859375, 36.89990234375, 38.94921875, 40.99853515625, 43.0478515625, 45.09716796875, 47.146484375, 49.19580078125, 51.2451171875, 53.29443359375, 55.34375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 2.0, 10.0, 9.0, 12.0, 19.0, 21.0, 26.0, 32.0, 20.0, 37.0, 32.0, 46.0, 46.0, 37.0, 46.0, 56.0, 55.0, 47.0, 64.0, 45.0, 41.0, 52.0, 46.0, 28.0, 28.0, 31.0, 28.0, 23.0, 15.0, 10.0, 7.0, 7.0, 5.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.2265625, -8.934814453125, -8.64306640625, -8.351318359375, -8.0595703125, -7.767822265625, -7.47607421875, -7.184326171875, -6.892578125, -6.600830078125, -6.30908203125, -6.017333984375, -5.7255859375, -5.433837890625, -5.14208984375, -4.850341796875, -4.55859375, -4.266845703125, -3.97509765625, -3.683349609375, -3.3916015625, -3.099853515625, -2.80810546875, -2.516357421875, -2.224609375, -1.932861328125, -1.64111328125, -1.349365234375, -1.0576171875, -0.765869140625, -0.47412109375, -0.182373046875, 0.109375, 0.401123046875, 0.69287109375, 0.984619140625, 1.2763671875, 1.568115234375, 1.85986328125, 2.151611328125, 2.443359375, 2.735107421875, 3.02685546875, 3.318603515625, 3.6103515625, 3.902099609375, 4.19384765625, 4.485595703125, 4.77734375, 5.069091796875, 5.36083984375, 5.652587890625, 5.9443359375, 6.236083984375, 6.52783203125, 6.819580078125, 7.111328125, 7.403076171875, 7.69482421875, 7.986572265625, 8.2783203125, 8.570068359375, 8.86181640625, 9.153564453125, 9.4453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 5.0, 7.0, 12.0, 19.0, 14.0, 21.0, 26.0, 33.0, 54.0, 90.0, 167.0, 248.0, 512.0, 1264.0, 3257.0, 10300.0, 61218.0, 3998428.0, 98831.0, 13069.0, 3915.0, 1393.0, 586.0, 292.0, 140.0, 115.0, 47.0, 42.0, 40.0, 21.0, 14.0, 18.0, 11.0, 18.0, 7.0, 12.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.09375, -55.22705078125, -53.3603515625, -51.49365234375, -49.626953125, -47.76025390625, -45.8935546875, -44.02685546875, -42.16015625, -40.29345703125, -38.4267578125, -36.56005859375, -34.693359375, -32.82666015625, -30.9599609375, -29.09326171875, -27.2265625, -25.35986328125, -23.4931640625, -21.62646484375, -19.759765625, -17.89306640625, -16.0263671875, -14.15966796875, -12.29296875, -10.42626953125, -8.5595703125, -6.69287109375, -4.826171875, -2.95947265625, -1.0927734375, 0.77392578125, 2.640625, 4.50732421875, 6.3740234375, 8.24072265625, 10.107421875, 11.97412109375, 13.8408203125, 15.70751953125, 17.57421875, 19.44091796875, 21.3076171875, 23.17431640625, 25.041015625, 26.90771484375, 28.7744140625, 30.64111328125, 32.5078125, 34.37451171875, 36.2412109375, 38.10791015625, 39.974609375, 41.84130859375, 43.7080078125, 45.57470703125, 47.44140625, 49.30810546875, 51.1748046875, 53.04150390625, 54.908203125, 56.77490234375, 58.6416015625, 60.50830078125, 62.375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 6.0, 14.0, 13.0, 18.0, 22.0, 51.0, 117.0, 448.0, 3049.0, 188.0, 71.0, 30.0, 16.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.74468994140625, -6.3526611328125, -5.96063232421875, -5.568603515625, -5.17657470703125, -4.7845458984375, -4.39251708984375, -4.00048828125, -3.60845947265625, -3.2164306640625, -2.82440185546875, -2.432373046875, -2.04034423828125, -1.6483154296875, -1.25628662109375, -0.8642578125, -0.47222900390625, -0.0802001953125, 0.31182861328125, 0.703857421875, 1.09588623046875, 1.4879150390625, 1.87994384765625, 2.27197265625, 2.66400146484375, 3.0560302734375, 3.44805908203125, 3.840087890625, 4.23211669921875, 4.6241455078125, 5.01617431640625, 5.408203125, 5.80023193359375, 6.1922607421875, 6.58428955078125, 6.976318359375, 7.36834716796875, 7.7603759765625, 8.15240478515625, 8.54443359375, 8.93646240234375, 9.3284912109375, 9.72052001953125, 10.112548828125, 10.50457763671875, 10.8966064453125, 11.28863525390625, 11.6806640625, 12.07269287109375, 12.4647216796875, 12.85675048828125, 13.248779296875, 13.64080810546875, 14.0328369140625, 14.42486572265625, 14.81689453125, 15.20892333984375, 15.6009521484375, 15.99298095703125, 16.385009765625, 16.77703857421875, 17.1690673828125, 17.56109619140625, 17.953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 19.0, 21.0, 32.0, 70.0, 101.0, 149.0, 154.0, 131.0, 121.0, 73.0, 61.0, 26.0, 17.0, 13.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-89.9949722290039, -88.09232330322266, -86.1896743774414, -84.28702545166016, -82.3843765258789, -80.48172760009766, -78.5790786743164, -76.67642974853516, -74.7737808227539, -72.87113189697266, -70.9684829711914, -69.06583404541016, -67.1631851196289, -65.26053619384766, -63.357887268066406, -61.455238342285156, -59.55258560180664, -57.64993667602539, -55.74728775024414, -53.84463882446289, -51.94198989868164, -50.03934097290039, -48.136688232421875, -46.234039306640625, -44.331390380859375, -42.428741455078125, -40.526092529296875, -38.623443603515625, -36.720794677734375, -34.818145751953125, -32.915496826171875, -31.012845993041992, -29.11020278930664, -27.20755386352539, -25.30490493774414, -23.40225601196289, -21.49960708618164, -19.59695816040039, -17.694307327270508, -15.791658401489258, -13.889009475708008, -11.986360549926758, -10.083711624145508, -8.181061744689941, -6.278412818908691, -4.375763893127441, -2.473114013671875, -0.570465087890625, 1.332183837890625, 3.234833002090454, 5.137482166290283, 7.040131568908691, 8.942780494689941, 10.845429420471191, 12.748079299926758, 14.650728225708008, 16.553377151489258, 18.456026077270508, 20.358675003051758, 22.26132583618164, 24.16397476196289, 26.06662368774414, 27.96927261352539, 29.87192153930664, 31.77457046508789]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 8.0, 7.0, 10.0, 8.0, 10.0, 11.0, 24.0, 22.0, 26.0, 35.0, 41.0, 45.0, 49.0, 55.0, 37.0, 39.0, 45.0, 50.0, 45.0, 37.0, 46.0, 38.0, 47.0, 35.0, 35.0, 28.0, 23.0, 30.0, 14.0, 16.0, 19.0, 15.0, 18.0, 7.0, 8.0, 9.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.405664443969727, -25.60245704650879, -24.79924774169922, -23.99604034423828, -23.19283103942871, -22.389623641967773, -21.586414337158203, -20.783206939697266, -19.979997634887695, -19.176790237426758, -18.373580932617188, -17.57037353515625, -16.76716423034668, -15.963956832885742, -15.160747528076172, -14.357540130615234, -13.55433177947998, -12.751123428344727, -11.947915077209473, -11.144706726074219, -10.341498374938965, -9.538290023803711, -8.735082626342773, -7.931873798370361, -7.128665447235107, -6.3254570960998535, -5.5222487449646, -4.719040870666504, -3.915832281112671, -3.112624168395996, -2.309415817260742, -1.5062074661254883, -0.7029991149902344, 0.10020917654037476, 0.9034174680709839, 1.7066256999969482, 2.509834051132202, 3.313042163848877, 4.116250514984131, 4.919458866119385, 5.722667217254639, 6.525875568389893, 7.3290839195251465, 8.132291793823242, 8.935500144958496, 9.73870849609375, 10.541916847229004, 11.345125198364258, 12.148333549499512, 12.951541900634766, 13.75475025177002, 14.557958602905273, 15.361166954040527, 16.16437530517578, 16.96758270263672, 17.77079200744629, 18.573999404907227, 19.377206802368164, 20.180416107177734, 20.983623504638672, 21.786832809448242, 22.59004020690918, 23.39324951171875, 24.196456909179688, 24.999666213989258]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 11.0, 10.0, 13.0, 29.0, 30.0, 72.0, 142.0, 280.0, 552.0, 1234.0, 3571.0, 11198.0, 42035.0, 168499.0, 470327.0, 259883.0, 65539.0, 17063.0, 4869.0, 1750.0, 705.0, 331.0, 188.0, 98.0, 52.0, 27.0, 21.0, 5.0, 8.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.578125, -27.703125, -26.828125, -25.953125, -25.078125, -24.203125, -23.328125, -22.453125, -21.578125, -20.703125, -19.828125, -18.953125, -18.078125, -17.203125, -16.328125, -15.453125, -14.578125, -13.703125, -12.828125, -11.953125, -11.078125, -10.203125, -9.328125, -8.453125, -7.578125, -6.703125, -5.828125, -4.953125, -4.078125, -3.203125, -2.328125, -1.453125, -0.578125, 0.296875, 1.171875, 2.046875, 2.921875, 3.796875, 4.671875, 5.546875, 6.421875, 7.296875, 8.171875, 9.046875, 9.921875, 10.796875, 11.671875, 12.546875, 13.421875, 14.296875, 15.171875, 16.046875, 16.921875, 17.796875, 18.671875, 19.546875, 20.421875, 21.296875, 22.171875, 23.046875, 23.921875, 24.796875, 25.671875, 26.546875, 27.421875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 4.0, 15.0, 10.0, 11.0, 14.0, 14.0, 30.0, 33.0, 33.0, 38.0, 34.0, 39.0, 44.0, 46.0, 39.0, 57.0, 47.0, 66.0, 44.0, 41.0, 46.0, 61.0, 38.0, 30.0, 24.0, 30.0, 24.0, 11.0, 16.0, 14.0, 9.0, 12.0, 4.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.2734375, -8.977783203125, -8.68212890625, -8.386474609375, -8.0908203125, -7.795166015625, -7.49951171875, -7.203857421875, -6.908203125, -6.612548828125, -6.31689453125, -6.021240234375, -5.7255859375, -5.429931640625, -5.13427734375, -4.838623046875, -4.54296875, -4.247314453125, -3.95166015625, -3.656005859375, -3.3603515625, -3.064697265625, -2.76904296875, -2.473388671875, -2.177734375, -1.882080078125, -1.58642578125, -1.290771484375, -0.9951171875, -0.699462890625, -0.40380859375, -0.108154296875, 0.1875, 0.483154296875, 0.77880859375, 1.074462890625, 1.3701171875, 1.665771484375, 1.96142578125, 2.257080078125, 2.552734375, 2.848388671875, 3.14404296875, 3.439697265625, 3.7353515625, 4.031005859375, 4.32666015625, 4.622314453125, 4.91796875, 5.213623046875, 5.50927734375, 5.804931640625, 6.1005859375, 6.396240234375, 6.69189453125, 6.987548828125, 7.283203125, 7.578857421875, 7.87451171875, 8.170166015625, 8.4658203125, 8.761474609375, 9.05712890625, 9.352783203125, 9.6484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 15.0, 26.0, 34.0, 53.0, 79.0, 163.0, 288.0, 456.0, 833.0, 1662.0, 4774.0, 44373.0, 733209.0, 243451.0, 13688.0, 2734.0, 1184.0, 643.0, 377.0, 218.0, 121.0, 80.0, 40.0, 28.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.41796875, -36.8671875, -35.31640625, -33.765625, -32.21484375, -30.6640625, -29.11328125, -27.5625, -26.01171875, -24.4609375, -22.91015625, -21.359375, -19.80859375, -18.2578125, -16.70703125, -15.15625, -13.60546875, -12.0546875, -10.50390625, -8.953125, -7.40234375, -5.8515625, -4.30078125, -2.75, -1.19921875, 0.3515625, 1.90234375, 3.453125, 5.00390625, 6.5546875, 8.10546875, 9.65625, 11.20703125, 12.7578125, 14.30859375, 15.859375, 17.41015625, 18.9609375, 20.51171875, 22.0625, 23.61328125, 25.1640625, 26.71484375, 28.265625, 29.81640625, 31.3671875, 32.91796875, 34.46875, 36.01953125, 37.5703125, 39.12109375, 40.671875, 42.22265625, 43.7734375, 45.32421875, 46.875, 48.42578125, 49.9765625, 51.52734375, 53.078125, 54.62890625, 56.1796875, 57.73046875, 59.28125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 9.0, 15.0, 17.0, 20.0, 21.0, 42.0, 46.0, 50.0, 59.0, 70.0, 66.0, 75.0, 71.0, 74.0, 78.0, 58.0, 57.0, 46.0, 33.0, 30.0, 16.0, 15.0, 8.0, 10.0, 10.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.59375, -41.77978515625, -39.9658203125, -38.15185546875, -36.337890625, -34.52392578125, -32.7099609375, -30.89599609375, -29.08203125, -27.26806640625, -25.4541015625, -23.64013671875, -21.826171875, -20.01220703125, -18.1982421875, -16.38427734375, -14.5703125, -12.75634765625, -10.9423828125, -9.12841796875, -7.314453125, -5.50048828125, -3.6865234375, -1.87255859375, -0.05859375, 1.75537109375, 3.5693359375, 5.38330078125, 7.197265625, 9.01123046875, 10.8251953125, 12.63916015625, 14.453125, 16.26708984375, 18.0810546875, 19.89501953125, 21.708984375, 23.52294921875, 25.3369140625, 27.15087890625, 28.96484375, 30.77880859375, 32.5927734375, 34.40673828125, 36.220703125, 38.03466796875, 39.8486328125, 41.66259765625, 43.4765625, 45.29052734375, 47.1044921875, 48.91845703125, 50.732421875, 52.54638671875, 54.3603515625, 56.17431640625, 57.98828125, 59.80224609375, 61.6162109375, 63.43017578125, 65.244140625, 67.05810546875, 68.8720703125, 70.68603515625, 72.5]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 9.0, 12.0, 8.0, 10.0, 24.0, 45.0, 59.0, 89.0, 123.0, 238.0, 433.0, 850.0, 2036.0, 6585.0, 34613.0, 404461.0, 543005.0, 43727.0, 7843.0, 2284.0, 990.0, 457.0, 247.0, 126.0, 91.0, 57.0, 49.0, 27.0, 12.0, 16.0, 8.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6640625, -13.1187744140625, -12.573486328125, -12.0281982421875, -11.48291015625, -10.9376220703125, -10.392333984375, -9.8470458984375, -9.3017578125, -8.7564697265625, -8.211181640625, -7.6658935546875, -7.12060546875, -6.5753173828125, -6.030029296875, -5.4847412109375, -4.939453125, -4.3941650390625, -3.848876953125, -3.3035888671875, -2.75830078125, -2.2130126953125, -1.667724609375, -1.1224365234375, -0.5771484375, -0.0318603515625, 0.513427734375, 1.0587158203125, 1.60400390625, 2.1492919921875, 2.694580078125, 3.2398681640625, 3.78515625, 4.3304443359375, 4.875732421875, 5.4210205078125, 5.96630859375, 6.5115966796875, 7.056884765625, 7.6021728515625, 8.1474609375, 8.6927490234375, 9.238037109375, 9.7833251953125, 10.32861328125, 10.8739013671875, 11.419189453125, 11.9644775390625, 12.509765625, 13.0550537109375, 13.600341796875, 14.1456298828125, 14.69091796875, 15.2362060546875, 15.781494140625, 16.3267822265625, 16.8720703125, 17.4173583984375, 17.962646484375, 18.5079345703125, 19.05322265625, 19.5985107421875, 20.143798828125, 20.6890869140625, 21.234375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 9.0, 14.0, 10.0, 14.0, 25.0, 31.0, 33.0, 54.0, 66.0, 99.0, 113.0, 127.0, 97.0, 74.0, 57.0, 45.0, 37.0, 23.0, 16.0, 10.0, 6.0, 6.0, 5.0, 9.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001434326171875, -0.0013771653175354004, -0.0013200044631958008, -0.0012628436088562012, -0.0012056827545166016, -0.001148521900177002, -0.0010913610458374023, -0.0010342001914978027, -0.0009770393371582031, -0.0009198784828186035, -0.0008627176284790039, -0.0008055567741394043, -0.0007483959197998047, -0.0006912350654602051, -0.0006340742111206055, -0.0005769133567810059, -0.0005197525024414062, -0.00046259164810180664, -0.00040543079376220703, -0.0003482699394226074, -0.0002911090850830078, -0.0002339482307434082, -0.0001767873764038086, -0.00011962652206420898, -6.246566772460938e-05, -5.304813385009766e-06, 5.1856040954589844e-05, 0.00010901689529418945, 0.00016617774963378906, 0.00022333860397338867, 0.0002804994583129883, 0.0003376603126525879, 0.0003948211669921875, 0.0004519820213317871, 0.0005091428756713867, 0.0005663037300109863, 0.0006234645843505859, 0.0006806254386901855, 0.0007377862930297852, 0.0007949471473693848, 0.0008521080017089844, 0.000909268856048584, 0.0009664297103881836, 0.0010235905647277832, 0.0010807514190673828, 0.0011379122734069824, 0.001195073127746582, 0.0012522339820861816, 0.0013093948364257812, 0.0013665556907653809, 0.0014237165451049805, 0.00148087739944458, 0.0015380382537841797, 0.0015951991081237793, 0.001652359962463379, 0.0017095208168029785, 0.0017666816711425781, 0.0018238425254821777, 0.0018810033798217773, 0.001938164234161377, 0.0019953250885009766, 0.002052485942840576, 0.0021096467971801758, 0.0021668076515197754, 0.002223968505859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 7.0, 14.0, 17.0, 26.0, 46.0, 55.0, 98.0, 165.0, 305.0, 585.0, 1263.0, 3653.0, 15599.0, 130711.0, 755682.0, 119440.0, 14740.0, 3647.0, 1174.0, 593.0, 299.0, 157.0, 94.0, 63.0, 33.0, 28.0, 16.0, 14.0, 8.0, 9.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.828125, -20.2724609375, -19.716796875, -19.1611328125, -18.60546875, -18.0498046875, -17.494140625, -16.9384765625, -16.3828125, -15.8271484375, -15.271484375, -14.7158203125, -14.16015625, -13.6044921875, -13.048828125, -12.4931640625, -11.9375, -11.3818359375, -10.826171875, -10.2705078125, -9.71484375, -9.1591796875, -8.603515625, -8.0478515625, -7.4921875, -6.9365234375, -6.380859375, -5.8251953125, -5.26953125, -4.7138671875, -4.158203125, -3.6025390625, -3.046875, -2.4912109375, -1.935546875, -1.3798828125, -0.82421875, -0.2685546875, 0.287109375, 0.8427734375, 1.3984375, 1.9541015625, 2.509765625, 3.0654296875, 3.62109375, 4.1767578125, 4.732421875, 5.2880859375, 5.84375, 6.3994140625, 6.955078125, 7.5107421875, 8.06640625, 8.6220703125, 9.177734375, 9.7333984375, 10.2890625, 10.8447265625, 11.400390625, 11.9560546875, 12.51171875, 13.0673828125, 13.623046875, 14.1787109375, 14.734375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 13.0, 17.0, 36.0, 68.0, 133.0, 184.0, 240.0, 141.0, 57.0, 49.0, 26.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.25, -19.33349609375, -18.4169921875, -17.50048828125, -16.583984375, -15.66748046875, -14.7509765625, -13.83447265625, -12.91796875, -12.00146484375, -11.0849609375, -10.16845703125, -9.251953125, -8.33544921875, -7.4189453125, -6.50244140625, -5.5859375, -4.66943359375, -3.7529296875, -2.83642578125, -1.919921875, -1.00341796875, -0.0869140625, 0.82958984375, 1.74609375, 2.66259765625, 3.5791015625, 4.49560546875, 5.412109375, 6.32861328125, 7.2451171875, 8.16162109375, 9.078125, 9.99462890625, 10.9111328125, 11.82763671875, 12.744140625, 13.66064453125, 14.5771484375, 15.49365234375, 16.41015625, 17.32666015625, 18.2431640625, 19.15966796875, 20.076171875, 20.99267578125, 21.9091796875, 22.82568359375, 23.7421875, 24.65869140625, 25.5751953125, 26.49169921875, 27.408203125, 28.32470703125, 29.2412109375, 30.15771484375, 31.07421875, 31.99072265625, 32.9072265625, 33.82373046875, 34.740234375, 35.65673828125, 36.5732421875, 37.48974609375, 38.40625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 25.0, 139.0, 441.0, 288.0, 96.0, 16.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-244.26541137695312, -218.94081115722656, -193.61619567871094, -168.29159545898438, -142.96697998046875, -117.64237976074219, -92.31777954101562, -66.9931640625, -41.66856384277344, -16.343957901000977, 8.980648040771484, 34.30525207519531, 59.629859924316406, 84.9544677734375, 110.27906799316406, 135.6036834716797, 160.92828369140625, 186.2528839111328, 211.57749938964844, 236.902099609375, 262.2267150878906, 287.55133056640625, 312.87591552734375, 338.2005310058594, 363.525146484375, 388.8497619628906, 414.1743469238281, 439.49896240234375, 464.8235778808594, 490.148193359375, 515.4727783203125, 540.79736328125, 566.1220092773438, 591.4465942382812, 616.771240234375, 642.0958251953125, 667.42041015625, 692.7450561523438, 718.0696411132812, 743.394287109375, 768.7188720703125, 794.04345703125, 819.3681030273438, 844.6926879882812, 870.0172729492188, 895.3419189453125, 920.66650390625, 945.9910888671875, 971.315673828125, 996.6402587890625, 1021.9649047851562, 1047.28955078125, 1072.6141357421875, 1097.938720703125, 1123.2633056640625, 1148.587890625, 1173.91259765625, 1199.2371826171875, 1224.561767578125, 1249.886474609375, 1275.2110595703125, 1300.53564453125, 1325.8602294921875, 1351.184814453125, 1376.5093994140625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 8.0, 4.0, 13.0, 6.0, 8.0, 11.0, 20.0, 29.0, 17.0, 19.0, 22.0, 26.0, 26.0, 49.0, 41.0, 36.0, 39.0, 49.0, 45.0, 42.0, 40.0, 43.0, 36.0, 48.0, 36.0, 38.0, 32.0, 27.0, 30.0, 20.0, 25.0, 15.0, 17.0, 18.0, 14.0, 5.0, 9.0, 6.0, 6.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-178.16281127929688, -173.02392578125, -167.88502502441406, -162.74612426757812, -157.60723876953125, -152.46835327148438, -147.32945251464844, -142.1905517578125, -137.05166625976562, -131.91278076171875, -126.77388000488281, -121.6349868774414, -116.49609375, -111.3572006225586, -106.21830749511719, -101.07941436767578, -95.94052124023438, -90.80162811279297, -85.66273498535156, -80.52384185791016, -75.38494873046875, -70.24605560302734, -65.10716247558594, -59.96826934814453, -54.829376220703125, -49.69048309326172, -44.55158996582031, -39.412696838378906, -34.2738037109375, -29.134910583496094, -23.996017456054688, -18.85712432861328, -13.718231201171875, -8.579338073730469, -3.4404449462890625, 1.6984481811523438, 6.83734130859375, 11.976234436035156, 17.115127563476562, 22.25402069091797, 27.392913818359375, 32.53180694580078, 37.67070007324219, 42.809593200683594, 47.948486328125, 53.087379455566406, 58.22627258300781, 63.36516571044922, 68.50405883789062, 73.64295196533203, 78.78184509277344, 83.92073822021484, 89.05963134765625, 94.19852447509766, 99.33741760253906, 104.47631072998047, 109.61520385742188, 114.75409698486328, 119.89299011230469, 125.0318832397461, 130.1707763671875, 135.30966186523438, 140.4485626220703, 145.58746337890625, 150.72634887695312]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 11.0, 17.0, 18.0, 44.0, 65.0, 115.0, 141.0, 284.0, 490.0, 1038.0, 3321.0, 15871.0, 4115522.0, 48429.0, 5784.0, 1611.0, 645.0, 359.0, 201.0, 102.0, 70.0, 53.0, 28.0, 19.0, 13.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-109.9375, -107.1689453125, -104.400390625, -101.6318359375, -98.86328125, -96.0947265625, -93.326171875, -90.5576171875, -87.7890625, -85.0205078125, -82.251953125, -79.4833984375, -76.71484375, -73.9462890625, -71.177734375, -68.4091796875, -65.640625, -62.8720703125, -60.103515625, -57.3349609375, -54.56640625, -51.7978515625, -49.029296875, -46.2607421875, -43.4921875, -40.7236328125, -37.955078125, -35.1865234375, -32.41796875, -29.6494140625, -26.880859375, -24.1123046875, -21.34375, -18.5751953125, -15.806640625, -13.0380859375, -10.26953125, -7.5009765625, -4.732421875, -1.9638671875, 0.8046875, 3.5732421875, 6.341796875, 9.1103515625, 11.87890625, 14.6474609375, 17.416015625, 20.1845703125, 22.953125, 25.7216796875, 28.490234375, 31.2587890625, 34.02734375, 36.7958984375, 39.564453125, 42.3330078125, 45.1015625, 47.8701171875, 50.638671875, 53.4072265625, 56.17578125, 58.9443359375, 61.712890625, 64.4814453125, 67.25]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 2.0, 1.0, 8.0, 9.0, 10.0, 13.0, 15.0, 27.0, 27.0, 32.0, 29.0, 38.0, 21.0, 45.0, 44.0, 33.0, 54.0, 58.0, 49.0, 51.0, 54.0, 45.0, 43.0, 50.0, 39.0, 31.0, 33.0, 30.0, 28.0, 16.0, 15.0, 7.0, 10.0, 5.0, 8.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.296875, -8.991455078125, -8.68603515625, -8.380615234375, -8.0751953125, -7.769775390625, -7.46435546875, -7.158935546875, -6.853515625, -6.548095703125, -6.24267578125, -5.937255859375, -5.6318359375, -5.326416015625, -5.02099609375, -4.715576171875, -4.41015625, -4.104736328125, -3.79931640625, -3.493896484375, -3.1884765625, -2.883056640625, -2.57763671875, -2.272216796875, -1.966796875, -1.661376953125, -1.35595703125, -1.050537109375, -0.7451171875, -0.439697265625, -0.13427734375, 0.171142578125, 0.4765625, 0.781982421875, 1.08740234375, 1.392822265625, 1.6982421875, 2.003662109375, 2.30908203125, 2.614501953125, 2.919921875, 3.225341796875, 3.53076171875, 3.836181640625, 4.1416015625, 4.447021484375, 4.75244140625, 5.057861328125, 5.36328125, 5.668701171875, 5.97412109375, 6.279541015625, 6.5849609375, 6.890380859375, 7.19580078125, 7.501220703125, 7.806640625, 8.112060546875, 8.41748046875, 8.722900390625, 9.0283203125, 9.333740234375, 9.63916015625, 9.944580078125, 10.25]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 6.0, 13.0, 13.0, 14.0, 13.0, 30.0, 25.0, 36.0, 42.0, 54.0, 69.0, 85.0, 125.0, 150.0, 233.0, 399.0, 925.0, 2327.0, 9396.0, 92209.0, 4059176.0, 21436.0, 4325.0, 1419.0, 595.0, 298.0, 205.0, 133.0, 105.0, 90.0, 61.0, 39.0, 43.0, 22.0, 37.0, 23.0, 22.0, 14.0, 14.0, 17.0, 7.0, 6.0, 5.0, 5.0, 5.0, 0.0, 3.0, 2.0], "bins": [-67.0625, -65.2119140625, -63.361328125, -61.5107421875, -59.66015625, -57.8095703125, -55.958984375, -54.1083984375, -52.2578125, -50.4072265625, -48.556640625, -46.7060546875, -44.85546875, -43.0048828125, -41.154296875, -39.3037109375, -37.453125, -35.6025390625, -33.751953125, -31.9013671875, -30.05078125, -28.2001953125, -26.349609375, -24.4990234375, -22.6484375, -20.7978515625, -18.947265625, -17.0966796875, -15.24609375, -13.3955078125, -11.544921875, -9.6943359375, -7.84375, -5.9931640625, -4.142578125, -2.2919921875, -0.44140625, 1.4091796875, 3.259765625, 5.1103515625, 6.9609375, 8.8115234375, 10.662109375, 12.5126953125, 14.36328125, 16.2138671875, 18.064453125, 19.9150390625, 21.765625, 23.6162109375, 25.466796875, 27.3173828125, 29.16796875, 31.0185546875, 32.869140625, 34.7197265625, 36.5703125, 38.4208984375, 40.271484375, 42.1220703125, 43.97265625, 45.8232421875, 47.673828125, 49.5244140625, 51.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 20.0, 26.0, 61.0, 337.0, 3450.0, 91.0, 33.0, 19.0, 8.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6484375, -8.2745361328125, -7.900634765625, -7.5267333984375, -7.15283203125, -6.7789306640625, -6.405029296875, -6.0311279296875, -5.6572265625, -5.2833251953125, -4.909423828125, -4.5355224609375, -4.16162109375, -3.7877197265625, -3.413818359375, -3.0399169921875, -2.666015625, -2.2921142578125, -1.918212890625, -1.5443115234375, -1.17041015625, -0.7965087890625, -0.422607421875, -0.0487060546875, 0.3251953125, 0.6990966796875, 1.072998046875, 1.4468994140625, 1.82080078125, 2.1947021484375, 2.568603515625, 2.9425048828125, 3.31640625, 3.6903076171875, 4.064208984375, 4.4381103515625, 4.81201171875, 5.1859130859375, 5.559814453125, 5.9337158203125, 6.3076171875, 6.6815185546875, 7.055419921875, 7.4293212890625, 7.80322265625, 8.1771240234375, 8.551025390625, 8.9249267578125, 9.298828125, 9.6727294921875, 10.046630859375, 10.4205322265625, 10.79443359375, 11.1683349609375, 11.542236328125, 11.9161376953125, 12.2900390625, 12.6639404296875, 13.037841796875, 13.4117431640625, 13.78564453125, 14.1595458984375, 14.533447265625, 14.9073486328125, 15.28125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 7.0, 18.0, 22.0, 20.0, 42.0, 57.0, 101.0, 105.0, 109.0, 124.0, 87.0, 74.0, 63.0, 54.0, 29.0, 29.0, 14.0, 12.0, 11.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-48.419193267822266, -47.24048614501953, -46.0617790222168, -44.88307571411133, -43.704368591308594, -42.52566146850586, -41.346954345703125, -40.16824722290039, -38.989540100097656, -37.81083297729492, -36.63212585449219, -35.45342254638672, -34.274715423583984, -33.09600830078125, -31.917301177978516, -30.73859405517578, -29.559890747070312, -28.381183624267578, -27.202478408813477, -26.023771286010742, -24.84506607055664, -23.666358947753906, -22.487651824951172, -21.308944702148438, -20.130239486694336, -18.9515323638916, -17.7728271484375, -16.594120025634766, -15.415413856506348, -14.23670768737793, -13.058000564575195, -11.879294395446777, -10.700584411621094, -9.521878242492676, -8.343172073364258, -7.164464950561523, -5.9857587814331055, -4.8070526123046875, -3.6283459663391113, -2.449639320373535, -1.2709331512451172, -0.09222674369812012, 1.086479663848877, 2.265186071395874, 3.443892478942871, 4.622598648071289, 5.801305294036865, 6.980011940002441, 8.15871810913086, 9.337424278259277, 10.516130447387695, 11.69483757019043, 12.873543739318848, 14.052249908447266, 15.23095703125, 16.409664154052734, 17.588369369506836, 18.76707649230957, 19.945781707763672, 21.124488830566406, 22.30319595336914, 23.481901168823242, 24.660608291625977, 25.839313507080078, 27.018020629882812]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 9.0, 11.0, 11.0, 10.0, 12.0, 12.0, 17.0, 23.0, 15.0, 20.0, 31.0, 30.0, 34.0, 29.0, 28.0, 34.0, 26.0, 22.0, 37.0, 34.0, 39.0, 32.0, 37.0, 48.0, 38.0, 33.0, 37.0, 33.0, 26.0, 31.0, 27.0, 22.0, 20.0, 20.0, 14.0, 14.0, 13.0, 10.0, 13.0, 10.0, 8.0, 11.0, 7.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-19.241703033447266, -18.67993927001953, -18.118175506591797, -17.556411743164062, -16.994647979736328, -16.432884216308594, -15.871121406555176, -15.309357643127441, -14.747593879699707, -14.185830116271973, -13.624066352844238, -13.062302589416504, -12.500539779663086, -11.938776016235352, -11.377012252807617, -10.815248489379883, -10.253484725952148, -9.691720962524414, -9.12995719909668, -8.568193435668945, -8.006429672241211, -7.444666385650635, -6.882903099060059, -6.321139335632324, -5.75937557220459, -5.1976118087768555, -4.635848045349121, -4.074084758758545, -3.5123209953308105, -2.950557231903076, -2.388793706893921, -1.8270301818847656, -1.2652664184570312, -0.7035027742385864, -0.1417391300201416, 0.4200245141983032, 0.981788158416748, 1.5435519218444824, 2.1053154468536377, 2.667078971862793, 3.2288427352905273, 3.7906064987182617, 4.352370262145996, 4.914133548736572, 5.475897312164307, 6.037661075592041, 6.599424362182617, 7.161188125610352, 7.722951889038086, 8.28471565246582, 8.846479415893555, 9.408243179321289, 9.970006942749023, 10.531770706176758, 11.093533515930176, 11.65529727935791, 12.217061042785645, 12.778824806213379, 13.340588569641113, 13.902352333068848, 14.464115142822266, 15.02587890625, 15.587642669677734, 16.14940643310547, 16.711170196533203]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 7.0, 8.0, 17.0, 12.0, 38.0, 73.0, 120.0, 217.0, 428.0, 817.0, 1788.0, 4186.0, 10190.0, 27728.0, 79977.0, 236872.0, 404255.0, 183652.0, 62130.0, 21463.0, 8301.0, 3316.0, 1461.0, 692.0, 354.0, 196.0, 96.0, 56.0, 35.0, 25.0, 15.0, 10.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.796875, -19.166015625, -18.53515625, -17.904296875, -17.2734375, -16.642578125, -16.01171875, -15.380859375, -14.75, -14.119140625, -13.48828125, -12.857421875, -12.2265625, -11.595703125, -10.96484375, -10.333984375, -9.703125, -9.072265625, -8.44140625, -7.810546875, -7.1796875, -6.548828125, -5.91796875, -5.287109375, -4.65625, -4.025390625, -3.39453125, -2.763671875, -2.1328125, -1.501953125, -0.87109375, -0.240234375, 0.390625, 1.021484375, 1.65234375, 2.283203125, 2.9140625, 3.544921875, 4.17578125, 4.806640625, 5.4375, 6.068359375, 6.69921875, 7.330078125, 7.9609375, 8.591796875, 9.22265625, 9.853515625, 10.484375, 11.115234375, 11.74609375, 12.376953125, 13.0078125, 13.638671875, 14.26953125, 14.900390625, 15.53125, 16.162109375, 16.79296875, 17.423828125, 18.0546875, 18.685546875, 19.31640625, 19.947265625, 20.578125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 8.0, 10.0, 13.0, 13.0, 19.0, 23.0, 34.0, 33.0, 40.0, 35.0, 46.0, 42.0, 53.0, 50.0, 51.0, 58.0, 39.0, 51.0, 56.0, 53.0, 44.0, 30.0, 37.0, 29.0, 15.0, 24.0, 19.0, 13.0, 10.0, 11.0, 7.0, 3.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.265625, -9.92431640625, -9.5830078125, -9.24169921875, -8.900390625, -8.55908203125, -8.2177734375, -7.87646484375, -7.53515625, -7.19384765625, -6.8525390625, -6.51123046875, -6.169921875, -5.82861328125, -5.4873046875, -5.14599609375, -4.8046875, -4.46337890625, -4.1220703125, -3.78076171875, -3.439453125, -3.09814453125, -2.7568359375, -2.41552734375, -2.07421875, -1.73291015625, -1.3916015625, -1.05029296875, -0.708984375, -0.36767578125, -0.0263671875, 0.31494140625, 0.65625, 0.99755859375, 1.3388671875, 1.68017578125, 2.021484375, 2.36279296875, 2.7041015625, 3.04541015625, 3.38671875, 3.72802734375, 4.0693359375, 4.41064453125, 4.751953125, 5.09326171875, 5.4345703125, 5.77587890625, 6.1171875, 6.45849609375, 6.7998046875, 7.14111328125, 7.482421875, 7.82373046875, 8.1650390625, 8.50634765625, 8.84765625, 9.18896484375, 9.5302734375, 9.87158203125, 10.212890625, 10.55419921875, 10.8955078125, 11.23681640625, 11.578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 5.0, 5.0, 10.0, 7.0, 9.0, 20.0, 22.0, 20.0, 36.0, 50.0, 76.0, 111.0, 173.0, 238.0, 347.0, 443.0, 708.0, 1154.0, 2318.0, 6471.0, 33648.0, 324858.0, 598475.0, 62309.0, 10067.0, 3040.0, 1395.0, 778.0, 538.0, 354.0, 270.0, 191.0, 115.0, 71.0, 64.0, 35.0, 26.0, 30.0, 17.0, 10.0, 12.0, 9.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-31.765625, -30.745849609375, -29.72607421875, -28.706298828125, -27.6865234375, -26.666748046875, -25.64697265625, -24.627197265625, -23.607421875, -22.587646484375, -21.56787109375, -20.548095703125, -19.5283203125, -18.508544921875, -17.48876953125, -16.468994140625, -15.44921875, -14.429443359375, -13.40966796875, -12.389892578125, -11.3701171875, -10.350341796875, -9.33056640625, -8.310791015625, -7.291015625, -6.271240234375, -5.25146484375, -4.231689453125, -3.2119140625, -2.192138671875, -1.17236328125, -0.152587890625, 0.8671875, 1.886962890625, 2.90673828125, 3.926513671875, 4.9462890625, 5.966064453125, 6.98583984375, 8.005615234375, 9.025390625, 10.045166015625, 11.06494140625, 12.084716796875, 13.1044921875, 14.124267578125, 15.14404296875, 16.163818359375, 17.18359375, 18.203369140625, 19.22314453125, 20.242919921875, 21.2626953125, 22.282470703125, 23.30224609375, 24.322021484375, 25.341796875, 26.361572265625, 27.38134765625, 28.401123046875, 29.4208984375, 30.440673828125, 31.46044921875, 32.480224609375, 33.5]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 12.0, 7.0, 13.0, 17.0, 19.0, 19.0, 24.0, 42.0, 53.0, 55.0, 53.0, 53.0, 58.0, 54.0, 63.0, 54.0, 53.0, 42.0, 38.0, 51.0, 52.0, 36.0, 29.0, 24.0, 18.0, 23.0, 7.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.125, -53.56982421875, -52.0146484375, -50.45947265625, -48.904296875, -47.34912109375, -45.7939453125, -44.23876953125, -42.68359375, -41.12841796875, -39.5732421875, -38.01806640625, -36.462890625, -34.90771484375, -33.3525390625, -31.79736328125, -30.2421875, -28.68701171875, -27.1318359375, -25.57666015625, -24.021484375, -22.46630859375, -20.9111328125, -19.35595703125, -17.80078125, -16.24560546875, -14.6904296875, -13.13525390625, -11.580078125, -10.02490234375, -8.4697265625, -6.91455078125, -5.359375, -3.80419921875, -2.2490234375, -0.69384765625, 0.861328125, 2.41650390625, 3.9716796875, 5.52685546875, 7.08203125, 8.63720703125, 10.1923828125, 11.74755859375, 13.302734375, 14.85791015625, 16.4130859375, 17.96826171875, 19.5234375, 21.07861328125, 22.6337890625, 24.18896484375, 25.744140625, 27.29931640625, 28.8544921875, 30.40966796875, 31.96484375, 33.52001953125, 35.0751953125, 36.63037109375, 38.185546875, 39.74072265625, 41.2958984375, 42.85107421875, 44.40625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 4.0, 9.0, 11.0, 5.0, 14.0, 28.0, 40.0, 49.0, 77.0, 119.0, 165.0, 288.0, 459.0, 798.0, 1317.0, 2793.0, 6530.0, 22286.0, 161042.0, 736286.0, 90036.0, 15713.0, 5184.0, 2346.0, 1136.0, 648.0, 424.0, 227.0, 161.0, 96.0, 66.0, 43.0, 34.0, 28.0, 13.0, 25.0, 17.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.3828125, -12.969482421875, -12.55615234375, -12.142822265625, -11.7294921875, -11.316162109375, -10.90283203125, -10.489501953125, -10.076171875, -9.662841796875, -9.24951171875, -8.836181640625, -8.4228515625, -8.009521484375, -7.59619140625, -7.182861328125, -6.76953125, -6.356201171875, -5.94287109375, -5.529541015625, -5.1162109375, -4.702880859375, -4.28955078125, -3.876220703125, -3.462890625, -3.049560546875, -2.63623046875, -2.222900390625, -1.8095703125, -1.396240234375, -0.98291015625, -0.569580078125, -0.15625, 0.257080078125, 0.67041015625, 1.083740234375, 1.4970703125, 1.910400390625, 2.32373046875, 2.737060546875, 3.150390625, 3.563720703125, 3.97705078125, 4.390380859375, 4.8037109375, 5.217041015625, 5.63037109375, 6.043701171875, 6.45703125, 6.870361328125, 7.28369140625, 7.697021484375, 8.1103515625, 8.523681640625, 8.93701171875, 9.350341796875, 9.763671875, 10.177001953125, 10.59033203125, 11.003662109375, 11.4169921875, 11.830322265625, 12.24365234375, 12.656982421875, 13.0703125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 1.0, 4.0, 8.0, 10.0, 15.0, 26.0, 35.0, 46.0, 91.0, 141.0, 190.0, 146.0, 96.0, 48.0, 32.0, 30.0, 18.0, 14.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002407073974609375, -0.0023307204246520996, -0.0022543668746948242, -0.002178013324737549, -0.0021016597747802734, -0.002025306224822998, -0.0019489526748657227, -0.0018725991249084473, -0.0017962455749511719, -0.0017198920249938965, -0.001643538475036621, -0.0015671849250793457, -0.0014908313751220703, -0.001414477825164795, -0.0013381242752075195, -0.0012617707252502441, -0.0011854171752929688, -0.0011090636253356934, -0.001032710075378418, -0.0009563565254211426, -0.0008800029754638672, -0.0008036494255065918, -0.0007272958755493164, -0.000650942325592041, -0.0005745887756347656, -0.0004982352256774902, -0.00042188167572021484, -0.00034552812576293945, -0.00026917457580566406, -0.00019282102584838867, -0.00011646747589111328, -4.011392593383789e-05, 3.62396240234375e-05, 0.00011259317398071289, 0.00018894672393798828, 0.00026530027389526367, 0.00034165382385253906, 0.00041800737380981445, 0.0004943609237670898, 0.0005707144737243652, 0.0006470680236816406, 0.000723421573638916, 0.0007997751235961914, 0.0008761286735534668, 0.0009524822235107422, 0.0010288357734680176, 0.001105189323425293, 0.0011815428733825684, 0.0012578964233398438, 0.0013342499732971191, 0.0014106035232543945, 0.00148695707321167, 0.0015633106231689453, 0.0016396641731262207, 0.001716017723083496, 0.0017923712730407715, 0.0018687248229980469, 0.0019450783729553223, 0.0020214319229125977, 0.002097785472869873, 0.0021741390228271484, 0.002250492572784424, 0.0023268461227416992, 0.0024031996726989746, 0.00247955322265625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 6.0, 9.0, 13.0, 16.0, 19.0, 33.0, 40.0, 55.0, 75.0, 97.0, 172.0, 291.0, 430.0, 718.0, 1195.0, 2318.0, 5579.0, 18537.0, 135847.0, 744524.0, 111568.0, 16597.0, 5078.0, 2202.0, 1246.0, 699.0, 369.0, 270.0, 160.0, 103.0, 76.0, 55.0, 42.0, 30.0, 14.0, 21.0, 8.0, 11.0, 9.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.8984375, -14.439453125, -13.98046875, -13.521484375, -13.0625, -12.603515625, -12.14453125, -11.685546875, -11.2265625, -10.767578125, -10.30859375, -9.849609375, -9.390625, -8.931640625, -8.47265625, -8.013671875, -7.5546875, -7.095703125, -6.63671875, -6.177734375, -5.71875, -5.259765625, -4.80078125, -4.341796875, -3.8828125, -3.423828125, -2.96484375, -2.505859375, -2.046875, -1.587890625, -1.12890625, -0.669921875, -0.2109375, 0.248046875, 0.70703125, 1.166015625, 1.625, 2.083984375, 2.54296875, 3.001953125, 3.4609375, 3.919921875, 4.37890625, 4.837890625, 5.296875, 5.755859375, 6.21484375, 6.673828125, 7.1328125, 7.591796875, 8.05078125, 8.509765625, 8.96875, 9.427734375, 9.88671875, 10.345703125, 10.8046875, 11.263671875, 11.72265625, 12.181640625, 12.640625, 13.099609375, 13.55859375, 14.017578125, 14.4765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 12.0, 18.0, 27.0, 42.0, 67.0, 118.0, 174.0, 200.0, 141.0, 81.0, 38.0, 29.0, 14.0, 11.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.405517578125, -16.76416015625, -16.122802734375, -15.4814453125, -14.840087890625, -14.19873046875, -13.557373046875, -12.916015625, -12.274658203125, -11.63330078125, -10.991943359375, -10.3505859375, -9.709228515625, -9.06787109375, -8.426513671875, -7.78515625, -7.143798828125, -6.50244140625, -5.861083984375, -5.2197265625, -4.578369140625, -3.93701171875, -3.295654296875, -2.654296875, -2.012939453125, -1.37158203125, -0.730224609375, -0.0888671875, 0.552490234375, 1.19384765625, 1.835205078125, 2.4765625, 3.117919921875, 3.75927734375, 4.400634765625, 5.0419921875, 5.683349609375, 6.32470703125, 6.966064453125, 7.607421875, 8.248779296875, 8.89013671875, 9.531494140625, 10.1728515625, 10.814208984375, 11.45556640625, 12.096923828125, 12.73828125, 13.379638671875, 14.02099609375, 14.662353515625, 15.3037109375, 15.945068359375, 16.58642578125, 17.227783203125, 17.869140625, 18.510498046875, 19.15185546875, 19.793212890625, 20.4345703125, 21.075927734375, 21.71728515625, 22.358642578125, 23.0]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 13.0, 23.0, 78.0, 247.0, 405.0, 181.0, 49.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1205.760498046875, -1184.0751953125, -1162.389892578125, -1140.7044677734375, -1119.0191650390625, -1097.3338623046875, -1075.6485595703125, -1053.963134765625, -1032.27783203125, -1010.592529296875, -988.9071655273438, -967.2218627929688, -945.5364990234375, -923.8511962890625, -902.1658935546875, -880.4805297851562, -858.7952270507812, -837.1099243164062, -815.424560546875, -793.7392578125, -772.0538940429688, -750.3685913085938, -728.6832275390625, -706.9979248046875, -685.3126220703125, -663.6273193359375, -641.9419555664062, -620.2566528320312, -598.5712890625, -576.885986328125, -555.20068359375, -533.5153198242188, -511.83001708984375, -490.1446838378906, -468.4593505859375, -446.7740478515625, -425.08868408203125, -403.40338134765625, -381.7180480957031, -360.03271484375, -338.34735107421875, -316.6620178222656, -294.9766845703125, -273.2913818359375, -251.6060333251953, -229.9207000732422, -208.23538208007812, -186.550048828125, -164.86473083496094, -143.1793975830078, -121.49407196044922, -99.80874633789062, -78.1234130859375, -56.438079833984375, -34.75276184082031, -13.067428588867188, 8.617904663085938, 30.303234100341797, 51.988563537597656, 73.67388916015625, 95.35922241210938, 117.0445556640625, 138.72987365722656, 160.4152069091797, 182.1005401611328]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 11.0, 10.0, 17.0, 14.0, 16.0, 24.0, 21.0, 29.0, 25.0, 30.0, 41.0, 46.0, 37.0, 49.0, 64.0, 57.0, 51.0, 54.0, 48.0, 53.0, 45.0, 36.0, 33.0, 26.0, 31.0, 20.0, 25.0, 16.0, 8.0, 7.0, 13.0, 6.0, 9.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-217.52169799804688, -211.4401397705078, -205.3585662841797, -199.27700805664062, -193.1954345703125, -187.11387634277344, -181.03231811523438, -174.95074462890625, -168.8691864013672, -162.78762817382812, -156.7060546875, -150.62449645996094, -144.54293823242188, -138.46136474609375, -132.3798065185547, -126.2982406616211, -120.2166748046875, -114.1351089477539, -108.05354309082031, -101.97198486328125, -95.89041900634766, -89.80885314941406, -83.727294921875, -77.6457290649414, -71.56416320800781, -65.48259735107422, -59.40103530883789, -53.31947326660156, -47.23790740966797, -41.156341552734375, -35.07477951049805, -28.99321746826172, -22.911636352539062, -16.8300724029541, -10.74850845336914, -4.66694450378418, 1.4146194458007812, 7.496183395385742, 13.577747344970703, 19.65930938720703, 25.740875244140625, 31.822439193725586, 37.90400314331055, 43.985565185546875, 50.06713104248047, 56.14869689941406, 62.23025894165039, 68.31182098388672, 74.39338684082031, 80.4749526977539, 86.5565185546875, 92.63807678222656, 98.71964263916016, 104.80120849609375, 110.88276672363281, 116.9643325805664, 123.0458984375, 129.12745666503906, 135.2090301513672, 141.29058837890625, 147.37216186523438, 153.45372009277344, 159.5352783203125, 165.61685180664062, 171.6984100341797]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 1.0, 4.0, 7.0, 11.0, 9.0, 17.0, 25.0, 30.0, 31.0, 55.0, 64.0, 81.0, 99.0, 137.0, 162.0, 306.0, 459.0, 803.0, 1498.0, 2904.0, 7437.0, 28103.0, 3862896.0, 258001.0, 19475.0, 6013.0, 2430.0, 1206.0, 682.0, 403.0, 251.0, 185.0, 119.0, 80.0, 58.0, 50.0, 52.0, 30.0, 36.0, 23.0, 19.0, 13.0, 10.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.375, -41.0458984375, -39.716796875, -38.3876953125, -37.05859375, -35.7294921875, -34.400390625, -33.0712890625, -31.7421875, -30.4130859375, -29.083984375, -27.7548828125, -26.42578125, -25.0966796875, -23.767578125, -22.4384765625, -21.109375, -19.7802734375, -18.451171875, -17.1220703125, -15.79296875, -14.4638671875, -13.134765625, -11.8056640625, -10.4765625, -9.1474609375, -7.818359375, -6.4892578125, -5.16015625, -3.8310546875, -2.501953125, -1.1728515625, 0.15625, 1.4853515625, 2.814453125, 4.1435546875, 5.47265625, 6.8017578125, 8.130859375, 9.4599609375, 10.7890625, 12.1181640625, 13.447265625, 14.7763671875, 16.10546875, 17.4345703125, 18.763671875, 20.0927734375, 21.421875, 22.7509765625, 24.080078125, 25.4091796875, 26.73828125, 28.0673828125, 29.396484375, 30.7255859375, 32.0546875, 33.3837890625, 34.712890625, 36.0419921875, 37.37109375, 38.7001953125, 40.029296875, 41.3583984375, 42.6875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 2.0, 9.0, 7.0, 9.0, 12.0, 10.0, 18.0, 25.0, 25.0, 40.0, 33.0, 48.0, 47.0, 49.0, 45.0, 51.0, 61.0, 46.0, 58.0, 57.0, 49.0, 47.0, 49.0, 32.0, 28.0, 24.0, 19.0, 18.0, 17.0, 18.0, 12.0, 10.0, 8.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.984375, -11.65966796875, -11.3349609375, -11.01025390625, -10.685546875, -10.36083984375, -10.0361328125, -9.71142578125, -9.38671875, -9.06201171875, -8.7373046875, -8.41259765625, -8.087890625, -7.76318359375, -7.4384765625, -7.11376953125, -6.7890625, -6.46435546875, -6.1396484375, -5.81494140625, -5.490234375, -5.16552734375, -4.8408203125, -4.51611328125, -4.19140625, -3.86669921875, -3.5419921875, -3.21728515625, -2.892578125, -2.56787109375, -2.2431640625, -1.91845703125, -1.59375, -1.26904296875, -0.9443359375, -0.61962890625, -0.294921875, 0.02978515625, 0.3544921875, 0.67919921875, 1.00390625, 1.32861328125, 1.6533203125, 1.97802734375, 2.302734375, 2.62744140625, 2.9521484375, 3.27685546875, 3.6015625, 3.92626953125, 4.2509765625, 4.57568359375, 4.900390625, 5.22509765625, 5.5498046875, 5.87451171875, 6.19921875, 6.52392578125, 6.8486328125, 7.17333984375, 7.498046875, 7.82275390625, 8.1474609375, 8.47216796875, 8.796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 4.0, 7.0, 15.0, 12.0, 15.0, 21.0, 33.0, 43.0, 56.0, 60.0, 106.0, 121.0, 177.0, 303.0, 503.0, 942.0, 2184.0, 6296.0, 25475.0, 3731981.0, 397021.0, 19553.0, 5216.0, 1893.0, 832.0, 456.0, 274.0, 174.0, 128.0, 99.0, 69.0, 56.0, 37.0, 26.0, 23.0, 13.0, 18.0, 14.0, 7.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.9375, -44.49853515625, -43.0595703125, -41.62060546875, -40.181640625, -38.74267578125, -37.3037109375, -35.86474609375, -34.42578125, -32.98681640625, -31.5478515625, -30.10888671875, -28.669921875, -27.23095703125, -25.7919921875, -24.35302734375, -22.9140625, -21.47509765625, -20.0361328125, -18.59716796875, -17.158203125, -15.71923828125, -14.2802734375, -12.84130859375, -11.40234375, -9.96337890625, -8.5244140625, -7.08544921875, -5.646484375, -4.20751953125, -2.7685546875, -1.32958984375, 0.109375, 1.54833984375, 2.9873046875, 4.42626953125, 5.865234375, 7.30419921875, 8.7431640625, 10.18212890625, 11.62109375, 13.06005859375, 14.4990234375, 15.93798828125, 17.376953125, 18.81591796875, 20.2548828125, 21.69384765625, 23.1328125, 24.57177734375, 26.0107421875, 27.44970703125, 28.888671875, 30.32763671875, 31.7666015625, 33.20556640625, 34.64453125, 36.08349609375, 37.5224609375, 38.96142578125, 40.400390625, 41.83935546875, 43.2783203125, 44.71728515625, 46.15625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 11.0, 12.0, 18.0, 28.0, 66.0, 336.0, 3280.0, 188.0, 60.0, 34.0, 14.0, 8.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9140625, -9.2679443359375, -8.621826171875, -7.9757080078125, -7.32958984375, -6.6834716796875, -6.037353515625, -5.3912353515625, -4.7451171875, -4.0989990234375, -3.452880859375, -2.8067626953125, -2.16064453125, -1.5145263671875, -0.868408203125, -0.2222900390625, 0.423828125, 1.0699462890625, 1.716064453125, 2.3621826171875, 3.00830078125, 3.6544189453125, 4.300537109375, 4.9466552734375, 5.5927734375, 6.2388916015625, 6.885009765625, 7.5311279296875, 8.17724609375, 8.8233642578125, 9.469482421875, 10.1156005859375, 10.76171875, 11.4078369140625, 12.053955078125, 12.7000732421875, 13.34619140625, 13.9923095703125, 14.638427734375, 15.2845458984375, 15.9306640625, 16.5767822265625, 17.222900390625, 17.8690185546875, 18.51513671875, 19.1612548828125, 19.807373046875, 20.4534912109375, 21.099609375, 21.7457275390625, 22.391845703125, 23.0379638671875, 23.68408203125, 24.3302001953125, 24.976318359375, 25.6224365234375, 26.2685546875, 26.9146728515625, 27.560791015625, 28.2069091796875, 28.85302734375, 29.4991455078125, 30.145263671875, 30.7913818359375, 31.4375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 10.0, 14.0, 23.0, 40.0, 51.0, 58.0, 91.0, 115.0, 106.0, 116.0, 100.0, 69.0, 63.0, 43.0, 34.0, 15.0, 15.0, 12.0, 4.0, 7.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.596824645996094, -38.90652084350586, -37.21621322631836, -35.525909423828125, -33.83560562133789, -32.145301818847656, -30.454994201660156, -28.764690399169922, -27.074386596679688, -25.38408088684082, -23.693777084350586, -22.00347137451172, -20.313167572021484, -18.622861862182617, -16.93255615234375, -15.242252349853516, -13.551946640014648, -11.861641883850098, -10.171337127685547, -8.48103141784668, -6.790727138519287, -5.100421905517578, -3.4101171493530273, -1.7198123931884766, -0.02950763702392578, 1.6607972383499146, 3.351102113723755, 5.041407108306885, 6.7317118644714355, 8.422017097473145, 10.112321853637695, 11.802626609802246, 13.492931365966797, 15.183236122131348, 16.8735408782959, 18.563846588134766, 20.254150390625, 21.944456100463867, 23.634761810302734, 25.32506561279297, 27.015369415283203, 28.70567512512207, 30.395978927612305, 32.08628463745117, 33.776588439941406, 35.466896057128906, 37.15719985961914, 38.847503662109375, 40.537811279296875, 42.22811508178711, 43.91842269897461, 45.608726501464844, 47.29903030395508, 48.98933410644531, 50.67964172363281, 52.36994552612305, 54.06024932861328, 55.750553131103516, 57.440860748291016, 59.13116455078125, 60.821468353271484, 62.51177215576172, 64.20207977294922, 65.89237976074219, 67.58268737792969]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 2.0, 8.0, 8.0, 13.0, 14.0, 20.0, 32.0, 39.0, 44.0, 45.0, 60.0, 57.0, 60.0, 64.0, 87.0, 57.0, 62.0, 45.0, 58.0, 47.0, 41.0, 26.0, 19.0, 25.0, 13.0, 15.0, 7.0, 6.0, 7.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.510215759277344, -42.01044845581055, -40.510677337646484, -39.01091003417969, -37.511138916015625, -36.01137161254883, -34.51160430908203, -33.01183319091797, -31.51206398010254, -30.01229476928711, -28.51252555847168, -27.01275634765625, -25.512989044189453, -24.01321792602539, -22.513450622558594, -21.013681411743164, -19.513912200927734, -18.014142990112305, -16.514373779296875, -15.014605522155762, -13.514836311340332, -12.015067100524902, -10.515298843383789, -9.01552963256836, -7.51576042175293, -6.0159912109375, -4.5162224769592285, -3.016453742980957, -1.5166845321655273, -0.016915321350097656, 1.4828529357910156, 2.9826221466064453, 4.482391357421875, 5.982160568237305, 7.481929302215576, 8.981698036193848, 10.481467247009277, 11.981236457824707, 13.48100471496582, 14.98077392578125, 16.48054313659668, 17.98031234741211, 19.48008155822754, 20.97985076904297, 22.479618072509766, 23.979389190673828, 25.479156494140625, 26.978925704956055, 28.478694915771484, 29.978464126586914, 31.478233337402344, 32.97800064086914, 34.4777717590332, 35.9775390625, 37.47731018066406, 38.97707748413086, 40.476844787597656, 41.97661209106445, 43.476383209228516, 44.97615051269531, 46.475921630859375, 47.97568893432617, 49.47545623779297, 50.97522735595703, 52.474998474121094]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 6.0, 3.0, 12.0, 13.0, 23.0, 32.0, 53.0, 85.0, 124.0, 187.0, 329.0, 499.0, 869.0, 1549.0, 2925.0, 5946.0, 12910.0, 29176.0, 69268.0, 161973.0, 337900.0, 241252.0, 103173.0, 43808.0, 18909.0, 8463.0, 4073.0, 2094.0, 1205.0, 650.0, 376.0, 235.0, 145.0, 107.0, 66.0, 46.0, 26.0, 12.0, 15.0, 7.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.609375, -21.918701171875, -21.22802734375, -20.537353515625, -19.8466796875, -19.156005859375, -18.46533203125, -17.774658203125, -17.083984375, -16.393310546875, -15.70263671875, -15.011962890625, -14.3212890625, -13.630615234375, -12.93994140625, -12.249267578125, -11.55859375, -10.867919921875, -10.17724609375, -9.486572265625, -8.7958984375, -8.105224609375, -7.41455078125, -6.723876953125, -6.033203125, -5.342529296875, -4.65185546875, -3.961181640625, -3.2705078125, -2.579833984375, -1.88916015625, -1.198486328125, -0.5078125, 0.182861328125, 0.87353515625, 1.564208984375, 2.2548828125, 2.945556640625, 3.63623046875, 4.326904296875, 5.017578125, 5.708251953125, 6.39892578125, 7.089599609375, 7.7802734375, 8.470947265625, 9.16162109375, 9.852294921875, 10.54296875, 11.233642578125, 11.92431640625, 12.614990234375, 13.3056640625, 13.996337890625, 14.68701171875, 15.377685546875, 16.068359375, 16.759033203125, 17.44970703125, 18.140380859375, 18.8310546875, 19.521728515625, 20.21240234375, 20.903076171875, 21.59375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 7.0, 5.0, 4.0, 8.0, 12.0, 11.0, 19.0, 13.0, 25.0, 26.0, 32.0, 32.0, 40.0, 36.0, 44.0, 40.0, 31.0, 54.0, 53.0, 46.0, 42.0, 48.0, 54.0, 33.0, 41.0, 36.0, 38.0, 32.0, 18.0, 27.0, 16.0, 19.0, 10.0, 14.0, 6.0, 7.0, 3.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8203125, -10.51025390625, -10.2001953125, -9.89013671875, -9.580078125, -9.27001953125, -8.9599609375, -8.64990234375, -8.33984375, -8.02978515625, -7.7197265625, -7.40966796875, -7.099609375, -6.78955078125, -6.4794921875, -6.16943359375, -5.859375, -5.54931640625, -5.2392578125, -4.92919921875, -4.619140625, -4.30908203125, -3.9990234375, -3.68896484375, -3.37890625, -3.06884765625, -2.7587890625, -2.44873046875, -2.138671875, -1.82861328125, -1.5185546875, -1.20849609375, -0.8984375, -0.58837890625, -0.2783203125, 0.03173828125, 0.341796875, 0.65185546875, 0.9619140625, 1.27197265625, 1.58203125, 1.89208984375, 2.2021484375, 2.51220703125, 2.822265625, 3.13232421875, 3.4423828125, 3.75244140625, 4.0625, 4.37255859375, 4.6826171875, 4.99267578125, 5.302734375, 5.61279296875, 5.9228515625, 6.23291015625, 6.54296875, 6.85302734375, 7.1630859375, 7.47314453125, 7.783203125, 8.09326171875, 8.4033203125, 8.71337890625, 9.0234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 14.0, 18.0, 16.0, 27.0, 42.0, 44.0, 77.0, 115.0, 170.0, 255.0, 442.0, 814.0, 1865.0, 5990.0, 31811.0, 339280.0, 600206.0, 53926.0, 8566.0, 2526.0, 938.0, 498.0, 286.0, 193.0, 127.0, 73.0, 55.0, 52.0, 30.0, 16.0, 19.0, 13.0, 8.0, 8.0, 7.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.625, -45.126953125, -43.62890625, -42.130859375, -40.6328125, -39.134765625, -37.63671875, -36.138671875, -34.640625, -33.142578125, -31.64453125, -30.146484375, -28.6484375, -27.150390625, -25.65234375, -24.154296875, -22.65625, -21.158203125, -19.66015625, -18.162109375, -16.6640625, -15.166015625, -13.66796875, -12.169921875, -10.671875, -9.173828125, -7.67578125, -6.177734375, -4.6796875, -3.181640625, -1.68359375, -0.185546875, 1.3125, 2.810546875, 4.30859375, 5.806640625, 7.3046875, 8.802734375, 10.30078125, 11.798828125, 13.296875, 14.794921875, 16.29296875, 17.791015625, 19.2890625, 20.787109375, 22.28515625, 23.783203125, 25.28125, 26.779296875, 28.27734375, 29.775390625, 31.2734375, 32.771484375, 34.26953125, 35.767578125, 37.265625, 38.763671875, 40.26171875, 41.759765625, 43.2578125, 44.755859375, 46.25390625, 47.751953125, 49.25]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 11.0, 16.0, 22.0, 16.0, 15.0, 23.0, 29.0, 30.0, 27.0, 27.0, 33.0, 29.0, 41.0, 47.0, 51.0, 48.0, 38.0, 47.0, 56.0, 52.0, 48.0, 38.0, 24.0, 37.0, 29.0, 30.0, 12.0, 16.0, 18.0, 18.0, 10.0, 7.0, 9.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-45.1875, -43.9326171875, -42.677734375, -41.4228515625, -40.16796875, -38.9130859375, -37.658203125, -36.4033203125, -35.1484375, -33.8935546875, -32.638671875, -31.3837890625, -30.12890625, -28.8740234375, -27.619140625, -26.3642578125, -25.109375, -23.8544921875, -22.599609375, -21.3447265625, -20.08984375, -18.8349609375, -17.580078125, -16.3251953125, -15.0703125, -13.8154296875, -12.560546875, -11.3056640625, -10.05078125, -8.7958984375, -7.541015625, -6.2861328125, -5.03125, -3.7763671875, -2.521484375, -1.2666015625, -0.01171875, 1.2431640625, 2.498046875, 3.7529296875, 5.0078125, 6.2626953125, 7.517578125, 8.7724609375, 10.02734375, 11.2822265625, 12.537109375, 13.7919921875, 15.046875, 16.3017578125, 17.556640625, 18.8115234375, 20.06640625, 21.3212890625, 22.576171875, 23.8310546875, 25.0859375, 26.3408203125, 27.595703125, 28.8505859375, 30.10546875, 31.3603515625, 32.615234375, 33.8701171875, 35.125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 11.0, 21.0, 15.0, 35.0, 38.0, 64.0, 89.0, 129.0, 210.0, 328.0, 523.0, 1007.0, 2122.0, 4875.0, 13264.0, 44023.0, 177114.0, 584329.0, 158966.0, 39975.0, 12414.0, 4636.0, 1956.0, 1004.0, 494.0, 283.0, 192.0, 123.0, 73.0, 62.0, 43.0, 28.0, 16.0, 21.0, 9.0, 10.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-10.71875, -10.41650390625, -10.1142578125, -9.81201171875, -9.509765625, -9.20751953125, -8.9052734375, -8.60302734375, -8.30078125, -7.99853515625, -7.6962890625, -7.39404296875, -7.091796875, -6.78955078125, -6.4873046875, -6.18505859375, -5.8828125, -5.58056640625, -5.2783203125, -4.97607421875, -4.673828125, -4.37158203125, -4.0693359375, -3.76708984375, -3.46484375, -3.16259765625, -2.8603515625, -2.55810546875, -2.255859375, -1.95361328125, -1.6513671875, -1.34912109375, -1.046875, -0.74462890625, -0.4423828125, -0.14013671875, 0.162109375, 0.46435546875, 0.7666015625, 1.06884765625, 1.37109375, 1.67333984375, 1.9755859375, 2.27783203125, 2.580078125, 2.88232421875, 3.1845703125, 3.48681640625, 3.7890625, 4.09130859375, 4.3935546875, 4.69580078125, 4.998046875, 5.30029296875, 5.6025390625, 5.90478515625, 6.20703125, 6.50927734375, 6.8115234375, 7.11376953125, 7.416015625, 7.71826171875, 8.0205078125, 8.32275390625, 8.625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 7.0, 9.0, 21.0, 19.0, 33.0, 56.0, 57.0, 83.0, 198.0, 179.0, 95.0, 69.0, 45.0, 25.0, 25.0, 18.0, 9.0, 11.0, 5.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00411224365234375, -0.004006743431091309, -0.003901243209838867, -0.0037957429885864258, -0.0036902427673339844, -0.003584742546081543, -0.0034792423248291016, -0.00337374210357666, -0.0032682418823242188, -0.0031627416610717773, -0.003057241439819336, -0.0029517412185668945, -0.002846240997314453, -0.0027407407760620117, -0.0026352405548095703, -0.002529740333557129, -0.0024242401123046875, -0.002318739891052246, -0.0022132396697998047, -0.0021077394485473633, -0.002002239227294922, -0.0018967390060424805, -0.001791238784790039, -0.0016857385635375977, -0.0015802383422851562, -0.0014747381210327148, -0.0013692378997802734, -0.001263737678527832, -0.0011582374572753906, -0.0010527372360229492, -0.0009472370147705078, -0.0008417367935180664, -0.000736236572265625, -0.0006307363510131836, -0.0005252361297607422, -0.0004197359085083008, -0.0003142356872558594, -0.00020873546600341797, -0.00010323524475097656, 2.2649765014648438e-06, 0.00010776519775390625, 0.00021326541900634766, 0.00031876564025878906, 0.00042426586151123047, 0.0005297660827636719, 0.0006352663040161133, 0.0007407665252685547, 0.0008462667465209961, 0.0009517669677734375, 0.001057267189025879, 0.0011627674102783203, 0.0012682676315307617, 0.0013737678527832031, 0.0014792680740356445, 0.001584768295288086, 0.0016902685165405273, 0.0017957687377929688, 0.0019012689590454102, 0.0020067691802978516, 0.002112269401550293, 0.0022177696228027344, 0.0023232698440551758, 0.002428770065307617, 0.0025342702865600586, 0.0026397705078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 12.0, 19.0, 39.0, 42.0, 66.0, 98.0, 153.0, 292.0, 527.0, 1187.0, 3305.0, 12039.0, 72217.0, 683106.0, 238393.0, 27326.0, 6133.0, 1895.0, 746.0, 347.0, 190.0, 107.0, 71.0, 53.0, 40.0, 36.0, 20.0, 15.0, 10.0, 6.0, 4.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.6875, -16.177978515625, -15.66845703125, -15.158935546875, -14.6494140625, -14.139892578125, -13.63037109375, -13.120849609375, -12.611328125, -12.101806640625, -11.59228515625, -11.082763671875, -10.5732421875, -10.063720703125, -9.55419921875, -9.044677734375, -8.53515625, -8.025634765625, -7.51611328125, -7.006591796875, -6.4970703125, -5.987548828125, -5.47802734375, -4.968505859375, -4.458984375, -3.949462890625, -3.43994140625, -2.930419921875, -2.4208984375, -1.911376953125, -1.40185546875, -0.892333984375, -0.3828125, 0.126708984375, 0.63623046875, 1.145751953125, 1.6552734375, 2.164794921875, 2.67431640625, 3.183837890625, 3.693359375, 4.202880859375, 4.71240234375, 5.221923828125, 5.7314453125, 6.240966796875, 6.75048828125, 7.260009765625, 7.76953125, 8.279052734375, 8.78857421875, 9.298095703125, 9.8076171875, 10.317138671875, 10.82666015625, 11.336181640625, 11.845703125, 12.355224609375, 12.86474609375, 13.374267578125, 13.8837890625, 14.393310546875, 14.90283203125, 15.412353515625, 15.921875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 6.0, 3.0, 4.0, 12.0, 10.0, 9.0, 20.0, 16.0, 26.0, 34.0, 52.0, 49.0, 71.0, 81.0, 93.0, 113.0, 79.0, 57.0, 67.0, 47.0, 32.0, 22.0, 27.0, 15.0, 10.0, 6.0, 11.0, 2.0, 5.0, 6.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3203125, -13.9244384765625, -13.528564453125, -13.1326904296875, -12.73681640625, -12.3409423828125, -11.945068359375, -11.5491943359375, -11.1533203125, -10.7574462890625, -10.361572265625, -9.9656982421875, -9.56982421875, -9.1739501953125, -8.778076171875, -8.3822021484375, -7.986328125, -7.5904541015625, -7.194580078125, -6.7987060546875, -6.40283203125, -6.0069580078125, -5.611083984375, -5.2152099609375, -4.8193359375, -4.4234619140625, -4.027587890625, -3.6317138671875, -3.23583984375, -2.8399658203125, -2.444091796875, -2.0482177734375, -1.65234375, -1.2564697265625, -0.860595703125, -0.4647216796875, -0.06884765625, 0.3270263671875, 0.722900390625, 1.1187744140625, 1.5146484375, 1.9105224609375, 2.306396484375, 2.7022705078125, 3.09814453125, 3.4940185546875, 3.889892578125, 4.2857666015625, 4.681640625, 5.0775146484375, 5.473388671875, 5.8692626953125, 6.26513671875, 6.6610107421875, 7.056884765625, 7.4527587890625, 7.8486328125, 8.2445068359375, 8.640380859375, 9.0362548828125, 9.43212890625, 9.8280029296875, 10.223876953125, 10.6197509765625, 11.015625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 12.0, 25.0, 42.0, 63.0, 101.0, 128.0, 147.0, 122.0, 101.0, 93.0, 48.0, 42.0, 27.0, 16.0, 12.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-323.1836242675781, -314.6053161621094, -306.0269775390625, -297.44866943359375, -288.870361328125, -280.29205322265625, -271.7137451171875, -263.1354064941406, -254.55709838867188, -245.97879028320312, -237.4004669189453, -228.8221435546875, -220.24383544921875, -211.66552734375, -203.0872039794922, -194.50888061523438, -185.93057250976562, -177.35226440429688, -168.77394104003906, -160.19561767578125, -151.6173095703125, -143.03900146484375, -134.46067810058594, -125.88236236572266, -117.30404663085938, -108.7257308959961, -100.14741516113281, -91.56909942626953, -82.99078369140625, -74.41246795654297, -65.83415222167969, -57.255836486816406, -48.67755126953125, -40.09923553466797, -31.520919799804688, -22.942604064941406, -14.364288330078125, -5.785972595214844, 2.7923431396484375, 11.370658874511719, 19.948974609375, 28.52729034423828, 37.10560607910156, 45.683921813964844, 54.262237548828125, 62.840553283691406, 71.41886901855469, 79.99718475341797, 88.57550048828125, 97.15381622314453, 105.73213195800781, 114.3104476928711, 122.88876342773438, 131.46707153320312, 140.04539489746094, 148.62371826171875, 157.2020263671875, 165.78033447265625, 174.35865783691406, 182.93698120117188, 191.51528930664062, 200.09359741210938, 208.6719207763672, 217.250244140625, 225.82855224609375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 7.0, 6.0, 10.0, 15.0, 13.0, 11.0, 14.0, 29.0, 22.0, 31.0, 39.0, 44.0, 45.0, 56.0, 57.0, 56.0, 55.0, 67.0, 55.0, 43.0, 47.0, 37.0, 34.0, 34.0, 34.0, 26.0, 25.0, 15.0, 14.0, 16.0, 13.0, 8.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.02838134765625, -204.46856689453125, -197.90875244140625, -191.34893798828125, -184.78912353515625, -178.22930908203125, -171.66949462890625, -165.10968017578125, -158.54986572265625, -151.99005126953125, -145.43023681640625, -138.87042236328125, -132.31060791015625, -125.75079345703125, -119.19097900390625, -112.63116455078125, -106.07135772705078, -99.51154327392578, -92.95172882080078, -86.39191436767578, -79.83209991455078, -73.27229309082031, -66.71247863769531, -60.15266036987305, -53.59284591674805, -47.03303146362305, -40.47321701049805, -33.91340637207031, -27.35359001159668, -20.793777465820312, -14.233963012695312, -7.6741485595703125, -1.1143341064453125, 5.445479869842529, 12.005293846130371, 18.565107345581055, 25.124921798706055, 31.684734344482422, 38.24454879760742, 44.80436325073242, 51.36417770385742, 57.92399215698242, 64.48380279541016, 71.04361724853516, 77.60343170166016, 84.16324615478516, 90.72306060791016, 97.28287506103516, 103.84268951416016, 110.40250396728516, 116.96231842041016, 123.52213287353516, 130.08193969726562, 136.64175415039062, 143.20156860351562, 149.76138305664062, 156.32119750976562, 162.88101196289062, 169.44082641601562, 176.00064086914062, 182.56045532226562, 189.12026977539062, 195.68008422851562, 202.23989868164062, 208.79971313476562]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 13.0, 9.0, 13.0, 18.0, 33.0, 40.0, 40.0, 92.0, 106.0, 187.0, 310.0, 590.0, 1064.0, 2054.0, 4515.0, 10056.0, 25994.0, 80283.0, 558579.0, 3138987.0, 277329.0, 58158.0, 20265.0, 8218.0, 3666.0, 1715.0, 878.0, 487.0, 239.0, 128.0, 73.0, 44.0, 35.0, 20.0, 13.0, 8.0, 5.0, 9.0, 2.0, 1.0], "bins": [-28.28125, -27.6290283203125, -26.976806640625, -26.3245849609375, -25.67236328125, -25.0201416015625, -24.367919921875, -23.7156982421875, -23.0634765625, -22.4112548828125, -21.759033203125, -21.1068115234375, -20.45458984375, -19.8023681640625, -19.150146484375, -18.4979248046875, -17.845703125, -17.1934814453125, -16.541259765625, -15.8890380859375, -15.23681640625, -14.5845947265625, -13.932373046875, -13.2801513671875, -12.6279296875, -11.9757080078125, -11.323486328125, -10.6712646484375, -10.01904296875, -9.3668212890625, -8.714599609375, -8.0623779296875, -7.41015625, -6.7579345703125, -6.105712890625, -5.4534912109375, -4.80126953125, -4.1490478515625, -3.496826171875, -2.8446044921875, -2.1923828125, -1.5401611328125, -0.887939453125, -0.2357177734375, 0.41650390625, 1.0687255859375, 1.720947265625, 2.3731689453125, 3.025390625, 3.6776123046875, 4.329833984375, 4.9820556640625, 5.63427734375, 6.2864990234375, 6.938720703125, 7.5909423828125, 8.2431640625, 8.8953857421875, 9.547607421875, 10.1998291015625, 10.85205078125, 11.5042724609375, 12.156494140625, 12.8087158203125, 13.4609375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 12.0, 15.0, 10.0, 25.0, 36.0, 34.0, 61.0, 68.0, 106.0, 95.0, 96.0, 90.0, 89.0, 66.0, 67.0, 44.0, 33.0, 16.0, 19.0, 11.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.46875, -25.9085693359375, -25.348388671875, -24.7882080078125, -24.22802734375, -23.6678466796875, -23.107666015625, -22.5474853515625, -21.9873046875, -21.4271240234375, -20.866943359375, -20.3067626953125, -19.74658203125, -19.1864013671875, -18.626220703125, -18.0660400390625, -17.505859375, -16.9456787109375, -16.385498046875, -15.8253173828125, -15.26513671875, -14.7049560546875, -14.144775390625, -13.5845947265625, -13.0244140625, -12.4642333984375, -11.904052734375, -11.3438720703125, -10.78369140625, -10.2235107421875, -9.663330078125, -9.1031494140625, -8.54296875, -7.9827880859375, -7.422607421875, -6.8624267578125, -6.30224609375, -5.7420654296875, -5.181884765625, -4.6217041015625, -4.0615234375, -3.5013427734375, -2.941162109375, -2.3809814453125, -1.82080078125, -1.2606201171875, -0.700439453125, -0.1402587890625, 0.419921875, 0.9801025390625, 1.540283203125, 2.1004638671875, 2.66064453125, 3.2208251953125, 3.781005859375, 4.3411865234375, 4.9013671875, 5.4615478515625, 6.021728515625, 6.5819091796875, 7.14208984375, 7.7022705078125, 8.262451171875, 8.8226318359375, 9.3828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 7.0, 14.0, 17.0, 27.0, 42.0, 67.0, 162.0, 292.0, 706.0, 1807.0, 5597.0, 21024.0, 128700.0, 3454732.0, 520909.0, 44914.0, 10075.0, 2995.0, 1183.0, 480.0, 223.0, 125.0, 68.0, 33.0, 20.0, 14.0, 9.0, 14.0, 7.0, 4.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.4375, -27.33251953125, -26.2275390625, -25.12255859375, -24.017578125, -22.91259765625, -21.8076171875, -20.70263671875, -19.59765625, -18.49267578125, -17.3876953125, -16.28271484375, -15.177734375, -14.07275390625, -12.9677734375, -11.86279296875, -10.7578125, -9.65283203125, -8.5478515625, -7.44287109375, -6.337890625, -5.23291015625, -4.1279296875, -3.02294921875, -1.91796875, -0.81298828125, 0.2919921875, 1.39697265625, 2.501953125, 3.60693359375, 4.7119140625, 5.81689453125, 6.921875, 8.02685546875, 9.1318359375, 10.23681640625, 11.341796875, 12.44677734375, 13.5517578125, 14.65673828125, 15.76171875, 16.86669921875, 17.9716796875, 19.07666015625, 20.181640625, 21.28662109375, 22.3916015625, 23.49658203125, 24.6015625, 25.70654296875, 26.8115234375, 27.91650390625, 29.021484375, 30.12646484375, 31.2314453125, 32.33642578125, 33.44140625, 34.54638671875, 35.6513671875, 36.75634765625, 37.861328125, 38.96630859375, 40.0712890625, 41.17626953125, 42.28125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 8.0, 8.0, 12.0, 11.0, 20.0, 25.0, 37.0, 55.0, 87.0, 142.0, 310.0, 651.0, 1208.0, 707.0, 346.0, 146.0, 101.0, 68.0, 44.0, 26.0, 13.0, 10.0, 8.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.625, -32.591796875, -31.55859375, -30.525390625, -29.4921875, -28.458984375, -27.42578125, -26.392578125, -25.359375, -24.326171875, -23.29296875, -22.259765625, -21.2265625, -20.193359375, -19.16015625, -18.126953125, -17.09375, -16.060546875, -15.02734375, -13.994140625, -12.9609375, -11.927734375, -10.89453125, -9.861328125, -8.828125, -7.794921875, -6.76171875, -5.728515625, -4.6953125, -3.662109375, -2.62890625, -1.595703125, -0.5625, 0.470703125, 1.50390625, 2.537109375, 3.5703125, 4.603515625, 5.63671875, 6.669921875, 7.703125, 8.736328125, 9.76953125, 10.802734375, 11.8359375, 12.869140625, 13.90234375, 14.935546875, 15.96875, 17.001953125, 18.03515625, 19.068359375, 20.1015625, 21.134765625, 22.16796875, 23.201171875, 24.234375, 25.267578125, 26.30078125, 27.333984375, 28.3671875, 29.400390625, 30.43359375, 31.466796875, 32.5]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 9.0, 19.0, 29.0, 46.0, 60.0, 107.0, 128.0, 173.0, 149.0, 100.0, 66.0, 39.0, 21.0, 9.0, 5.0, 7.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-175.53738403320312, -168.53370666503906, -161.53001403808594, -154.52633666992188, -147.5226593017578, -140.5189666748047, -133.51528930664062, -126.51160430908203, -119.50791931152344, -112.50423431396484, -105.50055694580078, -98.49687194824219, -91.4931869506836, -84.489501953125, -77.48582458496094, -70.48213958740234, -63.47846221923828, -56.47478103637695, -49.47109603881836, -42.46741485595703, -35.46372985839844, -28.46004867553711, -21.45636749267578, -14.452682495117188, -7.449001312255859, -0.44531869888305664, 6.558363914489746, 13.56204605102539, 20.56572914123535, 27.569412231445312, 34.57309341430664, 41.576778411865234, 48.58045959472656, 55.58414077758789, 62.587825775146484, 69.59150695800781, 76.5951919555664, 83.598876953125, 90.60255432128906, 97.60623931884766, 104.60992431640625, 111.61360931396484, 118.6172866821289, 125.6209716796875, 132.62464904785156, 139.6283416748047, 146.63201904296875, 153.63571166992188, 160.63937377929688, 167.64305114746094, 174.64674377441406, 181.65042114257812, 188.6540985107422, 195.6577911376953, 202.66146850585938, 209.6651611328125, 216.66883850097656, 223.67251586914062, 230.67620849609375, 237.6798858642578, 244.68356323242188, 251.687255859375, 258.69091796875, 265.6946105957031, 272.69830322265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 9.0, 7.0, 9.0, 18.0, 21.0, 19.0, 27.0, 41.0, 33.0, 41.0, 56.0, 55.0, 56.0, 58.0, 71.0, 66.0, 42.0, 52.0, 61.0, 45.0, 33.0, 39.0, 27.0, 23.0, 24.0, 13.0, 18.0, 11.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.96173095703125, -142.18417358398438, -137.4066162109375, -132.62905883789062, -127.85150146484375, -123.07394409179688, -118.29638671875, -113.51882934570312, -108.74127197265625, -103.96371459960938, -99.1861572265625, -94.40859985351562, -89.63104248046875, -84.85348510742188, -80.075927734375, -75.29837036132812, -70.52080535888672, -65.74324798583984, -60.96569061279297, -56.188133239746094, -51.41057586669922, -46.633018493652344, -41.8554573059082, -37.07789993286133, -32.30034255981445, -27.522785186767578, -22.745227813720703, -17.967668533325195, -13.19011116027832, -8.412553787231445, -3.6349945068359375, 1.1425628662109375, 5.9201202392578125, 10.697677612304688, 15.475235939025879, 20.25279426574707, 25.030351638793945, 29.80790901184082, 34.58546829223633, 39.3630256652832, 44.14058303833008, 48.91814041137695, 53.69569778442383, 58.47325897216797, 63.250816345214844, 68.02837371826172, 72.8059310913086, 77.58348846435547, 82.36104583740234, 87.13860321044922, 91.9161605834961, 96.69371795654297, 101.47127532958984, 106.24883270263672, 111.02639770507812, 115.803955078125, 120.58151245117188, 125.35906982421875, 130.13662719726562, 134.9141845703125, 139.69174194335938, 144.46929931640625, 149.24685668945312, 154.0244140625, 158.80197143554688]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 7.0, 15.0, 17.0, 35.0, 45.0, 62.0, 139.0, 216.0, 408.0, 765.0, 1281.0, 2781.0, 5798.0, 13661.0, 34182.0, 94420.0, 314450.0, 388709.0, 119561.0, 42097.0, 16246.0, 7066.0, 3191.0, 1527.0, 814.0, 444.0, 234.0, 137.0, 87.0, 57.0, 40.0, 22.0, 14.0, 7.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.625, -22.865478515625, -22.10595703125, -21.346435546875, -20.5869140625, -19.827392578125, -19.06787109375, -18.308349609375, -17.548828125, -16.789306640625, -16.02978515625, -15.270263671875, -14.5107421875, -13.751220703125, -12.99169921875, -12.232177734375, -11.47265625, -10.713134765625, -9.95361328125, -9.194091796875, -8.4345703125, -7.675048828125, -6.91552734375, -6.156005859375, -5.396484375, -4.636962890625, -3.87744140625, -3.117919921875, -2.3583984375, -1.598876953125, -0.83935546875, -0.079833984375, 0.6796875, 1.439208984375, 2.19873046875, 2.958251953125, 3.7177734375, 4.477294921875, 5.23681640625, 5.996337890625, 6.755859375, 7.515380859375, 8.27490234375, 9.034423828125, 9.7939453125, 10.553466796875, 11.31298828125, 12.072509765625, 12.83203125, 13.591552734375, 14.35107421875, 15.110595703125, 15.8701171875, 16.629638671875, 17.38916015625, 18.148681640625, 18.908203125, 19.667724609375, 20.42724609375, 21.186767578125, 21.9462890625, 22.705810546875, 23.46533203125, 24.224853515625, 24.984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 10.0, 6.0, 9.0, 16.0, 14.0, 21.0, 26.0, 30.0, 38.0, 41.0, 57.0, 58.0, 80.0, 65.0, 61.0, 56.0, 57.0, 56.0, 54.0, 46.0, 46.0, 39.0, 35.0, 21.0, 9.0, 12.0, 10.0, 8.0, 4.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.4296875, -15.057373046875, -14.68505859375, -14.312744140625, -13.9404296875, -13.568115234375, -13.19580078125, -12.823486328125, -12.451171875, -12.078857421875, -11.70654296875, -11.334228515625, -10.9619140625, -10.589599609375, -10.21728515625, -9.844970703125, -9.47265625, -9.100341796875, -8.72802734375, -8.355712890625, -7.9833984375, -7.611083984375, -7.23876953125, -6.866455078125, -6.494140625, -6.121826171875, -5.74951171875, -5.377197265625, -5.0048828125, -4.632568359375, -4.26025390625, -3.887939453125, -3.515625, -3.143310546875, -2.77099609375, -2.398681640625, -2.0263671875, -1.654052734375, -1.28173828125, -0.909423828125, -0.537109375, -0.164794921875, 0.20751953125, 0.579833984375, 0.9521484375, 1.324462890625, 1.69677734375, 2.069091796875, 2.44140625, 2.813720703125, 3.18603515625, 3.558349609375, 3.9306640625, 4.302978515625, 4.67529296875, 5.047607421875, 5.419921875, 5.792236328125, 6.16455078125, 6.536865234375, 6.9091796875, 7.281494140625, 7.65380859375, 8.026123046875, 8.3984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 4.0, 3.0, 9.0, 15.0, 18.0, 23.0, 32.0, 38.0, 73.0, 108.0, 150.0, 267.0, 498.0, 1234.0, 3812.0, 24015.0, 668599.0, 328827.0, 15663.0, 2914.0, 1011.0, 462.0, 276.0, 145.0, 106.0, 87.0, 52.0, 36.0, 29.0, 11.0, 13.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.53125, -54.57568359375, -52.6201171875, -50.66455078125, -48.708984375, -46.75341796875, -44.7978515625, -42.84228515625, -40.88671875, -38.93115234375, -36.9755859375, -35.02001953125, -33.064453125, -31.10888671875, -29.1533203125, -27.19775390625, -25.2421875, -23.28662109375, -21.3310546875, -19.37548828125, -17.419921875, -15.46435546875, -13.5087890625, -11.55322265625, -9.59765625, -7.64208984375, -5.6865234375, -3.73095703125, -1.775390625, 0.18017578125, 2.1357421875, 4.09130859375, 6.046875, 8.00244140625, 9.9580078125, 11.91357421875, 13.869140625, 15.82470703125, 17.7802734375, 19.73583984375, 21.69140625, 23.64697265625, 25.6025390625, 27.55810546875, 29.513671875, 31.46923828125, 33.4248046875, 35.38037109375, 37.3359375, 39.29150390625, 41.2470703125, 43.20263671875, 45.158203125, 47.11376953125, 49.0693359375, 51.02490234375, 52.98046875, 54.93603515625, 56.8916015625, 58.84716796875, 60.802734375, 62.75830078125, 64.7138671875, 66.66943359375, 68.625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 13.0, 9.0, 15.0, 23.0, 24.0, 26.0, 35.0, 38.0, 32.0, 43.0, 55.0, 51.0, 48.0, 51.0, 61.0, 46.0, 58.0, 55.0, 46.0, 45.0, 39.0, 24.0, 25.0, 25.0, 22.0, 14.0, 13.0, 14.0, 8.0, 7.0, 10.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-48.65625, -47.298828125, -45.94140625, -44.583984375, -43.2265625, -41.869140625, -40.51171875, -39.154296875, -37.796875, -36.439453125, -35.08203125, -33.724609375, -32.3671875, -31.009765625, -29.65234375, -28.294921875, -26.9375, -25.580078125, -24.22265625, -22.865234375, -21.5078125, -20.150390625, -18.79296875, -17.435546875, -16.078125, -14.720703125, -13.36328125, -12.005859375, -10.6484375, -9.291015625, -7.93359375, -6.576171875, -5.21875, -3.861328125, -2.50390625, -1.146484375, 0.2109375, 1.568359375, 2.92578125, 4.283203125, 5.640625, 6.998046875, 8.35546875, 9.712890625, 11.0703125, 12.427734375, 13.78515625, 15.142578125, 16.5, 17.857421875, 19.21484375, 20.572265625, 21.9296875, 23.287109375, 24.64453125, 26.001953125, 27.359375, 28.716796875, 30.07421875, 31.431640625, 32.7890625, 34.146484375, 35.50390625, 36.861328125, 38.21875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 6.0, 5.0, 11.0, 7.0, 11.0, 10.0, 26.0, 36.0, 36.0, 79.0, 135.0, 217.0, 512.0, 1391.0, 4739.0, 28253.0, 597664.0, 385559.0, 23670.0, 4000.0, 1190.0, 460.0, 219.0, 118.0, 79.0, 36.0, 22.0, 17.0, 12.0, 9.0, 4.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0, -16.391845703125, -15.78369140625, -15.175537109375, -14.5673828125, -13.959228515625, -13.35107421875, -12.742919921875, -12.134765625, -11.526611328125, -10.91845703125, -10.310302734375, -9.7021484375, -9.093994140625, -8.48583984375, -7.877685546875, -7.26953125, -6.661376953125, -6.05322265625, -5.445068359375, -4.8369140625, -4.228759765625, -3.62060546875, -3.012451171875, -2.404296875, -1.796142578125, -1.18798828125, -0.579833984375, 0.0283203125, 0.636474609375, 1.24462890625, 1.852783203125, 2.4609375, 3.069091796875, 3.67724609375, 4.285400390625, 4.8935546875, 5.501708984375, 6.10986328125, 6.718017578125, 7.326171875, 7.934326171875, 8.54248046875, 9.150634765625, 9.7587890625, 10.366943359375, 10.97509765625, 11.583251953125, 12.19140625, 12.799560546875, 13.40771484375, 14.015869140625, 14.6240234375, 15.232177734375, 15.84033203125, 16.448486328125, 17.056640625, 17.664794921875, 18.27294921875, 18.881103515625, 19.4892578125, 20.097412109375, 20.70556640625, 21.313720703125, 21.921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 15.0, 17.0, 14.0, 32.0, 32.0, 42.0, 83.0, 166.0, 252.0, 111.0, 68.0, 38.0, 20.0, 35.0, 11.0, 17.0, 10.0, 11.0, 4.0, 7.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024356842041015625, -0.002326756715774536, -0.0022178292274475098, -0.0021089017391204834, -0.001999974250793457, -0.0018910467624664307, -0.0017821192741394043, -0.001673191785812378, -0.0015642642974853516, -0.0014553368091583252, -0.0013464093208312988, -0.0012374818325042725, -0.001128554344177246, -0.0010196268558502197, -0.0009106993675231934, -0.000801771879196167, -0.0006928443908691406, -0.0005839169025421143, -0.0004749894142150879, -0.0003660619258880615, -0.00025713443756103516, -0.0001482069492340088, -3.927946090698242e-05, 6.964802742004395e-05, 0.0001785755157470703, 0.0002875030040740967, 0.00039643049240112305, 0.0005053579807281494, 0.0006142854690551758, 0.0007232129573822021, 0.0008321404457092285, 0.0009410679340362549, 0.0010499954223632812, 0.0011589229106903076, 0.001267850399017334, 0.0013767778873443604, 0.0014857053756713867, 0.001594632863998413, 0.0017035603523254395, 0.0018124878406524658, 0.0019214153289794922, 0.0020303428173065186, 0.002139270305633545, 0.0022481977939605713, 0.0023571252822875977, 0.002466052770614624, 0.0025749802589416504, 0.0026839077472686768, 0.002792835235595703, 0.0029017627239227295, 0.003010690212249756, 0.0031196177005767822, 0.0032285451889038086, 0.003337472677230835, 0.0034464001655578613, 0.0035553276538848877, 0.003664255142211914, 0.0037731826305389404, 0.003882110118865967, 0.003991037607192993, 0.0040999650955200195, 0.004208892583847046, 0.004317820072174072, 0.004426747560501099, 0.004535675048828125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 8.0, 5.0, 7.0, 11.0, 15.0, 17.0, 30.0, 79.0, 105.0, 163.0, 369.0, 807.0, 2690.0, 17775.0, 662528.0, 347841.0, 12518.0, 2184.0, 670.0, 332.0, 150.0, 79.0, 62.0, 36.0, 21.0, 21.0, 16.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.69189453125, -15.9306640625, -15.16943359375, -14.408203125, -13.64697265625, -12.8857421875, -12.12451171875, -11.36328125, -10.60205078125, -9.8408203125, -9.07958984375, -8.318359375, -7.55712890625, -6.7958984375, -6.03466796875, -5.2734375, -4.51220703125, -3.7509765625, -2.98974609375, -2.228515625, -1.46728515625, -0.7060546875, 0.05517578125, 0.81640625, 1.57763671875, 2.3388671875, 3.10009765625, 3.861328125, 4.62255859375, 5.3837890625, 6.14501953125, 6.90625, 7.66748046875, 8.4287109375, 9.18994140625, 9.951171875, 10.71240234375, 11.4736328125, 12.23486328125, 12.99609375, 13.75732421875, 14.5185546875, 15.27978515625, 16.041015625, 16.80224609375, 17.5634765625, 18.32470703125, 19.0859375, 19.84716796875, 20.6083984375, 21.36962890625, 22.130859375, 22.89208984375, 23.6533203125, 24.41455078125, 25.17578125, 25.93701171875, 26.6982421875, 27.45947265625, 28.220703125, 28.98193359375, 29.7431640625, 30.50439453125, 31.265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 6.0, 5.0, 13.0, 10.0, 16.0, 14.0, 28.0, 30.0, 44.0, 49.0, 50.0, 64.0, 69.0, 75.0, 74.0, 73.0, 60.0, 53.0, 49.0, 44.0, 20.0, 22.0, 29.0, 13.0, 12.0, 11.0, 9.0, 8.0, 5.0, 2.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.5390625, -9.2216796875, -8.904296875, -8.5869140625, -8.26953125, -7.9521484375, -7.634765625, -7.3173828125, -7.0, -6.6826171875, -6.365234375, -6.0478515625, -5.73046875, -5.4130859375, -5.095703125, -4.7783203125, -4.4609375, -4.1435546875, -3.826171875, -3.5087890625, -3.19140625, -2.8740234375, -2.556640625, -2.2392578125, -1.921875, -1.6044921875, -1.287109375, -0.9697265625, -0.65234375, -0.3349609375, -0.017578125, 0.2998046875, 0.6171875, 0.9345703125, 1.251953125, 1.5693359375, 1.88671875, 2.2041015625, 2.521484375, 2.8388671875, 3.15625, 3.4736328125, 3.791015625, 4.1083984375, 4.42578125, 4.7431640625, 5.060546875, 5.3779296875, 5.6953125, 6.0126953125, 6.330078125, 6.6474609375, 6.96484375, 7.2822265625, 7.599609375, 7.9169921875, 8.234375, 8.5517578125, 8.869140625, 9.1865234375, 9.50390625, 9.8212890625, 10.138671875, 10.4560546875, 10.7734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 13.0, 46.0, 177.0, 352.0, 276.0, 97.0, 28.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-759.293212890625, -741.135986328125, -722.978759765625, -704.821533203125, -686.664306640625, -668.507080078125, -650.349853515625, -632.1925659179688, -614.0353393554688, -595.8781127929688, -577.7208862304688, -559.5636596679688, -541.4064331054688, -523.2491455078125, -505.0919494628906, -486.9347229003906, -468.7774963378906, -450.6202697753906, -432.4630432128906, -414.3057861328125, -396.1485595703125, -377.9913330078125, -359.8341064453125, -341.6768798828125, -323.5196533203125, -305.3624267578125, -287.2052001953125, -269.0479736328125, -250.89071655273438, -232.73348999023438, -214.57626342773438, -196.41903686523438, -178.26177978515625, -160.10455322265625, -141.9473114013672, -123.79008483886719, -105.63285064697266, -87.47561645507812, -69.31838989257812, -51.161155700683594, -33.00392150878906, -14.846689224243164, 3.3105430603027344, 21.4677734375, 39.62500762939453, 57.78224182128906, 75.93946838378906, 94.0967025756836, 112.25393676757812, 130.41116333007812, 148.5684051513672, 166.7256317138672, 184.88287353515625, 203.04010009765625, 221.19732666015625, 239.35455322265625, 257.51177978515625, 275.66900634765625, 293.82623291015625, 311.98345947265625, 330.1407165527344, 348.2979431152344, 366.4551696777344, 384.6123962402344, 402.7696533203125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 6.0, 8.0, 17.0, 10.0, 11.0, 20.0, 20.0, 14.0, 37.0, 24.0, 26.0, 40.0, 35.0, 58.0, 47.0, 69.0, 64.0, 69.0, 67.0, 61.0, 41.0, 36.0, 37.0, 26.0, 34.0, 29.0, 20.0, 17.0, 12.0, 16.0, 11.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.42391967773438, -157.95399475097656, -152.48406982421875, -147.01414489746094, -141.54421997070312, -136.07431030273438, -130.60438537597656, -125.13446044921875, -119.66453552246094, -114.19461059570312, -108.72468566894531, -103.25476837158203, -97.78484344482422, -92.3149185180664, -86.84500122070312, -81.37507629394531, -75.9051513671875, -70.43522644042969, -64.96530151367188, -59.495384216308594, -54.02545928955078, -48.55553436279297, -43.08561325073242, -37.615692138671875, -32.14576721191406, -26.675844192504883, -21.205921173095703, -15.735998153686523, -10.266075134277344, -4.796152114868164, 0.6737709045410156, 6.1436920166015625, 11.613632202148438, 17.083555221557617, 22.553478240966797, 28.023401260375977, 33.493324279785156, 38.96324920654297, 44.433170318603516, 49.90309143066406, 55.373016357421875, 60.84294128417969, 66.3128662109375, 71.78278350830078, 77.2527084350586, 82.7226333618164, 88.19255065917969, 93.6624755859375, 99.13240051269531, 104.60232543945312, 110.07225036621094, 115.54216766357422, 121.01209259033203, 126.48201751708984, 131.95193481445312, 137.42185974121094, 142.89178466796875, 148.36170959472656, 153.83163452148438, 159.3015594482422, 164.771484375, 170.24139404296875, 175.71131896972656, 181.18124389648438, 186.6511688232422]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 12.0, 14.0, 16.0, 24.0, 41.0, 92.0, 161.0, 276.0, 478.0, 1049.0, 2305.0, 5380.0, 14836.0, 53818.0, 491048.0, 3361974.0, 208857.0, 35301.0, 10857.0, 4170.0, 1863.0, 806.0, 395.0, 198.0, 104.0, 85.0, 36.0, 30.0, 23.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.299072265625, -12.67626953125, -12.053466796875, -11.4306640625, -10.807861328125, -10.18505859375, -9.562255859375, -8.939453125, -8.316650390625, -7.69384765625, -7.071044921875, -6.4482421875, -5.825439453125, -5.20263671875, -4.579833984375, -3.95703125, -3.334228515625, -2.71142578125, -2.088623046875, -1.4658203125, -0.843017578125, -0.22021484375, 0.402587890625, 1.025390625, 1.648193359375, 2.27099609375, 2.893798828125, 3.5166015625, 4.139404296875, 4.76220703125, 5.385009765625, 6.0078125, 6.630615234375, 7.25341796875, 7.876220703125, 8.4990234375, 9.121826171875, 9.74462890625, 10.367431640625, 10.990234375, 11.613037109375, 12.23583984375, 12.858642578125, 13.4814453125, 14.104248046875, 14.72705078125, 15.349853515625, 15.97265625, 16.595458984375, 17.21826171875, 17.841064453125, 18.4638671875, 19.086669921875, 19.70947265625, 20.332275390625, 20.955078125, 21.577880859375, 22.20068359375, 22.823486328125, 23.4462890625, 24.069091796875, 24.69189453125, 25.314697265625, 25.9375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 14.0, 23.0, 22.0, 44.0, 41.0, 53.0, 78.0, 96.0, 87.0, 83.0, 96.0, 81.0, 79.0, 63.0, 41.0, 34.0, 18.0, 16.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -11.8736572265625, -11.364501953125, -10.8553466796875, -10.34619140625, -9.8370361328125, -9.327880859375, -8.8187255859375, -8.3095703125, -7.8004150390625, -7.291259765625, -6.7821044921875, -6.27294921875, -5.7637939453125, -5.254638671875, -4.7454833984375, -4.236328125, -3.7271728515625, -3.218017578125, -2.7088623046875, -2.19970703125, -1.6905517578125, -1.181396484375, -0.6722412109375, -0.1630859375, 0.3460693359375, 0.855224609375, 1.3643798828125, 1.87353515625, 2.3826904296875, 2.891845703125, 3.4010009765625, 3.91015625, 4.4193115234375, 4.928466796875, 5.4376220703125, 5.94677734375, 6.4559326171875, 6.965087890625, 7.4742431640625, 7.9833984375, 8.4925537109375, 9.001708984375, 9.5108642578125, 10.02001953125, 10.5291748046875, 11.038330078125, 11.5474853515625, 12.056640625, 12.5657958984375, 13.074951171875, 13.5841064453125, 14.09326171875, 14.6024169921875, 15.111572265625, 15.6207275390625, 16.1298828125, 16.6390380859375, 17.148193359375, 17.6573486328125, 18.16650390625, 18.6756591796875, 19.184814453125, 19.6939697265625, 20.203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 8.0, 8.0, 27.0, 34.0, 59.0, 82.0, 168.0, 283.0, 528.0, 1030.0, 2070.0, 4214.0, 9500.0, 24550.0, 80043.0, 532537.0, 3136640.0, 306742.0, 60038.0, 19922.0, 8037.0, 3787.0, 1865.0, 1007.0, 514.0, 230.0, 147.0, 88.0, 33.0, 28.0, 30.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.0921630859375, -14.473388671875, -13.8546142578125, -13.23583984375, -12.6170654296875, -11.998291015625, -11.3795166015625, -10.7607421875, -10.1419677734375, -9.523193359375, -8.9044189453125, -8.28564453125, -7.6668701171875, -7.048095703125, -6.4293212890625, -5.810546875, -5.1917724609375, -4.572998046875, -3.9542236328125, -3.33544921875, -2.7166748046875, -2.097900390625, -1.4791259765625, -0.8603515625, -0.2415771484375, 0.377197265625, 0.9959716796875, 1.61474609375, 2.2335205078125, 2.852294921875, 3.4710693359375, 4.08984375, 4.7086181640625, 5.327392578125, 5.9461669921875, 6.56494140625, 7.1837158203125, 7.802490234375, 8.4212646484375, 9.0400390625, 9.6588134765625, 10.277587890625, 10.8963623046875, 11.51513671875, 12.1339111328125, 12.752685546875, 13.3714599609375, 13.990234375, 14.6090087890625, 15.227783203125, 15.8465576171875, 16.46533203125, 17.0841064453125, 17.702880859375, 18.3216552734375, 18.9404296875, 19.5592041015625, 20.177978515625, 20.7967529296875, 21.41552734375, 22.0343017578125, 22.653076171875, 23.2718505859375, 23.890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 9.0, 13.0, 21.0, 12.0, 17.0, 39.0, 56.0, 56.0, 98.0, 166.0, 323.0, 592.0, 932.0, 724.0, 385.0, 197.0, 121.0, 79.0, 67.0, 32.0, 35.0, 16.0, 16.0, 7.0, 8.0, 6.0, 10.0, 5.0, 9.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-23.5, -22.822021484375, -22.14404296875, -21.466064453125, -20.7880859375, -20.110107421875, -19.43212890625, -18.754150390625, -18.076171875, -17.398193359375, -16.72021484375, -16.042236328125, -15.3642578125, -14.686279296875, -14.00830078125, -13.330322265625, -12.65234375, -11.974365234375, -11.29638671875, -10.618408203125, -9.9404296875, -9.262451171875, -8.58447265625, -7.906494140625, -7.228515625, -6.550537109375, -5.87255859375, -5.194580078125, -4.5166015625, -3.838623046875, -3.16064453125, -2.482666015625, -1.8046875, -1.126708984375, -0.44873046875, 0.229248046875, 0.9072265625, 1.585205078125, 2.26318359375, 2.941162109375, 3.619140625, 4.297119140625, 4.97509765625, 5.653076171875, 6.3310546875, 7.009033203125, 7.68701171875, 8.364990234375, 9.04296875, 9.720947265625, 10.39892578125, 11.076904296875, 11.7548828125, 12.432861328125, 13.11083984375, 13.788818359375, 14.466796875, 15.144775390625, 15.82275390625, 16.500732421875, 17.1787109375, 17.856689453125, 18.53466796875, 19.212646484375, 19.890625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 17.0, 22.0, 45.0, 80.0, 180.0, 240.0, 218.0, 103.0, 52.0, 18.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.85206604003906, -152.69747924804688, -144.54290771484375, -136.38832092285156, -128.23373413085938, -120.07915496826172, -111.92457580566406, -103.76998901367188, -95.61540985107422, -87.46083068847656, -79.30624389648438, -71.15166473388672, -62.9970817565918, -54.842498779296875, -46.68791961669922, -38.5333366394043, -30.378753662109375, -22.224170684814453, -14.069589614868164, -5.915008544921875, 2.239574432373047, 10.394157409667969, 18.548736572265625, 26.703319549560547, 34.85790252685547, 43.01248550415039, 51.16706848144531, 59.32164764404297, 67.47622680664062, 75.63081359863281, 83.78539276123047, 91.93997192382812, 100.09454345703125, 108.2491226196289, 116.4037094116211, 124.55828857421875, 132.71287536621094, 140.86746215820312, 149.02203369140625, 157.17662048339844, 165.33120727539062, 173.4857940673828, 181.64036560058594, 189.79495239257812, 197.9495391845703, 206.1041259765625, 214.25869750976562, 222.4132843017578, 230.56785583496094, 238.72244262695312, 246.87701416015625, 255.03160095214844, 263.1861877441406, 271.34075927734375, 279.495361328125, 287.6499328613281, 295.80450439453125, 303.9590759277344, 312.1136779785156, 320.26824951171875, 328.4228210449219, 336.5774230957031, 344.73199462890625, 352.8865661621094, 361.0411682128906]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 11.0, 16.0, 20.0, 10.0, 24.0, 21.0, 38.0, 29.0, 35.0, 47.0, 41.0, 54.0, 54.0, 58.0, 43.0, 54.0, 53.0, 44.0, 43.0, 40.0, 35.0, 35.0, 40.0, 22.0, 26.0, 15.0, 18.0, 16.0, 6.0, 9.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.60320281982422, -86.44063568115234, -83.278076171875, -80.11550903320312, -76.95294189453125, -73.79037475585938, -70.62781524658203, -67.46524810791016, -64.30268859863281, -61.1401252746582, -57.97755813598633, -54.81499481201172, -51.652427673339844, -48.489864349365234, -45.327301025390625, -42.16473388671875, -39.002166748046875, -35.839603424072266, -32.67703628540039, -29.51447296142578, -26.35190773010254, -23.189342498779297, -20.026779174804688, -16.864213943481445, -13.701648712158203, -10.539083480834961, -7.376519203186035, -4.213954925537109, -1.0513896942138672, 2.111175537109375, 5.273738861083984, 8.436304092407227, 11.598876953125, 14.761442184448242, 17.924007415771484, 21.086570739746094, 24.249135971069336, 27.411701202392578, 30.574264526367188, 33.73683166503906, 36.89939498901367, 40.06195831298828, 43.224525451660156, 46.387088775634766, 49.549652099609375, 52.71221923828125, 55.87478256225586, 59.03734588623047, 62.199913024902344, 65.36248016357422, 68.52503967285156, 71.68760681152344, 74.85017395019531, 78.01274108886719, 81.17530059814453, 84.3378677368164, 87.50042724609375, 90.66299438476562, 93.82555389404297, 96.98812103271484, 100.15068817138672, 103.31324768066406, 106.47581481933594, 109.63838195800781, 112.80094909667969]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 10.0, 17.0, 28.0, 28.0, 60.0, 111.0, 148.0, 239.0, 461.0, 704.0, 1258.0, 2415.0, 4740.0, 9606.0, 21042.0, 49490.0, 131982.0, 349189.0, 296176.0, 105110.0, 40957.0, 17641.0, 8239.0, 4085.0, 2088.0, 1107.0, 665.0, 350.0, 223.0, 123.0, 91.0, 57.0, 42.0, 31.0, 16.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.40625, -17.8291015625, -17.251953125, -16.6748046875, -16.09765625, -15.5205078125, -14.943359375, -14.3662109375, -13.7890625, -13.2119140625, -12.634765625, -12.0576171875, -11.48046875, -10.9033203125, -10.326171875, -9.7490234375, -9.171875, -8.5947265625, -8.017578125, -7.4404296875, -6.86328125, -6.2861328125, -5.708984375, -5.1318359375, -4.5546875, -3.9775390625, -3.400390625, -2.8232421875, -2.24609375, -1.6689453125, -1.091796875, -0.5146484375, 0.0625, 0.6396484375, 1.216796875, 1.7939453125, 2.37109375, 2.9482421875, 3.525390625, 4.1025390625, 4.6796875, 5.2568359375, 5.833984375, 6.4111328125, 6.98828125, 7.5654296875, 8.142578125, 8.7197265625, 9.296875, 9.8740234375, 10.451171875, 11.0283203125, 11.60546875, 12.1826171875, 12.759765625, 13.3369140625, 13.9140625, 14.4912109375, 15.068359375, 15.6455078125, 16.22265625, 16.7998046875, 17.376953125, 17.9541015625, 18.53125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 6.0, 14.0, 21.0, 20.0, 27.0, 25.0, 39.0, 54.0, 64.0, 48.0, 70.0, 58.0, 70.0, 59.0, 72.0, 76.0, 68.0, 55.0, 37.0, 22.0, 25.0, 14.0, 11.0, 6.0, 16.0, 4.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9453125, -13.5399169921875, -13.134521484375, -12.7291259765625, -12.32373046875, -11.9183349609375, -11.512939453125, -11.1075439453125, -10.7021484375, -10.2967529296875, -9.891357421875, -9.4859619140625, -9.08056640625, -8.6751708984375, -8.269775390625, -7.8643798828125, -7.458984375, -7.0535888671875, -6.648193359375, -6.2427978515625, -5.83740234375, -5.4320068359375, -5.026611328125, -4.6212158203125, -4.2158203125, -3.8104248046875, -3.405029296875, -2.9996337890625, -2.59423828125, -2.1888427734375, -1.783447265625, -1.3780517578125, -0.97265625, -0.5672607421875, -0.161865234375, 0.2435302734375, 0.64892578125, 1.0543212890625, 1.459716796875, 1.8651123046875, 2.2705078125, 2.6759033203125, 3.081298828125, 3.4866943359375, 3.89208984375, 4.2974853515625, 4.702880859375, 5.1082763671875, 5.513671875, 5.9190673828125, 6.324462890625, 6.7298583984375, 7.13525390625, 7.5406494140625, 7.946044921875, 8.3514404296875, 8.7568359375, 9.1622314453125, 9.567626953125, 9.9730224609375, 10.37841796875, 10.7838134765625, 11.189208984375, 11.5946044921875, 12.0]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 10.0, 9.0, 12.0, 18.0, 23.0, 34.0, 55.0, 57.0, 90.0, 131.0, 196.0, 372.0, 681.0, 1411.0, 3488.0, 11502.0, 54190.0, 426041.0, 475259.0, 56187.0, 12008.0, 3627.0, 1422.0, 716.0, 356.0, 213.0, 145.0, 90.0, 60.0, 36.0, 28.0, 24.0, 17.0, 10.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 5.0], "bins": [-38.6875, -37.58251953125, -36.4775390625, -35.37255859375, -34.267578125, -33.16259765625, -32.0576171875, -30.95263671875, -29.84765625, -28.74267578125, -27.6376953125, -26.53271484375, -25.427734375, -24.32275390625, -23.2177734375, -22.11279296875, -21.0078125, -19.90283203125, -18.7978515625, -17.69287109375, -16.587890625, -15.48291015625, -14.3779296875, -13.27294921875, -12.16796875, -11.06298828125, -9.9580078125, -8.85302734375, -7.748046875, -6.64306640625, -5.5380859375, -4.43310546875, -3.328125, -2.22314453125, -1.1181640625, -0.01318359375, 1.091796875, 2.19677734375, 3.3017578125, 4.40673828125, 5.51171875, 6.61669921875, 7.7216796875, 8.82666015625, 9.931640625, 11.03662109375, 12.1416015625, 13.24658203125, 14.3515625, 15.45654296875, 16.5615234375, 17.66650390625, 18.771484375, 19.87646484375, 20.9814453125, 22.08642578125, 23.19140625, 24.29638671875, 25.4013671875, 26.50634765625, 27.611328125, 28.71630859375, 29.8212890625, 30.92626953125, 32.03125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 5.0, 3.0, 6.0, 10.0, 19.0, 19.0, 21.0, 29.0, 22.0, 44.0, 46.0, 47.0, 39.0, 37.0, 66.0, 50.0, 58.0, 59.0, 56.0, 50.0, 38.0, 50.0, 40.0, 34.0, 29.0, 18.0, 16.0, 17.0, 14.0, 9.0, 8.0, 7.0, 11.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-41.5625, -40.29248046875, -39.0224609375, -37.75244140625, -36.482421875, -35.21240234375, -33.9423828125, -32.67236328125, -31.40234375, -30.13232421875, -28.8623046875, -27.59228515625, -26.322265625, -25.05224609375, -23.7822265625, -22.51220703125, -21.2421875, -19.97216796875, -18.7021484375, -17.43212890625, -16.162109375, -14.89208984375, -13.6220703125, -12.35205078125, -11.08203125, -9.81201171875, -8.5419921875, -7.27197265625, -6.001953125, -4.73193359375, -3.4619140625, -2.19189453125, -0.921875, 0.34814453125, 1.6181640625, 2.88818359375, 4.158203125, 5.42822265625, 6.6982421875, 7.96826171875, 9.23828125, 10.50830078125, 11.7783203125, 13.04833984375, 14.318359375, 15.58837890625, 16.8583984375, 18.12841796875, 19.3984375, 20.66845703125, 21.9384765625, 23.20849609375, 24.478515625, 25.74853515625, 27.0185546875, 28.28857421875, 29.55859375, 30.82861328125, 32.0986328125, 33.36865234375, 34.638671875, 35.90869140625, 37.1787109375, 38.44873046875, 39.71875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 7.0, 8.0, 7.0, 18.0, 29.0, 87.0, 146.0, 571.0, 3590.0, 117607.0, 908200.0, 16480.0, 1285.0, 303.0, 109.0, 42.0, 28.0, 8.0, 9.0, 12.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.765625, -27.815185546875, -26.86474609375, -25.914306640625, -24.9638671875, -24.013427734375, -23.06298828125, -22.112548828125, -21.162109375, -20.211669921875, -19.26123046875, -18.310791015625, -17.3603515625, -16.409912109375, -15.45947265625, -14.509033203125, -13.55859375, -12.608154296875, -11.65771484375, -10.707275390625, -9.7568359375, -8.806396484375, -7.85595703125, -6.905517578125, -5.955078125, -5.004638671875, -4.05419921875, -3.103759765625, -2.1533203125, -1.202880859375, -0.25244140625, 0.697998046875, 1.6484375, 2.598876953125, 3.54931640625, 4.499755859375, 5.4501953125, 6.400634765625, 7.35107421875, 8.301513671875, 9.251953125, 10.202392578125, 11.15283203125, 12.103271484375, 13.0537109375, 14.004150390625, 14.95458984375, 15.905029296875, 16.85546875, 17.805908203125, 18.75634765625, 19.706787109375, 20.6572265625, 21.607666015625, 22.55810546875, 23.508544921875, 24.458984375, 25.409423828125, 26.35986328125, 27.310302734375, 28.2607421875, 29.211181640625, 30.16162109375, 31.112060546875, 32.0625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 6.0, 6.0, 13.0, 17.0, 23.0, 38.0, 50.0, 73.0, 102.0, 145.0, 149.0, 100.0, 65.0, 56.0, 32.0, 26.0, 14.0, 21.0, 17.0, 10.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002696990966796875, -0.002612859010696411, -0.0025287270545959473, -0.0024445950984954834, -0.0023604631423950195, -0.0022763311862945557, -0.002192199230194092, -0.002108067274093628, -0.002023935317993164, -0.0019398033618927002, -0.0018556714057922363, -0.0017715394496917725, -0.0016874074935913086, -0.0016032755374908447, -0.0015191435813903809, -0.001435011625289917, -0.0013508796691894531, -0.0012667477130889893, -0.0011826157569885254, -0.0010984838008880615, -0.0010143518447875977, -0.0009302198886871338, -0.0008460879325866699, -0.0007619559764862061, -0.0006778240203857422, -0.0005936920642852783, -0.0005095601081848145, -0.0004254281520843506, -0.0003412961959838867, -0.00025716423988342285, -0.00017303228378295898, -8.890032768249512e-05, -4.76837158203125e-06, 7.936358451843262e-05, 0.00016349554061889648, 0.00024762749671936035, 0.0003317594528198242, 0.0004158914089202881, 0.000500023365020752, 0.0005841553211212158, 0.0006682872772216797, 0.0007524192333221436, 0.0008365511894226074, 0.0009206831455230713, 0.0010048151016235352, 0.001088947057723999, 0.0011730790138244629, 0.0012572109699249268, 0.0013413429260253906, 0.0014254748821258545, 0.0015096068382263184, 0.0015937387943267822, 0.001677870750427246, 0.00176200270652771, 0.0018461346626281738, 0.0019302666187286377, 0.0020143985748291016, 0.0020985305309295654, 0.0021826624870300293, 0.002266794443130493, 0.002350926399230957, 0.002435058355331421, 0.0025191903114318848, 0.0026033222675323486, 0.0026874542236328125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 8.0, 4.0, 8.0, 7.0, 12.0, 16.0, 18.0, 43.0, 65.0, 73.0, 168.0, 242.0, 516.0, 1049.0, 2353.0, 8235.0, 43404.0, 483501.0, 453005.0, 43291.0, 8048.0, 2452.0, 908.0, 438.0, 287.0, 157.0, 102.0, 55.0, 29.0, 20.0, 12.0, 10.0, 5.0, 5.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.95361328125, -10.5478515625, -10.14208984375, -9.736328125, -9.33056640625, -8.9248046875, -8.51904296875, -8.11328125, -7.70751953125, -7.3017578125, -6.89599609375, -6.490234375, -6.08447265625, -5.6787109375, -5.27294921875, -4.8671875, -4.46142578125, -4.0556640625, -3.64990234375, -3.244140625, -2.83837890625, -2.4326171875, -2.02685546875, -1.62109375, -1.21533203125, -0.8095703125, -0.40380859375, 0.001953125, 0.40771484375, 0.8134765625, 1.21923828125, 1.625, 2.03076171875, 2.4365234375, 2.84228515625, 3.248046875, 3.65380859375, 4.0595703125, 4.46533203125, 4.87109375, 5.27685546875, 5.6826171875, 6.08837890625, 6.494140625, 6.89990234375, 7.3056640625, 7.71142578125, 8.1171875, 8.52294921875, 8.9287109375, 9.33447265625, 9.740234375, 10.14599609375, 10.5517578125, 10.95751953125, 11.36328125, 11.76904296875, 12.1748046875, 12.58056640625, 12.986328125, 13.39208984375, 13.7978515625, 14.20361328125, 14.609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 17.0, 13.0, 15.0, 22.0, 25.0, 25.0, 40.0, 34.0, 38.0, 59.0, 61.0, 60.0, 57.0, 63.0, 69.0, 59.0, 49.0, 54.0, 36.0, 32.0, 29.0, 16.0, 19.0, 8.0, 13.0, 12.0, 8.0, 9.0, 6.0, 6.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.78515625, -7.5465087890625, -7.307861328125, -7.0692138671875, -6.83056640625, -6.5919189453125, -6.353271484375, -6.1146240234375, -5.8759765625, -5.6373291015625, -5.398681640625, -5.1600341796875, -4.92138671875, -4.6827392578125, -4.444091796875, -4.2054443359375, -3.966796875, -3.7281494140625, -3.489501953125, -3.2508544921875, -3.01220703125, -2.7735595703125, -2.534912109375, -2.2962646484375, -2.0576171875, -1.8189697265625, -1.580322265625, -1.3416748046875, -1.10302734375, -0.8643798828125, -0.625732421875, -0.3870849609375, -0.1484375, 0.0902099609375, 0.328857421875, 0.5675048828125, 0.80615234375, 1.0447998046875, 1.283447265625, 1.5220947265625, 1.7607421875, 1.9993896484375, 2.238037109375, 2.4766845703125, 2.71533203125, 2.9539794921875, 3.192626953125, 3.4312744140625, 3.669921875, 3.9085693359375, 4.147216796875, 4.3858642578125, 4.62451171875, 4.8631591796875, 5.101806640625, 5.3404541015625, 5.5791015625, 5.8177490234375, 6.056396484375, 6.2950439453125, 6.53369140625, 6.7723388671875, 7.010986328125, 7.2496337890625, 7.48828125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 19.0, 16.0, 49.0, 76.0, 125.0, 181.0, 198.0, 128.0, 81.0, 47.0, 26.0, 19.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-127.72358703613281, -120.23841857910156, -112.75325012207031, -105.26807403564453, -97.78290557861328, -90.29773712158203, -82.81256103515625, -75.327392578125, -67.84222412109375, -60.3570556640625, -52.871883392333984, -45.38671112060547, -37.90154266357422, -30.41637420654297, -22.931201934814453, -15.446029663085938, -7.9608612060546875, -0.4756908416748047, 7.009479522705078, 14.494649887084961, 21.979820251464844, 29.464988708496094, 36.95016098022461, 44.435333251953125, 51.920501708984375, 59.405670166015625, 66.89083862304688, 74.37601470947266, 81.8611831665039, 89.34635162353516, 96.83152770996094, 104.31669616699219, 111.8018798828125, 119.28704833984375, 126.772216796875, 134.25738525390625, 141.7425537109375, 149.22772216796875, 156.71290588378906, 164.1980743408203, 171.68324279785156, 179.1684112548828, 186.65357971191406, 194.1387481689453, 201.62393188476562, 209.10910034179688, 216.59426879882812, 224.07943725585938, 231.56460571289062, 239.04977416992188, 246.53494262695312, 254.02011108398438, 261.5052795410156, 268.9904479980469, 276.4756164550781, 283.9608154296875, 291.44598388671875, 298.93115234375, 306.41632080078125, 313.9014892578125, 321.38665771484375, 328.871826171875, 336.35699462890625, 343.8421630859375, 351.32733154296875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 8.0, 11.0, 6.0, 13.0, 9.0, 15.0, 20.0, 22.0, 20.0, 39.0, 29.0, 49.0, 36.0, 42.0, 34.0, 54.0, 48.0, 52.0, 69.0, 49.0, 54.0, 40.0, 25.0, 33.0, 26.0, 32.0, 20.0, 19.0, 18.0, 10.0, 13.0, 16.0, 11.0, 14.0, 4.0, 9.0, 4.0, 6.0, 1.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-161.04635620117188, -156.62799072265625, -152.20962524414062, -147.79124450683594, -143.3728790283203, -138.9545135498047, -134.53614807128906, -130.11778259277344, -125.69940948486328, -121.28104400634766, -116.8626708984375, -112.44430541992188, -108.02593994140625, -103.6075668334961, -99.18920135498047, -94.77082824707031, -90.35246276855469, -85.93409729003906, -81.5157241821289, -77.09735870361328, -72.67898559570312, -68.2606201171875, -63.842254638671875, -59.423885345458984, -55.005516052246094, -50.5871467590332, -46.16877746582031, -41.75041198730469, -37.3320426940918, -32.913673400878906, -28.49530601501465, -24.07693862915039, -19.6585693359375, -15.240200996398926, -10.821832656860352, -6.403464317321777, -1.9850959777832031, 2.4332733154296875, 6.851640701293945, 11.270008087158203, 15.688377380371094, 20.106746673583984, 24.525114059448242, 28.9434814453125, 33.36185073852539, 37.78022003173828, 42.198585510253906, 46.6169548034668, 51.03532409667969, 55.45369338989258, 59.87206268310547, 64.2904281616211, 68.70880126953125, 73.12716674804688, 77.5455322265625, 81.96389770507812, 86.38227081298828, 90.8006362915039, 95.21900939941406, 99.63737487792969, 104.05574035644531, 108.47411346435547, 112.8924789428711, 117.31085205078125, 121.72921752929688]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 18.0, 19.0, 23.0, 46.0, 98.0, 154.0, 313.0, 695.0, 1589.0, 4021.0, 11284.0, 36967.0, 168136.0, 1368859.0, 2223541.0, 299672.0, 54776.0, 15164.0, 5174.0, 2064.0, 814.0, 392.0, 205.0, 85.0, 58.0, 36.0, 14.0, 11.0, 8.0, 11.0, 8.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.859375, -12.418212890625, -11.97705078125, -11.535888671875, -11.0947265625, -10.653564453125, -10.21240234375, -9.771240234375, -9.330078125, -8.888916015625, -8.44775390625, -8.006591796875, -7.5654296875, -7.124267578125, -6.68310546875, -6.241943359375, -5.80078125, -5.359619140625, -4.91845703125, -4.477294921875, -4.0361328125, -3.594970703125, -3.15380859375, -2.712646484375, -2.271484375, -1.830322265625, -1.38916015625, -0.947998046875, -0.5068359375, -0.065673828125, 0.37548828125, 0.816650390625, 1.2578125, 1.698974609375, 2.14013671875, 2.581298828125, 3.0224609375, 3.463623046875, 3.90478515625, 4.345947265625, 4.787109375, 5.228271484375, 5.66943359375, 6.110595703125, 6.5517578125, 6.992919921875, 7.43408203125, 7.875244140625, 8.31640625, 8.757568359375, 9.19873046875, 9.639892578125, 10.0810546875, 10.522216796875, 10.96337890625, 11.404541015625, 11.845703125, 12.286865234375, 12.72802734375, 13.169189453125, 13.6103515625, 14.051513671875, 14.49267578125, 14.933837890625, 15.375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 18.0, 23.0, 33.0, 45.0, 48.0, 73.0, 61.0, 75.0, 89.0, 75.0, 95.0, 81.0, 63.0, 76.0, 36.0, 30.0, 22.0, 20.0, 9.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2421875, -8.7821044921875, -8.322021484375, -7.8619384765625, -7.40185546875, -6.9417724609375, -6.481689453125, -6.0216064453125, -5.5615234375, -5.1014404296875, -4.641357421875, -4.1812744140625, -3.72119140625, -3.2611083984375, -2.801025390625, -2.3409423828125, -1.880859375, -1.4207763671875, -0.960693359375, -0.5006103515625, -0.04052734375, 0.4195556640625, 0.879638671875, 1.3397216796875, 1.7998046875, 2.2598876953125, 2.719970703125, 3.1800537109375, 3.64013671875, 4.1002197265625, 4.560302734375, 5.0203857421875, 5.48046875, 5.9405517578125, 6.400634765625, 6.8607177734375, 7.32080078125, 7.7808837890625, 8.240966796875, 8.7010498046875, 9.1611328125, 9.6212158203125, 10.081298828125, 10.5413818359375, 11.00146484375, 11.4615478515625, 11.921630859375, 12.3817138671875, 12.841796875, 13.3018798828125, 13.761962890625, 14.2220458984375, 14.68212890625, 15.1422119140625, 15.602294921875, 16.0623779296875, 16.5224609375, 16.9825439453125, 17.442626953125, 17.9027099609375, 18.36279296875, 18.8228759765625, 19.282958984375, 19.7430419921875, 20.203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 13.0, 11.0, 18.0, 26.0, 49.0, 57.0, 113.0, 230.0, 425.0, 976.0, 2402.0, 6760.0, 23376.0, 106262.0, 1004354.0, 2753207.0, 235013.0, 42635.0, 11734.0, 3880.0, 1451.0, 609.0, 273.0, 161.0, 71.0, 47.0, 42.0, 30.0, 18.0, 14.0, 6.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.078125, -24.421875, -23.765625, -23.109375, -22.453125, -21.796875, -21.140625, -20.484375, -19.828125, -19.171875, -18.515625, -17.859375, -17.203125, -16.546875, -15.890625, -15.234375, -14.578125, -13.921875, -13.265625, -12.609375, -11.953125, -11.296875, -10.640625, -9.984375, -9.328125, -8.671875, -8.015625, -7.359375, -6.703125, -6.046875, -5.390625, -4.734375, -4.078125, -3.421875, -2.765625, -2.109375, -1.453125, -0.796875, -0.140625, 0.515625, 1.171875, 1.828125, 2.484375, 3.140625, 3.796875, 4.453125, 5.109375, 5.765625, 6.421875, 7.078125, 7.734375, 8.390625, 9.046875, 9.703125, 10.359375, 11.015625, 11.671875, 12.328125, 12.984375, 13.640625, 14.296875, 14.953125, 15.609375, 16.265625, 16.921875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 9.0, 10.0, 10.0, 17.0, 10.0, 18.0, 24.0, 41.0, 56.0, 77.0, 81.0, 138.0, 162.0, 268.0, 391.0, 526.0, 603.0, 510.0, 304.0, 215.0, 151.0, 104.0, 83.0, 63.0, 44.0, 25.0, 20.0, 19.0, 24.0, 8.0, 10.0, 8.0, 4.0, 11.0, 7.0, 3.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.328125, -20.70703125, -20.0859375, -19.46484375, -18.84375, -18.22265625, -17.6015625, -16.98046875, -16.359375, -15.73828125, -15.1171875, -14.49609375, -13.875, -13.25390625, -12.6328125, -12.01171875, -11.390625, -10.76953125, -10.1484375, -9.52734375, -8.90625, -8.28515625, -7.6640625, -7.04296875, -6.421875, -5.80078125, -5.1796875, -4.55859375, -3.9375, -3.31640625, -2.6953125, -2.07421875, -1.453125, -0.83203125, -0.2109375, 0.41015625, 1.03125, 1.65234375, 2.2734375, 2.89453125, 3.515625, 4.13671875, 4.7578125, 5.37890625, 6.0, 6.62109375, 7.2421875, 7.86328125, 8.484375, 9.10546875, 9.7265625, 10.34765625, 10.96875, 11.58984375, 12.2109375, 12.83203125, 13.453125, 14.07421875, 14.6953125, 15.31640625, 15.9375, 16.55859375, 17.1796875, 17.80078125, 18.421875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 14.0, 32.0, 57.0, 115.0, 191.0, 220.0, 146.0, 111.0, 47.0, 21.0, 17.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-387.7190246582031, -379.2105712890625, -370.7021484375, -362.1936950683594, -353.68524169921875, -345.17681884765625, -336.6683654785156, -328.159912109375, -319.6514892578125, -311.1430358886719, -302.6346130371094, -294.12615966796875, -285.6177062988281, -277.1092529296875, -268.600830078125, -260.0923767089844, -251.58392333984375, -243.0754852294922, -234.56703186035156, -226.05859375, -217.55014038085938, -209.0417022705078, -200.53326416015625, -192.02481079101562, -183.51637268066406, -175.0079345703125, -166.49948120117188, -157.9910430908203, -149.48260498046875, -140.97415161132812, -132.46571350097656, -123.95726776123047, -115.44882202148438, -106.94037628173828, -98.43193054199219, -89.92349243164062, -81.41504669189453, -72.90660095214844, -64.39816284179688, -55.88971710205078, -47.38127136230469, -38.872825622558594, -30.364383697509766, -21.855939865112305, -13.347496032714844, -4.83905029296875, 3.669391632080078, 12.177833557128906, 20.686279296875, 29.19472312927246, 37.70316696166992, 46.21160888671875, 54.720054626464844, 63.22850036621094, 71.7369384765625, 80.2453842163086, 88.75382995605469, 97.26227569580078, 105.77072143554688, 114.27915954589844, 122.78760528564453, 131.29605102539062, 139.8044891357422, 148.31292724609375, 156.82138061523438]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 11.0, 9.0, 11.0, 17.0, 21.0, 28.0, 54.0, 38.0, 63.0, 70.0, 62.0, 73.0, 64.0, 84.0, 73.0, 69.0, 60.0, 43.0, 36.0, 35.0, 22.0, 20.0, 10.0, 9.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-191.76797485351562, -186.1566162109375, -180.5452423095703, -174.9338836669922, -169.322509765625, -163.71115112304688, -158.09979248046875, -152.48841857910156, -146.87705993652344, -141.2657012939453, -135.65432739257812, -130.04296875, -124.43160247802734, -118.82023620605469, -113.20886993408203, -107.59750366210938, -101.98613739013672, -96.37477111816406, -90.7634048461914, -85.15203857421875, -79.54067993164062, -73.92931365966797, -68.31794738769531, -62.70658493041992, -57.095218658447266, -51.48385238647461, -45.87248992919922, -40.26112365722656, -34.649757385253906, -29.038394927978516, -23.42702865600586, -17.81566619873047, -12.204299926757812, -6.592935085296631, -0.9815702438354492, 4.629795074462891, 10.241159439086914, 15.852523803710938, 21.463890075683594, 27.075252532958984, 32.68661880493164, 38.2979850769043, 43.90934753417969, 49.520713806152344, 55.132080078125, 60.74344253540039, 66.35481262207031, 71.96617126464844, 77.5775375366211, 83.18890380859375, 88.8002700805664, 94.41163635253906, 100.02299499511719, 105.63436126708984, 111.2457275390625, 116.85708618164062, 122.46846008300781, 128.07981872558594, 133.69119262695312, 139.30255126953125, 144.91392517089844, 150.52528381347656, 156.13665771484375, 161.74801635742188, 167.359375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 6.0, 11.0, 16.0, 17.0, 24.0, 51.0, 55.0, 71.0, 127.0, 180.0, 340.0, 542.0, 887.0, 1668.0, 3149.0, 6180.0, 12952.0, 27516.0, 58961.0, 127150.0, 261667.0, 280633.0, 140905.0, 65970.0, 30837.0, 14005.0, 6923.0, 3430.0, 1699.0, 992.0, 561.0, 372.0, 218.0, 142.0, 93.0, 56.0, 39.0, 35.0, 22.0, 16.0, 12.0, 5.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.2421875, -14.7515869140625, -14.260986328125, -13.7703857421875, -13.27978515625, -12.7891845703125, -12.298583984375, -11.8079833984375, -11.3173828125, -10.8267822265625, -10.336181640625, -9.8455810546875, -9.35498046875, -8.8643798828125, -8.373779296875, -7.8831787109375, -7.392578125, -6.9019775390625, -6.411376953125, -5.9207763671875, -5.43017578125, -4.9395751953125, -4.448974609375, -3.9583740234375, -3.4677734375, -2.9771728515625, -2.486572265625, -1.9959716796875, -1.50537109375, -1.0147705078125, -0.524169921875, -0.0335693359375, 0.45703125, 0.9476318359375, 1.438232421875, 1.9288330078125, 2.41943359375, 2.9100341796875, 3.400634765625, 3.8912353515625, 4.3818359375, 4.8724365234375, 5.363037109375, 5.8536376953125, 6.34423828125, 6.8348388671875, 7.325439453125, 7.8160400390625, 8.306640625, 8.7972412109375, 9.287841796875, 9.7784423828125, 10.26904296875, 10.7596435546875, 11.250244140625, 11.7408447265625, 12.2314453125, 12.7220458984375, 13.212646484375, 13.7032470703125, 14.19384765625, 14.6844482421875, 15.175048828125, 15.6656494140625, 16.15625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 12.0, 7.0, 14.0, 11.0, 17.0, 20.0, 22.0, 27.0, 29.0, 28.0, 21.0, 31.0, 33.0, 53.0, 46.0, 53.0, 46.0, 61.0, 47.0, 33.0, 53.0, 31.0, 41.0, 38.0, 36.0, 24.0, 24.0, 23.0, 18.0, 20.0, 12.0, 11.0, 7.0, 10.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.125, -8.86468505859375, -8.6043701171875, -8.34405517578125, -8.083740234375, -7.82342529296875, -7.5631103515625, -7.30279541015625, -7.04248046875, -6.78216552734375, -6.5218505859375, -6.26153564453125, -6.001220703125, -5.74090576171875, -5.4805908203125, -5.22027587890625, -4.9599609375, -4.69964599609375, -4.4393310546875, -4.17901611328125, -3.918701171875, -3.65838623046875, -3.3980712890625, -3.13775634765625, -2.87744140625, -2.61712646484375, -2.3568115234375, -2.09649658203125, -1.836181640625, -1.57586669921875, -1.3155517578125, -1.05523681640625, -0.794921875, -0.53460693359375, -0.2742919921875, -0.01397705078125, 0.246337890625, 0.50665283203125, 0.7669677734375, 1.02728271484375, 1.28759765625, 1.54791259765625, 1.8082275390625, 2.06854248046875, 2.328857421875, 2.58917236328125, 2.8494873046875, 3.10980224609375, 3.3701171875, 3.63043212890625, 3.8907470703125, 4.15106201171875, 4.411376953125, 4.67169189453125, 4.9320068359375, 5.19232177734375, 5.45263671875, 5.71295166015625, 5.9732666015625, 6.23358154296875, 6.493896484375, 6.75421142578125, 7.0145263671875, 7.27484130859375, 7.53515625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 4.0, 5.0, 3.0, 3.0, 11.0, 13.0, 19.0, 24.0, 42.0, 31.0, 64.0, 100.0, 133.0, 193.0, 354.0, 628.0, 1224.0, 2548.0, 8022.0, 59406.0, 783701.0, 169481.0, 15199.0, 3737.0, 1576.0, 822.0, 471.0, 257.0, 135.0, 112.0, 68.0, 54.0, 28.0, 23.0, 15.0, 13.0, 10.0, 7.0, 2.0, 3.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.03125, -48.34619140625, -46.6611328125, -44.97607421875, -43.291015625, -41.60595703125, -39.9208984375, -38.23583984375, -36.55078125, -34.86572265625, -33.1806640625, -31.49560546875, -29.810546875, -28.12548828125, -26.4404296875, -24.75537109375, -23.0703125, -21.38525390625, -19.7001953125, -18.01513671875, -16.330078125, -14.64501953125, -12.9599609375, -11.27490234375, -9.58984375, -7.90478515625, -6.2197265625, -4.53466796875, -2.849609375, -1.16455078125, 0.5205078125, 2.20556640625, 3.890625, 5.57568359375, 7.2607421875, 8.94580078125, 10.630859375, 12.31591796875, 14.0009765625, 15.68603515625, 17.37109375, 19.05615234375, 20.7412109375, 22.42626953125, 24.111328125, 25.79638671875, 27.4814453125, 29.16650390625, 30.8515625, 32.53662109375, 34.2216796875, 35.90673828125, 37.591796875, 39.27685546875, 40.9619140625, 42.64697265625, 44.33203125, 46.01708984375, 47.7021484375, 49.38720703125, 51.072265625, 52.75732421875, 54.4423828125, 56.12744140625, 57.8125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 11.0, 4.0, 9.0, 10.0, 20.0, 18.0, 22.0, 32.0, 30.0, 43.0, 43.0, 38.0, 53.0, 63.0, 64.0, 61.0, 50.0, 49.0, 44.0, 49.0, 41.0, 38.0, 34.0, 19.0, 23.0, 27.0, 17.0, 18.0, 19.0, 11.0, 9.0, 7.0, 5.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.40625, -39.041015625, -37.67578125, -36.310546875, -34.9453125, -33.580078125, -32.21484375, -30.849609375, -29.484375, -28.119140625, -26.75390625, -25.388671875, -24.0234375, -22.658203125, -21.29296875, -19.927734375, -18.5625, -17.197265625, -15.83203125, -14.466796875, -13.1015625, -11.736328125, -10.37109375, -9.005859375, -7.640625, -6.275390625, -4.91015625, -3.544921875, -2.1796875, -0.814453125, 0.55078125, 1.916015625, 3.28125, 4.646484375, 6.01171875, 7.376953125, 8.7421875, 10.107421875, 11.47265625, 12.837890625, 14.203125, 15.568359375, 16.93359375, 18.298828125, 19.6640625, 21.029296875, 22.39453125, 23.759765625, 25.125, 26.490234375, 27.85546875, 29.220703125, 30.5859375, 31.951171875, 33.31640625, 34.681640625, 36.046875, 37.412109375, 38.77734375, 40.142578125, 41.5078125, 42.873046875, 44.23828125, 45.603515625, 46.96875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 11.0, 8.0, 15.0, 15.0, 19.0, 53.0, 85.0, 194.0, 448.0, 1451.0, 6795.0, 84091.0, 865932.0, 80445.0, 6541.0, 1499.0, 500.0, 205.0, 87.0, 54.0, 28.0, 17.0, 17.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-21.640625, -21.047607421875, -20.45458984375, -19.861572265625, -19.2685546875, -18.675537109375, -18.08251953125, -17.489501953125, -16.896484375, -16.303466796875, -15.71044921875, -15.117431640625, -14.5244140625, -13.931396484375, -13.33837890625, -12.745361328125, -12.15234375, -11.559326171875, -10.96630859375, -10.373291015625, -9.7802734375, -9.187255859375, -8.59423828125, -8.001220703125, -7.408203125, -6.815185546875, -6.22216796875, -5.629150390625, -5.0361328125, -4.443115234375, -3.85009765625, -3.257080078125, -2.6640625, -2.071044921875, -1.47802734375, -0.885009765625, -0.2919921875, 0.301025390625, 0.89404296875, 1.487060546875, 2.080078125, 2.673095703125, 3.26611328125, 3.859130859375, 4.4521484375, 5.045166015625, 5.63818359375, 6.231201171875, 6.82421875, 7.417236328125, 8.01025390625, 8.603271484375, 9.1962890625, 9.789306640625, 10.38232421875, 10.975341796875, 11.568359375, 12.161376953125, 12.75439453125, 13.347412109375, 13.9404296875, 14.533447265625, 15.12646484375, 15.719482421875, 16.3125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 3.0, 7.0, 6.0, 6.0, 7.0, 10.0, 11.0, 7.0, 12.0, 20.0, 15.0, 25.0, 28.0, 28.0, 52.0, 49.0, 67.0, 95.0, 111.0, 91.0, 53.0, 56.0, 39.0, 35.0, 24.0, 24.0, 23.0, 18.0, 9.0, 10.0, 13.0, 5.0, 3.0, 7.0, 10.0, 2.0, 5.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0018405914306640625, -0.0017780065536499023, -0.0017154216766357422, -0.001652836799621582, -0.0015902519226074219, -0.0015276670455932617, -0.0014650821685791016, -0.0014024972915649414, -0.0013399124145507812, -0.001277327537536621, -0.001214742660522461, -0.0011521577835083008, -0.0010895729064941406, -0.0010269880294799805, -0.0009644031524658203, -0.0009018182754516602, -0.0008392333984375, -0.0007766485214233398, -0.0007140636444091797, -0.0006514787673950195, -0.0005888938903808594, -0.0005263090133666992, -0.00046372413635253906, -0.0004011392593383789, -0.00033855438232421875, -0.0002759695053100586, -0.00021338462829589844, -0.00015079975128173828, -8.821487426757812e-05, -2.562999725341797e-05, 3.695487976074219e-05, 9.953975677490234e-05, 0.0001621246337890625, 0.00022470951080322266, 0.0002872943878173828, 0.00034987926483154297, 0.0004124641418457031, 0.0004750490188598633, 0.0005376338958740234, 0.0006002187728881836, 0.0006628036499023438, 0.0007253885269165039, 0.0007879734039306641, 0.0008505582809448242, 0.0009131431579589844, 0.0009757280349731445, 0.0010383129119873047, 0.0011008977890014648, 0.001163482666015625, 0.0012260675430297852, 0.0012886524200439453, 0.0013512372970581055, 0.0014138221740722656, 0.0014764070510864258, 0.001538991928100586, 0.001601576805114746, 0.0016641616821289062, 0.0017267465591430664, 0.0017893314361572266, 0.0018519163131713867, 0.0019145011901855469, 0.001977086067199707, 0.002039670944213867, 0.0021022558212280273, 0.0021648406982421875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 12.0, 11.0, 11.0, 25.0, 36.0, 58.0, 76.0, 113.0, 190.0, 278.0, 546.0, 1005.0, 2402.0, 7342.0, 43846.0, 638656.0, 316859.0, 27441.0, 5529.0, 1981.0, 862.0, 456.0, 292.0, 146.0, 120.0, 75.0, 58.0, 31.0, 25.0, 21.0, 9.0, 10.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.1015625, -12.72607421875, -12.3505859375, -11.97509765625, -11.599609375, -11.22412109375, -10.8486328125, -10.47314453125, -10.09765625, -9.72216796875, -9.3466796875, -8.97119140625, -8.595703125, -8.22021484375, -7.8447265625, -7.46923828125, -7.09375, -6.71826171875, -6.3427734375, -5.96728515625, -5.591796875, -5.21630859375, -4.8408203125, -4.46533203125, -4.08984375, -3.71435546875, -3.3388671875, -2.96337890625, -2.587890625, -2.21240234375, -1.8369140625, -1.46142578125, -1.0859375, -0.71044921875, -0.3349609375, 0.04052734375, 0.416015625, 0.79150390625, 1.1669921875, 1.54248046875, 1.91796875, 2.29345703125, 2.6689453125, 3.04443359375, 3.419921875, 3.79541015625, 4.1708984375, 4.54638671875, 4.921875, 5.29736328125, 5.6728515625, 6.04833984375, 6.423828125, 6.79931640625, 7.1748046875, 7.55029296875, 7.92578125, 8.30126953125, 8.6767578125, 9.05224609375, 9.427734375, 9.80322265625, 10.1787109375, 10.55419921875, 10.9296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 7.0, 6.0, 5.0, 12.0, 17.0, 22.0, 24.0, 27.0, 37.0, 41.0, 45.0, 54.0, 68.0, 65.0, 71.0, 59.0, 55.0, 55.0, 51.0, 48.0, 31.0, 39.0, 28.0, 27.0, 19.0, 23.0, 10.0, 8.0, 7.0, 9.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.0, -7.76959228515625, -7.5391845703125, -7.30877685546875, -7.078369140625, -6.84796142578125, -6.6175537109375, -6.38714599609375, -6.15673828125, -5.92633056640625, -5.6959228515625, -5.46551513671875, -5.235107421875, -5.00469970703125, -4.7742919921875, -4.54388427734375, -4.3134765625, -4.08306884765625, -3.8526611328125, -3.62225341796875, -3.391845703125, -3.16143798828125, -2.9310302734375, -2.70062255859375, -2.47021484375, -2.23980712890625, -2.0093994140625, -1.77899169921875, -1.548583984375, -1.31817626953125, -1.0877685546875, -0.85736083984375, -0.626953125, -0.39654541015625, -0.1661376953125, 0.06427001953125, 0.294677734375, 0.52508544921875, 0.7554931640625, 0.98590087890625, 1.21630859375, 1.44671630859375, 1.6771240234375, 1.90753173828125, 2.137939453125, 2.36834716796875, 2.5987548828125, 2.82916259765625, 3.0595703125, 3.28997802734375, 3.5203857421875, 3.75079345703125, 3.981201171875, 4.21160888671875, 4.4420166015625, 4.67242431640625, 4.90283203125, 5.13323974609375, 5.3636474609375, 5.59405517578125, 5.824462890625, 6.05487060546875, 6.2852783203125, 6.51568603515625, 6.74609375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 15.0, 17.0, 35.0, 54.0, 88.0, 102.0, 179.0, 177.0, 121.0, 75.0, 61.0, 35.0, 9.0, 9.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.99990844726562, -203.25262451171875, -196.50535583496094, -189.75807189941406, -183.0107879638672, -176.26351928710938, -169.5162353515625, -162.76895141601562, -156.0216827392578, -149.27439880371094, -142.52713012695312, -135.77984619140625, -129.03256225585938, -122.28529357910156, -115.53800964355469, -108.79073333740234, -102.04344940185547, -95.29617309570312, -88.54888916015625, -81.8016128540039, -75.05433654785156, -68.30705261230469, -61.559776306152344, -54.8125, -48.06521987915039, -41.31793975830078, -34.57066345214844, -27.823383331298828, -21.07610511779785, -14.328826904296875, -7.581546783447266, -0.8342704772949219, 5.9130096435546875, 12.660287857055664, 19.40756607055664, 26.15484619140625, 32.902122497558594, 39.6494026184082, 46.39668273925781, 53.143959045410156, 59.891239166259766, 66.63851928710938, 73.38579559326172, 80.13307189941406, 86.88035583496094, 93.62763214111328, 100.37490844726562, 107.1221923828125, 113.86946868896484, 120.61674499511719, 127.36402893066406, 134.11129760742188, 140.85858154296875, 147.60586547851562, 154.3531494140625, 161.1004180908203, 167.8477020263672, 174.59498596191406, 181.34225463867188, 188.08953857421875, 194.83682250976562, 201.58409118652344, 208.3313751220703, 215.07864379882812, 221.825927734375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 5.0, 3.0, 12.0, 7.0, 6.0, 12.0, 8.0, 8.0, 20.0, 13.0, 12.0, 18.0, 24.0, 24.0, 19.0, 29.0, 41.0, 42.0, 33.0, 46.0, 45.0, 58.0, 63.0, 43.0, 50.0, 40.0, 37.0, 31.0, 33.0, 16.0, 26.0, 21.0, 19.0, 17.0, 19.0, 14.0, 17.0, 6.0, 14.0, 5.0, 6.0, 7.0, 3.0, 6.0, 3.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.57177734375, -107.85650634765625, -104.14122772216797, -100.42595672607422, -96.71067810058594, -92.99540710449219, -89.28013610839844, -85.56485748291016, -81.8495864868164, -78.13431549072266, -74.41903686523438, -70.70376586914062, -66.98848724365234, -63.273216247558594, -59.55794143676758, -55.84266662597656, -52.12739181518555, -48.41211700439453, -44.696842193603516, -40.9815673828125, -37.26629638671875, -33.551021575927734, -29.83574676513672, -26.120473861694336, -22.40519905090332, -18.689924240112305, -14.974651336669922, -11.259376525878906, -7.544102668762207, -3.828828811645508, -0.11355400085449219, 3.6017189025878906, 7.316993713378906, 11.032267570495605, 14.747541427612305, 18.46281623840332, 22.178089141845703, 25.89336395263672, 29.608638763427734, 33.32391357421875, 37.0391845703125, 40.754459381103516, 44.46973419189453, 48.18500518798828, 51.9002799987793, 55.61555480957031, 59.33082962036133, 63.046104431152344, 66.76138305664062, 70.47665405273438, 74.19193267822266, 77.9072036743164, 81.62248229980469, 85.33775329589844, 89.05302429199219, 92.76830291748047, 96.48357391357422, 100.19884490966797, 103.91412353515625, 107.62939453125, 111.34467315673828, 115.05994415283203, 118.77522277832031, 122.49049377441406, 126.20576477050781]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 13.0, 24.0, 25.0, 46.0, 79.0, 123.0, 238.0, 523.0, 1121.0, 2725.0, 7525.0, 26153.0, 128974.0, 1537959.0, 2255109.0, 185679.0, 32980.0, 9229.0, 3272.0, 1250.0, 577.0, 282.0, 151.0, 91.0, 37.0, 32.0, 25.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8984375, -15.3870849609375, -14.875732421875, -14.3643798828125, -13.85302734375, -13.3416748046875, -12.830322265625, -12.3189697265625, -11.8076171875, -11.2962646484375, -10.784912109375, -10.2735595703125, -9.76220703125, -9.2508544921875, -8.739501953125, -8.2281494140625, -7.716796875, -7.2054443359375, -6.694091796875, -6.1827392578125, -5.67138671875, -5.1600341796875, -4.648681640625, -4.1373291015625, -3.6259765625, -3.1146240234375, -2.603271484375, -2.0919189453125, -1.58056640625, -1.0692138671875, -0.557861328125, -0.0465087890625, 0.46484375, 0.9761962890625, 1.487548828125, 1.9989013671875, 2.51025390625, 3.0216064453125, 3.532958984375, 4.0443115234375, 4.5556640625, 5.0670166015625, 5.578369140625, 6.0897216796875, 6.60107421875, 7.1124267578125, 7.623779296875, 8.1351318359375, 8.646484375, 9.1578369140625, 9.669189453125, 10.1805419921875, 10.69189453125, 11.2032470703125, 11.714599609375, 12.2259521484375, 12.7373046875, 13.2486572265625, 13.760009765625, 14.2713623046875, 14.78271484375, 15.2940673828125, 15.805419921875, 16.3167724609375, 16.828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 3.0, 9.0, 4.0, 14.0, 18.0, 19.0, 19.0, 21.0, 29.0, 36.0, 41.0, 37.0, 37.0, 50.0, 54.0, 66.0, 55.0, 53.0, 48.0, 40.0, 43.0, 45.0, 43.0, 35.0, 25.0, 29.0, 27.0, 21.0, 9.0, 12.0, 14.0, 5.0, 11.0, 3.0, 7.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.953125, -8.6717529296875, -8.390380859375, -8.1090087890625, -7.82763671875, -7.5462646484375, -7.264892578125, -6.9835205078125, -6.7021484375, -6.4207763671875, -6.139404296875, -5.8580322265625, -5.57666015625, -5.2952880859375, -5.013916015625, -4.7325439453125, -4.451171875, -4.1697998046875, -3.888427734375, -3.6070556640625, -3.32568359375, -3.0443115234375, -2.762939453125, -2.4815673828125, -2.2001953125, -1.9188232421875, -1.637451171875, -1.3560791015625, -1.07470703125, -0.7933349609375, -0.511962890625, -0.2305908203125, 0.05078125, 0.3321533203125, 0.613525390625, 0.8948974609375, 1.17626953125, 1.4576416015625, 1.739013671875, 2.0203857421875, 2.3017578125, 2.5831298828125, 2.864501953125, 3.1458740234375, 3.42724609375, 3.7086181640625, 3.989990234375, 4.2713623046875, 4.552734375, 4.8341064453125, 5.115478515625, 5.3968505859375, 5.67822265625, 5.9595947265625, 6.240966796875, 6.5223388671875, 6.8037109375, 7.0850830078125, 7.366455078125, 7.6478271484375, 7.92919921875, 8.2105712890625, 8.491943359375, 8.7733154296875, 9.0546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 8.0, 3.0, 16.0, 12.0, 28.0, 38.0, 77.0, 146.0, 308.0, 637.0, 1476.0, 4008.0, 14277.0, 76936.0, 1282585.0, 2650944.0, 130460.0, 22837.0, 5879.0, 2064.0, 785.0, 356.0, 176.0, 90.0, 53.0, 35.0, 17.0, 10.0, 7.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.453125, -25.57470703125, -24.6962890625, -23.81787109375, -22.939453125, -22.06103515625, -21.1826171875, -20.30419921875, -19.42578125, -18.54736328125, -17.6689453125, -16.79052734375, -15.912109375, -15.03369140625, -14.1552734375, -13.27685546875, -12.3984375, -11.52001953125, -10.6416015625, -9.76318359375, -8.884765625, -8.00634765625, -7.1279296875, -6.24951171875, -5.37109375, -4.49267578125, -3.6142578125, -2.73583984375, -1.857421875, -0.97900390625, -0.1005859375, 0.77783203125, 1.65625, 2.53466796875, 3.4130859375, 4.29150390625, 5.169921875, 6.04833984375, 6.9267578125, 7.80517578125, 8.68359375, 9.56201171875, 10.4404296875, 11.31884765625, 12.197265625, 13.07568359375, 13.9541015625, 14.83251953125, 15.7109375, 16.58935546875, 17.4677734375, 18.34619140625, 19.224609375, 20.10302734375, 20.9814453125, 21.85986328125, 22.73828125, 23.61669921875, 24.4951171875, 25.37353515625, 26.251953125, 27.13037109375, 28.0087890625, 28.88720703125, 29.765625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 6.0, 7.0, 9.0, 13.0, 20.0, 24.0, 32.0, 34.0, 70.0, 113.0, 163.0, 270.0, 375.0, 537.0, 717.0, 590.0, 361.0, 223.0, 136.0, 69.0, 77.0, 62.0, 34.0, 31.0, 20.0, 16.0, 11.0, 13.0, 4.0, 9.0, 4.0, 1.0, 6.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.453125, -22.729736328125, -22.00634765625, -21.282958984375, -20.5595703125, -19.836181640625, -19.11279296875, -18.389404296875, -17.666015625, -16.942626953125, -16.21923828125, -15.495849609375, -14.7724609375, -14.049072265625, -13.32568359375, -12.602294921875, -11.87890625, -11.155517578125, -10.43212890625, -9.708740234375, -8.9853515625, -8.261962890625, -7.53857421875, -6.815185546875, -6.091796875, -5.368408203125, -4.64501953125, -3.921630859375, -3.1982421875, -2.474853515625, -1.75146484375, -1.028076171875, -0.3046875, 0.418701171875, 1.14208984375, 1.865478515625, 2.5888671875, 3.312255859375, 4.03564453125, 4.759033203125, 5.482421875, 6.205810546875, 6.92919921875, 7.652587890625, 8.3759765625, 9.099365234375, 9.82275390625, 10.546142578125, 11.26953125, 11.992919921875, 12.71630859375, 13.439697265625, 14.1630859375, 14.886474609375, 15.60986328125, 16.333251953125, 17.056640625, 17.780029296875, 18.50341796875, 19.226806640625, 19.9501953125, 20.673583984375, 21.39697265625, 22.120361328125, 22.84375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 11.0, 25.0, 64.0, 123.0, 150.0, 164.0, 144.0, 128.0, 83.0, 39.0, 25.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-236.2582550048828, -228.53550720214844, -220.812744140625, -213.08999633789062, -205.36724853515625, -197.6444854736328, -189.92173767089844, -182.198974609375, -174.47622680664062, -166.75347900390625, -159.0307159423828, -151.30796813964844, -143.585205078125, -135.86245727539062, -128.13970947265625, -120.41695404052734, -112.69419860839844, -104.97144317626953, -97.24868774414062, -89.52593994140625, -81.80318450927734, -74.08042907714844, -66.35768127441406, -58.634925842285156, -50.91217041015625, -43.189414978027344, -35.4666633605957, -27.74390983581543, -20.021156311035156, -12.29840087890625, -4.575649261474609, 3.1471023559570312, 10.869873046875, 18.592626571655273, 26.315380096435547, 34.03813171386719, 41.760887145996094, 49.483642578125, 57.20639419555664, 64.92914581298828, 72.65190124511719, 80.3746566772461, 88.097412109375, 95.82015991210938, 103.54291534423828, 111.26567077636719, 118.98841857910156, 126.71117401123047, 134.43392944335938, 142.15667724609375, 149.8794403076172, 157.60218811035156, 165.324951171875, 173.04769897460938, 180.77044677734375, 188.49319458007812, 196.21595764160156, 203.93870544433594, 211.66146850585938, 219.38421630859375, 227.10696411132812, 234.82972717285156, 242.55247497558594, 250.27523803710938, 257.99798583984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 4.0, 5.0, 8.0, 15.0, 9.0, 17.0, 17.0, 8.0, 21.0, 18.0, 27.0, 36.0, 21.0, 49.0, 36.0, 58.0, 33.0, 41.0, 36.0, 47.0, 50.0, 52.0, 32.0, 34.0, 43.0, 49.0, 31.0, 29.0, 39.0, 21.0, 21.0, 13.0, 16.0, 12.0, 13.0, 14.0, 6.0, 4.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-109.94772338867188, -106.66331481933594, -103.37890625, -100.09449768066406, -96.81008911132812, -93.52568054199219, -90.24127197265625, -86.95685577392578, -83.67244720458984, -80.3880386352539, -77.10363006591797, -73.81922149658203, -70.5348129272461, -67.25039672851562, -63.96599197387695, -60.68157958984375, -57.39717483520508, -54.11276626586914, -50.8283576965332, -47.5439453125, -44.25953674316406, -40.975128173828125, -37.69071960449219, -34.40631103515625, -31.12190055847168, -27.837491989135742, -24.553081512451172, -21.268672943115234, -17.984264373779297, -14.699853897094727, -11.415445327758789, -8.131034851074219, -4.846626281738281, -1.5622169971466064, 1.7221922874450684, 5.006601333618164, 8.291010856628418, 11.575420379638672, 14.85982894897461, 18.14423942565918, 21.428647994995117, 24.713056564331055, 27.997467041015625, 31.281875610351562, 34.5662841796875, 37.85069274902344, 41.135101318359375, 44.41951370239258, 47.703922271728516, 50.98833084106445, 54.27273941040039, 57.557151794433594, 60.84156036376953, 64.12596893310547, 67.4103775024414, 70.69478607177734, 73.97919464111328, 77.26360321044922, 80.54801177978516, 83.8324203491211, 87.11682891845703, 90.4012451171875, 93.68565368652344, 96.97006225585938, 100.25447082519531]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 10.0, 10.0, 19.0, 12.0, 25.0, 47.0, 58.0, 87.0, 136.0, 250.0, 345.0, 539.0, 892.0, 1500.0, 2559.0, 4573.0, 8199.0, 15835.0, 31512.0, 65515.0, 144740.0, 287233.0, 255090.0, 118550.0, 54101.0, 26469.0, 13404.0, 7049.0, 4025.0, 2248.0, 1310.0, 817.0, 478.0, 324.0, 176.0, 131.0, 81.0, 74.0, 45.0, 28.0, 14.0, 15.0, 11.0, 5.0, 2.0, 8.0, 2.0, 1.0, 4.0, 2.0, 1.0], "bins": [-15.53125, -15.0859375, -14.640625, -14.1953125, -13.75, -13.3046875, -12.859375, -12.4140625, -11.96875, -11.5234375, -11.078125, -10.6328125, -10.1875, -9.7421875, -9.296875, -8.8515625, -8.40625, -7.9609375, -7.515625, -7.0703125, -6.625, -6.1796875, -5.734375, -5.2890625, -4.84375, -4.3984375, -3.953125, -3.5078125, -3.0625, -2.6171875, -2.171875, -1.7265625, -1.28125, -0.8359375, -0.390625, 0.0546875, 0.5, 0.9453125, 1.390625, 1.8359375, 2.28125, 2.7265625, 3.171875, 3.6171875, 4.0625, 4.5078125, 4.953125, 5.3984375, 5.84375, 6.2890625, 6.734375, 7.1796875, 7.625, 8.0703125, 8.515625, 8.9609375, 9.40625, 9.8515625, 10.296875, 10.7421875, 11.1875, 11.6328125, 12.078125, 12.5234375, 12.96875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 12.0, 7.0, 10.0, 13.0, 12.0, 23.0, 16.0, 24.0, 30.0, 41.0, 31.0, 40.0, 42.0, 34.0, 49.0, 47.0, 43.0, 34.0, 35.0, 43.0, 38.0, 42.0, 47.0, 34.0, 37.0, 50.0, 25.0, 21.0, 16.0, 26.0, 10.0, 15.0, 19.0, 6.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.921875, -8.6478271484375, -8.373779296875, -8.0997314453125, -7.82568359375, -7.5516357421875, -7.277587890625, -7.0035400390625, -6.7294921875, -6.4554443359375, -6.181396484375, -5.9073486328125, -5.63330078125, -5.3592529296875, -5.085205078125, -4.8111572265625, -4.537109375, -4.2630615234375, -3.989013671875, -3.7149658203125, -3.44091796875, -3.1668701171875, -2.892822265625, -2.6187744140625, -2.3447265625, -2.0706787109375, -1.796630859375, -1.5225830078125, -1.24853515625, -0.9744873046875, -0.700439453125, -0.4263916015625, -0.15234375, 0.1217041015625, 0.395751953125, 0.6697998046875, 0.94384765625, 1.2178955078125, 1.491943359375, 1.7659912109375, 2.0400390625, 2.3140869140625, 2.588134765625, 2.8621826171875, 3.13623046875, 3.4102783203125, 3.684326171875, 3.9583740234375, 4.232421875, 4.5064697265625, 4.780517578125, 5.0545654296875, 5.32861328125, 5.6026611328125, 5.876708984375, 6.1507568359375, 6.4248046875, 6.6988525390625, 6.972900390625, 7.2469482421875, 7.52099609375, 7.7950439453125, 8.069091796875, 8.3431396484375, 8.6171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 12.0, 10.0, 14.0, 19.0, 31.0, 30.0, 47.0, 61.0, 81.0, 99.0, 194.0, 259.0, 393.0, 657.0, 1069.0, 2140.0, 5073.0, 17493.0, 96416.0, 704505.0, 179430.0, 27498.0, 6951.0, 2654.0, 1294.0, 791.0, 463.0, 287.0, 177.0, 118.0, 84.0, 47.0, 39.0, 34.0, 13.0, 21.0, 12.0, 11.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-38.84375, -37.72265625, -36.6015625, -35.48046875, -34.359375, -33.23828125, -32.1171875, -30.99609375, -29.875, -28.75390625, -27.6328125, -26.51171875, -25.390625, -24.26953125, -23.1484375, -22.02734375, -20.90625, -19.78515625, -18.6640625, -17.54296875, -16.421875, -15.30078125, -14.1796875, -13.05859375, -11.9375, -10.81640625, -9.6953125, -8.57421875, -7.453125, -6.33203125, -5.2109375, -4.08984375, -2.96875, -1.84765625, -0.7265625, 0.39453125, 1.515625, 2.63671875, 3.7578125, 4.87890625, 6.0, 7.12109375, 8.2421875, 9.36328125, 10.484375, 11.60546875, 12.7265625, 13.84765625, 14.96875, 16.08984375, 17.2109375, 18.33203125, 19.453125, 20.57421875, 21.6953125, 22.81640625, 23.9375, 25.05859375, 26.1796875, 27.30078125, 28.421875, 29.54296875, 30.6640625, 31.78515625, 32.90625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 6.0, 6.0, 11.0, 11.0, 11.0, 18.0, 27.0, 22.0, 31.0, 46.0, 50.0, 57.0, 56.0, 65.0, 66.0, 64.0, 70.0, 57.0, 63.0, 44.0, 45.0, 36.0, 29.0, 30.0, 22.0, 16.0, 10.0, 10.0, 9.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-49.25, -47.78271484375, -46.3154296875, -44.84814453125, -43.380859375, -41.91357421875, -40.4462890625, -38.97900390625, -37.51171875, -36.04443359375, -34.5771484375, -33.10986328125, -31.642578125, -30.17529296875, -28.7080078125, -27.24072265625, -25.7734375, -24.30615234375, -22.8388671875, -21.37158203125, -19.904296875, -18.43701171875, -16.9697265625, -15.50244140625, -14.03515625, -12.56787109375, -11.1005859375, -9.63330078125, -8.166015625, -6.69873046875, -5.2314453125, -3.76416015625, -2.296875, -0.82958984375, 0.6376953125, 2.10498046875, 3.572265625, 5.03955078125, 6.5068359375, 7.97412109375, 9.44140625, 10.90869140625, 12.3759765625, 13.84326171875, 15.310546875, 16.77783203125, 18.2451171875, 19.71240234375, 21.1796875, 22.64697265625, 24.1142578125, 25.58154296875, 27.048828125, 28.51611328125, 29.9833984375, 31.45068359375, 32.91796875, 34.38525390625, 35.8525390625, 37.31982421875, 38.787109375, 40.25439453125, 41.7216796875, 43.18896484375, 44.65625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 6.0, 10.0, 5.0, 14.0, 11.0, 20.0, 32.0, 55.0, 94.0, 191.0, 357.0, 868.0, 2865.0, 13837.0, 127510.0, 803874.0, 84491.0, 10474.0, 2342.0, 761.0, 324.0, 177.0, 79.0, 47.0, 24.0, 21.0, 16.0, 17.0, 11.0, 12.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.274658203125, -15.86181640625, -15.448974609375, -15.0361328125, -14.623291015625, -14.21044921875, -13.797607421875, -13.384765625, -12.971923828125, -12.55908203125, -12.146240234375, -11.7333984375, -11.320556640625, -10.90771484375, -10.494873046875, -10.08203125, -9.669189453125, -9.25634765625, -8.843505859375, -8.4306640625, -8.017822265625, -7.60498046875, -7.192138671875, -6.779296875, -6.366455078125, -5.95361328125, -5.540771484375, -5.1279296875, -4.715087890625, -4.30224609375, -3.889404296875, -3.4765625, -3.063720703125, -2.65087890625, -2.238037109375, -1.8251953125, -1.412353515625, -0.99951171875, -0.586669921875, -0.173828125, 0.239013671875, 0.65185546875, 1.064697265625, 1.4775390625, 1.890380859375, 2.30322265625, 2.716064453125, 3.12890625, 3.541748046875, 3.95458984375, 4.367431640625, 4.7802734375, 5.193115234375, 5.60595703125, 6.018798828125, 6.431640625, 6.844482421875, 7.25732421875, 7.670166015625, 8.0830078125, 8.495849609375, 8.90869140625, 9.321533203125, 9.734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 5.0, 12.0, 11.0, 16.0, 22.0, 25.0, 18.0, 39.0, 77.0, 130.0, 143.0, 118.0, 107.0, 77.0, 53.0, 37.0, 27.0, 13.0, 19.0, 13.0, 9.0, 5.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022945404052734375, -0.002214968204498291, -0.0021353960037231445, -0.002055823802947998, -0.0019762516021728516, -0.001896679401397705, -0.0018171072006225586, -0.0017375349998474121, -0.0016579627990722656, -0.0015783905982971191, -0.0014988183975219727, -0.0014192461967468262, -0.0013396739959716797, -0.0012601017951965332, -0.0011805295944213867, -0.0011009573936462402, -0.0010213851928710938, -0.0009418129920959473, -0.0008622407913208008, -0.0007826685905456543, -0.0007030963897705078, -0.0006235241889953613, -0.0005439519882202148, -0.00046437978744506836, -0.0003848075866699219, -0.0003052353858947754, -0.0002256631851196289, -0.00014609098434448242, -6.651878356933594e-05, 1.3053417205810547e-05, 9.262561798095703e-05, 0.00017219781875610352, 0.00025177001953125, 0.0003313422203063965, 0.00041091442108154297, 0.0004904866218566895, 0.0005700588226318359, 0.0006496310234069824, 0.0007292032241821289, 0.0008087754249572754, 0.0008883476257324219, 0.0009679198265075684, 0.0010474920272827148, 0.0011270642280578613, 0.0012066364288330078, 0.0012862086296081543, 0.0013657808303833008, 0.0014453530311584473, 0.0015249252319335938, 0.0016044974327087402, 0.0016840696334838867, 0.0017636418342590332, 0.0018432140350341797, 0.0019227862358093262, 0.0020023584365844727, 0.002081930637359619, 0.0021615028381347656, 0.002241075038909912, 0.0023206472396850586, 0.002400219440460205, 0.0024797916412353516, 0.002559363842010498, 0.0026389360427856445, 0.002718508243560791, 0.0027980804443359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 4.0, 7.0, 15.0, 21.0, 25.0, 36.0, 66.0, 116.0, 198.0, 361.0, 714.0, 1591.0, 4217.0, 17275.0, 153733.0, 755797.0, 95625.0, 12519.0, 3447.0, 1358.0, 683.0, 318.0, 174.0, 81.0, 65.0, 33.0, 23.0, 16.0, 12.0, 9.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.80859375, -5.49298095703125, -5.1773681640625, -4.86175537109375, -4.546142578125, -4.23052978515625, -3.9149169921875, -3.59930419921875, -3.28369140625, -2.96807861328125, -2.6524658203125, -2.33685302734375, -2.021240234375, -1.70562744140625, -1.3900146484375, -1.07440185546875, -0.7587890625, -0.44317626953125, -0.1275634765625, 0.18804931640625, 0.503662109375, 0.81927490234375, 1.1348876953125, 1.45050048828125, 1.76611328125, 2.08172607421875, 2.3973388671875, 2.71295166015625, 3.028564453125, 3.34417724609375, 3.6597900390625, 3.97540283203125, 4.291015625, 4.60662841796875, 4.9222412109375, 5.23785400390625, 5.553466796875, 5.86907958984375, 6.1846923828125, 6.50030517578125, 6.81591796875, 7.13153076171875, 7.4471435546875, 7.76275634765625, 8.078369140625, 8.39398193359375, 8.7095947265625, 9.02520751953125, 9.3408203125, 9.65643310546875, 9.9720458984375, 10.28765869140625, 10.603271484375, 10.91888427734375, 11.2344970703125, 11.55010986328125, 11.86572265625, 12.18133544921875, 12.4969482421875, 12.81256103515625, 13.128173828125, 13.44378662109375, 13.7593994140625, 14.07501220703125, 14.390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 4.0, 3.0, 11.0, 8.0, 14.0, 9.0, 15.0, 13.0, 38.0, 25.0, 38.0, 38.0, 58.0, 71.0, 62.0, 58.0, 79.0, 83.0, 89.0, 46.0, 60.0, 47.0, 25.0, 26.0, 17.0, 16.0, 17.0, 14.0, 4.0, 9.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.3984375, -5.181884765625, -4.96533203125, -4.748779296875, -4.5322265625, -4.315673828125, -4.09912109375, -3.882568359375, -3.666015625, -3.449462890625, -3.23291015625, -3.016357421875, -2.7998046875, -2.583251953125, -2.36669921875, -2.150146484375, -1.93359375, -1.717041015625, -1.50048828125, -1.283935546875, -1.0673828125, -0.850830078125, -0.63427734375, -0.417724609375, -0.201171875, 0.015380859375, 0.23193359375, 0.448486328125, 0.6650390625, 0.881591796875, 1.09814453125, 1.314697265625, 1.53125, 1.747802734375, 1.96435546875, 2.180908203125, 2.3974609375, 2.614013671875, 2.83056640625, 3.047119140625, 3.263671875, 3.480224609375, 3.69677734375, 3.913330078125, 4.1298828125, 4.346435546875, 4.56298828125, 4.779541015625, 4.99609375, 5.212646484375, 5.42919921875, 5.645751953125, 5.8623046875, 6.078857421875, 6.29541015625, 6.511962890625, 6.728515625, 6.945068359375, 7.16162109375, 7.378173828125, 7.5947265625, 7.811279296875, 8.02783203125, 8.244384765625, 8.4609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 9.0, 18.0, 26.0, 42.0, 42.0, 95.0, 88.0, 162.0, 145.0, 108.0, 71.0, 60.0, 45.0, 23.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.34353637695312, -129.54766845703125, -124.75180053710938, -119.9559326171875, -115.16007232666016, -110.36420440673828, -105.5683364868164, -100.77247619628906, -95.97660827636719, -91.18074035644531, -86.38487243652344, -81.58900451660156, -76.79314422607422, -71.99727630615234, -67.20140838623047, -62.40554428100586, -57.60967254638672, -52.813804626464844, -48.017940521240234, -43.22207260131836, -38.42620849609375, -33.630340576171875, -28.83447265625, -24.03860855102539, -19.242740631103516, -14.446874618530273, -9.651007652282715, -4.855140686035156, -0.05927467346191406, 4.736591339111328, 9.532459259033203, 14.328323364257812, 19.124191284179688, 23.92005729675293, 28.715923309326172, 33.51179122924805, 38.307655334472656, 43.10352325439453, 47.899391174316406, 52.695255279541016, 57.49112319946289, 62.286991119384766, 67.08285522460938, 71.87872314453125, 76.67459106445312, 81.470458984375, 86.26632690429688, 91.06218719482422, 95.8580551147461, 100.65392303466797, 105.44979095458984, 110.24565124511719, 115.04151916503906, 119.83738708496094, 124.63325500488281, 129.4291229248047, 134.22499084472656, 139.02085876464844, 143.8167266845703, 148.6125946044922, 153.40846252441406, 158.20431518554688, 163.00018310546875, 167.79605102539062, 172.5919189453125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 10.0, 8.0, 5.0, 8.0, 17.0, 14.0, 20.0, 28.0, 24.0, 22.0, 29.0, 29.0, 40.0, 57.0, 49.0, 71.0, 65.0, 60.0, 53.0, 42.0, 40.0, 41.0, 24.0, 31.0, 31.0, 18.0, 20.0, 14.0, 9.0, 16.0, 15.0, 16.0, 11.0, 13.0, 11.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-134.8965301513672, -130.94078063964844, -126.98502349853516, -123.0292739868164, -119.07351684570312, -115.11776733398438, -111.16201782226562, -107.20626068115234, -103.25050354003906, -99.29475402832031, -95.33899688720703, -91.38324737548828, -87.427490234375, -83.47174072265625, -79.5159912109375, -75.56023406982422, -71.60448455810547, -67.64873504638672, -63.69297790527344, -59.73722839355469, -55.781471252441406, -51.825721740722656, -47.86996841430664, -43.914215087890625, -39.95846176147461, -36.002708435058594, -32.04695510864258, -28.091203689575195, -24.13545036315918, -20.179697036743164, -16.22394561767578, -12.268192291259766, -8.31243896484375, -4.356686115264893, -0.40093326568603516, 3.554819107055664, 7.51057243347168, 11.466325759887695, 15.422077178955078, 19.377830505371094, 23.33358383178711, 27.289337158203125, 31.24509048461914, 35.200843811035156, 39.156593322753906, 43.11235046386719, 47.06809997558594, 51.02385330200195, 54.97960662841797, 58.935359954833984, 62.89111328125, 66.84686279296875, 70.80261993408203, 74.75836944580078, 78.71412658691406, 82.66987609863281, 86.62562561035156, 90.58137512207031, 94.5371322631836, 98.49288177490234, 102.44863891601562, 106.40438842773438, 110.36013793945312, 114.3158950805664, 118.27165222167969]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 13.0, 18.0, 29.0, 27.0, 32.0, 83.0, 87.0, 161.0, 213.0, 387.0, 704.0, 1200.0, 2277.0, 4474.0, 9704.0, 25516.0, 94732.0, 692234.0, 2582123.0, 646031.0, 90286.0, 24958.0, 9448.0, 4380.0, 2202.0, 1204.0, 677.0, 385.0, 243.0, 146.0, 107.0, 63.0, 43.0, 17.0, 19.0, 17.0, 8.0, 7.0, 7.0, 2.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-13.3671875, -12.990478515625, -12.61376953125, -12.237060546875, -11.8603515625, -11.483642578125, -11.10693359375, -10.730224609375, -10.353515625, -9.976806640625, -9.60009765625, -9.223388671875, -8.8466796875, -8.469970703125, -8.09326171875, -7.716552734375, -7.33984375, -6.963134765625, -6.58642578125, -6.209716796875, -5.8330078125, -5.456298828125, -5.07958984375, -4.702880859375, -4.326171875, -3.949462890625, -3.57275390625, -3.196044921875, -2.8193359375, -2.442626953125, -2.06591796875, -1.689208984375, -1.3125, -0.935791015625, -0.55908203125, -0.182373046875, 0.1943359375, 0.571044921875, 0.94775390625, 1.324462890625, 1.701171875, 2.077880859375, 2.45458984375, 2.831298828125, 3.2080078125, 3.584716796875, 3.96142578125, 4.338134765625, 4.71484375, 5.091552734375, 5.46826171875, 5.844970703125, 6.2216796875, 6.598388671875, 6.97509765625, 7.351806640625, 7.728515625, 8.105224609375, 8.48193359375, 8.858642578125, 9.2353515625, 9.612060546875, 9.98876953125, 10.365478515625, 10.7421875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 3.0, 6.0, 11.0, 8.0, 12.0, 16.0, 15.0, 36.0, 43.0, 32.0, 50.0, 47.0, 56.0, 72.0, 52.0, 67.0, 72.0, 62.0, 58.0, 45.0, 43.0, 59.0, 35.0, 26.0, 24.0, 14.0, 15.0, 6.0, 7.0, 10.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.90771484375, -10.5498046875, -10.19189453125, -9.833984375, -9.47607421875, -9.1181640625, -8.76025390625, -8.40234375, -8.04443359375, -7.6865234375, -7.32861328125, -6.970703125, -6.61279296875, -6.2548828125, -5.89697265625, -5.5390625, -5.18115234375, -4.8232421875, -4.46533203125, -4.107421875, -3.74951171875, -3.3916015625, -3.03369140625, -2.67578125, -2.31787109375, -1.9599609375, -1.60205078125, -1.244140625, -0.88623046875, -0.5283203125, -0.17041015625, 0.1875, 0.54541015625, 0.9033203125, 1.26123046875, 1.619140625, 1.97705078125, 2.3349609375, 2.69287109375, 3.05078125, 3.40869140625, 3.7666015625, 4.12451171875, 4.482421875, 4.84033203125, 5.1982421875, 5.55615234375, 5.9140625, 6.27197265625, 6.6298828125, 6.98779296875, 7.345703125, 7.70361328125, 8.0615234375, 8.41943359375, 8.77734375, 9.13525390625, 9.4931640625, 9.85107421875, 10.208984375, 10.56689453125, 10.9248046875, 11.28271484375, 11.640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 7.0, 7.0, 21.0, 28.0, 47.0, 76.0, 103.0, 234.0, 448.0, 977.0, 2685.0, 10107.0, 56151.0, 1060055.0, 2930452.0, 110042.0, 16673.0, 3885.0, 1254.0, 510.0, 254.0, 95.0, 54.0, 41.0, 28.0, 12.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.46875, -25.5908203125, -24.712890625, -23.8349609375, -22.95703125, -22.0791015625, -21.201171875, -20.3232421875, -19.4453125, -18.5673828125, -17.689453125, -16.8115234375, -15.93359375, -15.0556640625, -14.177734375, -13.2998046875, -12.421875, -11.5439453125, -10.666015625, -9.7880859375, -8.91015625, -8.0322265625, -7.154296875, -6.2763671875, -5.3984375, -4.5205078125, -3.642578125, -2.7646484375, -1.88671875, -1.0087890625, -0.130859375, 0.7470703125, 1.625, 2.5029296875, 3.380859375, 4.2587890625, 5.13671875, 6.0146484375, 6.892578125, 7.7705078125, 8.6484375, 9.5263671875, 10.404296875, 11.2822265625, 12.16015625, 13.0380859375, 13.916015625, 14.7939453125, 15.671875, 16.5498046875, 17.427734375, 18.3056640625, 19.18359375, 20.0615234375, 20.939453125, 21.8173828125, 22.6953125, 23.5732421875, 24.451171875, 25.3291015625, 26.20703125, 27.0849609375, 27.962890625, 28.8408203125, 29.71875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 17.0, 21.0, 24.0, 46.0, 61.0, 108.0, 190.0, 363.0, 622.0, 875.0, 718.0, 434.0, 204.0, 104.0, 79.0, 68.0, 35.0, 31.0, 20.0, 11.0, 8.0, 6.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-36.90625, -36.061767578125, -35.21728515625, -34.372802734375, -33.5283203125, -32.683837890625, -31.83935546875, -30.994873046875, -30.150390625, -29.305908203125, -28.46142578125, -27.616943359375, -26.7724609375, -25.927978515625, -25.08349609375, -24.239013671875, -23.39453125, -22.550048828125, -21.70556640625, -20.861083984375, -20.0166015625, -19.172119140625, -18.32763671875, -17.483154296875, -16.638671875, -15.794189453125, -14.94970703125, -14.105224609375, -13.2607421875, -12.416259765625, -11.57177734375, -10.727294921875, -9.8828125, -9.038330078125, -8.19384765625, -7.349365234375, -6.5048828125, -5.660400390625, -4.81591796875, -3.971435546875, -3.126953125, -2.282470703125, -1.43798828125, -0.593505859375, 0.2509765625, 1.095458984375, 1.93994140625, 2.784423828125, 3.62890625, 4.473388671875, 5.31787109375, 6.162353515625, 7.0068359375, 7.851318359375, 8.69580078125, 9.540283203125, 10.384765625, 11.229248046875, 12.07373046875, 12.918212890625, 13.7626953125, 14.607177734375, 15.45166015625, 16.296142578125, 17.140625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 11.0, 24.0, 49.0, 87.0, 132.0, 172.0, 192.0, 145.0, 82.0, 49.0, 15.0, 16.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-195.04254150390625, -188.08555603027344, -181.12857055664062, -174.17160034179688, -167.21461486816406, -160.25762939453125, -153.30064392089844, -146.34365844726562, -139.38668823242188, -132.42970275878906, -125.47272491455078, -118.51573944091797, -111.55876159667969, -104.60177612304688, -97.64479064941406, -90.68780517578125, -83.73081970214844, -76.77383422851562, -69.81685638427734, -62.85987091064453, -55.902889251708984, -48.94590759277344, -41.988922119140625, -35.03194046020508, -28.07495880126953, -21.117977142333984, -14.160993576049805, -7.204010009765625, -0.24702835083007812, 6.709953308105469, 13.666938781738281, 20.623920440673828, 27.580886840820312, 34.53786849975586, 41.494850158691406, 48.45183563232422, 55.408817291259766, 62.36579895019531, 69.32278442382812, 76.27976989746094, 83.23674774169922, 90.19373321533203, 97.15071105957031, 104.10769653320312, 111.06468200683594, 118.02165985107422, 124.97864532470703, 131.9356231689453, 138.89260864257812, 145.84959411621094, 152.80657958984375, 159.7635498046875, 166.7205352783203, 173.67752075195312, 180.63450622558594, 187.59149169921875, 194.5484619140625, 201.5054473876953, 208.46243286132812, 215.41940307617188, 222.3763885498047, 229.3333740234375, 236.2903594970703, 243.24734497070312, 250.20433044433594]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 8.0, 9.0, 9.0, 19.0, 22.0, 18.0, 31.0, 30.0, 27.0, 42.0, 47.0, 41.0, 39.0, 52.0, 52.0, 57.0, 47.0, 46.0, 45.0, 50.0, 36.0, 42.0, 45.0, 36.0, 32.0, 18.0, 20.0, 20.0, 16.0, 8.0, 8.0, 2.0, 8.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.86061096191406, -95.53082275390625, -92.20103454589844, -88.87124633789062, -85.54145812988281, -82.211669921875, -78.88188171386719, -75.55209350585938, -72.22230529785156, -68.89251708984375, -65.56272888183594, -62.232940673828125, -58.90315246582031, -55.5733642578125, -52.24357223510742, -48.91378402709961, -45.58399200439453, -42.25420379638672, -38.924415588378906, -35.594627380371094, -32.26483917236328, -28.935049057006836, -25.60525894165039, -22.275470733642578, -18.945682525634766, -15.615894317626953, -12.286105155944824, -8.956315994262695, -5.626527786254883, -2.2967395782470703, 1.033050537109375, 4.3628387451171875, 7.692634582519531, 11.022422790527344, 14.352211952209473, 17.6820011138916, 21.011789321899414, 24.341577529907227, 27.671367645263672, 31.001155853271484, 34.3309440612793, 37.66073226928711, 40.99052047729492, 44.3203125, 47.65010070800781, 50.979888916015625, 54.30967712402344, 57.63946533203125, 60.96925354003906, 64.29904174804688, 67.62882995605469, 70.9586181640625, 74.28840637207031, 77.61819458007812, 80.94798278808594, 84.27777099609375, 87.60755920410156, 90.93734741210938, 94.26713562011719, 97.596923828125, 100.92671203613281, 104.25650024414062, 107.58628845214844, 110.91607666015625, 114.2458724975586]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 6.0, 2.0, 12.0, 18.0, 20.0, 32.0, 39.0, 58.0, 81.0, 117.0, 187.0, 251.0, 407.0, 586.0, 914.0, 1349.0, 2199.0, 3779.0, 6185.0, 11124.0, 19682.0, 36638.0, 69382.0, 125813.0, 199962.0, 218867.0, 155312.0, 88962.0, 47591.0, 25280.0, 13679.0, 7812.0, 4574.0, 2735.0, 1718.0, 1086.0, 662.0, 463.0, 290.0, 212.0, 133.0, 97.0, 66.0, 61.0, 31.0, 17.0, 15.0, 12.0, 8.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0], "bins": [-9.109375, -8.843017578125, -8.57666015625, -8.310302734375, -8.0439453125, -7.777587890625, -7.51123046875, -7.244873046875, -6.978515625, -6.712158203125, -6.44580078125, -6.179443359375, -5.9130859375, -5.646728515625, -5.38037109375, -5.114013671875, -4.84765625, -4.581298828125, -4.31494140625, -4.048583984375, -3.7822265625, -3.515869140625, -3.24951171875, -2.983154296875, -2.716796875, -2.450439453125, -2.18408203125, -1.917724609375, -1.6513671875, -1.385009765625, -1.11865234375, -0.852294921875, -0.5859375, -0.319580078125, -0.05322265625, 0.213134765625, 0.4794921875, 0.745849609375, 1.01220703125, 1.278564453125, 1.544921875, 1.811279296875, 2.07763671875, 2.343994140625, 2.6103515625, 2.876708984375, 3.14306640625, 3.409423828125, 3.67578125, 3.942138671875, 4.20849609375, 4.474853515625, 4.7412109375, 5.007568359375, 5.27392578125, 5.540283203125, 5.806640625, 6.072998046875, 6.33935546875, 6.605712890625, 6.8720703125, 7.138427734375, 7.40478515625, 7.671142578125, 7.9375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 6.0, 8.0, 5.0, 8.0, 13.0, 16.0, 8.0, 22.0, 29.0, 25.0, 40.0, 26.0, 45.0, 39.0, 30.0, 40.0, 43.0, 32.0, 49.0, 58.0, 51.0, 36.0, 40.0, 47.0, 34.0, 22.0, 33.0, 46.0, 23.0, 23.0, 19.0, 17.0, 12.0, 15.0, 4.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-9.6484375, -9.3707275390625, -9.093017578125, -8.8153076171875, -8.53759765625, -8.2598876953125, -7.982177734375, -7.7044677734375, -7.4267578125, -7.1490478515625, -6.871337890625, -6.5936279296875, -6.31591796875, -6.0382080078125, -5.760498046875, -5.4827880859375, -5.205078125, -4.9273681640625, -4.649658203125, -4.3719482421875, -4.09423828125, -3.8165283203125, -3.538818359375, -3.2611083984375, -2.9833984375, -2.7056884765625, -2.427978515625, -2.1502685546875, -1.87255859375, -1.5948486328125, -1.317138671875, -1.0394287109375, -0.76171875, -0.4840087890625, -0.206298828125, 0.0714111328125, 0.34912109375, 0.6268310546875, 0.904541015625, 1.1822509765625, 1.4599609375, 1.7376708984375, 2.015380859375, 2.2930908203125, 2.57080078125, 2.8485107421875, 3.126220703125, 3.4039306640625, 3.681640625, 3.9593505859375, 4.237060546875, 4.5147705078125, 4.79248046875, 5.0701904296875, 5.347900390625, 5.6256103515625, 5.9033203125, 6.1810302734375, 6.458740234375, 6.7364501953125, 7.01416015625, 7.2918701171875, 7.569580078125, 7.8472900390625, 8.125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 6.0, 9.0, 16.0, 10.0, 23.0, 64.0, 93.0, 201.0, 529.0, 1769.0, 7521.0, 54523.0, 689451.0, 263447.0, 24765.0, 4292.0, 1101.0, 394.0, 132.0, 84.0, 55.0, 25.0, 15.0, 9.0, 9.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.46875, -38.3017578125, -37.134765625, -35.9677734375, -34.80078125, -33.6337890625, -32.466796875, -31.2998046875, -30.1328125, -28.9658203125, -27.798828125, -26.6318359375, -25.46484375, -24.2978515625, -23.130859375, -21.9638671875, -20.796875, -19.6298828125, -18.462890625, -17.2958984375, -16.12890625, -14.9619140625, -13.794921875, -12.6279296875, -11.4609375, -10.2939453125, -9.126953125, -7.9599609375, -6.79296875, -5.6259765625, -4.458984375, -3.2919921875, -2.125, -0.9580078125, 0.208984375, 1.3759765625, 2.54296875, 3.7099609375, 4.876953125, 6.0439453125, 7.2109375, 8.3779296875, 9.544921875, 10.7119140625, 11.87890625, 13.0458984375, 14.212890625, 15.3798828125, 16.546875, 17.7138671875, 18.880859375, 20.0478515625, 21.21484375, 22.3818359375, 23.548828125, 24.7158203125, 25.8828125, 27.0498046875, 28.216796875, 29.3837890625, 30.55078125, 31.7177734375, 32.884765625, 34.0517578125, 35.21875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 12.0, 12.0, 13.0, 20.0, 32.0, 26.0, 32.0, 50.0, 60.0, 53.0, 75.0, 60.0, 59.0, 69.0, 72.0, 61.0, 63.0, 44.0, 45.0, 30.0, 17.0, 18.0, 13.0, 17.0, 8.0, 11.0, 4.0, 6.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.6875, -47.2333984375, -45.779296875, -44.3251953125, -42.87109375, -41.4169921875, -39.962890625, -38.5087890625, -37.0546875, -35.6005859375, -34.146484375, -32.6923828125, -31.23828125, -29.7841796875, -28.330078125, -26.8759765625, -25.421875, -23.9677734375, -22.513671875, -21.0595703125, -19.60546875, -18.1513671875, -16.697265625, -15.2431640625, -13.7890625, -12.3349609375, -10.880859375, -9.4267578125, -7.97265625, -6.5185546875, -5.064453125, -3.6103515625, -2.15625, -0.7021484375, 0.751953125, 2.2060546875, 3.66015625, 5.1142578125, 6.568359375, 8.0224609375, 9.4765625, 10.9306640625, 12.384765625, 13.8388671875, 15.29296875, 16.7470703125, 18.201171875, 19.6552734375, 21.109375, 22.5634765625, 24.017578125, 25.4716796875, 26.92578125, 28.3798828125, 29.833984375, 31.2880859375, 32.7421875, 34.1962890625, 35.650390625, 37.1044921875, 38.55859375, 40.0126953125, 41.466796875, 42.9208984375, 44.375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 11.0, 3.0, 11.0, 13.0, 16.0, 18.0, 34.0, 64.0, 97.0, 170.0, 290.0, 616.0, 1352.0, 3858.0, 12069.0, 50173.0, 262702.0, 599656.0, 88265.0, 19710.0, 5697.0, 2006.0, 841.0, 366.0, 193.0, 108.0, 73.0, 45.0, 27.0, 17.0, 14.0, 18.0, 7.0, 10.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -6.21502685546875, -6.0277099609375, -5.84039306640625, -5.653076171875, -5.46575927734375, -5.2784423828125, -5.09112548828125, -4.90380859375, -4.71649169921875, -4.5291748046875, -4.34185791015625, -4.154541015625, -3.96722412109375, -3.7799072265625, -3.59259033203125, -3.4052734375, -3.21795654296875, -3.0306396484375, -2.84332275390625, -2.656005859375, -2.46868896484375, -2.2813720703125, -2.09405517578125, -1.90673828125, -1.71942138671875, -1.5321044921875, -1.34478759765625, -1.157470703125, -0.97015380859375, -0.7828369140625, -0.59552001953125, -0.408203125, -0.22088623046875, -0.0335693359375, 0.15374755859375, 0.341064453125, 0.52838134765625, 0.7156982421875, 0.90301513671875, 1.09033203125, 1.27764892578125, 1.4649658203125, 1.65228271484375, 1.839599609375, 2.02691650390625, 2.2142333984375, 2.40155029296875, 2.5888671875, 2.77618408203125, 2.9635009765625, 3.15081787109375, 3.338134765625, 3.52545166015625, 3.7127685546875, 3.90008544921875, 4.08740234375, 4.27471923828125, 4.4620361328125, 4.64935302734375, 4.836669921875, 5.02398681640625, 5.2113037109375, 5.39862060546875, 5.5859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 4.0, 7.0, 8.0, 20.0, 25.0, 39.0, 67.0, 98.0, 136.0, 149.0, 133.0, 100.0, 66.0, 50.0, 23.0, 15.0, 9.0, 16.0, 6.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013942718505859375, -0.0013399720191955566, -0.0012856721878051758, -0.001231372356414795, -0.001177072525024414, -0.0011227726936340332, -0.0010684728622436523, -0.0010141730308532715, -0.0009598731994628906, -0.0009055733680725098, -0.0008512735366821289, -0.000796973705291748, -0.0007426738739013672, -0.0006883740425109863, -0.0006340742111206055, -0.0005797743797302246, -0.0005254745483398438, -0.0004711747169494629, -0.00041687488555908203, -0.00036257505416870117, -0.0003082752227783203, -0.00025397539138793945, -0.0001996755599975586, -0.00014537572860717773, -9.107589721679688e-05, -3.6776065826416016e-05, 1.7523765563964844e-05, 7.18235969543457e-05, 0.00012612342834472656, 0.00018042325973510742, 0.00023472309112548828, 0.00028902292251586914, 0.00034332275390625, 0.00039762258529663086, 0.0004519224166870117, 0.0005062222480773926, 0.0005605220794677734, 0.0006148219108581543, 0.0006691217422485352, 0.000723421573638916, 0.0007777214050292969, 0.0008320212364196777, 0.0008863210678100586, 0.0009406208992004395, 0.0009949207305908203, 0.0010492205619812012, 0.001103520393371582, 0.0011578202247619629, 0.0012121200561523438, 0.0012664198875427246, 0.0013207197189331055, 0.0013750195503234863, 0.0014293193817138672, 0.001483619213104248, 0.001537919044494629, 0.0015922188758850098, 0.0016465187072753906, 0.0017008185386657715, 0.0017551183700561523, 0.0018094182014465332, 0.001863718032836914, 0.001918017864227295, 0.0019723176956176758, 0.0020266175270080566, 0.0020809173583984375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 12.0, 21.0, 16.0, 21.0, 46.0, 70.0, 110.0, 175.0, 393.0, 608.0, 1264.0, 2667.0, 7161.0, 21799.0, 84201.0, 513893.0, 314695.0, 71189.0, 18890.0, 6233.0, 2456.0, 1188.0, 602.0, 289.0, 192.0, 128.0, 65.0, 39.0, 36.0, 18.0, 12.0, 9.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.04296875, -5.86492919921875, -5.6868896484375, -5.50885009765625, -5.330810546875, -5.15277099609375, -4.9747314453125, -4.79669189453125, -4.61865234375, -4.44061279296875, -4.2625732421875, -4.08453369140625, -3.906494140625, -3.72845458984375, -3.5504150390625, -3.37237548828125, -3.1943359375, -3.01629638671875, -2.8382568359375, -2.66021728515625, -2.482177734375, -2.30413818359375, -2.1260986328125, -1.94805908203125, -1.77001953125, -1.59197998046875, -1.4139404296875, -1.23590087890625, -1.057861328125, -0.87982177734375, -0.7017822265625, -0.52374267578125, -0.345703125, -0.16766357421875, 0.0103759765625, 0.18841552734375, 0.366455078125, 0.54449462890625, 0.7225341796875, 0.90057373046875, 1.07861328125, 1.25665283203125, 1.4346923828125, 1.61273193359375, 1.790771484375, 1.96881103515625, 2.1468505859375, 2.32489013671875, 2.5029296875, 2.68096923828125, 2.8590087890625, 3.03704833984375, 3.215087890625, 3.39312744140625, 3.5711669921875, 3.74920654296875, 3.92724609375, 4.10528564453125, 4.2833251953125, 4.46136474609375, 4.639404296875, 4.81744384765625, 4.9954833984375, 5.17352294921875, 5.3515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 0.0, 6.0, 8.0, 9.0, 14.0, 25.0, 13.0, 36.0, 34.0, 49.0, 44.0, 64.0, 73.0, 77.0, 75.0, 83.0, 81.0, 57.0, 58.0, 52.0, 25.0, 24.0, 20.0, 17.0, 13.0, 10.0, 7.0, 4.0, 6.0, 3.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.7890625, -5.61181640625, -5.4345703125, -5.25732421875, -5.080078125, -4.90283203125, -4.7255859375, -4.54833984375, -4.37109375, -4.19384765625, -4.0166015625, -3.83935546875, -3.662109375, -3.48486328125, -3.3076171875, -3.13037109375, -2.953125, -2.77587890625, -2.5986328125, -2.42138671875, -2.244140625, -2.06689453125, -1.8896484375, -1.71240234375, -1.53515625, -1.35791015625, -1.1806640625, -1.00341796875, -0.826171875, -0.64892578125, -0.4716796875, -0.29443359375, -0.1171875, 0.06005859375, 0.2373046875, 0.41455078125, 0.591796875, 0.76904296875, 0.9462890625, 1.12353515625, 1.30078125, 1.47802734375, 1.6552734375, 1.83251953125, 2.009765625, 2.18701171875, 2.3642578125, 2.54150390625, 2.71875, 2.89599609375, 3.0732421875, 3.25048828125, 3.427734375, 3.60498046875, 3.7822265625, 3.95947265625, 4.13671875, 4.31396484375, 4.4912109375, 4.66845703125, 4.845703125, 5.02294921875, 5.2001953125, 5.37744140625, 5.5546875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 13.0, 18.0, 31.0, 51.0, 105.0, 136.0, 253.0, 182.0, 82.0, 51.0, 20.0, 16.0, 9.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-205.0234375, -199.57162475585938, -194.11981201171875, -188.66799926757812, -183.21620178222656, -177.76438903808594, -172.3125762939453, -166.8607635498047, -161.40896606445312, -155.9571533203125, -150.50534057617188, -145.05352783203125, -139.6017303466797, -134.14991760253906, -128.69810485839844, -123.24629211425781, -117.79447937011719, -112.34266662597656, -106.89086151123047, -101.43904876708984, -95.98724365234375, -90.53543090820312, -85.0836181640625, -79.63180541992188, -74.18000030517578, -68.72818756103516, -63.27638244628906, -57.82456970214844, -52.37276077270508, -46.92095184326172, -41.469139099121094, -36.017330169677734, -30.565521240234375, -25.113712310791016, -19.661901473999023, -14.210090637207031, -8.758281707763672, -3.3064727783203125, 2.1453399658203125, 7.597148895263672, 13.048957824707031, 18.50076675415039, 23.952577590942383, 29.404388427734375, 34.856197357177734, 40.308006286621094, 45.75981903076172, 51.21162796020508, 56.66343688964844, 62.1152458190918, 67.56705474853516, 73.01886749267578, 78.47067260742188, 83.9224853515625, 89.37429809570312, 94.82611083984375, 100.27791595458984, 105.72972869873047, 111.18153381347656, 116.63334655761719, 122.08515930175781, 127.5369644165039, 132.98876953125, 138.44058227539062, 143.89239501953125]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 2.0, 14.0, 5.0, 17.0, 19.0, 17.0, 19.0, 15.0, 36.0, 30.0, 33.0, 28.0, 29.0, 35.0, 45.0, 66.0, 72.0, 84.0, 79.0, 48.0, 46.0, 24.0, 31.0, 31.0, 27.0, 27.0, 15.0, 18.0, 14.0, 10.0, 8.0, 9.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-127.94464874267578, -123.81725311279297, -119.68984985351562, -115.56245422363281, -111.43505096435547, -107.30765533447266, -103.18025207519531, -99.0528564453125, -94.92546081542969, -90.79806518554688, -86.67066192626953, -82.54326629638672, -78.41586303710938, -74.28846740722656, -70.16107177734375, -66.0336685180664, -61.90626525878906, -57.778865814208984, -53.651466369628906, -49.524070739746094, -45.39666748046875, -41.26927185058594, -37.14187240600586, -33.01447296142578, -28.887073516845703, -24.759674072265625, -20.632274627685547, -16.5048770904541, -12.377477645874023, -8.250078201293945, -4.1226806640625, 0.004718780517578125, 4.1321258544921875, 8.259525299072266, 12.386923789978027, 16.51432228088379, 20.641721725463867, 24.769121170043945, 28.89651870727539, 33.02391815185547, 37.15131759643555, 41.278717041015625, 45.4061164855957, 49.53351593017578, 53.660911560058594, 57.78831481933594, 61.91571044921875, 66.04310607910156, 70.1705093383789, 74.29790496826172, 78.42530822753906, 82.55270385742188, 86.68010711669922, 90.80750274658203, 94.93490600585938, 99.06230163574219, 103.189697265625, 107.31709289550781, 111.44449615478516, 115.57189178466797, 119.69929504394531, 123.82669067382812, 127.95408630371094, 132.08148193359375, 136.20889282226562]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 12.0, 16.0, 23.0, 33.0, 50.0, 75.0, 123.0, 204.0, 381.0, 617.0, 1156.0, 2366.0, 5134.0, 13302.0, 42798.0, 196682.0, 1096309.0, 2129235.0, 557554.0, 104343.0, 26856.0, 9229.0, 3778.0, 1786.0, 939.0, 492.0, 298.0, 189.0, 93.0, 64.0, 34.0, 41.0, 16.0, 12.0, 16.0, 5.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -8.97119140625, -8.6845703125, -8.39794921875, -8.111328125, -7.82470703125, -7.5380859375, -7.25146484375, -6.96484375, -6.67822265625, -6.3916015625, -6.10498046875, -5.818359375, -5.53173828125, -5.2451171875, -4.95849609375, -4.671875, -4.38525390625, -4.0986328125, -3.81201171875, -3.525390625, -3.23876953125, -2.9521484375, -2.66552734375, -2.37890625, -2.09228515625, -1.8056640625, -1.51904296875, -1.232421875, -0.94580078125, -0.6591796875, -0.37255859375, -0.0859375, 0.20068359375, 0.4873046875, 0.77392578125, 1.060546875, 1.34716796875, 1.6337890625, 1.92041015625, 2.20703125, 2.49365234375, 2.7802734375, 3.06689453125, 3.353515625, 3.64013671875, 3.9267578125, 4.21337890625, 4.5, 4.78662109375, 5.0732421875, 5.35986328125, 5.646484375, 5.93310546875, 6.2197265625, 6.50634765625, 6.79296875, 7.07958984375, 7.3662109375, 7.65283203125, 7.939453125, 8.22607421875, 8.5126953125, 8.79931640625, 9.0859375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 3.0, 7.0, 9.0, 16.0, 10.0, 17.0, 25.0, 22.0, 27.0, 26.0, 33.0, 44.0, 45.0, 48.0, 55.0, 53.0, 59.0, 48.0, 54.0, 49.0, 27.0, 52.0, 47.0, 30.0, 22.0, 31.0, 26.0, 27.0, 20.0, 18.0, 10.0, 2.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.3175048828125, -9.025634765625, -8.7337646484375, -8.44189453125, -8.1500244140625, -7.858154296875, -7.5662841796875, -7.2744140625, -6.9825439453125, -6.690673828125, -6.3988037109375, -6.10693359375, -5.8150634765625, -5.523193359375, -5.2313232421875, -4.939453125, -4.6475830078125, -4.355712890625, -4.0638427734375, -3.77197265625, -3.4801025390625, -3.188232421875, -2.8963623046875, -2.6044921875, -2.3126220703125, -2.020751953125, -1.7288818359375, -1.43701171875, -1.1451416015625, -0.853271484375, -0.5614013671875, -0.26953125, 0.0223388671875, 0.314208984375, 0.6060791015625, 0.89794921875, 1.1898193359375, 1.481689453125, 1.7735595703125, 2.0654296875, 2.3572998046875, 2.649169921875, 2.9410400390625, 3.23291015625, 3.5247802734375, 3.816650390625, 4.1085205078125, 4.400390625, 4.6922607421875, 4.984130859375, 5.2760009765625, 5.56787109375, 5.8597412109375, 6.151611328125, 6.4434814453125, 6.7353515625, 7.0272216796875, 7.319091796875, 7.6109619140625, 7.90283203125, 8.1947021484375, 8.486572265625, 8.7784423828125, 9.0703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 4.0, 15.0, 16.0, 31.0, 37.0, 62.0, 91.0, 209.0, 608.0, 2767.0, 16524.0, 286867.0, 3753722.0, 119788.0, 10569.0, 1974.0, 530.0, 197.0, 80.0, 63.0, 36.0, 22.0, 20.0, 9.0, 9.0, 6.0, 6.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.09375, -36.15185546875, -35.2099609375, -34.26806640625, -33.326171875, -32.38427734375, -31.4423828125, -30.50048828125, -29.55859375, -28.61669921875, -27.6748046875, -26.73291015625, -25.791015625, -24.84912109375, -23.9072265625, -22.96533203125, -22.0234375, -21.08154296875, -20.1396484375, -19.19775390625, -18.255859375, -17.31396484375, -16.3720703125, -15.43017578125, -14.48828125, -13.54638671875, -12.6044921875, -11.66259765625, -10.720703125, -9.77880859375, -8.8369140625, -7.89501953125, -6.953125, -6.01123046875, -5.0693359375, -4.12744140625, -3.185546875, -2.24365234375, -1.3017578125, -0.35986328125, 0.58203125, 1.52392578125, 2.4658203125, 3.40771484375, 4.349609375, 5.29150390625, 6.2333984375, 7.17529296875, 8.1171875, 9.05908203125, 10.0009765625, 10.94287109375, 11.884765625, 12.82666015625, 13.7685546875, 14.71044921875, 15.65234375, 16.59423828125, 17.5361328125, 18.47802734375, 19.419921875, 20.36181640625, 21.3037109375, 22.24560546875, 23.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 14.0, 11.0, 10.0, 20.0, 26.0, 47.0, 46.0, 73.0, 127.0, 224.0, 316.0, 492.0, 656.0, 624.0, 494.0, 289.0, 181.0, 128.0, 65.0, 62.0, 39.0, 28.0, 17.0, 22.0, 13.0, 10.0, 6.0, 10.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.4765625, -14.9232177734375, -14.369873046875, -13.8165283203125, -13.26318359375, -12.7098388671875, -12.156494140625, -11.6031494140625, -11.0498046875, -10.4964599609375, -9.943115234375, -9.3897705078125, -8.83642578125, -8.2830810546875, -7.729736328125, -7.1763916015625, -6.623046875, -6.0697021484375, -5.516357421875, -4.9630126953125, -4.40966796875, -3.8563232421875, -3.302978515625, -2.7496337890625, -2.1962890625, -1.6429443359375, -1.089599609375, -0.5362548828125, 0.01708984375, 0.5704345703125, 1.123779296875, 1.6771240234375, 2.23046875, 2.7838134765625, 3.337158203125, 3.8905029296875, 4.44384765625, 4.9971923828125, 5.550537109375, 6.1038818359375, 6.6572265625, 7.2105712890625, 7.763916015625, 8.3172607421875, 8.87060546875, 9.4239501953125, 9.977294921875, 10.5306396484375, 11.083984375, 11.6373291015625, 12.190673828125, 12.7440185546875, 13.29736328125, 13.8507080078125, 14.404052734375, 14.9573974609375, 15.5107421875, 16.0640869140625, 16.617431640625, 17.1707763671875, 17.72412109375, 18.2774658203125, 18.830810546875, 19.3841552734375, 19.9375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 2.0, 14.0, 26.0, 61.0, 107.0, 158.0, 213.0, 186.0, 107.0, 52.0, 38.0, 7.0, 6.0, 8.0, 6.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-180.15582275390625, -174.40408325195312, -168.65232849121094, -162.9005889892578, -157.14883422851562, -151.3970947265625, -145.64535522460938, -139.8936004638672, -134.14186096191406, -128.39012145996094, -122.63836669921875, -116.88662719726562, -111.13488006591797, -105.38313293457031, -99.63138580322266, -93.879638671875, -88.12789154052734, -82.37614440917969, -76.62439727783203, -70.87265014648438, -65.12091064453125, -59.369163513183594, -53.61741638183594, -47.86567306518555, -42.11392593383789, -36.362178802490234, -30.610435485839844, -24.858688354492188, -19.106943130493164, -13.35519790649414, -7.603450775146484, -1.8517074584960938, 3.9000396728515625, 9.651784896850586, 15.403531074523926, 21.155277252197266, 26.90702247619629, 32.65876770019531, 38.41051483154297, 44.16225814819336, 49.914005279541016, 55.66575241088867, 61.41749572753906, 67.16924285888672, 72.92098999023438, 78.6727294921875, 84.42448425292969, 90.17622375488281, 95.92797088623047, 101.67971801757812, 107.43146514892578, 113.18321228027344, 118.93495178222656, 124.68669891357422, 130.43844604492188, 136.190185546875, 141.9419403076172, 147.6936798095703, 153.4454345703125, 159.19717407226562, 164.9489288330078, 170.70066833496094, 176.45242309570312, 182.20416259765625, 187.95590209960938]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 8.0, 7.0, 8.0, 13.0, 11.0, 18.0, 20.0, 23.0, 30.0, 28.0, 32.0, 40.0, 33.0, 43.0, 52.0, 55.0, 45.0, 49.0, 45.0, 56.0, 47.0, 49.0, 44.0, 28.0, 36.0, 21.0, 28.0, 22.0, 16.0, 14.0, 23.0, 7.0, 13.0, 6.0, 7.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-84.37347412109375, -82.02715301513672, -79.68082427978516, -77.33450317382812, -74.9881820678711, -72.64185333251953, -70.2955322265625, -67.94920349121094, -65.6028823852539, -63.25655746459961, -60.91023635864258, -58.56391143798828, -56.217586517333984, -53.87126159667969, -51.524940490722656, -49.17861557006836, -46.83229446411133, -44.48596954345703, -42.1396484375, -39.7933235168457, -37.446998596191406, -35.100677490234375, -32.75435256958008, -30.40802764892578, -28.061704635620117, -25.715381622314453, -23.369056701660156, -21.022733688354492, -18.676410675048828, -16.33008575439453, -13.983762741088867, -11.63743782043457, -9.291114807128906, -6.944790840148926, -4.5984673500061035, -2.2521438598632812, 0.09418010711669922, 2.4405040740966797, 4.786827087402344, 7.133152008056641, 9.479475021362305, 11.825798988342285, 14.172122955322266, 16.51844596862793, 18.864768981933594, 21.21109390258789, 23.557416915893555, 25.90374183654785, 28.250064849853516, 30.59638786315918, 32.942710876464844, 35.28903579711914, 37.63536071777344, 39.98168182373047, 42.328006744384766, 44.67433166503906, 47.020652770996094, 49.36697769165039, 51.71329879760742, 54.05962371826172, 56.405948638916016, 58.75227355957031, 61.098594665527344, 63.44491958618164, 65.79124450683594]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 11.0, 10.0, 6.0, 24.0, 27.0, 26.0, 42.0, 52.0, 61.0, 142.0, 169.0, 281.0, 389.0, 604.0, 995.0, 1552.0, 2475.0, 4153.0, 7235.0, 13018.0, 24064.0, 45385.0, 87082.0, 157752.0, 236027.0, 205549.0, 121508.0, 64117.0, 33438.0, 17921.0, 9960.0, 5619.0, 3390.0, 1958.0, 1209.0, 765.0, 470.0, 339.0, 237.0, 158.0, 93.0, 71.0, 51.0, 37.0, 32.0, 11.0, 8.0, 14.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.0, -7.7481689453125, -7.496337890625, -7.2445068359375, -6.99267578125, -6.7408447265625, -6.489013671875, -6.2371826171875, -5.9853515625, -5.7335205078125, -5.481689453125, -5.2298583984375, -4.97802734375, -4.7261962890625, -4.474365234375, -4.2225341796875, -3.970703125, -3.7188720703125, -3.467041015625, -3.2152099609375, -2.96337890625, -2.7115478515625, -2.459716796875, -2.2078857421875, -1.9560546875, -1.7042236328125, -1.452392578125, -1.2005615234375, -0.94873046875, -0.6968994140625, -0.445068359375, -0.1932373046875, 0.05859375, 0.3104248046875, 0.562255859375, 0.8140869140625, 1.06591796875, 1.3177490234375, 1.569580078125, 1.8214111328125, 2.0732421875, 2.3250732421875, 2.576904296875, 2.8287353515625, 3.08056640625, 3.3323974609375, 3.584228515625, 3.8360595703125, 4.087890625, 4.3397216796875, 4.591552734375, 4.8433837890625, 5.09521484375, 5.3470458984375, 5.598876953125, 5.8507080078125, 6.1025390625, 6.3543701171875, 6.606201171875, 6.8580322265625, 7.10986328125, 7.3616943359375, 7.613525390625, 7.8653564453125, 8.1171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 6.0, 6.0, 6.0, 9.0, 16.0, 17.0, 27.0, 29.0, 23.0, 41.0, 35.0, 41.0, 44.0, 37.0, 43.0, 51.0, 50.0, 55.0, 45.0, 45.0, 45.0, 36.0, 41.0, 32.0, 35.0, 34.0, 29.0, 17.0, 17.0, 17.0, 9.0, 4.0, 13.0, 8.0, 4.0, 1.0, 6.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.5352783203125, -8.250244140625, -7.9652099609375, -7.68017578125, -7.3951416015625, -7.110107421875, -6.8250732421875, -6.5400390625, -6.2550048828125, -5.969970703125, -5.6849365234375, -5.39990234375, -5.1148681640625, -4.829833984375, -4.5447998046875, -4.259765625, -3.9747314453125, -3.689697265625, -3.4046630859375, -3.11962890625, -2.8345947265625, -2.549560546875, -2.2645263671875, -1.9794921875, -1.6944580078125, -1.409423828125, -1.1243896484375, -0.83935546875, -0.5543212890625, -0.269287109375, 0.0157470703125, 0.30078125, 0.5858154296875, 0.870849609375, 1.1558837890625, 1.44091796875, 1.7259521484375, 2.010986328125, 2.2960205078125, 2.5810546875, 2.8660888671875, 3.151123046875, 3.4361572265625, 3.72119140625, 4.0062255859375, 4.291259765625, 4.5762939453125, 4.861328125, 5.1463623046875, 5.431396484375, 5.7164306640625, 6.00146484375, 6.2864990234375, 6.571533203125, 6.8565673828125, 7.1416015625, 7.4266357421875, 7.711669921875, 7.9967041015625, 8.28173828125, 8.5667724609375, 8.851806640625, 9.1368408203125, 9.421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 8.0, 11.0, 12.0, 13.0, 16.0, 22.0, 55.0, 51.0, 81.0, 119.0, 147.0, 210.0, 313.0, 521.0, 893.0, 1632.0, 3562.0, 9034.0, 28702.0, 111642.0, 595057.0, 218812.0, 52194.0, 14914.0, 5286.0, 2253.0, 1131.0, 625.0, 411.0, 245.0, 155.0, 120.0, 80.0, 69.0, 35.0, 27.0, 20.0, 16.0, 10.0, 14.0, 4.0, 6.0, 5.0, 6.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-19.5, -18.921875, -18.34375, -17.765625, -17.1875, -16.609375, -16.03125, -15.453125, -14.875, -14.296875, -13.71875, -13.140625, -12.5625, -11.984375, -11.40625, -10.828125, -10.25, -9.671875, -9.09375, -8.515625, -7.9375, -7.359375, -6.78125, -6.203125, -5.625, -5.046875, -4.46875, -3.890625, -3.3125, -2.734375, -2.15625, -1.578125, -1.0, -0.421875, 0.15625, 0.734375, 1.3125, 1.890625, 2.46875, 3.046875, 3.625, 4.203125, 4.78125, 5.359375, 5.9375, 6.515625, 7.09375, 7.671875, 8.25, 8.828125, 9.40625, 9.984375, 10.5625, 11.140625, 11.71875, 12.296875, 12.875, 13.453125, 14.03125, 14.609375, 15.1875, 15.765625, 16.34375, 16.921875, 17.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 6.0, 6.0, 8.0, 14.0, 11.0, 9.0, 16.0, 15.0, 22.0, 31.0, 37.0, 35.0, 41.0, 65.0, 65.0, 66.0, 76.0, 64.0, 53.0, 50.0, 54.0, 52.0, 44.0, 35.0, 21.0, 26.0, 15.0, 20.0, 9.0, 10.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.03125, -41.7705078125, -40.509765625, -39.2490234375, -37.98828125, -36.7275390625, -35.466796875, -34.2060546875, -32.9453125, -31.6845703125, -30.423828125, -29.1630859375, -27.90234375, -26.6416015625, -25.380859375, -24.1201171875, -22.859375, -21.5986328125, -20.337890625, -19.0771484375, -17.81640625, -16.5556640625, -15.294921875, -14.0341796875, -12.7734375, -11.5126953125, -10.251953125, -8.9912109375, -7.73046875, -6.4697265625, -5.208984375, -3.9482421875, -2.6875, -1.4267578125, -0.166015625, 1.0947265625, 2.35546875, 3.6162109375, 4.876953125, 6.1376953125, 7.3984375, 8.6591796875, 9.919921875, 11.1806640625, 12.44140625, 13.7021484375, 14.962890625, 16.2236328125, 17.484375, 18.7451171875, 20.005859375, 21.2666015625, 22.52734375, 23.7880859375, 25.048828125, 26.3095703125, 27.5703125, 28.8310546875, 30.091796875, 31.3525390625, 32.61328125, 33.8740234375, 35.134765625, 36.3955078125, 37.65625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 8.0, 11.0, 17.0, 13.0, 26.0, 27.0, 35.0, 53.0, 84.0, 120.0, 191.0, 312.0, 474.0, 872.0, 1671.0, 3576.0, 8041.0, 21809.0, 71017.0, 533259.0, 307647.0, 64307.0, 20316.0, 7552.0, 3296.0, 1604.0, 870.0, 478.0, 275.0, 174.0, 126.0, 89.0, 66.0, 23.0, 32.0, 19.0, 8.0, 10.0, 10.0, 6.0, 4.0, 1.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.833984375, -3.706024169921875, -3.57806396484375, -3.450103759765625, -3.3221435546875, -3.194183349609375, -3.06622314453125, -2.938262939453125, -2.810302734375, -2.682342529296875, -2.55438232421875, -2.426422119140625, -2.2984619140625, -2.170501708984375, -2.04254150390625, -1.914581298828125, -1.78662109375, -1.658660888671875, -1.53070068359375, -1.402740478515625, -1.2747802734375, -1.146820068359375, -1.01885986328125, -0.890899658203125, -0.762939453125, -0.634979248046875, -0.50701904296875, -0.379058837890625, -0.2510986328125, -0.123138427734375, 0.00482177734375, 0.132781982421875, 0.2607421875, 0.388702392578125, 0.51666259765625, 0.644622802734375, 0.7725830078125, 0.900543212890625, 1.02850341796875, 1.156463623046875, 1.284423828125, 1.412384033203125, 1.54034423828125, 1.668304443359375, 1.7962646484375, 1.924224853515625, 2.05218505859375, 2.180145263671875, 2.30810546875, 2.436065673828125, 2.56402587890625, 2.691986083984375, 2.8199462890625, 2.947906494140625, 3.07586669921875, 3.203826904296875, 3.331787109375, 3.459747314453125, 3.58770751953125, 3.715667724609375, 3.8436279296875, 3.971588134765625, 4.09954833984375, 4.227508544921875, 4.35546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 9.0, 16.0, 23.0, 28.0, 29.0, 50.0, 59.0, 92.0, 150.0, 160.0, 114.0, 60.0, 57.0, 45.0, 23.0, 16.0, 8.0, 13.0, 8.0, 4.0, 4.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013828277587890625, -0.0013410300016403198, -0.0012992322444915771, -0.0012574344873428345, -0.0012156367301940918, -0.0011738389730453491, -0.0011320412158966064, -0.0010902434587478638, -0.001048445701599121, -0.0010066479444503784, -0.0009648501873016357, -0.0009230524301528931, -0.0008812546730041504, -0.0008394569158554077, -0.000797659158706665, -0.0007558614015579224, -0.0007140636444091797, -0.000672265887260437, -0.0006304681301116943, -0.0005886703729629517, -0.000546872615814209, -0.0005050748586654663, -0.00046327710151672363, -0.00042147934436798096, -0.0003796815872192383, -0.0003378838300704956, -0.00029608607292175293, -0.00025428831577301025, -0.00021249055862426758, -0.0001706928014755249, -0.00012889504432678223, -8.709728717803955e-05, -4.5299530029296875e-05, -3.5017728805541992e-06, 3.8295984268188477e-05, 8.009374141693115e-05, 0.00012189149856567383, 0.0001636892557144165, 0.00020548701286315918, 0.00024728477001190186, 0.00028908252716064453, 0.0003308802843093872, 0.0003726780414581299, 0.00041447579860687256, 0.00045627355575561523, 0.0004980713129043579, 0.0005398690700531006, 0.0005816668272018433, 0.0006234645843505859, 0.0006652623414993286, 0.0007070600986480713, 0.000748857855796814, 0.0007906556129455566, 0.0008324533700942993, 0.000874251127243042, 0.0009160488843917847, 0.0009578466415405273, 0.00099964439868927, 0.0010414421558380127, 0.0010832399129867554, 0.001125037670135498, 0.0011668354272842407, 0.0012086331844329834, 0.001250430941581726, 0.0012922286987304688]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 9.0, 9.0, 18.0, 24.0, 35.0, 45.0, 85.0, 115.0, 175.0, 308.0, 577.0, 1063.0, 2345.0, 5857.0, 19205.0, 81502.0, 669564.0, 211296.0, 38646.0, 10418.0, 3786.0, 1589.0, 770.0, 420.0, 265.0, 133.0, 84.0, 47.0, 53.0, 36.0, 18.0, 16.0, 10.0, 4.0, 10.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.421875, -4.2432861328125, -4.064697265625, -3.8861083984375, -3.70751953125, -3.5289306640625, -3.350341796875, -3.1717529296875, -2.9931640625, -2.8145751953125, -2.635986328125, -2.4573974609375, -2.27880859375, -2.1002197265625, -1.921630859375, -1.7430419921875, -1.564453125, -1.3858642578125, -1.207275390625, -1.0286865234375, -0.85009765625, -0.6715087890625, -0.492919921875, -0.3143310546875, -0.1357421875, 0.0428466796875, 0.221435546875, 0.4000244140625, 0.57861328125, 0.7572021484375, 0.935791015625, 1.1143798828125, 1.29296875, 1.4715576171875, 1.650146484375, 1.8287353515625, 2.00732421875, 2.1859130859375, 2.364501953125, 2.5430908203125, 2.7216796875, 2.9002685546875, 3.078857421875, 3.2574462890625, 3.43603515625, 3.6146240234375, 3.793212890625, 3.9718017578125, 4.150390625, 4.3289794921875, 4.507568359375, 4.6861572265625, 4.86474609375, 5.0433349609375, 5.221923828125, 5.4005126953125, 5.5791015625, 5.7576904296875, 5.936279296875, 6.1148681640625, 6.29345703125, 6.4720458984375, 6.650634765625, 6.8292236328125, 7.0078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 9.0, 10.0, 25.0, 20.0, 48.0, 58.0, 84.0, 118.0, 136.0, 135.0, 91.0, 84.0, 46.0, 32.0, 24.0, 18.0, 17.0, 10.0, 3.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.828125, -9.56207275390625, -9.2960205078125, -9.02996826171875, -8.763916015625, -8.49786376953125, -8.2318115234375, -7.96575927734375, -7.69970703125, -7.43365478515625, -7.1676025390625, -6.90155029296875, -6.635498046875, -6.36944580078125, -6.1033935546875, -5.83734130859375, -5.5712890625, -5.30523681640625, -5.0391845703125, -4.77313232421875, -4.507080078125, -4.24102783203125, -3.9749755859375, -3.70892333984375, -3.44287109375, -3.17681884765625, -2.9107666015625, -2.64471435546875, -2.378662109375, -2.11260986328125, -1.8465576171875, -1.58050537109375, -1.314453125, -1.04840087890625, -0.7823486328125, -0.51629638671875, -0.250244140625, 0.01580810546875, 0.2818603515625, 0.54791259765625, 0.81396484375, 1.08001708984375, 1.3460693359375, 1.61212158203125, 1.878173828125, 2.14422607421875, 2.4102783203125, 2.67633056640625, 2.9423828125, 3.20843505859375, 3.4744873046875, 3.74053955078125, 4.006591796875, 4.27264404296875, 4.5386962890625, 4.80474853515625, 5.07080078125, 5.33685302734375, 5.6029052734375, 5.86895751953125, 6.135009765625, 6.40106201171875, 6.6671142578125, 6.93316650390625, 7.19921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 13.0, 16.0, 21.0, 48.0, 66.0, 109.0, 203.0, 229.0, 86.0, 75.0, 48.0, 36.0, 12.0, 4.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.24506378173828, -116.77388000488281, -112.30268859863281, -107.83150482177734, -103.36032104492188, -98.8891372680664, -94.41795349121094, -89.94676208496094, -85.47557830810547, -81.00439453125, -76.533203125, -72.06201934814453, -67.59083557128906, -63.119651794433594, -58.64846420288086, -54.177276611328125, -49.706092834472656, -45.23490905761719, -40.76372146606445, -36.29253387451172, -31.82135009765625, -27.35016441345215, -22.878978729248047, -18.407793045043945, -13.936607360839844, -9.465421676635742, -4.994235992431641, -0.5230503082275391, 3.9481353759765625, 8.419321060180664, 12.890506744384766, 17.361692428588867, 21.8328857421875, 26.3040714263916, 30.775257110595703, 35.24644470214844, 39.717628479003906, 44.188812255859375, 48.65999984741211, 53.131187438964844, 57.60237121582031, 62.07355499267578, 66.54473876953125, 71.01593017578125, 75.48711395263672, 79.95829772949219, 84.42948913574219, 88.90067291259766, 93.37185668945312, 97.8430404663086, 102.31422424316406, 106.78541564941406, 111.25659942626953, 115.727783203125, 120.198974609375, 124.67015838623047, 129.14134216308594, 133.61253356933594, 138.08370971679688, 142.55490112304688, 147.02609252929688, 151.4972686767578, 155.9684600830078, 160.43963623046875, 164.91082763671875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 7.0, 2.0, 7.0, 7.0, 8.0, 13.0, 15.0, 11.0, 23.0, 18.0, 17.0, 24.0, 24.0, 25.0, 35.0, 43.0, 46.0, 78.0, 100.0, 101.0, 56.0, 41.0, 33.0, 34.0, 32.0, 26.0, 31.0, 28.0, 22.0, 13.0, 11.0, 14.0, 8.0, 9.0, 7.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-138.1339874267578, -134.18905639648438, -130.244140625, -126.29920959472656, -122.35428619384766, -118.40935516357422, -114.46443176269531, -110.51950073242188, -106.57457733154297, -102.62965393066406, -98.68472290039062, -94.73979949951172, -90.79487609863281, -86.84994506835938, -82.90502166748047, -78.96009826660156, -75.01516723632812, -71.07024383544922, -67.12531280517578, -63.180389404296875, -59.2354621887207, -55.29053497314453, -51.345611572265625, -47.40068435668945, -43.45576477050781, -39.51083755493164, -35.565914154052734, -31.620986938476562, -27.67605972290039, -23.73113441467285, -19.786209106445312, -15.84128189086914, -11.896354675292969, -7.951428413391113, -4.006502628326416, -0.06157684326171875, 3.8833494186401367, 7.828275680541992, 11.773200988769531, 15.718128204345703, 19.663053512573242, 23.60797882080078, 27.552906036376953, 31.497831344604492, 35.44275665283203, 39.3876838684082, 43.332611083984375, 47.27753448486328, 51.22246170043945, 55.167388916015625, 59.11231231689453, 63.0572395324707, 67.00216674804688, 70.94709014892578, 74.89201354980469, 78.83694458007812, 82.78186798095703, 86.72679138183594, 90.67172241210938, 94.61664581298828, 98.56156921386719, 102.50650024414062, 106.45142364501953, 110.39634704589844, 114.34127807617188]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 6.0, 12.0, 11.0, 10.0, 17.0, 23.0, 39.0, 66.0, 65.0, 116.0, 168.0, 248.0, 424.0, 759.0, 1388.0, 2719.0, 5688.0, 13087.0, 34265.0, 108575.0, 414201.0, 1455456.0, 1524402.0, 448673.0, 120043.0, 37879.0, 13800.0, 5844.0, 2829.0, 1485.0, 769.0, 401.0, 287.0, 170.0, 111.0, 76.0, 47.0, 33.0, 27.0, 17.0, 16.0, 11.0, 6.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.94140625, -7.68548583984375, -7.4295654296875, -7.17364501953125, -6.917724609375, -6.66180419921875, -6.4058837890625, -6.14996337890625, -5.89404296875, -5.63812255859375, -5.3822021484375, -5.12628173828125, -4.870361328125, -4.61444091796875, -4.3585205078125, -4.10260009765625, -3.8466796875, -3.59075927734375, -3.3348388671875, -3.07891845703125, -2.822998046875, -2.56707763671875, -2.3111572265625, -2.05523681640625, -1.79931640625, -1.54339599609375, -1.2874755859375, -1.03155517578125, -0.775634765625, -0.51971435546875, -0.2637939453125, -0.00787353515625, 0.248046875, 0.50396728515625, 0.7598876953125, 1.01580810546875, 1.271728515625, 1.52764892578125, 1.7835693359375, 2.03948974609375, 2.29541015625, 2.55133056640625, 2.8072509765625, 3.06317138671875, 3.319091796875, 3.57501220703125, 3.8309326171875, 4.08685302734375, 4.3427734375, 4.59869384765625, 4.8546142578125, 5.11053466796875, 5.366455078125, 5.62237548828125, 5.8782958984375, 6.13421630859375, 6.39013671875, 6.64605712890625, 6.9019775390625, 7.15789794921875, 7.413818359375, 7.66973876953125, 7.9256591796875, 8.18157958984375, 8.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 2.0, 10.0, 1.0, 4.0, 4.0, 6.0, 15.0, 11.0, 25.0, 22.0, 22.0, 30.0, 38.0, 42.0, 42.0, 49.0, 49.0, 53.0, 47.0, 57.0, 58.0, 36.0, 47.0, 40.0, 49.0, 42.0, 36.0, 29.0, 33.0, 21.0, 20.0, 13.0, 13.0, 8.0, 7.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.828125, -8.527587890625, -8.22705078125, -7.926513671875, -7.6259765625, -7.325439453125, -7.02490234375, -6.724365234375, -6.423828125, -6.123291015625, -5.82275390625, -5.522216796875, -5.2216796875, -4.921142578125, -4.62060546875, -4.320068359375, -4.01953125, -3.718994140625, -3.41845703125, -3.117919921875, -2.8173828125, -2.516845703125, -2.21630859375, -1.915771484375, -1.615234375, -1.314697265625, -1.01416015625, -0.713623046875, -0.4130859375, -0.112548828125, 0.18798828125, 0.488525390625, 0.7890625, 1.089599609375, 1.39013671875, 1.690673828125, 1.9912109375, 2.291748046875, 2.59228515625, 2.892822265625, 3.193359375, 3.493896484375, 3.79443359375, 4.094970703125, 4.3955078125, 4.696044921875, 4.99658203125, 5.297119140625, 5.59765625, 5.898193359375, 6.19873046875, 6.499267578125, 6.7998046875, 7.100341796875, 7.40087890625, 7.701416015625, 8.001953125, 8.302490234375, 8.60302734375, 8.903564453125, 9.2041015625, 9.504638671875, 9.80517578125, 10.105712890625, 10.40625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 11.0, 15.0, 23.0, 31.0, 58.0, 85.0, 158.0, 348.0, 952.0, 3981.0, 33527.0, 1595886.0, 2509063.0, 43742.0, 4621.0, 1010.0, 375.0, 159.0, 77.0, 48.0, 27.0, 24.0, 15.0, 8.0, 8.0, 11.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.3125, -27.400634765625, -26.48876953125, -25.576904296875, -24.6650390625, -23.753173828125, -22.84130859375, -21.929443359375, -21.017578125, -20.105712890625, -19.19384765625, -18.281982421875, -17.3701171875, -16.458251953125, -15.54638671875, -14.634521484375, -13.72265625, -12.810791015625, -11.89892578125, -10.987060546875, -10.0751953125, -9.163330078125, -8.25146484375, -7.339599609375, -6.427734375, -5.515869140625, -4.60400390625, -3.692138671875, -2.7802734375, -1.868408203125, -0.95654296875, -0.044677734375, 0.8671875, 1.779052734375, 2.69091796875, 3.602783203125, 4.5146484375, 5.426513671875, 6.33837890625, 7.250244140625, 8.162109375, 9.073974609375, 9.98583984375, 10.897705078125, 11.8095703125, 12.721435546875, 13.63330078125, 14.545166015625, 15.45703125, 16.368896484375, 17.28076171875, 18.192626953125, 19.1044921875, 20.016357421875, 20.92822265625, 21.840087890625, 22.751953125, 23.663818359375, 24.57568359375, 25.487548828125, 26.3994140625, 27.311279296875, 28.22314453125, 29.135009765625, 30.046875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 7.0, 3.0, 9.0, 4.0, 7.0, 19.0, 30.0, 35.0, 39.0, 55.0, 100.0, 153.0, 229.0, 373.0, 542.0, 684.0, 609.0, 395.0, 257.0, 152.0, 112.0, 70.0, 62.0, 39.0, 24.0, 17.0, 15.0, 12.0, 6.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.91943359375, -18.3232421875, -17.72705078125, -17.130859375, -16.53466796875, -15.9384765625, -15.34228515625, -14.74609375, -14.14990234375, -13.5537109375, -12.95751953125, -12.361328125, -11.76513671875, -11.1689453125, -10.57275390625, -9.9765625, -9.38037109375, -8.7841796875, -8.18798828125, -7.591796875, -6.99560546875, -6.3994140625, -5.80322265625, -5.20703125, -4.61083984375, -4.0146484375, -3.41845703125, -2.822265625, -2.22607421875, -1.6298828125, -1.03369140625, -0.4375, 0.15869140625, 0.7548828125, 1.35107421875, 1.947265625, 2.54345703125, 3.1396484375, 3.73583984375, 4.33203125, 4.92822265625, 5.5244140625, 6.12060546875, 6.716796875, 7.31298828125, 7.9091796875, 8.50537109375, 9.1015625, 9.69775390625, 10.2939453125, 10.89013671875, 11.486328125, 12.08251953125, 12.6787109375, 13.27490234375, 13.87109375, 14.46728515625, 15.0634765625, 15.65966796875, 16.255859375, 16.85205078125, 17.4482421875, 18.04443359375, 18.640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 7.0, 9.0, 29.0, 38.0, 61.0, 92.0, 147.0, 161.0, 160.0, 131.0, 59.0, 44.0, 22.0, 14.0, 9.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.23345947265625, -152.586669921875, -147.93988037109375, -143.29307556152344, -138.6462860107422, -133.99949645996094, -129.3527069091797, -124.7059097290039, -120.05911254882812, -115.41232299804688, -110.7655258178711, -106.11873626708984, -101.47193908691406, -96.82514953613281, -92.17835998535156, -87.53156280517578, -82.88477325439453, -78.23798370361328, -73.5911865234375, -68.94439697265625, -64.29759979248047, -59.65081024169922, -55.0040168762207, -50.35722351074219, -45.71043014526367, -41.063636779785156, -36.41684341430664, -31.770051956176758, -27.123258590698242, -22.476465225219727, -17.829673767089844, -13.182880401611328, -8.536087036132812, -3.889294147491455, 0.7574987411499023, 5.404291152954102, 10.051084518432617, 14.697877883911133, 19.344669342041016, 23.99146270751953, 28.638256072998047, 33.28504943847656, 37.93184280395508, 42.578636169433594, 47.225425720214844, 51.872222900390625, 56.519012451171875, 61.16580581665039, 65.8125991821289, 70.45938873291016, 75.10618591308594, 79.75297546386719, 84.39977264404297, 89.04656219482422, 93.693359375, 98.34014892578125, 102.9869384765625, 107.63372802734375, 112.28052520751953, 116.92731475830078, 121.57411193847656, 126.22090148925781, 130.86769104003906, 135.51449584960938, 140.16128540039062]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 7.0, 13.0, 19.0, 14.0, 22.0, 20.0, 14.0, 26.0, 23.0, 39.0, 30.0, 35.0, 41.0, 38.0, 32.0, 38.0, 41.0, 51.0, 52.0, 37.0, 30.0, 43.0, 44.0, 42.0, 28.0, 29.0, 34.0, 21.0, 22.0, 21.0, 12.0, 14.0, 15.0, 7.0, 4.0, 7.0, 5.0, 4.0, 0.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.135498046875, -78.60028076171875, -76.0650634765625, -73.52985382080078, -70.99463653564453, -68.45941925048828, -65.92420196533203, -63.38898468017578, -60.8537712097168, -58.31855392456055, -55.78334045410156, -53.24812316894531, -50.71290588378906, -48.17769241333008, -45.64247512817383, -43.107261657714844, -40.572044372558594, -38.036827087402344, -35.50161361694336, -32.96639633178711, -30.431180953979492, -27.895965576171875, -25.360748291015625, -22.825532913208008, -20.29031753540039, -17.755102157592773, -15.21988582611084, -12.684669494628906, -10.149454116821289, -7.614238739013672, -5.079022407531738, -2.5438060760498047, -0.0085906982421875, 2.526625156402588, 5.061841011047363, 7.597056865692139, 10.132272720336914, 12.667488098144531, 15.202704429626465, 17.7379207611084, 20.273136138916016, 22.808351516723633, 25.34356689453125, 27.8787841796875, 30.413999557495117, 32.949214935302734, 35.484432220458984, 38.01964569091797, 40.55486297607422, 43.09008026123047, 45.62529373168945, 48.1605110168457, 50.69572448730469, 53.23094177246094, 55.76615905761719, 58.30137634277344, 60.83658981323242, 63.37180709838867, 65.90702056884766, 68.4422378540039, 70.97745513916016, 73.51266479492188, 76.04788208007812, 78.58309936523438, 81.11831665039062]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 7.0, 10.0, 17.0, 36.0, 43.0, 87.0, 149.0, 229.0, 414.0, 723.0, 1365.0, 2702.0, 5568.0, 11989.0, 28238.0, 70062.0, 181946.0, 358186.0, 231795.0, 90294.0, 35999.0, 14966.0, 6899.0, 3149.0, 1669.0, 899.0, 476.0, 266.0, 129.0, 76.0, 58.0, 36.0, 25.0, 17.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.22216796875, -13.8115234375, -13.40087890625, -12.990234375, -12.57958984375, -12.1689453125, -11.75830078125, -11.34765625, -10.93701171875, -10.5263671875, -10.11572265625, -9.705078125, -9.29443359375, -8.8837890625, -8.47314453125, -8.0625, -7.65185546875, -7.2412109375, -6.83056640625, -6.419921875, -6.00927734375, -5.5986328125, -5.18798828125, -4.77734375, -4.36669921875, -3.9560546875, -3.54541015625, -3.134765625, -2.72412109375, -2.3134765625, -1.90283203125, -1.4921875, -1.08154296875, -0.6708984375, -0.26025390625, 0.150390625, 0.56103515625, 0.9716796875, 1.38232421875, 1.79296875, 2.20361328125, 2.6142578125, 3.02490234375, 3.435546875, 3.84619140625, 4.2568359375, 4.66748046875, 5.078125, 5.48876953125, 5.8994140625, 6.31005859375, 6.720703125, 7.13134765625, 7.5419921875, 7.95263671875, 8.36328125, 8.77392578125, 9.1845703125, 9.59521484375, 10.005859375, 10.41650390625, 10.8271484375, 11.23779296875, 11.6484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 5.0, 10.0, 11.0, 19.0, 22.0, 15.0, 29.0, 26.0, 25.0, 39.0, 34.0, 40.0, 42.0, 55.0, 59.0, 57.0, 40.0, 48.0, 52.0, 50.0, 41.0, 49.0, 42.0, 27.0, 23.0, 30.0, 18.0, 13.0, 17.0, 12.0, 11.0, 7.0, 7.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.671875, -8.361572265625, -8.05126953125, -7.740966796875, -7.4306640625, -7.120361328125, -6.81005859375, -6.499755859375, -6.189453125, -5.879150390625, -5.56884765625, -5.258544921875, -4.9482421875, -4.637939453125, -4.32763671875, -4.017333984375, -3.70703125, -3.396728515625, -3.08642578125, -2.776123046875, -2.4658203125, -2.155517578125, -1.84521484375, -1.534912109375, -1.224609375, -0.914306640625, -0.60400390625, -0.293701171875, 0.0166015625, 0.326904296875, 0.63720703125, 0.947509765625, 1.2578125, 1.568115234375, 1.87841796875, 2.188720703125, 2.4990234375, 2.809326171875, 3.11962890625, 3.429931640625, 3.740234375, 4.050537109375, 4.36083984375, 4.671142578125, 4.9814453125, 5.291748046875, 5.60205078125, 5.912353515625, 6.22265625, 6.532958984375, 6.84326171875, 7.153564453125, 7.4638671875, 7.774169921875, 8.08447265625, 8.394775390625, 8.705078125, 9.015380859375, 9.32568359375, 9.635986328125, 9.9462890625, 10.256591796875, 10.56689453125, 10.877197265625, 11.1875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 12.0, 23.0, 31.0, 32.0, 56.0, 58.0, 87.0, 142.0, 191.0, 254.0, 354.0, 641.0, 924.0, 1666.0, 3669.0, 10293.0, 40822.0, 246439.0, 653307.0, 64671.0, 14654.0, 4858.0, 2047.0, 1182.0, 689.0, 428.0, 262.0, 218.0, 140.0, 100.0, 80.0, 58.0, 36.0, 34.0, 29.0, 11.0, 10.0, 11.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.875, -22.163330078125, -21.45166015625, -20.739990234375, -20.0283203125, -19.316650390625, -18.60498046875, -17.893310546875, -17.181640625, -16.469970703125, -15.75830078125, -15.046630859375, -14.3349609375, -13.623291015625, -12.91162109375, -12.199951171875, -11.48828125, -10.776611328125, -10.06494140625, -9.353271484375, -8.6416015625, -7.929931640625, -7.21826171875, -6.506591796875, -5.794921875, -5.083251953125, -4.37158203125, -3.659912109375, -2.9482421875, -2.236572265625, -1.52490234375, -0.813232421875, -0.1015625, 0.610107421875, 1.32177734375, 2.033447265625, 2.7451171875, 3.456787109375, 4.16845703125, 4.880126953125, 5.591796875, 6.303466796875, 7.01513671875, 7.726806640625, 8.4384765625, 9.150146484375, 9.86181640625, 10.573486328125, 11.28515625, 11.996826171875, 12.70849609375, 13.420166015625, 14.1318359375, 14.843505859375, 15.55517578125, 16.266845703125, 16.978515625, 17.690185546875, 18.40185546875, 19.113525390625, 19.8251953125, 20.536865234375, 21.24853515625, 21.960205078125, 22.671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 3.0, 9.0, 15.0, 10.0, 17.0, 20.0, 23.0, 19.0, 28.0, 29.0, 46.0, 40.0, 55.0, 58.0, 68.0, 68.0, 48.0, 55.0, 54.0, 59.0, 45.0, 39.0, 37.0, 20.0, 28.0, 23.0, 12.0, 14.0, 11.0, 2.0, 10.0, 13.0, 3.0, 7.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-38.1875, -37.0224609375, -35.857421875, -34.6923828125, -33.52734375, -32.3623046875, -31.197265625, -30.0322265625, -28.8671875, -27.7021484375, -26.537109375, -25.3720703125, -24.20703125, -23.0419921875, -21.876953125, -20.7119140625, -19.546875, -18.3818359375, -17.216796875, -16.0517578125, -14.88671875, -13.7216796875, -12.556640625, -11.3916015625, -10.2265625, -9.0615234375, -7.896484375, -6.7314453125, -5.56640625, -4.4013671875, -3.236328125, -2.0712890625, -0.90625, 0.2587890625, 1.423828125, 2.5888671875, 3.75390625, 4.9189453125, 6.083984375, 7.2490234375, 8.4140625, 9.5791015625, 10.744140625, 11.9091796875, 13.07421875, 14.2392578125, 15.404296875, 16.5693359375, 17.734375, 18.8994140625, 20.064453125, 21.2294921875, 22.39453125, 23.5595703125, 24.724609375, 25.8896484375, 27.0546875, 28.2197265625, 29.384765625, 30.5498046875, 31.71484375, 32.8798828125, 34.044921875, 35.2099609375, 36.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 14.0, 16.0, 25.0, 21.0, 26.0, 43.0, 63.0, 111.0, 151.0, 233.0, 477.0, 956.0, 2433.0, 7993.0, 37578.0, 711626.0, 251592.0, 25201.0, 6104.0, 1979.0, 837.0, 396.0, 224.0, 127.0, 87.0, 65.0, 20.0, 32.0, 23.0, 21.0, 19.0, 10.0, 7.0, 12.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.0546875, -4.89105224609375, -4.7274169921875, -4.56378173828125, -4.400146484375, -4.23651123046875, -4.0728759765625, -3.90924072265625, -3.74560546875, -3.58197021484375, -3.4183349609375, -3.25469970703125, -3.091064453125, -2.92742919921875, -2.7637939453125, -2.60015869140625, -2.4365234375, -2.27288818359375, -2.1092529296875, -1.94561767578125, -1.781982421875, -1.61834716796875, -1.4547119140625, -1.29107666015625, -1.12744140625, -0.96380615234375, -0.8001708984375, -0.63653564453125, -0.472900390625, -0.30926513671875, -0.1456298828125, 0.01800537109375, 0.181640625, 0.34527587890625, 0.5089111328125, 0.67254638671875, 0.836181640625, 0.99981689453125, 1.1634521484375, 1.32708740234375, 1.49072265625, 1.65435791015625, 1.8179931640625, 1.98162841796875, 2.145263671875, 2.30889892578125, 2.4725341796875, 2.63616943359375, 2.7998046875, 2.96343994140625, 3.1270751953125, 3.29071044921875, 3.454345703125, 3.61798095703125, 3.7816162109375, 3.94525146484375, 4.10888671875, 4.27252197265625, 4.4361572265625, 4.59979248046875, 4.763427734375, 4.92706298828125, 5.0906982421875, 5.25433349609375, 5.41796875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 5.0, 8.0, 7.0, 13.0, 15.0, 21.0, 34.0, 58.0, 81.0, 116.0, 170.0, 143.0, 104.0, 70.0, 31.0, 23.0, 11.0, 7.0, 11.0, 8.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0012054443359375, -0.0011696070432662964, -0.0011337697505950928, -0.0010979324579238892, -0.0010620951652526855, -0.001026257872581482, -0.0009904205799102783, -0.0009545832872390747, -0.0009187459945678711, -0.0008829087018966675, -0.0008470714092254639, -0.0008112341165542603, -0.0007753968238830566, -0.000739559531211853, -0.0007037222385406494, -0.0006678849458694458, -0.0006320476531982422, -0.0005962103605270386, -0.000560373067855835, -0.0005245357751846313, -0.0004886984825134277, -0.0004528611898422241, -0.0004170238971710205, -0.0003811866044998169, -0.0003453493118286133, -0.00030951201915740967, -0.00027367472648620605, -0.00023783743381500244, -0.00020200014114379883, -0.00016616284847259521, -0.0001303255558013916, -9.448826313018799e-05, -5.8650970458984375e-05, -2.2813677787780762e-05, 1.3023614883422852e-05, 4.8860907554626465e-05, 8.469820022583008e-05, 0.00012053549289703369, 0.0001563727855682373, 0.00019221007823944092, 0.00022804737091064453, 0.00026388466358184814, 0.00029972195625305176, 0.00033555924892425537, 0.000371396541595459, 0.0004072338342666626, 0.0004430711269378662, 0.0004789084196090698, 0.0005147457122802734, 0.000550583004951477, 0.0005864202976226807, 0.0006222575902938843, 0.0006580948829650879, 0.0006939321756362915, 0.0007297694683074951, 0.0007656067609786987, 0.0008014440536499023, 0.000837281346321106, 0.0008731186389923096, 0.0009089559316635132, 0.0009447932243347168, 0.0009806305170059204, 0.001016467809677124, 0.0010523051023483276, 0.0010881423950195312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 14.0, 19.0, 32.0, 35.0, 35.0, 71.0, 107.0, 153.0, 246.0, 371.0, 639.0, 1143.0, 2335.0, 5153.0, 13697.0, 48232.0, 272256.0, 614091.0, 61475.0, 16460.0, 6026.0, 2583.0, 1306.0, 727.0, 447.0, 304.0, 179.0, 120.0, 82.0, 60.0, 31.0, 28.0, 26.0, 16.0, 16.0, 13.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.419921875, -3.302337646484375, -3.18475341796875, -3.067169189453125, -2.9495849609375, -2.832000732421875, -2.71441650390625, -2.596832275390625, -2.479248046875, -2.361663818359375, -2.24407958984375, -2.126495361328125, -2.0089111328125, -1.891326904296875, -1.77374267578125, -1.656158447265625, -1.53857421875, -1.420989990234375, -1.30340576171875, -1.185821533203125, -1.0682373046875, -0.950653076171875, -0.83306884765625, -0.715484619140625, -0.597900390625, -0.480316162109375, -0.36273193359375, -0.245147705078125, -0.1275634765625, -0.009979248046875, 0.10760498046875, 0.225189208984375, 0.3427734375, 0.460357666015625, 0.57794189453125, 0.695526123046875, 0.8131103515625, 0.930694580078125, 1.04827880859375, 1.165863037109375, 1.283447265625, 1.401031494140625, 1.51861572265625, 1.636199951171875, 1.7537841796875, 1.871368408203125, 1.98895263671875, 2.106536865234375, 2.22412109375, 2.341705322265625, 2.45928955078125, 2.576873779296875, 2.6944580078125, 2.812042236328125, 2.92962646484375, 3.047210693359375, 3.164794921875, 3.282379150390625, 3.39996337890625, 3.517547607421875, 3.6351318359375, 3.752716064453125, 3.87030029296875, 3.987884521484375, 4.10546875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 9.0, 8.0, 14.0, 20.0, 27.0, 29.0, 34.0, 35.0, 54.0, 74.0, 90.0, 77.0, 81.0, 84.0, 67.0, 63.0, 34.0, 38.0, 32.0, 18.0, 22.0, 19.0, 12.0, 7.0, 5.0, 5.0, 7.0, 3.0, 2.0, 8.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.47265625, -4.341278076171875, -4.20989990234375, -4.078521728515625, -3.9471435546875, -3.815765380859375, -3.68438720703125, -3.553009033203125, -3.421630859375, -3.290252685546875, -3.15887451171875, -3.027496337890625, -2.8961181640625, -2.764739990234375, -2.63336181640625, -2.501983642578125, -2.37060546875, -2.239227294921875, -2.10784912109375, -1.976470947265625, -1.8450927734375, -1.713714599609375, -1.58233642578125, -1.450958251953125, -1.319580078125, -1.188201904296875, -1.05682373046875, -0.925445556640625, -0.7940673828125, -0.662689208984375, -0.53131103515625, -0.399932861328125, -0.2685546875, -0.137176513671875, -0.00579833984375, 0.125579833984375, 0.2569580078125, 0.388336181640625, 0.51971435546875, 0.651092529296875, 0.782470703125, 0.913848876953125, 1.04522705078125, 1.176605224609375, 1.3079833984375, 1.439361572265625, 1.57073974609375, 1.702117919921875, 1.83349609375, 1.964874267578125, 2.09625244140625, 2.227630615234375, 2.3590087890625, 2.490386962890625, 2.62176513671875, 2.753143310546875, 2.884521484375, 3.015899658203125, 3.14727783203125, 3.278656005859375, 3.4100341796875, 3.541412353515625, 3.67279052734375, 3.804168701171875, 3.935546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 1.0, 4.0, 9.0, 17.0, 44.0, 55.0, 127.0, 380.0, 166.0, 101.0, 42.0, 19.0, 17.0, 6.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-184.843505859375, -179.34193420410156, -173.84036254882812, -168.3387908935547, -162.83721923828125, -157.33566284179688, -151.83409118652344, -146.33251953125, -140.83094787597656, -135.32937622070312, -129.8278045654297, -124.32624053955078, -118.82466888427734, -113.3230972290039, -107.821533203125, -102.31996154785156, -96.81838989257812, -91.31681823730469, -85.81524658203125, -80.31368255615234, -74.8121109008789, -69.31053924560547, -63.8089714050293, -58.307403564453125, -52.80583190917969, -47.30426025390625, -41.80269241333008, -36.301124572753906, -30.79955291748047, -25.297983169555664, -19.79641342163086, -14.294845581054688, -8.79327392578125, -3.2917041778564453, 2.2098655700683594, 7.711435317993164, 13.213005065917969, 18.714574813842773, 24.216144561767578, 29.71771240234375, 35.21928405761719, 40.720855712890625, 46.2224235534668, 51.72399139404297, 57.225563049316406, 62.727134704589844, 68.22869873046875, 73.73027038574219, 79.23184204101562, 84.73341369628906, 90.2349853515625, 95.7365493774414, 101.23812103271484, 106.73969268798828, 112.24125671386719, 117.74282836914062, 123.24440002441406, 128.7459716796875, 134.24754333496094, 139.74911499023438, 145.25067138671875, 150.7522430419922, 156.25381469726562, 161.75538635253906, 167.2569580078125]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 3.0, 11.0, 2.0, 7.0, 14.0, 18.0, 18.0, 22.0, 22.0, 33.0, 26.0, 36.0, 23.0, 44.0, 52.0, 114.0, 120.0, 77.0, 57.0, 30.0, 34.0, 33.0, 26.0, 23.0, 22.0, 18.0, 18.0, 14.0, 19.0, 11.0, 10.0, 9.0, 3.0, 4.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-124.07186126708984, -120.24730682373047, -116.4227523803711, -112.59819793701172, -108.77363586425781, -104.94908142089844, -101.12452697753906, -97.29997253417969, -93.47541809082031, -89.65086364746094, -85.82630920410156, -82.00175476074219, -78.17720031738281, -74.35264587402344, -70.52808380126953, -66.70352935791016, -62.87897491455078, -59.054420471191406, -55.22986602783203, -51.40530776977539, -47.580753326416016, -43.75619888305664, -39.931640625, -36.107086181640625, -32.28253173828125, -28.457977294921875, -24.633420944213867, -20.80886459350586, -16.984310150146484, -13.15975570678711, -9.335199356079102, -5.510643005371094, -1.6860809326171875, 2.138474464416504, 5.963029861450195, 9.787585258483887, 13.612140655517578, 17.436695098876953, 21.26125144958496, 25.08580780029297, 28.910362243652344, 32.73491668701172, 36.559471130371094, 40.384029388427734, 44.20858383178711, 48.033138275146484, 51.857696533203125, 55.6822509765625, 59.506805419921875, 63.33135986328125, 67.15591430664062, 70.98046875, 74.80502319335938, 78.62957763671875, 82.45413970947266, 86.27869415283203, 90.1032485961914, 93.92780303955078, 97.75235748291016, 101.57691192626953, 105.40147399902344, 109.22602844238281, 113.05058288574219, 116.87513732910156, 120.69969177246094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 12.0, 8.0, 10.0, 9.0, 19.0, 20.0, 40.0, 53.0, 70.0, 106.0, 146.0, 225.0, 320.0, 548.0, 888.0, 1536.0, 2958.0, 6238.0, 15937.0, 54800.0, 263145.0, 1170191.0, 1907127.0, 598606.0, 122088.0, 29766.0, 9790.0, 4293.0, 2203.0, 1182.0, 669.0, 439.0, 256.0, 169.0, 128.0, 84.0, 57.0, 40.0, 23.0, 17.0, 18.0, 14.0, 8.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-12.6171875, -12.2489013671875, -11.880615234375, -11.5123291015625, -11.14404296875, -10.7757568359375, -10.407470703125, -10.0391845703125, -9.6708984375, -9.3026123046875, -8.934326171875, -8.5660400390625, -8.19775390625, -7.8294677734375, -7.461181640625, -7.0928955078125, -6.724609375, -6.3563232421875, -5.988037109375, -5.6197509765625, -5.25146484375, -4.8831787109375, -4.514892578125, -4.1466064453125, -3.7783203125, -3.4100341796875, -3.041748046875, -2.6734619140625, -2.30517578125, -1.9368896484375, -1.568603515625, -1.2003173828125, -0.83203125, -0.4637451171875, -0.095458984375, 0.2728271484375, 0.64111328125, 1.0093994140625, 1.377685546875, 1.7459716796875, 2.1142578125, 2.4825439453125, 2.850830078125, 3.2191162109375, 3.58740234375, 3.9556884765625, 4.323974609375, 4.6922607421875, 5.060546875, 5.4288330078125, 5.797119140625, 6.1654052734375, 6.53369140625, 6.9019775390625, 7.270263671875, 7.6385498046875, 8.0068359375, 8.3751220703125, 8.743408203125, 9.1116943359375, 9.47998046875, 9.8482666015625, 10.216552734375, 10.5848388671875, 10.953125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 8.0, 16.0, 12.0, 14.0, 21.0, 20.0, 26.0, 20.0, 29.0, 33.0, 42.0, 41.0, 43.0, 65.0, 48.0, 41.0, 46.0, 53.0, 66.0, 41.0, 42.0, 47.0, 31.0, 31.0, 22.0, 28.0, 19.0, 21.0, 13.0, 10.0, 4.0, 12.0, 3.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.41357421875, -8.1318359375, -7.85009765625, -7.568359375, -7.28662109375, -7.0048828125, -6.72314453125, -6.44140625, -6.15966796875, -5.8779296875, -5.59619140625, -5.314453125, -5.03271484375, -4.7509765625, -4.46923828125, -4.1875, -3.90576171875, -3.6240234375, -3.34228515625, -3.060546875, -2.77880859375, -2.4970703125, -2.21533203125, -1.93359375, -1.65185546875, -1.3701171875, -1.08837890625, -0.806640625, -0.52490234375, -0.2431640625, 0.03857421875, 0.3203125, 0.60205078125, 0.8837890625, 1.16552734375, 1.447265625, 1.72900390625, 2.0107421875, 2.29248046875, 2.57421875, 2.85595703125, 3.1376953125, 3.41943359375, 3.701171875, 3.98291015625, 4.2646484375, 4.54638671875, 4.828125, 5.10986328125, 5.3916015625, 5.67333984375, 5.955078125, 6.23681640625, 6.5185546875, 6.80029296875, 7.08203125, 7.36376953125, 7.6455078125, 7.92724609375, 8.208984375, 8.49072265625, 8.7724609375, 9.05419921875, 9.3359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 13.0, 10.0, 10.0, 17.0, 18.0, 30.0, 38.0, 44.0, 84.0, 113.0, 156.0, 208.0, 364.0, 603.0, 1185.0, 3048.0, 10677.0, 72664.0, 3065464.0, 988634.0, 39085.0, 7153.0, 2191.0, 963.0, 513.0, 307.0, 205.0, 135.0, 85.0, 67.0, 56.0, 41.0, 31.0, 13.0, 15.0, 8.0, 10.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.453125, -25.567626953125, -24.68212890625, -23.796630859375, -22.9111328125, -22.025634765625, -21.14013671875, -20.254638671875, -19.369140625, -18.483642578125, -17.59814453125, -16.712646484375, -15.8271484375, -14.941650390625, -14.05615234375, -13.170654296875, -12.28515625, -11.399658203125, -10.51416015625, -9.628662109375, -8.7431640625, -7.857666015625, -6.97216796875, -6.086669921875, -5.201171875, -4.315673828125, -3.43017578125, -2.544677734375, -1.6591796875, -0.773681640625, 0.11181640625, 0.997314453125, 1.8828125, 2.768310546875, 3.65380859375, 4.539306640625, 5.4248046875, 6.310302734375, 7.19580078125, 8.081298828125, 8.966796875, 9.852294921875, 10.73779296875, 11.623291015625, 12.5087890625, 13.394287109375, 14.27978515625, 15.165283203125, 16.05078125, 16.936279296875, 17.82177734375, 18.707275390625, 19.5927734375, 20.478271484375, 21.36376953125, 22.249267578125, 23.134765625, 24.020263671875, 24.90576171875, 25.791259765625, 26.6767578125, 27.562255859375, 28.44775390625, 29.333251953125, 30.21875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 8.0, 7.0, 15.0, 12.0, 18.0, 30.0, 28.0, 39.0, 66.0, 77.0, 97.0, 130.0, 211.0, 307.0, 370.0, 492.0, 501.0, 434.0, 358.0, 246.0, 171.0, 119.0, 77.0, 56.0, 41.0, 28.0, 25.0, 16.0, 19.0, 11.0, 8.0, 7.0, 8.0, 5.0, 6.0, 1.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.2099609375, -20.576171875, -19.9423828125, -19.30859375, -18.6748046875, -18.041015625, -17.4072265625, -16.7734375, -16.1396484375, -15.505859375, -14.8720703125, -14.23828125, -13.6044921875, -12.970703125, -12.3369140625, -11.703125, -11.0693359375, -10.435546875, -9.8017578125, -9.16796875, -8.5341796875, -7.900390625, -7.2666015625, -6.6328125, -5.9990234375, -5.365234375, -4.7314453125, -4.09765625, -3.4638671875, -2.830078125, -2.1962890625, -1.5625, -0.9287109375, -0.294921875, 0.3388671875, 0.97265625, 1.6064453125, 2.240234375, 2.8740234375, 3.5078125, 4.1416015625, 4.775390625, 5.4091796875, 6.04296875, 6.6767578125, 7.310546875, 7.9443359375, 8.578125, 9.2119140625, 9.845703125, 10.4794921875, 11.11328125, 11.7470703125, 12.380859375, 13.0146484375, 13.6484375, 14.2822265625, 14.916015625, 15.5498046875, 16.18359375, 16.8173828125, 17.451171875, 18.0849609375, 18.71875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 8.0, 10.0, 16.0, 25.0, 31.0, 45.0, 77.0, 125.0, 153.0, 164.0, 129.0, 88.0, 41.0, 31.0, 22.0, 14.0, 6.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-179.49951171875, -172.38548278808594, -165.27145385742188, -158.15740966796875, -151.0433807373047, -143.92935180664062, -136.81532287597656, -129.7012939453125, -122.5872573852539, -115.47322845458984, -108.35919189453125, -101.24516296386719, -94.13113403320312, -87.01709747314453, -79.90306854248047, -72.78903198242188, -65.67500305175781, -58.560970306396484, -51.446937561035156, -44.332908630371094, -37.218875885009766, -30.104843139648438, -22.990814208984375, -15.876781463623047, -8.762748718261719, -1.648716926574707, 5.465314865112305, 12.579345703125, 19.693378448486328, 26.807411193847656, 33.92144012451172, 41.03547286987305, 48.149505615234375, 55.2635383605957, 62.37757110595703, 69.4916000366211, 76.60563659667969, 83.71966552734375, 90.83369445800781, 97.94772338867188, 105.06175994873047, 112.17578887939453, 119.28982543945312, 126.40385437011719, 133.51788330078125, 140.63192749023438, 147.74594116210938, 154.8599853515625, 161.97401428222656, 169.08804321289062, 176.2020721435547, 183.31610107421875, 190.43014526367188, 197.54417419433594, 204.658203125, 211.77223205566406, 218.88626098632812, 226.0002899169922, 233.11431884765625, 240.22836303710938, 247.34239196777344, 254.4564208984375, 261.5704345703125, 268.6844787597656, 275.79852294921875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 15.0, 8.0, 9.0, 11.0, 9.0, 19.0, 20.0, 26.0, 22.0, 26.0, 31.0, 27.0, 34.0, 34.0, 53.0, 37.0, 49.0, 57.0, 51.0, 50.0, 32.0, 36.0, 39.0, 29.0, 33.0, 30.0, 31.0, 36.0, 18.0, 25.0, 18.0, 15.0, 6.0, 12.0, 3.0, 4.0, 5.0, 5.0, 3.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-104.94803619384766, -101.1576156616211, -97.36720275878906, -93.5767822265625, -89.78636169433594, -85.99594116210938, -82.20552825927734, -78.41510772705078, -74.62469482421875, -70.83427429199219, -67.04386138916016, -63.253440856933594, -59.46302032470703, -55.672603607177734, -51.88218688964844, -48.091766357421875, -44.30134582519531, -40.510929107666016, -36.72050857543945, -32.930091857910156, -29.139673233032227, -25.349254608154297, -21.558837890625, -17.76841926574707, -13.97800064086914, -10.187582015991211, -6.397164344787598, -2.6067466735839844, 1.1836719512939453, 4.974090576171875, 8.764507293701172, 12.554925918579102, 16.345352172851562, 20.135770797729492, 23.926189422607422, 27.71660614013672, 31.50702476501465, 35.29744338989258, 39.087860107421875, 42.87828063964844, 46.668697357177734, 50.45911407470703, 54.249534606933594, 58.03995132446289, 61.83036804199219, 65.62078857421875, 69.41120910644531, 73.20162200927734, 76.9920425415039, 80.78246307373047, 84.5728759765625, 88.36329650878906, 92.15371704101562, 95.94413757324219, 99.73455047607422, 103.52497100830078, 107.31538391113281, 111.10580444335938, 114.8962173461914, 118.68663787841797, 122.47705841064453, 126.26747131347656, 130.05789184570312, 133.8483123779297, 137.63873291015625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 10.0, 10.0, 20.0, 34.0, 56.0, 98.0, 171.0, 269.0, 452.0, 796.0, 1531.0, 3245.0, 7660.0, 20067.0, 61939.0, 223328.0, 498038.0, 157852.0, 45725.0, 15496.0, 6059.0, 2780.0, 1277.0, 653.0, 378.0, 240.0, 136.0, 83.0, 58.0, 33.0, 18.0, 16.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.8125, -17.32275390625, -16.8330078125, -16.34326171875, -15.853515625, -15.36376953125, -14.8740234375, -14.38427734375, -13.89453125, -13.40478515625, -12.9150390625, -12.42529296875, -11.935546875, -11.44580078125, -10.9560546875, -10.46630859375, -9.9765625, -9.48681640625, -8.9970703125, -8.50732421875, -8.017578125, -7.52783203125, -7.0380859375, -6.54833984375, -6.05859375, -5.56884765625, -5.0791015625, -4.58935546875, -4.099609375, -3.60986328125, -3.1201171875, -2.63037109375, -2.140625, -1.65087890625, -1.1611328125, -0.67138671875, -0.181640625, 0.30810546875, 0.7978515625, 1.28759765625, 1.77734375, 2.26708984375, 2.7568359375, 3.24658203125, 3.736328125, 4.22607421875, 4.7158203125, 5.20556640625, 5.6953125, 6.18505859375, 6.6748046875, 7.16455078125, 7.654296875, 8.14404296875, 8.6337890625, 9.12353515625, 9.61328125, 10.10302734375, 10.5927734375, 11.08251953125, 11.572265625, 12.06201171875, 12.5517578125, 13.04150390625, 13.53125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 8.0, 10.0, 7.0, 12.0, 22.0, 25.0, 31.0, 28.0, 39.0, 37.0, 36.0, 48.0, 55.0, 67.0, 58.0, 51.0, 59.0, 61.0, 46.0, 59.0, 51.0, 35.0, 36.0, 26.0, 20.0, 16.0, 13.0, 8.0, 11.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.234375, -12.8675537109375, -12.500732421875, -12.1339111328125, -11.76708984375, -11.4002685546875, -11.033447265625, -10.6666259765625, -10.2998046875, -9.9329833984375, -9.566162109375, -9.1993408203125, -8.83251953125, -8.4656982421875, -8.098876953125, -7.7320556640625, -7.365234375, -6.9984130859375, -6.631591796875, -6.2647705078125, -5.89794921875, -5.5311279296875, -5.164306640625, -4.7974853515625, -4.4306640625, -4.0638427734375, -3.697021484375, -3.3302001953125, -2.96337890625, -2.5965576171875, -2.229736328125, -1.8629150390625, -1.49609375, -1.1292724609375, -0.762451171875, -0.3956298828125, -0.02880859375, 0.3380126953125, 0.704833984375, 1.0716552734375, 1.4384765625, 1.8052978515625, 2.172119140625, 2.5389404296875, 2.90576171875, 3.2725830078125, 3.639404296875, 4.0062255859375, 4.373046875, 4.7398681640625, 5.106689453125, 5.4735107421875, 5.84033203125, 6.2071533203125, 6.573974609375, 6.9407958984375, 7.3076171875, 7.6744384765625, 8.041259765625, 8.4080810546875, 8.77490234375, 9.1417236328125, 9.508544921875, 9.8753662109375, 10.2421875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 5.0, 6.0, 4.0, 10.0, 22.0, 33.0, 34.0, 52.0, 89.0, 130.0, 233.0, 422.0, 854.0, 2374.0, 10242.0, 122118.0, 858776.0, 44252.0, 5667.0, 1605.0, 667.0, 346.0, 175.0, 128.0, 103.0, 52.0, 52.0, 17.0, 18.0, 15.0, 13.0, 7.0, 10.0, 8.0, 6.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-22.859375, -22.080078125, -21.30078125, -20.521484375, -19.7421875, -18.962890625, -18.18359375, -17.404296875, -16.625, -15.845703125, -15.06640625, -14.287109375, -13.5078125, -12.728515625, -11.94921875, -11.169921875, -10.390625, -9.611328125, -8.83203125, -8.052734375, -7.2734375, -6.494140625, -5.71484375, -4.935546875, -4.15625, -3.376953125, -2.59765625, -1.818359375, -1.0390625, -0.259765625, 0.51953125, 1.298828125, 2.078125, 2.857421875, 3.63671875, 4.416015625, 5.1953125, 5.974609375, 6.75390625, 7.533203125, 8.3125, 9.091796875, 9.87109375, 10.650390625, 11.4296875, 12.208984375, 12.98828125, 13.767578125, 14.546875, 15.326171875, 16.10546875, 16.884765625, 17.6640625, 18.443359375, 19.22265625, 20.001953125, 20.78125, 21.560546875, 22.33984375, 23.119140625, 23.8984375, 24.677734375, 25.45703125, 26.236328125, 27.015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 9.0, 6.0, 9.0, 13.0, 13.0, 16.0, 30.0, 29.0, 43.0, 45.0, 54.0, 69.0, 101.0, 93.0, 99.0, 62.0, 52.0, 45.0, 33.0, 27.0, 37.0, 29.0, 19.0, 12.0, 13.0, 7.0, 6.0, 9.0, 1.0, 2.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.78125, -39.24658203125, -37.7119140625, -36.17724609375, -34.642578125, -33.10791015625, -31.5732421875, -30.03857421875, -28.50390625, -26.96923828125, -25.4345703125, -23.89990234375, -22.365234375, -20.83056640625, -19.2958984375, -17.76123046875, -16.2265625, -14.69189453125, -13.1572265625, -11.62255859375, -10.087890625, -8.55322265625, -7.0185546875, -5.48388671875, -3.94921875, -2.41455078125, -0.8798828125, 0.65478515625, 2.189453125, 3.72412109375, 5.2587890625, 6.79345703125, 8.328125, 9.86279296875, 11.3974609375, 12.93212890625, 14.466796875, 16.00146484375, 17.5361328125, 19.07080078125, 20.60546875, 22.14013671875, 23.6748046875, 25.20947265625, 26.744140625, 28.27880859375, 29.8134765625, 31.34814453125, 32.8828125, 34.41748046875, 35.9521484375, 37.48681640625, 39.021484375, 40.55615234375, 42.0908203125, 43.62548828125, 45.16015625, 46.69482421875, 48.2294921875, 49.76416015625, 51.298828125, 52.83349609375, 54.3681640625, 55.90283203125, 57.4375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 7.0, 3.0, 17.0, 10.0, 20.0, 27.0, 56.0, 48.0, 133.0, 173.0, 258.0, 561.0, 1280.0, 3705.0, 14211.0, 92873.0, 868815.0, 51813.0, 9707.0, 2708.0, 988.0, 411.0, 240.0, 154.0, 104.0, 58.0, 35.0, 26.0, 23.0, 13.0, 11.0, 10.0, 10.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.2835693359375, -2.205810546875, -2.1280517578125, -2.05029296875, -1.9725341796875, -1.894775390625, -1.8170166015625, -1.7392578125, -1.6614990234375, -1.583740234375, -1.5059814453125, -1.42822265625, -1.3504638671875, -1.272705078125, -1.1949462890625, -1.1171875, -1.0394287109375, -0.961669921875, -0.8839111328125, -0.80615234375, -0.7283935546875, -0.650634765625, -0.5728759765625, -0.4951171875, -0.4173583984375, -0.339599609375, -0.2618408203125, -0.18408203125, -0.1063232421875, -0.028564453125, 0.0491943359375, 0.126953125, 0.2047119140625, 0.282470703125, 0.3602294921875, 0.43798828125, 0.5157470703125, 0.593505859375, 0.6712646484375, 0.7490234375, 0.8267822265625, 0.904541015625, 0.9822998046875, 1.06005859375, 1.1378173828125, 1.215576171875, 1.2933349609375, 1.37109375, 1.4488525390625, 1.526611328125, 1.6043701171875, 1.68212890625, 1.7598876953125, 1.837646484375, 1.9154052734375, 1.9931640625, 2.0709228515625, 2.148681640625, 2.2264404296875, 2.30419921875, 2.3819580078125, 2.459716796875, 2.5374755859375, 2.615234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 6.0, 11.0, 10.0, 13.0, 12.0, 16.0, 22.0, 34.0, 35.0, 65.0, 105.0, 116.0, 126.0, 111.0, 105.0, 58.0, 31.0, 25.0, 22.0, 14.0, 14.0, 7.0, 7.0, 13.0, 7.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005545616149902344, -0.0005383715033531189, -0.0005221813917160034, -0.0005059912800788879, -0.0004898011684417725, -0.000473611056804657, -0.0004574209451675415, -0.000441230833530426, -0.00042504072189331055, -0.00040885061025619507, -0.0003926604986190796, -0.0003764703869819641, -0.00036028027534484863, -0.00034409016370773315, -0.0003279000520706177, -0.0003117099404335022, -0.0002955198287963867, -0.00027932971715927124, -0.00026313960552215576, -0.0002469494938850403, -0.0002307593822479248, -0.00021456927061080933, -0.00019837915897369385, -0.00018218904733657837, -0.0001659989356994629, -0.0001498088240623474, -0.00013361871242523193, -0.00011742860078811646, -0.00010123848915100098, -8.50483775138855e-05, -6.885826587677002e-05, -5.266815423965454e-05, -3.647804260253906e-05, -2.0287930965423584e-05, -4.0978193283081055e-06, 1.2092292308807373e-05, 2.828240394592285e-05, 4.447251558303833e-05, 6.066262722015381e-05, 7.685273885726929e-05, 9.304285049438477e-05, 0.00010923296213150024, 0.00012542307376861572, 0.0001416131854057312, 0.00015780329704284668, 0.00017399340867996216, 0.00019018352031707764, 0.00020637363195419312, 0.0002225637435913086, 0.00023875385522842407, 0.00025494396686553955, 0.00027113407850265503, 0.0002873241901397705, 0.000303514301776886, 0.00031970441341400146, 0.00033589452505111694, 0.0003520846366882324, 0.0003682747483253479, 0.0003844648599624634, 0.00040065497159957886, 0.00041684508323669434, 0.0004330351948738098, 0.0004492253065109253, 0.00046541541814804077, 0.00048160552978515625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 8.0, 2.0, 7.0, 7.0, 11.0, 18.0, 22.0, 51.0, 62.0, 100.0, 131.0, 205.0, 353.0, 588.0, 1080.0, 2223.0, 4893.0, 12605.0, 38467.0, 230551.0, 662821.0, 63326.0, 18174.0, 6579.0, 2927.0, 1343.0, 785.0, 435.0, 245.0, 165.0, 110.0, 71.0, 55.0, 34.0, 27.0, 14.0, 9.0, 14.0, 8.0, 8.0, 5.0, 3.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.66015625, -1.6085662841796875, -1.556976318359375, -1.5053863525390625, -1.45379638671875, -1.4022064208984375, -1.350616455078125, -1.2990264892578125, -1.2474365234375, -1.1958465576171875, -1.144256591796875, -1.0926666259765625, -1.04107666015625, -0.9894866943359375, -0.937896728515625, -0.8863067626953125, -0.834716796875, -0.7831268310546875, -0.731536865234375, -0.6799468994140625, -0.62835693359375, -0.5767669677734375, -0.525177001953125, -0.4735870361328125, -0.4219970703125, -0.3704071044921875, -0.318817138671875, -0.2672271728515625, -0.21563720703125, -0.1640472412109375, -0.112457275390625, -0.0608673095703125, -0.00927734375, 0.0423126220703125, 0.093902587890625, 0.1454925537109375, 0.19708251953125, 0.2486724853515625, 0.300262451171875, 0.3518524169921875, 0.4034423828125, 0.4550323486328125, 0.506622314453125, 0.5582122802734375, 0.60980224609375, 0.6613922119140625, 0.712982177734375, 0.7645721435546875, 0.816162109375, 0.8677520751953125, 0.919342041015625, 0.9709320068359375, 1.02252197265625, 1.0741119384765625, 1.125701904296875, 1.1772918701171875, 1.2288818359375, 1.2804718017578125, 1.332061767578125, 1.3836517333984375, 1.43524169921875, 1.4868316650390625, 1.538421630859375, 1.5900115966796875, 1.6416015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 11.0, 7.0, 19.0, 17.0, 17.0, 20.0, 53.0, 37.0, 42.0, 74.0, 91.0, 125.0, 126.0, 83.0, 60.0, 46.0, 35.0, 38.0, 21.0, 18.0, 8.0, 14.0, 7.0, 7.0, 6.0, 1.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.4447021484375, -2.346435546875, -2.2481689453125, -2.14990234375, -2.0516357421875, -1.953369140625, -1.8551025390625, -1.7568359375, -1.6585693359375, -1.560302734375, -1.4620361328125, -1.36376953125, -1.2655029296875, -1.167236328125, -1.0689697265625, -0.970703125, -0.8724365234375, -0.774169921875, -0.6759033203125, -0.57763671875, -0.4793701171875, -0.381103515625, -0.2828369140625, -0.1845703125, -0.0863037109375, 0.011962890625, 0.1102294921875, 0.20849609375, 0.3067626953125, 0.405029296875, 0.5032958984375, 0.6015625, 0.6998291015625, 0.798095703125, 0.8963623046875, 0.99462890625, 1.0928955078125, 1.191162109375, 1.2894287109375, 1.3876953125, 1.4859619140625, 1.584228515625, 1.6824951171875, 1.78076171875, 1.8790283203125, 1.977294921875, 2.0755615234375, 2.173828125, 2.2720947265625, 2.370361328125, 2.4686279296875, 2.56689453125, 2.6651611328125, 2.763427734375, 2.8616943359375, 2.9599609375, 3.0582275390625, 3.156494140625, 3.2547607421875, 3.35302734375, 3.4512939453125, 3.549560546875, 3.6478271484375, 3.74609375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 2.0, 2.0, 3.0, 5.0, 15.0, 12.0, 16.0, 34.0, 75.0, 186.0, 267.0, 203.0, 93.0, 48.0, 18.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-147.26199340820312, -142.27487182617188, -137.2877655029297, -132.30064392089844, -127.31353759765625, -122.326416015625, -117.33930206298828, -112.35218811035156, -107.36507415771484, -102.37796020507812, -97.3908462524414, -92.40373229980469, -87.41661071777344, -82.42950439453125, -77.4423828125, -72.45526885986328, -67.46815490722656, -62.481040954589844, -57.493927001953125, -52.50680923461914, -47.51969528198242, -42.5325813293457, -37.54546356201172, -32.558349609375, -27.57123565673828, -22.584121704101562, -17.59700584411621, -12.609890937805176, -7.622776031494141, -2.635662078857422, 2.3514537811279297, 7.338569641113281, 12.325698852539062, 17.31281280517578, 22.299928665161133, 27.287044525146484, 32.2741584777832, 37.26127243041992, 42.248390197753906, 47.235504150390625, 52.222618103027344, 57.20973205566406, 62.19684600830078, 67.1839599609375, 72.17108154296875, 77.15818786621094, 82.14530944824219, 87.1324234008789, 92.11953735351562, 97.10665130615234, 102.09376525878906, 107.08087921142578, 112.0679931640625, 117.05511474609375, 122.04222869873047, 127.02934265136719, 132.01644897460938, 137.00357055664062, 141.9906768798828, 146.97779846191406, 151.96490478515625, 156.9520263671875, 161.9391326904297, 166.92625427246094, 171.9133758544922]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 7.0, 7.0, 12.0, 9.0, 16.0, 19.0, 23.0, 24.0, 61.0, 112.0, 98.0, 44.0, 46.0, 41.0, 35.0, 63.0, 84.0, 94.0, 55.0, 38.0, 14.0, 21.0, 10.0, 11.0, 9.0, 6.0, 3.0, 7.0, 6.0, 1.0, 5.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-124.95172882080078, -121.33545684814453, -117.71917724609375, -114.1029052734375, -110.48663330078125, -106.870361328125, -103.25408935546875, -99.63780975341797, -96.02153778076172, -92.40526580810547, -88.78898620605469, -85.17271423339844, -81.55644226074219, -77.94017028808594, -74.32389831542969, -70.7076187133789, -67.09134674072266, -63.475074768066406, -59.85879898071289, -56.242523193359375, -52.626251220703125, -49.009979248046875, -45.39370346069336, -41.777427673339844, -38.161155700683594, -34.544883728027344, -30.928607940673828, -27.312334060668945, -23.696060180664062, -20.07978630065918, -16.463512420654297, -12.847238540649414, -9.230972290039062, -5.61469841003418, -1.9984245300292969, 1.617849349975586, 5.234123229980469, 8.850397109985352, 12.466670989990234, 16.082944869995117, 19.69921875, 23.315492630004883, 26.931766510009766, 30.54804039001465, 34.16431427001953, 37.78058624267578, 41.3968620300293, 45.01313781738281, 48.62940979003906, 52.24568176269531, 55.86195755004883, 59.478233337402344, 63.094505310058594, 66.71077728271484, 70.32705688476562, 73.94332885742188, 77.55960083007812, 81.17587280273438, 84.79214477539062, 88.4084243774414, 92.02469635009766, 95.6409683227539, 99.25724792480469, 102.87351989746094, 106.48979187011719]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 5.0, 8.0, 7.0, 9.0, 9.0, 14.0, 5.0, 15.0, 14.0, 23.0, 32.0, 25.0, 32.0, 32.0, 48.0, 94.0, 246.0, 96.0, 42.0, 25.0, 37.0, 33.0, 16.0, 17.0, 21.0, 14.0, 9.0, 16.0, 10.0, 5.0, 5.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.34576416015625, -7.0782470703125, -6.81072998046875, -6.543212890625, -6.27569580078125, -6.0081787109375, -5.74066162109375, -5.47314453125, -5.20562744140625, -4.9381103515625, -4.67059326171875, -4.403076171875, -4.13555908203125, -3.8680419921875, -3.60052490234375, -3.3330078125, -3.06549072265625, -2.7979736328125, -2.53045654296875, -2.262939453125, -1.99542236328125, -1.7279052734375, -1.46038818359375, -1.19287109375, -0.92535400390625, -0.6578369140625, -0.39031982421875, -0.122802734375, 0.14471435546875, 0.4122314453125, 0.67974853515625, 0.947265625, 1.21478271484375, 1.4822998046875, 1.74981689453125, 2.017333984375, 2.28485107421875, 2.5523681640625, 2.81988525390625, 3.08740234375, 3.35491943359375, 3.6224365234375, 3.88995361328125, 4.157470703125, 4.42498779296875, 4.6925048828125, 4.96002197265625, 5.2275390625, 5.49505615234375, 5.7625732421875, 6.03009033203125, 6.297607421875, 6.56512451171875, 6.8326416015625, 7.10015869140625, 7.36767578125, 7.63519287109375, 7.9027099609375, 8.17022705078125, 8.437744140625, 8.70526123046875, 8.9727783203125, 9.24029541015625, 9.5078125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 5.0, 10.0, 8.0, 12.0, 23.0, 38.0, 42.0, 75.0, 92.0, 187.0, 331.0, 764.0, 2098.0, 6646.0, 74963.0, 8287627.0, 10675.0, 2911.0, 1032.0, 449.0, 194.0, 133.0, 69.0, 44.0, 29.0, 16.0, 10.0, 16.0, 12.0, 7.0, 11.0, 9.0, 6.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-82.97441101074219, -80.68035888671875, -78.38629913330078, -76.09224700927734, -73.79818725585938, -71.50413513183594, -69.21007537841797, -66.91602325439453, -64.62196350097656, -62.32790756225586, -60.033851623535156, -57.73979568481445, -55.44573974609375, -53.15168380737305, -50.857627868652344, -48.563575744628906, -46.2695198059082, -43.9754638671875, -41.6814079284668, -39.387351989746094, -37.09329605102539, -34.79924011230469, -32.50518798828125, -30.211130142211914, -27.91707420349121, -25.623018264770508, -23.328962326049805, -21.034908294677734, -18.74085235595703, -16.446796417236328, -14.152740478515625, -11.858684539794922, -9.564624786376953, -7.27056884765625, -4.976513385772705, -2.68245792388916, -0.38840198516845703, 1.905653953552246, 4.199708938598633, 6.493764877319336, 8.787820816040039, 11.081876754760742, 13.375932693481445, 15.669987678527832, 17.96404266357422, 20.258098602294922, 22.552154541015625, 24.846210479736328, 27.14026641845703, 29.434322357177734, 31.728378295898438, 34.02243423461914, 36.316490173339844, 38.61054611206055, 40.90460205078125, 43.19865417480469, 45.492713928222656, 47.78676986694336, 50.08082580566406, 52.374881744384766, 54.66893768310547, 56.96299362182617, 59.257049560546875, 61.55110168457031, 63.845157623291016]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 8.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0, 8.0, 2.0, 1.0, 6.0, 1.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-137.78854370117188, -133.39793395996094, -129.00733947753906, -124.61672973632812, -120.22612762451172, -115.83552551269531, -111.44491577148438, -107.05431365966797, -102.66371154785156, -98.27310943603516, -93.88250732421875, -89.49189758300781, -85.1012954711914, -80.710693359375, -76.32008361816406, -71.92948150634766, -67.53887939453125, -63.148277282714844, -58.75767135620117, -54.3670654296875, -49.976463317871094, -45.58586120605469, -41.195255279541016, -36.804649353027344, -32.41404724121094, -28.0234432220459, -23.63283920288086, -19.24223518371582, -14.851631164550781, -10.461027145385742, -6.070423126220703, -1.679819107055664, 2.7107696533203125, 7.101373672485352, 11.49197769165039, 15.88258171081543, 20.27318572998047, 24.663789749145508, 29.054393768310547, 33.44499969482422, 37.835601806640625, 42.22620391845703, 46.6168098449707, 51.007415771484375, 55.39801788330078, 59.78861999511719, 64.17922973632812, 68.56983184814453, 72.96043395996094, 77.35103607177734, 81.74163818359375, 86.13224792480469, 90.5228500366211, 94.9134521484375, 99.30406188964844, 103.69466400146484, 108.08526611328125, 112.47586822509766, 116.86647033691406, 121.257080078125, 125.6476821899414, 130.0382843017578, 134.42889404296875, 138.81948852539062, 143.21009826660156]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 14.0, 22.0, 27.0, 38.0, 58.0, 84.0, 190.0, 311.0, 605.0, 1232.0, 2483.0, 5178.0, 11607.0, 25812.0, 60052.0, 127009.0, 148140.0, 78800.0, 34558.0, 15165.0, 6690.0, 3061.0, 1483.0, 734.0, 368.0, 219.0, 97.0, 86.0, 47.0, 33.0, 19.0, 9.0, 5.0, 7.0, 6.0, 7.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.1875, -53.52294921875, -51.8583984375, -50.19384765625, -48.529296875, -46.86474609375, -45.2001953125, -43.53564453125, -41.87109375, -40.20654296875, -38.5419921875, -36.87744140625, -35.212890625, -33.54833984375, -31.8837890625, -30.21923828125, -28.5546875, -26.89013671875, -25.2255859375, -23.56103515625, -21.896484375, -20.23193359375, -18.5673828125, -16.90283203125, -15.23828125, -13.57373046875, -11.9091796875, -10.24462890625, -8.580078125, -6.91552734375, -5.2509765625, -3.58642578125, -1.921875, -0.25732421875, 1.4072265625, 3.07177734375, 4.736328125, 6.40087890625, 8.0654296875, 9.72998046875, 11.39453125, 13.05908203125, 14.7236328125, 16.38818359375, 18.052734375, 19.71728515625, 21.3818359375, 23.04638671875, 24.7109375, 26.37548828125, 28.0400390625, 29.70458984375, 31.369140625, 33.03369140625, 34.6982421875, 36.36279296875, 38.02734375, 39.69189453125, 41.3564453125, 43.02099609375, 44.685546875, 46.35009765625, 48.0146484375, 49.67919921875, 51.34375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 7.0, 6.0, 13.0, 10.0, 19.0, 12.0, 27.0, 26.0, 42.0, 45.0, 54.0, 47.0, 38.0, 52.0, 63.0, 60.0, 72.0, 67.0, 48.0, 50.0, 52.0, 40.0, 33.0, 29.0, 15.0, 13.0, 7.0, 9.0, 10.0, 5.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0078125, -11.654052734375, -11.30029296875, -10.946533203125, -10.5927734375, -10.239013671875, -9.88525390625, -9.531494140625, -9.177734375, -8.823974609375, -8.47021484375, -8.116455078125, -7.7626953125, -7.408935546875, -7.05517578125, -6.701416015625, -6.34765625, -5.993896484375, -5.64013671875, -5.286376953125, -4.9326171875, -4.578857421875, -4.22509765625, -3.871337890625, -3.517578125, -3.163818359375, -2.81005859375, -2.456298828125, -2.1025390625, -1.748779296875, -1.39501953125, -1.041259765625, -0.6875, -0.333740234375, 0.02001953125, 0.373779296875, 0.7275390625, 1.081298828125, 1.43505859375, 1.788818359375, 2.142578125, 2.496337890625, 2.85009765625, 3.203857421875, 3.5576171875, 3.911376953125, 4.26513671875, 4.618896484375, 4.97265625, 5.326416015625, 5.68017578125, 6.033935546875, 6.3876953125, 6.741455078125, 7.09521484375, 7.448974609375, 7.802734375, 8.156494140625, 8.51025390625, 8.864013671875, 9.2177734375, 9.571533203125, 9.92529296875, 10.279052734375, 10.6328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 10.0, 3.0, 7.0, 10.0, 24.0, 93.0, 127.0, 108.0, 48.0, 16.0, 15.0, 6.0, 14.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.16116333007812, -144.475830078125, -140.79049682617188, -137.10516357421875, -133.41983032226562, -129.73448181152344, -126.04914855957031, -122.36381530761719, -118.67848205566406, -114.99314880371094, -111.30781555175781, -107.62247467041016, -103.93714141845703, -100.2518081665039, -96.56646728515625, -92.88113403320312, -89.19580078125, -85.51046752929688, -81.82513427734375, -78.1397933959961, -74.45446014404297, -70.76912689208984, -67.08378601074219, -63.39845275878906, -59.71311950683594, -56.02778625488281, -52.34244918823242, -48.65711212158203, -44.971778869628906, -41.28644561767578, -37.60110855102539, -33.915771484375, -30.230438232421875, -26.545103073120117, -22.85976791381836, -19.1744327545166, -15.489097595214844, -11.803762435913086, -8.118427276611328, -4.43309211730957, -0.7477569580078125, 2.9375782012939453, 6.622913360595703, 10.308248519897461, 13.993583679199219, 17.678918838500977, 21.364253997802734, 25.049589157104492, 28.73492431640625, 32.420257568359375, 36.105594635009766, 39.790931701660156, 43.47626495361328, 47.161598205566406, 50.8469352722168, 54.53227233886719, 58.21760559082031, 61.90293884277344, 65.58827209472656, 69.27361297607422, 72.95894622802734, 76.64427947998047, 80.32962036132812, 84.01495361328125, 87.70028686523438]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 6.0, 0.0, 3.0, 5.0, 11.0, 15.0, 28.0, 72.0, 94.0, 74.0, 52.0, 26.0, 19.0, 16.0, 4.0, 6.0, 8.0, 5.0, 4.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.82432556152344, -51.05133819580078, -49.27835464477539, -47.50537109375, -45.732383728027344, -43.95939636230469, -42.1864128112793, -40.413429260253906, -38.64044189453125, -36.867454528808594, -35.0944709777832, -33.32148742675781, -31.548500061035156, -29.775514602661133, -28.00252914428711, -26.229543685913086, -24.456558227539062, -22.68357276916504, -20.910587310791016, -19.137601852416992, -17.36461639404297, -15.591630935668945, -13.818645477294922, -12.045660018920898, -10.272674560546875, -8.499689102172852, -6.726703643798828, -4.953718185424805, -3.1807327270507812, -1.4077472686767578, 0.3652381896972656, 2.138223648071289, 3.911212921142578, 5.684198379516602, 7.457183837890625, 9.230169296264648, 11.003154754638672, 12.776140213012695, 14.549125671386719, 16.322111129760742, 18.095096588134766, 19.86808204650879, 21.641067504882812, 23.414052963256836, 25.18703842163086, 26.960023880004883, 28.733009338378906, 30.50599479675293, 32.27898025512695, 34.051963806152344, 35.824951171875, 37.597938537597656, 39.37092208862305, 41.14390563964844, 42.916893005371094, 44.68988037109375, 46.46286392211914, 48.23584747314453, 50.00883483886719, 51.781822204589844, 53.554805755615234, 55.327789306640625, 57.10077667236328, 58.87376403808594, 60.64674758911133]}, "eval/loss": 0.9911340475082397, "eval/wer": 0.14885806694842946, "eval/runtime": 870.6822, "eval/samples_per_second": 3.034, "eval/steps_per_second": 0.38} \ No newline at end of file