diff --git "a/wandb/run-20220313_205708-2dwk1d7p/files/wandb-summary.json" "b/wandb/run-20220313_205708-2dwk1d7p/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220313_205708-2dwk1d7p/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.4547, "train/learning_rate": 2.2425000000000003e-05, "train/epoch": 1.68, "train/global_step": 1500, "_runtime": 9981, "_timestamp": 1647215009, "_step": 1500, "gradients/decoder.lm_head.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 10.0, 6.0, 8.0, 3.0, 4.0, 101.0, 33.0, 15.0, 9.0, 10.0, 49913.0, 94.0, 24.0, 11.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.921875, -7.6397705078125, -7.357666015625, -7.0755615234375, -6.79345703125, -6.5113525390625, -6.229248046875, -5.9471435546875, -5.6650390625, -5.3829345703125, -5.100830078125, -4.8187255859375, -4.53662109375, -4.2545166015625, -3.972412109375, -3.6903076171875, -3.408203125, -3.1260986328125, -2.843994140625, -2.5618896484375, -2.27978515625, -1.9976806640625, -1.715576171875, -1.4334716796875, -1.1513671875, -0.8692626953125, -0.587158203125, -0.3050537109375, -0.02294921875, 0.2591552734375, 0.541259765625, 0.8233642578125, 1.10546875, 1.3875732421875, 1.669677734375, 1.9517822265625, 2.23388671875, 2.5159912109375, 2.798095703125, 3.0802001953125, 3.3623046875, 3.6444091796875, 3.926513671875, 4.2086181640625, 4.49072265625, 4.7728271484375, 5.054931640625, 5.3370361328125, 5.619140625, 5.9012451171875, 6.183349609375, 6.4654541015625, 6.74755859375, 7.0296630859375, 7.311767578125, 7.5938720703125, 7.8759765625, 8.1580810546875, 8.440185546875, 8.7222900390625, 9.00439453125, 9.2864990234375, 9.568603515625, 9.8507080078125, 10.1328125]}, "gradients/decoder.lm_head.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 7.0, 12.0, 16.0, 62.0, 94.0, 142.0, 177.0, 171.0, 135.0, 79.0, 51.0, 25.0, 14.0, 6.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.2724609375, -19.767065048217773, -19.261669158935547, -18.756271362304688, -18.25087547302246, -17.745479583740234, -17.240083694458008, -16.73468780517578, -16.229290008544922, -15.723894119262695, -15.218497276306152, -14.713101387023926, -14.207704544067383, -13.702308654785156, -13.19691276550293, -12.691516876220703, -12.186120986938477, -11.68072509765625, -11.175328254699707, -10.66993236541748, -10.164535522460938, -9.659139633178711, -9.153743743896484, -8.648347854614258, -8.142951011657715, -7.63755464553833, -7.132158279418945, -6.626762390136719, -6.121366024017334, -5.615969657897949, -5.110573768615723, -4.605177402496338, -4.099782943725586, -3.594386577606201, -3.0889904499053955, -2.58359432220459, -2.078197956085205, -1.5728015899658203, -1.0674054622650146, -0.562009334564209, -0.05661296844482422, 0.448783278465271, 0.9541795253753662, 1.4595757722854614, 1.9649720191955566, 2.4703683853149414, 2.975764513015747, 3.4811606407165527, 3.9865570068359375, 4.491953372955322, 4.997349739074707, 5.502745628356934, 6.008141994476318, 6.513538360595703, 7.01893424987793, 7.5243306159973145, 8.0297269821167, 8.535122871398926, 9.040519714355469, 9.545915603637695, 10.051311492919922, 10.556708335876465, 11.062104225158691, 11.567501068115234, 12.072896957397461]}, "gradients/decoder.lm_head.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 12.0, 16.0, 5.0, 14.0, 24.0, 33.0, 23.0, 28.0, 22.0, 48.0, 54.0, 55.0, 47.0, 51.0, 53.0, 52.0, 56.0, 40.0, 43.0, 56.0, 35.0, 33.0, 35.0, 21.0, 19.0, 21.0, 19.0, 14.0, 17.0, 8.0, 4.0, 7.0, 3.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65602445602417, -7.3872222900390625, -7.118420600891113, -6.849618434906006, -6.580816268920898, -6.312014579772949, -6.043212413787842, -5.774410247802734, -5.505608558654785, -5.236806392669678, -4.9680047035217285, -4.699202537536621, -4.430400848388672, -4.1615986824035645, -3.892796516418457, -3.6239945888519287, -3.3551926612854004, -3.086390733718872, -2.8175888061523438, -2.5487866401672363, -2.279984712600708, -2.0111827850341797, -1.7423807382583618, -1.473578691482544, -1.2047767639160156, -0.9359747767448425, -0.6671727895736694, -0.39837080240249634, -0.12956881523132324, 0.13923311233520508, 0.40803515911102295, 0.6768372058868408, 0.9456386566162109, 1.2144405841827393, 1.4832426309585571, 1.752044677734375, 2.0208466053009033, 2.2896485328674316, 2.558450698852539, 2.8272526264190674, 3.0960545539855957, 3.364856481552124, 3.6336584091186523, 3.9024605751037598, 4.171262741088867, 4.440064430236816, 4.708866596221924, 4.977668762207031, 5.2464704513549805, 5.515272617340088, 5.784074306488037, 6.0528764724731445, 6.321678161621094, 6.590480327606201, 6.859282493591309, 7.128084182739258, 7.396886348724365, 7.665688514709473, 7.934490203857422, 8.203291893005371, 8.472094535827637, 8.740896224975586, 9.009697914123535, 9.2785005569458, 9.54730224609375]}, "gradients/decoder.lm_head.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 3.0, 4.0, 9.0, 4.0, 4.0, 6.0, 13.0, 16.0, 10.0, 22.0, 17.0, 26.0, 30.0, 36.0, 27.0, 39.0, 51.0, 52.0, 45.0, 1699.0, 1045611.0, 428.0, 46.0, 43.0, 46.0, 46.0, 45.0, 26.0, 30.0, 22.0, 19.0, 17.0, 11.0, 13.0, 15.0, 8.0, 5.0, 11.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-175.875, -171.041015625, -166.20703125, -161.373046875, -156.5390625, -151.705078125, -146.87109375, -142.037109375, -137.203125, -132.369140625, -127.53515625, -122.701171875, -117.8671875, -113.033203125, -108.19921875, -103.365234375, -98.53125, -93.697265625, -88.86328125, -84.029296875, -79.1953125, -74.361328125, -69.52734375, -64.693359375, -59.859375, -55.025390625, -50.19140625, -45.357421875, -40.5234375, -35.689453125, -30.85546875, -26.021484375, -21.1875, -16.353515625, -11.51953125, -6.685546875, -1.8515625, 2.982421875, 7.81640625, 12.650390625, 17.484375, 22.318359375, 27.15234375, 31.986328125, 36.8203125, 41.654296875, 46.48828125, 51.322265625, 56.15625, 60.990234375, 65.82421875, 70.658203125, 75.4921875, 80.326171875, 85.16015625, 89.994140625, 94.828125, 99.662109375, 104.49609375, 109.330078125, 114.1640625, 118.998046875, 123.83203125, 128.666015625, 133.5]}, "gradients/decoder.lm_head.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 10.0, 11.0, 15.0, 12.0, 15.0, 18.0, 25.0, 26.0, 32.0, 34.0, 49.0, 46.0, 42.0, 48.0, 51.0, 93.0, 50.0, 41.0, 49.0, 52.0, 37.0, 34.0, 30.0, 33.0, 25.0, 19.0, 22.0, 14.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.40576171875, -4.2412109375, -4.07666015625, -3.912109375, -3.74755859375, -3.5830078125, -3.41845703125, -3.25390625, -3.08935546875, -2.9248046875, -2.76025390625, -2.595703125, -2.43115234375, -2.2666015625, -2.10205078125, -1.9375, -1.77294921875, -1.6083984375, -1.44384765625, -1.279296875, -1.11474609375, -0.9501953125, -0.78564453125, -0.62109375, -0.45654296875, -0.2919921875, -0.12744140625, 0.037109375, 0.20166015625, 0.3662109375, 0.53076171875, 0.6953125, 0.85986328125, 1.0244140625, 1.18896484375, 1.353515625, 1.51806640625, 1.6826171875, 1.84716796875, 2.01171875, 2.17626953125, 2.3408203125, 2.50537109375, 2.669921875, 2.83447265625, 2.9990234375, 3.16357421875, 3.328125, 3.49267578125, 3.6572265625, 3.82177734375, 3.986328125, 4.15087890625, 4.3154296875, 4.47998046875, 4.64453125, 4.80908203125, 4.9736328125, 5.13818359375, 5.302734375, 5.46728515625, 5.6318359375, 5.79638671875, 5.9609375]}, "gradients/decoder.roberta.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 7.0, 11.0, 25.0, 32.0, 69.0, 95.0, 103.0, 133.0, 132.0, 102.0, 98.0, 70.0, 53.0, 31.0, 22.0, 14.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.336587905883789, -11.039658546447754, -10.742730140686035, -10.44580078125, -10.148871421813965, -9.85194206237793, -9.555013656616211, -9.258084297180176, -8.96115493774414, -8.664225578308105, -8.367297172546387, -8.070367813110352, -7.773438453674316, -7.4765095710754395, -7.1795806884765625, -6.882651329040527, -6.58572244644165, -6.288793563842773, -5.991864204406738, -5.694935321807861, -5.398005962371826, -5.101077079772949, -4.804147720336914, -4.507218837738037, -4.21028995513916, -3.913360834121704, -3.616431713104248, -3.319502830505371, -3.022573471069336, -2.725644588470459, -2.428715467453003, -2.131786346435547, -1.83485746383667, -1.5379283428192139, -1.2409992218017578, -0.9440702199935913, -0.6471410989761353, -0.3502119779586792, -0.053282976150512695, 0.24364614486694336, 0.5405752658843994, 0.8375043869018555, 1.1344335079193115, 1.431362509727478, 1.728291630744934, 2.0252208709716797, 2.3221497535705566, 2.6190788745880127, 2.9160079956054688, 3.212937116622925, 3.509866237640381, 3.806795120239258, 4.103724479675293, 4.40065336227417, 4.697582244873047, 4.994511604309082, 5.291440963745117, 5.588369846343994, 5.885299205780029, 6.182228088378906, 6.479157447814941, 6.776086330413818, 7.073015213012695, 7.3699445724487305, 7.666873455047607]}, "gradients/decoder.roberta.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 9.0, 14.0, 11.0, 11.0, 16.0, 17.0, 26.0, 34.0, 36.0, 45.0, 36.0, 40.0, 50.0, 52.0, 56.0, 59.0, 52.0, 53.0, 57.0, 45.0, 54.0, 39.0, 27.0, 33.0, 23.0, 26.0, 18.0, 19.0, 13.0, 8.0, 7.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859719276428223, -11.4719877243042, -11.084257125854492, -10.696525573730469, -10.308794021606445, -9.921062469482422, -9.533330917358398, -9.145600318908691, -8.757868766784668, -8.370137214660645, -7.982406139373779, -7.594675064086914, -7.206943511962891, -6.819211959838867, -6.431480884552002, -6.043749809265137, -5.656018257141113, -5.26828670501709, -4.880555629730225, -4.492824554443359, -4.105093002319336, -3.7173616886138916, -3.3296303749084473, -2.941899061203003, -2.5541677474975586, -2.1664364337921143, -1.77870512008667, -1.3909738063812256, -1.0032424926757812, -0.6155111789703369, -0.22777986526489258, 0.15995144844055176, 0.5476818084716797, 0.935413122177124, 1.3231444358825684, 1.7108757495880127, 2.098607063293457, 2.4863383769989014, 2.8740696907043457, 3.26180100440979, 3.6495323181152344, 4.037263870239258, 4.424994945526123, 4.812726020812988, 5.200457572937012, 5.588189125061035, 5.9759202003479, 6.363651275634766, 6.751382827758789, 7.1391143798828125, 7.526845455169678, 7.914576530456543, 8.302308082580566, 8.69003963470459, 9.077770233154297, 9.46550178527832, 9.853233337402344, 10.240964889526367, 10.62869644165039, 11.016427040100098, 11.404158592224121, 11.791890144348145, 12.179620742797852, 12.567352294921875, 12.955083847045898]}, "gradients/decoder.roberta.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 3.0, 4.0, 5.0, 6.0, 11.0, 15.0, 19.0, 32.0, 39.0, 35.0, 55.0, 84.0, 118.0, 175.0, 346.0, 660.0, 1340.0, 3160.0, 9419.0, 34941.0, 185485.0, 1313421.0, 2148921.0, 406222.0, 65195.0, 15671.0, 4961.0, 1892.0, 862.0, 464.0, 239.0, 162.0, 85.0, 50.0, 46.0, 31.0, 27.0, 21.0, 13.0, 17.0, 11.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.359375, -9.085693359375, -8.81201171875, -8.538330078125, -8.2646484375, -7.990966796875, -7.71728515625, -7.443603515625, -7.169921875, -6.896240234375, -6.62255859375, -6.348876953125, -6.0751953125, -5.801513671875, -5.52783203125, -5.254150390625, -4.98046875, -4.706787109375, -4.43310546875, -4.159423828125, -3.8857421875, -3.612060546875, -3.33837890625, -3.064697265625, -2.791015625, -2.517333984375, -2.24365234375, -1.969970703125, -1.6962890625, -1.422607421875, -1.14892578125, -0.875244140625, -0.6015625, -0.327880859375, -0.05419921875, 0.219482421875, 0.4931640625, 0.766845703125, 1.04052734375, 1.314208984375, 1.587890625, 1.861572265625, 2.13525390625, 2.408935546875, 2.6826171875, 2.956298828125, 3.22998046875, 3.503662109375, 3.77734375, 4.051025390625, 4.32470703125, 4.598388671875, 4.8720703125, 5.145751953125, 5.41943359375, 5.693115234375, 5.966796875, 6.240478515625, 6.51416015625, 6.787841796875, 7.0615234375, 7.335205078125, 7.60888671875, 7.882568359375, 8.15625]}, "gradients/decoder.roberta.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 12.0, 9.0, 10.0, 12.0, 15.0, 26.0, 22.0, 18.0, 35.0, 34.0, 37.0, 39.0, 34.0, 42.0, 48.0, 47.0, 50.0, 61.0, 36.0, 45.0, 46.0, 46.0, 45.0, 43.0, 32.0, 23.0, 22.0, 26.0, 17.0, 18.0, 8.0, 11.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.61328125, -4.468994140625, -4.32470703125, -4.180419921875, -4.0361328125, -3.891845703125, -3.74755859375, -3.603271484375, -3.458984375, -3.314697265625, -3.17041015625, -3.026123046875, -2.8818359375, -2.737548828125, -2.59326171875, -2.448974609375, -2.3046875, -2.160400390625, -2.01611328125, -1.871826171875, -1.7275390625, -1.583251953125, -1.43896484375, -1.294677734375, -1.150390625, -1.006103515625, -0.86181640625, -0.717529296875, -0.5732421875, -0.428955078125, -0.28466796875, -0.140380859375, 0.00390625, 0.148193359375, 0.29248046875, 0.436767578125, 0.5810546875, 0.725341796875, 0.86962890625, 1.013916015625, 1.158203125, 1.302490234375, 1.44677734375, 1.591064453125, 1.7353515625, 1.879638671875, 2.02392578125, 2.168212890625, 2.3125, 2.456787109375, 2.60107421875, 2.745361328125, 2.8896484375, 3.033935546875, 3.17822265625, 3.322509765625, 3.466796875, 3.611083984375, 3.75537109375, 3.899658203125, 4.0439453125, 4.188232421875, 4.33251953125, 4.476806640625, 4.62109375]}, "gradients/decoder.roberta.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 10.0, 16.0, 21.0, 38.0, 84.0, 207.0, 832.0, 16513.0, 4171416.0, 4300.0, 548.0, 144.0, 68.0, 31.0, 21.0, 8.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.6875, -96.291015625, -92.89453125, -89.498046875, -86.1015625, -82.705078125, -79.30859375, -75.912109375, -72.515625, -69.119140625, -65.72265625, -62.326171875, -58.9296875, -55.533203125, -52.13671875, -48.740234375, -45.34375, -41.947265625, -38.55078125, -35.154296875, -31.7578125, -28.361328125, -24.96484375, -21.568359375, -18.171875, -14.775390625, -11.37890625, -7.982421875, -4.5859375, -1.189453125, 2.20703125, 5.603515625, 9.0, 12.396484375, 15.79296875, 19.189453125, 22.5859375, 25.982421875, 29.37890625, 32.775390625, 36.171875, 39.568359375, 42.96484375, 46.361328125, 49.7578125, 53.154296875, 56.55078125, 59.947265625, 63.34375, 66.740234375, 70.13671875, 73.533203125, 76.9296875, 80.326171875, 83.72265625, 87.119140625, 90.515625, 93.912109375, 97.30859375, 100.705078125, 104.1015625, 107.498046875, 110.89453125, 114.291015625, 117.6875]}, "gradients/decoder.roberta.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 21.0, 27.0, 65.0, 131.0, 345.0, 792.0, 1331.0, 759.0, 293.0, 147.0, 59.0, 32.0, 20.0, 13.0, 11.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.26953125, -6.0928955078125, -5.916259765625, -5.7396240234375, -5.56298828125, -5.3863525390625, -5.209716796875, -5.0330810546875, -4.8564453125, -4.6798095703125, -4.503173828125, -4.3265380859375, -4.14990234375, -3.9732666015625, -3.796630859375, -3.6199951171875, -3.443359375, -3.2667236328125, -3.090087890625, -2.9134521484375, -2.73681640625, -2.5601806640625, -2.383544921875, -2.2069091796875, -2.0302734375, -1.8536376953125, -1.677001953125, -1.5003662109375, -1.32373046875, -1.1470947265625, -0.970458984375, -0.7938232421875, -0.6171875, -0.4405517578125, -0.263916015625, -0.0872802734375, 0.08935546875, 0.2659912109375, 0.442626953125, 0.6192626953125, 0.7958984375, 0.9725341796875, 1.149169921875, 1.3258056640625, 1.50244140625, 1.6790771484375, 1.855712890625, 2.0323486328125, 2.208984375, 2.3856201171875, 2.562255859375, 2.7388916015625, 2.91552734375, 3.0921630859375, 3.268798828125, 3.4454345703125, 3.6220703125, 3.7987060546875, 3.975341796875, 4.1519775390625, 4.32861328125, 4.5052490234375, 4.681884765625, 4.8585205078125, 5.03515625]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 9.0, 17.0, 35.0, 41.0, 59.0, 83.0, 97.0, 123.0, 105.0, 94.0, 86.0, 84.0, 65.0, 40.0, 29.0, 12.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.872363090515137, -8.634171485900879, -8.395980834960938, -8.15778923034668, -7.919597625732422, -7.681406497955322, -7.443215370178223, -7.205023765563965, -6.966832160949707, -6.728641033172607, -6.49044942855835, -6.25225830078125, -6.014066696166992, -5.775875568389893, -5.537684440612793, -5.299492835998535, -5.0613017082214355, -4.823110580444336, -4.584918975830078, -4.3467278480529785, -4.108536243438721, -3.870345115661621, -3.6321537494659424, -3.3939623832702637, -3.155771017074585, -2.9175796508789062, -2.6793882846832275, -2.441196918487549, -2.203005790710449, -1.964814305305481, -1.7266230583190918, -1.488431692123413, -1.2502398490905762, -1.0120484828948975, -0.7738571763038635, -0.5356658697128296, -0.2974745035171509, -0.05928313732147217, 0.178908109664917, 0.4170994758605957, 0.6552908420562744, 0.8934822082519531, 1.1316735744476318, 1.369864821434021, 1.6080561876296997, 1.8462475538253784, 2.0844388008117676, 2.3226301670074463, 2.560821533203125, 2.7990128993988037, 3.0372042655944824, 3.275395393371582, 3.51358699798584, 3.7517781257629395, 3.989969491958618, 4.228160858154297, 4.466352462768555, 4.704543590545654, 4.942735195159912, 5.180926322937012, 5.4191179275512695, 5.657309055328369, 5.895500183105469, 6.133691787719727, 6.371882915496826]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 12.0, 4.0, 9.0, 13.0, 14.0, 14.0, 17.0, 12.0, 18.0, 22.0, 35.0, 29.0, 33.0, 43.0, 40.0, 33.0, 39.0, 47.0, 44.0, 50.0, 45.0, 30.0, 54.0, 35.0, 37.0, 35.0, 21.0, 29.0, 26.0, 33.0, 21.0, 16.0, 18.0, 18.0, 14.0, 6.0, 11.0, 5.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.619379758834839, -3.494044303894043, -3.368708848953247, -3.243373394012451, -3.118037700653076, -2.9927024841308594, -2.8673667907714844, -2.7420313358306885, -2.6166958808898926, -2.4913604259490967, -2.366024971008301, -2.240689516067505, -2.115354061126709, -1.9900184869766235, -1.864682912826538, -1.7393474578857422, -1.6140120029449463, -1.4886765480041504, -1.3633410930633545, -1.238005518913269, -1.1126700639724731, -0.9873346090316772, -0.8619990944862366, -0.7366635799407959, -0.611328125, -0.4859926402568817, -0.3606571555137634, -0.23532167077064514, -0.10998618602752686, 0.015349268913269043, 0.14068478345870972, 0.2660202980041504, 0.3913555145263672, 0.5166909694671631, 0.6420264840126038, 0.7673619985580444, 0.8926974534988403, 1.0180329084396362, 1.1433684825897217, 1.2687039375305176, 1.3940393924713135, 1.5193748474121094, 1.6447103023529053, 1.7700458765029907, 1.8953813314437866, 2.020716667175293, 2.146052360534668, 2.271387815475464, 2.3967232704162598, 2.5220587253570557, 2.6473941802978516, 2.7727296352386475, 2.8980650901794434, 3.0234007835388184, 3.1487362384796143, 3.27407169342041, 3.399407148361206, 3.524742603302002, 3.650078058242798, 3.7754135131835938, 3.9007492065429688, 4.0260844230651855, 4.1514201164245605, 4.276755332946777, 4.402091026306152]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 10.0, 11.0, 14.0, 19.0, 37.0, 34.0, 52.0, 81.0, 112.0, 151.0, 243.0, 329.0, 505.0, 767.0, 1148.0, 1629.0, 2588.0, 3911.0, 6420.0, 10129.0, 16836.0, 28243.0, 49562.0, 88888.0, 156975.0, 228171.0, 189631.0, 111613.0, 61976.0, 34724.0, 20475.0, 12092.0, 7460.0, 4715.0, 3093.0, 1914.0, 1335.0, 842.0, 569.0, 412.0, 235.0, 184.0, 111.0, 97.0, 55.0, 48.0, 34.0, 23.0, 15.0, 13.0, 9.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.62109375, -0.6001739501953125, -0.579254150390625, -0.5583343505859375, -0.53741455078125, -0.5164947509765625, -0.495574951171875, -0.4746551513671875, -0.4537353515625, -0.4328155517578125, -0.411895751953125, -0.3909759521484375, -0.37005615234375, -0.3491363525390625, -0.328216552734375, -0.3072967529296875, -0.286376953125, -0.2654571533203125, -0.244537353515625, -0.2236175537109375, -0.20269775390625, -0.1817779541015625, -0.160858154296875, -0.1399383544921875, -0.1190185546875, -0.0980987548828125, -0.077178955078125, -0.0562591552734375, -0.03533935546875, -0.0144195556640625, 0.006500244140625, 0.0274200439453125, 0.04833984375, 0.0692596435546875, 0.090179443359375, 0.1110992431640625, 0.13201904296875, 0.1529388427734375, 0.173858642578125, 0.1947784423828125, 0.2156982421875, 0.2366180419921875, 0.257537841796875, 0.2784576416015625, 0.29937744140625, 0.3202972412109375, 0.341217041015625, 0.3621368408203125, 0.383056640625, 0.4039764404296875, 0.424896240234375, 0.4458160400390625, 0.46673583984375, 0.4876556396484375, 0.508575439453125, 0.5294952392578125, 0.5504150390625, 0.5713348388671875, 0.592254638671875, 0.6131744384765625, 0.63409423828125, 0.6550140380859375, 0.675933837890625, 0.6968536376953125, 0.7177734375]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 5.0, 8.0, 10.0, 17.0, 14.0, 13.0, 19.0, 16.0, 18.0, 37.0, 27.0, 30.0, 39.0, 45.0, 29.0, 39.0, 52.0, 44.0, 44.0, 50.0, 32.0, 45.0, 44.0, 38.0, 35.0, 21.0, 31.0, 27.0, 34.0, 19.0, 18.0, 17.0, 17.0, 15.0, 7.0, 11.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.65234375, -3.52935791015625, -3.4063720703125, -3.28338623046875, -3.160400390625, -3.03741455078125, -2.9144287109375, -2.79144287109375, -2.66845703125, -2.54547119140625, -2.4224853515625, -2.29949951171875, -2.176513671875, -2.05352783203125, -1.9305419921875, -1.80755615234375, -1.6845703125, -1.56158447265625, -1.4385986328125, -1.31561279296875, -1.192626953125, -1.06964111328125, -0.9466552734375, -0.82366943359375, -0.70068359375, -0.57769775390625, -0.4547119140625, -0.33172607421875, -0.208740234375, -0.08575439453125, 0.0372314453125, 0.16021728515625, 0.283203125, 0.40618896484375, 0.5291748046875, 0.65216064453125, 0.775146484375, 0.89813232421875, 1.0211181640625, 1.14410400390625, 1.26708984375, 1.39007568359375, 1.5130615234375, 1.63604736328125, 1.759033203125, 1.88201904296875, 2.0050048828125, 2.12799072265625, 2.2509765625, 2.37396240234375, 2.4969482421875, 2.61993408203125, 2.742919921875, 2.86590576171875, 2.9888916015625, 3.11187744140625, 3.23486328125, 3.35784912109375, 3.4808349609375, 3.60382080078125, 3.726806640625, 3.84979248046875, 3.9727783203125, 4.09576416015625, 4.21875]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 14.0, 9.0, 8.0, 15.0, 21.0, 29.0, 45.0, 49.0, 73.0, 104.0, 161.0, 259.0, 362.0, 532.0, 992.0, 1814.0, 4046.0, 11341.0, 45734.0, 926795.0, 38228.0, 10183.0, 3600.0, 1654.0, 861.0, 520.0, 352.0, 223.0, 147.0, 91.0, 88.0, 47.0, 45.0, 26.0, 14.0, 17.0, 18.0, 8.0, 12.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.60546875, -2.522613525390625, -2.43975830078125, -2.356903076171875, -2.2740478515625, -2.191192626953125, -2.10833740234375, -2.025482177734375, -1.942626953125, -1.859771728515625, -1.77691650390625, -1.694061279296875, -1.6112060546875, -1.528350830078125, -1.44549560546875, -1.362640380859375, -1.27978515625, -1.196929931640625, -1.11407470703125, -1.031219482421875, -0.9483642578125, -0.865509033203125, -0.78265380859375, -0.699798583984375, -0.616943359375, -0.534088134765625, -0.45123291015625, -0.368377685546875, -0.2855224609375, -0.202667236328125, -0.11981201171875, -0.036956787109375, 0.0458984375, 0.128753662109375, 0.21160888671875, 0.294464111328125, 0.3773193359375, 0.460174560546875, 0.54302978515625, 0.625885009765625, 0.708740234375, 0.791595458984375, 0.87445068359375, 0.957305908203125, 1.0401611328125, 1.123016357421875, 1.20587158203125, 1.288726806640625, 1.37158203125, 1.454437255859375, 1.53729248046875, 1.620147705078125, 1.7030029296875, 1.785858154296875, 1.86871337890625, 1.951568603515625, 2.034423828125, 2.117279052734375, 2.20013427734375, 2.282989501953125, 2.3658447265625, 2.448699951171875, 2.53155517578125, 2.614410400390625, 2.697265625]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 8.0, 15.0, 7.0, 11.0, 14.0, 20.0, 19.0, 20.0, 22.0, 26.0, 22.0, 29.0, 35.0, 32.0, 40.0, 32.0, 37.0, 33.0, 44.0, 31.0, 40.0, 31.0, 47.0, 50.0, 31.0, 34.0, 28.0, 29.0, 31.0, 26.0, 21.0, 15.0, 14.0, 15.0, 15.0, 9.0, 12.0, 4.0, 3.0, 14.0, 8.0, 8.0, 3.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.44921875, -2.37677001953125, -2.3043212890625, -2.23187255859375, -2.159423828125, -2.08697509765625, -2.0145263671875, -1.94207763671875, -1.86962890625, -1.79718017578125, -1.7247314453125, -1.65228271484375, -1.579833984375, -1.50738525390625, -1.4349365234375, -1.36248779296875, -1.2900390625, -1.21759033203125, -1.1451416015625, -1.07269287109375, -1.000244140625, -0.92779541015625, -0.8553466796875, -0.78289794921875, -0.71044921875, -0.63800048828125, -0.5655517578125, -0.49310302734375, -0.420654296875, -0.34820556640625, -0.2757568359375, -0.20330810546875, -0.130859375, -0.05841064453125, 0.0140380859375, 0.08648681640625, 0.158935546875, 0.23138427734375, 0.3038330078125, 0.37628173828125, 0.44873046875, 0.52117919921875, 0.5936279296875, 0.66607666015625, 0.738525390625, 0.81097412109375, 0.8834228515625, 0.95587158203125, 1.0283203125, 1.10076904296875, 1.1732177734375, 1.24566650390625, 1.318115234375, 1.39056396484375, 1.4630126953125, 1.53546142578125, 1.60791015625, 1.68035888671875, 1.7528076171875, 1.82525634765625, 1.897705078125, 1.97015380859375, 2.0426025390625, 2.11505126953125, 2.1875]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 10.0, 2.0, 4.0, 16.0, 14.0, 28.0, 27.0, 56.0, 72.0, 109.0, 171.0, 231.0, 455.0, 852.0, 1650.0, 4160.0, 15316.0, 942813.0, 66703.0, 9750.0, 3105.0, 1297.0, 695.0, 377.0, 204.0, 136.0, 102.0, 50.0, 38.0, 33.0, 17.0, 11.0, 10.0, 11.0, 9.0, 1.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.411376953125, -0.39922332763671875, -0.3870697021484375, -0.37491607666015625, -0.362762451171875, -0.35060882568359375, -0.3384552001953125, -0.32630157470703125, -0.31414794921875, -0.30199432373046875, -0.2898406982421875, -0.27768707275390625, -0.265533447265625, -0.25337982177734375, -0.2412261962890625, -0.22907257080078125, -0.2169189453125, -0.20476531982421875, -0.1926116943359375, -0.18045806884765625, -0.168304443359375, -0.15615081787109375, -0.1439971923828125, -0.13184356689453125, -0.11968994140625, -0.10753631591796875, -0.0953826904296875, -0.08322906494140625, -0.071075439453125, -0.05892181396484375, -0.0467681884765625, -0.03461456298828125, -0.0224609375, -0.01030731201171875, 0.0018463134765625, 0.01399993896484375, 0.026153564453125, 0.03830718994140625, 0.0504608154296875, 0.06261444091796875, 0.07476806640625, 0.08692169189453125, 0.0990753173828125, 0.11122894287109375, 0.123382568359375, 0.13553619384765625, 0.1476898193359375, 0.15984344482421875, 0.1719970703125, 0.18415069580078125, 0.1963043212890625, 0.20845794677734375, 0.220611572265625, 0.23276519775390625, 0.2449188232421875, 0.25707244873046875, 0.26922607421875, 0.28137969970703125, 0.2935333251953125, 0.30568695068359375, 0.317840576171875, 0.32999420166015625, 0.3421478271484375, 0.35430145263671875, 0.366455078125]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 7.0, 10.0, 14.0, 7.0, 15.0, 17.0, 22.0, 29.0, 34.0, 33.0, 59.0, 59.0, 61.0, 57.0, 60.0, 60.0, 68.0, 67.0, 63.0, 48.0, 33.0, 36.0, 29.0, 24.0, 13.0, 22.0, 15.0, 11.0, 4.0, 6.0, 9.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.9861927032470703e-05, -2.8883107006549835e-05, -2.7904286980628967e-05, -2.69254669547081e-05, -2.594664692878723e-05, -2.4967826902866364e-05, -2.3989006876945496e-05, -2.3010186851024628e-05, -2.203136682510376e-05, -2.1052546799182892e-05, -2.0073726773262024e-05, -1.9094906747341156e-05, -1.8116086721420288e-05, -1.713726669549942e-05, -1.6158446669578552e-05, -1.5179626643657684e-05, -1.4200806617736816e-05, -1.3221986591815948e-05, -1.224316656589508e-05, -1.1264346539974213e-05, -1.0285526514053345e-05, -9.306706488132477e-06, -8.327886462211609e-06, -7.349066436290741e-06, -6.370246410369873e-06, -5.391426384449005e-06, -4.412606358528137e-06, -3.4337863326072693e-06, -2.4549663066864014e-06, -1.4761462807655334e-06, -4.973262548446655e-07, 4.814937710762024e-07, 1.4603137969970703e-06, 2.4391338229179382e-06, 3.417953848838806e-06, 4.396773874759674e-06, 5.375593900680542e-06, 6.35441392660141e-06, 7.333233952522278e-06, 8.312053978443146e-06, 9.290874004364014e-06, 1.0269694030284882e-05, 1.124851405620575e-05, 1.2227334082126617e-05, 1.3206154108047485e-05, 1.4184974133968353e-05, 1.5163794159889221e-05, 1.614261418581009e-05, 1.7121434211730957e-05, 1.8100254237651825e-05, 1.9079074263572693e-05, 2.005789428949356e-05, 2.103671431541443e-05, 2.2015534341335297e-05, 2.2994354367256165e-05, 2.3973174393177032e-05, 2.49519944190979e-05, 2.593081444501877e-05, 2.6909634470939636e-05, 2.7888454496860504e-05, 2.8867274522781372e-05, 2.984609454870224e-05, 3.082491457462311e-05, 3.1803734600543976e-05, 3.2782554626464844e-05]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 2.0, 10.0, 18.0, 17.0, 19.0, 33.0, 48.0, 107.0, 355.0, 7219.0, 867159.0, 170760.0, 2328.0, 223.0, 74.0, 46.0, 28.0, 22.0, 15.0, 5.0, 7.0, 9.0, 5.0, 3.0, 9.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68896484375, -0.6658782958984375, -0.642791748046875, -0.6197052001953125, -0.59661865234375, -0.5735321044921875, -0.550445556640625, -0.5273590087890625, -0.5042724609375, -0.4811859130859375, -0.458099365234375, -0.4350128173828125, -0.41192626953125, -0.3888397216796875, -0.365753173828125, -0.3426666259765625, -0.319580078125, -0.2964935302734375, -0.273406982421875, -0.2503204345703125, -0.22723388671875, -0.2041473388671875, -0.181060791015625, -0.1579742431640625, -0.1348876953125, -0.1118011474609375, -0.088714599609375, -0.0656280517578125, -0.04254150390625, -0.0194549560546875, 0.003631591796875, 0.0267181396484375, 0.0498046875, 0.0728912353515625, 0.095977783203125, 0.1190643310546875, 0.14215087890625, 0.1652374267578125, 0.188323974609375, 0.2114105224609375, 0.2344970703125, 0.2575836181640625, 0.280670166015625, 0.3037567138671875, 0.32684326171875, 0.3499298095703125, 0.373016357421875, 0.3961029052734375, 0.419189453125, 0.4422760009765625, 0.465362548828125, 0.4884490966796875, 0.51153564453125, 0.5346221923828125, 0.557708740234375, 0.5807952880859375, 0.6038818359375, 0.6269683837890625, 0.650054931640625, 0.6731414794921875, 0.69622802734375, 0.7193145751953125, 0.742401123046875, 0.7654876708984375, 0.78857421875]}, "gradients/decoder.roberta.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 8.0, 6.0, 7.0, 10.0, 4.0, 17.0, 25.0, 25.0, 46.0, 52.0, 68.0, 92.0, 125.0, 129.0, 84.0, 63.0, 46.0, 44.0, 38.0, 22.0, 25.0, 17.0, 2.0, 8.0, 5.0, 9.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03857421875, -0.03744363784790039, -0.03631305694580078, -0.03518247604370117, -0.03405189514160156, -0.03292131423950195, -0.031790733337402344, -0.030660152435302734, -0.029529571533203125, -0.028398990631103516, -0.027268409729003906, -0.026137828826904297, -0.025007247924804688, -0.023876667022705078, -0.02274608612060547, -0.02161550521850586, -0.02048492431640625, -0.01935434341430664, -0.01822376251220703, -0.017093181610107422, -0.015962600708007812, -0.014832019805908203, -0.013701438903808594, -0.012570858001708984, -0.011440277099609375, -0.010309696197509766, -0.009179115295410156, -0.008048534393310547, -0.0069179534912109375, -0.005787372589111328, -0.004656791687011719, -0.0035262107849121094, -0.0023956298828125, -0.0012650489807128906, -0.00013446807861328125, 0.0009961128234863281, 0.0021266937255859375, 0.003257274627685547, 0.004387855529785156, 0.005518436431884766, 0.006649017333984375, 0.007779598236083984, 0.008910179138183594, 0.010040760040283203, 0.011171340942382812, 0.012301921844482422, 0.013432502746582031, 0.01456308364868164, 0.01569366455078125, 0.01682424545288086, 0.01795482635498047, 0.019085407257080078, 0.020215988159179688, 0.021346569061279297, 0.022477149963378906, 0.023607730865478516, 0.024738311767578125, 0.025868892669677734, 0.026999473571777344, 0.028130054473876953, 0.029260635375976562, 0.030391216278076172, 0.03152179718017578, 0.03265237808227539, 0.033782958984375]}, "gradients/decoder.roberta.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 15.0, 22.0, 26.0, 29.0, 53.0, 81.0, 87.0, 89.0, 103.0, 92.0, 79.0, 79.0, 67.0, 48.0, 52.0, 29.0, 22.0, 10.0, 4.0, 2.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.50552749633789, -8.307448387145996, -8.109368324279785, -7.911289215087891, -7.713210105895996, -7.515130519866943, -7.317051410675049, -7.118971824645996, -6.920892715454102, -6.722813129425049, -6.524734020233154, -6.326654434204102, -6.128575325012207, -5.930495738983154, -5.73241662979126, -5.534337043762207, -5.3362579345703125, -5.13817834854126, -4.940099239349365, -4.7420196533203125, -4.543940544128418, -4.345860958099365, -4.147781848907471, -3.949702262878418, -3.7516226768493652, -3.5535433292388916, -3.355463981628418, -3.1573846340179443, -2.9593052864074707, -2.761225938796997, -2.5631465911865234, -2.3650670051574707, -2.166987895965576, -1.9689085483551025, -1.770829200744629, -1.5727498531341553, -1.3746705055236816, -1.176591157913208, -0.9785116910934448, -0.7804323434829712, -0.5823529958724976, -0.3842736482620239, -0.1861942708492279, 0.011885106563568115, 0.20996445417404175, 0.4080438017845154, 0.6061232089996338, 0.8042025566101074, 1.002281904220581, 1.2003612518310547, 1.3984405994415283, 1.596519947052002, 1.7945992946624756, 1.9926786422729492, 2.190758228302002, 2.3888373374938965, 2.586916923522949, 2.784996271133423, 2.9830756187438965, 3.18115496635437, 3.3792343139648438, 3.5773136615753174, 3.775393009185791, 3.9734725952148438, 4.171551704406738]}, "gradients/decoder.roberta.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 5.0, 9.0, 9.0, 17.0, 14.0, 14.0, 18.0, 15.0, 20.0, 37.0, 26.0, 30.0, 40.0, 47.0, 27.0, 38.0, 53.0, 43.0, 48.0, 46.0, 31.0, 47.0, 42.0, 39.0, 35.0, 22.0, 31.0, 27.0, 32.0, 21.0, 17.0, 17.0, 19.0, 13.0, 7.0, 11.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.653076171875, -3.5300467014312744, -3.407017230987549, -3.283987522125244, -3.1609580516815186, -3.037928581237793, -2.9148991107940674, -2.791869640350342, -2.668839931488037, -2.5458104610443115, -2.422780990600586, -2.2997512817382812, -2.1767218112945557, -2.05369234085083, -1.9306628704071045, -1.807633399963379, -1.6846039295196533, -1.5615744590759277, -1.4385448694229126, -1.315515398979187, -1.1924858093261719, -1.0694563388824463, -0.9464268684387207, -0.8233973383903503, -0.70036780834198, -0.5773382782936096, -0.45430877804756165, -0.33127927780151367, -0.2082497477531433, -0.08522021770477295, 0.03780925273895264, 0.160838782787323, 0.28386831283569336, 0.4068978428840637, 0.5299273729324341, 0.6529568433761597, 0.77598637342453, 0.8990159034729004, 1.022045373916626, 1.1450748443603516, 1.2681044340133667, 1.3911339044570923, 1.5141634941101074, 1.637192964553833, 1.7602224349975586, 1.8832520246505737, 2.0062813758850098, 2.1293110847473145, 2.25234055519104, 2.3753700256347656, 2.498399496078491, 2.621428966522217, 2.7444586753845215, 2.867488145828247, 2.9905176162719727, 3.1135470867156982, 3.236576557159424, 3.3596060276031494, 3.482635498046875, 3.6056652069091797, 3.7286946773529053, 3.851724147796631, 3.9747536182403564, 4.097783088684082, 4.220812797546387]}, "gradients/decoder.roberta.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 5.0, 9.0, 15.0, 21.0, 18.0, 34.0, 44.0, 56.0, 69.0, 106.0, 127.0, 216.0, 279.0, 459.0, 847.0, 1493.0, 3221.0, 7539.0, 18552.0, 45524.0, 112108.0, 277189.0, 335946.0, 144326.0, 58589.0, 23808.0, 9494.0, 3960.0, 1892.0, 997.0, 494.0, 342.0, 214.0, 158.0, 104.0, 93.0, 50.0, 50.0, 21.0, 17.0, 22.0, 13.0, 9.0, 4.0, 3.0, 2.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.58203125, -4.42999267578125, -4.2779541015625, -4.12591552734375, -3.973876953125, -3.82183837890625, -3.6697998046875, -3.51776123046875, -3.36572265625, -3.21368408203125, -3.0616455078125, -2.90960693359375, -2.757568359375, -2.60552978515625, -2.4534912109375, -2.30145263671875, -2.1494140625, -1.99737548828125, -1.8453369140625, -1.69329833984375, -1.541259765625, -1.38922119140625, -1.2371826171875, -1.08514404296875, -0.93310546875, -0.78106689453125, -0.6290283203125, -0.47698974609375, -0.324951171875, -0.17291259765625, -0.0208740234375, 0.13116455078125, 0.283203125, 0.43524169921875, 0.5872802734375, 0.73931884765625, 0.891357421875, 1.04339599609375, 1.1954345703125, 1.34747314453125, 1.49951171875, 1.65155029296875, 1.8035888671875, 1.95562744140625, 2.107666015625, 2.25970458984375, 2.4117431640625, 2.56378173828125, 2.7158203125, 2.86785888671875, 3.0198974609375, 3.17193603515625, 3.323974609375, 3.47601318359375, 3.6280517578125, 3.78009033203125, 3.93212890625, 4.08416748046875, 4.2362060546875, 4.38824462890625, 4.540283203125, 4.69232177734375, 4.8443603515625, 4.99639892578125, 5.1484375]}, "gradients/decoder.roberta.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 6.0, 9.0, 7.0, 12.0, 14.0, 16.0, 16.0, 15.0, 16.0, 18.0, 34.0, 32.0, 45.0, 41.0, 39.0, 45.0, 33.0, 49.0, 42.0, 55.0, 35.0, 39.0, 46.0, 42.0, 40.0, 31.0, 24.0, 38.0, 26.0, 24.0, 16.0, 18.0, 23.0, 14.0, 6.0, 12.0, 6.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.85546875, -3.72802734375, -3.6005859375, -3.47314453125, -3.345703125, -3.21826171875, -3.0908203125, -2.96337890625, -2.8359375, -2.70849609375, -2.5810546875, -2.45361328125, -2.326171875, -2.19873046875, -2.0712890625, -1.94384765625, -1.81640625, -1.68896484375, -1.5615234375, -1.43408203125, -1.306640625, -1.17919921875, -1.0517578125, -0.92431640625, -0.796875, -0.66943359375, -0.5419921875, -0.41455078125, -0.287109375, -0.15966796875, -0.0322265625, 0.09521484375, 0.22265625, 0.35009765625, 0.4775390625, 0.60498046875, 0.732421875, 0.85986328125, 0.9873046875, 1.11474609375, 1.2421875, 1.36962890625, 1.4970703125, 1.62451171875, 1.751953125, 1.87939453125, 2.0068359375, 2.13427734375, 2.26171875, 2.38916015625, 2.5166015625, 2.64404296875, 2.771484375, 2.89892578125, 3.0263671875, 3.15380859375, 3.28125, 3.40869140625, 3.5361328125, 3.66357421875, 3.791015625, 3.91845703125, 4.0458984375, 4.17333984375, 4.30078125]}, "gradients/decoder.roberta.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 2.0, 2.0, 5.0, 10.0, 9.0, 20.0, 17.0, 19.0, 27.0, 32.0, 35.0, 27.0, 38.0, 43.0, 52.0, 54.0, 45.0, 146.0, 1031248.0, 16258.0, 77.0, 49.0, 38.0, 39.0, 32.0, 39.0, 37.0, 38.0, 24.0, 20.0, 23.0, 11.0, 11.0, 9.0, 4.0, 7.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-139.0, -134.8935546875, -130.787109375, -126.6806640625, -122.57421875, -118.4677734375, -114.361328125, -110.2548828125, -106.1484375, -102.0419921875, -97.935546875, -93.8291015625, -89.72265625, -85.6162109375, -81.509765625, -77.4033203125, -73.296875, -69.1904296875, -65.083984375, -60.9775390625, -56.87109375, -52.7646484375, -48.658203125, -44.5517578125, -40.4453125, -36.3388671875, -32.232421875, -28.1259765625, -24.01953125, -19.9130859375, -15.806640625, -11.7001953125, -7.59375, -3.4873046875, 0.619140625, 4.7255859375, 8.83203125, 12.9384765625, 17.044921875, 21.1513671875, 25.2578125, 29.3642578125, 33.470703125, 37.5771484375, 41.68359375, 45.7900390625, 49.896484375, 54.0029296875, 58.109375, 62.2158203125, 66.322265625, 70.4287109375, 74.53515625, 78.6416015625, 82.748046875, 86.8544921875, 90.9609375, 95.0673828125, 99.173828125, 103.2802734375, 107.38671875, 111.4931640625, 115.599609375, 119.7060546875, 123.8125]}, "gradients/decoder.roberta.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 6.0, 12.0, 16.0, 19.0, 20.0, 30.0, 36.0, 26.0, 41.0, 33.0, 36.0, 40.0, 45.0, 49.0, 45.0, 36.0, 47.0, 44.0, 54.0, 55.0, 33.0, 33.0, 32.0, 37.0, 31.0, 21.0, 26.0, 19.0, 17.0, 16.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -4.00048828125, -3.8681640625, -3.73583984375, -3.603515625, -3.47119140625, -3.3388671875, -3.20654296875, -3.07421875, -2.94189453125, -2.8095703125, -2.67724609375, -2.544921875, -2.41259765625, -2.2802734375, -2.14794921875, -2.015625, -1.88330078125, -1.7509765625, -1.61865234375, -1.486328125, -1.35400390625, -1.2216796875, -1.08935546875, -0.95703125, -0.82470703125, -0.6923828125, -0.56005859375, -0.427734375, -0.29541015625, -0.1630859375, -0.03076171875, 0.1015625, 0.23388671875, 0.3662109375, 0.49853515625, 0.630859375, 0.76318359375, 0.8955078125, 1.02783203125, 1.16015625, 1.29248046875, 1.4248046875, 1.55712890625, 1.689453125, 1.82177734375, 1.9541015625, 2.08642578125, 2.21875, 2.35107421875, 2.4833984375, 2.61572265625, 2.748046875, 2.88037109375, 3.0126953125, 3.14501953125, 3.27734375, 3.40966796875, 3.5419921875, 3.67431640625, 3.806640625, 3.93896484375, 4.0712890625, 4.20361328125, 4.3359375]}, "gradients/decoder.roberta.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 8.0, 8.0, 15.0, 17.0, 41.0, 99.0, 166.0, 448.0, 1328.0, 11685.0, 606854.0, 416187.0, 9700.0, 1242.0, 410.0, 168.0, 70.0, 35.0, 16.0, 17.0, 8.0, 8.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.18914794921875, -7.9329833984375, -7.67681884765625, -7.420654296875, -7.16448974609375, -6.9083251953125, -6.65216064453125, -6.39599609375, -6.13983154296875, -5.8836669921875, -5.62750244140625, -5.371337890625, -5.11517333984375, -4.8590087890625, -4.60284423828125, -4.3466796875, -4.09051513671875, -3.8343505859375, -3.57818603515625, -3.322021484375, -3.06585693359375, -2.8096923828125, -2.55352783203125, -2.29736328125, -2.04119873046875, -1.7850341796875, -1.52886962890625, -1.272705078125, -1.01654052734375, -0.7603759765625, -0.50421142578125, -0.248046875, 0.00811767578125, 0.2642822265625, 0.52044677734375, 0.776611328125, 1.03277587890625, 1.2889404296875, 1.54510498046875, 1.80126953125, 2.05743408203125, 2.3135986328125, 2.56976318359375, 2.825927734375, 3.08209228515625, 3.3382568359375, 3.59442138671875, 3.8505859375, 4.10675048828125, 4.3629150390625, 4.61907958984375, 4.875244140625, 5.13140869140625, 5.3875732421875, 5.64373779296875, 5.89990234375, 6.15606689453125, 6.4122314453125, 6.66839599609375, 6.924560546875, 7.18072509765625, 7.4368896484375, 7.69305419921875, 7.94921875]}, "gradients/decoder.roberta.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 8.0, 12.0, 10.0, 24.0, 19.0, 36.0, 55.0, 58.0, 102.0, 167.0, 157.0, 87.0, 69.0, 45.0, 36.0, 26.0, 21.0, 11.0, 7.0, 6.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00038933753967285156, -0.00037881359457969666, -0.00036828964948654175, -0.00035776570439338684, -0.00034724175930023193, -0.000336717814207077, -0.0003261938691139221, -0.0003156699240207672, -0.0003051459789276123, -0.0002946220338344574, -0.0002840980887413025, -0.0002735741436481476, -0.0002630501985549927, -0.00025252625346183777, -0.00024200230836868286, -0.00023147836327552795, -0.00022095441818237305, -0.00021043047308921814, -0.00019990652799606323, -0.00018938258290290833, -0.00017885863780975342, -0.0001683346927165985, -0.0001578107476234436, -0.0001472868025302887, -0.0001367628574371338, -0.00012623891234397888, -0.00011571496725082397, -0.00010519102215766907, -9.466707706451416e-05, -8.414313197135925e-05, -7.361918687820435e-05, -6.309524178504944e-05, -5.257129669189453e-05, -4.2047351598739624e-05, -3.152340650558472e-05, -2.099946141242981e-05, -1.0475516319274902e-05, 4.842877388000488e-08, 1.0572373867034912e-05, 2.109631896018982e-05, 3.1620264053344727e-05, 4.2144209146499634e-05, 5.266815423965454e-05, 6.319209933280945e-05, 7.371604442596436e-05, 8.423998951911926e-05, 9.476393461227417e-05, 0.00010528787970542908, 0.00011581182479858398, 0.0001263357698917389, 0.0001368597149848938, 0.0001473836600780487, 0.0001579076051712036, 0.00016843155026435852, 0.00017895549535751343, 0.00018947944045066833, 0.00020000338554382324, 0.00021052733063697815, 0.00022105127573013306, 0.00023157522082328796, 0.00024209916591644287, 0.0002526231110095978, 0.0002631470561027527, 0.0002736710011959076, 0.0002841949462890625]}, "gradients/decoder.roberta.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 9.0, 17.0, 25.0, 47.0, 70.0, 369.0, 14841.0, 1031320.0, 1525.0, 143.0, 69.0, 37.0, 33.0, 12.0, 5.0, 7.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.203125, -26.333251953125, -25.46337890625, -24.593505859375, -23.7236328125, -22.853759765625, -21.98388671875, -21.114013671875, -20.244140625, -19.374267578125, -18.50439453125, -17.634521484375, -16.7646484375, -15.894775390625, -15.02490234375, -14.155029296875, -13.28515625, -12.415283203125, -11.54541015625, -10.675537109375, -9.8056640625, -8.935791015625, -8.06591796875, -7.196044921875, -6.326171875, -5.456298828125, -4.58642578125, -3.716552734375, -2.8466796875, -1.976806640625, -1.10693359375, -0.237060546875, 0.6328125, 1.502685546875, 2.37255859375, 3.242431640625, 4.1123046875, 4.982177734375, 5.85205078125, 6.721923828125, 7.591796875, 8.461669921875, 9.33154296875, 10.201416015625, 11.0712890625, 11.941162109375, 12.81103515625, 13.680908203125, 14.55078125, 15.420654296875, 16.29052734375, 17.160400390625, 18.0302734375, 18.900146484375, 19.77001953125, 20.639892578125, 21.509765625, 22.379638671875, 23.24951171875, 24.119384765625, 24.9892578125, 25.859130859375, 26.72900390625, 27.598876953125, 28.46875]}, "gradients/decoder.roberta.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 4.0, 7.0, 12.0, 20.0, 33.0, 64.0, 79.0, 138.0, 207.0, 172.0, 98.0, 59.0, 42.0, 21.0, 15.0, 8.0, 6.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2285919189453125, -1.188629150390625, -1.1486663818359375, -1.10870361328125, -1.0687408447265625, -1.028778076171875, -0.9888153076171875, -0.9488525390625, -0.9088897705078125, -0.868927001953125, -0.8289642333984375, -0.78900146484375, -0.7490386962890625, -0.709075927734375, -0.6691131591796875, -0.629150390625, -0.5891876220703125, -0.549224853515625, -0.5092620849609375, -0.46929931640625, -0.4293365478515625, -0.389373779296875, -0.3494110107421875, -0.3094482421875, -0.2694854736328125, -0.229522705078125, -0.1895599365234375, -0.14959716796875, -0.1096343994140625, -0.069671630859375, -0.0297088623046875, 0.01025390625, 0.0502166748046875, 0.090179443359375, 0.1301422119140625, 0.17010498046875, 0.2100677490234375, 0.250030517578125, 0.2899932861328125, 0.3299560546875, 0.3699188232421875, 0.409881591796875, 0.4498443603515625, 0.48980712890625, 0.5297698974609375, 0.569732666015625, 0.6096954345703125, 0.649658203125, 0.6896209716796875, 0.729583740234375, 0.7695465087890625, 0.80950927734375, 0.8494720458984375, 0.889434814453125, 0.9293975830078125, 0.9693603515625, 1.0093231201171875, 1.049285888671875, 1.0892486572265625, 1.12921142578125, 1.1691741943359375, 1.209136962890625, 1.2490997314453125, 1.2890625]}, "gradients/decoder.roberta.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 9.0, 18.0, 88.0, 160.0, 197.0, 239.0, 160.0, 97.0, 25.0, 13.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.09303092956543, -14.621273040771484, -14.149514198303223, -13.677756309509277, -13.205998420715332, -12.73423957824707, -12.262481689453125, -11.79072380065918, -11.318965911865234, -10.847208023071289, -10.375449180603027, -9.903691291809082, -9.431933403015137, -8.960174560546875, -8.48841667175293, -8.016658782958984, -7.544899940490723, -7.073141574859619, -6.601383686065674, -6.12962532043457, -5.657867431640625, -5.1861090660095215, -4.714350700378418, -4.242592811584473, -3.770834445953369, -3.2990763187408447, -2.8273181915283203, -2.355559825897217, -1.8838016986846924, -1.412043571472168, -0.9402852058410645, -0.46852707862854004, 0.0032320022583007812, 0.47499018907546997, 0.9467483758926392, 1.4185066223144531, 1.8902647495269775, 2.362022876739502, 2.8337812423706055, 3.30553936958313, 3.7772974967956543, 4.249055862426758, 4.720813751220703, 5.192572116851807, 5.66433048248291, 6.1360883712768555, 6.607846736907959, 7.0796051025390625, 7.551362991333008, 8.023120880126953, 8.494879722595215, 8.96663761138916, 9.438395500183105, 9.910154342651367, 10.381912231445312, 10.853670120239258, 11.325428009033203, 11.797185897827148, 12.26894474029541, 12.740702629089355, 13.2124605178833, 13.684219360351562, 14.155977249145508, 14.627735137939453, 15.099493980407715]}, "gradients/decoder.roberta.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 7.0, 8.0, 6.0, 5.0, 7.0, 7.0, 9.0, 15.0, 6.0, 7.0, 13.0, 16.0, 16.0, 25.0, 26.0, 22.0, 26.0, 28.0, 36.0, 30.0, 44.0, 39.0, 40.0, 40.0, 44.0, 42.0, 37.0, 38.0, 38.0, 34.0, 33.0, 28.0, 31.0, 22.0, 18.0, 24.0, 22.0, 19.0, 18.0, 10.0, 9.0, 21.0, 11.0, 4.0, 7.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.172963619232178, -4.9936089515686035, -4.814253807067871, -4.634899139404297, -4.4555439949035645, -4.27618932723999, -4.096834182739258, -3.9174795150756836, -3.7381246089935303, -3.558769702911377, -3.3794147968292236, -3.2000598907470703, -3.020705223083496, -2.8413500785827637, -2.6619954109191895, -2.482640504837036, -2.303285598754883, -2.1239306926727295, -1.9445757865905762, -1.7652209997177124, -1.585866093635559, -1.4065111875534058, -1.227156400680542, -1.0478014945983887, -0.8684465885162354, -0.689091682434082, -0.5097368359565735, -0.33038198947906494, -0.15102708339691162, 0.0283278226852417, 0.20768260955810547, 0.3870375156402588, 0.5663919448852539, 0.7457468509674072, 0.9251016974449158, 1.1044565439224243, 1.2838114500045776, 1.463166356086731, 1.6425211429595947, 1.821876049041748, 2.0012309551239014, 2.1805858612060547, 2.359940767288208, 2.5392956733703613, 2.7186503410339355, 2.898005485534668, 3.077360153198242, 3.2567150592803955, 3.436069965362549, 3.615424871444702, 3.7947797775268555, 3.9741344451904297, 4.153489589691162, 4.332844257354736, 4.512199401855469, 4.691554069519043, 4.870908737182617, 5.050263404846191, 5.229618549346924, 5.408973217010498, 5.5883283615112305, 5.767683029174805, 5.947037696838379, 6.126392841339111, 6.305747985839844]}, "gradients/decoder.roberta.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 10.0, 6.0, 8.0, 9.0, 14.0, 18.0, 34.0, 41.0, 54.0, 71.0, 117.0, 165.0, 369.0, 651.0, 1650.0, 5268.0, 23098.0, 164112.0, 1905052.0, 1896186.0, 165286.0, 23468.0, 5375.0, 1700.0, 683.0, 334.0, 160.0, 114.0, 63.0, 48.0, 30.0, 23.0, 18.0, 18.0, 6.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.078125, -11.7330322265625, -11.387939453125, -11.0428466796875, -10.69775390625, -10.3526611328125, -10.007568359375, -9.6624755859375, -9.3173828125, -8.9722900390625, -8.627197265625, -8.2821044921875, -7.93701171875, -7.5919189453125, -7.246826171875, -6.9017333984375, -6.556640625, -6.2115478515625, -5.866455078125, -5.5213623046875, -5.17626953125, -4.8311767578125, -4.486083984375, -4.1409912109375, -3.7958984375, -3.4508056640625, -3.105712890625, -2.7606201171875, -2.41552734375, -2.0704345703125, -1.725341796875, -1.3802490234375, -1.03515625, -0.6900634765625, -0.344970703125, 0.0001220703125, 0.34521484375, 0.6903076171875, 1.035400390625, 1.3804931640625, 1.7255859375, 2.0706787109375, 2.415771484375, 2.7608642578125, 3.10595703125, 3.4510498046875, 3.796142578125, 4.1412353515625, 4.486328125, 4.8314208984375, 5.176513671875, 5.5216064453125, 5.86669921875, 6.2117919921875, 6.556884765625, 6.9019775390625, 7.2470703125, 7.5921630859375, 7.937255859375, 8.2823486328125, 8.62744140625, 8.9725341796875, 9.317626953125, 9.6627197265625, 10.0078125]}, "gradients/decoder.roberta.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 8.0, 8.0, 7.0, 7.0, 6.0, 11.0, 12.0, 13.0, 16.0, 15.0, 24.0, 26.0, 30.0, 25.0, 39.0, 31.0, 32.0, 42.0, 37.0, 34.0, 41.0, 35.0, 47.0, 41.0, 49.0, 36.0, 28.0, 35.0, 35.0, 25.0, 27.0, 19.0, 28.0, 19.0, 19.0, 17.0, 15.0, 8.0, 10.0, 4.0, 9.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.45703125, -3.33984375, -3.22265625, -3.10546875, -2.98828125, -2.87109375, -2.75390625, -2.63671875, -2.51953125, -2.40234375, -2.28515625, -2.16796875, -2.05078125, -1.93359375, -1.81640625, -1.69921875, -1.58203125, -1.46484375, -1.34765625, -1.23046875, -1.11328125, -0.99609375, -0.87890625, -0.76171875, -0.64453125, -0.52734375, -0.41015625, -0.29296875, -0.17578125, -0.05859375, 0.05859375, 0.17578125, 0.29296875, 0.41015625, 0.52734375, 0.64453125, 0.76171875, 0.87890625, 0.99609375, 1.11328125, 1.23046875, 1.34765625, 1.46484375, 1.58203125, 1.69921875, 1.81640625, 1.93359375, 2.05078125, 2.16796875, 2.28515625, 2.40234375, 2.51953125, 2.63671875, 2.75390625, 2.87109375, 2.98828125, 3.10546875, 3.22265625, 3.33984375, 3.45703125, 3.57421875, 3.69140625, 3.80859375, 3.92578125, 4.04296875]}, "gradients/decoder.roberta.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 3.0, 3.0, 8.0, 20.0, 23.0, 33.0, 47.0, 73.0, 91.0, 133.0, 198.0, 294.0, 528.0, 4129.0, 4155010.0, 31905.0, 766.0, 308.0, 199.0, 144.0, 110.0, 79.0, 57.0, 35.0, 28.0, 17.0, 7.0, 9.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.875, -61.7919921875, -59.708984375, -57.6259765625, -55.54296875, -53.4599609375, -51.376953125, -49.2939453125, -47.2109375, -45.1279296875, -43.044921875, -40.9619140625, -38.87890625, -36.7958984375, -34.712890625, -32.6298828125, -30.546875, -28.4638671875, -26.380859375, -24.2978515625, -22.21484375, -20.1318359375, -18.048828125, -15.9658203125, -13.8828125, -11.7998046875, -9.716796875, -7.6337890625, -5.55078125, -3.4677734375, -1.384765625, 0.6982421875, 2.78125, 4.8642578125, 6.947265625, 9.0302734375, 11.11328125, 13.1962890625, 15.279296875, 17.3623046875, 19.4453125, 21.5283203125, 23.611328125, 25.6943359375, 27.77734375, 29.8603515625, 31.943359375, 34.0263671875, 36.109375, 38.1923828125, 40.275390625, 42.3583984375, 44.44140625, 46.5244140625, 48.607421875, 50.6904296875, 52.7734375, 54.8564453125, 56.939453125, 59.0224609375, 61.10546875, 63.1884765625, 65.271484375, 67.3544921875, 69.4375]}, "gradients/decoder.roberta.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 3.0, 5.0, 8.0, 13.0, 16.0, 24.0, 32.0, 56.0, 80.0, 93.0, 158.0, 206.0, 268.0, 383.0, 492.0, 557.0, 426.0, 378.0, 265.0, 178.0, 126.0, 87.0, 71.0, 44.0, 27.0, 24.0, 18.0, 14.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.8575439453125, -2.771728515625, -2.6859130859375, -2.60009765625, -2.5142822265625, -2.428466796875, -2.3426513671875, -2.2568359375, -2.1710205078125, -2.085205078125, -1.9993896484375, -1.91357421875, -1.8277587890625, -1.741943359375, -1.6561279296875, -1.5703125, -1.4844970703125, -1.398681640625, -1.3128662109375, -1.22705078125, -1.1412353515625, -1.055419921875, -0.9696044921875, -0.8837890625, -0.7979736328125, -0.712158203125, -0.6263427734375, -0.54052734375, -0.4547119140625, -0.368896484375, -0.2830810546875, -0.197265625, -0.1114501953125, -0.025634765625, 0.0601806640625, 0.14599609375, 0.2318115234375, 0.317626953125, 0.4034423828125, 0.4892578125, 0.5750732421875, 0.660888671875, 0.7467041015625, 0.83251953125, 0.9183349609375, 1.004150390625, 1.0899658203125, 1.17578125, 1.2615966796875, 1.347412109375, 1.4332275390625, 1.51904296875, 1.6048583984375, 1.690673828125, 1.7764892578125, 1.8623046875, 1.9481201171875, 2.033935546875, 2.1197509765625, 2.20556640625, 2.2913818359375, 2.377197265625, 2.4630126953125, 2.548828125]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 17.0, 46.0, 72.0, 107.0, 166.0, 191.0, 163.0, 101.0, 75.0, 31.0, 17.0, 9.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.263086318969727, -16.933610916137695, -16.604135513305664, -16.274660110473633, -15.945183753967285, -15.615708351135254, -15.286231994628906, -14.956756591796875, -14.627281188964844, -14.297805786132812, -13.968330383300781, -13.638854026794434, -13.309378623962402, -12.979903221130371, -12.650426864624023, -12.320951461791992, -11.991476058959961, -11.66200065612793, -11.332525253295898, -11.00304889678955, -10.67357349395752, -10.344098091125488, -10.01462173461914, -9.68514633178711, -9.355670928955078, -9.026195526123047, -8.696720123291016, -8.367243766784668, -8.037768363952637, -7.7082929611206055, -7.378817081451416, -7.049341201782227, -6.719865798950195, -6.390390396118164, -6.060914516448975, -5.731438636779785, -5.401963233947754, -5.072487831115723, -4.743011951446533, -4.413536071777344, -4.0840606689453125, -3.754585027694702, -3.425109386444092, -3.0956337451934814, -2.766158103942871, -2.4366824626922607, -2.1072068214416504, -1.77773118019104, -1.4482553005218506, -1.1187796592712402, -0.7893040180206299, -0.45982837677001953, -0.13035273551940918, 0.19912290573120117, 0.5285985469818115, 0.8580741882324219, 1.1875498294830322, 1.5170254707336426, 1.846501111984253, 2.1759767532348633, 2.5054523944854736, 2.834928035736084, 3.1644036769866943, 3.4938793182373047, 3.823354959487915]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 4.0, 12.0, 8.0, 8.0, 17.0, 18.0, 15.0, 18.0, 20.0, 22.0, 27.0, 27.0, 19.0, 42.0, 42.0, 34.0, 51.0, 48.0, 40.0, 55.0, 44.0, 40.0, 45.0, 56.0, 25.0, 26.0, 35.0, 29.0, 20.0, 19.0, 16.0, 22.0, 18.0, 17.0, 9.0, 12.0, 8.0, 6.0, 7.0, 9.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.365730285644531, -4.227023124694824, -4.088315963745117, -3.949608564376831, -3.810901403427124, -3.672194004058838, -3.533486843109131, -3.394779682159424, -3.256072521209717, -3.1173653602600098, -2.9786579608917236, -2.8399507999420166, -2.7012436389923096, -2.5625362396240234, -2.4238290786743164, -2.2851219177246094, -2.1464145183563232, -2.007707357406616, -1.8690000772476196, -1.730292797088623, -1.591585636138916, -1.4528783559799194, -1.3141710758209229, -1.1754639148712158, -1.0367566347122192, -0.8980494141578674, -0.7593421936035156, -0.620634913444519, -0.48192769289016724, -0.34322047233581543, -0.20451319217681885, -0.06580597162246704, 0.07290124893188477, 0.21160848438739777, 0.35031571984291077, 0.48902297019958496, 0.6277301907539368, 0.7664374113082886, 0.9051446914672852, 1.0438518524169922, 1.1825591325759888, 1.3212664127349854, 1.4599735736846924, 1.598680853843689, 1.7373881340026855, 1.8760952949523926, 2.0148024559020996, 2.1535098552703857, 2.2922170162200928, 2.4309241771698, 2.569631576538086, 2.708338737487793, 2.8470458984375, 2.985753059387207, 3.124460458755493, 3.2631676197052, 3.4018750190734863, 3.5405821800231934, 3.6792895793914795, 3.8179967403411865, 3.9567039012908936, 4.09541130065918, 4.234118461608887, 4.372825622558594, 4.511532783508301]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 13.0, 12.0, 22.0, 35.0, 40.0, 53.0, 100.0, 154.0, 233.0, 369.0, 589.0, 947.0, 1543.0, 2548.0, 4052.0, 6635.0, 10928.0, 18010.0, 30259.0, 54118.0, 99028.0, 179100.0, 235770.0, 176601.0, 98331.0, 52599.0, 30398.0, 17768.0, 10866.0, 6515.0, 4127.0, 2461.0, 1592.0, 989.0, 692.0, 357.0, 244.0, 158.0, 99.0, 55.0, 46.0, 31.0, 18.0, 20.0, 8.0, 7.0, 3.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.7890625, -0.7655029296875, -0.741943359375, -0.7183837890625, -0.69482421875, -0.6712646484375, -0.647705078125, -0.6241455078125, -0.6005859375, -0.5770263671875, -0.553466796875, -0.5299072265625, -0.50634765625, -0.4827880859375, -0.459228515625, -0.4356689453125, -0.412109375, -0.3885498046875, -0.364990234375, -0.3414306640625, -0.31787109375, -0.2943115234375, -0.270751953125, -0.2471923828125, -0.2236328125, -0.2000732421875, -0.176513671875, -0.1529541015625, -0.12939453125, -0.1058349609375, -0.082275390625, -0.0587158203125, -0.03515625, -0.0115966796875, 0.011962890625, 0.0355224609375, 0.05908203125, 0.0826416015625, 0.106201171875, 0.1297607421875, 0.1533203125, 0.1768798828125, 0.200439453125, 0.2239990234375, 0.24755859375, 0.2711181640625, 0.294677734375, 0.3182373046875, 0.341796875, 0.3653564453125, 0.388916015625, 0.4124755859375, 0.43603515625, 0.4595947265625, 0.483154296875, 0.5067138671875, 0.5302734375, 0.5538330078125, 0.577392578125, 0.6009521484375, 0.62451171875, 0.6480712890625, 0.671630859375, 0.6951904296875, 0.71875]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 17.0, 18.0, 19.0, 18.0, 20.0, 21.0, 27.0, 24.0, 25.0, 44.0, 38.0, 39.0, 51.0, 43.0, 42.0, 53.0, 44.0, 40.0, 53.0, 41.0, 25.0, 31.0, 32.0, 30.0, 17.0, 20.0, 15.0, 20.0, 19.0, 17.0, 10.0, 10.0, 8.0, 6.0, 7.0, 8.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.34375, -4.20794677734375, -4.0721435546875, -3.93634033203125, -3.800537109375, -3.66473388671875, -3.5289306640625, -3.39312744140625, -3.25732421875, -3.12152099609375, -2.9857177734375, -2.84991455078125, -2.714111328125, -2.57830810546875, -2.4425048828125, -2.30670166015625, -2.1708984375, -2.03509521484375, -1.8992919921875, -1.76348876953125, -1.627685546875, -1.49188232421875, -1.3560791015625, -1.22027587890625, -1.08447265625, -0.94866943359375, -0.8128662109375, -0.67706298828125, -0.541259765625, -0.40545654296875, -0.2696533203125, -0.13385009765625, 0.001953125, 0.13775634765625, 0.2735595703125, 0.40936279296875, 0.545166015625, 0.68096923828125, 0.8167724609375, 0.95257568359375, 1.08837890625, 1.22418212890625, 1.3599853515625, 1.49578857421875, 1.631591796875, 1.76739501953125, 1.9031982421875, 2.03900146484375, 2.1748046875, 2.31060791015625, 2.4464111328125, 2.58221435546875, 2.718017578125, 2.85382080078125, 2.9896240234375, 3.12542724609375, 3.26123046875, 3.39703369140625, 3.5328369140625, 3.66864013671875, 3.804443359375, 3.94024658203125, 4.0760498046875, 4.21185302734375, 4.34765625]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 9.0, 20.0, 23.0, 25.0, 29.0, 37.0, 58.0, 76.0, 97.0, 112.0, 145.0, 214.0, 305.0, 401.0, 610.0, 1029.0, 1682.0, 3403.0, 7282.0, 17330.0, 52984.0, 891917.0, 42358.0, 14621.0, 6250.0, 2946.0, 1595.0, 921.0, 571.0, 392.0, 269.0, 201.0, 154.0, 109.0, 94.0, 62.0, 46.0, 35.0, 28.0, 30.0, 18.0, 18.0, 12.0, 6.0, 8.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.921875, -1.860687255859375, -1.79949951171875, -1.738311767578125, -1.6771240234375, -1.615936279296875, -1.55474853515625, -1.493560791015625, -1.432373046875, -1.371185302734375, -1.30999755859375, -1.248809814453125, -1.1876220703125, -1.126434326171875, -1.06524658203125, -1.004058837890625, -0.94287109375, -0.881683349609375, -0.82049560546875, -0.759307861328125, -0.6981201171875, -0.636932373046875, -0.57574462890625, -0.514556884765625, -0.453369140625, -0.392181396484375, -0.33099365234375, -0.269805908203125, -0.2086181640625, -0.147430419921875, -0.08624267578125, -0.025054931640625, 0.0361328125, 0.097320556640625, 0.15850830078125, 0.219696044921875, 0.2808837890625, 0.342071533203125, 0.40325927734375, 0.464447021484375, 0.525634765625, 0.586822509765625, 0.64801025390625, 0.709197998046875, 0.7703857421875, 0.831573486328125, 0.89276123046875, 0.953948974609375, 1.01513671875, 1.076324462890625, 1.13751220703125, 1.198699951171875, 1.2598876953125, 1.321075439453125, 1.38226318359375, 1.443450927734375, 1.504638671875, 1.565826416015625, 1.62701416015625, 1.688201904296875, 1.7493896484375, 1.810577392578125, 1.87176513671875, 1.932952880859375, 1.994140625]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 9.0, 14.0, 9.0, 9.0, 12.0, 18.0, 24.0, 25.0, 18.0, 25.0, 23.0, 30.0, 35.0, 26.0, 31.0, 35.0, 41.0, 38.0, 33.0, 44.0, 27.0, 34.0, 38.0, 33.0, 41.0, 36.0, 24.0, 31.0, 30.0, 22.0, 25.0, 23.0, 19.0, 19.0, 14.0, 15.0, 7.0, 11.0, 8.0, 9.0, 9.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.330078125, -2.251190185546875, -2.17230224609375, -2.093414306640625, -2.0145263671875, -1.935638427734375, -1.85675048828125, -1.777862548828125, -1.698974609375, -1.620086669921875, -1.54119873046875, -1.462310791015625, -1.3834228515625, -1.304534912109375, -1.22564697265625, -1.146759033203125, -1.06787109375, -0.988983154296875, -0.91009521484375, -0.831207275390625, -0.7523193359375, -0.673431396484375, -0.59454345703125, -0.515655517578125, -0.436767578125, -0.357879638671875, -0.27899169921875, -0.200103759765625, -0.1212158203125, -0.042327880859375, 0.03656005859375, 0.115447998046875, 0.1943359375, 0.273223876953125, 0.35211181640625, 0.430999755859375, 0.5098876953125, 0.588775634765625, 0.66766357421875, 0.746551513671875, 0.825439453125, 0.904327392578125, 0.98321533203125, 1.062103271484375, 1.1409912109375, 1.219879150390625, 1.29876708984375, 1.377655029296875, 1.45654296875, 1.535430908203125, 1.61431884765625, 1.693206787109375, 1.7720947265625, 1.850982666015625, 1.92987060546875, 2.008758544921875, 2.087646484375, 2.166534423828125, 2.24542236328125, 2.324310302734375, 2.4031982421875, 2.482086181640625, 2.56097412109375, 2.639862060546875, 2.71875]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 5.0, 5.0, 4.0, 17.0, 13.0, 22.0, 37.0, 47.0, 72.0, 101.0, 225.0, 320.0, 555.0, 1139.0, 2700.0, 8733.0, 60316.0, 952201.0, 14934.0, 3829.0, 1584.0, 719.0, 353.0, 209.0, 140.0, 87.0, 47.0, 54.0, 28.0, 16.0, 12.0, 7.0, 7.0, 3.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466064453125, -0.4524269104003906, -0.43878936767578125, -0.4251518249511719, -0.4115142822265625, -0.3978767395019531, -0.38423919677734375, -0.3706016540527344, -0.356964111328125, -0.3433265686035156, -0.32968902587890625, -0.3160514831542969, -0.3024139404296875, -0.2887763977050781, -0.27513885498046875, -0.2615013122558594, -0.24786376953125, -0.23422622680664062, -0.22058868408203125, -0.20695114135742188, -0.1933135986328125, -0.17967605590820312, -0.16603851318359375, -0.15240097045898438, -0.138763427734375, -0.12512588500976562, -0.11148834228515625, -0.09785079956054688, -0.0842132568359375, -0.07057571411132812, -0.05693817138671875, -0.043300628662109375, -0.0296630859375, -0.016025543212890625, -0.00238800048828125, 0.011249542236328125, 0.0248870849609375, 0.038524627685546875, 0.05216217041015625, 0.06579971313476562, 0.079437255859375, 0.09307479858398438, 0.10671234130859375, 0.12034988403320312, 0.1339874267578125, 0.14762496948242188, 0.16126251220703125, 0.17490005493164062, 0.18853759765625, 0.20217514038085938, 0.21581268310546875, 0.22945022583007812, 0.2430877685546875, 0.2567253112792969, 0.27036285400390625, 0.2840003967285156, 0.297637939453125, 0.3112754821777344, 0.32491302490234375, 0.3385505676269531, 0.3521881103515625, 0.3658256530761719, 0.37946319580078125, 0.3931007385253906, 0.40673828125]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 7.0, 4.0, 10.0, 4.0, 13.0, 14.0, 21.0, 31.0, 44.0, 61.0, 68.0, 77.0, 90.0, 82.0, 91.0, 73.0, 61.0, 55.0, 45.0, 33.0, 25.0, 15.0, 22.0, 7.0, 12.0, 5.0, 4.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5881996154785156e-05, -3.479141741991043e-05, -3.3700838685035706e-05, -3.261025995016098e-05, -3.1519681215286255e-05, -3.042910248041153e-05, -2.9338523745536804e-05, -2.824794501066208e-05, -2.7157366275787354e-05, -2.6066787540912628e-05, -2.4976208806037903e-05, -2.3885630071163177e-05, -2.2795051336288452e-05, -2.1704472601413727e-05, -2.0613893866539e-05, -1.9523315131664276e-05, -1.843273639678955e-05, -1.7342157661914825e-05, -1.62515789270401e-05, -1.5161000192165375e-05, -1.407042145729065e-05, -1.2979842722415924e-05, -1.1889263987541199e-05, -1.0798685252666473e-05, -9.708106517791748e-06, -8.617527782917023e-06, -7.526949048042297e-06, -6.436370313167572e-06, -5.345791578292847e-06, -4.255212843418121e-06, -3.164634108543396e-06, -2.0740553736686707e-06, -9.834766387939453e-07, 1.0710209608078003e-07, 1.1976808309555054e-06, 2.2882595658302307e-06, 3.378838300704956e-06, 4.469417035579681e-06, 5.559995770454407e-06, 6.650574505329132e-06, 7.741153240203857e-06, 8.831731975078583e-06, 9.922310709953308e-06, 1.1012889444828033e-05, 1.2103468179702759e-05, 1.3194046914577484e-05, 1.428462564945221e-05, 1.5375204384326935e-05, 1.646578311920166e-05, 1.7556361854076385e-05, 1.864694058895111e-05, 1.9737519323825836e-05, 2.082809805870056e-05, 2.1918676793575287e-05, 2.3009255528450012e-05, 2.4099834263324738e-05, 2.5190412998199463e-05, 2.6280991733074188e-05, 2.7371570467948914e-05, 2.846214920282364e-05, 2.9552727937698364e-05, 3.064330667257309e-05, 3.1733885407447815e-05, 3.282446414232254e-05, 3.3915042877197266e-05]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 1.0, 4.0, 2.0, 6.0, 7.0, 4.0, 8.0, 14.0, 8.0, 16.0, 16.0, 22.0, 31.0, 31.0, 44.0, 96.0, 185.0, 1687.0, 590892.0, 453412.0, 1535.0, 222.0, 102.0, 53.0, 26.0, 21.0, 25.0, 17.0, 10.0, 9.0, 8.0, 10.0, 1.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.94970703125, -0.9225616455078125, -0.895416259765625, -0.8682708740234375, -0.84112548828125, -0.8139801025390625, -0.786834716796875, -0.7596893310546875, -0.7325439453125, -0.7053985595703125, -0.678253173828125, -0.6511077880859375, -0.62396240234375, -0.5968170166015625, -0.569671630859375, -0.5425262451171875, -0.515380859375, -0.4882354736328125, -0.461090087890625, -0.4339447021484375, -0.40679931640625, -0.3796539306640625, -0.352508544921875, -0.3253631591796875, -0.2982177734375, -0.2710723876953125, -0.243927001953125, -0.2167816162109375, -0.18963623046875, -0.1624908447265625, -0.135345458984375, -0.1082000732421875, -0.0810546875, -0.0539093017578125, -0.026763916015625, 0.0003814697265625, 0.02752685546875, 0.0546722412109375, 0.081817626953125, 0.1089630126953125, 0.1361083984375, 0.1632537841796875, 0.190399169921875, 0.2175445556640625, 0.24468994140625, 0.2718353271484375, 0.298980712890625, 0.3261260986328125, 0.353271484375, 0.3804168701171875, 0.407562255859375, 0.4347076416015625, 0.46185302734375, 0.4889984130859375, 0.516143798828125, 0.5432891845703125, 0.5704345703125, 0.5975799560546875, 0.624725341796875, 0.6518707275390625, 0.67901611328125, 0.7061614990234375, 0.733306884765625, 0.7604522705078125, 0.78759765625]}, "gradients/decoder.roberta.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 6.0, 8.0, 7.0, 6.0, 8.0, 16.0, 20.0, 15.0, 23.0, 34.0, 49.0, 61.0, 88.0, 89.0, 93.0, 110.0, 68.0, 69.0, 41.0, 34.0, 20.0, 29.0, 16.0, 18.0, 12.0, 11.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033355712890625, -0.032141685485839844, -0.030927658081054688, -0.02971363067626953, -0.028499603271484375, -0.02728557586669922, -0.026071548461914062, -0.024857521057128906, -0.02364349365234375, -0.022429466247558594, -0.021215438842773438, -0.02000141143798828, -0.018787384033203125, -0.01757335662841797, -0.016359329223632812, -0.015145301818847656, -0.0139312744140625, -0.012717247009277344, -0.011503219604492188, -0.010289192199707031, -0.009075164794921875, -0.007861137390136719, -0.0066471099853515625, -0.005433082580566406, -0.00421905517578125, -0.0030050277709960938, -0.0017910003662109375, -0.0005769729614257812, 0.000637054443359375, 0.0018510818481445312, 0.0030651092529296875, 0.004279136657714844, 0.0054931640625, 0.006707191467285156, 0.007921218872070312, 0.009135246276855469, 0.010349273681640625, 0.011563301086425781, 0.012777328491210938, 0.013991355895996094, 0.01520538330078125, 0.016419410705566406, 0.017633438110351562, 0.01884746551513672, 0.020061492919921875, 0.02127552032470703, 0.022489547729492188, 0.023703575134277344, 0.0249176025390625, 0.026131629943847656, 0.027345657348632812, 0.02855968475341797, 0.029773712158203125, 0.03098773956298828, 0.03220176696777344, 0.033415794372558594, 0.03462982177734375, 0.035843849182128906, 0.03705787658691406, 0.03827190399169922, 0.039485931396484375, 0.04069995880126953, 0.04191398620605469, 0.043128013610839844, 0.044342041015625]}, "gradients/decoder.roberta.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 6.0, 37.0, 95.0, 162.0, 258.0, 241.0, 131.0, 49.0, 23.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.03461265563965, -15.558653831481934, -15.082695007324219, -14.606735229492188, -14.130776405334473, -13.654817581176758, -13.178857803344727, -12.702898979187012, -12.226940155029297, -11.750981330871582, -11.275022506713867, -10.799062728881836, -10.323103904724121, -9.847145080566406, -9.371185302734375, -8.89522647857666, -8.419267654418945, -7.9433088302612305, -7.467349529266357, -6.991390228271484, -6.5154314041137695, -6.039472579956055, -5.563513278961182, -5.087553977966309, -4.611595153808594, -4.135636329650879, -3.659677028656006, -3.183717966079712, -2.707758903503418, -2.231799840927124, -1.75584077835083, -1.2798817157745361, -0.8039236068725586, -0.32796454429626465, 0.1479945182800293, 0.6239535808563232, 1.0999126434326172, 1.5758717060089111, 2.051830768585205, 2.527789831161499, 3.003748893737793, 3.479707956314087, 3.955667018890381, 4.431626319885254, 4.907585144042969, 5.383543968200684, 5.859503269195557, 6.33546257019043, 6.8114213943481445, 7.287380218505859, 7.763339519500732, 8.239298820495605, 8.71525764465332, 9.191216468811035, 9.66717529296875, 10.143135070800781, 10.619093894958496, 11.095052719116211, 11.571012496948242, 12.046971321105957, 12.522930145263672, 12.998888969421387, 13.474847793579102, 13.950807571411133, 14.426766395568848]}, "gradients/decoder.roberta.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 6.0, 8.0, 9.0, 10.0, 16.0, 20.0, 18.0, 18.0, 20.0, 20.0, 29.0, 23.0, 25.0, 44.0, 38.0, 37.0, 52.0, 44.0, 44.0, 52.0, 43.0, 41.0, 51.0, 43.0, 25.0, 29.0, 33.0, 30.0, 17.0, 21.0, 15.0, 19.0, 19.0, 18.0, 9.0, 11.0, 7.0, 6.0, 7.0, 8.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.343925952911377, -4.208105087280273, -4.072284698486328, -3.9364638328552246, -3.800642967224121, -3.6648223400115967, -3.5290017127990723, -3.3931808471679688, -3.2573602199554443, -3.12153959274292, -2.9857187271118164, -2.849898099899292, -2.7140774726867676, -2.578256607055664, -2.4424359798431396, -2.3066153526306152, -2.1707944869995117, -2.0349738597869873, -1.8991529941558838, -1.7633323669433594, -1.6275116205215454, -1.4916908740997314, -1.355870246887207, -1.220049500465393, -1.084228754043579, -0.9484080076217651, -0.812587320804596, -0.6767666339874268, -0.5409458875656128, -0.40512514114379883, -0.26930445432662964, -0.13348376750946045, 0.0023369789123535156, 0.1381576955318451, 0.27397841215133667, 0.40979912877082825, 0.5456198453903198, 0.6814405918121338, 0.817261278629303, 0.9530819654464722, 1.0889027118682861, 1.2247234582901, 1.360544204711914, 1.4963648319244385, 1.6321855783462524, 1.7680063247680664, 1.9038269519805908, 2.0396475791931152, 2.1754684448242188, 2.311289072036743, 2.4471099376678467, 2.582930564880371, 2.7187514305114746, 2.854572057723999, 2.9903926849365234, 3.126213550567627, 3.2620341777801514, 3.397854804992676, 3.5336756706237793, 3.6694962978363037, 3.805316925048828, 3.9411377906799316, 4.076958656311035, 4.2127790451049805, 4.348599910736084]}, "gradients/decoder.roberta.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 11.0, 13.0, 13.0, 23.0, 37.0, 41.0, 82.0, 109.0, 156.0, 198.0, 336.0, 564.0, 999.0, 1862.0, 3524.0, 6760.0, 12903.0, 24999.0, 48125.0, 94167.0, 201797.0, 308368.0, 172347.0, 82587.0, 41912.0, 22098.0, 11404.0, 6034.0, 3124.0, 1615.0, 892.0, 496.0, 305.0, 189.0, 134.0, 89.0, 71.0, 41.0, 29.0, 21.0, 15.0, 12.0, 13.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0], "bins": [-4.421875, -4.285400390625, -4.14892578125, -4.012451171875, -3.8759765625, -3.739501953125, -3.60302734375, -3.466552734375, -3.330078125, -3.193603515625, -3.05712890625, -2.920654296875, -2.7841796875, -2.647705078125, -2.51123046875, -2.374755859375, -2.23828125, -2.101806640625, -1.96533203125, -1.828857421875, -1.6923828125, -1.555908203125, -1.41943359375, -1.282958984375, -1.146484375, -1.010009765625, -0.87353515625, -0.737060546875, -0.6005859375, -0.464111328125, -0.32763671875, -0.191162109375, -0.0546875, 0.081787109375, 0.21826171875, 0.354736328125, 0.4912109375, 0.627685546875, 0.76416015625, 0.900634765625, 1.037109375, 1.173583984375, 1.31005859375, 1.446533203125, 1.5830078125, 1.719482421875, 1.85595703125, 1.992431640625, 2.12890625, 2.265380859375, 2.40185546875, 2.538330078125, 2.6748046875, 2.811279296875, 2.94775390625, 3.084228515625, 3.220703125, 3.357177734375, 3.49365234375, 3.630126953125, 3.7666015625, 3.903076171875, 4.03955078125, 4.176025390625, 4.3125]}, "gradients/decoder.roberta.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 5.0, 7.0, 8.0, 11.0, 13.0, 12.0, 19.0, 20.0, 18.0, 17.0, 22.0, 28.0, 20.0, 37.0, 41.0, 33.0, 42.0, 44.0, 34.0, 49.0, 43.0, 48.0, 37.0, 42.0, 48.0, 35.0, 22.0, 34.0, 31.0, 20.0, 19.0, 19.0, 17.0, 14.0, 18.0, 14.0, 9.0, 9.0, 6.0, 7.0, 4.0, 6.0, 5.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.486328125, -3.37396240234375, -3.2615966796875, -3.14923095703125, -3.036865234375, -2.92449951171875, -2.8121337890625, -2.69976806640625, -2.58740234375, -2.47503662109375, -2.3626708984375, -2.25030517578125, -2.137939453125, -2.02557373046875, -1.9132080078125, -1.80084228515625, -1.6884765625, -1.57611083984375, -1.4637451171875, -1.35137939453125, -1.239013671875, -1.12664794921875, -1.0142822265625, -0.90191650390625, -0.78955078125, -0.67718505859375, -0.5648193359375, -0.45245361328125, -0.340087890625, -0.22772216796875, -0.1153564453125, -0.00299072265625, 0.109375, 0.22174072265625, 0.3341064453125, 0.44647216796875, 0.558837890625, 0.67120361328125, 0.7835693359375, 0.89593505859375, 1.00830078125, 1.12066650390625, 1.2330322265625, 1.34539794921875, 1.457763671875, 1.57012939453125, 1.6824951171875, 1.79486083984375, 1.9072265625, 2.01959228515625, 2.1319580078125, 2.24432373046875, 2.356689453125, 2.46905517578125, 2.5814208984375, 2.69378662109375, 2.80615234375, 2.91851806640625, 3.0308837890625, 3.14324951171875, 3.255615234375, 3.36798095703125, 3.4803466796875, 3.59271240234375, 3.705078125]}, "gradients/decoder.roberta.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 4.0, 8.0, 11.0, 16.0, 22.0, 14.0, 30.0, 25.0, 30.0, 31.0, 36.0, 42.0, 54.0, 55.0, 170.0, 97065.0, 950310.0, 195.0, 74.0, 39.0, 45.0, 48.0, 32.0, 28.0, 34.0, 28.0, 25.0, 14.0, 17.0, 12.0, 8.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-125.1875, -121.28515625, -117.3828125, -113.48046875, -109.578125, -105.67578125, -101.7734375, -97.87109375, -93.96875, -90.06640625, -86.1640625, -82.26171875, -78.359375, -74.45703125, -70.5546875, -66.65234375, -62.75, -58.84765625, -54.9453125, -51.04296875, -47.140625, -43.23828125, -39.3359375, -35.43359375, -31.53125, -27.62890625, -23.7265625, -19.82421875, -15.921875, -12.01953125, -8.1171875, -4.21484375, -0.3125, 3.58984375, 7.4921875, 11.39453125, 15.296875, 19.19921875, 23.1015625, 27.00390625, 30.90625, 34.80859375, 38.7109375, 42.61328125, 46.515625, 50.41796875, 54.3203125, 58.22265625, 62.125, 66.02734375, 69.9296875, 73.83203125, 77.734375, 81.63671875, 85.5390625, 89.44140625, 93.34375, 97.24609375, 101.1484375, 105.05078125, 108.953125, 112.85546875, 116.7578125, 120.66015625, 124.5625]}, "gradients/decoder.roberta.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 8.0, 5.0, 15.0, 17.0, 19.0, 14.0, 26.0, 26.0, 34.0, 32.0, 37.0, 57.0, 44.0, 46.0, 45.0, 53.0, 63.0, 48.0, 57.0, 43.0, 50.0, 33.0, 39.0, 25.0, 25.0, 32.0, 18.0, 20.0, 23.0, 15.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.3125, -4.17913818359375, -4.0457763671875, -3.91241455078125, -3.779052734375, -3.64569091796875, -3.5123291015625, -3.37896728515625, -3.24560546875, -3.11224365234375, -2.9788818359375, -2.84552001953125, -2.712158203125, -2.57879638671875, -2.4454345703125, -2.31207275390625, -2.1787109375, -2.04534912109375, -1.9119873046875, -1.77862548828125, -1.645263671875, -1.51190185546875, -1.3785400390625, -1.24517822265625, -1.11181640625, -0.97845458984375, -0.8450927734375, -0.71173095703125, -0.578369140625, -0.44500732421875, -0.3116455078125, -0.17828369140625, -0.044921875, 0.08843994140625, 0.2218017578125, 0.35516357421875, 0.488525390625, 0.62188720703125, 0.7552490234375, 0.88861083984375, 1.02197265625, 1.15533447265625, 1.2886962890625, 1.42205810546875, 1.555419921875, 1.68878173828125, 1.8221435546875, 1.95550537109375, 2.0888671875, 2.22222900390625, 2.3555908203125, 2.48895263671875, 2.622314453125, 2.75567626953125, 2.8890380859375, 3.02239990234375, 3.15576171875, 3.28912353515625, 3.4224853515625, 3.55584716796875, 3.689208984375, 3.82257080078125, 3.9559326171875, 4.08929443359375, 4.22265625]}, "gradients/decoder.roberta.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 12.0, 9.0, 14.0, 37.0, 36.0, 91.0, 185.0, 427.0, 1008.0, 4083.0, 46820.0, 825396.0, 159096.0, 8663.0, 1587.0, 540.0, 254.0, 111.0, 61.0, 34.0, 26.0, 14.0, 14.0, 9.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.14453125, -5.94427490234375, -5.7440185546875, -5.54376220703125, -5.343505859375, -5.14324951171875, -4.9429931640625, -4.74273681640625, -4.54248046875, -4.34222412109375, -4.1419677734375, -3.94171142578125, -3.741455078125, -3.54119873046875, -3.3409423828125, -3.14068603515625, -2.9404296875, -2.74017333984375, -2.5399169921875, -2.33966064453125, -2.139404296875, -1.93914794921875, -1.7388916015625, -1.53863525390625, -1.33837890625, -1.13812255859375, -0.9378662109375, -0.73760986328125, -0.537353515625, -0.33709716796875, -0.1368408203125, 0.06341552734375, 0.263671875, 0.46392822265625, 0.6641845703125, 0.86444091796875, 1.064697265625, 1.26495361328125, 1.4652099609375, 1.66546630859375, 1.86572265625, 2.06597900390625, 2.2662353515625, 2.46649169921875, 2.666748046875, 2.86700439453125, 3.0672607421875, 3.26751708984375, 3.4677734375, 3.66802978515625, 3.8682861328125, 4.06854248046875, 4.268798828125, 4.46905517578125, 4.6693115234375, 4.86956787109375, 5.06982421875, 5.27008056640625, 5.4703369140625, 5.67059326171875, 5.870849609375, 6.07110595703125, 6.2713623046875, 6.47161865234375, 6.671875]}, "gradients/decoder.roberta.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 6.0, 6.0, 5.0, 8.0, 23.0, 25.0, 35.0, 52.0, 84.0, 112.0, 142.0, 157.0, 108.0, 90.0, 57.0, 29.0, 29.0, 11.0, 9.0, 3.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031280517578125, -0.0003007948398590088, -0.0002887845039367676, -0.00027677416801452637, -0.00026476383209228516, -0.00025275349617004395, -0.00024074316024780273, -0.00022873282432556152, -0.0002167224884033203, -0.0002047121524810791, -0.0001927018165588379, -0.00018069148063659668, -0.00016868114471435547, -0.00015667080879211426, -0.00014466047286987305, -0.00013265013694763184, -0.00012063980102539062, -0.00010862946510314941, -9.66191291809082e-05, -8.460879325866699e-05, -7.259845733642578e-05, -6.058812141418457e-05, -4.857778549194336e-05, -3.656744956970215e-05, -2.4557113647460938e-05, -1.2546777725219727e-05, -5.364418029785156e-07, 1.1473894119262695e-05, 2.3484230041503906e-05, 3.549456596374512e-05, 4.750490188598633e-05, 5.951523780822754e-05, 7.152557373046875e-05, 8.353590965270996e-05, 9.554624557495117e-05, 0.00010755658149719238, 0.0001195669174194336, 0.0001315772533416748, 0.00014358758926391602, 0.00015559792518615723, 0.00016760826110839844, 0.00017961859703063965, 0.00019162893295288086, 0.00020363926887512207, 0.00021564960479736328, 0.0002276599407196045, 0.0002396702766418457, 0.0002516806125640869, 0.0002636909484863281, 0.00027570128440856934, 0.00028771162033081055, 0.00029972195625305176, 0.00031173229217529297, 0.0003237426280975342, 0.0003357529640197754, 0.0003477632999420166, 0.0003597736358642578, 0.000371783971786499, 0.00038379430770874023, 0.00039580464363098145, 0.00040781497955322266, 0.00041982531547546387, 0.0004318356513977051, 0.0004438459873199463, 0.0004558563232421875]}, "gradients/decoder.roberta.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 7.0, 13.0, 16.0, 28.0, 38.0, 70.0, 156.0, 1018.0, 396523.0, 649122.0, 1213.0, 161.0, 77.0, 42.0, 18.0, 16.0, 8.0, 4.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.09375, -21.40380859375, -20.7138671875, -20.02392578125, -19.333984375, -18.64404296875, -17.9541015625, -17.26416015625, -16.57421875, -15.88427734375, -15.1943359375, -14.50439453125, -13.814453125, -13.12451171875, -12.4345703125, -11.74462890625, -11.0546875, -10.36474609375, -9.6748046875, -8.98486328125, -8.294921875, -7.60498046875, -6.9150390625, -6.22509765625, -5.53515625, -4.84521484375, -4.1552734375, -3.46533203125, -2.775390625, -2.08544921875, -1.3955078125, -0.70556640625, -0.015625, 0.67431640625, 1.3642578125, 2.05419921875, 2.744140625, 3.43408203125, 4.1240234375, 4.81396484375, 5.50390625, 6.19384765625, 6.8837890625, 7.57373046875, 8.263671875, 8.95361328125, 9.6435546875, 10.33349609375, 11.0234375, 11.71337890625, 12.4033203125, 13.09326171875, 13.783203125, 14.47314453125, 15.1630859375, 15.85302734375, 16.54296875, 17.23291015625, 17.9228515625, 18.61279296875, 19.302734375, 19.99267578125, 20.6826171875, 21.37255859375, 22.0625]}, "gradients/decoder.roberta.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 11.0, 7.0, 31.0, 44.0, 68.0, 90.0, 127.0, 157.0, 130.0, 91.0, 87.0, 40.0, 37.0, 14.0, 10.0, 16.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.001953125, -0.9712066650390625, -0.940460205078125, -0.9097137451171875, -0.87896728515625, -0.8482208251953125, -0.817474365234375, -0.7867279052734375, -0.7559814453125, -0.7252349853515625, -0.694488525390625, -0.6637420654296875, -0.63299560546875, -0.6022491455078125, -0.571502685546875, -0.5407562255859375, -0.510009765625, -0.4792633056640625, -0.448516845703125, -0.4177703857421875, -0.38702392578125, -0.3562774658203125, -0.325531005859375, -0.2947845458984375, -0.2640380859375, -0.2332916259765625, -0.202545166015625, -0.1717987060546875, -0.14105224609375, -0.1103057861328125, -0.079559326171875, -0.0488128662109375, -0.01806640625, 0.0126800537109375, 0.043426513671875, 0.0741729736328125, 0.10491943359375, 0.1356658935546875, 0.166412353515625, 0.1971588134765625, 0.2279052734375, 0.2586517333984375, 0.289398193359375, 0.3201446533203125, 0.35089111328125, 0.3816375732421875, 0.412384033203125, 0.4431304931640625, 0.473876953125, 0.5046234130859375, 0.535369873046875, 0.5661163330078125, 0.59686279296875, 0.6276092529296875, 0.658355712890625, 0.6891021728515625, 0.7198486328125, 0.7505950927734375, 0.781341552734375, 0.8120880126953125, 0.84283447265625, 0.8735809326171875, 0.904327392578125, 0.9350738525390625, 0.9658203125]}, "gradients/decoder.roberta.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 15.0, 40.0, 96.0, 200.0, 207.0, 233.0, 136.0, 50.0, 21.0, 11.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.380996704101562, -20.922285079956055, -20.463571548461914, -20.004859924316406, -19.5461483001709, -19.087434768676758, -18.62872314453125, -18.17000961303711, -17.7112979888916, -17.252586364746094, -16.793872833251953, -16.335161209106445, -15.876448631286621, -15.417736053466797, -14.959024429321289, -14.500311851501465, -14.04159927368164, -13.582886695861816, -13.124175071716309, -12.665462493896484, -12.20674991607666, -11.748037338256836, -11.289325714111328, -10.830613136291504, -10.371901512145996, -9.913188934326172, -9.454477310180664, -8.99576473236084, -8.537052154541016, -8.078340530395508, -7.619627952575684, -7.160915374755859, -6.702203273773193, -6.243491172790527, -5.784778594970703, -5.326066493988037, -4.867353916168213, -4.408641815185547, -3.9499294757843018, -3.4912171363830566, -3.0325047969818115, -2.5737924575805664, -2.1150801181793213, -1.6563678979873657, -1.1976555585861206, -0.738943338394165, -0.2802309989929199, 0.1784813404083252, 0.6371936798095703, 1.0959060192108154, 1.5546183586120605, 2.0133304595947266, 2.472043037414551, 2.930755138397217, 3.389467477798462, 3.848179817199707, 4.306892395019531, 4.765604496002197, 5.2243170738220215, 5.6830291748046875, 6.141741752624512, 6.600453853607178, 7.059165954589844, 7.517878532409668, 7.976590633392334]}, "gradients/decoder.roberta.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 16.0, 12.0, 10.0, 12.0, 15.0, 7.0, 18.0, 33.0, 26.0, 25.0, 29.0, 38.0, 48.0, 45.0, 43.0, 51.0, 53.0, 53.0, 39.0, 43.0, 37.0, 52.0, 43.0, 27.0, 32.0, 28.0, 24.0, 26.0, 14.0, 16.0, 17.0, 11.0, 10.0, 15.0, 4.0, 6.0, 2.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.370461463928223, -6.167806148529053, -5.965150833129883, -5.762495517730713, -5.559840202331543, -5.357184410095215, -5.154529094696045, -4.951873779296875, -4.749218463897705, -4.546563148498535, -4.343907833099365, -4.141252517700195, -3.9385969638824463, -3.7359416484832764, -3.5332860946655273, -3.3306307792663574, -3.1279754638671875, -2.9253201484680176, -2.7226648330688477, -2.5200092792510986, -2.3173539638519287, -2.114698648452759, -1.9120432138442993, -1.7093877792358398, -1.50673246383667, -1.3040771484375, -1.1014217138290405, -0.8987663388252258, -0.6961109638214111, -0.4934556484222412, -0.29080021381378174, -0.08814477920532227, 0.11451101303100586, 0.31716638803482056, 0.5198217630386353, 0.72247713804245, 0.9251325130462646, 1.1277878284454346, 1.330443263053894, 1.5330986976623535, 1.7357540130615234, 1.9384093284606934, 2.1410646438598633, 2.3437201976776123, 2.5463755130767822, 2.749030828475952, 2.951686382293701, 3.154341697692871, 3.356997013092041, 3.559652328491211, 3.762307643890381, 3.96496319770813, 4.167618751525879, 4.370273590087891, 4.572929382324219, 4.775584697723389, 4.978240013122559, 5.1808953285217285, 5.383550643920898, 5.586205959320068, 5.788861274719238, 5.991517066955566, 6.194172382354736, 6.396827697753906, 6.599483013153076]}, "gradients/decoder.roberta.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 5.0, 13.0, 15.0, 11.0, 22.0, 32.0, 36.0, 54.0, 77.0, 94.0, 152.0, 409.0, 1036.0, 3692.0, 21269.0, 412675.0, 3202712.0, 518995.0, 26547.0, 4219.0, 1202.0, 423.0, 226.0, 113.0, 70.0, 49.0, 32.0, 21.0, 22.0, 13.0, 21.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.90625, -14.5194091796875, -14.132568359375, -13.7457275390625, -13.35888671875, -12.9720458984375, -12.585205078125, -12.1983642578125, -11.8115234375, -11.4246826171875, -11.037841796875, -10.6510009765625, -10.26416015625, -9.8773193359375, -9.490478515625, -9.1036376953125, -8.716796875, -8.3299560546875, -7.943115234375, -7.5562744140625, -7.16943359375, -6.7825927734375, -6.395751953125, -6.0089111328125, -5.6220703125, -5.2352294921875, -4.848388671875, -4.4615478515625, -4.07470703125, -3.6878662109375, -3.301025390625, -2.9141845703125, -2.52734375, -2.1405029296875, -1.753662109375, -1.3668212890625, -0.97998046875, -0.5931396484375, -0.206298828125, 0.1805419921875, 0.5673828125, 0.9542236328125, 1.341064453125, 1.7279052734375, 2.11474609375, 2.5015869140625, 2.888427734375, 3.2752685546875, 3.662109375, 4.0489501953125, 4.435791015625, 4.8226318359375, 5.20947265625, 5.5963134765625, 5.983154296875, 6.3699951171875, 6.7568359375, 7.1436767578125, 7.530517578125, 7.9173583984375, 8.30419921875, 8.6910400390625, 9.077880859375, 9.4647216796875, 9.8515625]}, "gradients/decoder.roberta.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 7.0, 6.0, 13.0, 12.0, 17.0, 21.0, 24.0, 13.0, 28.0, 30.0, 37.0, 39.0, 43.0, 40.0, 37.0, 40.0, 48.0, 56.0, 46.0, 50.0, 42.0, 43.0, 29.0, 33.0, 31.0, 35.0, 33.0, 29.0, 17.0, 14.0, 18.0, 11.0, 9.0, 8.0, 5.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.1796875, -5.03363037109375, -4.8875732421875, -4.74151611328125, -4.595458984375, -4.44940185546875, -4.3033447265625, -4.15728759765625, -4.01123046875, -3.86517333984375, -3.7191162109375, -3.57305908203125, -3.427001953125, -3.28094482421875, -3.1348876953125, -2.98883056640625, -2.8427734375, -2.69671630859375, -2.5506591796875, -2.40460205078125, -2.258544921875, -2.11248779296875, -1.9664306640625, -1.82037353515625, -1.67431640625, -1.52825927734375, -1.3822021484375, -1.23614501953125, -1.090087890625, -0.94403076171875, -0.7979736328125, -0.65191650390625, -0.505859375, -0.35980224609375, -0.2137451171875, -0.06768798828125, 0.078369140625, 0.22442626953125, 0.3704833984375, 0.51654052734375, 0.66259765625, 0.80865478515625, 0.9547119140625, 1.10076904296875, 1.246826171875, 1.39288330078125, 1.5389404296875, 1.68499755859375, 1.8310546875, 1.97711181640625, 2.1231689453125, 2.26922607421875, 2.415283203125, 2.56134033203125, 2.7073974609375, 2.85345458984375, 2.99951171875, 3.14556884765625, 3.2916259765625, 3.43768310546875, 3.583740234375, 3.72979736328125, 3.8758544921875, 4.02191162109375, 4.16796875]}, "gradients/decoder.roberta.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 8.0, 13.0, 16.0, 11.0, 20.0, 29.0, 55.0, 63.0, 91.0, 92.0, 166.0, 241.0, 380.0, 826.0, 39154.0, 4149049.0, 2572.0, 483.0, 274.0, 175.0, 143.0, 97.0, 74.0, 64.0, 54.0, 27.0, 20.0, 16.0, 15.0, 8.0, 13.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.03125, -53.15185546875, -51.2724609375, -49.39306640625, -47.513671875, -45.63427734375, -43.7548828125, -41.87548828125, -39.99609375, -38.11669921875, -36.2373046875, -34.35791015625, -32.478515625, -30.59912109375, -28.7197265625, -26.84033203125, -24.9609375, -23.08154296875, -21.2021484375, -19.32275390625, -17.443359375, -15.56396484375, -13.6845703125, -11.80517578125, -9.92578125, -8.04638671875, -6.1669921875, -4.28759765625, -2.408203125, -0.52880859375, 1.3505859375, 3.22998046875, 5.109375, 6.98876953125, 8.8681640625, 10.74755859375, 12.626953125, 14.50634765625, 16.3857421875, 18.26513671875, 20.14453125, 22.02392578125, 23.9033203125, 25.78271484375, 27.662109375, 29.54150390625, 31.4208984375, 33.30029296875, 35.1796875, 37.05908203125, 38.9384765625, 40.81787109375, 42.697265625, 44.57666015625, 46.4560546875, 48.33544921875, 50.21484375, 52.09423828125, 53.9736328125, 55.85302734375, 57.732421875, 59.61181640625, 61.4912109375, 63.37060546875, 65.25]}, "gradients/decoder.roberta.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 9.0, 13.0, 13.0, 12.0, 15.0, 24.0, 34.0, 47.0, 62.0, 71.0, 110.0, 120.0, 168.0, 240.0, 307.0, 407.0, 457.0, 421.0, 375.0, 315.0, 230.0, 164.0, 103.0, 87.0, 70.0, 55.0, 36.0, 18.0, 20.0, 12.0, 15.0, 9.0, 7.0, 5.0, 3.0, 4.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.03900146484375, -1.9705810546875, -1.90216064453125, -1.833740234375, -1.76531982421875, -1.6968994140625, -1.62847900390625, -1.56005859375, -1.49163818359375, -1.4232177734375, -1.35479736328125, -1.286376953125, -1.21795654296875, -1.1495361328125, -1.08111572265625, -1.0126953125, -0.94427490234375, -0.8758544921875, -0.80743408203125, -0.739013671875, -0.67059326171875, -0.6021728515625, -0.53375244140625, -0.46533203125, -0.39691162109375, -0.3284912109375, -0.26007080078125, -0.191650390625, -0.12322998046875, -0.0548095703125, 0.01361083984375, 0.08203125, 0.15045166015625, 0.2188720703125, 0.28729248046875, 0.355712890625, 0.42413330078125, 0.4925537109375, 0.56097412109375, 0.62939453125, 0.69781494140625, 0.7662353515625, 0.83465576171875, 0.903076171875, 0.97149658203125, 1.0399169921875, 1.10833740234375, 1.1767578125, 1.24517822265625, 1.3135986328125, 1.38201904296875, 1.450439453125, 1.51885986328125, 1.5872802734375, 1.65570068359375, 1.72412109375, 1.79254150390625, 1.8609619140625, 1.92938232421875, 1.997802734375, 2.06622314453125, 2.1346435546875, 2.20306396484375, 2.271484375]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 15.0, 30.0, 27.0, 45.0, 88.0, 97.0, 131.0, 116.0, 131.0, 109.0, 75.0, 48.0, 36.0, 23.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-10.470205307006836, -10.259299278259277, -10.048394203186035, -9.837488174438477, -9.626583099365234, -9.415677070617676, -9.204771995544434, -8.993865966796875, -8.782960891723633, -8.572054862976074, -8.361149787902832, -8.150243759155273, -7.939338684082031, -7.728432655334473, -7.517527103424072, -7.306621551513672, -7.095715522766113, -6.884809970855713, -6.6739044189453125, -6.462998867034912, -6.252093315124512, -6.041187286376953, -5.830281734466553, -5.619376182556152, -5.408470630645752, -5.197565078735352, -4.986659526824951, -4.775753974914551, -4.564847946166992, -4.35394287109375, -4.143036842346191, -3.932131290435791, -3.7212255001068115, -3.510319948196411, -3.2994141578674316, -3.0885086059570312, -2.877603054046631, -2.6666975021362305, -2.45579195022583, -2.2448861598968506, -2.03398060798645, -1.8230750560760498, -1.6121693849563599, -1.40126371383667, -1.1903581619262695, -0.9794526100158691, -0.7685469388961792, -0.5576412677764893, -0.34673571586608887, -0.1358301043510437, 0.07507550716400146, 0.28598111867904663, 0.4968867301940918, 0.7077922821044922, 0.9186979532241821, 1.129603624343872, 1.3405091762542725, 1.5514147281646729, 1.7623203992843628, 1.9732260704040527, 2.184131622314453, 2.3950371742248535, 2.605942726135254, 2.8168485164642334, 3.027754068374634]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 3.0, 5.0, 9.0, 9.0, 11.0, 14.0, 7.0, 15.0, 20.0, 17.0, 15.0, 23.0, 29.0, 30.0, 41.0, 34.0, 38.0, 33.0, 33.0, 53.0, 41.0, 46.0, 31.0, 38.0, 35.0, 38.0, 39.0, 33.0, 20.0, 28.0, 24.0, 23.0, 25.0, 19.0, 12.0, 23.0, 20.0, 8.0, 10.0, 10.0, 6.0, 7.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.79621696472168, -4.654570579528809, -4.5129241943359375, -4.371277332305908, -4.229630947113037, -4.087984561920166, -3.946337938308716, -3.8046913146972656, -3.6630449295043945, -3.5213985443115234, -3.3797519207000732, -3.238105297088623, -3.096458911895752, -2.954812526702881, -2.8131659030914307, -2.6715192794799805, -2.5298728942871094, -2.3882265090942383, -2.246579885482788, -2.104933261871338, -1.9632868766784668, -1.8216403722763062, -1.6799938678741455, -1.5383473634719849, -1.3967008590698242, -1.2550543546676636, -1.113407850265503, -0.9717613458633423, -0.8301148414611816, -0.688468337059021, -0.5468218326568604, -0.4051753282546997, -0.26352834701538086, -0.12188184261322021, 0.01976466178894043, 0.16141116619110107, 0.3030576705932617, 0.44470417499542236, 0.586350679397583, 0.7279971837997437, 0.8696436882019043, 1.011290192604065, 1.1529366970062256, 1.2945832014083862, 1.4362297058105469, 1.5778762102127075, 1.7195227146148682, 1.8611692190170288, 2.0028157234191895, 2.1444621086120605, 2.2861087322235107, 2.427755355834961, 2.569401741027832, 2.711048126220703, 2.8526947498321533, 2.9943413734436035, 3.1359877586364746, 3.2776341438293457, 3.419280767440796, 3.560927391052246, 3.702573776245117, 3.8442201614379883, 3.9858667850494385, 4.127513408660889, 4.26915979385376]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 4.0, 3.0, 4.0, 6.0, 20.0, 25.0, 16.0, 43.0, 77.0, 90.0, 118.0, 181.0, 269.0, 383.0, 552.0, 838.0, 1251.0, 1791.0, 2906.0, 4451.0, 6949.0, 11750.0, 19142.0, 33281.0, 60075.0, 115371.0, 217417.0, 249560.0, 145973.0, 74894.0, 40756.0, 23132.0, 13862.0, 8412.0, 5176.0, 3230.0, 2092.0, 1433.0, 979.0, 638.0, 444.0, 301.0, 221.0, 125.0, 98.0, 74.0, 57.0, 30.0, 18.0, 18.0, 13.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.09765625, -1.0655364990234375, -1.033416748046875, -1.0012969970703125, -0.96917724609375, -0.9370574951171875, -0.904937744140625, -0.8728179931640625, -0.8406982421875, -0.8085784912109375, -0.776458740234375, -0.7443389892578125, -0.71221923828125, -0.6800994873046875, -0.647979736328125, -0.6158599853515625, -0.583740234375, -0.5516204833984375, -0.519500732421875, -0.4873809814453125, -0.45526123046875, -0.4231414794921875, -0.391021728515625, -0.3589019775390625, -0.3267822265625, -0.2946624755859375, -0.262542724609375, -0.2304229736328125, -0.19830322265625, -0.1661834716796875, -0.134063720703125, -0.1019439697265625, -0.06982421875, -0.0377044677734375, -0.005584716796875, 0.0265350341796875, 0.05865478515625, 0.0907745361328125, 0.122894287109375, 0.1550140380859375, 0.1871337890625, 0.2192535400390625, 0.251373291015625, 0.2834930419921875, 0.31561279296875, 0.3477325439453125, 0.379852294921875, 0.4119720458984375, 0.444091796875, 0.4762115478515625, 0.508331298828125, 0.5404510498046875, 0.57257080078125, 0.6046905517578125, 0.636810302734375, 0.6689300537109375, 0.7010498046875, 0.7331695556640625, 0.765289306640625, 0.7974090576171875, 0.82952880859375, 0.8616485595703125, 0.893768310546875, 0.9258880615234375, 0.9580078125]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 3.0, 7.0, 8.0, 9.0, 9.0, 16.0, 7.0, 16.0, 17.0, 20.0, 18.0, 21.0, 28.0, 37.0, 34.0, 35.0, 39.0, 29.0, 37.0, 52.0, 41.0, 45.0, 36.0, 32.0, 38.0, 37.0, 39.0, 29.0, 21.0, 29.0, 22.0, 25.0, 26.0, 17.0, 13.0, 22.0, 20.0, 9.0, 8.0, 11.0, 7.0, 3.0, 9.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.43359375, -4.29638671875, -4.1591796875, -4.02197265625, -3.884765625, -3.74755859375, -3.6103515625, -3.47314453125, -3.3359375, -3.19873046875, -3.0615234375, -2.92431640625, -2.787109375, -2.64990234375, -2.5126953125, -2.37548828125, -2.23828125, -2.10107421875, -1.9638671875, -1.82666015625, -1.689453125, -1.55224609375, -1.4150390625, -1.27783203125, -1.140625, -1.00341796875, -0.8662109375, -0.72900390625, -0.591796875, -0.45458984375, -0.3173828125, -0.18017578125, -0.04296875, 0.09423828125, 0.2314453125, 0.36865234375, 0.505859375, 0.64306640625, 0.7802734375, 0.91748046875, 1.0546875, 1.19189453125, 1.3291015625, 1.46630859375, 1.603515625, 1.74072265625, 1.8779296875, 2.01513671875, 2.15234375, 2.28955078125, 2.4267578125, 2.56396484375, 2.701171875, 2.83837890625, 2.9755859375, 3.11279296875, 3.25, 3.38720703125, 3.5244140625, 3.66162109375, 3.798828125, 3.93603515625, 4.0732421875, 4.21044921875, 4.34765625]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 4.0, 4.0, 6.0, 3.0, 5.0, 12.0, 12.0, 18.0, 17.0, 22.0, 46.0, 51.0, 65.0, 86.0, 110.0, 153.0, 228.0, 297.0, 494.0, 737.0, 1196.0, 2166.0, 4655.0, 12285.0, 45292.0, 922308.0, 37934.0, 10767.0, 4229.0, 2028.0, 1094.0, 705.0, 418.0, 325.0, 199.0, 141.0, 103.0, 89.0, 62.0, 48.0, 41.0, 28.0, 17.0, 14.0, 5.0, 9.0, 6.0, 3.0, 3.0, 9.0, 4.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.0955810546875, -2.993896484375, -2.8922119140625, -2.79052734375, -2.6888427734375, -2.587158203125, -2.4854736328125, -2.3837890625, -2.2821044921875, -2.180419921875, -2.0787353515625, -1.97705078125, -1.8753662109375, -1.773681640625, -1.6719970703125, -1.5703125, -1.4686279296875, -1.366943359375, -1.2652587890625, -1.16357421875, -1.0618896484375, -0.960205078125, -0.8585205078125, -0.7568359375, -0.6551513671875, -0.553466796875, -0.4517822265625, -0.35009765625, -0.2484130859375, -0.146728515625, -0.0450439453125, 0.056640625, 0.1583251953125, 0.260009765625, 0.3616943359375, 0.46337890625, 0.5650634765625, 0.666748046875, 0.7684326171875, 0.8701171875, 0.9718017578125, 1.073486328125, 1.1751708984375, 1.27685546875, 1.3785400390625, 1.480224609375, 1.5819091796875, 1.68359375, 1.7852783203125, 1.886962890625, 1.9886474609375, 2.09033203125, 2.1920166015625, 2.293701171875, 2.3953857421875, 2.4970703125, 2.5987548828125, 2.700439453125, 2.8021240234375, 2.90380859375, 3.0054931640625, 3.107177734375, 3.2088623046875, 3.310546875]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 7.0, 4.0, 10.0, 18.0, 15.0, 15.0, 15.0, 22.0, 32.0, 23.0, 27.0, 44.0, 51.0, 33.0, 41.0, 48.0, 33.0, 59.0, 64.0, 41.0, 46.0, 35.0, 45.0, 36.0, 28.0, 37.0, 37.0, 21.0, 28.0, 21.0, 13.0, 4.0, 10.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.81005859375, -3.7021484375, -3.59423828125, -3.486328125, -3.37841796875, -3.2705078125, -3.16259765625, -3.0546875, -2.94677734375, -2.8388671875, -2.73095703125, -2.623046875, -2.51513671875, -2.4072265625, -2.29931640625, -2.19140625, -2.08349609375, -1.9755859375, -1.86767578125, -1.759765625, -1.65185546875, -1.5439453125, -1.43603515625, -1.328125, -1.22021484375, -1.1123046875, -1.00439453125, -0.896484375, -0.78857421875, -0.6806640625, -0.57275390625, -0.46484375, -0.35693359375, -0.2490234375, -0.14111328125, -0.033203125, 0.07470703125, 0.1826171875, 0.29052734375, 0.3984375, 0.50634765625, 0.6142578125, 0.72216796875, 0.830078125, 0.93798828125, 1.0458984375, 1.15380859375, 1.26171875, 1.36962890625, 1.4775390625, 1.58544921875, 1.693359375, 1.80126953125, 1.9091796875, 2.01708984375, 2.125, 2.23291015625, 2.3408203125, 2.44873046875, 2.556640625, 2.66455078125, 2.7724609375, 2.88037109375, 2.98828125]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 9.0, 10.0, 10.0, 10.0, 19.0, 34.0, 42.0, 59.0, 106.0, 139.0, 252.0, 453.0, 890.0, 2028.0, 5770.0, 32305.0, 979555.0, 19225.0, 4318.0, 1541.0, 762.0, 367.0, 208.0, 157.0, 91.0, 54.0, 44.0, 26.0, 16.0, 20.0, 12.0, 4.0, 8.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.496337890625, -0.48101043701171875, -0.4656829833984375, -0.45035552978515625, -0.435028076171875, -0.41970062255859375, -0.4043731689453125, -0.38904571533203125, -0.37371826171875, -0.35839080810546875, -0.3430633544921875, -0.32773590087890625, -0.312408447265625, -0.29708099365234375, -0.2817535400390625, -0.26642608642578125, -0.2510986328125, -0.23577117919921875, -0.2204437255859375, -0.20511627197265625, -0.189788818359375, -0.17446136474609375, -0.1591339111328125, -0.14380645751953125, -0.12847900390625, -0.11315155029296875, -0.0978240966796875, -0.08249664306640625, -0.067169189453125, -0.05184173583984375, -0.0365142822265625, -0.02118682861328125, -0.005859375, 0.00946807861328125, 0.0247955322265625, 0.04012298583984375, 0.055450439453125, 0.07077789306640625, 0.0861053466796875, 0.10143280029296875, 0.11676025390625, 0.13208770751953125, 0.1474151611328125, 0.16274261474609375, 0.178070068359375, 0.19339752197265625, 0.2087249755859375, 0.22405242919921875, 0.2393798828125, 0.25470733642578125, 0.2700347900390625, 0.28536224365234375, 0.300689697265625, 0.31601715087890625, 0.3313446044921875, 0.34667205810546875, 0.36199951171875, 0.37732696533203125, 0.3926544189453125, 0.40798187255859375, 0.423309326171875, 0.43863677978515625, 0.4539642333984375, 0.46929168701171875, 0.484619140625]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 8.0, 5.0, 8.0, 13.0, 21.0, 18.0, 27.0, 29.0, 30.0, 35.0, 56.0, 37.0, 61.0, 63.0, 69.0, 57.0, 67.0, 41.0, 63.0, 57.0, 42.0, 38.0, 16.0, 16.0, 25.0, 19.0, 17.0, 9.0, 5.0, 5.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.4318695068359375e-05, -2.3550353944301605e-05, -2.2782012820243835e-05, -2.2013671696186066e-05, -2.1245330572128296e-05, -2.0476989448070526e-05, -1.9708648324012756e-05, -1.8940307199954987e-05, -1.8171966075897217e-05, -1.7403624951839447e-05, -1.6635283827781677e-05, -1.5866942703723907e-05, -1.5098601579666138e-05, -1.4330260455608368e-05, -1.3561919331550598e-05, -1.2793578207492828e-05, -1.2025237083435059e-05, -1.1256895959377289e-05, -1.0488554835319519e-05, -9.72021371126175e-06, -8.95187258720398e-06, -8.18353146314621e-06, -7.41519033908844e-06, -6.64684921503067e-06, -5.8785080909729e-06, -5.110166966915131e-06, -4.341825842857361e-06, -3.573484718799591e-06, -2.8051435947418213e-06, -2.0368024706840515e-06, -1.2684613466262817e-06, -5.00120222568512e-07, 2.682209014892578e-07, 1.0365620255470276e-06, 1.8049031496047974e-06, 2.573244273662567e-06, 3.341585397720337e-06, 4.109926521778107e-06, 4.8782676458358765e-06, 5.646608769893646e-06, 6.414949893951416e-06, 7.183291018009186e-06, 7.951632142066956e-06, 8.719973266124725e-06, 9.488314390182495e-06, 1.0256655514240265e-05, 1.1024996638298035e-05, 1.1793337762355804e-05, 1.2561678886413574e-05, 1.3330020010471344e-05, 1.4098361134529114e-05, 1.4866702258586884e-05, 1.5635043382644653e-05, 1.6403384506702423e-05, 1.7171725630760193e-05, 1.7940066754817963e-05, 1.8708407878875732e-05, 1.9476749002933502e-05, 2.0245090126991272e-05, 2.1013431251049042e-05, 2.178177237510681e-05, 2.255011349916458e-05, 2.331845462322235e-05, 2.408679574728012e-05, 2.485513687133789e-05]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 7.0, 6.0, 2.0, 7.0, 13.0, 12.0, 21.0, 20.0, 27.0, 36.0, 46.0, 80.0, 193.0, 882.0, 213050.0, 832175.0, 1435.0, 197.0, 89.0, 55.0, 31.0, 27.0, 15.0, 13.0, 17.0, 13.0, 14.0, 11.0, 10.0, 4.0, 8.0, 5.0, 3.0, 10.0, 3.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.86376953125, -0.8350601196289062, -0.8063507080078125, -0.7776412963867188, -0.748931884765625, -0.7202224731445312, -0.6915130615234375, -0.6628036499023438, -0.63409423828125, -0.6053848266601562, -0.5766754150390625, -0.5479660034179688, -0.519256591796875, -0.49054718017578125, -0.4618377685546875, -0.43312835693359375, -0.4044189453125, -0.37570953369140625, -0.3470001220703125, -0.31829071044921875, -0.289581298828125, -0.26087188720703125, -0.2321624755859375, -0.20345306396484375, -0.17474365234375, -0.14603424072265625, -0.1173248291015625, -0.08861541748046875, -0.059906005859375, -0.03119659423828125, -0.0024871826171875, 0.02622222900390625, 0.054931640625, 0.08364105224609375, 0.1123504638671875, 0.14105987548828125, 0.169769287109375, 0.19847869873046875, 0.2271881103515625, 0.25589752197265625, 0.28460693359375, 0.31331634521484375, 0.3420257568359375, 0.37073516845703125, 0.399444580078125, 0.42815399169921875, 0.4568634033203125, 0.48557281494140625, 0.5142822265625, 0.5429916381835938, 0.5717010498046875, 0.6004104614257812, 0.629119873046875, 0.6578292846679688, 0.6865386962890625, 0.7152481079101562, 0.74395751953125, 0.7726669311523438, 0.8013763427734375, 0.8300857543945312, 0.858795166015625, 0.8875045776367188, 0.9162139892578125, 0.9449234008789062, 0.9736328125]}, "gradients/decoder.roberta.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 3.0, 8.0, 8.0, 12.0, 12.0, 16.0, 10.0, 15.0, 16.0, 20.0, 24.0, 37.0, 48.0, 62.0, 80.0, 109.0, 108.0, 73.0, 62.0, 61.0, 34.0, 32.0, 24.0, 23.0, 19.0, 14.0, 12.0, 8.0, 4.0, 7.0, 3.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03778076171875, -0.03663825988769531, -0.035495758056640625, -0.03435325622558594, -0.03321075439453125, -0.03206825256347656, -0.030925750732421875, -0.029783248901367188, -0.0286407470703125, -0.027498245239257812, -0.026355743408203125, -0.025213241577148438, -0.02407073974609375, -0.022928237915039062, -0.021785736083984375, -0.020643234252929688, -0.019500732421875, -0.018358230590820312, -0.017215728759765625, -0.016073226928710938, -0.01493072509765625, -0.013788223266601562, -0.012645721435546875, -0.011503219604492188, -0.0103607177734375, -0.009218215942382812, -0.008075714111328125, -0.0069332122802734375, -0.00579071044921875, -0.0046482086181640625, -0.003505706787109375, -0.0023632049560546875, -0.001220703125, -7.82012939453125e-05, 0.001064300537109375, 0.0022068023681640625, 0.00334930419921875, 0.0044918060302734375, 0.005634307861328125, 0.0067768096923828125, 0.0079193115234375, 0.009061813354492188, 0.010204315185546875, 0.011346817016601562, 0.01248931884765625, 0.013631820678710938, 0.014774322509765625, 0.015916824340820312, 0.017059326171875, 0.018201828002929688, 0.019344329833984375, 0.020486831665039062, 0.02162933349609375, 0.022771835327148438, 0.023914337158203125, 0.025056838989257812, 0.0261993408203125, 0.027341842651367188, 0.028484344482421875, 0.029626846313476562, 0.03076934814453125, 0.03191184997558594, 0.033054351806640625, 0.03419685363769531, 0.03533935546875]}, "gradients/decoder.roberta.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 11.0, 49.0, 89.0, 209.0, 246.0, 232.0, 108.0, 44.0, 12.0, 12.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.341146469116211, -7.915674209594727, -7.490201473236084, -7.0647292137146, -6.639256477355957, -6.213784217834473, -5.788311958312988, -5.362839221954346, -4.937366485595703, -4.511894226074219, -4.086421489715576, -3.660949230194092, -3.235476493835449, -2.810004234313965, -2.3845317363739014, -1.959059238433838, -1.5335869789123535, -1.10811448097229, -0.6826420426368713, -0.25716960430145264, 0.16830289363861084, 0.5937752723693848, 1.0192477703094482, 1.4447202682495117, 1.8701927661895752, 2.2956652641296387, 2.721137762069702, 3.1466102600097656, 3.57208251953125, 3.9975550174713135, 4.423027515411377, 4.8485002517700195, 5.273972511291504, 5.699444770812988, 6.124917507171631, 6.550389766693115, 6.975862503051758, 7.401334762573242, 7.826807022094727, 8.252279281616211, 8.677752494812012, 9.103224754333496, 9.52869701385498, 9.954170227050781, 10.379642486572266, 10.80511474609375, 11.230587005615234, 11.656059265136719, 12.081531524658203, 12.507003784179688, 12.932476043701172, 13.357949256896973, 13.783421516418457, 14.208893775939941, 14.634366035461426, 15.059839248657227, 15.485311508178711, 15.910783767700195, 16.33625602722168, 16.761728286743164, 17.18720054626465, 17.612674713134766, 18.03814697265625, 18.463619232177734, 18.88909149169922]}, "gradients/decoder.roberta.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 2.0, 7.0, 9.0, 8.0, 10.0, 15.0, 6.0, 18.0, 16.0, 21.0, 18.0, 20.0, 29.0, 36.0, 34.0, 35.0, 40.0, 29.0, 37.0, 51.0, 41.0, 46.0, 36.0, 33.0, 36.0, 38.0, 37.0, 30.0, 23.0, 27.0, 24.0, 24.0, 24.0, 17.0, 14.0, 22.0, 20.0, 9.0, 9.0, 10.0, 6.0, 4.0, 9.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.428088188171387, -4.290980339050293, -4.153872013092041, -4.016764163970947, -3.8796558380126953, -3.7425479888916016, -3.6054399013519287, -3.468331813812256, -3.331223726272583, -3.19411563873291, -3.0570075511932373, -2.9198994636535645, -2.7827916145324707, -2.6456832885742188, -2.508575439453125, -2.371467351913452, -2.2343592643737793, -2.0972511768341064, -1.9601430892944336, -1.8230351209640503, -1.6859270334243774, -1.5488189458847046, -1.4117109775543213, -1.2746028900146484, -1.1374948024749756, -1.0003867149353027, -0.8632786870002747, -0.7261706590652466, -0.5890625715255737, -0.4519544839859009, -0.3148464560508728, -0.17773842811584473, -0.04062986373901367, 0.09647819399833679, 0.23358625173568726, 0.3706943094730377, 0.5078023672103882, 0.644910454750061, 0.7820184826850891, 0.9191265106201172, 1.05623459815979, 1.193342685699463, 1.3304507732391357, 1.467558741569519, 1.604666829109192, 1.7417749166488647, 1.878882884979248, 2.015990972518921, 2.1530990600585938, 2.2902071475982666, 2.4273152351379395, 2.5644233226776123, 2.701531410217285, 2.838639259338379, 2.9757473468780518, 3.1128554344177246, 3.2499635219573975, 3.3870716094970703, 3.524179697036743, 3.661287784576416, 3.7983956336975098, 3.9355039596557617, 4.0726118087768555, 4.209719657897949, 4.346827983856201]}, "gradients/decoder.roberta.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 1.0, 5.0, 7.0, 8.0, 11.0, 13.0, 18.0, 31.0, 49.0, 61.0, 89.0, 106.0, 150.0, 197.0, 317.0, 443.0, 667.0, 1089.0, 1785.0, 3183.0, 5748.0, 10583.0, 18530.0, 33003.0, 55480.0, 89474.0, 149522.0, 260011.0, 171404.0, 99212.0, 61906.0, 36884.0, 21102.0, 11931.0, 6387.0, 3613.0, 2019.0, 1214.0, 704.0, 453.0, 342.0, 235.0, 169.0, 125.0, 64.0, 72.0, 40.0, 35.0, 21.0, 20.0, 13.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.90234375, -3.77484130859375, -3.6473388671875, -3.51983642578125, -3.392333984375, -3.26483154296875, -3.1373291015625, -3.00982666015625, -2.88232421875, -2.75482177734375, -2.6273193359375, -2.49981689453125, -2.372314453125, -2.24481201171875, -2.1173095703125, -1.98980712890625, -1.8623046875, -1.73480224609375, -1.6072998046875, -1.47979736328125, -1.352294921875, -1.22479248046875, -1.0972900390625, -0.96978759765625, -0.84228515625, -0.71478271484375, -0.5872802734375, -0.45977783203125, -0.332275390625, -0.20477294921875, -0.0772705078125, 0.05023193359375, 0.177734375, 0.30523681640625, 0.4327392578125, 0.56024169921875, 0.687744140625, 0.81524658203125, 0.9427490234375, 1.07025146484375, 1.19775390625, 1.32525634765625, 1.4527587890625, 1.58026123046875, 1.707763671875, 1.83526611328125, 1.9627685546875, 2.09027099609375, 2.2177734375, 2.34527587890625, 2.4727783203125, 2.60028076171875, 2.727783203125, 2.85528564453125, 2.9827880859375, 3.11029052734375, 3.23779296875, 3.36529541015625, 3.4927978515625, 3.62030029296875, 3.747802734375, 3.87530517578125, 4.0028076171875, 4.13031005859375, 4.2578125]}, "gradients/decoder.roberta.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 7.0, 6.0, 17.0, 11.0, 15.0, 9.0, 14.0, 19.0, 16.0, 23.0, 26.0, 28.0, 38.0, 33.0, 37.0, 48.0, 32.0, 39.0, 40.0, 43.0, 38.0, 42.0, 39.0, 36.0, 38.0, 37.0, 24.0, 17.0, 25.0, 19.0, 27.0, 21.0, 12.0, 21.0, 18.0, 16.0, 9.0, 9.0, 10.0, 9.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.05078125, -2.957489013671875, -2.86419677734375, -2.770904541015625, -2.6776123046875, -2.584320068359375, -2.49102783203125, -2.397735595703125, -2.304443359375, -2.211151123046875, -2.11785888671875, -2.024566650390625, -1.9312744140625, -1.837982177734375, -1.74468994140625, -1.651397705078125, -1.55810546875, -1.464813232421875, -1.37152099609375, -1.278228759765625, -1.1849365234375, -1.091644287109375, -0.99835205078125, -0.905059814453125, -0.811767578125, -0.718475341796875, -0.62518310546875, -0.531890869140625, -0.4385986328125, -0.345306396484375, -0.25201416015625, -0.158721923828125, -0.0654296875, 0.027862548828125, 0.12115478515625, 0.214447021484375, 0.3077392578125, 0.401031494140625, 0.49432373046875, 0.587615966796875, 0.680908203125, 0.774200439453125, 0.86749267578125, 0.960784912109375, 1.0540771484375, 1.147369384765625, 1.24066162109375, 1.333953857421875, 1.42724609375, 1.520538330078125, 1.61383056640625, 1.707122802734375, 1.8004150390625, 1.893707275390625, 1.98699951171875, 2.080291748046875, 2.173583984375, 2.266876220703125, 2.36016845703125, 2.453460693359375, 2.5467529296875, 2.640045166015625, 2.73333740234375, 2.826629638671875, 2.919921875]}, "gradients/decoder.roberta.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 9.0, 5.0, 11.0, 15.0, 13.0, 17.0, 21.0, 29.0, 22.0, 30.0, 31.0, 41.0, 39.0, 57.0, 66.0, 168.0, 607.0, 771580.0, 274665.0, 547.0, 142.0, 73.0, 43.0, 38.0, 36.0, 36.0, 26.0, 30.0, 28.0, 14.0, 29.0, 12.0, 7.0, 10.0, 7.0, 8.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.375, -71.9716796875, -69.568359375, -67.1650390625, -64.76171875, -62.3583984375, -59.955078125, -57.5517578125, -55.1484375, -52.7451171875, -50.341796875, -47.9384765625, -45.53515625, -43.1318359375, -40.728515625, -38.3251953125, -35.921875, -33.5185546875, -31.115234375, -28.7119140625, -26.30859375, -23.9052734375, -21.501953125, -19.0986328125, -16.6953125, -14.2919921875, -11.888671875, -9.4853515625, -7.08203125, -4.6787109375, -2.275390625, 0.1279296875, 2.53125, 4.9345703125, 7.337890625, 9.7412109375, 12.14453125, 14.5478515625, 16.951171875, 19.3544921875, 21.7578125, 24.1611328125, 26.564453125, 28.9677734375, 31.37109375, 33.7744140625, 36.177734375, 38.5810546875, 40.984375, 43.3876953125, 45.791015625, 48.1943359375, 50.59765625, 53.0009765625, 55.404296875, 57.8076171875, 60.2109375, 62.6142578125, 65.017578125, 67.4208984375, 69.82421875, 72.2275390625, 74.630859375, 77.0341796875, 79.4375]}, "gradients/decoder.roberta.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 13.0, 10.0, 11.0, 15.0, 11.0, 21.0, 26.0, 28.0, 27.0, 31.0, 34.0, 33.0, 40.0, 39.0, 35.0, 30.0, 59.0, 47.0, 44.0, 46.0, 35.0, 42.0, 37.0, 30.0, 23.0, 33.0, 24.0, 27.0, 27.0, 18.0, 12.0, 17.0, 12.0, 12.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.857421875, -2.76678466796875, -2.6761474609375, -2.58551025390625, -2.494873046875, -2.40423583984375, -2.3135986328125, -2.22296142578125, -2.13232421875, -2.04168701171875, -1.9510498046875, -1.86041259765625, -1.769775390625, -1.67913818359375, -1.5885009765625, -1.49786376953125, -1.4072265625, -1.31658935546875, -1.2259521484375, -1.13531494140625, -1.044677734375, -0.95404052734375, -0.8634033203125, -0.77276611328125, -0.68212890625, -0.59149169921875, -0.5008544921875, -0.41021728515625, -0.319580078125, -0.22894287109375, -0.1383056640625, -0.04766845703125, 0.04296875, 0.13360595703125, 0.2242431640625, 0.31488037109375, 0.405517578125, 0.49615478515625, 0.5867919921875, 0.67742919921875, 0.76806640625, 0.85870361328125, 0.9493408203125, 1.03997802734375, 1.130615234375, 1.22125244140625, 1.3118896484375, 1.40252685546875, 1.4931640625, 1.58380126953125, 1.6744384765625, 1.76507568359375, 1.855712890625, 1.94635009765625, 2.0369873046875, 2.12762451171875, 2.21826171875, 2.30889892578125, 2.3995361328125, 2.49017333984375, 2.580810546875, 2.67144775390625, 2.7620849609375, 2.85272216796875, 2.943359375]}, "gradients/decoder.roberta.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 7.0, 18.0, 21.0, 56.0, 222.0, 1124.0, 22886.0, 1005822.0, 17116.0, 944.0, 214.0, 63.0, 23.0, 13.0, 7.0, 9.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4921875, -12.053466796875, -11.61474609375, -11.176025390625, -10.7373046875, -10.298583984375, -9.85986328125, -9.421142578125, -8.982421875, -8.543701171875, -8.10498046875, -7.666259765625, -7.2275390625, -6.788818359375, -6.35009765625, -5.911376953125, -5.47265625, -5.033935546875, -4.59521484375, -4.156494140625, -3.7177734375, -3.279052734375, -2.84033203125, -2.401611328125, -1.962890625, -1.524169921875, -1.08544921875, -0.646728515625, -0.2080078125, 0.230712890625, 0.66943359375, 1.108154296875, 1.546875, 1.985595703125, 2.42431640625, 2.863037109375, 3.3017578125, 3.740478515625, 4.17919921875, 4.617919921875, 5.056640625, 5.495361328125, 5.93408203125, 6.372802734375, 6.8115234375, 7.250244140625, 7.68896484375, 8.127685546875, 8.56640625, 9.005126953125, 9.44384765625, 9.882568359375, 10.3212890625, 10.760009765625, 11.19873046875, 11.637451171875, 12.076171875, 12.514892578125, 12.95361328125, 13.392333984375, 13.8310546875, 14.269775390625, 14.70849609375, 15.147216796875, 15.5859375]}, "gradients/decoder.roberta.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 10.0, 13.0, 36.0, 41.0, 96.0, 127.0, 248.0, 197.0, 85.0, 54.0, 37.0, 19.0, 13.0, 14.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000667572021484375, -0.0006488561630249023, -0.0006301403045654297, -0.000611424446105957, -0.0005927085876464844, -0.0005739927291870117, -0.0005552768707275391, -0.0005365610122680664, -0.0005178451538085938, -0.0004991292953491211, -0.00048041343688964844, -0.0004616975784301758, -0.0004429817199707031, -0.00042426586151123047, -0.0004055500030517578, -0.00038683414459228516, -0.0003681182861328125, -0.00034940242767333984, -0.0003306865692138672, -0.00031197071075439453, -0.0002932548522949219, -0.0002745389938354492, -0.00025582313537597656, -0.0002371072769165039, -0.00021839141845703125, -0.0001996755599975586, -0.00018095970153808594, -0.00016224384307861328, -0.00014352798461914062, -0.00012481212615966797, -0.00010609626770019531, -8.738040924072266e-05, -6.866455078125e-05, -4.9948692321777344e-05, -3.123283386230469e-05, -1.2516975402832031e-05, 6.198883056640625e-06, 2.491474151611328e-05, 4.363059997558594e-05, 6.23464584350586e-05, 8.106231689453125e-05, 9.97781753540039e-05, 0.00011849403381347656, 0.00013720989227294922, 0.00015592575073242188, 0.00017464160919189453, 0.0001933574676513672, 0.00021207332611083984, 0.0002307891845703125, 0.00024950504302978516, 0.0002682209014892578, 0.00028693675994873047, 0.0003056526184082031, 0.0003243684768676758, 0.00034308433532714844, 0.0003618001937866211, 0.00038051605224609375, 0.0003992319107055664, 0.00041794776916503906, 0.0004366636276245117, 0.0004553794860839844, 0.00047409534454345703, 0.0004928112030029297, 0.0005115270614624023, 0.000530242919921875]}, "gradients/decoder.roberta.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 22.0, 20.0, 48.0, 125.0, 568.0, 130690.0, 915806.0, 950.0, 150.0, 68.0, 41.0, 18.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.93505859375, -25.1513671875, -24.36767578125, -23.583984375, -22.80029296875, -22.0166015625, -21.23291015625, -20.44921875, -19.66552734375, -18.8818359375, -18.09814453125, -17.314453125, -16.53076171875, -15.7470703125, -14.96337890625, -14.1796875, -13.39599609375, -12.6123046875, -11.82861328125, -11.044921875, -10.26123046875, -9.4775390625, -8.69384765625, -7.91015625, -7.12646484375, -6.3427734375, -5.55908203125, -4.775390625, -3.99169921875, -3.2080078125, -2.42431640625, -1.640625, -0.85693359375, -0.0732421875, 0.71044921875, 1.494140625, 2.27783203125, 3.0615234375, 3.84521484375, 4.62890625, 5.41259765625, 6.1962890625, 6.97998046875, 7.763671875, 8.54736328125, 9.3310546875, 10.11474609375, 10.8984375, 11.68212890625, 12.4658203125, 13.24951171875, 14.033203125, 14.81689453125, 15.6005859375, 16.38427734375, 17.16796875, 17.95166015625, 18.7353515625, 19.51904296875, 20.302734375, 21.08642578125, 21.8701171875, 22.65380859375, 23.4375]}, "gradients/decoder.roberta.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 7.0, 8.0, 15.0, 38.0, 51.0, 71.0, 146.0, 236.0, 189.0, 97.0, 60.0, 33.0, 17.0, 15.0, 8.0, 5.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.168365478515625, -1.12774658203125, -1.087127685546875, -1.0465087890625, -1.005889892578125, -0.96527099609375, -0.924652099609375, -0.884033203125, -0.843414306640625, -0.80279541015625, -0.762176513671875, -0.7215576171875, -0.680938720703125, -0.64031982421875, -0.599700927734375, -0.55908203125, -0.518463134765625, -0.47784423828125, -0.437225341796875, -0.3966064453125, -0.355987548828125, -0.31536865234375, -0.274749755859375, -0.234130859375, -0.193511962890625, -0.15289306640625, -0.112274169921875, -0.0716552734375, -0.031036376953125, 0.00958251953125, 0.050201416015625, 0.0908203125, 0.131439208984375, 0.17205810546875, 0.212677001953125, 0.2532958984375, 0.293914794921875, 0.33453369140625, 0.375152587890625, 0.415771484375, 0.456390380859375, 0.49700927734375, 0.537628173828125, 0.5782470703125, 0.618865966796875, 0.65948486328125, 0.700103759765625, 0.74072265625, 0.781341552734375, 0.82196044921875, 0.862579345703125, 0.9031982421875, 0.943817138671875, 0.98443603515625, 1.025054931640625, 1.065673828125, 1.106292724609375, 1.14691162109375, 1.187530517578125, 1.2281494140625, 1.268768310546875, 1.30938720703125, 1.350006103515625, 1.390625]}, "gradients/decoder.roberta.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 14.0, 56.0, 185.0, 349.0, 277.0, 105.0, 17.0, 8.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.591257095336914, -19.98025131225586, -19.369247436523438, -18.758243560791016, -18.14723777770996, -17.536231994628906, -16.925228118896484, -16.314224243164062, -15.703218460083008, -15.09221363067627, -14.481208801269531, -13.870203971862793, -13.259199142456055, -12.648194313049316, -12.037189483642578, -11.42618465423584, -10.815179824829102, -10.204174995422363, -9.593170166015625, -8.982165336608887, -8.371160507202148, -7.76015567779541, -7.149150848388672, -6.538146018981934, -5.927141189575195, -5.316136360168457, -4.705131530761719, -4.0941267013549805, -3.483121871948242, -2.872117042541504, -2.2611122131347656, -1.6501073837280273, -1.0391044616699219, -0.4280996322631836, 0.1829051971435547, 0.793910026550293, 1.4049148559570312, 2.0159196853637695, 2.626924514770508, 3.237929344177246, 3.8489341735839844, 4.459939002990723, 5.070943832397461, 5.681948661804199, 6.2929534912109375, 6.903958320617676, 7.514963150024414, 8.125967979431152, 8.73697280883789, 9.347977638244629, 9.958982467651367, 10.569987297058105, 11.180992126464844, 11.791996955871582, 12.40300178527832, 13.014006614685059, 13.625011444091797, 14.236016273498535, 14.847021102905273, 15.458025932312012, 16.06903076171875, 16.680034637451172, 17.291040420532227, 17.90204620361328, 18.513050079345703]}, "gradients/decoder.roberta.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 5.0, 3.0, 9.0, 10.0, 9.0, 10.0, 10.0, 22.0, 26.0, 23.0, 34.0, 37.0, 48.0, 50.0, 40.0, 44.0, 49.0, 48.0, 46.0, 57.0, 46.0, 41.0, 47.0, 44.0, 38.0, 36.0, 33.0, 24.0, 23.0, 9.0, 21.0, 13.0, 9.0, 13.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.95082950592041, -5.760390758514404, -5.569952011108398, -5.379513740539551, -5.189074993133545, -4.998636245727539, -4.808197498321533, -4.617758750915527, -4.4273200035095215, -4.236881256103516, -4.04644250869751, -3.856003999710083, -3.665565252304077, -3.4751267433166504, -3.2846879959106445, -3.0942492485046387, -2.903810739517212, -2.713371992111206, -2.5229334831237793, -2.3324947357177734, -2.1420559883117676, -1.9516173601150513, -1.761178731918335, -1.570739984512329, -1.3803013563156128, -1.1898627281188965, -0.9994239807128906, -0.8089853525161743, -0.6185466647148132, -0.42810797691345215, -0.23766934871673584, -0.04723060131072998, 0.14320802688598633, 0.3336467146873474, 0.5240854024887085, 0.7145240306854248, 0.9049627184867859, 1.095401406288147, 1.2858400344848633, 1.4762787818908691, 1.6667174100875854, 1.8571560382843018, 2.0475947856903076, 2.2380332946777344, 2.4284720420837402, 2.618910789489746, 2.809349536895752, 2.999788284301758, 3.1902267932891846, 3.3806655406951904, 3.571104049682617, 3.761542797088623, 3.951981544494629, 4.142420291900635, 4.332859039306641, 4.523297309875488, 4.713736057281494, 4.9041748046875, 5.094613552093506, 5.285052299499512, 5.475490570068359, 5.665929317474365, 5.856368064880371, 6.046806812286377, 6.237245559692383]}, "gradients/decoder.roberta.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 0.0, 9.0, 13.0, 23.0, 32.0, 43.0, 84.0, 151.0, 198.0, 310.0, 556.0, 1063.0, 2114.0, 5062.0, 15148.0, 59938.0, 321861.0, 1440642.0, 1780452.0, 452330.0, 81638.0, 19954.0, 6853.0, 2741.0, 1305.0, 734.0, 396.0, 223.0, 148.0, 80.0, 71.0, 44.0, 21.0, 19.0, 9.0, 11.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.4375, -6.2685546875, -6.099609375, -5.9306640625, -5.76171875, -5.5927734375, -5.423828125, -5.2548828125, -5.0859375, -4.9169921875, -4.748046875, -4.5791015625, -4.41015625, -4.2412109375, -4.072265625, -3.9033203125, -3.734375, -3.5654296875, -3.396484375, -3.2275390625, -3.05859375, -2.8896484375, -2.720703125, -2.5517578125, -2.3828125, -2.2138671875, -2.044921875, -1.8759765625, -1.70703125, -1.5380859375, -1.369140625, -1.2001953125, -1.03125, -0.8623046875, -0.693359375, -0.5244140625, -0.35546875, -0.1865234375, -0.017578125, 0.1513671875, 0.3203125, 0.4892578125, 0.658203125, 0.8271484375, 0.99609375, 1.1650390625, 1.333984375, 1.5029296875, 1.671875, 1.8408203125, 2.009765625, 2.1787109375, 2.34765625, 2.5166015625, 2.685546875, 2.8544921875, 3.0234375, 3.1923828125, 3.361328125, 3.5302734375, 3.69921875, 3.8681640625, 4.037109375, 4.2060546875, 4.375]}, "gradients/decoder.roberta.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 4.0, 8.0, 17.0, 8.0, 19.0, 16.0, 15.0, 25.0, 28.0, 24.0, 30.0, 40.0, 50.0, 42.0, 47.0, 44.0, 46.0, 37.0, 55.0, 45.0, 36.0, 46.0, 33.0, 34.0, 40.0, 26.0, 30.0, 21.0, 13.0, 21.0, 25.0, 6.0, 9.0, 12.0, 9.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.98333740234375, -3.8533935546875, -3.72344970703125, -3.593505859375, -3.46356201171875, -3.3336181640625, -3.20367431640625, -3.07373046875, -2.94378662109375, -2.8138427734375, -2.68389892578125, -2.553955078125, -2.42401123046875, -2.2940673828125, -2.16412353515625, -2.0341796875, -1.90423583984375, -1.7742919921875, -1.64434814453125, -1.514404296875, -1.38446044921875, -1.2545166015625, -1.12457275390625, -0.99462890625, -0.86468505859375, -0.7347412109375, -0.60479736328125, -0.474853515625, -0.34490966796875, -0.2149658203125, -0.08502197265625, 0.044921875, 0.17486572265625, 0.3048095703125, 0.43475341796875, 0.564697265625, 0.69464111328125, 0.8245849609375, 0.95452880859375, 1.08447265625, 1.21441650390625, 1.3443603515625, 1.47430419921875, 1.604248046875, 1.73419189453125, 1.8641357421875, 1.99407958984375, 2.1240234375, 2.25396728515625, 2.3839111328125, 2.51385498046875, 2.643798828125, 2.77374267578125, 2.9036865234375, 3.03363037109375, 3.16357421875, 3.29351806640625, 3.4234619140625, 3.55340576171875, 3.683349609375, 3.81329345703125, 3.9432373046875, 4.07318115234375, 4.203125]}, "gradients/decoder.roberta.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 6.0, 11.0, 16.0, 26.0, 38.0, 65.0, 100.0, 145.0, 272.0, 462.0, 1473.0, 3591482.0, 598024.0, 1089.0, 409.0, 225.0, 142.0, 103.0, 62.0, 47.0, 32.0, 13.0, 6.0, 7.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-83.125, -80.93408203125, -78.7431640625, -76.55224609375, -74.361328125, -72.17041015625, -69.9794921875, -67.78857421875, -65.59765625, -63.40673828125, -61.2158203125, -59.02490234375, -56.833984375, -54.64306640625, -52.4521484375, -50.26123046875, -48.0703125, -45.87939453125, -43.6884765625, -41.49755859375, -39.306640625, -37.11572265625, -34.9248046875, -32.73388671875, -30.54296875, -28.35205078125, -26.1611328125, -23.97021484375, -21.779296875, -19.58837890625, -17.3974609375, -15.20654296875, -13.015625, -10.82470703125, -8.6337890625, -6.44287109375, -4.251953125, -2.06103515625, 0.1298828125, 2.32080078125, 4.51171875, 6.70263671875, 8.8935546875, 11.08447265625, 13.275390625, 15.46630859375, 17.6572265625, 19.84814453125, 22.0390625, 24.22998046875, 26.4208984375, 28.61181640625, 30.802734375, 32.99365234375, 35.1845703125, 37.37548828125, 39.56640625, 41.75732421875, 43.9482421875, 46.13916015625, 48.330078125, 50.52099609375, 52.7119140625, 54.90283203125, 57.09375]}, "gradients/decoder.roberta.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 3.0, 7.0, 8.0, 17.0, 30.0, 53.0, 65.0, 100.0, 139.0, 220.0, 353.0, 502.0, 641.0, 619.0, 476.0, 289.0, 220.0, 109.0, 88.0, 44.0, 33.0, 14.0, 12.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.34259033203125, -2.2515869140625, -2.16058349609375, -2.069580078125, -1.97857666015625, -1.8875732421875, -1.79656982421875, -1.70556640625, -1.61456298828125, -1.5235595703125, -1.43255615234375, -1.341552734375, -1.25054931640625, -1.1595458984375, -1.06854248046875, -0.9775390625, -0.88653564453125, -0.7955322265625, -0.70452880859375, -0.613525390625, -0.52252197265625, -0.4315185546875, -0.34051513671875, -0.24951171875, -0.15850830078125, -0.0675048828125, 0.02349853515625, 0.114501953125, 0.20550537109375, 0.2965087890625, 0.38751220703125, 0.478515625, 0.56951904296875, 0.6605224609375, 0.75152587890625, 0.842529296875, 0.93353271484375, 1.0245361328125, 1.11553955078125, 1.20654296875, 1.29754638671875, 1.3885498046875, 1.47955322265625, 1.570556640625, 1.66156005859375, 1.7525634765625, 1.84356689453125, 1.9345703125, 2.02557373046875, 2.1165771484375, 2.20758056640625, 2.298583984375, 2.38958740234375, 2.4805908203125, 2.57159423828125, 2.66259765625, 2.75360107421875, 2.8446044921875, 2.93560791015625, 3.026611328125, 3.11761474609375, 3.2086181640625, 3.29962158203125, 3.390625]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 21.0, 31.0, 32.0, 59.0, 104.0, 133.0, 138.0, 129.0, 111.0, 102.0, 62.0, 26.0, 34.0, 11.0, 6.0, 3.0, 2.0, 2.0], "bins": [-11.71621322631836, -11.494498252868652, -11.272784233093262, -11.051069259643555, -10.829354286193848, -10.60763931274414, -10.38592529296875, -10.164210319519043, -9.942495346069336, -9.720780372619629, -9.499066352844238, -9.277351379394531, -9.055636405944824, -8.833921432495117, -8.612207412719727, -8.39049243927002, -8.168777465820312, -7.947062969207764, -7.725347995758057, -7.503633499145508, -7.281918525695801, -7.060204029083252, -6.838489055633545, -6.616774559020996, -6.395060062408447, -6.173345565795898, -5.951630592346191, -5.729916095733643, -5.5082011222839355, -5.286486625671387, -5.06477165222168, -4.843057155609131, -4.621342182159424, -4.399627685546875, -4.177912712097168, -3.95619797706604, -3.734483242034912, -3.5127687454223633, -3.2910537719726562, -3.0693392753601074, -2.8476243019104004, -2.6259095668792725, -2.4041948318481445, -2.1824800968170166, -1.9607653617858887, -1.7390507459640503, -1.5173360109329224, -1.2956212759017944, -1.073906660079956, -0.8521919250488281, -0.6304771900177002, -0.40876251459121704, -0.1870477795600891, 0.03466689586639404, 0.256381630897522, 0.4780963659286499, 0.6998111009597778, 0.9215258359909058, 1.1432405710220337, 1.364955186843872, 1.586669921875, 1.808384656906128, 2.030099391937256, 2.251814126968384, 2.4735288619995117]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 5.0, 10.0, 9.0, 7.0, 15.0, 12.0, 14.0, 20.0, 18.0, 35.0, 23.0, 33.0, 33.0, 42.0, 44.0, 37.0, 49.0, 46.0, 45.0, 48.0, 29.0, 49.0, 46.0, 39.0, 39.0, 31.0, 29.0, 40.0, 24.0, 18.0, 19.0, 13.0, 11.0, 19.0, 11.0, 8.0, 4.0, 3.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.062344074249268, -4.909416198730469, -4.75648832321167, -4.603560447692871, -4.450632572174072, -4.297704696655273, -4.144776821136475, -3.991848945617676, -3.838921070098877, -3.685993194580078, -3.5330653190612793, -3.3801374435424805, -3.2272095680236816, -3.074281692504883, -2.921353816986084, -2.768425941467285, -2.6154978275299072, -2.4625699520111084, -2.3096420764923096, -2.1567142009735107, -2.003786325454712, -1.850858449935913, -1.6979304552078247, -1.5450025796890259, -1.392074704170227, -1.2391468286514282, -1.0862189531326294, -0.9332910180091858, -0.780363142490387, -0.6274352669715881, -0.47450733184814453, -0.3215794563293457, -0.16865158081054688, -0.015723690390586853, 0.13720420002937317, 0.2901321053504944, 0.4430599808692932, 0.595987856388092, 0.7489157915115356, 0.9018436670303345, 1.0547715425491333, 1.2076994180679321, 1.360627293586731, 1.5135552883148193, 1.6664831638336182, 1.819411039352417, 1.9723389148712158, 2.1252667903900146, 2.2781946659088135, 2.4311225414276123, 2.584050416946411, 2.73697829246521, 2.889906167984009, 3.0428340435028076, 3.1957621574401855, 3.3486900329589844, 3.501617908477783, 3.654545783996582, 3.807473659515381, 3.9604015350341797, 4.1133294105529785, 4.266257286071777, 4.419185161590576, 4.572113037109375, 4.725040912628174]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 13.0, 12.0, 19.0, 37.0, 42.0, 50.0, 83.0, 107.0, 166.0, 265.0, 375.0, 620.0, 879.0, 1289.0, 1915.0, 2894.0, 4506.0, 7139.0, 11441.0, 18628.0, 31390.0, 54676.0, 97963.0, 174717.0, 235182.0, 172838.0, 96639.0, 53714.0, 30934.0, 18536.0, 11252.0, 7043.0, 4484.0, 2908.0, 1965.0, 1272.0, 838.0, 545.0, 380.0, 269.0, 166.0, 128.0, 65.0, 52.0, 40.0, 25.0, 14.0, 13.0, 8.0, 8.0, 6.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.89599609375, -0.8692398071289062, -0.8424835205078125, -0.8157272338867188, -0.788970947265625, -0.7622146606445312, -0.7354583740234375, -0.7087020874023438, -0.68194580078125, -0.6551895141601562, -0.6284332275390625, -0.6016769409179688, -0.574920654296875, -0.5481643676757812, -0.5214080810546875, -0.49465179443359375, -0.4678955078125, -0.44113922119140625, -0.4143829345703125, -0.38762664794921875, -0.360870361328125, -0.33411407470703125, -0.3073577880859375, -0.28060150146484375, -0.25384521484375, -0.22708892822265625, -0.2003326416015625, -0.17357635498046875, -0.146820068359375, -0.12006378173828125, -0.0933074951171875, -0.06655120849609375, -0.039794921875, -0.01303863525390625, 0.0137176513671875, 0.04047393798828125, 0.067230224609375, 0.09398651123046875, 0.1207427978515625, 0.14749908447265625, 0.17425537109375, 0.20101165771484375, 0.2277679443359375, 0.25452423095703125, 0.281280517578125, 0.30803680419921875, 0.3347930908203125, 0.36154937744140625, 0.3883056640625, 0.41506195068359375, 0.4418182373046875, 0.46857452392578125, 0.495330810546875, 0.5220870971679688, 0.5488433837890625, 0.5755996704101562, 0.60235595703125, 0.6291122436523438, 0.6558685302734375, 0.6826248168945312, 0.709381103515625, 0.7361373901367188, 0.7628936767578125, 0.7896499633789062, 0.81640625]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 10.0, 9.0, 9.0, 12.0, 13.0, 14.0, 20.0, 20.0, 34.0, 22.0, 33.0, 34.0, 43.0, 51.0, 31.0, 49.0, 44.0, 46.0, 47.0, 29.0, 50.0, 47.0, 37.0, 40.0, 33.0, 33.0, 32.0, 24.0, 19.0, 19.0, 12.0, 12.0, 18.0, 11.0, 8.0, 4.0, 3.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0390625, -4.88946533203125, -4.7398681640625, -4.59027099609375, -4.440673828125, -4.29107666015625, -4.1414794921875, -3.99188232421875, -3.84228515625, -3.69268798828125, -3.5430908203125, -3.39349365234375, -3.243896484375, -3.09429931640625, -2.9447021484375, -2.79510498046875, -2.6455078125, -2.49591064453125, -2.3463134765625, -2.19671630859375, -2.047119140625, -1.89752197265625, -1.7479248046875, -1.59832763671875, -1.44873046875, -1.29913330078125, -1.1495361328125, -0.99993896484375, -0.850341796875, -0.70074462890625, -0.5511474609375, -0.40155029296875, -0.251953125, -0.10235595703125, 0.0472412109375, 0.19683837890625, 0.346435546875, 0.49603271484375, 0.6456298828125, 0.79522705078125, 0.94482421875, 1.09442138671875, 1.2440185546875, 1.39361572265625, 1.543212890625, 1.69281005859375, 1.8424072265625, 1.99200439453125, 2.1416015625, 2.29119873046875, 2.4407958984375, 2.59039306640625, 2.739990234375, 2.88958740234375, 3.0391845703125, 3.18878173828125, 3.33837890625, 3.48797607421875, 3.6375732421875, 3.78717041015625, 3.936767578125, 4.08636474609375, 4.2359619140625, 4.38555908203125, 4.53515625]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 1.0, 8.0, 8.0, 11.0, 19.0, 17.0, 31.0, 43.0, 52.0, 62.0, 88.0, 127.0, 150.0, 232.0, 325.0, 478.0, 732.0, 1222.0, 2260.0, 4879.0, 12677.0, 44722.0, 915280.0, 42350.0, 12174.0, 4810.0, 2175.0, 1218.0, 728.0, 517.0, 312.0, 220.0, 158.0, 114.0, 80.0, 63.0, 52.0, 45.0, 24.0, 25.0, 12.0, 11.0, 8.0, 7.0, 9.0, 5.0, 2.0, 8.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.841796875, -2.756927490234375, -2.67205810546875, -2.587188720703125, -2.5023193359375, -2.417449951171875, -2.33258056640625, -2.247711181640625, -2.162841796875, -2.077972412109375, -1.99310302734375, -1.908233642578125, -1.8233642578125, -1.738494873046875, -1.65362548828125, -1.568756103515625, -1.48388671875, -1.399017333984375, -1.31414794921875, -1.229278564453125, -1.1444091796875, -1.059539794921875, -0.97467041015625, -0.889801025390625, -0.804931640625, -0.720062255859375, -0.63519287109375, -0.550323486328125, -0.4654541015625, -0.380584716796875, -0.29571533203125, -0.210845947265625, -0.1259765625, -0.041107177734375, 0.04376220703125, 0.128631591796875, 0.2135009765625, 0.298370361328125, 0.38323974609375, 0.468109130859375, 0.552978515625, 0.637847900390625, 0.72271728515625, 0.807586669921875, 0.8924560546875, 0.977325439453125, 1.06219482421875, 1.147064208984375, 1.23193359375, 1.316802978515625, 1.40167236328125, 1.486541748046875, 1.5714111328125, 1.656280517578125, 1.74114990234375, 1.826019287109375, 1.910888671875, 1.995758056640625, 2.08062744140625, 2.165496826171875, 2.2503662109375, 2.335235595703125, 2.42010498046875, 2.504974365234375, 2.58984375]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 8.0, 10.0, 11.0, 12.0, 12.0, 22.0, 23.0, 25.0, 25.0, 27.0, 26.0, 29.0, 38.0, 35.0, 38.0, 39.0, 33.0, 54.0, 40.0, 39.0, 38.0, 28.0, 52.0, 38.0, 38.0, 26.0, 26.0, 22.0, 29.0, 35.0, 22.0, 20.0, 11.0, 15.0, 11.0, 6.0, 8.0, 4.0, 5.0, 8.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.96484375, -2.87786865234375, -2.7908935546875, -2.70391845703125, -2.616943359375, -2.52996826171875, -2.4429931640625, -2.35601806640625, -2.26904296875, -2.18206787109375, -2.0950927734375, -2.00811767578125, -1.921142578125, -1.83416748046875, -1.7471923828125, -1.66021728515625, -1.5732421875, -1.48626708984375, -1.3992919921875, -1.31231689453125, -1.225341796875, -1.13836669921875, -1.0513916015625, -0.96441650390625, -0.87744140625, -0.79046630859375, -0.7034912109375, -0.61651611328125, -0.529541015625, -0.44256591796875, -0.3555908203125, -0.26861572265625, -0.181640625, -0.09466552734375, -0.0076904296875, 0.07928466796875, 0.166259765625, 0.25323486328125, 0.3402099609375, 0.42718505859375, 0.51416015625, 0.60113525390625, 0.6881103515625, 0.77508544921875, 0.862060546875, 0.94903564453125, 1.0360107421875, 1.12298583984375, 1.2099609375, 1.29693603515625, 1.3839111328125, 1.47088623046875, 1.557861328125, 1.64483642578125, 1.7318115234375, 1.81878662109375, 1.90576171875, 1.99273681640625, 2.0797119140625, 2.16668701171875, 2.253662109375, 2.34063720703125, 2.4276123046875, 2.51458740234375, 2.6015625]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 1.0, 9.0, 6.0, 9.0, 11.0, 30.0, 22.0, 47.0, 49.0, 66.0, 97.0, 183.0, 221.0, 358.0, 673.0, 1170.0, 2698.0, 7497.0, 38689.0, 964411.0, 22110.0, 5509.0, 2109.0, 1019.0, 557.0, 316.0, 219.0, 115.0, 91.0, 47.0, 50.0, 35.0, 36.0, 19.0, 14.0, 11.0, 10.0, 7.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.32861328125, -0.3177909851074219, -0.30696868896484375, -0.2961463928222656, -0.2853240966796875, -0.2745018005371094, -0.26367950439453125, -0.2528572082519531, -0.242034912109375, -0.23121261596679688, -0.22039031982421875, -0.20956802368164062, -0.1987457275390625, -0.18792343139648438, -0.17710113525390625, -0.16627883911132812, -0.15545654296875, -0.14463424682617188, -0.13381195068359375, -0.12298965454101562, -0.1121673583984375, -0.10134506225585938, -0.09052276611328125, -0.07970046997070312, -0.068878173828125, -0.058055877685546875, -0.04723358154296875, -0.036411285400390625, -0.0255889892578125, -0.014766693115234375, -0.00394439697265625, 0.006877899169921875, 0.0177001953125, 0.028522491455078125, 0.03934478759765625, 0.050167083740234375, 0.0609893798828125, 0.07181167602539062, 0.08263397216796875, 0.09345626831054688, 0.104278564453125, 0.11510086059570312, 0.12592315673828125, 0.13674545288085938, 0.1475677490234375, 0.15839004516601562, 0.16921234130859375, 0.18003463745117188, 0.19085693359375, 0.20167922973632812, 0.21250152587890625, 0.22332382202148438, 0.2341461181640625, 0.24496841430664062, 0.25579071044921875, 0.2666130065917969, 0.277435302734375, 0.2882575988769531, 0.29907989501953125, 0.3099021911621094, 0.3207244873046875, 0.3315467834472656, 0.34236907958984375, 0.3531913757324219, 0.364013671875]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 2.0, 10.0, 5.0, 10.0, 22.0, 21.0, 30.0, 33.0, 47.0, 57.0, 71.0, 84.0, 99.0, 64.0, 76.0, 46.0, 76.0, 47.0, 52.0, 36.0, 30.0, 17.0, 16.0, 10.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0338764190673828e-05, -2.931058406829834e-05, -2.828240394592285e-05, -2.7254223823547363e-05, -2.6226043701171875e-05, -2.5197863578796387e-05, -2.41696834564209e-05, -2.314150333404541e-05, -2.2113323211669922e-05, -2.1085143089294434e-05, -2.0056962966918945e-05, -1.9028782844543457e-05, -1.800060272216797e-05, -1.697242259979248e-05, -1.5944242477416992e-05, -1.4916062355041504e-05, -1.3887882232666016e-05, -1.2859702110290527e-05, -1.1831521987915039e-05, -1.080334186553955e-05, -9.775161743164062e-06, -8.746981620788574e-06, -7.718801498413086e-06, -6.690621376037598e-06, -5.662441253662109e-06, -4.634261131286621e-06, -3.606081008911133e-06, -2.5779008865356445e-06, -1.5497207641601562e-06, -5.21540641784668e-07, 5.066394805908203e-07, 1.5348196029663086e-06, 2.562999725341797e-06, 3.591179847717285e-06, 4.6193599700927734e-06, 5.647540092468262e-06, 6.67572021484375e-06, 7.703900337219238e-06, 8.732080459594727e-06, 9.760260581970215e-06, 1.0788440704345703e-05, 1.1816620826721191e-05, 1.284480094909668e-05, 1.3872981071472168e-05, 1.4901161193847656e-05, 1.5929341316223145e-05, 1.6957521438598633e-05, 1.798570156097412e-05, 1.901388168334961e-05, 2.0042061805725098e-05, 2.1070241928100586e-05, 2.2098422050476074e-05, 2.3126602172851562e-05, 2.415478229522705e-05, 2.518296241760254e-05, 2.6211142539978027e-05, 2.7239322662353516e-05, 2.8267502784729004e-05, 2.9295682907104492e-05, 3.032386302947998e-05, 3.135204315185547e-05, 3.238022327423096e-05, 3.3408403396606445e-05, 3.4436583518981934e-05, 3.546476364135742e-05]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 5.0, 2.0, 7.0, 15.0, 8.0, 17.0, 15.0, 24.0, 43.0, 55.0, 130.0, 318.0, 4842.0, 1023780.0, 18464.0, 412.0, 131.0, 77.0, 56.0, 23.0, 27.0, 14.0, 14.0, 11.0, 9.0, 6.0, 9.0, 2.0, 7.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86865234375, -0.84027099609375, -0.8118896484375, -0.78350830078125, -0.755126953125, -0.72674560546875, -0.6983642578125, -0.66998291015625, -0.6416015625, -0.61322021484375, -0.5848388671875, -0.55645751953125, -0.528076171875, -0.49969482421875, -0.4713134765625, -0.44293212890625, -0.41455078125, -0.38616943359375, -0.3577880859375, -0.32940673828125, -0.301025390625, -0.27264404296875, -0.2442626953125, -0.21588134765625, -0.1875, -0.15911865234375, -0.1307373046875, -0.10235595703125, -0.073974609375, -0.04559326171875, -0.0172119140625, 0.01116943359375, 0.03955078125, 0.06793212890625, 0.0963134765625, 0.12469482421875, 0.153076171875, 0.18145751953125, 0.2098388671875, 0.23822021484375, 0.2666015625, 0.29498291015625, 0.3233642578125, 0.35174560546875, 0.380126953125, 0.40850830078125, 0.4368896484375, 0.46527099609375, 0.49365234375, 0.52203369140625, 0.5504150390625, 0.57879638671875, 0.607177734375, 0.63555908203125, 0.6639404296875, 0.69232177734375, 0.720703125, 0.74908447265625, 0.7774658203125, 0.80584716796875, 0.834228515625, 0.86260986328125, 0.8909912109375, 0.91937255859375, 0.94775390625]}, "gradients/decoder.roberta.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 4.0, 5.0, 9.0, 12.0, 5.0, 11.0, 14.0, 17.0, 22.0, 18.0, 37.0, 40.0, 77.0, 114.0, 146.0, 126.0, 86.0, 61.0, 44.0, 30.0, 24.0, 13.0, 16.0, 13.0, 11.0, 3.0, 4.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.040740966796875, -0.03957223892211914, -0.03840351104736328, -0.03723478317260742, -0.03606605529785156, -0.0348973274230957, -0.033728599548339844, -0.032559871673583984, -0.031391143798828125, -0.030222415924072266, -0.029053688049316406, -0.027884960174560547, -0.026716232299804688, -0.025547504425048828, -0.02437877655029297, -0.02321004867553711, -0.02204132080078125, -0.02087259292602539, -0.01970386505126953, -0.018535137176513672, -0.017366409301757812, -0.016197681427001953, -0.015028953552246094, -0.013860225677490234, -0.012691497802734375, -0.011522769927978516, -0.010354042053222656, -0.009185314178466797, -0.008016586303710938, -0.006847858428955078, -0.005679130554199219, -0.004510402679443359, -0.0033416748046875, -0.0021729469299316406, -0.0010042190551757812, 0.00016450881958007812, 0.0013332366943359375, 0.002501964569091797, 0.0036706924438476562, 0.004839420318603516, 0.006008148193359375, 0.007176876068115234, 0.008345603942871094, 0.009514331817626953, 0.010683059692382812, 0.011851787567138672, 0.013020515441894531, 0.01418924331665039, 0.01535797119140625, 0.01652669906616211, 0.01769542694091797, 0.018864154815673828, 0.020032882690429688, 0.021201610565185547, 0.022370338439941406, 0.023539066314697266, 0.024707794189453125, 0.025876522064208984, 0.027045249938964844, 0.028213977813720703, 0.029382705688476562, 0.030551433563232422, 0.03172016143798828, 0.03288888931274414, 0.0340576171875]}, "gradients/decoder.roberta.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 19.0, 57.0, 128.0, 246.0, 276.0, 180.0, 74.0, 26.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.631829261779785, -10.191444396972656, -9.751060485839844, -9.310675621032715, -8.870290756225586, -8.429905891418457, -7.989521503448486, -7.549137115478516, -7.108752250671387, -6.668367385864258, -6.227982997894287, -5.787598609924316, -5.3472137451171875, -4.906828880310059, -4.466444492340088, -4.026060104370117, -3.5856752395629883, -3.1452906131744385, -2.7049059867858887, -2.264521360397339, -1.824136734008789, -1.3837521076202393, -0.9433674812316895, -0.5029828548431396, -0.06259822845458984, 0.37778639793395996, 0.8181710243225098, 1.2585556507110596, 1.6989402770996094, 2.139324903488159, 2.579709529876709, 3.020094156265259, 3.460477828979492, 3.900862455368042, 4.341247081756592, 4.7816314697265625, 5.222016334533691, 5.66240119934082, 6.102785587310791, 6.543169975280762, 6.983554840087891, 7.4239397048950195, 7.86432409286499, 8.304708480834961, 8.74509334564209, 9.185478210449219, 9.625862121582031, 10.06624698638916, 10.506631851196289, 10.947016716003418, 11.387401580810547, 11.82778549194336, 12.268170356750488, 12.708555221557617, 13.14893913269043, 13.589323997497559, 14.029708862304688, 14.470093727111816, 14.910478591918945, 15.350862503051758, 15.791247367858887, 16.231632232666016, 16.672016143798828, 17.112401962280273, 17.552785873413086]}, "gradients/decoder.roberta.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 5.0, 10.0, 9.0, 9.0, 13.0, 12.0, 14.0, 20.0, 22.0, 32.0, 22.0, 34.0, 34.0, 42.0, 49.0, 34.0, 47.0, 47.0, 44.0, 48.0, 28.0, 50.0, 47.0, 38.0, 40.0, 32.0, 33.0, 31.0, 26.0, 18.0, 19.0, 12.0, 13.0, 16.0, 12.0, 8.0, 4.0, 3.0, 3.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.037006855010986, -4.887447834014893, -4.737888336181641, -4.588329315185547, -4.438769817352295, -4.289210796356201, -4.139651298522949, -3.9900922775268555, -3.8405327796936035, -3.6909735202789307, -3.541414260864258, -3.391855001449585, -3.242295742034912, -3.0927364826202393, -2.9431772232055664, -2.7936182022094727, -2.6440589427948, -2.494499683380127, -2.344940423965454, -2.1953811645507812, -2.0458219051361084, -1.8962626457214355, -1.7467035055160522, -1.5971442461013794, -1.4475849866867065, -1.2980257272720337, -1.1484664678573608, -0.9989072680473328, -0.8493480086326599, -0.6997887492179871, -0.550229549407959, -0.40067028999328613, -0.2511110305786133, -0.10155178606510162, 0.048007458448410034, 0.1975666880607605, 0.34712594747543335, 0.4966852068901062, 0.6462444067001343, 0.7958036661148071, 0.94536292552948, 1.0949221849441528, 1.2444814443588257, 1.394040584564209, 1.5435998439788818, 1.6931591033935547, 1.8427183628082275, 1.9922776222229004, 2.1418368816375732, 2.291396141052246, 2.440955400466919, 2.590514659881592, 2.7400739192962646, 2.8896331787109375, 3.0391921997070312, 3.188751697540283, 3.338310718536377, 3.48786997795105, 3.6374292373657227, 3.7869884967803955, 3.9365477561950684, 4.086106777191162, 4.235666275024414, 4.385225296020508, 4.53478479385376]}, "gradients/decoder.roberta.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 6.0, 5.0, 11.0, 25.0, 20.0, 31.0, 32.0, 53.0, 62.0, 102.0, 114.0, 183.0, 272.0, 431.0, 758.0, 1445.0, 3008.0, 6683.0, 15327.0, 34043.0, 76390.0, 178357.0, 376462.0, 199928.0, 85321.0, 37994.0, 16612.0, 7502.0, 3455.0, 1683.0, 823.0, 434.0, 286.0, 188.0, 145.0, 86.0, 75.0, 61.0, 42.0, 27.0, 23.0, 19.0, 7.0, 11.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.8203125, -5.64691162109375, -5.4735107421875, -5.30010986328125, -5.126708984375, -4.95330810546875, -4.7799072265625, -4.60650634765625, -4.43310546875, -4.25970458984375, -4.0863037109375, -3.91290283203125, -3.739501953125, -3.56610107421875, -3.3927001953125, -3.21929931640625, -3.0458984375, -2.87249755859375, -2.6990966796875, -2.52569580078125, -2.352294921875, -2.17889404296875, -2.0054931640625, -1.83209228515625, -1.65869140625, -1.48529052734375, -1.3118896484375, -1.13848876953125, -0.965087890625, -0.79168701171875, -0.6182861328125, -0.44488525390625, -0.271484375, -0.09808349609375, 0.0753173828125, 0.24871826171875, 0.422119140625, 0.59552001953125, 0.7689208984375, 0.94232177734375, 1.11572265625, 1.28912353515625, 1.4625244140625, 1.63592529296875, 1.809326171875, 1.98272705078125, 2.1561279296875, 2.32952880859375, 2.5029296875, 2.67633056640625, 2.8497314453125, 3.02313232421875, 3.196533203125, 3.36993408203125, 3.5433349609375, 3.71673583984375, 3.89013671875, 4.06353759765625, 4.2369384765625, 4.41033935546875, 4.583740234375, 4.75714111328125, 4.9305419921875, 5.10394287109375, 5.27734375]}, "gradients/decoder.roberta.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 3.0, 9.0, 9.0, 8.0, 8.0, 15.0, 17.0, 13.0, 16.0, 29.0, 30.0, 26.0, 30.0, 47.0, 35.0, 47.0, 41.0, 50.0, 48.0, 51.0, 31.0, 43.0, 48.0, 43.0, 41.0, 36.0, 38.0, 29.0, 25.0, 25.0, 17.0, 13.0, 15.0, 17.0, 11.0, 8.0, 6.0, 2.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.05859375, -3.93634033203125, -3.8140869140625, -3.69183349609375, -3.569580078125, -3.44732666015625, -3.3250732421875, -3.20281982421875, -3.08056640625, -2.95831298828125, -2.8360595703125, -2.71380615234375, -2.591552734375, -2.46929931640625, -2.3470458984375, -2.22479248046875, -2.1025390625, -1.98028564453125, -1.8580322265625, -1.73577880859375, -1.613525390625, -1.49127197265625, -1.3690185546875, -1.24676513671875, -1.12451171875, -1.00225830078125, -0.8800048828125, -0.75775146484375, -0.635498046875, -0.51324462890625, -0.3909912109375, -0.26873779296875, -0.146484375, -0.02423095703125, 0.0980224609375, 0.22027587890625, 0.342529296875, 0.46478271484375, 0.5870361328125, 0.70928955078125, 0.83154296875, 0.95379638671875, 1.0760498046875, 1.19830322265625, 1.320556640625, 1.44281005859375, 1.5650634765625, 1.68731689453125, 1.8095703125, 1.93182373046875, 2.0540771484375, 2.17633056640625, 2.298583984375, 2.42083740234375, 2.5430908203125, 2.66534423828125, 2.78759765625, 2.90985107421875, 3.0321044921875, 3.15435791015625, 3.276611328125, 3.39886474609375, 3.5211181640625, 3.64337158203125, 3.765625]}, "gradients/decoder.roberta.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 7.0, 9.0, 17.0, 14.0, 15.0, 16.0, 23.0, 23.0, 42.0, 47.0, 50.0, 42.0, 69.0, 153.0, 898.0, 1044512.0, 1949.0, 222.0, 95.0, 51.0, 55.0, 34.0, 35.0, 24.0, 25.0, 27.0, 29.0, 6.0, 18.0, 8.0, 5.0, 3.0, 1.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.625, -105.1875, -101.75, -98.3125, -94.875, -91.4375, -88.0, -84.5625, -81.125, -77.6875, -74.25, -70.8125, -67.375, -63.9375, -60.5, -57.0625, -53.625, -50.1875, -46.75, -43.3125, -39.875, -36.4375, -33.0, -29.5625, -26.125, -22.6875, -19.25, -15.8125, -12.375, -8.9375, -5.5, -2.0625, 1.375, 4.8125, 8.25, 11.6875, 15.125, 18.5625, 22.0, 25.4375, 28.875, 32.3125, 35.75, 39.1875, 42.625, 46.0625, 49.5, 52.9375, 56.375, 59.8125, 63.25, 66.6875, 70.125, 73.5625, 77.0, 80.4375, 83.875, 87.3125, 90.75, 94.1875, 97.625, 101.0625, 104.5, 107.9375, 111.375]}, "gradients/decoder.roberta.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 2.0, 4.0, 8.0, 7.0, 13.0, 17.0, 12.0, 29.0, 33.0, 24.0, 19.0, 41.0, 39.0, 50.0, 42.0, 54.0, 54.0, 46.0, 50.0, 51.0, 58.0, 33.0, 36.0, 36.0, 48.0, 39.0, 24.0, 19.0, 22.0, 12.0, 24.0, 10.0, 11.0, 5.0, 2.0, 5.0, 4.0, 9.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.2109375, -4.08331298828125, -3.9556884765625, -3.82806396484375, -3.700439453125, -3.57281494140625, -3.4451904296875, -3.31756591796875, -3.18994140625, -3.06231689453125, -2.9346923828125, -2.80706787109375, -2.679443359375, -2.55181884765625, -2.4241943359375, -2.29656982421875, -2.1689453125, -2.04132080078125, -1.9136962890625, -1.78607177734375, -1.658447265625, -1.53082275390625, -1.4031982421875, -1.27557373046875, -1.14794921875, -1.02032470703125, -0.8927001953125, -0.76507568359375, -0.637451171875, -0.50982666015625, -0.3822021484375, -0.25457763671875, -0.126953125, 0.00067138671875, 0.1282958984375, 0.25592041015625, 0.383544921875, 0.51116943359375, 0.6387939453125, 0.76641845703125, 0.89404296875, 1.02166748046875, 1.1492919921875, 1.27691650390625, 1.404541015625, 1.53216552734375, 1.6597900390625, 1.78741455078125, 1.9150390625, 2.04266357421875, 2.1702880859375, 2.29791259765625, 2.425537109375, 2.55316162109375, 2.6807861328125, 2.80841064453125, 2.93603515625, 3.06365966796875, 3.1912841796875, 3.31890869140625, 3.446533203125, 3.57415771484375, 3.7017822265625, 3.82940673828125, 3.95703125]}, "gradients/decoder.roberta.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 19.0, 30.0, 46.0, 104.0, 207.0, 529.0, 1444.0, 8426.0, 264410.0, 751291.0, 18660.0, 2127.0, 702.0, 277.0, 106.0, 60.0, 32.0, 19.0, 14.0, 10.0, 4.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.7060546875, -8.443359375, -8.1806640625, -7.91796875, -7.6552734375, -7.392578125, -7.1298828125, -6.8671875, -6.6044921875, -6.341796875, -6.0791015625, -5.81640625, -5.5537109375, -5.291015625, -5.0283203125, -4.765625, -4.5029296875, -4.240234375, -3.9775390625, -3.71484375, -3.4521484375, -3.189453125, -2.9267578125, -2.6640625, -2.4013671875, -2.138671875, -1.8759765625, -1.61328125, -1.3505859375, -1.087890625, -0.8251953125, -0.5625, -0.2998046875, -0.037109375, 0.2255859375, 0.48828125, 0.7509765625, 1.013671875, 1.2763671875, 1.5390625, 1.8017578125, 2.064453125, 2.3271484375, 2.58984375, 2.8525390625, 3.115234375, 3.3779296875, 3.640625, 3.9033203125, 4.166015625, 4.4287109375, 4.69140625, 4.9541015625, 5.216796875, 5.4794921875, 5.7421875, 6.0048828125, 6.267578125, 6.5302734375, 6.79296875, 7.0556640625, 7.318359375, 7.5810546875, 7.84375]}, "gradients/decoder.roberta.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 7.0, 11.0, 8.0, 12.0, 22.0, 25.0, 41.0, 61.0, 75.0, 114.0, 136.0, 168.0, 92.0, 57.0, 40.0, 37.0, 26.0, 21.0, 7.0, 15.0, 6.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00048828125, -0.00047606974840164185, -0.0004638582468032837, -0.00045164674520492554, -0.0004394352436065674, -0.00042722374200820923, -0.0004150122404098511, -0.0004028007388114929, -0.00039058923721313477, -0.0003783777356147766, -0.00036616623401641846, -0.0003539547324180603, -0.00034174323081970215, -0.000329531729221344, -0.00031732022762298584, -0.0003051087260246277, -0.00029289722442626953, -0.0002806857228279114, -0.0002684742212295532, -0.00025626271963119507, -0.00024405121803283691, -0.00023183971643447876, -0.0002196282148361206, -0.00020741671323776245, -0.0001952052116394043, -0.00018299371004104614, -0.000170782208442688, -0.00015857070684432983, -0.00014635920524597168, -0.00013414770364761353, -0.00012193620204925537, -0.00010972470045089722, -9.751319885253906e-05, -8.530169725418091e-05, -7.309019565582275e-05, -6.08786940574646e-05, -4.8667192459106445e-05, -3.645569086074829e-05, -2.4244189262390137e-05, -1.2032687664031982e-05, 1.7881393432617188e-07, 1.2390315532684326e-05, 2.460181713104248e-05, 3.6813318729400635e-05, 4.902482032775879e-05, 6.123632192611694e-05, 7.34478235244751e-05, 8.565932512283325e-05, 9.78708267211914e-05, 0.00011008232831954956, 0.00012229382991790771, 0.00013450533151626587, 0.00014671683311462402, 0.00015892833471298218, 0.00017113983631134033, 0.00018335133790969849, 0.00019556283950805664, 0.0002077743411064148, 0.00021998584270477295, 0.0002321973443031311, 0.00024440884590148926, 0.0002566203474998474, 0.00026883184909820557, 0.0002810433506965637, 0.0002932548522949219]}, "gradients/decoder.roberta.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 2.0, 7.0, 14.0, 21.0, 39.0, 71.0, 175.0, 1012.0, 938623.0, 107722.0, 592.0, 132.0, 54.0, 36.0, 22.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.921875, -29.0390625, -28.15625, -27.2734375, -26.390625, -25.5078125, -24.625, -23.7421875, -22.859375, -21.9765625, -21.09375, -20.2109375, -19.328125, -18.4453125, -17.5625, -16.6796875, -15.796875, -14.9140625, -14.03125, -13.1484375, -12.265625, -11.3828125, -10.5, -9.6171875, -8.734375, -7.8515625, -6.96875, -6.0859375, -5.203125, -4.3203125, -3.4375, -2.5546875, -1.671875, -0.7890625, 0.09375, 0.9765625, 1.859375, 2.7421875, 3.625, 4.5078125, 5.390625, 6.2734375, 7.15625, 8.0390625, 8.921875, 9.8046875, 10.6875, 11.5703125, 12.453125, 13.3359375, 14.21875, 15.1015625, 15.984375, 16.8671875, 17.75, 18.6328125, 19.515625, 20.3984375, 21.28125, 22.1640625, 23.046875, 23.9296875, 24.8125, 25.6953125, 26.578125]}, "gradients/decoder.roberta.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 19.0, 31.0, 49.0, 71.0, 108.0, 221.0, 201.0, 111.0, 67.0, 43.0, 31.0, 7.0, 13.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2960205078125, -1.251220703125, -1.2064208984375, -1.16162109375, -1.1168212890625, -1.072021484375, -1.0272216796875, -0.982421875, -0.9376220703125, -0.892822265625, -0.8480224609375, -0.80322265625, -0.7584228515625, -0.713623046875, -0.6688232421875, -0.6240234375, -0.5792236328125, -0.534423828125, -0.4896240234375, -0.44482421875, -0.4000244140625, -0.355224609375, -0.3104248046875, -0.265625, -0.2208251953125, -0.176025390625, -0.1312255859375, -0.08642578125, -0.0416259765625, 0.003173828125, 0.0479736328125, 0.0927734375, 0.1375732421875, 0.182373046875, 0.2271728515625, 0.27197265625, 0.3167724609375, 0.361572265625, 0.4063720703125, 0.451171875, 0.4959716796875, 0.540771484375, 0.5855712890625, 0.63037109375, 0.6751708984375, 0.719970703125, 0.7647705078125, 0.8095703125, 0.8543701171875, 0.899169921875, 0.9439697265625, 0.98876953125, 1.0335693359375, 1.078369140625, 1.1231689453125, 1.16796875, 1.2127685546875, 1.257568359375, 1.3023681640625, 1.34716796875, 1.3919677734375, 1.436767578125, 1.4815673828125, 1.5263671875]}, "gradients/decoder.roberta.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 33.0, 61.0, 114.0, 203.0, 197.0, 193.0, 107.0, 51.0, 23.0, 17.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.976033210754395, -11.637297630310059, -11.298563003540039, -10.959827423095703, -10.621091842651367, -10.282356262207031, -9.943620681762695, -9.604886054992676, -9.26615047454834, -8.927414894104004, -8.588680267333984, -8.249944686889648, -7.9112091064453125, -7.572473526000977, -7.233738422393799, -6.895003318786621, -6.556267738342285, -6.217532157897949, -5.8787970542907715, -5.540061950683594, -5.201326370239258, -4.862590789794922, -4.523855686187744, -4.185120582580566, -3.8463850021362305, -3.5076496601104736, -3.168914318084717, -2.83017897605896, -2.491443634033203, -2.1527082920074463, -1.8139729499816895, -1.4752376079559326, -1.1365013122558594, -0.7977659702301025, -0.4590306282043457, -0.12029528617858887, 0.21844005584716797, 0.5571753978729248, 0.8959107398986816, 1.2346460819244385, 1.5733814239501953, 1.9121167659759521, 2.250852108001709, 2.589587450027466, 2.9283227920532227, 3.2670581340789795, 3.6057934761047363, 3.944528818130493, 4.28326416015625, 4.621999740600586, 4.960734844207764, 5.299469947814941, 5.638205528259277, 5.976941108703613, 6.315676212310791, 6.654411315917969, 6.993146896362305, 7.331882476806641, 7.670617580413818, 8.009352684020996, 8.348088264465332, 8.686823844909668, 9.025558471679688, 9.364294052124023, 9.70302963256836]}, "gradients/decoder.roberta.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 7.0, 7.0, 7.0, 4.0, 4.0, 5.0, 12.0, 11.0, 16.0, 18.0, 21.0, 12.0, 20.0, 25.0, 27.0, 28.0, 28.0, 36.0, 48.0, 40.0, 53.0, 42.0, 43.0, 50.0, 46.0, 49.0, 49.0, 41.0, 38.0, 38.0, 34.0, 19.0, 25.0, 14.0, 18.0, 12.0, 17.0, 14.0, 9.0, 5.0, 8.0, 0.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0], "bins": [-6.6140055656433105, -6.434468746185303, -6.254931449890137, -6.075394630432129, -5.895857810974121, -5.716320514678955, -5.536783695220947, -5.357246398925781, -5.177709579467773, -4.998172760009766, -4.8186354637146, -4.639098644256592, -4.459561824798584, -4.280024528503418, -4.10048770904541, -3.9209506511688232, -3.7414138317108154, -3.5618767738342285, -3.3823399543762207, -3.202802896499634, -3.023265838623047, -2.843729019165039, -2.664191961288452, -2.4846549034118652, -2.3051180839538574, -2.1255810260772705, -1.9460440874099731, -1.7665071487426758, -1.5869700908660889, -1.4074331521987915, -1.2278962135314941, -1.0483591556549072, -0.8688220977783203, -0.6892850995063782, -0.509748101234436, -0.33021116256713867, -0.15067416429519653, 0.028862833976745605, 0.20839977264404297, 0.3879368305206299, 0.5674737691879272, 0.7470107674598694, 0.9265477657318115, 1.1060847043991089, 1.2856216430664062, 1.4651587009429932, 1.6446956396102905, 1.8242326974868774, 2.003769636154175, 2.1833066940307617, 2.3628435134887695, 2.5423805713653564, 2.7219176292419434, 2.901454448699951, 3.080991506576538, 3.260528564453125, 3.440065383911133, 3.6196024417877197, 3.7991392612457275, 3.9786763191223145, 4.158213138580322, 4.337750434875488, 4.517287254333496, 4.696824073791504, 4.87636137008667]}, "gradients/decoder.roberta.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 13.0, 11.0, 14.0, 17.0, 17.0, 31.0, 36.0, 34.0, 60.0, 81.0, 96.0, 134.0, 188.0, 281.0, 433.0, 681.0, 1357.0, 2540.0, 5973.0, 16810.0, 65542.0, 359960.0, 1613331.0, 1620774.0, 397405.0, 76715.0, 19112.0, 6369.0, 2747.0, 1324.0, 749.0, 467.0, 250.0, 210.0, 130.0, 102.0, 72.0, 56.0, 40.0, 34.0, 25.0, 14.0, 11.0, 12.0, 5.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-5.84765625, -5.67578125, -5.50390625, -5.33203125, -5.16015625, -4.98828125, -4.81640625, -4.64453125, -4.47265625, -4.30078125, -4.12890625, -3.95703125, -3.78515625, -3.61328125, -3.44140625, -3.26953125, -3.09765625, -2.92578125, -2.75390625, -2.58203125, -2.41015625, -2.23828125, -2.06640625, -1.89453125, -1.72265625, -1.55078125, -1.37890625, -1.20703125, -1.03515625, -0.86328125, -0.69140625, -0.51953125, -0.34765625, -0.17578125, -0.00390625, 0.16796875, 0.33984375, 0.51171875, 0.68359375, 0.85546875, 1.02734375, 1.19921875, 1.37109375, 1.54296875, 1.71484375, 1.88671875, 2.05859375, 2.23046875, 2.40234375, 2.57421875, 2.74609375, 2.91796875, 3.08984375, 3.26171875, 3.43359375, 3.60546875, 3.77734375, 3.94921875, 4.12109375, 4.29296875, 4.46484375, 4.63671875, 4.80859375, 4.98046875, 5.15234375]}, "gradients/decoder.roberta.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 1.0, 7.0, 5.0, 5.0, 5.0, 8.0, 9.0, 10.0, 10.0, 17.0, 15.0, 19.0, 25.0, 28.0, 28.0, 25.0, 28.0, 31.0, 35.0, 40.0, 46.0, 45.0, 45.0, 50.0, 50.0, 41.0, 42.0, 46.0, 50.0, 26.0, 33.0, 32.0, 26.0, 21.0, 22.0, 17.0, 12.0, 14.0, 11.0, 7.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 3.0], "bins": [-4.78125, -4.65478515625, -4.5283203125, -4.40185546875, -4.275390625, -4.14892578125, -4.0224609375, -3.89599609375, -3.76953125, -3.64306640625, -3.5166015625, -3.39013671875, -3.263671875, -3.13720703125, -3.0107421875, -2.88427734375, -2.7578125, -2.63134765625, -2.5048828125, -2.37841796875, -2.251953125, -2.12548828125, -1.9990234375, -1.87255859375, -1.74609375, -1.61962890625, -1.4931640625, -1.36669921875, -1.240234375, -1.11376953125, -0.9873046875, -0.86083984375, -0.734375, -0.60791015625, -0.4814453125, -0.35498046875, -0.228515625, -0.10205078125, 0.0244140625, 0.15087890625, 0.27734375, 0.40380859375, 0.5302734375, 0.65673828125, 0.783203125, 0.90966796875, 1.0361328125, 1.16259765625, 1.2890625, 1.41552734375, 1.5419921875, 1.66845703125, 1.794921875, 1.92138671875, 2.0478515625, 2.17431640625, 2.30078125, 2.42724609375, 2.5537109375, 2.68017578125, 2.806640625, 2.93310546875, 3.0595703125, 3.18603515625, 3.3125]}, "gradients/decoder.roberta.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 8.0, 8.0, 14.0, 20.0, 37.0, 50.0, 70.0, 108.0, 170.0, 272.0, 576.0, 1631.0, 347344.0, 3839971.0, 2465.0, 593.0, 332.0, 179.0, 134.0, 67.0, 59.0, 44.0, 40.0, 21.0, 17.0, 7.0, 9.0, 3.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-64.5625, -62.91162109375, -61.2607421875, -59.60986328125, -57.958984375, -56.30810546875, -54.6572265625, -53.00634765625, -51.35546875, -49.70458984375, -48.0537109375, -46.40283203125, -44.751953125, -43.10107421875, -41.4501953125, -39.79931640625, -38.1484375, -36.49755859375, -34.8466796875, -33.19580078125, -31.544921875, -29.89404296875, -28.2431640625, -26.59228515625, -24.94140625, -23.29052734375, -21.6396484375, -19.98876953125, -18.337890625, -16.68701171875, -15.0361328125, -13.38525390625, -11.734375, -10.08349609375, -8.4326171875, -6.78173828125, -5.130859375, -3.47998046875, -1.8291015625, -0.17822265625, 1.47265625, 3.12353515625, 4.7744140625, 6.42529296875, 8.076171875, 9.72705078125, 11.3779296875, 13.02880859375, 14.6796875, 16.33056640625, 17.9814453125, 19.63232421875, 21.283203125, 22.93408203125, 24.5849609375, 26.23583984375, 27.88671875, 29.53759765625, 31.1884765625, 32.83935546875, 34.490234375, 36.14111328125, 37.7919921875, 39.44287109375, 41.09375]}, "gradients/decoder.roberta.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 10.0, 11.0, 9.0, 22.0, 29.0, 51.0, 47.0, 56.0, 112.0, 155.0, 225.0, 304.0, 459.0, 591.0, 612.0, 453.0, 309.0, 215.0, 120.0, 82.0, 60.0, 39.0, 30.0, 21.0, 9.0, 8.0, 8.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7080078125, -1.6362457275390625, -1.564483642578125, -1.4927215576171875, -1.42095947265625, -1.3491973876953125, -1.277435302734375, -1.2056732177734375, -1.1339111328125, -1.0621490478515625, -0.990386962890625, -0.9186248779296875, -0.84686279296875, -0.7751007080078125, -0.703338623046875, -0.6315765380859375, -0.559814453125, -0.4880523681640625, -0.416290283203125, -0.3445281982421875, -0.27276611328125, -0.2010040283203125, -0.129241943359375, -0.0574798583984375, 0.0142822265625, 0.0860443115234375, 0.157806396484375, 0.2295684814453125, 0.30133056640625, 0.3730926513671875, 0.444854736328125, 0.5166168212890625, 0.58837890625, 0.6601409912109375, 0.731903076171875, 0.8036651611328125, 0.87542724609375, 0.9471893310546875, 1.018951416015625, 1.0907135009765625, 1.1624755859375, 1.2342376708984375, 1.305999755859375, 1.3777618408203125, 1.44952392578125, 1.5212860107421875, 1.593048095703125, 1.6648101806640625, 1.736572265625, 1.8083343505859375, 1.880096435546875, 1.9518585205078125, 2.02362060546875, 2.0953826904296875, 2.167144775390625, 2.2389068603515625, 2.3106689453125, 2.3824310302734375, 2.454193115234375, 2.5259552001953125, 2.59771728515625, 2.6694793701171875, 2.741241455078125, 2.8130035400390625, 2.884765625]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 15.0, 13.0, 21.0, 41.0, 31.0, 49.0, 62.0, 69.0, 68.0, 84.0, 68.0, 66.0, 75.0, 59.0, 64.0, 49.0, 41.0, 23.0, 23.0, 20.0, 17.0, 7.0, 8.0, 7.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-4.810624599456787, -4.698017597198486, -4.5854105949401855, -4.472803592681885, -4.360196590423584, -4.247589588165283, -4.134982585906982, -4.022375106811523, -3.9097683429718018, -3.797161340713501, -3.6845543384552, -3.5719473361968994, -3.4593400955200195, -3.3467330932617188, -3.234126091003418, -3.121519088745117, -3.0089120864868164, -2.8963050842285156, -2.783698081970215, -2.671091079711914, -2.5584840774536133, -2.4458770751953125, -2.3332698345184326, -2.220662832260132, -2.108055830001831, -1.9954488277435303, -1.8828418254852295, -1.7702347040176392, -1.6576277017593384, -1.5450206995010376, -1.4324135780334473, -1.3198065757751465, -1.2071998119354248, -1.094592809677124, -0.9819857478141785, -0.8693786859512329, -0.7567716836929321, -0.6441646814346313, -0.5315576195716858, -0.41895055770874023, -0.30634355545043945, -0.19373652338981628, -0.08112949132919312, 0.031477540731430054, 0.14408457279205322, 0.256691575050354, 0.36929863691329956, 0.4819056987762451, 0.5945127010345459, 0.7071197032928467, 0.8197267651557922, 0.9323338270187378, 1.0449408292770386, 1.1575478315353394, 1.2701549530029297, 1.3827619552612305, 1.4953689575195312, 1.607975959777832, 1.7205829620361328, 1.8331900835037231, 1.945797085762024, 2.058403968811035, 2.171011209487915, 2.283618211746216, 2.3962252140045166]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 8.0, 11.0, 10.0, 12.0, 24.0, 17.0, 21.0, 28.0, 20.0, 31.0, 31.0, 31.0, 33.0, 45.0, 44.0, 36.0, 45.0, 41.0, 38.0, 39.0, 44.0, 41.0, 48.0, 34.0, 35.0, 26.0, 30.0, 19.0, 31.0, 18.0, 16.0, 14.0, 9.0, 11.0, 12.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.261424541473389, -4.125936508178711, -3.9904489517211914, -3.8549609184265137, -3.719473123550415, -3.5839853286743164, -3.4484972953796387, -3.31300950050354, -3.1775217056274414, -3.0420339107513428, -2.906546115875244, -2.7710580825805664, -2.6355702877044678, -2.500082492828369, -2.3645944595336914, -2.2291066646575928, -2.093618869781494, -1.9581310749053955, -1.8226431608200073, -1.6871552467346191, -1.5516674518585205, -1.4161796569824219, -1.2806917428970337, -1.1452038288116455, -1.0097160339355469, -0.8742281794548035, -0.7387403249740601, -0.6032524704933167, -0.46776461601257324, -0.33227676153182983, -0.19678890705108643, -0.06130105257034302, 0.07418680191040039, 0.2096746563911438, 0.3451625108718872, 0.4806503653526306, 0.616138219833374, 0.7516260743141174, 0.8871139287948608, 1.022601842880249, 1.1580896377563477, 1.2935774326324463, 1.4290653467178345, 1.5645532608032227, 1.7000410556793213, 1.83552885055542, 1.971016764640808, 2.1065046787261963, 2.241992473602295, 2.3774802684783936, 2.512968063354492, 2.64845609664917, 2.7839438915252686, 2.919431686401367, 3.054919719696045, 3.1904075145721436, 3.325895309448242, 3.461383104324341, 3.5968708992004395, 3.732358932495117, 3.867846727371216, 4.0033345222473145, 4.138822555541992, 4.274310111999512, 4.4097981452941895]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 6.0, 10.0, 13.0, 17.0, 19.0, 45.0, 59.0, 73.0, 118.0, 162.0, 270.0, 376.0, 585.0, 888.0, 1333.0, 2014.0, 3183.0, 4930.0, 8019.0, 12973.0, 21213.0, 35500.0, 62219.0, 109065.0, 179659.0, 218038.0, 159180.0, 94258.0, 53724.0, 30820.0, 18420.0, 11421.0, 7057.0, 4457.0, 2845.0, 1900.0, 1191.0, 807.0, 546.0, 365.0, 265.0, 164.0, 103.0, 73.0, 64.0, 32.0, 27.0, 17.0, 15.0, 9.0, 5.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.68310546875, -0.6620025634765625, -0.640899658203125, -0.6197967529296875, -0.59869384765625, -0.5775909423828125, -0.556488037109375, -0.5353851318359375, -0.5142822265625, -0.4931793212890625, -0.472076416015625, -0.4509735107421875, -0.42987060546875, -0.4087677001953125, -0.387664794921875, -0.3665618896484375, -0.345458984375, -0.3243560791015625, -0.303253173828125, -0.2821502685546875, -0.26104736328125, -0.2399444580078125, -0.218841552734375, -0.1977386474609375, -0.1766357421875, -0.1555328369140625, -0.134429931640625, -0.1133270263671875, -0.09222412109375, -0.0711212158203125, -0.050018310546875, -0.0289154052734375, -0.0078125, 0.0132904052734375, 0.034393310546875, 0.0554962158203125, 0.07659912109375, 0.0977020263671875, 0.118804931640625, 0.1399078369140625, 0.1610107421875, 0.1821136474609375, 0.203216552734375, 0.2243194580078125, 0.24542236328125, 0.2665252685546875, 0.287628173828125, 0.3087310791015625, 0.329833984375, 0.3509368896484375, 0.372039794921875, 0.3931427001953125, 0.41424560546875, 0.4353485107421875, 0.456451416015625, 0.4775543212890625, 0.4986572265625, 0.5197601318359375, 0.540863037109375, 0.5619659423828125, 0.58306884765625, 0.6041717529296875, 0.625274658203125, 0.6463775634765625, 0.66748046875]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 6.0, 8.0, 9.0, 10.0, 10.0, 12.0, 23.0, 16.0, 23.0, 28.0, 20.0, 28.0, 35.0, 31.0, 32.0, 44.0, 47.0, 35.0, 44.0, 41.0, 39.0, 35.0, 46.0, 43.0, 46.0, 33.0, 35.0, 28.0, 31.0, 18.0, 32.0, 17.0, 15.0, 15.0, 9.0, 11.0, 12.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.14508056640625, -4.0128173828125, -3.88055419921875, -3.748291015625, -3.61602783203125, -3.4837646484375, -3.35150146484375, -3.21923828125, -3.08697509765625, -2.9547119140625, -2.82244873046875, -2.690185546875, -2.55792236328125, -2.4256591796875, -2.29339599609375, -2.1611328125, -2.02886962890625, -1.8966064453125, -1.76434326171875, -1.632080078125, -1.49981689453125, -1.3675537109375, -1.23529052734375, -1.10302734375, -0.97076416015625, -0.8385009765625, -0.70623779296875, -0.573974609375, -0.44171142578125, -0.3094482421875, -0.17718505859375, -0.044921875, 0.08734130859375, 0.2196044921875, 0.35186767578125, 0.484130859375, 0.61639404296875, 0.7486572265625, 0.88092041015625, 1.01318359375, 1.14544677734375, 1.2777099609375, 1.40997314453125, 1.542236328125, 1.67449951171875, 1.8067626953125, 1.93902587890625, 2.0712890625, 2.20355224609375, 2.3358154296875, 2.46807861328125, 2.600341796875, 2.73260498046875, 2.8648681640625, 2.99713134765625, 3.12939453125, 3.26165771484375, 3.3939208984375, 3.52618408203125, 3.658447265625, 3.79071044921875, 3.9229736328125, 4.05523681640625, 4.1875]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 15.0, 15.0, 17.0, 28.0, 29.0, 35.0, 53.0, 80.0, 111.0, 155.0, 215.0, 276.0, 419.0, 683.0, 1131.0, 2107.0, 4482.0, 11459.0, 37973.0, 908070.0, 54312.0, 15051.0, 5598.0, 2505.0, 1325.0, 785.0, 451.0, 316.0, 241.0, 145.0, 109.0, 93.0, 65.0, 48.0, 35.0, 28.0, 17.0, 15.0, 15.0, 8.0, 8.0, 4.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.2421875, -2.171295166015625, -2.10040283203125, -2.029510498046875, -1.9586181640625, -1.887725830078125, -1.81683349609375, -1.745941162109375, -1.675048828125, -1.604156494140625, -1.53326416015625, -1.462371826171875, -1.3914794921875, -1.320587158203125, -1.24969482421875, -1.178802490234375, -1.10791015625, -1.037017822265625, -0.96612548828125, -0.895233154296875, -0.8243408203125, -0.753448486328125, -0.68255615234375, -0.611663818359375, -0.540771484375, -0.469879150390625, -0.39898681640625, -0.328094482421875, -0.2572021484375, -0.186309814453125, -0.11541748046875, -0.044525146484375, 0.0263671875, 0.097259521484375, 0.16815185546875, 0.239044189453125, 0.3099365234375, 0.380828857421875, 0.45172119140625, 0.522613525390625, 0.593505859375, 0.664398193359375, 0.73529052734375, 0.806182861328125, 0.8770751953125, 0.947967529296875, 1.01885986328125, 1.089752197265625, 1.16064453125, 1.231536865234375, 1.30242919921875, 1.373321533203125, 1.4442138671875, 1.515106201171875, 1.58599853515625, 1.656890869140625, 1.727783203125, 1.798675537109375, 1.86956787109375, 1.940460205078125, 2.0113525390625, 2.082244873046875, 2.15313720703125, 2.224029541015625, 2.294921875]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 3.0, 5.0, 9.0, 7.0, 13.0, 12.0, 16.0, 13.0, 19.0, 17.0, 29.0, 24.0, 25.0, 25.0, 34.0, 40.0, 55.0, 34.0, 42.0, 32.0, 45.0, 27.0, 40.0, 41.0, 32.0, 33.0, 31.0, 30.0, 31.0, 33.0, 39.0, 17.0, 24.0, 24.0, 21.0, 18.0, 11.0, 9.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.336181640625, -2.25634765625, -2.176513671875, -2.0966796875, -2.016845703125, -1.93701171875, -1.857177734375, -1.77734375, -1.697509765625, -1.61767578125, -1.537841796875, -1.4580078125, -1.378173828125, -1.29833984375, -1.218505859375, -1.138671875, -1.058837890625, -0.97900390625, -0.899169921875, -0.8193359375, -0.739501953125, -0.65966796875, -0.579833984375, -0.5, -0.420166015625, -0.34033203125, -0.260498046875, -0.1806640625, -0.100830078125, -0.02099609375, 0.058837890625, 0.138671875, 0.218505859375, 0.29833984375, 0.378173828125, 0.4580078125, 0.537841796875, 0.61767578125, 0.697509765625, 0.77734375, 0.857177734375, 0.93701171875, 1.016845703125, 1.0966796875, 1.176513671875, 1.25634765625, 1.336181640625, 1.416015625, 1.495849609375, 1.57568359375, 1.655517578125, 1.7353515625, 1.815185546875, 1.89501953125, 1.974853515625, 2.0546875, 2.134521484375, 2.21435546875, 2.294189453125, 2.3740234375, 2.453857421875, 2.53369140625, 2.613525390625, 2.693359375]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 0.0, 3.0, 3.0, 14.0, 15.0, 13.0, 14.0, 19.0, 26.0, 41.0, 51.0, 84.0, 110.0, 162.0, 234.0, 346.0, 586.0, 1060.0, 2282.0, 5527.0, 19645.0, 954500.0, 47944.0, 9060.0, 3189.0, 1467.0, 772.0, 487.0, 271.0, 193.0, 112.0, 92.0, 49.0, 42.0, 30.0, 24.0, 25.0, 13.0, 10.0, 7.0, 5.0, 9.0, 6.0, 3.0, 3.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.349853515625, -0.3397789001464844, -0.32970428466796875, -0.3196296691894531, -0.3095550537109375, -0.2994804382324219, -0.28940582275390625, -0.2793312072753906, -0.269256591796875, -0.2591819763183594, -0.24910736083984375, -0.23903274536132812, -0.2289581298828125, -0.21888351440429688, -0.20880889892578125, -0.19873428344726562, -0.18865966796875, -0.17858505249023438, -0.16851043701171875, -0.15843582153320312, -0.1483612060546875, -0.13828659057617188, -0.12821197509765625, -0.11813735961914062, -0.108062744140625, -0.09798812866210938, -0.08791351318359375, -0.07783889770507812, -0.0677642822265625, -0.057689666748046875, -0.04761505126953125, -0.037540435791015625, -0.0274658203125, -0.017391204833984375, -0.00731658935546875, 0.002758026123046875, 0.0128326416015625, 0.022907257080078125, 0.03298187255859375, 0.043056488037109375, 0.053131103515625, 0.06320571899414062, 0.07328033447265625, 0.08335494995117188, 0.0934295654296875, 0.10350418090820312, 0.11357879638671875, 0.12365341186523438, 0.13372802734375, 0.14380264282226562, 0.15387725830078125, 0.16395187377929688, 0.1740264892578125, 0.18410110473632812, 0.19417572021484375, 0.20425033569335938, 0.214324951171875, 0.22439956665039062, 0.23447418212890625, 0.24454879760742188, 0.2546234130859375, 0.2646980285644531, 0.27477264404296875, 0.2848472595214844, 0.294921875]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 4.0, 5.0, 5.0, 4.0, 10.0, 7.0, 13.0, 10.0, 22.0, 17.0, 25.0, 30.0, 53.0, 42.0, 55.0, 78.0, 66.0, 65.0, 68.0, 75.0, 76.0, 45.0, 45.0, 32.0, 30.0, 25.0, 15.0, 14.0, 12.0, 11.0, 8.0, 10.0, 4.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9146671295166016e-05, -2.8156675398349762e-05, -2.7166679501533508e-05, -2.6176683604717255e-05, -2.5186687707901e-05, -2.4196691811084747e-05, -2.3206695914268494e-05, -2.221670001745224e-05, -2.1226704120635986e-05, -2.0236708223819733e-05, -1.924671232700348e-05, -1.8256716430187225e-05, -1.726672053337097e-05, -1.6276724636554718e-05, -1.5286728739738464e-05, -1.429673284292221e-05, -1.3306736946105957e-05, -1.2316741049289703e-05, -1.132674515247345e-05, -1.0336749255657196e-05, -9.346753358840942e-06, -8.356757462024689e-06, -7.366761565208435e-06, -6.376765668392181e-06, -5.386769771575928e-06, -4.396773874759674e-06, -3.4067779779434204e-06, -2.4167820811271667e-06, -1.426786184310913e-06, -4.367902874946594e-07, 5.532056093215942e-07, 1.543201506137848e-06, 2.5331974029541016e-06, 3.5231932997703552e-06, 4.513189196586609e-06, 5.5031850934028625e-06, 6.493180990219116e-06, 7.48317688703537e-06, 8.473172783851624e-06, 9.463168680667877e-06, 1.0453164577484131e-05, 1.1443160474300385e-05, 1.2433156371116638e-05, 1.3423152267932892e-05, 1.4413148164749146e-05, 1.54031440615654e-05, 1.6393139958381653e-05, 1.7383135855197906e-05, 1.837313175201416e-05, 1.9363127648830414e-05, 2.0353123545646667e-05, 2.134311944246292e-05, 2.2333115339279175e-05, 2.332311123609543e-05, 2.4313107132911682e-05, 2.5303103029727936e-05, 2.629309892654419e-05, 2.7283094823360443e-05, 2.8273090720176697e-05, 2.926308661699295e-05, 3.0253082513809204e-05, 3.124307841062546e-05, 3.223307430744171e-05, 3.3223070204257965e-05, 3.421306610107422e-05]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 4.0, 3.0, 8.0, 9.0, 6.0, 13.0, 10.0, 19.0, 24.0, 26.0, 33.0, 51.0, 82.0, 162.0, 571.0, 100577.0, 944928.0, 1458.0, 228.0, 98.0, 54.0, 46.0, 30.0, 24.0, 16.0, 16.0, 18.0, 8.0, 8.0, 2.0, 7.0, 5.0, 5.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.8037948608398438, -0.7779998779296875, -0.7522048950195312, -0.726409912109375, -0.7006149291992188, -0.6748199462890625, -0.6490249633789062, -0.62322998046875, -0.5974349975585938, -0.5716400146484375, -0.5458450317382812, -0.520050048828125, -0.49425506591796875, -0.4684600830078125, -0.44266510009765625, -0.4168701171875, -0.39107513427734375, -0.3652801513671875, -0.33948516845703125, -0.313690185546875, -0.28789520263671875, -0.2621002197265625, -0.23630523681640625, -0.21051025390625, -0.18471527099609375, -0.1589202880859375, -0.13312530517578125, -0.107330322265625, -0.08153533935546875, -0.0557403564453125, -0.02994537353515625, -0.004150390625, 0.02164459228515625, 0.0474395751953125, 0.07323455810546875, 0.099029541015625, 0.12482452392578125, 0.1506195068359375, 0.17641448974609375, 0.20220947265625, 0.22800445556640625, 0.2537994384765625, 0.27959442138671875, 0.305389404296875, 0.33118438720703125, 0.3569793701171875, 0.38277435302734375, 0.4085693359375, 0.43436431884765625, 0.4601593017578125, 0.48595428466796875, 0.511749267578125, 0.5375442504882812, 0.5633392333984375, 0.5891342163085938, 0.61492919921875, 0.6407241821289062, 0.6665191650390625, 0.6923141479492188, 0.718109130859375, 0.7439041137695312, 0.7696990966796875, 0.7954940795898438, 0.8212890625]}, "gradients/decoder.roberta.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 12.0, 10.0, 14.0, 11.0, 22.0, 29.0, 22.0, 36.0, 50.0, 71.0, 115.0, 151.0, 121.0, 84.0, 43.0, 40.0, 31.0, 20.0, 14.0, 23.0, 12.0, 9.0, 8.0, 6.0, 7.0, 3.0, 5.0, 2.0, 1.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034027099609375, -0.03294849395751953, -0.03186988830566406, -0.030791282653808594, -0.029712677001953125, -0.028634071350097656, -0.027555465698242188, -0.02647686004638672, -0.02539825439453125, -0.02431964874267578, -0.023241043090820312, -0.022162437438964844, -0.021083831787109375, -0.020005226135253906, -0.018926620483398438, -0.01784801483154297, -0.0167694091796875, -0.01569080352783203, -0.014612197875976562, -0.013533592224121094, -0.012454986572265625, -0.011376380920410156, -0.010297775268554688, -0.009219169616699219, -0.00814056396484375, -0.007061958312988281, -0.0059833526611328125, -0.004904747009277344, -0.003826141357421875, -0.0027475357055664062, -0.0016689300537109375, -0.0005903244018554688, 0.00048828125, 0.0015668869018554688, 0.0026454925537109375, 0.0037240982055664062, 0.004802703857421875, 0.005881309509277344, 0.0069599151611328125, 0.008038520812988281, 0.00911712646484375, 0.010195732116699219, 0.011274337768554688, 0.012352943420410156, 0.013431549072265625, 0.014510154724121094, 0.015588760375976562, 0.01666736602783203, 0.0177459716796875, 0.01882457733154297, 0.019903182983398438, 0.020981788635253906, 0.022060394287109375, 0.023138999938964844, 0.024217605590820312, 0.02529621124267578, 0.02637481689453125, 0.02745342254638672, 0.028532028198242188, 0.029610633850097656, 0.030689239501953125, 0.031767845153808594, 0.03284645080566406, 0.03392505645751953, 0.035003662109375]}, "gradients/decoder.roberta.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 17.0, 23.0, 51.0, 40.0, 81.0, 101.0, 110.0, 87.0, 91.0, 93.0, 90.0, 68.0, 40.0, 42.0, 23.0, 14.0, 8.0, 12.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.114887237548828, -3.961808204650879, -3.808729410171509, -3.6556503772735596, -3.5025715827941895, -3.3494925498962402, -3.196413516998291, -3.043334484100342, -2.8902556896209717, -2.7371766567230225, -2.5840978622436523, -2.431018829345703, -2.277939796447754, -2.124861001968384, -1.9717819690704346, -1.818703055381775, -1.6656241416931152, -1.5125452280044556, -1.359466314315796, -1.2063872814178467, -1.053308367729187, -0.9002294540405273, -0.7471504807472229, -0.5940715074539185, -0.4409925937652588, -0.28791365027427673, -0.13483470678329468, 0.018244236707687378, 0.17132318019866943, 0.3244020938873291, 0.47748106718063354, 0.630560040473938, 0.7836384773254395, 0.9367173910140991, 1.0897963047027588, 1.242875337600708, 1.3959542512893677, 1.5490331649780273, 1.7021121978759766, 1.8551911115646362, 2.008270025253296, 2.161349058151245, 2.3144278526306152, 2.4675068855285645, 2.6205859184265137, 2.773664712905884, 2.926743745803833, 3.079822540283203, 3.2329015731811523, 3.3859806060791016, 3.5390594005584717, 3.692138433456421, 3.845217227935791, 3.9982962608337402, 4.1513752937316895, 4.304454326629639, 4.45753288269043, 4.610611915588379, 4.763690948486328, 4.916769504547119, 5.069848537445068, 5.222927570343018, 5.376006603240967, 5.529085636138916, 5.682164669036865]}, "gradients/decoder.roberta.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 4.0, 5.0, 6.0, 7.0, 10.0, 9.0, 10.0, 13.0, 23.0, 16.0, 22.0, 29.0, 19.0, 29.0, 35.0, 31.0, 30.0, 46.0, 45.0, 34.0, 47.0, 40.0, 40.0, 33.0, 47.0, 44.0, 46.0, 33.0, 35.0, 29.0, 27.0, 21.0, 30.0, 19.0, 15.0, 14.0, 9.0, 12.0, 12.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.283318996429443, -4.150961875915527, -4.0186052322387695, -3.8862481117248535, -3.7538909912109375, -3.6215341091156006, -3.4891772270202637, -3.3568201065063477, -3.2244629859924316, -3.0921061038970947, -2.9597489833831787, -2.827392101287842, -2.695034980773926, -2.562678098678589, -2.430321216583252, -2.297964096069336, -2.165607213973999, -2.033250331878662, -1.900893211364746, -1.7685363292694092, -1.6361792087554932, -1.5038223266601562, -1.3714653253555298, -1.2391083240509033, -1.1067513227462769, -0.9743943214416504, -0.8420373201370239, -0.7096803784370422, -0.5773233771324158, -0.4449663758277893, -0.3126094341278076, -0.18025243282318115, -0.04789543151855469, 0.08446155488491058, 0.21681854128837585, 0.34917551279067993, 0.4815325140953064, 0.6138895153999329, 0.7462464570999146, 0.878603458404541, 1.0109604597091675, 1.143317461013794, 1.2756744623184204, 1.4080314636230469, 1.5403883457183838, 1.6727454662322998, 1.8051023483276367, 1.9374593496322632, 2.0698163509368896, 2.2021732330322266, 2.3345303535461426, 2.4668872356414795, 2.5992443561553955, 2.7316012382507324, 2.8639583587646484, 2.9963152408599854, 3.1286721229553223, 3.261029005050659, 3.393386125564575, 3.525743007659912, 3.658100128173828, 3.790457010269165, 3.922813892364502, 4.055171012878418, 4.187528133392334]}, "gradients/decoder.roberta.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 2.0, 10.0, 14.0, 15.0, 15.0, 35.0, 35.0, 60.0, 110.0, 176.0, 265.0, 468.0, 894.0, 1672.0, 4290.0, 10311.0, 26874.0, 73223.0, 194465.0, 360306.0, 232009.0, 88700.0, 32784.0, 12393.0, 4910.0, 2155.0, 1020.0, 472.0, 308.0, 206.0, 114.0, 77.0, 47.0, 26.0, 17.0, 24.0, 7.0, 8.0, 4.0, 3.0, 5.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75, -5.5736083984375, -5.397216796875, -5.2208251953125, -5.04443359375, -4.8680419921875, -4.691650390625, -4.5152587890625, -4.3388671875, -4.1624755859375, -3.986083984375, -3.8096923828125, -3.63330078125, -3.4569091796875, -3.280517578125, -3.1041259765625, -2.927734375, -2.7513427734375, -2.574951171875, -2.3985595703125, -2.22216796875, -2.0457763671875, -1.869384765625, -1.6929931640625, -1.5166015625, -1.3402099609375, -1.163818359375, -0.9874267578125, -0.81103515625, -0.6346435546875, -0.458251953125, -0.2818603515625, -0.10546875, 0.0709228515625, 0.247314453125, 0.4237060546875, 0.60009765625, 0.7764892578125, 0.952880859375, 1.1292724609375, 1.3056640625, 1.4820556640625, 1.658447265625, 1.8348388671875, 2.01123046875, 2.1876220703125, 2.364013671875, 2.5404052734375, 2.716796875, 2.8931884765625, 3.069580078125, 3.2459716796875, 3.42236328125, 3.5987548828125, 3.775146484375, 3.9515380859375, 4.1279296875, 4.3043212890625, 4.480712890625, 4.6571044921875, 4.83349609375, 5.0098876953125, 5.186279296875, 5.3626708984375, 5.5390625]}, "gradients/decoder.roberta.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 6.0, 5.0, 4.0, 12.0, 8.0, 12.0, 15.0, 22.0, 16.0, 22.0, 23.0, 25.0, 25.0, 42.0, 28.0, 37.0, 43.0, 45.0, 36.0, 29.0, 52.0, 52.0, 32.0, 41.0, 42.0, 37.0, 47.0, 28.0, 32.0, 30.0, 22.0, 28.0, 16.0, 14.0, 9.0, 14.0, 17.0, 6.0, 5.0, 1.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.834259033203125, -3.71148681640625, -3.588714599609375, -3.4659423828125, -3.343170166015625, -3.22039794921875, -3.097625732421875, -2.974853515625, -2.852081298828125, -2.72930908203125, -2.606536865234375, -2.4837646484375, -2.360992431640625, -2.23822021484375, -2.115447998046875, -1.99267578125, -1.869903564453125, -1.74713134765625, -1.624359130859375, -1.5015869140625, -1.378814697265625, -1.25604248046875, -1.133270263671875, -1.010498046875, -0.887725830078125, -0.76495361328125, -0.642181396484375, -0.5194091796875, -0.396636962890625, -0.27386474609375, -0.151092529296875, -0.0283203125, 0.094451904296875, 0.21722412109375, 0.339996337890625, 0.4627685546875, 0.585540771484375, 0.70831298828125, 0.831085205078125, 0.953857421875, 1.076629638671875, 1.19940185546875, 1.322174072265625, 1.4449462890625, 1.567718505859375, 1.69049072265625, 1.813262939453125, 1.93603515625, 2.058807373046875, 2.18157958984375, 2.304351806640625, 2.4271240234375, 2.549896240234375, 2.67266845703125, 2.795440673828125, 2.918212890625, 3.040985107421875, 3.16375732421875, 3.286529541015625, 3.4093017578125, 3.532073974609375, 3.65484619140625, 3.777618408203125, 3.900390625]}, "gradients/decoder.roberta.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 3.0, 5.0, 12.0, 10.0, 18.0, 11.0, 16.0, 19.0, 42.0, 43.0, 42.0, 90.0, 126.0, 734.0, 1046057.0, 813.0, 139.0, 81.0, 65.0, 59.0, 42.0, 27.0, 26.0, 12.0, 16.0, 15.0, 7.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.125, -148.71875, -143.3125, -137.90625, -132.5, -127.09375, -121.6875, -116.28125, -110.875, -105.46875, -100.0625, -94.65625, -89.25, -83.84375, -78.4375, -73.03125, -67.625, -62.21875, -56.8125, -51.40625, -46.0, -40.59375, -35.1875, -29.78125, -24.375, -18.96875, -13.5625, -8.15625, -2.75, 2.65625, 8.0625, 13.46875, 18.875, 24.28125, 29.6875, 35.09375, 40.5, 45.90625, 51.3125, 56.71875, 62.125, 67.53125, 72.9375, 78.34375, 83.75, 89.15625, 94.5625, 99.96875, 105.375, 110.78125, 116.1875, 121.59375, 127.0, 132.40625, 137.8125, 143.21875, 148.625, 154.03125, 159.4375, 164.84375, 170.25, 175.65625, 181.0625, 186.46875, 191.875]}, "gradients/decoder.roberta.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 7.0, 18.0, 15.0, 22.0, 22.0, 29.0, 48.0, 66.0, 67.0, 56.0, 58.0, 70.0, 64.0, 69.0, 56.0, 67.0, 41.0, 44.0, 46.0, 25.0, 15.0, 15.0, 14.0, 11.0, 12.0, 8.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6953125, -6.50653076171875, -6.3177490234375, -6.12896728515625, -5.940185546875, -5.75140380859375, -5.5626220703125, -5.37384033203125, -5.18505859375, -4.99627685546875, -4.8074951171875, -4.61871337890625, -4.429931640625, -4.24114990234375, -4.0523681640625, -3.86358642578125, -3.6748046875, -3.48602294921875, -3.2972412109375, -3.10845947265625, -2.919677734375, -2.73089599609375, -2.5421142578125, -2.35333251953125, -2.16455078125, -1.97576904296875, -1.7869873046875, -1.59820556640625, -1.409423828125, -1.22064208984375, -1.0318603515625, -0.84307861328125, -0.654296875, -0.46551513671875, -0.2767333984375, -0.08795166015625, 0.100830078125, 0.28961181640625, 0.4783935546875, 0.66717529296875, 0.85595703125, 1.04473876953125, 1.2335205078125, 1.42230224609375, 1.611083984375, 1.79986572265625, 1.9886474609375, 2.17742919921875, 2.3662109375, 2.55499267578125, 2.7437744140625, 2.93255615234375, 3.121337890625, 3.31011962890625, 3.4989013671875, 3.68768310546875, 3.87646484375, 4.06524658203125, 4.2540283203125, 4.44281005859375, 4.631591796875, 4.82037353515625, 5.0091552734375, 5.19793701171875, 5.38671875]}, "gradients/decoder.roberta.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 9.0, 1.0, 10.0, 10.0, 33.0, 58.0, 145.0, 376.0, 960.0, 3677.0, 101482.0, 911877.0, 26520.0, 2208.0, 689.0, 286.0, 117.0, 48.0, 24.0, 10.0, 8.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.40625, -8.1463623046875, -7.886474609375, -7.6265869140625, -7.36669921875, -7.1068115234375, -6.846923828125, -6.5870361328125, -6.3271484375, -6.0672607421875, -5.807373046875, -5.5474853515625, -5.28759765625, -5.0277099609375, -4.767822265625, -4.5079345703125, -4.248046875, -3.9881591796875, -3.728271484375, -3.4683837890625, -3.20849609375, -2.9486083984375, -2.688720703125, -2.4288330078125, -2.1689453125, -1.9090576171875, -1.649169921875, -1.3892822265625, -1.12939453125, -0.8695068359375, -0.609619140625, -0.3497314453125, -0.08984375, 0.1700439453125, 0.429931640625, 0.6898193359375, 0.94970703125, 1.2095947265625, 1.469482421875, 1.7293701171875, 1.9892578125, 2.2491455078125, 2.509033203125, 2.7689208984375, 3.02880859375, 3.2886962890625, 3.548583984375, 3.8084716796875, 4.068359375, 4.3282470703125, 4.588134765625, 4.8480224609375, 5.10791015625, 5.3677978515625, 5.627685546875, 5.8875732421875, 6.1474609375, 6.4073486328125, 6.667236328125, 6.9271240234375, 7.18701171875, 7.4468994140625, 7.706787109375, 7.9666748046875, 8.2265625]}, "gradients/decoder.roberta.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 13.0, 11.0, 26.0, 23.0, 84.0, 103.0, 135.0, 182.0, 155.0, 101.0, 65.0, 33.0, 31.0, 12.0, 12.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006380081176757812, -0.0006210505962371826, -0.000604093074798584, -0.0005871355533599854, -0.0005701780319213867, -0.0005532205104827881, -0.0005362629890441895, -0.0005193054676055908, -0.0005023479461669922, -0.00048539042472839355, -0.0004684329032897949, -0.0004514753818511963, -0.00043451786041259766, -0.000417560338973999, -0.0004006028175354004, -0.00038364529609680176, -0.0003666877746582031, -0.0003497302532196045, -0.00033277273178100586, -0.0003158152103424072, -0.0002988576889038086, -0.00028190016746520996, -0.00026494264602661133, -0.0002479851245880127, -0.00023102760314941406, -0.00021407008171081543, -0.0001971125602722168, -0.00018015503883361816, -0.00016319751739501953, -0.0001462399959564209, -0.00012928247451782227, -0.00011232495307922363, -9.5367431640625e-05, -7.840991020202637e-05, -6.145238876342773e-05, -4.44948673248291e-05, -2.753734588623047e-05, -1.0579824447631836e-05, 6.377696990966797e-06, 2.333521842956543e-05, 4.029273986816406e-05, 5.7250261306762695e-05, 7.420778274536133e-05, 9.116530418395996e-05, 0.0001081228256225586, 0.00012508034706115723, 0.00014203786849975586, 0.0001589953899383545, 0.00017595291137695312, 0.00019291043281555176, 0.0002098679542541504, 0.00022682547569274902, 0.00024378299713134766, 0.0002607405185699463, 0.0002776980400085449, 0.00029465556144714355, 0.0003116130828857422, 0.0003285706043243408, 0.00034552812576293945, 0.0003624856472015381, 0.0003794431686401367, 0.00039640069007873535, 0.000413358211517334, 0.0004303157329559326, 0.00044727325439453125]}, "gradients/decoder.roberta.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 10.0, 16.0, 21.0, 31.0, 65.0, 125.0, 222.0, 1510.0, 1019861.0, 25862.0, 448.0, 144.0, 85.0, 54.0, 33.0, 24.0, 13.0, 6.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.489013671875, -20.79052734375, -20.092041015625, -19.3935546875, -18.695068359375, -17.99658203125, -17.298095703125, -16.599609375, -15.901123046875, -15.20263671875, -14.504150390625, -13.8056640625, -13.107177734375, -12.40869140625, -11.710205078125, -11.01171875, -10.313232421875, -9.61474609375, -8.916259765625, -8.2177734375, -7.519287109375, -6.82080078125, -6.122314453125, -5.423828125, -4.725341796875, -4.02685546875, -3.328369140625, -2.6298828125, -1.931396484375, -1.23291015625, -0.534423828125, 0.1640625, 0.862548828125, 1.56103515625, 2.259521484375, 2.9580078125, 3.656494140625, 4.35498046875, 5.053466796875, 5.751953125, 6.450439453125, 7.14892578125, 7.847412109375, 8.5458984375, 9.244384765625, 9.94287109375, 10.641357421875, 11.33984375, 12.038330078125, 12.73681640625, 13.435302734375, 14.1337890625, 14.832275390625, 15.53076171875, 16.229248046875, 16.927734375, 17.626220703125, 18.32470703125, 19.023193359375, 19.7216796875, 20.420166015625, 21.11865234375, 21.817138671875, 22.515625]}, "gradients/decoder.roberta.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 7.0, 7.0, 10.0, 22.0, 31.0, 45.0, 59.0, 66.0, 111.0, 143.0, 128.0, 111.0, 85.0, 68.0, 46.0, 22.0, 14.0, 12.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1611328125, -1.12689208984375, -1.0926513671875, -1.05841064453125, -1.024169921875, -0.98992919921875, -0.9556884765625, -0.92144775390625, -0.88720703125, -0.85296630859375, -0.8187255859375, -0.78448486328125, -0.750244140625, -0.71600341796875, -0.6817626953125, -0.64752197265625, -0.61328125, -0.57904052734375, -0.5447998046875, -0.51055908203125, -0.476318359375, -0.44207763671875, -0.4078369140625, -0.37359619140625, -0.33935546875, -0.30511474609375, -0.2708740234375, -0.23663330078125, -0.202392578125, -0.16815185546875, -0.1339111328125, -0.09967041015625, -0.0654296875, -0.03118896484375, 0.0030517578125, 0.03729248046875, 0.071533203125, 0.10577392578125, 0.1400146484375, 0.17425537109375, 0.20849609375, 0.24273681640625, 0.2769775390625, 0.31121826171875, 0.345458984375, 0.37969970703125, 0.4139404296875, 0.44818115234375, 0.482421875, 0.51666259765625, 0.5509033203125, 0.58514404296875, 0.619384765625, 0.65362548828125, 0.6878662109375, 0.72210693359375, 0.75634765625, 0.79058837890625, 0.8248291015625, 0.85906982421875, 0.893310546875, 0.92755126953125, 0.9617919921875, 0.99603271484375, 1.0302734375]}, "gradients/decoder.roberta.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 8.0, 16.0, 46.0, 115.0, 133.0, 171.0, 189.0, 144.0, 97.0, 43.0, 24.0, 17.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.068089008331299, -4.787145137786865, -4.506201267242432, -4.225257873535156, -3.9443140029907227, -3.663370132446289, -3.3824262619018555, -3.101482391357422, -2.8205387592315674, -2.539594888687134, -2.2586512565612793, -1.9777073860168457, -1.6967636346817017, -1.4158198833465576, -1.134876012802124, -0.85393226146698, -0.5729885101318359, -0.2920447289943695, -0.011100947856903076, 0.26984286308288574, 0.5507866144180298, 0.8317303657531738, 1.1126742362976074, 1.3936179876327515, 1.6745617389678955, 1.9555054903030396, 2.2364492416381836, 2.517393112182617, 2.798336982727051, 3.0792806148529053, 3.360224485397339, 3.6411681175231934, 3.9221115112304688, 4.203055381774902, 4.483999252319336, 4.7649431228637695, 5.045886516571045, 5.3268303871154785, 5.607774257659912, 5.888718128204346, 6.169661521911621, 6.450605392456055, 6.731549263000488, 7.012493133544922, 7.293436527252197, 7.574380397796631, 7.8553242683410645, 8.13626766204834, 8.417211532592773, 8.698155403137207, 8.97909927368164, 9.260043144226074, 9.540987014770508, 9.821929931640625, 10.102874755859375, 10.383817672729492, 10.664762496948242, 10.945706367492676, 11.22665023803711, 11.507594108581543, 11.788537979125977, 12.069480895996094, 12.350425720214844, 12.631368637084961, 12.912312507629395]}, "gradients/decoder.roberta.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 2.0, 11.0, 6.0, 8.0, 14.0, 9.0, 18.0, 17.0, 19.0, 26.0, 29.0, 34.0, 47.0, 28.0, 30.0, 35.0, 43.0, 36.0, 49.0, 48.0, 42.0, 42.0, 37.0, 47.0, 44.0, 42.0, 28.0, 34.0, 22.0, 28.0, 22.0, 17.0, 13.0, 17.0, 13.0, 8.0, 5.0, 3.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.3925886154174805, -5.224756717681885, -5.056924819946289, -4.889092922210693, -4.721261024475098, -4.553429126739502, -4.385597229003906, -4.217765808105469, -4.049933433532715, -3.882101535797119, -3.7142696380615234, -3.5464377403259277, -3.378605842590332, -3.2107739448547363, -3.0429422855377197, -2.875110387802124, -2.7072787284851074, -2.5394468307495117, -2.371614933013916, -2.2037830352783203, -2.0359511375427246, -1.8681193590164185, -1.7002875804901123, -1.5324556827545166, -1.364623785018921, -1.1967918872833252, -1.0289599895477295, -0.8611282110214233, -0.6932963132858276, -0.5254644155502319, -0.3576326370239258, -0.18980073928833008, -0.021968364715576172, 0.14586350321769714, 0.31369537115097046, 0.4815272092819214, 0.6493591070175171, 0.8171910047531128, 0.985022783279419, 1.1528546810150146, 1.3206865787506104, 1.488518476486206, 1.6563503742218018, 1.824182152748108, 1.9920140504837036, 2.1598458290100098, 2.3276777267456055, 2.495509624481201, 2.663341522216797, 2.8311734199523926, 2.9990053176879883, 3.166837215423584, 3.3346691131591797, 3.5025010108947754, 3.670332670211792, 3.8381645679473877, 4.0059967041015625, 4.173828601837158, 4.341660499572754, 4.50949239730835, 4.677324295043945, 4.845156192779541, 5.012988090515137, 5.180819511413574, 5.34865140914917]}, "gradients/decoder.roberta.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 4.0, 2.0, 13.0, 7.0, 11.0, 15.0, 35.0, 36.0, 46.0, 67.0, 110.0, 150.0, 206.0, 333.0, 522.0, 875.0, 1735.0, 3771.0, 10663.0, 42588.0, 310096.0, 2217543.0, 1403769.0, 160894.0, 26853.0, 7603.0, 2901.0, 1365.0, 719.0, 469.0, 276.0, 198.0, 142.0, 82.0, 41.0, 42.0, 33.0, 24.0, 14.0, 5.0, 9.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-7.33984375, -7.12921142578125, -6.9185791015625, -6.70794677734375, -6.497314453125, -6.28668212890625, -6.0760498046875, -5.86541748046875, -5.65478515625, -5.44415283203125, -5.2335205078125, -5.02288818359375, -4.812255859375, -4.60162353515625, -4.3909912109375, -4.18035888671875, -3.9697265625, -3.75909423828125, -3.5484619140625, -3.33782958984375, -3.127197265625, -2.91656494140625, -2.7059326171875, -2.49530029296875, -2.28466796875, -2.07403564453125, -1.8634033203125, -1.65277099609375, -1.442138671875, -1.23150634765625, -1.0208740234375, -0.81024169921875, -0.599609375, -0.38897705078125, -0.1783447265625, 0.03228759765625, 0.242919921875, 0.45355224609375, 0.6641845703125, 0.87481689453125, 1.08544921875, 1.29608154296875, 1.5067138671875, 1.71734619140625, 1.927978515625, 2.13861083984375, 2.3492431640625, 2.55987548828125, 2.7705078125, 2.98114013671875, 3.1917724609375, 3.40240478515625, 3.613037109375, 3.82366943359375, 4.0343017578125, 4.24493408203125, 4.45556640625, 4.66619873046875, 4.8768310546875, 5.08746337890625, 5.298095703125, 5.50872802734375, 5.7193603515625, 5.92999267578125, 6.140625]}, "gradients/decoder.roberta.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 9.0, 5.0, 3.0, 7.0, 7.0, 12.0, 18.0, 18.0, 16.0, 19.0, 25.0, 29.0, 31.0, 29.0, 35.0, 40.0, 58.0, 37.0, 38.0, 37.0, 47.0, 37.0, 41.0, 45.0, 44.0, 34.0, 31.0, 35.0, 35.0, 37.0, 17.0, 17.0, 24.0, 14.0, 14.0, 18.0, 10.0, 10.0, 7.0, 2.0, 3.0, 0.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3359375, -3.229583740234375, -3.12322998046875, -3.016876220703125, -2.9105224609375, -2.804168701171875, -2.69781494140625, -2.591461181640625, -2.485107421875, -2.378753662109375, -2.27239990234375, -2.166046142578125, -2.0596923828125, -1.953338623046875, -1.84698486328125, -1.740631103515625, -1.63427734375, -1.527923583984375, -1.42156982421875, -1.315216064453125, -1.2088623046875, -1.102508544921875, -0.99615478515625, -0.889801025390625, -0.783447265625, -0.677093505859375, -0.57073974609375, -0.464385986328125, -0.3580322265625, -0.251678466796875, -0.14532470703125, -0.038970947265625, 0.0673828125, 0.173736572265625, 0.28009033203125, 0.386444091796875, 0.4927978515625, 0.599151611328125, 0.70550537109375, 0.811859130859375, 0.918212890625, 1.024566650390625, 1.13092041015625, 1.237274169921875, 1.3436279296875, 1.449981689453125, 1.55633544921875, 1.662689208984375, 1.76904296875, 1.875396728515625, 1.98175048828125, 2.088104248046875, 2.1944580078125, 2.300811767578125, 2.40716552734375, 2.513519287109375, 2.619873046875, 2.726226806640625, 2.83258056640625, 2.938934326171875, 3.0452880859375, 3.151641845703125, 3.25799560546875, 3.364349365234375, 3.470703125]}, "gradients/decoder.roberta.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 8.0, 16.0, 55.0, 119.0, 404.0, 2145.0, 4187702.0, 3078.0, 490.0, 155.0, 63.0, 27.0, 14.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.0, -77.703125, -74.40625, -71.109375, -67.8125, -64.515625, -61.21875, -57.921875, -54.625, -51.328125, -48.03125, -44.734375, -41.4375, -38.140625, -34.84375, -31.546875, -28.25, -24.953125, -21.65625, -18.359375, -15.0625, -11.765625, -8.46875, -5.171875, -1.875, 1.421875, 4.71875, 8.015625, 11.3125, 14.609375, 17.90625, 21.203125, 24.5, 27.796875, 31.09375, 34.390625, 37.6875, 40.984375, 44.28125, 47.578125, 50.875, 54.171875, 57.46875, 60.765625, 64.0625, 67.359375, 70.65625, 73.953125, 77.25, 80.546875, 83.84375, 87.140625, 90.4375, 93.734375, 97.03125, 100.328125, 103.625, 106.921875, 110.21875, 113.515625, 116.8125, 120.109375, 123.40625, 126.703125, 130.0]}, "gradients/decoder.roberta.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 11.0, 16.0, 41.0, 84.0, 308.0, 923.0, 1584.0, 755.0, 241.0, 84.0, 22.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.65625, -6.48291015625, -6.3095703125, -6.13623046875, -5.962890625, -5.78955078125, -5.6162109375, -5.44287109375, -5.26953125, -5.09619140625, -4.9228515625, -4.74951171875, -4.576171875, -4.40283203125, -4.2294921875, -4.05615234375, -3.8828125, -3.70947265625, -3.5361328125, -3.36279296875, -3.189453125, -3.01611328125, -2.8427734375, -2.66943359375, -2.49609375, -2.32275390625, -2.1494140625, -1.97607421875, -1.802734375, -1.62939453125, -1.4560546875, -1.28271484375, -1.109375, -0.93603515625, -0.7626953125, -0.58935546875, -0.416015625, -0.24267578125, -0.0693359375, 0.10400390625, 0.27734375, 0.45068359375, 0.6240234375, 0.79736328125, 0.970703125, 1.14404296875, 1.3173828125, 1.49072265625, 1.6640625, 1.83740234375, 2.0107421875, 2.18408203125, 2.357421875, 2.53076171875, 2.7041015625, 2.87744140625, 3.05078125, 3.22412109375, 3.3974609375, 3.57080078125, 3.744140625, 3.91748046875, 4.0908203125, 4.26416015625, 4.4375]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 7.0, 14.0, 10.0, 15.0, 14.0, 22.0, 41.0, 47.0, 51.0, 53.0, 63.0, 74.0, 89.0, 78.0, 72.0, 73.0, 55.0, 45.0, 37.0, 38.0, 25.0, 20.0, 23.0, 10.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7228543758392334, -3.6196320056915283, -3.516409397125244, -3.413187026977539, -3.309964656829834, -3.206742286682129, -3.103519916534424, -3.0002973079681396, -2.8970749378204346, -2.7938525676727295, -2.6906299591064453, -2.5874075889587402, -2.484185218811035, -2.38096284866333, -2.277740478515625, -2.174517869949341, -2.0712954998016357, -1.9680731296539307, -1.864850640296936, -1.7616281509399414, -1.6584057807922363, -1.5551834106445312, -1.4519609212875366, -1.348738431930542, -1.245516061782837, -1.1422936916351318, -1.0390712022781372, -0.9358487725257874, -0.8326263427734375, -0.7294039130210876, -0.6261814832687378, -0.5229590535163879, -0.4197366237640381, -0.31651419401168823, -0.21329176425933838, -0.11006933450698853, -0.006846904754638672, 0.09637552499771118, 0.19959795475006104, 0.3028203845024109, 0.40604281425476074, 0.5092652440071106, 0.6124876737594604, 0.7157101035118103, 0.8189325332641602, 0.92215496301651, 1.0253773927688599, 1.1285998821258545, 1.2318222522735596, 1.3350446224212646, 1.4382671117782593, 1.541489601135254, 1.644711971282959, 1.747934341430664, 1.8511568307876587, 1.9543793201446533, 2.0576016902923584, 2.1608240604400635, 2.2640466690063477, 2.3672690391540527, 2.470491409301758, 2.573713779449463, 2.676936149597168, 2.780158758163452, 2.8833811283111572]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 8.0, 8.0, 16.0, 17.0, 22.0, 17.0, 17.0, 32.0, 25.0, 20.0, 40.0, 22.0, 42.0, 39.0, 45.0, 47.0, 46.0, 40.0, 39.0, 41.0, 38.0, 45.0, 39.0, 31.0, 39.0, 21.0, 27.0, 24.0, 21.0, 21.0, 18.0, 14.0, 9.0, 13.0, 9.0, 5.0, 9.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.974435329437256, -3.8541512489318848, -3.7338674068450928, -3.6135833263397217, -3.4932992458343506, -3.3730154037475586, -3.2527313232421875, -3.1324472427368164, -3.0121631622314453, -2.891879081726074, -2.7715952396392822, -2.651311159133911, -2.53102707862854, -2.410743236541748, -2.290459156036377, -2.170175075531006, -2.049891233444214, -1.9296072721481323, -1.8093231916427612, -1.6890392303466797, -1.5687551498413086, -1.448471188545227, -1.3281872272491455, -1.2079031467437744, -1.0876191854476929, -0.9673351645469666, -0.8470511436462402, -0.7267671823501587, -0.6064831614494324, -0.48619914054870605, -0.3659151792526245, -0.2456311583518982, -0.12534737586975098, -0.005063369870185852, 0.11522063612937927, 0.2355046272277832, 0.3557886481285095, 0.47607266902923584, 0.5963566303253174, 0.7166406512260437, 0.83692467212677, 0.9572086930274963, 1.0774927139282227, 1.1977766752243042, 1.3180606365203857, 1.4383447170257568, 1.5586286783218384, 1.67891263961792, 1.799196720123291, 1.9194806814193726, 2.039764642715454, 2.160048723220825, 2.2803328037261963, 2.4006166458129883, 2.5209007263183594, 2.6411848068237305, 2.7614688873291016, 2.8817529678344727, 3.0020368099212646, 3.1223208904266357, 3.242604970932007, 3.362888813018799, 3.48317289352417, 3.603456974029541, 3.723740816116333]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 16.0, 13.0, 16.0, 29.0, 35.0, 49.0, 66.0, 124.0, 159.0, 239.0, 332.0, 497.0, 733.0, 1170.0, 1786.0, 2770.0, 4370.0, 7078.0, 11468.0, 19668.0, 34330.0, 64352.0, 124810.0, 221716.0, 239023.0, 143259.0, 74580.0, 39317.0, 21916.0, 12884.0, 7950.0, 4911.0, 3073.0, 1985.0, 1278.0, 820.0, 548.0, 386.0, 247.0, 162.0, 122.0, 87.0, 59.0, 43.0, 27.0, 12.0, 10.0, 8.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.69970703125, -0.677215576171875, -0.65472412109375, -0.632232666015625, -0.6097412109375, -0.587249755859375, -0.56475830078125, -0.542266845703125, -0.519775390625, -0.497283935546875, -0.47479248046875, -0.452301025390625, -0.4298095703125, -0.407318115234375, -0.38482666015625, -0.362335205078125, -0.33984375, -0.317352294921875, -0.29486083984375, -0.272369384765625, -0.2498779296875, -0.227386474609375, -0.20489501953125, -0.182403564453125, -0.159912109375, -0.137420654296875, -0.11492919921875, -0.092437744140625, -0.0699462890625, -0.047454833984375, -0.02496337890625, -0.002471923828125, 0.02001953125, 0.042510986328125, 0.06500244140625, 0.087493896484375, 0.1099853515625, 0.132476806640625, 0.15496826171875, 0.177459716796875, 0.199951171875, 0.222442626953125, 0.24493408203125, 0.267425537109375, 0.2899169921875, 0.312408447265625, 0.33489990234375, 0.357391357421875, 0.3798828125, 0.402374267578125, 0.42486572265625, 0.447357177734375, 0.4698486328125, 0.492340087890625, 0.51483154296875, 0.537322998046875, 0.559814453125, 0.582305908203125, 0.60479736328125, 0.627288818359375, 0.6497802734375, 0.672271728515625, 0.69476318359375, 0.717254638671875, 0.73974609375]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 8.0, 8.0, 7.0, 17.0, 16.0, 23.0, 17.0, 17.0, 31.0, 27.0, 21.0, 39.0, 21.0, 42.0, 41.0, 41.0, 48.0, 46.0, 42.0, 37.0, 42.0, 38.0, 44.0, 37.0, 33.0, 39.0, 21.0, 27.0, 24.0, 21.0, 22.0, 18.0, 14.0, 9.0, 13.0, 8.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.0, -3.883392333984375, -3.76678466796875, -3.650177001953125, -3.5335693359375, -3.416961669921875, -3.30035400390625, -3.183746337890625, -3.067138671875, -2.950531005859375, -2.83392333984375, -2.717315673828125, -2.6007080078125, -2.484100341796875, -2.36749267578125, -2.250885009765625, -2.13427734375, -2.017669677734375, -1.90106201171875, -1.784454345703125, -1.6678466796875, -1.551239013671875, -1.43463134765625, -1.318023681640625, -1.201416015625, -1.084808349609375, -0.96820068359375, -0.851593017578125, -0.7349853515625, -0.618377685546875, -0.50177001953125, -0.385162353515625, -0.2685546875, -0.151947021484375, -0.03533935546875, 0.081268310546875, 0.1978759765625, 0.314483642578125, 0.43109130859375, 0.547698974609375, 0.664306640625, 0.780914306640625, 0.89752197265625, 1.014129638671875, 1.1307373046875, 1.247344970703125, 1.36395263671875, 1.480560302734375, 1.59716796875, 1.713775634765625, 1.83038330078125, 1.946990966796875, 2.0635986328125, 2.180206298828125, 2.29681396484375, 2.413421630859375, 2.530029296875, 2.646636962890625, 2.76324462890625, 2.879852294921875, 2.9964599609375, 3.113067626953125, 3.22967529296875, 3.346282958984375, 3.462890625]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 9.0, 14.0, 11.0, 26.0, 25.0, 32.0, 35.0, 39.0, 72.0, 100.0, 135.0, 182.0, 246.0, 363.0, 532.0, 892.0, 1548.0, 2985.0, 6998.0, 21077.0, 878028.0, 100954.0, 20197.0, 6955.0, 2892.0, 1466.0, 867.0, 557.0, 383.0, 257.0, 166.0, 146.0, 102.0, 59.0, 41.0, 37.0, 29.0, 27.0, 17.0, 14.0, 10.0, 5.0, 5.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.375, -2.300750732421875, -2.22650146484375, -2.152252197265625, -2.0780029296875, -2.003753662109375, -1.92950439453125, -1.855255126953125, -1.781005859375, -1.706756591796875, -1.63250732421875, -1.558258056640625, -1.4840087890625, -1.409759521484375, -1.33551025390625, -1.261260986328125, -1.18701171875, -1.112762451171875, -1.03851318359375, -0.964263916015625, -0.8900146484375, -0.815765380859375, -0.74151611328125, -0.667266845703125, -0.593017578125, -0.518768310546875, -0.44451904296875, -0.370269775390625, -0.2960205078125, -0.221771240234375, -0.14752197265625, -0.073272705078125, 0.0009765625, 0.075225830078125, 0.14947509765625, 0.223724365234375, 0.2979736328125, 0.372222900390625, 0.44647216796875, 0.520721435546875, 0.594970703125, 0.669219970703125, 0.74346923828125, 0.817718505859375, 0.8919677734375, 0.966217041015625, 1.04046630859375, 1.114715576171875, 1.18896484375, 1.263214111328125, 1.33746337890625, 1.411712646484375, 1.4859619140625, 1.560211181640625, 1.63446044921875, 1.708709716796875, 1.782958984375, 1.857208251953125, 1.93145751953125, 2.005706787109375, 2.0799560546875, 2.154205322265625, 2.22845458984375, 2.302703857421875, 2.376953125]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 4.0, 2.0, 6.0, 12.0, 11.0, 13.0, 17.0, 13.0, 15.0, 25.0, 26.0, 26.0, 27.0, 34.0, 39.0, 34.0, 36.0, 36.0, 40.0, 46.0, 39.0, 47.0, 52.0, 26.0, 31.0, 36.0, 38.0, 21.0, 29.0, 26.0, 17.0, 23.0, 17.0, 16.0, 15.0, 12.0, 19.0, 14.0, 8.0, 7.0, 10.0, 8.0, 4.0, 0.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.212890625, -2.141082763671875, -2.06927490234375, -1.997467041015625, -1.9256591796875, -1.853851318359375, -1.78204345703125, -1.710235595703125, -1.638427734375, -1.566619873046875, -1.49481201171875, -1.423004150390625, -1.3511962890625, -1.279388427734375, -1.20758056640625, -1.135772705078125, -1.06396484375, -0.992156982421875, -0.92034912109375, -0.848541259765625, -0.7767333984375, -0.704925537109375, -0.63311767578125, -0.561309814453125, -0.489501953125, -0.417694091796875, -0.34588623046875, -0.274078369140625, -0.2022705078125, -0.130462646484375, -0.05865478515625, 0.013153076171875, 0.0849609375, 0.156768798828125, 0.22857666015625, 0.300384521484375, 0.3721923828125, 0.444000244140625, 0.51580810546875, 0.587615966796875, 0.659423828125, 0.731231689453125, 0.80303955078125, 0.874847412109375, 0.9466552734375, 1.018463134765625, 1.09027099609375, 1.162078857421875, 1.23388671875, 1.305694580078125, 1.37750244140625, 1.449310302734375, 1.5211181640625, 1.592926025390625, 1.66473388671875, 1.736541748046875, 1.808349609375, 1.880157470703125, 1.95196533203125, 2.023773193359375, 2.0955810546875, 2.167388916015625, 2.23919677734375, 2.311004638671875, 2.3828125]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 4.0, 9.0, 4.0, 10.0, 17.0, 20.0, 21.0, 35.0, 50.0, 102.0, 155.0, 279.0, 556.0, 1139.0, 3707.0, 21225.0, 996969.0, 18480.0, 3366.0, 1235.0, 518.0, 249.0, 136.0, 82.0, 68.0, 33.0, 23.0, 16.0, 13.0, 11.0, 5.0, 2.0, 4.0, 8.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.42595672607421875, -0.4109954833984375, -0.39603424072265625, -0.381072998046875, -0.36611175537109375, -0.3511505126953125, -0.33618927001953125, -0.32122802734375, -0.30626678466796875, -0.2913055419921875, -0.27634429931640625, -0.261383056640625, -0.24642181396484375, -0.2314605712890625, -0.21649932861328125, -0.2015380859375, -0.18657684326171875, -0.1716156005859375, -0.15665435791015625, -0.141693115234375, -0.12673187255859375, -0.1117706298828125, -0.09680938720703125, -0.08184814453125, -0.06688690185546875, -0.0519256591796875, -0.03696441650390625, -0.022003173828125, -0.00704193115234375, 0.0079193115234375, 0.02288055419921875, 0.037841796875, 0.05280303955078125, 0.0677642822265625, 0.08272552490234375, 0.097686767578125, 0.11264801025390625, 0.1276092529296875, 0.14257049560546875, 0.15753173828125, 0.17249298095703125, 0.1874542236328125, 0.20241546630859375, 0.217376708984375, 0.23233795166015625, 0.2472991943359375, 0.26226043701171875, 0.2772216796875, 0.29218292236328125, 0.3071441650390625, 0.32210540771484375, 0.337066650390625, 0.35202789306640625, 0.3669891357421875, 0.38195037841796875, 0.39691162109375, 0.41187286376953125, 0.4268341064453125, 0.44179534912109375, 0.456756591796875, 0.47171783447265625, 0.4866790771484375, 0.5016403198242188, 0.5166015625]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 9.0, 5.0, 5.0, 6.0, 8.0, 18.0, 15.0, 15.0, 20.0, 21.0, 19.0, 29.0, 28.0, 23.0, 56.0, 50.0, 60.0, 44.0, 62.0, 55.0, 57.0, 60.0, 45.0, 31.0, 41.0, 34.0, 36.0, 34.0, 19.0, 19.0, 20.0, 8.0, 13.0, 10.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0384788513183594e-05, -1.9708648324012756e-05, -1.903250813484192e-05, -1.835636794567108e-05, -1.7680227756500244e-05, -1.7004087567329407e-05, -1.632794737815857e-05, -1.5651807188987732e-05, -1.4975666999816895e-05, -1.4299526810646057e-05, -1.362338662147522e-05, -1.2947246432304382e-05, -1.2271106243133545e-05, -1.1594966053962708e-05, -1.091882586479187e-05, -1.0242685675621033e-05, -9.566545486450195e-06, -8.890405297279358e-06, -8.21426510810852e-06, -7.538124918937683e-06, -6.861984729766846e-06, -6.185844540596008e-06, -5.509704351425171e-06, -4.8335641622543335e-06, -4.157423973083496e-06, -3.4812837839126587e-06, -2.8051435947418213e-06, -2.129003405570984e-06, -1.4528632164001465e-06, -7.767230272293091e-07, -1.0058283805847168e-07, 5.755573511123657e-07, 1.2516975402832031e-06, 1.9278377294540405e-06, 2.603977918624878e-06, 3.2801181077957153e-06, 3.956258296966553e-06, 4.63239848613739e-06, 5.3085386753082275e-06, 5.984678864479065e-06, 6.660819053649902e-06, 7.33695924282074e-06, 8.013099431991577e-06, 8.689239621162415e-06, 9.365379810333252e-06, 1.004151999950409e-05, 1.0717660188674927e-05, 1.1393800377845764e-05, 1.2069940567016602e-05, 1.2746080756187439e-05, 1.3422220945358276e-05, 1.4098361134529114e-05, 1.4774501323699951e-05, 1.545064151287079e-05, 1.6126781702041626e-05, 1.6802921891212463e-05, 1.74790620803833e-05, 1.8155202269554138e-05, 1.8831342458724976e-05, 1.9507482647895813e-05, 2.018362283706665e-05, 2.0859763026237488e-05, 2.1535903215408325e-05, 2.2212043404579163e-05, 2.288818359375e-05]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 3.0, 4.0, 2.0, 9.0, 12.0, 14.0, 19.0, 24.0, 41.0, 54.0, 77.0, 160.0, 530.0, 66385.0, 978942.0, 1711.0, 201.0, 102.0, 69.0, 41.0, 37.0, 28.0, 12.0, 11.0, 9.0, 13.0, 6.0, 5.0, 7.0, 1.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.86376953125, -0.8377532958984375, -0.811737060546875, -0.7857208251953125, -0.75970458984375, -0.7336883544921875, -0.707672119140625, -0.6816558837890625, -0.6556396484375, -0.6296234130859375, -0.603607177734375, -0.5775909423828125, -0.55157470703125, -0.5255584716796875, -0.499542236328125, -0.4735260009765625, -0.447509765625, -0.4214935302734375, -0.395477294921875, -0.3694610595703125, -0.34344482421875, -0.3174285888671875, -0.291412353515625, -0.2653961181640625, -0.2393798828125, -0.2133636474609375, -0.187347412109375, -0.1613311767578125, -0.13531494140625, -0.1092987060546875, -0.083282470703125, -0.0572662353515625, -0.03125, -0.0052337646484375, 0.020782470703125, 0.0467987060546875, 0.07281494140625, 0.0988311767578125, 0.124847412109375, 0.1508636474609375, 0.1768798828125, 0.2028961181640625, 0.228912353515625, 0.2549285888671875, 0.28094482421875, 0.3069610595703125, 0.332977294921875, 0.3589935302734375, 0.385009765625, 0.4110260009765625, 0.437042236328125, 0.4630584716796875, 0.48907470703125, 0.5150909423828125, 0.541107177734375, 0.5671234130859375, 0.5931396484375, 0.6191558837890625, 0.645172119140625, 0.6711883544921875, 0.69720458984375, 0.7232208251953125, 0.749237060546875, 0.7752532958984375, 0.80126953125]}, "gradients/decoder.roberta.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 7.0, 8.0, 8.0, 6.0, 16.0, 20.0, 26.0, 34.0, 35.0, 60.0, 131.0, 181.0, 160.0, 99.0, 55.0, 35.0, 18.0, 25.0, 16.0, 11.0, 7.0, 5.0, 7.0, 5.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04022216796875, -0.038915157318115234, -0.03760814666748047, -0.0363011360168457, -0.03499412536621094, -0.03368711471557617, -0.032380104064941406, -0.03107309341430664, -0.029766082763671875, -0.02845907211303711, -0.027152061462402344, -0.025845050811767578, -0.024538040161132812, -0.023231029510498047, -0.02192401885986328, -0.020617008209228516, -0.01930999755859375, -0.018002986907958984, -0.01669597625732422, -0.015388965606689453, -0.014081954956054688, -0.012774944305419922, -0.011467933654785156, -0.01016092300415039, -0.008853912353515625, -0.007546901702880859, -0.006239891052246094, -0.004932880401611328, -0.0036258697509765625, -0.002318859100341797, -0.0010118484497070312, 0.0002951622009277344, 0.0016021728515625, 0.0029091835021972656, 0.004216194152832031, 0.005523204803466797, 0.0068302154541015625, 0.008137226104736328, 0.009444236755371094, 0.01075124740600586, 0.012058258056640625, 0.01336526870727539, 0.014672279357910156, 0.015979290008544922, 0.017286300659179688, 0.018593311309814453, 0.01990032196044922, 0.021207332611083984, 0.02251434326171875, 0.023821353912353516, 0.02512836456298828, 0.026435375213623047, 0.027742385864257812, 0.029049396514892578, 0.030356407165527344, 0.03166341781616211, 0.032970428466796875, 0.03427743911743164, 0.035584449768066406, 0.03689146041870117, 0.03819847106933594, 0.0395054817199707, 0.04081249237060547, 0.042119503021240234, 0.043426513671875]}, "gradients/decoder.roberta.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 13.0, 17.0, 37.0, 51.0, 94.0, 110.0, 136.0, 144.0, 138.0, 87.0, 66.0, 53.0, 28.0, 13.0, 10.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6350257396698, -3.446544647216797, -3.258063793182373, -3.06958270072937, -2.881101608276367, -2.6926207542419434, -2.5041396617889404, -2.3156585693359375, -2.1271777153015137, -1.9386967420578003, -1.7502156496047974, -1.561734676361084, -1.373253583908081, -1.1847726106643677, -0.9962916374206543, -0.8078105449676514, -0.6193294525146484, -0.4308484196662903, -0.24236741662025452, -0.05388641357421875, 0.1345946192741394, 0.32307565212249756, 0.5115566253662109, 0.7000377178192139, 0.8885186910629272, 1.0769996643066406, 1.2654807567596436, 1.453961730003357, 1.6424427032470703, 1.8309237957000732, 2.019404888153076, 2.2078857421875, 2.396366596221924, 2.5848476886749268, 2.7733285427093506, 2.9618096351623535, 3.1502907276153564, 3.3387718200683594, 3.527252674102783, 3.715733766555786, 3.904214859008789, 4.092695713043213, 4.281177043914795, 4.469657897949219, 4.658138751983643, 4.846620082855225, 5.035100936889648, 5.2235822677612305, 5.412062644958496, 5.60054349899292, 5.789024829864502, 5.977505683898926, 6.16598653793335, 6.354467868804932, 6.5429487228393555, 6.7314300537109375, 6.919910907745361, 7.108391761779785, 7.296873092651367, 7.485353946685791, 7.673834800720215, 7.862316131591797, 8.050796508789062, 8.239277839660645, 8.427759170532227]}, "gradients/decoder.roberta.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 9.0, 7.0, 7.0, 17.0, 13.0, 24.0, 19.0, 16.0, 32.0, 25.0, 22.0, 37.0, 24.0, 40.0, 41.0, 43.0, 46.0, 48.0, 39.0, 40.0, 39.0, 39.0, 43.0, 39.0, 31.0, 37.0, 26.0, 27.0, 24.0, 21.0, 22.0, 18.0, 13.0, 10.0, 13.0, 8.0, 6.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.005408763885498, -3.8887624740600586, -3.77211594581604, -3.6554696559906006, -3.538823366165161, -3.4221768379211426, -3.305530548095703, -3.1888842582702637, -3.072237968444824, -2.9555916786193848, -2.838945150375366, -2.7222988605499268, -2.6056525707244873, -2.4890060424804688, -2.3723597526550293, -2.25571346282959, -2.1390671730041504, -2.022420883178711, -1.905774474143982, -1.789128065109253, -1.6724817752838135, -1.5558353662490845, -1.4391889572143555, -1.322542667388916, -1.2058961391448975, -1.0892497301101685, -0.972603440284729, -0.85595703125, -0.7393107414245605, -0.6226643323898315, -0.5060179829597473, -0.3893716335296631, -0.27272534370422363, -0.1560789942741394, -0.03943262994289398, 0.07721373438835144, 0.19386008381843567, 0.3105064630508423, 0.4271528124809265, 0.5437991619110107, 0.660445511341095, 0.7770918607711792, 0.8937382102012634, 1.0103845596313477, 1.1270309686660767, 1.2436773777008057, 1.3603236675262451, 1.4769699573516846, 1.5936163663864136, 1.7102627754211426, 1.826909065246582, 1.943555474281311, 2.06020188331604, 2.1768481731414795, 2.293494462966919, 2.4101409912109375, 2.526787281036377, 2.6434335708618164, 2.760080099105835, 2.8767263889312744, 2.993372678756714, 3.1100192070007324, 3.226665496826172, 3.3433117866516113, 3.459958076477051]}, "gradients/decoder.roberta.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 6.0, 12.0, 19.0, 15.0, 19.0, 35.0, 29.0, 52.0, 84.0, 78.0, 119.0, 157.0, 263.0, 454.0, 754.0, 1551.0, 3039.0, 6621.0, 14584.0, 34298.0, 81176.0, 179950.0, 295302.0, 231940.0, 111899.0, 47924.0, 20513.0, 8903.0, 4150.0, 1911.0, 1042.0, 574.0, 303.0, 204.0, 142.0, 112.0, 76.0, 50.0, 37.0, 33.0, 27.0, 21.0, 13.0, 18.0, 10.0, 5.0, 5.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0], "bins": [-3.861328125, -3.74322509765625, -3.6251220703125, -3.50701904296875, -3.388916015625, -3.27081298828125, -3.1527099609375, -3.03460693359375, -2.91650390625, -2.79840087890625, -2.6802978515625, -2.56219482421875, -2.444091796875, -2.32598876953125, -2.2078857421875, -2.08978271484375, -1.9716796875, -1.85357666015625, -1.7354736328125, -1.61737060546875, -1.499267578125, -1.38116455078125, -1.2630615234375, -1.14495849609375, -1.02685546875, -0.90875244140625, -0.7906494140625, -0.67254638671875, -0.554443359375, -0.43634033203125, -0.3182373046875, -0.20013427734375, -0.08203125, 0.03607177734375, 0.1541748046875, 0.27227783203125, 0.390380859375, 0.50848388671875, 0.6265869140625, 0.74468994140625, 0.86279296875, 0.98089599609375, 1.0989990234375, 1.21710205078125, 1.335205078125, 1.45330810546875, 1.5714111328125, 1.68951416015625, 1.8076171875, 1.92572021484375, 2.0438232421875, 2.16192626953125, 2.280029296875, 2.39813232421875, 2.5162353515625, 2.63433837890625, 2.75244140625, 2.87054443359375, 2.9886474609375, 3.10675048828125, 3.224853515625, 3.34295654296875, 3.4610595703125, 3.57916259765625, 3.697265625]}, "gradients/decoder.roberta.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 7.0, 10.0, 7.0, 11.0, 8.0, 20.0, 24.0, 19.0, 17.0, 25.0, 28.0, 23.0, 33.0, 25.0, 44.0, 44.0, 44.0, 38.0, 44.0, 48.0, 39.0, 37.0, 45.0, 30.0, 46.0, 45.0, 30.0, 29.0, 24.0, 21.0, 26.0, 14.0, 19.0, 13.0, 9.0, 13.0, 10.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.876953125, -3.760589599609375, -3.64422607421875, -3.527862548828125, -3.4114990234375, -3.295135498046875, -3.17877197265625, -3.062408447265625, -2.946044921875, -2.829681396484375, -2.71331787109375, -2.596954345703125, -2.4805908203125, -2.364227294921875, -2.24786376953125, -2.131500244140625, -2.01513671875, -1.898773193359375, -1.78240966796875, -1.666046142578125, -1.5496826171875, -1.433319091796875, -1.31695556640625, -1.200592041015625, -1.084228515625, -0.967864990234375, -0.85150146484375, -0.735137939453125, -0.6187744140625, -0.502410888671875, -0.38604736328125, -0.269683837890625, -0.1533203125, -0.036956787109375, 0.07940673828125, 0.195770263671875, 0.3121337890625, 0.428497314453125, 0.54486083984375, 0.661224365234375, 0.777587890625, 0.893951416015625, 1.01031494140625, 1.126678466796875, 1.2430419921875, 1.359405517578125, 1.47576904296875, 1.592132568359375, 1.70849609375, 1.824859619140625, 1.94122314453125, 2.057586669921875, 2.1739501953125, 2.290313720703125, 2.40667724609375, 2.523040771484375, 2.639404296875, 2.755767822265625, 2.87213134765625, 2.988494873046875, 3.1048583984375, 3.221221923828125, 3.33758544921875, 3.453948974609375, 3.5703125]}, "gradients/decoder.roberta.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 5.0, 4.0, 9.0, 7.0, 12.0, 13.0, 10.0, 15.0, 25.0, 26.0, 30.0, 37.0, 22.0, 30.0, 47.0, 49.0, 74.0, 163.0, 888.0, 1045843.0, 671.0, 135.0, 57.0, 52.0, 45.0, 45.0, 28.0, 28.0, 29.0, 24.0, 20.0, 22.0, 15.0, 12.0, 10.0, 10.0, 12.0, 9.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.1875, -107.537109375, -103.88671875, -100.236328125, -96.5859375, -92.935546875, -89.28515625, -85.634765625, -81.984375, -78.333984375, -74.68359375, -71.033203125, -67.3828125, -63.732421875, -60.08203125, -56.431640625, -52.78125, -49.130859375, -45.48046875, -41.830078125, -38.1796875, -34.529296875, -30.87890625, -27.228515625, -23.578125, -19.927734375, -16.27734375, -12.626953125, -8.9765625, -5.326171875, -1.67578125, 1.974609375, 5.625, 9.275390625, 12.92578125, 16.576171875, 20.2265625, 23.876953125, 27.52734375, 31.177734375, 34.828125, 38.478515625, 42.12890625, 45.779296875, 49.4296875, 53.080078125, 56.73046875, 60.380859375, 64.03125, 67.681640625, 71.33203125, 74.982421875, 78.6328125, 82.283203125, 85.93359375, 89.583984375, 93.234375, 96.884765625, 100.53515625, 104.185546875, 107.8359375, 111.486328125, 115.13671875, 118.787109375, 122.4375]}, "gradients/decoder.roberta.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 3.0, 7.0, 8.0, 10.0, 11.0, 11.0, 12.0, 13.0, 18.0, 21.0, 24.0, 29.0, 33.0, 33.0, 41.0, 34.0, 40.0, 27.0, 42.0, 45.0, 39.0, 38.0, 41.0, 51.0, 41.0, 44.0, 35.0, 33.0, 21.0, 29.0, 26.0, 36.0, 18.0, 10.0, 15.0, 13.0, 11.0, 8.0, 4.0, 7.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.23828125, -4.11309814453125, -3.9879150390625, -3.86273193359375, -3.737548828125, -3.61236572265625, -3.4871826171875, -3.36199951171875, -3.23681640625, -3.11163330078125, -2.9864501953125, -2.86126708984375, -2.736083984375, -2.61090087890625, -2.4857177734375, -2.36053466796875, -2.2353515625, -2.11016845703125, -1.9849853515625, -1.85980224609375, -1.734619140625, -1.60943603515625, -1.4842529296875, -1.35906982421875, -1.23388671875, -1.10870361328125, -0.9835205078125, -0.85833740234375, -0.733154296875, -0.60797119140625, -0.4827880859375, -0.35760498046875, -0.232421875, -0.10723876953125, 0.0179443359375, 0.14312744140625, 0.268310546875, 0.39349365234375, 0.5186767578125, 0.64385986328125, 0.76904296875, 0.89422607421875, 1.0194091796875, 1.14459228515625, 1.269775390625, 1.39495849609375, 1.5201416015625, 1.64532470703125, 1.7705078125, 1.89569091796875, 2.0208740234375, 2.14605712890625, 2.271240234375, 2.39642333984375, 2.5216064453125, 2.64678955078125, 2.77197265625, 2.89715576171875, 3.0223388671875, 3.14752197265625, 3.272705078125, 3.39788818359375, 3.5230712890625, 3.64825439453125, 3.7734375]}, "gradients/decoder.roberta.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 10.0, 14.0, 21.0, 29.0, 83.0, 157.0, 584.0, 3017.0, 448524.0, 591792.0, 3382.0, 598.0, 177.0, 65.0, 29.0, 33.0, 14.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.640380859375, -9.29638671875, -8.952392578125, -8.6083984375, -8.264404296875, -7.92041015625, -7.576416015625, -7.232421875, -6.888427734375, -6.54443359375, -6.200439453125, -5.8564453125, -5.512451171875, -5.16845703125, -4.824462890625, -4.48046875, -4.136474609375, -3.79248046875, -3.448486328125, -3.1044921875, -2.760498046875, -2.41650390625, -2.072509765625, -1.728515625, -1.384521484375, -1.04052734375, -0.696533203125, -0.3525390625, -0.008544921875, 0.33544921875, 0.679443359375, 1.0234375, 1.367431640625, 1.71142578125, 2.055419921875, 2.3994140625, 2.743408203125, 3.08740234375, 3.431396484375, 3.775390625, 4.119384765625, 4.46337890625, 4.807373046875, 5.1513671875, 5.495361328125, 5.83935546875, 6.183349609375, 6.52734375, 6.871337890625, 7.21533203125, 7.559326171875, 7.9033203125, 8.247314453125, 8.59130859375, 8.935302734375, 9.279296875, 9.623291015625, 9.96728515625, 10.311279296875, 10.6552734375, 10.999267578125, 11.34326171875, 11.687255859375, 12.03125]}, "gradients/decoder.roberta.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 10.0, 9.0, 12.0, 19.0, 27.0, 36.0, 77.0, 68.0, 83.0, 143.0, 132.0, 112.0, 83.0, 54.0, 46.0, 34.0, 19.0, 16.0, 7.0, 3.0, 6.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00046133995056152344, -0.0004506688565015793, -0.00043999776244163513, -0.000429326668381691, -0.0004186555743217468, -0.0004079844802618027, -0.0003973133862018585, -0.00038664229214191437, -0.0003759711980819702, -0.00036530010402202606, -0.0003546290099620819, -0.00034395791590213776, -0.0003332868218421936, -0.00032261572778224945, -0.0003119446337223053, -0.00030127353966236115, -0.000290602445602417, -0.00027993135154247284, -0.0002692602574825287, -0.00025858916342258453, -0.0002479180693626404, -0.00023724697530269623, -0.00022657588124275208, -0.00021590478718280792, -0.00020523369312286377, -0.00019456259906291962, -0.00018389150500297546, -0.0001732204109430313, -0.00016254931688308716, -0.000151878222823143, -0.00014120712876319885, -0.0001305360347032547, -0.00011986494064331055, -0.0001091938465833664, -9.852275252342224e-05, -8.785165846347809e-05, -7.718056440353394e-05, -6.650947034358978e-05, -5.583837628364563e-05, -4.516728222370148e-05, -3.4496188163757324e-05, -2.382509410381317e-05, -1.3154000043869019e-05, -2.4829059839248657e-06, 8.188188076019287e-06, 1.885928213596344e-05, 2.9530376195907593e-05, 4.0201470255851746e-05, 5.08725643157959e-05, 6.154365837574005e-05, 7.22147524356842e-05, 8.288584649562836e-05, 9.355694055557251e-05, 0.00010422803461551666, 0.00011489912867546082, 0.00012557022273540497, 0.00013624131679534912, 0.00014691241085529327, 0.00015758350491523743, 0.00016825459897518158, 0.00017892569303512573, 0.00018959678709506989, 0.00020026788115501404, 0.0002109389752149582, 0.00022161006927490234]}, "gradients/decoder.roberta.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 9.0, 8.0, 14.0, 26.0, 48.0, 71.0, 137.0, 330.0, 3948.0, 1040146.0, 3195.0, 330.0, 121.0, 72.0, 38.0, 26.0, 11.0, 11.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.53125, -24.790771484375, -24.05029296875, -23.309814453125, -22.5693359375, -21.828857421875, -21.08837890625, -20.347900390625, -19.607421875, -18.866943359375, -18.12646484375, -17.385986328125, -16.6455078125, -15.905029296875, -15.16455078125, -14.424072265625, -13.68359375, -12.943115234375, -12.20263671875, -11.462158203125, -10.7216796875, -9.981201171875, -9.24072265625, -8.500244140625, -7.759765625, -7.019287109375, -6.27880859375, -5.538330078125, -4.7978515625, -4.057373046875, -3.31689453125, -2.576416015625, -1.8359375, -1.095458984375, -0.35498046875, 0.385498046875, 1.1259765625, 1.866455078125, 2.60693359375, 3.347412109375, 4.087890625, 4.828369140625, 5.56884765625, 6.309326171875, 7.0498046875, 7.790283203125, 8.53076171875, 9.271240234375, 10.01171875, 10.752197265625, 11.49267578125, 12.233154296875, 12.9736328125, 13.714111328125, 14.45458984375, 15.195068359375, 15.935546875, 16.676025390625, 17.41650390625, 18.156982421875, 18.8974609375, 19.637939453125, 20.37841796875, 21.118896484375, 21.859375]}, "gradients/decoder.roberta.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 11.0, 9.0, 19.0, 20.0, 59.0, 66.0, 97.0, 117.0, 158.0, 145.0, 93.0, 82.0, 45.0, 26.0, 25.0, 12.0, 9.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.034027099609375, -0.99774169921875, -0.961456298828125, -0.9251708984375, -0.888885498046875, -0.85260009765625, -0.816314697265625, -0.780029296875, -0.743743896484375, -0.70745849609375, -0.671173095703125, -0.6348876953125, -0.598602294921875, -0.56231689453125, -0.526031494140625, -0.48974609375, -0.453460693359375, -0.41717529296875, -0.380889892578125, -0.3446044921875, -0.308319091796875, -0.27203369140625, -0.235748291015625, -0.199462890625, -0.163177490234375, -0.12689208984375, -0.090606689453125, -0.0543212890625, -0.018035888671875, 0.01824951171875, 0.054534912109375, 0.0908203125, 0.127105712890625, 0.16339111328125, 0.199676513671875, 0.2359619140625, 0.272247314453125, 0.30853271484375, 0.344818115234375, 0.381103515625, 0.417388916015625, 0.45367431640625, 0.489959716796875, 0.5262451171875, 0.562530517578125, 0.59881591796875, 0.635101318359375, 0.67138671875, 0.707672119140625, 0.74395751953125, 0.780242919921875, 0.8165283203125, 0.852813720703125, 0.88909912109375, 0.925384521484375, 0.961669921875, 0.997955322265625, 1.03424072265625, 1.070526123046875, 1.1068115234375, 1.143096923828125, 1.17938232421875, 1.215667724609375, 1.251953125]}, "gradients/decoder.roberta.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 11.0, 27.0, 45.0, 72.0, 101.0, 158.0, 153.0, 122.0, 110.0, 73.0, 46.0, 42.0, 24.0, 10.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.56854248046875, -5.359595775604248, -5.150648593902588, -4.941701889038086, -4.732754707336426, -4.523808002471924, -4.314861297607422, -4.105914115905762, -3.8969674110412598, -3.6880204677581787, -3.4790735244750977, -3.2701268196105957, -3.0611798763275146, -2.8522329330444336, -2.6432862281799316, -2.4343392848968506, -2.2253923416137695, -2.0164453983306885, -1.807498574256897, -1.5985517501831055, -1.3896048069000244, -1.1806578636169434, -0.9717110395431519, -0.7627642154693604, -0.5538172721862793, -0.344870388507843, -0.13592350482940674, 0.07302337884902954, 0.2819702625274658, 0.4909172058105469, 0.6998640298843384, 0.9088108539581299, 1.1177582740783691, 1.3267052173614502, 1.5356520414352417, 1.7445988655090332, 1.9535458087921143, 2.1624927520751953, 2.3714394569396973, 2.5803864002227783, 2.7893333435058594, 2.9982802867889404, 3.2072272300720215, 3.4161739349365234, 3.6251208782196045, 3.8340678215026855, 4.0430145263671875, 4.251961708068848, 4.46090841293335, 4.669855117797852, 4.878802299499512, 5.087749004364014, 5.296695709228516, 5.505642890930176, 5.714589595794678, 5.92353630065918, 6.13248348236084, 6.341430187225342, 6.550377368927002, 6.759324073791504, 6.968271255493164, 7.177217960357666, 7.386164665222168, 7.595111846923828, 7.80405855178833]}, "gradients/decoder.roberta.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 9.0, 6.0, 6.0, 8.0, 11.0, 11.0, 14.0, 16.0, 24.0, 12.0, 24.0, 17.0, 29.0, 27.0, 28.0, 31.0, 34.0, 32.0, 29.0, 50.0, 44.0, 30.0, 37.0, 42.0, 38.0, 36.0, 39.0, 29.0, 31.0, 33.0, 29.0, 27.0, 33.0, 28.0, 12.0, 18.0, 13.0, 15.0, 13.0, 6.0, 7.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0], "bins": [-4.660089492797852, -4.515333652496338, -4.370577812194824, -4.2258219718933105, -4.081066131591797, -3.936310052871704, -3.7915539741516113, -3.6467981338500977, -3.502042293548584, -3.3572864532470703, -3.2125306129455566, -3.067774534225464, -2.92301869392395, -2.7782628536224365, -2.6335067749023438, -2.48875093460083, -2.3439950942993164, -2.1992392539978027, -2.054483413696289, -1.9097273349761963, -1.7649714946746826, -1.620215654373169, -1.4754596948623657, -1.3307037353515625, -1.1859478950500488, -1.0411920547485352, -0.8964360952377319, -0.7516801953315735, -0.606924295425415, -0.4621683955192566, -0.31741249561309814, -0.17265653610229492, -0.027900218963623047, 0.1168556809425354, 0.26161158084869385, 0.4063674807548523, 0.5511233806610107, 0.6958792805671692, 0.8406351804733276, 0.9853911399841309, 1.1301469802856445, 1.2749028205871582, 1.4196587800979614, 1.5644147396087646, 1.7091705799102783, 1.853926420211792, 1.9986823797225952, 2.1434383392333984, 2.288194179534912, 2.432950019836426, 2.5777058601379395, 2.7224619388580322, 2.867217779159546, 3.0119736194610596, 3.1567296981811523, 3.301485538482666, 3.4462413787841797, 3.5909972190856934, 3.735753059387207, 3.8805091381073, 4.025264739990234, 4.170021057128906, 4.31477689743042, 4.459532737731934, 4.604288578033447]}, "gradients/decoder.roberta.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 6.0, 4.0, 6.0, 6.0, 5.0, 10.0, 7.0, 24.0, 18.0, 21.0, 39.0, 67.0, 64.0, 68.0, 80.0, 130.0, 188.0, 231.0, 384.0, 545.0, 809.0, 1698.0, 4070.0, 15065.0, 102259.0, 1184594.0, 2487768.0, 346992.0, 35888.0, 7390.0, 2480.0, 1129.0, 678.0, 417.0, 284.0, 199.0, 158.0, 127.0, 83.0, 62.0, 51.0, 36.0, 34.0, 27.0, 25.0, 18.0, 4.0, 11.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.77734375, -6.55328369140625, -6.3292236328125, -6.10516357421875, -5.881103515625, -5.65704345703125, -5.4329833984375, -5.20892333984375, -4.98486328125, -4.76080322265625, -4.5367431640625, -4.31268310546875, -4.088623046875, -3.86456298828125, -3.6405029296875, -3.41644287109375, -3.1923828125, -2.96832275390625, -2.7442626953125, -2.52020263671875, -2.296142578125, -2.07208251953125, -1.8480224609375, -1.62396240234375, -1.39990234375, -1.17584228515625, -0.9517822265625, -0.72772216796875, -0.503662109375, -0.27960205078125, -0.0555419921875, 0.16851806640625, 0.392578125, 0.61663818359375, 0.8406982421875, 1.06475830078125, 1.288818359375, 1.51287841796875, 1.7369384765625, 1.96099853515625, 2.18505859375, 2.40911865234375, 2.6331787109375, 2.85723876953125, 3.081298828125, 3.30535888671875, 3.5294189453125, 3.75347900390625, 3.9775390625, 4.20159912109375, 4.4256591796875, 4.64971923828125, 4.873779296875, 5.09783935546875, 5.3218994140625, 5.54595947265625, 5.77001953125, 5.99407958984375, 6.2181396484375, 6.44219970703125, 6.666259765625, 6.89031982421875, 7.1143798828125, 7.33843994140625, 7.5625]}, "gradients/decoder.roberta.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 2.0, 8.0, 10.0, 7.0, 15.0, 11.0, 14.0, 20.0, 23.0, 28.0, 26.0, 25.0, 22.0, 26.0, 22.0, 43.0, 42.0, 34.0, 47.0, 40.0, 33.0, 34.0, 45.0, 39.0, 39.0, 43.0, 26.0, 40.0, 34.0, 27.0, 24.0, 25.0, 17.0, 15.0, 13.0, 21.0, 11.0, 8.0, 6.0, 6.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.216796875, -3.12054443359375, -3.0242919921875, -2.92803955078125, -2.831787109375, -2.73553466796875, -2.6392822265625, -2.54302978515625, -2.44677734375, -2.35052490234375, -2.2542724609375, -2.15802001953125, -2.061767578125, -1.96551513671875, -1.8692626953125, -1.77301025390625, -1.6767578125, -1.58050537109375, -1.4842529296875, -1.38800048828125, -1.291748046875, -1.19549560546875, -1.0992431640625, -1.00299072265625, -0.90673828125, -0.81048583984375, -0.7142333984375, -0.61798095703125, -0.521728515625, -0.42547607421875, -0.3292236328125, -0.23297119140625, -0.13671875, -0.04046630859375, 0.0557861328125, 0.15203857421875, 0.248291015625, 0.34454345703125, 0.4407958984375, 0.53704833984375, 0.63330078125, 0.72955322265625, 0.8258056640625, 0.92205810546875, 1.018310546875, 1.11456298828125, 1.2108154296875, 1.30706787109375, 1.4033203125, 1.49957275390625, 1.5958251953125, 1.69207763671875, 1.788330078125, 1.88458251953125, 1.9808349609375, 2.07708740234375, 2.17333984375, 2.26959228515625, 2.3658447265625, 2.46209716796875, 2.558349609375, 2.65460205078125, 2.7508544921875, 2.84710693359375, 2.943359375]}, "gradients/decoder.roberta.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 12.0, 12.0, 16.0, 22.0, 37.0, 53.0, 67.0, 82.0, 130.0, 202.0, 290.0, 573.0, 1083.0, 8370.0, 4081749.0, 97833.0, 1835.0, 688.0, 392.0, 258.0, 161.0, 115.0, 74.0, 63.0, 39.0, 33.0, 20.0, 17.0, 13.0, 11.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.0, -33.99169921875, -32.9833984375, -31.97509765625, -30.966796875, -29.95849609375, -28.9501953125, -27.94189453125, -26.93359375, -25.92529296875, -24.9169921875, -23.90869140625, -22.900390625, -21.89208984375, -20.8837890625, -19.87548828125, -18.8671875, -17.85888671875, -16.8505859375, -15.84228515625, -14.833984375, -13.82568359375, -12.8173828125, -11.80908203125, -10.80078125, -9.79248046875, -8.7841796875, -7.77587890625, -6.767578125, -5.75927734375, -4.7509765625, -3.74267578125, -2.734375, -1.72607421875, -0.7177734375, 0.29052734375, 1.298828125, 2.30712890625, 3.3154296875, 4.32373046875, 5.33203125, 6.34033203125, 7.3486328125, 8.35693359375, 9.365234375, 10.37353515625, 11.3818359375, 12.39013671875, 13.3984375, 14.40673828125, 15.4150390625, 16.42333984375, 17.431640625, 18.43994140625, 19.4482421875, 20.45654296875, 21.46484375, 22.47314453125, 23.4814453125, 24.48974609375, 25.498046875, 26.50634765625, 27.5146484375, 28.52294921875, 29.53125]}, "gradients/decoder.roberta.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 8.0, 12.0, 21.0, 37.0, 35.0, 57.0, 81.0, 100.0, 186.0, 243.0, 401.0, 542.0, 618.0, 577.0, 363.0, 233.0, 173.0, 109.0, 91.0, 52.0, 33.0, 23.0, 16.0, 16.0, 8.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6513671875, -1.5933685302734375, -1.535369873046875, -1.4773712158203125, -1.41937255859375, -1.3613739013671875, -1.303375244140625, -1.2453765869140625, -1.1873779296875, -1.1293792724609375, -1.071380615234375, -1.0133819580078125, -0.95538330078125, -0.8973846435546875, -0.839385986328125, -0.7813873291015625, -0.723388671875, -0.6653900146484375, -0.607391357421875, -0.5493927001953125, -0.49139404296875, -0.4333953857421875, -0.375396728515625, -0.3173980712890625, -0.2593994140625, -0.2014007568359375, -0.143402099609375, -0.0854034423828125, -0.02740478515625, 0.0305938720703125, 0.088592529296875, 0.1465911865234375, 0.20458984375, 0.2625885009765625, 0.320587158203125, 0.3785858154296875, 0.43658447265625, 0.4945831298828125, 0.552581787109375, 0.6105804443359375, 0.6685791015625, 0.7265777587890625, 0.784576416015625, 0.8425750732421875, 0.90057373046875, 0.9585723876953125, 1.016571044921875, 1.0745697021484375, 1.132568359375, 1.1905670166015625, 1.248565673828125, 1.3065643310546875, 1.36456298828125, 1.4225616455078125, 1.480560302734375, 1.5385589599609375, 1.5965576171875, 1.6545562744140625, 1.712554931640625, 1.7705535888671875, 1.82855224609375, 1.8865509033203125, 1.944549560546875, 2.0025482177734375, 2.060546875]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 11.0, 9.0, 14.0, 14.0, 43.0, 45.0, 47.0, 68.0, 77.0, 86.0, 101.0, 78.0, 74.0, 54.0, 62.0, 53.0, 66.0, 34.0, 25.0, 15.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1411185264587402, -3.0206995010375977, -2.900280475616455, -2.7798614501953125, -2.65944242477417, -2.5390233993530273, -2.4186043739318848, -2.298185348510742, -2.1777663230895996, -2.057347297668457, -1.9369282722473145, -1.8165092468261719, -1.6960902214050293, -1.5756711959838867, -1.4552520513534546, -1.334833025932312, -1.2144138813018799, -1.0939948558807373, -0.9735758304595947, -0.8531567454338074, -0.7327377200126648, -0.6123186945915222, -0.49189960956573486, -0.3714805841445923, -0.2510615587234497, -0.13064251840114594, -0.010223478078842163, 0.1101955771446228, 0.23061460256576538, 0.35103362798690796, 0.4714527130126953, 0.5918717384338379, 0.7122907638549805, 0.832709789276123, 0.9531288146972656, 1.0735478401184082, 1.1939668655395508, 1.3143858909606934, 1.4348050355911255, 1.555224061012268, 1.6756430864334106, 1.7960621118545532, 1.9164811372756958, 2.036900281906128, 2.1573193073272705, 2.277738332748413, 2.3981573581695557, 2.5185763835906982, 2.638995409011841, 2.7594144344329834, 2.879833459854126, 3.0002524852752686, 3.120671510696411, 3.2410905361175537, 3.3615097999572754, 3.481928825378418, 3.6023478507995605, 3.722766876220703, 3.8431859016418457, 3.9636049270629883, 4.084023952484131, 4.204442977905273, 4.324862003326416, 4.445281028747559, 4.565700054168701]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 6.0, 6.0, 7.0, 8.0, 6.0, 10.0, 16.0, 26.0, 13.0, 23.0, 24.0, 26.0, 28.0, 25.0, 30.0, 33.0, 36.0, 49.0, 37.0, 35.0, 44.0, 45.0, 42.0, 30.0, 36.0, 30.0, 41.0, 25.0, 30.0, 26.0, 32.0, 26.0, 17.0, 19.0, 17.0, 16.0, 11.0, 13.0, 8.0, 10.0, 5.0, 6.0, 6.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-3.7054176330566406, -3.5996406078338623, -3.493863344192505, -3.3880863189697266, -3.2823092937469482, -3.17653226852417, -3.0707550048828125, -2.964977979660034, -2.859200954437256, -2.7534239292144775, -2.64764666557312, -2.541869640350342, -2.4360926151275635, -2.330315589904785, -2.2245383262634277, -2.1187613010406494, -2.012984037399292, -1.9072068929672241, -1.8014298677444458, -1.695652723312378, -1.5898756980895996, -1.4840985536575317, -1.3783214092254639, -1.2725443840026855, -1.1667672395706177, -1.0609900951385498, -0.9552130699157715, -0.8494359254837036, -0.7436588406562805, -0.6378817558288574, -0.5321046113967896, -0.42632752656936646, -0.32055020332336426, -0.21477310359477997, -0.10899600386619568, -0.0032188892364501953, 0.1025581955909729, 0.208335280418396, 0.31411242485046387, 0.41988950967788696, 0.5256665945053101, 0.6314436793327332, 0.7372207641601562, 0.8429979085922241, 0.9487749934196472, 1.0545520782470703, 1.1603292226791382, 1.266106367111206, 1.3718833923339844, 1.4776605367660522, 1.5834375619888306, 1.6892147064208984, 1.7949917316436768, 1.9007688760757446, 2.0065460205078125, 2.112323045730591, 2.218100070953369, 2.3238770961761475, 2.429654359817505, 2.535431385040283, 2.6412084102630615, 2.74698543548584, 2.8527626991271973, 2.9585397243499756, 3.064316987991333]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 12.0, 18.0, 22.0, 27.0, 27.0, 61.0, 67.0, 101.0, 128.0, 149.0, 262.0, 357.0, 525.0, 710.0, 1033.0, 1494.0, 2282.0, 3272.0, 4962.0, 7549.0, 11536.0, 18199.0, 30582.0, 50825.0, 88943.0, 157095.0, 226166.0, 181825.0, 105006.0, 59800.0, 35253.0, 21224.0, 13346.0, 8454.0, 5540.0, 3593.0, 2399.0, 1726.0, 1200.0, 825.0, 586.0, 391.0, 269.0, 216.0, 152.0, 108.0, 75.0, 56.0, 31.0, 27.0, 20.0, 12.0, 11.0, 6.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.60498046875, -0.5864486694335938, -0.5679168701171875, -0.5493850708007812, -0.530853271484375, -0.5123214721679688, -0.4937896728515625, -0.47525787353515625, -0.45672607421875, -0.43819427490234375, -0.4196624755859375, -0.40113067626953125, -0.382598876953125, -0.36406707763671875, -0.3455352783203125, -0.32700347900390625, -0.3084716796875, -0.28993988037109375, -0.2714080810546875, -0.25287628173828125, -0.234344482421875, -0.21581268310546875, -0.1972808837890625, -0.17874908447265625, -0.16021728515625, -0.14168548583984375, -0.1231536865234375, -0.10462188720703125, -0.086090087890625, -0.06755828857421875, -0.0490264892578125, -0.03049468994140625, -0.011962890625, 0.00656890869140625, 0.0251007080078125, 0.04363250732421875, 0.062164306640625, 0.08069610595703125, 0.0992279052734375, 0.11775970458984375, 0.13629150390625, 0.15482330322265625, 0.1733551025390625, 0.19188690185546875, 0.210418701171875, 0.22895050048828125, 0.2474822998046875, 0.26601409912109375, 0.2845458984375, 0.30307769775390625, 0.3216094970703125, 0.34014129638671875, 0.358673095703125, 0.37720489501953125, 0.3957366943359375, 0.41426849365234375, 0.43280029296875, 0.45133209228515625, 0.4698638916015625, 0.48839569091796875, 0.506927490234375, 0.5254592895507812, 0.5439910888671875, 0.5625228881835938, 0.5810546875]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 6.0, 6.0, 4.0, 9.0, 7.0, 9.0, 15.0, 24.0, 17.0, 20.0, 25.0, 22.0, 33.0, 25.0, 26.0, 38.0, 29.0, 52.0, 32.0, 44.0, 45.0, 43.0, 42.0, 30.0, 35.0, 31.0, 43.0, 24.0, 29.0, 27.0, 31.0, 26.0, 18.0, 19.0, 17.0, 16.0, 11.0, 14.0, 8.0, 10.0, 4.0, 7.0, 5.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0], "bins": [-3.6171875, -3.513763427734375, -3.41033935546875, -3.306915283203125, -3.2034912109375, -3.100067138671875, -2.99664306640625, -2.893218994140625, -2.789794921875, -2.686370849609375, -2.58294677734375, -2.479522705078125, -2.3760986328125, -2.272674560546875, -2.16925048828125, -2.065826416015625, -1.96240234375, -1.858978271484375, -1.75555419921875, -1.652130126953125, -1.5487060546875, -1.445281982421875, -1.34185791015625, -1.238433837890625, -1.135009765625, -1.031585693359375, -0.92816162109375, -0.824737548828125, -0.7213134765625, -0.617889404296875, -0.51446533203125, -0.411041259765625, -0.3076171875, -0.204193115234375, -0.10076904296875, 0.002655029296875, 0.1060791015625, 0.209503173828125, 0.31292724609375, 0.416351318359375, 0.519775390625, 0.623199462890625, 0.72662353515625, 0.830047607421875, 0.9334716796875, 1.036895751953125, 1.14031982421875, 1.243743896484375, 1.34716796875, 1.450592041015625, 1.55401611328125, 1.657440185546875, 1.7608642578125, 1.864288330078125, 1.96771240234375, 2.071136474609375, 2.174560546875, 2.277984619140625, 2.38140869140625, 2.484832763671875, 2.5882568359375, 2.691680908203125, 2.79510498046875, 2.898529052734375, 3.001953125]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 7.0, 6.0, 10.0, 8.0, 16.0, 15.0, 33.0, 48.0, 61.0, 83.0, 104.0, 153.0, 181.0, 260.0, 408.0, 636.0, 984.0, 1746.0, 3536.0, 8783.0, 27535.0, 899812.0, 73348.0, 17706.0, 6405.0, 2644.0, 1416.0, 826.0, 524.0, 340.0, 253.0, 186.0, 141.0, 87.0, 59.0, 44.0, 40.0, 28.0, 28.0, 12.0, 12.0, 6.0, 5.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9580078125, -1.8944854736328125, -1.830963134765625, -1.7674407958984375, -1.70391845703125, -1.6403961181640625, -1.576873779296875, -1.5133514404296875, -1.4498291015625, -1.3863067626953125, -1.322784423828125, -1.2592620849609375, -1.19573974609375, -1.1322174072265625, -1.068695068359375, -1.0051727294921875, -0.941650390625, -0.8781280517578125, -0.814605712890625, -0.7510833740234375, -0.68756103515625, -0.6240386962890625, -0.560516357421875, -0.4969940185546875, -0.4334716796875, -0.3699493408203125, -0.306427001953125, -0.2429046630859375, -0.17938232421875, -0.1158599853515625, -0.052337646484375, 0.0111846923828125, 0.07470703125, 0.1382293701171875, 0.201751708984375, 0.2652740478515625, 0.32879638671875, 0.3923187255859375, 0.455841064453125, 0.5193634033203125, 0.5828857421875, 0.6464080810546875, 0.709930419921875, 0.7734527587890625, 0.83697509765625, 0.9004974365234375, 0.964019775390625, 1.0275421142578125, 1.091064453125, 1.1545867919921875, 1.218109130859375, 1.2816314697265625, 1.34515380859375, 1.4086761474609375, 1.472198486328125, 1.5357208251953125, 1.5992431640625, 1.6627655029296875, 1.726287841796875, 1.7898101806640625, 1.85333251953125, 1.9168548583984375, 1.980377197265625, 2.0438995361328125, 2.107421875]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 3.0, 6.0, 5.0, 10.0, 17.0, 12.0, 22.0, 29.0, 16.0, 27.0, 39.0, 40.0, 31.0, 44.0, 40.0, 42.0, 37.0, 47.0, 58.0, 51.0, 42.0, 45.0, 32.0, 34.0, 28.0, 35.0, 22.0, 31.0, 23.0, 27.0, 18.0, 14.0, 14.0, 18.0, 5.0, 8.0, 6.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.640625, -2.5662841796875, -2.491943359375, -2.4176025390625, -2.34326171875, -2.2689208984375, -2.194580078125, -2.1202392578125, -2.0458984375, -1.9715576171875, -1.897216796875, -1.8228759765625, -1.74853515625, -1.6741943359375, -1.599853515625, -1.5255126953125, -1.451171875, -1.3768310546875, -1.302490234375, -1.2281494140625, -1.15380859375, -1.0794677734375, -1.005126953125, -0.9307861328125, -0.8564453125, -0.7821044921875, -0.707763671875, -0.6334228515625, -0.55908203125, -0.4847412109375, -0.410400390625, -0.3360595703125, -0.26171875, -0.1873779296875, -0.113037109375, -0.0386962890625, 0.03564453125, 0.1099853515625, 0.184326171875, 0.2586669921875, 0.3330078125, 0.4073486328125, 0.481689453125, 0.5560302734375, 0.63037109375, 0.7047119140625, 0.779052734375, 0.8533935546875, 0.927734375, 1.0020751953125, 1.076416015625, 1.1507568359375, 1.22509765625, 1.2994384765625, 1.373779296875, 1.4481201171875, 1.5224609375, 1.5968017578125, 1.671142578125, 1.7454833984375, 1.81982421875, 1.8941650390625, 1.968505859375, 2.0428466796875, 2.1171875]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 7.0, 23.0, 32.0, 40.0, 26.0, 55.0, 95.0, 144.0, 234.0, 350.0, 604.0, 1102.0, 2246.0, 5688.0, 20828.0, 949511.0, 50906.0, 9696.0, 3358.0, 1544.0, 775.0, 440.0, 281.0, 204.0, 100.0, 60.0, 61.0, 35.0, 26.0, 22.0, 16.0, 11.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281494140625, -0.2723350524902344, -0.26317596435546875, -0.2540168762207031, -0.2448577880859375, -0.23569869995117188, -0.22653961181640625, -0.21738052368164062, -0.208221435546875, -0.19906234741210938, -0.18990325927734375, -0.18074417114257812, -0.1715850830078125, -0.16242599487304688, -0.15326690673828125, -0.14410781860351562, -0.13494873046875, -0.12578964233398438, -0.11663055419921875, -0.10747146606445312, -0.0983123779296875, -0.08915328979492188, -0.07999420166015625, -0.07083511352539062, -0.061676025390625, -0.052516937255859375, -0.04335784912109375, -0.034198760986328125, -0.0250396728515625, -0.015880584716796875, -0.00672149658203125, 0.002437591552734375, 0.0115966796875, 0.020755767822265625, 0.02991485595703125, 0.039073944091796875, 0.0482330322265625, 0.057392120361328125, 0.06655120849609375, 0.07571029663085938, 0.084869384765625, 0.09402847290039062, 0.10318756103515625, 0.11234664916992188, 0.1215057373046875, 0.13066482543945312, 0.13982391357421875, 0.14898300170898438, 0.15814208984375, 0.16730117797851562, 0.17646026611328125, 0.18561935424804688, 0.1947784423828125, 0.20393753051757812, 0.21309661865234375, 0.22225570678710938, 0.231414794921875, 0.24057388305664062, 0.24973297119140625, 0.2588920593261719, 0.2680511474609375, 0.2772102355957031, 0.28636932373046875, 0.2955284118652344, 0.3046875]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 13.0, 11.0, 14.0, 9.0, 15.0, 15.0, 26.0, 33.0, 28.0, 58.0, 64.0, 64.0, 51.0, 57.0, 63.0, 55.0, 55.0, 54.0, 49.0, 42.0, 38.0, 37.0, 26.0, 24.0, 24.0, 14.0, 8.0, 12.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.658367156982422e-05, -2.5684013962745667e-05, -2.4784356355667114e-05, -2.3884698748588562e-05, -2.298504114151001e-05, -2.2085383534431458e-05, -2.1185725927352905e-05, -2.0286068320274353e-05, -1.93864107131958e-05, -1.848675310611725e-05, -1.7587095499038696e-05, -1.6687437891960144e-05, -1.5787780284881592e-05, -1.488812267780304e-05, -1.3988465070724487e-05, -1.3088807463645935e-05, -1.2189149856567383e-05, -1.128949224948883e-05, -1.0389834642410278e-05, -9.490177035331726e-06, -8.590519428253174e-06, -7.690861821174622e-06, -6.791204214096069e-06, -5.891546607017517e-06, -4.991888999938965e-06, -4.092231392860413e-06, -3.1925737857818604e-06, -2.292916178703308e-06, -1.3932585716247559e-06, -4.936009645462036e-07, 4.0605664253234863e-07, 1.3057142496109009e-06, 2.205371856689453e-06, 3.1050294637680054e-06, 4.004687070846558e-06, 4.90434467792511e-06, 5.804002285003662e-06, 6.703659892082214e-06, 7.603317499160767e-06, 8.502975106239319e-06, 9.402632713317871e-06, 1.0302290320396423e-05, 1.1201947927474976e-05, 1.2101605534553528e-05, 1.300126314163208e-05, 1.3900920748710632e-05, 1.4800578355789185e-05, 1.5700235962867737e-05, 1.659989356994629e-05, 1.749955117702484e-05, 1.8399208784103394e-05, 1.9298866391181946e-05, 2.0198523998260498e-05, 2.109818160533905e-05, 2.1997839212417603e-05, 2.2897496819496155e-05, 2.3797154426574707e-05, 2.469681203365326e-05, 2.559646964073181e-05, 2.6496127247810364e-05, 2.7395784854888916e-05, 2.8295442461967468e-05, 2.919510006904602e-05, 3.0094757676124573e-05, 3.0994415283203125e-05]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 3.0, 7.0, 5.0, 6.0, 10.0, 14.0, 15.0, 20.0, 16.0, 22.0, 34.0, 63.0, 78.0, 94.0, 166.0, 597.0, 18357.0, 1009717.0, 18163.0, 590.0, 191.0, 117.0, 69.0, 50.0, 30.0, 21.0, 16.0, 18.0, 20.0, 13.0, 15.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5625, -0.5427627563476562, -0.5230255126953125, -0.5032882690429688, -0.483551025390625, -0.46381378173828125, -0.4440765380859375, -0.42433929443359375, -0.40460205078125, -0.38486480712890625, -0.3651275634765625, -0.34539031982421875, -0.325653076171875, -0.30591583251953125, -0.2861785888671875, -0.26644134521484375, -0.2467041015625, -0.22696685791015625, -0.2072296142578125, -0.18749237060546875, -0.167755126953125, -0.14801788330078125, -0.1282806396484375, -0.10854339599609375, -0.08880615234375, -0.06906890869140625, -0.0493316650390625, -0.02959442138671875, -0.009857177734375, 0.00988006591796875, 0.0296173095703125, 0.04935455322265625, 0.069091796875, 0.08882904052734375, 0.1085662841796875, 0.12830352783203125, 0.148040771484375, 0.16777801513671875, 0.1875152587890625, 0.20725250244140625, 0.22698974609375, 0.24672698974609375, 0.2664642333984375, 0.28620147705078125, 0.305938720703125, 0.32567596435546875, 0.3454132080078125, 0.36515045166015625, 0.3848876953125, 0.40462493896484375, 0.4243621826171875, 0.44409942626953125, 0.463836669921875, 0.48357391357421875, 0.5033111572265625, 0.5230484008789062, 0.54278564453125, 0.5625228881835938, 0.5822601318359375, 0.6019973754882812, 0.621734619140625, 0.6414718627929688, 0.6612091064453125, 0.6809463500976562, 0.70068359375]}, "gradients/decoder.roberta.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 5.0, 8.0, 7.0, 8.0, 7.0, 7.0, 13.0, 24.0, 33.0, 54.0, 63.0, 114.0, 174.0, 148.0, 105.0, 54.0, 39.0, 22.0, 29.0, 20.0, 10.0, 8.0, 10.0, 8.0, 9.0, 3.0, 3.0, 1.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0399169921875, -0.03880572319030762, -0.037694454193115234, -0.03658318519592285, -0.03547191619873047, -0.034360647201538086, -0.0332493782043457, -0.03213810920715332, -0.031026840209960938, -0.029915571212768555, -0.028804302215576172, -0.02769303321838379, -0.026581764221191406, -0.025470495223999023, -0.02435922622680664, -0.023247957229614258, -0.022136688232421875, -0.021025419235229492, -0.01991415023803711, -0.018802881240844727, -0.017691612243652344, -0.01658034324645996, -0.015469074249267578, -0.014357805252075195, -0.013246536254882812, -0.01213526725769043, -0.011023998260498047, -0.009912729263305664, -0.008801460266113281, -0.0076901912689208984, -0.006578922271728516, -0.005467653274536133, -0.00435638427734375, -0.003245115280151367, -0.0021338462829589844, -0.0010225772857666016, 8.869171142578125e-05, 0.001199960708618164, 0.002311229705810547, 0.0034224987030029297, 0.0045337677001953125, 0.005645036697387695, 0.006756305694580078, 0.007867574691772461, 0.008978843688964844, 0.010090112686157227, 0.01120138168334961, 0.012312650680541992, 0.013423919677734375, 0.014535188674926758, 0.01564645767211914, 0.016757726669311523, 0.017868995666503906, 0.01898026466369629, 0.020091533660888672, 0.021202802658081055, 0.022314071655273438, 0.02342534065246582, 0.024536609649658203, 0.025647878646850586, 0.02675914764404297, 0.02787041664123535, 0.028981685638427734, 0.030092954635620117, 0.0312042236328125]}, "gradients/decoder.roberta.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 10.0, 5.0, 15.0, 21.0, 43.0, 58.0, 55.0, 86.0, 93.0, 101.0, 110.0, 72.0, 79.0, 61.0, 67.0, 52.0, 33.0, 17.0, 8.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6469476222991943, -2.5093319416046143, -2.371716260910034, -2.234100818634033, -2.096485137939453, -1.958869457244873, -1.821253776550293, -1.683638095855713, -1.5460225343704224, -1.4084068536758423, -1.2707912921905518, -1.1331756114959717, -0.9955599904060364, -0.8579443693161011, -0.720328688621521, -0.5827130675315857, -0.4450974464416504, -0.3074818253517151, -0.1698661744594574, -0.03225052356719971, 0.1053650975227356, 0.2429807186126709, 0.380596399307251, 0.5182120203971863, 0.6558276414871216, 0.7934432625770569, 0.9310588836669922, 1.0686745643615723, 1.2062902450561523, 1.3439058065414429, 1.481521487236023, 1.6191370487213135, 1.7567529678344727, 1.8943686485290527, 2.031984329223633, 2.169600009918213, 2.307215452194214, 2.444831132888794, 2.582446813583374, 2.720062494277954, 2.857677936553955, 2.995293617248535, 3.1329092979431152, 3.2705249786376953, 3.4081404209136963, 3.5457561016082764, 3.6833717823028564, 3.8209874629974365, 3.9586031436920166, 4.096218585968018, 4.233834266662598, 4.371449947357178, 4.509065628051758, 4.646681308746338, 4.784296989440918, 4.921912670135498, 5.059528350830078, 5.197144031524658, 5.334759712219238, 5.472375392913818, 5.609991073608398, 5.74760627746582, 5.885222434997559, 6.0228376388549805, 6.1604533195495605]}, "gradients/decoder.roberta.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 2.0, 6.0, 6.0, 6.0, 4.0, 11.0, 5.0, 9.0, 17.0, 22.0, 17.0, 22.0, 24.0, 23.0, 32.0, 25.0, 27.0, 36.0, 31.0, 51.0, 36.0, 40.0, 44.0, 44.0, 41.0, 31.0, 38.0, 27.0, 43.0, 26.0, 31.0, 23.0, 34.0, 24.0, 18.0, 18.0, 18.0, 16.0, 12.0, 12.0, 8.0, 10.0, 4.0, 8.0, 5.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0], "bins": [-3.618126630783081, -3.5145556926727295, -3.410984992980957, -3.3074140548706055, -3.203843116760254, -3.1002721786499023, -2.99670147895813, -2.8931305408477783, -2.7895596027374268, -2.685988664627075, -2.5824179649353027, -2.478847026824951, -2.3752760887145996, -2.271705150604248, -2.1681344509124756, -2.064563512802124, -1.960992693901062, -1.857421875, -1.7538509368896484, -1.6502801179885864, -1.5467091798782349, -1.4431383609771729, -1.3395674228668213, -1.2359966039657593, -1.1324257850646973, -1.0288549661636353, -0.9252840280532837, -0.8217132091522217, -0.7181422710418701, -0.6145714521408081, -0.5110005736351013, -0.40742969512939453, -0.30385875701904297, -0.20028787851333618, -0.09671701490879059, 0.006853848695755005, 0.11042472720146179, 0.2139955759048462, 0.317566454410553, 0.42113733291625977, 0.5247082114219666, 0.6282790899276733, 0.7318499684333801, 0.8354208469390869, 0.9389916658401489, 1.042562484741211, 1.1461334228515625, 1.249704360961914, 1.353275179862976, 1.456845998764038, 1.5604169368743896, 1.6639877557754517, 1.7675586938858032, 1.8711295127868652, 1.9747004508972168, 2.0782713890075684, 2.181842088699341, 2.2854130268096924, 2.388983726501465, 2.4925546646118164, 2.596125602722168, 2.6996965408325195, 2.803267240524292, 2.9068381786346436, 3.010409116744995]}, "gradients/decoder.roberta.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 6.0, 8.0, 9.0, 21.0, 25.0, 39.0, 52.0, 50.0, 85.0, 125.0, 146.0, 199.0, 317.0, 393.0, 665.0, 981.0, 1433.0, 2288.0, 3275.0, 5110.0, 7816.0, 12617.0, 20945.0, 34780.0, 60937.0, 104581.0, 166431.0, 203657.0, 165958.0, 104476.0, 60298.0, 34679.0, 20580.0, 12504.0, 7775.0, 5117.0, 3298.0, 2210.0, 1448.0, 1002.0, 615.0, 498.0, 314.0, 221.0, 142.0, 138.0, 70.0, 62.0, 41.0, 31.0, 24.0, 22.0, 17.0, 8.0, 11.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-2.078125, -2.009979248046875, -1.94183349609375, -1.873687744140625, -1.8055419921875, -1.737396240234375, -1.66925048828125, -1.601104736328125, -1.532958984375, -1.464813232421875, -1.39666748046875, -1.328521728515625, -1.2603759765625, -1.192230224609375, -1.12408447265625, -1.055938720703125, -0.98779296875, -0.919647216796875, -0.85150146484375, -0.783355712890625, -0.7152099609375, -0.647064208984375, -0.57891845703125, -0.510772705078125, -0.442626953125, -0.374481201171875, -0.30633544921875, -0.238189697265625, -0.1700439453125, -0.101898193359375, -0.03375244140625, 0.034393310546875, 0.1025390625, 0.170684814453125, 0.23883056640625, 0.306976318359375, 0.3751220703125, 0.443267822265625, 0.51141357421875, 0.579559326171875, 0.647705078125, 0.715850830078125, 0.78399658203125, 0.852142333984375, 0.9202880859375, 0.988433837890625, 1.05657958984375, 1.124725341796875, 1.19287109375, 1.261016845703125, 1.32916259765625, 1.397308349609375, 1.4654541015625, 1.533599853515625, 1.60174560546875, 1.669891357421875, 1.738037109375, 1.806182861328125, 1.87432861328125, 1.942474365234375, 2.0106201171875, 2.078765869140625, 2.14691162109375, 2.215057373046875, 2.283203125]}, "gradients/decoder.roberta.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 7.0, 2.0, 6.0, 6.0, 10.0, 5.0, 10.0, 15.0, 17.0, 21.0, 14.0, 25.0, 21.0, 40.0, 20.0, 24.0, 41.0, 27.0, 35.0, 49.0, 36.0, 43.0, 35.0, 41.0, 37.0, 37.0, 35.0, 33.0, 34.0, 32.0, 25.0, 21.0, 34.0, 21.0, 23.0, 16.0, 16.0, 15.0, 12.0, 11.0, 5.0, 8.0, 8.0, 8.0, 2.0, 2.0, 5.0, 2.0, 4.0, 0.0, 4.0, 1.0], "bins": [-3.4453125, -3.345428466796875, -3.24554443359375, -3.145660400390625, -3.0457763671875, -2.945892333984375, -2.84600830078125, -2.746124267578125, -2.646240234375, -2.546356201171875, -2.44647216796875, -2.346588134765625, -2.2467041015625, -2.146820068359375, -2.04693603515625, -1.947052001953125, -1.84716796875, -1.747283935546875, -1.64739990234375, -1.547515869140625, -1.4476318359375, -1.347747802734375, -1.24786376953125, -1.147979736328125, -1.048095703125, -0.948211669921875, -0.84832763671875, -0.748443603515625, -0.6485595703125, -0.548675537109375, -0.44879150390625, -0.348907470703125, -0.2490234375, -0.149139404296875, -0.04925537109375, 0.050628662109375, 0.1505126953125, 0.250396728515625, 0.35028076171875, 0.450164794921875, 0.550048828125, 0.649932861328125, 0.74981689453125, 0.849700927734375, 0.9495849609375, 1.049468994140625, 1.14935302734375, 1.249237060546875, 1.34912109375, 1.449005126953125, 1.54888916015625, 1.648773193359375, 1.7486572265625, 1.848541259765625, 1.94842529296875, 2.048309326171875, 2.148193359375, 2.248077392578125, 2.34796142578125, 2.447845458984375, 2.5477294921875, 2.647613525390625, 2.74749755859375, 2.847381591796875, 2.947265625]}, "gradients/decoder.roberta.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 10.0, 12.0, 15.0, 22.0, 16.0, 29.0, 30.0, 33.0, 39.0, 40.0, 54.0, 93.0, 247.0, 1044569.0, 2723.0, 169.0, 68.0, 57.0, 42.0, 40.0, 27.0, 35.0, 28.0, 29.0, 17.0, 17.0, 14.0, 11.0, 14.0, 10.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-125.4375, -121.615234375, -117.79296875, -113.970703125, -110.1484375, -106.326171875, -102.50390625, -98.681640625, -94.859375, -91.037109375, -87.21484375, -83.392578125, -79.5703125, -75.748046875, -71.92578125, -68.103515625, -64.28125, -60.458984375, -56.63671875, -52.814453125, -48.9921875, -45.169921875, -41.34765625, -37.525390625, -33.703125, -29.880859375, -26.05859375, -22.236328125, -18.4140625, -14.591796875, -10.76953125, -6.947265625, -3.125, 0.697265625, 4.51953125, 8.341796875, 12.1640625, 15.986328125, 19.80859375, 23.630859375, 27.453125, 31.275390625, 35.09765625, 38.919921875, 42.7421875, 46.564453125, 50.38671875, 54.208984375, 58.03125, 61.853515625, 65.67578125, 69.498046875, 73.3203125, 77.142578125, 80.96484375, 84.787109375, 88.609375, 92.431640625, 96.25390625, 100.076171875, 103.8984375, 107.720703125, 111.54296875, 115.365234375, 119.1875]}, "gradients/decoder.roberta.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 2.0, 3.0, 6.0, 12.0, 11.0, 11.0, 11.0, 20.0, 13.0, 25.0, 26.0, 23.0, 40.0, 28.0, 38.0, 43.0, 44.0, 44.0, 62.0, 61.0, 52.0, 55.0, 50.0, 49.0, 35.0, 37.0, 30.0, 33.0, 23.0, 24.0, 24.0, 11.0, 14.0, 13.0, 7.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.0859375, -3.9544677734375, -3.822998046875, -3.6915283203125, -3.56005859375, -3.4285888671875, -3.297119140625, -3.1656494140625, -3.0341796875, -2.9027099609375, -2.771240234375, -2.6397705078125, -2.50830078125, -2.3768310546875, -2.245361328125, -2.1138916015625, -1.982421875, -1.8509521484375, -1.719482421875, -1.5880126953125, -1.45654296875, -1.3250732421875, -1.193603515625, -1.0621337890625, -0.9306640625, -0.7991943359375, -0.667724609375, -0.5362548828125, -0.40478515625, -0.2733154296875, -0.141845703125, -0.0103759765625, 0.12109375, 0.2525634765625, 0.384033203125, 0.5155029296875, 0.64697265625, 0.7784423828125, 0.909912109375, 1.0413818359375, 1.1728515625, 1.3043212890625, 1.435791015625, 1.5672607421875, 1.69873046875, 1.8302001953125, 1.961669921875, 2.0931396484375, 2.224609375, 2.3560791015625, 2.487548828125, 2.6190185546875, 2.75048828125, 2.8819580078125, 3.013427734375, 3.1448974609375, 3.2763671875, 3.4078369140625, 3.539306640625, 3.6707763671875, 3.80224609375, 3.9337158203125, 4.065185546875, 4.1966552734375, 4.328125]}, "gradients/decoder.roberta.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 3.0, 12.0, 33.0, 47.0, 101.0, 237.0, 934.0, 34942.0, 1008413.0, 3048.0, 455.0, 180.0, 76.0, 37.0, 24.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2734375, -12.8350830078125, -12.396728515625, -11.9583740234375, -11.52001953125, -11.0816650390625, -10.643310546875, -10.2049560546875, -9.7666015625, -9.3282470703125, -8.889892578125, -8.4515380859375, -8.01318359375, -7.5748291015625, -7.136474609375, -6.6981201171875, -6.259765625, -5.8214111328125, -5.383056640625, -4.9447021484375, -4.50634765625, -4.0679931640625, -3.629638671875, -3.1912841796875, -2.7529296875, -2.3145751953125, -1.876220703125, -1.4378662109375, -0.99951171875, -0.5611572265625, -0.122802734375, 0.3155517578125, 0.75390625, 1.1922607421875, 1.630615234375, 2.0689697265625, 2.50732421875, 2.9456787109375, 3.384033203125, 3.8223876953125, 4.2607421875, 4.6990966796875, 5.137451171875, 5.5758056640625, 6.01416015625, 6.4525146484375, 6.890869140625, 7.3292236328125, 7.767578125, 8.2059326171875, 8.644287109375, 9.0826416015625, 9.52099609375, 9.9593505859375, 10.397705078125, 10.8360595703125, 11.2744140625, 11.7127685546875, 12.151123046875, 12.5894775390625, 13.02783203125, 13.4661865234375, 13.904541015625, 14.3428955078125, 14.78125]}, "gradients/decoder.roberta.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 14.0, 13.0, 24.0, 25.0, 33.0, 61.0, 84.0, 107.0, 109.0, 142.0, 110.0, 91.0, 66.0, 44.0, 17.0, 20.0, 12.0, 9.0, 11.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002410411834716797, -0.00023211166262626648, -0.00022318214178085327, -0.00021425262093544006, -0.00020532310009002686, -0.00019639357924461365, -0.00018746405839920044, -0.00017853453755378723, -0.00016960501670837402, -0.00016067549586296082, -0.0001517459750175476, -0.0001428164541721344, -0.0001338869333267212, -0.00012495741248130798, -0.00011602789163589478, -0.00010709837079048157, -9.816884994506836e-05, -8.923932909965515e-05, -8.030980825424194e-05, -7.138028740882874e-05, -6.245076656341553e-05, -5.352124571800232e-05, -4.459172487258911e-05, -3.56622040271759e-05, -2.6732683181762695e-05, -1.7803162336349487e-05, -8.87364149093628e-06, 5.587935447692871e-08, 8.985400199890137e-06, 1.7914921045303345e-05, 2.6844441890716553e-05, 3.577396273612976e-05, 4.470348358154297e-05, 5.363300442695618e-05, 6.256252527236938e-05, 7.149204611778259e-05, 8.04215669631958e-05, 8.935108780860901e-05, 9.828060865402222e-05, 0.00010721012949943542, 0.00011613965034484863, 0.00012506917119026184, 0.00013399869203567505, 0.00014292821288108826, 0.00015185773372650146, 0.00016078725457191467, 0.00016971677541732788, 0.0001786462962627411, 0.0001875758171081543, 0.0001965053379535675, 0.0002054348587989807, 0.00021436437964439392, 0.00022329390048980713, 0.00023222342133522034, 0.00024115294218063354, 0.00025008246302604675, 0.00025901198387145996, 0.00026794150471687317, 0.0002768710255622864, 0.0002858005464076996, 0.0002947300672531128, 0.000303659588098526, 0.0003125891089439392, 0.0003215186297893524, 0.0003304481506347656]}, "gradients/decoder.roberta.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 11.0, 12.0, 27.0, 31.0, 63.0, 148.0, 318.0, 2029.0, 1027810.0, 17084.0, 600.0, 190.0, 83.0, 55.0, 33.0, 17.0, 17.0, 5.0, 10.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.15625, -16.55908203125, -15.9619140625, -15.36474609375, -14.767578125, -14.17041015625, -13.5732421875, -12.97607421875, -12.37890625, -11.78173828125, -11.1845703125, -10.58740234375, -9.990234375, -9.39306640625, -8.7958984375, -8.19873046875, -7.6015625, -7.00439453125, -6.4072265625, -5.81005859375, -5.212890625, -4.61572265625, -4.0185546875, -3.42138671875, -2.82421875, -2.22705078125, -1.6298828125, -1.03271484375, -0.435546875, 0.16162109375, 0.7587890625, 1.35595703125, 1.953125, 2.55029296875, 3.1474609375, 3.74462890625, 4.341796875, 4.93896484375, 5.5361328125, 6.13330078125, 6.73046875, 7.32763671875, 7.9248046875, 8.52197265625, 9.119140625, 9.71630859375, 10.3134765625, 10.91064453125, 11.5078125, 12.10498046875, 12.7021484375, 13.29931640625, 13.896484375, 14.49365234375, 15.0908203125, 15.68798828125, 16.28515625, 16.88232421875, 17.4794921875, 18.07666015625, 18.673828125, 19.27099609375, 19.8681640625, 20.46533203125, 21.0625]}, "gradients/decoder.roberta.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 6.0, 7.0, 8.0, 19.0, 35.0, 43.0, 81.0, 124.0, 128.0, 172.0, 123.0, 97.0, 68.0, 43.0, 17.0, 9.0, 13.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.22265625, -1.1889495849609375, -1.155242919921875, -1.1215362548828125, -1.08782958984375, -1.0541229248046875, -1.020416259765625, -0.9867095947265625, -0.9530029296875, -0.9192962646484375, -0.885589599609375, -0.8518829345703125, -0.81817626953125, -0.7844696044921875, -0.750762939453125, -0.7170562744140625, -0.683349609375, -0.6496429443359375, -0.615936279296875, -0.5822296142578125, -0.54852294921875, -0.5148162841796875, -0.481109619140625, -0.4474029541015625, -0.4136962890625, -0.3799896240234375, -0.346282958984375, -0.3125762939453125, -0.27886962890625, -0.2451629638671875, -0.211456298828125, -0.1777496337890625, -0.14404296875, -0.1103363037109375, -0.076629638671875, -0.0429229736328125, -0.00921630859375, 0.0244903564453125, 0.058197021484375, 0.0919036865234375, 0.1256103515625, 0.1593170166015625, 0.193023681640625, 0.2267303466796875, 0.26043701171875, 0.2941436767578125, 0.327850341796875, 0.3615570068359375, 0.395263671875, 0.4289703369140625, 0.462677001953125, 0.4963836669921875, 0.53009033203125, 0.5637969970703125, 0.597503662109375, 0.6312103271484375, 0.6649169921875, 0.6986236572265625, 0.732330322265625, 0.7660369873046875, 0.79974365234375, 0.8334503173828125, 0.867156982421875, 0.9008636474609375, 0.9345703125]}, "gradients/decoder.roberta.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 8.0, 5.0, 11.0, 12.0, 21.0, 14.0, 32.0, 40.0, 46.0, 57.0, 64.0, 76.0, 82.0, 60.0, 82.0, 47.0, 74.0, 56.0, 42.0, 53.0, 39.0, 29.0, 21.0, 15.0, 6.0, 4.0, 7.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8996403217315674, -2.790611743927002, -2.6815834045410156, -2.57255482673645, -2.4635262489318848, -2.3544979095458984, -2.245469331741333, -2.1364407539367676, -2.0274124145507812, -1.9183839559555054, -1.8093554973602295, -1.700326919555664, -1.5912984609603882, -1.4822700023651123, -1.3732414245605469, -1.264212965965271, -1.1551845073699951, -1.0461560487747192, -0.9371275305747986, -0.8280990123748779, -0.719070553779602, -0.6100420951843262, -0.5010135769844055, -0.39198505878448486, -0.282956600189209, -0.17392811179161072, -0.06489962339401245, 0.044128865003585815, 0.15315735340118408, 0.26218581199645996, 0.3712143301963806, 0.48024284839630127, 0.5892715454101562, 0.6983000040054321, 0.8073285222053528, 0.9163570404052734, 1.0253854990005493, 1.1344139575958252, 1.2434425354003906, 1.3524709939956665, 1.4614994525909424, 1.5705279111862183, 1.6795563697814941, 1.7885849475860596, 1.8976134061813354, 2.0066418647766113, 2.1156704425811768, 2.224699020385742, 2.3337273597717285, 2.442755937576294, 2.5517842769622803, 2.6608128547668457, 2.769841194152832, 2.8788697719573975, 2.987898349761963, 3.096926689147949, 3.2059552669525146, 3.31498384475708, 3.4240121841430664, 3.533040761947632, 3.6420693397521973, 3.7510976791381836, 3.860126256942749, 3.9691548347473145, 4.078183174133301]}, "gradients/decoder.roberta.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 6.0, 9.0, 10.0, 9.0, 9.0, 18.0, 14.0, 18.0, 18.0, 27.0, 23.0, 29.0, 26.0, 25.0, 37.0, 50.0, 36.0, 47.0, 39.0, 61.0, 59.0, 49.0, 49.0, 37.0, 34.0, 41.0, 26.0, 32.0, 24.0, 17.0, 25.0, 18.0, 14.0, 14.0, 11.0, 7.0, 3.0, 8.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.886512279510498, -4.736964225769043, -4.587416648864746, -4.437869071960449, -4.288321018218994, -4.138772964477539, -3.989225387573242, -3.839677572250366, -3.6901297569274902, -3.5405819416046143, -3.3910341262817383, -3.2414863109588623, -3.0919384956359863, -2.9423906803131104, -2.7928428649902344, -2.6432950496673584, -2.4937472343444824, -2.3441994190216064, -2.1946516036987305, -2.0451037883758545, -1.8955559730529785, -1.7460081577301025, -1.5964603424072266, -1.4469125270843506, -1.2973647117614746, -1.1478168964385986, -0.9982690811157227, -0.8487212657928467, -0.6991734504699707, -0.5496256351470947, -0.40007781982421875, -0.2505300045013428, -0.1009817123413086, 0.04856610298156738, 0.19811391830444336, 0.34766173362731934, 0.4972095489501953, 0.6467573642730713, 0.7963051795959473, 0.9458529949188232, 1.0954008102416992, 1.2449486255645752, 1.3944964408874512, 1.5440442562103271, 1.6935920715332031, 1.843139886856079, 1.992687702178955, 2.142235517501831, 2.291783332824707, 2.441331148147583, 2.590878963470459, 2.740426778793335, 2.889974594116211, 3.039522409439087, 3.189070224761963, 3.338618040084839, 3.488165855407715, 3.637713670730591, 3.787261486053467, 3.9368093013763428, 4.086357116699219, 4.235904693603516, 4.385452747344971, 4.535000801086426, 4.684548377990723]}, "gradients/decoder.roberta.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 6.0, 10.0, 7.0, 13.0, 16.0, 22.0, 17.0, 30.0, 38.0, 50.0, 57.0, 60.0, 84.0, 91.0, 158.0, 360.0, 1429.0, 13622.0, 842752.0, 3274474.0, 56391.0, 3196.0, 591.0, 209.0, 114.0, 99.0, 61.0, 63.0, 50.0, 45.0, 35.0, 23.0, 19.0, 22.0, 21.0, 7.0, 7.0, 5.0, 9.0, 4.0, 0.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -14.0306396484375, -13.608154296875, -13.1856689453125, -12.76318359375, -12.3406982421875, -11.918212890625, -11.4957275390625, -11.0732421875, -10.6507568359375, -10.228271484375, -9.8057861328125, -9.38330078125, -8.9608154296875, -8.538330078125, -8.1158447265625, -7.693359375, -7.2708740234375, -6.848388671875, -6.4259033203125, -6.00341796875, -5.5809326171875, -5.158447265625, -4.7359619140625, -4.3134765625, -3.8909912109375, -3.468505859375, -3.0460205078125, -2.62353515625, -2.2010498046875, -1.778564453125, -1.3560791015625, -0.93359375, -0.5111083984375, -0.088623046875, 0.3338623046875, 0.75634765625, 1.1788330078125, 1.601318359375, 2.0238037109375, 2.4462890625, 2.8687744140625, 3.291259765625, 3.7137451171875, 4.13623046875, 4.5587158203125, 4.981201171875, 5.4036865234375, 5.826171875, 6.2486572265625, 6.671142578125, 7.0936279296875, 7.51611328125, 7.9385986328125, 8.361083984375, 8.7835693359375, 9.2060546875, 9.6285400390625, 10.051025390625, 10.4735107421875, 10.89599609375, 11.3184814453125, 11.740966796875, 12.1634521484375, 12.5859375]}, "gradients/decoder.roberta.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 12.0, 7.0, 8.0, 8.0, 12.0, 11.0, 14.0, 15.0, 22.0, 16.0, 27.0, 29.0, 24.0, 37.0, 38.0, 38.0, 40.0, 54.0, 47.0, 44.0, 41.0, 49.0, 49.0, 36.0, 40.0, 30.0, 48.0, 34.0, 33.0, 26.0, 14.0, 15.0, 23.0, 12.0, 10.0, 7.0, 6.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.595703125, -3.49468994140625, -3.3936767578125, -3.29266357421875, -3.191650390625, -3.09063720703125, -2.9896240234375, -2.88861083984375, -2.78759765625, -2.68658447265625, -2.5855712890625, -2.48455810546875, -2.383544921875, -2.28253173828125, -2.1815185546875, -2.08050537109375, -1.9794921875, -1.87847900390625, -1.7774658203125, -1.67645263671875, -1.575439453125, -1.47442626953125, -1.3734130859375, -1.27239990234375, -1.17138671875, -1.07037353515625, -0.9693603515625, -0.86834716796875, -0.767333984375, -0.66632080078125, -0.5653076171875, -0.46429443359375, -0.36328125, -0.26226806640625, -0.1612548828125, -0.06024169921875, 0.040771484375, 0.14178466796875, 0.2427978515625, 0.34381103515625, 0.44482421875, 0.54583740234375, 0.6468505859375, 0.74786376953125, 0.848876953125, 0.94989013671875, 1.0509033203125, 1.15191650390625, 1.2529296875, 1.35394287109375, 1.4549560546875, 1.55596923828125, 1.656982421875, 1.75799560546875, 1.8590087890625, 1.96002197265625, 2.06103515625, 2.16204833984375, 2.2630615234375, 2.36407470703125, 2.465087890625, 2.56610107421875, 2.6671142578125, 2.76812744140625, 2.869140625]}, "gradients/decoder.roberta.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 11.0, 8.0, 19.0, 29.0, 35.0, 50.0, 70.0, 95.0, 155.0, 277.0, 398.0, 785.0, 3025.0, 4023393.0, 162765.0, 1531.0, 633.0, 346.0, 202.0, 142.0, 96.0, 78.0, 50.0, 28.0, 14.0, 14.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.3125, -39.0458984375, -37.779296875, -36.5126953125, -35.24609375, -33.9794921875, -32.712890625, -31.4462890625, -30.1796875, -28.9130859375, -27.646484375, -26.3798828125, -25.11328125, -23.8466796875, -22.580078125, -21.3134765625, -20.046875, -18.7802734375, -17.513671875, -16.2470703125, -14.98046875, -13.7138671875, -12.447265625, -11.1806640625, -9.9140625, -8.6474609375, -7.380859375, -6.1142578125, -4.84765625, -3.5810546875, -2.314453125, -1.0478515625, 0.21875, 1.4853515625, 2.751953125, 4.0185546875, 5.28515625, 6.5517578125, 7.818359375, 9.0849609375, 10.3515625, 11.6181640625, 12.884765625, 14.1513671875, 15.41796875, 16.6845703125, 17.951171875, 19.2177734375, 20.484375, 21.7509765625, 23.017578125, 24.2841796875, 25.55078125, 26.8173828125, 28.083984375, 29.3505859375, 30.6171875, 31.8837890625, 33.150390625, 34.4169921875, 35.68359375, 36.9501953125, 38.216796875, 39.4833984375, 40.75]}, "gradients/decoder.roberta.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 12.0, 7.0, 21.0, 35.0, 45.0, 68.0, 96.0, 149.0, 226.0, 338.0, 535.0, 634.0, 608.0, 448.0, 313.0, 178.0, 106.0, 79.0, 41.0, 38.0, 26.0, 20.0, 21.0, 10.0, 4.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.384765625, -2.319976806640625, -2.25518798828125, -2.190399169921875, -2.1256103515625, -2.060821533203125, -1.99603271484375, -1.931243896484375, -1.866455078125, -1.801666259765625, -1.73687744140625, -1.672088623046875, -1.6072998046875, -1.542510986328125, -1.47772216796875, -1.412933349609375, -1.34814453125, -1.283355712890625, -1.21856689453125, -1.153778076171875, -1.0889892578125, -1.024200439453125, -0.95941162109375, -0.894622802734375, -0.829833984375, -0.765045166015625, -0.70025634765625, -0.635467529296875, -0.5706787109375, -0.505889892578125, -0.44110107421875, -0.376312255859375, -0.3115234375, -0.246734619140625, -0.18194580078125, -0.117156982421875, -0.0523681640625, 0.012420654296875, 0.07720947265625, 0.141998291015625, 0.206787109375, 0.271575927734375, 0.33636474609375, 0.401153564453125, 0.4659423828125, 0.530731201171875, 0.59552001953125, 0.660308837890625, 0.72509765625, 0.789886474609375, 0.85467529296875, 0.919464111328125, 0.9842529296875, 1.049041748046875, 1.11383056640625, 1.178619384765625, 1.243408203125, 1.308197021484375, 1.37298583984375, 1.437774658203125, 1.5025634765625, 1.567352294921875, 1.63214111328125, 1.696929931640625, 1.76171875]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 12.0, 10.0, 23.0, 26.0, 48.0, 55.0, 89.0, 98.0, 110.0, 120.0, 90.0, 86.0, 62.0, 54.0, 44.0, 28.0, 23.0, 12.0, 5.0, 4.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.709721088409424, -2.561591863632202, -2.4134626388549805, -2.2653331756591797, -2.117203950881958, -1.9690747261047363, -1.820945382118225, -1.6728160381317139, -1.5246868133544922, -1.3765575885772705, -1.2284282445907593, -1.080298900604248, -0.9321696758270264, -0.7840403914451599, -0.6359111070632935, -0.4877817630767822, -0.33965253829956055, -0.1915232539176941, -0.04339396953582764, 0.10473531484603882, 0.2528645992279053, 0.40099388360977173, 0.5491231679916382, 0.6972525119781494, 0.8453817367553711, 0.9935110211372375, 1.141640305519104, 1.2897696495056152, 1.437898874282837, 1.5860280990600586, 1.7341574430465698, 1.882286787033081, 2.030416488647461, 2.1785457134246826, 2.3266749382019043, 2.474804401397705, 2.6229336261749268, 2.7710628509521484, 2.919192314147949, 3.067321538925171, 3.2154507637023926, 3.3635799884796143, 3.511709213256836, 3.6598386764526367, 3.8079679012298584, 3.95609712600708, 4.104226589202881, 4.252355575561523, 4.400485038757324, 4.548614501953125, 4.696743488311768, 4.844872951507568, 4.993001937866211, 5.141131401062012, 5.2892608642578125, 5.437390327453613, 5.585519313812256, 5.733648777008057, 5.881777763366699, 6.0299072265625, 6.178036689758301, 6.326165676116943, 6.474295139312744, 6.622424125671387, 6.7705535888671875]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 3.0, 7.0, 12.0, 10.0, 12.0, 16.0, 25.0, 37.0, 29.0, 38.0, 36.0, 39.0, 53.0, 36.0, 45.0, 42.0, 48.0, 47.0, 47.0, 43.0, 42.0, 42.0, 33.0, 40.0, 27.0, 38.0, 30.0, 20.0, 13.0, 20.0, 11.0, 15.0, 8.0, 9.0, 3.0, 2.0, 8.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.742563247680664, -4.608692646026611, -4.474822044372559, -4.340951442718506, -4.207080841064453, -4.073210716247559, -3.939340114593506, -3.805469512939453, -3.6715989112854004, -3.5377283096313477, -3.403857707977295, -3.2699873447418213, -3.1361167430877686, -3.002246141433716, -2.868375778198242, -2.7345051765441895, -2.6006345748901367, -2.466763973236084, -2.3328933715820312, -2.1990230083465576, -2.065152406692505, -1.9312818050384521, -1.797411322593689, -1.6635408401489258, -1.529670238494873, -1.3957996368408203, -1.2619291543960571, -1.128058671951294, -0.9941880702972412, -0.8603175282478333, -0.7264469861984253, -0.5925764441490173, -0.4587056636810303, -0.3248351216316223, -0.19096457958221436, -0.057094037532806396, 0.07677650451660156, 0.21064704656600952, 0.3445175886154175, 0.47838813066482544, 0.6122586727142334, 0.7461292147636414, 0.8799997568130493, 1.0138702392578125, 1.1477408409118652, 1.281611442565918, 1.4154819250106812, 1.5493524074554443, 1.683223009109497, 1.8170936107635498, 1.950964093208313, 2.084834575653076, 2.218705177307129, 2.3525757789611816, 2.4864463806152344, 2.620316743850708, 2.7541873455047607, 2.8880579471588135, 3.021928310394287, 3.15579891204834, 3.2896695137023926, 3.4235401153564453, 3.557410717010498, 3.6912810802459717, 3.8251516819000244]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 11.0, 20.0, 11.0, 33.0, 41.0, 56.0, 108.0, 138.0, 279.0, 419.0, 731.0, 1266.0, 2290.0, 4216.0, 8346.0, 16459.0, 33800.0, 74762.0, 184777.0, 352982.0, 208919.0, 83867.0, 37714.0, 17904.0, 8916.0, 4628.0, 2512.0, 1347.0, 793.0, 434.0, 293.0, 179.0, 99.0, 58.0, 51.0, 28.0, 15.0, 21.0, 8.0, 7.0, 8.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.978515625, -0.9454193115234375, -0.912322998046875, -0.8792266845703125, -0.84613037109375, -0.8130340576171875, -0.779937744140625, -0.7468414306640625, -0.7137451171875, -0.6806488037109375, -0.647552490234375, -0.6144561767578125, -0.58135986328125, -0.5482635498046875, -0.515167236328125, -0.4820709228515625, -0.448974609375, -0.4158782958984375, -0.382781982421875, -0.3496856689453125, -0.31658935546875, -0.2834930419921875, -0.250396728515625, -0.2173004150390625, -0.1842041015625, -0.1511077880859375, -0.118011474609375, -0.0849151611328125, -0.05181884765625, -0.0187225341796875, 0.014373779296875, 0.0474700927734375, 0.08056640625, 0.1136627197265625, 0.146759033203125, 0.1798553466796875, 0.21295166015625, 0.2460479736328125, 0.279144287109375, 0.3122406005859375, 0.3453369140625, 0.3784332275390625, 0.411529541015625, 0.4446258544921875, 0.47772216796875, 0.5108184814453125, 0.543914794921875, 0.5770111083984375, 0.610107421875, 0.6432037353515625, 0.676300048828125, 0.7093963623046875, 0.74249267578125, 0.7755889892578125, 0.808685302734375, 0.8417816162109375, 0.8748779296875, 0.9079742431640625, 0.941070556640625, 0.9741668701171875, 1.00726318359375, 1.0403594970703125, 1.073455810546875, 1.1065521240234375, 1.1396484375]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 6.0, 12.0, 11.0, 12.0, 16.0, 21.0, 39.0, 28.0, 36.0, 40.0, 37.0, 56.0, 34.0, 47.0, 40.0, 52.0, 44.0, 44.0, 45.0, 44.0, 41.0, 33.0, 39.0, 27.0, 39.0, 31.0, 19.0, 14.0, 19.0, 12.0, 15.0, 8.0, 9.0, 3.0, 1.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.71484375, -4.584136962890625, -4.45343017578125, -4.322723388671875, -4.1920166015625, -4.061309814453125, -3.93060302734375, -3.799896240234375, -3.669189453125, -3.538482666015625, -3.40777587890625, -3.277069091796875, -3.1463623046875, -3.015655517578125, -2.88494873046875, -2.754241943359375, -2.62353515625, -2.492828369140625, -2.36212158203125, -2.231414794921875, -2.1007080078125, -1.970001220703125, -1.83929443359375, -1.708587646484375, -1.577880859375, -1.447174072265625, -1.31646728515625, -1.185760498046875, -1.0550537109375, -0.924346923828125, -0.79364013671875, -0.662933349609375, -0.5322265625, -0.401519775390625, -0.27081298828125, -0.140106201171875, -0.0093994140625, 0.121307373046875, 0.25201416015625, 0.382720947265625, 0.513427734375, 0.644134521484375, 0.77484130859375, 0.905548095703125, 1.0362548828125, 1.166961669921875, 1.29766845703125, 1.428375244140625, 1.55908203125, 1.689788818359375, 1.82049560546875, 1.951202392578125, 2.0819091796875, 2.212615966796875, 2.34332275390625, 2.474029541015625, 2.604736328125, 2.735443115234375, 2.86614990234375, 2.996856689453125, 3.1275634765625, 3.258270263671875, 3.38897705078125, 3.519683837890625, 3.650390625]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 5.0, 9.0, 7.0, 14.0, 21.0, 18.0, 30.0, 36.0, 55.0, 79.0, 103.0, 130.0, 199.0, 291.0, 447.0, 713.0, 1178.0, 2117.0, 4864.0, 13497.0, 56126.0, 921558.0, 30427.0, 8667.0, 3515.0, 1647.0, 964.0, 570.0, 378.0, 261.0, 162.0, 112.0, 93.0, 94.0, 46.0, 25.0, 22.0, 21.0, 14.0, 11.0, 12.0, 8.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.544921875, -2.466156005859375, -2.38739013671875, -2.308624267578125, -2.2298583984375, -2.151092529296875, -2.07232666015625, -1.993560791015625, -1.914794921875, -1.836029052734375, -1.75726318359375, -1.678497314453125, -1.5997314453125, -1.520965576171875, -1.44219970703125, -1.363433837890625, -1.28466796875, -1.205902099609375, -1.12713623046875, -1.048370361328125, -0.9696044921875, -0.890838623046875, -0.81207275390625, -0.733306884765625, -0.654541015625, -0.575775146484375, -0.49700927734375, -0.418243408203125, -0.3394775390625, -0.260711669921875, -0.18194580078125, -0.103179931640625, -0.0244140625, 0.054351806640625, 0.13311767578125, 0.211883544921875, 0.2906494140625, 0.369415283203125, 0.44818115234375, 0.526947021484375, 0.605712890625, 0.684478759765625, 0.76324462890625, 0.842010498046875, 0.9207763671875, 0.999542236328125, 1.07830810546875, 1.157073974609375, 1.23583984375, 1.314605712890625, 1.39337158203125, 1.472137451171875, 1.5509033203125, 1.629669189453125, 1.70843505859375, 1.787200927734375, 1.865966796875, 1.944732666015625, 2.02349853515625, 2.102264404296875, 2.1810302734375, 2.259796142578125, 2.33856201171875, 2.417327880859375, 2.49609375]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 6.0, 6.0, 7.0, 11.0, 10.0, 10.0, 17.0, 15.0, 16.0, 16.0, 24.0, 24.0, 24.0, 31.0, 33.0, 23.0, 29.0, 35.0, 42.0, 38.0, 42.0, 36.0, 46.0, 37.0, 43.0, 37.0, 33.0, 31.0, 44.0, 32.0, 22.0, 26.0, 18.0, 23.0, 17.0, 18.0, 13.0, 11.0, 8.0, 8.0, 6.0, 17.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.24609375, -2.1773681640625, -2.108642578125, -2.0399169921875, -1.97119140625, -1.9024658203125, -1.833740234375, -1.7650146484375, -1.6962890625, -1.6275634765625, -1.558837890625, -1.4901123046875, -1.42138671875, -1.3526611328125, -1.283935546875, -1.2152099609375, -1.146484375, -1.0777587890625, -1.009033203125, -0.9403076171875, -0.87158203125, -0.8028564453125, -0.734130859375, -0.6654052734375, -0.5966796875, -0.5279541015625, -0.459228515625, -0.3905029296875, -0.32177734375, -0.2530517578125, -0.184326171875, -0.1156005859375, -0.046875, 0.0218505859375, 0.090576171875, 0.1593017578125, 0.22802734375, 0.2967529296875, 0.365478515625, 0.4342041015625, 0.5029296875, 0.5716552734375, 0.640380859375, 0.7091064453125, 0.77783203125, 0.8465576171875, 0.915283203125, 0.9840087890625, 1.052734375, 1.1214599609375, 1.190185546875, 1.2589111328125, 1.32763671875, 1.3963623046875, 1.465087890625, 1.5338134765625, 1.6025390625, 1.6712646484375, 1.739990234375, 1.8087158203125, 1.87744140625, 1.9461669921875, 2.014892578125, 2.0836181640625, 2.15234375]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 3.0, 17.0, 16.0, 22.0, 21.0, 35.0, 50.0, 77.0, 89.0, 147.0, 241.0, 312.0, 504.0, 942.0, 1718.0, 3810.0, 10337.0, 46548.0, 947397.0, 23382.0, 6770.0, 2640.0, 1364.0, 727.0, 473.0, 305.0, 187.0, 116.0, 71.0, 68.0, 43.0, 38.0, 25.0, 15.0, 7.0, 6.0, 12.0, 4.0, 2.0, 7.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.296875, -0.287078857421875, -0.27728271484375, -0.267486572265625, -0.2576904296875, -0.247894287109375, -0.23809814453125, -0.228302001953125, -0.218505859375, -0.208709716796875, -0.19891357421875, -0.189117431640625, -0.1793212890625, -0.169525146484375, -0.15972900390625, -0.149932861328125, -0.14013671875, -0.130340576171875, -0.12054443359375, -0.110748291015625, -0.1009521484375, -0.091156005859375, -0.08135986328125, -0.071563720703125, -0.061767578125, -0.051971435546875, -0.04217529296875, -0.032379150390625, -0.0225830078125, -0.012786865234375, -0.00299072265625, 0.006805419921875, 0.0166015625, 0.026397705078125, 0.03619384765625, 0.045989990234375, 0.0557861328125, 0.065582275390625, 0.07537841796875, 0.085174560546875, 0.094970703125, 0.104766845703125, 0.11456298828125, 0.124359130859375, 0.1341552734375, 0.143951416015625, 0.15374755859375, 0.163543701171875, 0.17333984375, 0.183135986328125, 0.19293212890625, 0.202728271484375, 0.2125244140625, 0.222320556640625, 0.23211669921875, 0.241912841796875, 0.251708984375, 0.261505126953125, 0.27130126953125, 0.281097412109375, 0.2908935546875, 0.300689697265625, 0.31048583984375, 0.320281982421875, 0.330078125]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 5.0, 7.0, 3.0, 12.0, 10.0, 15.0, 22.0, 19.0, 32.0, 36.0, 33.0, 51.0, 52.0, 61.0, 68.0, 57.0, 72.0, 57.0, 57.0, 50.0, 52.0, 43.0, 38.0, 32.0, 27.0, 17.0, 13.0, 19.0, 7.0, 11.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439188003540039e-05, -3.3359043300151825e-05, -3.232620656490326e-05, -3.1293369829654694e-05, -3.0260533094406128e-05, -2.9227696359157562e-05, -2.8194859623908997e-05, -2.716202288866043e-05, -2.6129186153411865e-05, -2.50963494181633e-05, -2.4063512682914734e-05, -2.3030675947666168e-05, -2.1997839212417603e-05, -2.0965002477169037e-05, -1.993216574192047e-05, -1.8899329006671906e-05, -1.786649227142334e-05, -1.6833655536174774e-05, -1.580081880092621e-05, -1.4767982065677643e-05, -1.3735145330429077e-05, -1.2702308595180511e-05, -1.1669471859931946e-05, -1.063663512468338e-05, -9.603798389434814e-06, -8.570961654186249e-06, -7.538124918937683e-06, -6.5052881836891174e-06, -5.472451448440552e-06, -4.439614713191986e-06, -3.4067779779434204e-06, -2.3739412426948547e-06, -1.341104507446289e-06, -3.082677721977234e-07, 7.245689630508423e-07, 1.757405698299408e-06, 2.7902424335479736e-06, 3.823079168796539e-06, 4.855915904045105e-06, 5.888752639293671e-06, 6.921589374542236e-06, 7.954426109790802e-06, 8.987262845039368e-06, 1.0020099580287933e-05, 1.1052936315536499e-05, 1.2085773050785065e-05, 1.311860978603363e-05, 1.4151446521282196e-05, 1.5184283256530762e-05, 1.6217119991779327e-05, 1.7249956727027893e-05, 1.828279346227646e-05, 1.9315630197525024e-05, 2.034846693277359e-05, 2.1381303668022156e-05, 2.241414040327072e-05, 2.3446977138519287e-05, 2.4479813873767853e-05, 2.551265060901642e-05, 2.6545487344264984e-05, 2.757832407951355e-05, 2.8611160814762115e-05, 2.964399755001068e-05, 3.067683428525925e-05, 3.170967102050781e-05]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 7.0, 16.0, 8.0, 10.0, 17.0, 11.0, 23.0, 21.0, 29.0, 57.0, 53.0, 57.0, 84.0, 96.0, 133.0, 188.0, 686.0, 23018.0, 997682.0, 24804.0, 694.0, 221.0, 125.0, 109.0, 89.0, 65.0, 54.0, 34.0, 38.0, 25.0, 26.0, 16.0, 16.0, 8.0, 9.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.623046875, -0.6044540405273438, -0.5858612060546875, -0.5672683715820312, -0.548675537109375, -0.5300827026367188, -0.5114898681640625, -0.49289703369140625, -0.47430419921875, -0.45571136474609375, -0.4371185302734375, -0.41852569580078125, -0.399932861328125, -0.38134002685546875, -0.3627471923828125, -0.34415435791015625, -0.3255615234375, -0.30696868896484375, -0.2883758544921875, -0.26978302001953125, -0.251190185546875, -0.23259735107421875, -0.2140045166015625, -0.19541168212890625, -0.17681884765625, -0.15822601318359375, -0.1396331787109375, -0.12104034423828125, -0.102447509765625, -0.08385467529296875, -0.0652618408203125, -0.04666900634765625, -0.028076171875, -0.00948333740234375, 0.0091094970703125, 0.02770233154296875, 0.046295166015625, 0.06488800048828125, 0.0834808349609375, 0.10207366943359375, 0.12066650390625, 0.13925933837890625, 0.1578521728515625, 0.17644500732421875, 0.195037841796875, 0.21363067626953125, 0.2322235107421875, 0.25081634521484375, 0.2694091796875, 0.28800201416015625, 0.3065948486328125, 0.32518768310546875, 0.343780517578125, 0.36237335205078125, 0.3809661865234375, 0.39955902099609375, 0.41815185546875, 0.43674468994140625, 0.4553375244140625, 0.47393035888671875, 0.492523193359375, 0.5111160278320312, 0.5297088623046875, 0.5483016967773438, 0.56689453125]}, "gradients/decoder.roberta.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 6.0, 9.0, 7.0, 11.0, 6.0, 7.0, 15.0, 13.0, 11.0, 17.0, 21.0, 25.0, 18.0, 31.0, 47.0, 35.0, 58.0, 66.0, 66.0, 58.0, 68.0, 61.0, 56.0, 37.0, 48.0, 22.0, 24.0, 20.0, 16.0, 17.0, 23.0, 14.0, 13.0, 10.0, 6.0, 5.0, 6.0, 1.0, 7.0, 5.0, 6.0, 7.0, 4.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.024505615234375, -0.02367091178894043, -0.02283620834350586, -0.02200150489807129, -0.02116680145263672, -0.02033209800720215, -0.019497394561767578, -0.018662691116333008, -0.017827987670898438, -0.016993284225463867, -0.016158580780029297, -0.015323877334594727, -0.014489173889160156, -0.013654470443725586, -0.012819766998291016, -0.011985063552856445, -0.011150360107421875, -0.010315656661987305, -0.009480953216552734, -0.008646249771118164, -0.007811546325683594, -0.0069768428802490234, -0.006142139434814453, -0.005307435989379883, -0.0044727325439453125, -0.003638029098510742, -0.002803325653076172, -0.0019686222076416016, -0.0011339187622070312, -0.00029921531677246094, 0.0005354881286621094, 0.0013701915740966797, 0.00220489501953125, 0.0030395984649658203, 0.0038743019104003906, 0.004709005355834961, 0.005543708801269531, 0.0063784122467041016, 0.007213115692138672, 0.008047819137573242, 0.008882522583007812, 0.009717226028442383, 0.010551929473876953, 0.011386632919311523, 0.012221336364746094, 0.013056039810180664, 0.013890743255615234, 0.014725446701049805, 0.015560150146484375, 0.016394853591918945, 0.017229557037353516, 0.018064260482788086, 0.018898963928222656, 0.019733667373657227, 0.020568370819091797, 0.021403074264526367, 0.022237777709960938, 0.023072481155395508, 0.023907184600830078, 0.02474188804626465, 0.02557659149169922, 0.02641129493713379, 0.02724599838256836, 0.02808070182800293, 0.0289154052734375]}, "gradients/decoder.roberta.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 10.0, 10.0, 16.0, 20.0, 28.0, 43.0, 59.0, 67.0, 83.0, 98.0, 85.0, 92.0, 80.0, 73.0, 59.0, 45.0, 42.0, 31.0, 26.0, 13.0, 6.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.437884569168091, -2.3147904872894287, -2.1916964054107666, -2.0686023235321045, -1.9455082416534424, -1.8224141597747803, -1.6993201971054077, -1.5762261152267456, -1.4531320333480835, -1.3300379514694214, -1.2069438695907593, -1.0838499069213867, -0.9607557654380798, -0.8376616835594177, -0.7145676612854004, -0.5914735794067383, -0.46837949752807617, -0.34528541564941406, -0.22219136357307434, -0.09909731149673462, 0.02399677038192749, 0.1470908522605896, 0.27018487453460693, 0.39327895641326904, 0.5163730382919312, 0.6394671201705933, 0.7625612020492554, 0.8856552243232727, 1.00874924659729, 1.1318433284759521, 1.2549374103546143, 1.3780314922332764, 1.5011258125305176, 1.6242198944091797, 1.7473139762878418, 1.870408058166504, 1.993502140045166, 2.116596221923828, 2.2396903038024902, 2.3627843856811523, 2.4858784675598145, 2.6089725494384766, 2.7320666313171387, 2.855160713195801, 2.978254795074463, 3.101348876953125, 3.224442958831787, 3.347537040710449, 3.4706308841705322, 3.5937249660491943, 3.7168190479278564, 3.8399131298065186, 3.9630072116851807, 4.086101055145264, 4.209195137023926, 4.332289218902588, 4.45538330078125, 4.578477382659912, 4.701571464538574, 4.824665546417236, 4.947759628295898, 5.0708537101745605, 5.193947792053223, 5.317041873931885, 5.440135955810547]}, "gradients/decoder.roberta.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 6.0, 12.0, 10.0, 14.0, 13.0, 24.0, 39.0, 27.0, 37.0, 39.0, 37.0, 56.0, 35.0, 46.0, 41.0, 47.0, 49.0, 43.0, 45.0, 43.0, 45.0, 30.0, 38.0, 30.0, 37.0, 31.0, 19.0, 14.0, 19.0, 12.0, 15.0, 8.0, 9.0, 3.0, 1.0, 10.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.717009544372559, -4.586215019226074, -4.45542049407959, -4.324625492095947, -4.193830966949463, -4.0630364418029785, -3.932241678237915, -3.8014469146728516, -3.670652389526367, -3.539857864379883, -3.4090631008148193, -3.278268337249756, -3.1474738121032715, -3.016679286956787, -2.8858845233917236, -2.75508975982666, -2.624295234680176, -2.4935007095336914, -2.362705945968628, -2.2319111824035645, -2.10111665725708, -1.9703220129013062, -1.8395273685455322, -1.7087327241897583, -1.5779380798339844, -1.4471434354782104, -1.3163487911224365, -1.1855541467666626, -1.0547595024108887, -0.9239648580551147, -0.7931702136993408, -0.6623755693435669, -0.5315811634063721, -0.40078651905059814, -0.2699918746948242, -0.1391972303390503, -0.008402585983276367, 0.12239205837249756, 0.2531867027282715, 0.3839813470840454, 0.5147759914398193, 0.6455706357955933, 0.7763652801513672, 0.9071599245071411, 1.037954568862915, 1.168749213218689, 1.299543857574463, 1.4303385019302368, 1.5611331462860107, 1.6919277906417847, 1.8227224349975586, 1.9535170793533325, 2.0843117237091064, 2.21510648727417, 2.3459010124206543, 2.4766955375671387, 2.607490301132202, 2.7382850646972656, 2.86907958984375, 2.9998741149902344, 3.130668878555298, 3.2614636421203613, 3.3922581672668457, 3.52305269241333, 3.6538474559783936]}, "gradients/decoder.roberta.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 7.0, 6.0, 10.0, 14.0, 18.0, 24.0, 49.0, 66.0, 90.0, 145.0, 250.0, 467.0, 680.0, 1226.0, 2271.0, 4691.0, 10331.0, 25470.0, 65506.0, 174207.0, 378981.0, 235512.0, 88507.0, 34009.0, 13641.0, 5974.0, 2799.0, 1515.0, 827.0, 468.0, 274.0, 168.0, 118.0, 79.0, 48.0, 37.0, 20.0, 16.0, 11.0, 8.0, 11.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.171875, -3.082916259765625, -2.99395751953125, -2.904998779296875, -2.8160400390625, -2.727081298828125, -2.63812255859375, -2.549163818359375, -2.460205078125, -2.371246337890625, -2.28228759765625, -2.193328857421875, -2.1043701171875, -2.015411376953125, -1.92645263671875, -1.837493896484375, -1.74853515625, -1.659576416015625, -1.57061767578125, -1.481658935546875, -1.3927001953125, -1.303741455078125, -1.21478271484375, -1.125823974609375, -1.036865234375, -0.947906494140625, -0.85894775390625, -0.769989013671875, -0.6810302734375, -0.592071533203125, -0.50311279296875, -0.414154052734375, -0.3251953125, -0.236236572265625, -0.14727783203125, -0.058319091796875, 0.0306396484375, 0.119598388671875, 0.20855712890625, 0.297515869140625, 0.386474609375, 0.475433349609375, 0.56439208984375, 0.653350830078125, 0.7423095703125, 0.831268310546875, 0.92022705078125, 1.009185791015625, 1.09814453125, 1.187103271484375, 1.27606201171875, 1.365020751953125, 1.4539794921875, 1.542938232421875, 1.63189697265625, 1.720855712890625, 1.809814453125, 1.898773193359375, 1.98773193359375, 2.076690673828125, 2.1656494140625, 2.254608154296875, 2.34356689453125, 2.432525634765625, 2.521484375]}, "gradients/decoder.roberta.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 5.0, 5.0, 14.0, 10.0, 17.0, 15.0, 21.0, 39.0, 35.0, 32.0, 37.0, 48.0, 44.0, 43.0, 45.0, 39.0, 53.0, 47.0, 39.0, 48.0, 37.0, 51.0, 25.0, 40.0, 35.0, 26.0, 32.0, 17.0, 20.0, 12.0, 16.0, 13.0, 5.0, 9.0, 2.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.4453125, -4.321136474609375, -4.19696044921875, -4.072784423828125, -3.9486083984375, -3.824432373046875, -3.70025634765625, -3.576080322265625, -3.451904296875, -3.327728271484375, -3.20355224609375, -3.079376220703125, -2.9552001953125, -2.831024169921875, -2.70684814453125, -2.582672119140625, -2.45849609375, -2.334320068359375, -2.21014404296875, -2.085968017578125, -1.9617919921875, -1.837615966796875, -1.71343994140625, -1.589263916015625, -1.465087890625, -1.340911865234375, -1.21673583984375, -1.092559814453125, -0.9683837890625, -0.844207763671875, -0.72003173828125, -0.595855712890625, -0.4716796875, -0.347503662109375, -0.22332763671875, -0.099151611328125, 0.0250244140625, 0.149200439453125, 0.27337646484375, 0.397552490234375, 0.521728515625, 0.645904541015625, 0.77008056640625, 0.894256591796875, 1.0184326171875, 1.142608642578125, 1.26678466796875, 1.390960693359375, 1.51513671875, 1.639312744140625, 1.76348876953125, 1.887664794921875, 2.0118408203125, 2.136016845703125, 2.26019287109375, 2.384368896484375, 2.508544921875, 2.632720947265625, 2.75689697265625, 2.881072998046875, 3.0052490234375, 3.129425048828125, 3.25360107421875, 3.377777099609375, 3.501953125]}, "gradients/decoder.roberta.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 5.0, 6.0, 11.0, 13.0, 21.0, 16.0, 12.0, 28.0, 28.0, 43.0, 41.0, 44.0, 36.0, 54.0, 58.0, 132.0, 822.0, 1046441.0, 257.0, 97.0, 60.0, 53.0, 36.0, 34.0, 28.0, 29.0, 27.0, 13.0, 19.0, 13.0, 13.0, 11.0, 8.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-112.0625, -108.58984375, -105.1171875, -101.64453125, -98.171875, -94.69921875, -91.2265625, -87.75390625, -84.28125, -80.80859375, -77.3359375, -73.86328125, -70.390625, -66.91796875, -63.4453125, -59.97265625, -56.5, -53.02734375, -49.5546875, -46.08203125, -42.609375, -39.13671875, -35.6640625, -32.19140625, -28.71875, -25.24609375, -21.7734375, -18.30078125, -14.828125, -11.35546875, -7.8828125, -4.41015625, -0.9375, 2.53515625, 6.0078125, 9.48046875, 12.953125, 16.42578125, 19.8984375, 23.37109375, 26.84375, 30.31640625, 33.7890625, 37.26171875, 40.734375, 44.20703125, 47.6796875, 51.15234375, 54.625, 58.09765625, 61.5703125, 65.04296875, 68.515625, 71.98828125, 75.4609375, 78.93359375, 82.40625, 85.87890625, 89.3515625, 92.82421875, 96.296875, 99.76953125, 103.2421875, 106.71484375, 110.1875]}, "gradients/decoder.roberta.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 3.0, 17.0, 11.0, 19.0, 6.0, 15.0, 16.0, 24.0, 27.0, 30.0, 36.0, 39.0, 41.0, 53.0, 44.0, 49.0, 40.0, 47.0, 39.0, 45.0, 46.0, 39.0, 40.0, 36.0, 47.0, 35.0, 26.0, 17.0, 15.0, 20.0, 14.0, 15.0, 7.0, 4.0, 6.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.611328125, -3.4981689453125, -3.385009765625, -3.2718505859375, -3.15869140625, -3.0455322265625, -2.932373046875, -2.8192138671875, -2.7060546875, -2.5928955078125, -2.479736328125, -2.3665771484375, -2.25341796875, -2.1402587890625, -2.027099609375, -1.9139404296875, -1.80078125, -1.6876220703125, -1.574462890625, -1.4613037109375, -1.34814453125, -1.2349853515625, -1.121826171875, -1.0086669921875, -0.8955078125, -0.7823486328125, -0.669189453125, -0.5560302734375, -0.44287109375, -0.3297119140625, -0.216552734375, -0.1033935546875, 0.009765625, 0.1229248046875, 0.236083984375, 0.3492431640625, 0.46240234375, 0.5755615234375, 0.688720703125, 0.8018798828125, 0.9150390625, 1.0281982421875, 1.141357421875, 1.2545166015625, 1.36767578125, 1.4808349609375, 1.593994140625, 1.7071533203125, 1.8203125, 1.9334716796875, 2.046630859375, 2.1597900390625, 2.27294921875, 2.3861083984375, 2.499267578125, 2.6124267578125, 2.7255859375, 2.8387451171875, 2.951904296875, 3.0650634765625, 3.17822265625, 3.2913818359375, 3.404541015625, 3.5177001953125, 3.630859375]}, "gradients/decoder.roberta.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 13.0, 7.0, 9.0, 20.0, 42.0, 107.0, 250.0, 2209.0, 1042352.0, 3064.0, 277.0, 95.0, 56.0, 22.0, 13.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.328125, -20.65185546875, -19.9755859375, -19.29931640625, -18.623046875, -17.94677734375, -17.2705078125, -16.59423828125, -15.91796875, -15.24169921875, -14.5654296875, -13.88916015625, -13.212890625, -12.53662109375, -11.8603515625, -11.18408203125, -10.5078125, -9.83154296875, -9.1552734375, -8.47900390625, -7.802734375, -7.12646484375, -6.4501953125, -5.77392578125, -5.09765625, -4.42138671875, -3.7451171875, -3.06884765625, -2.392578125, -1.71630859375, -1.0400390625, -0.36376953125, 0.3125, 0.98876953125, 1.6650390625, 2.34130859375, 3.017578125, 3.69384765625, 4.3701171875, 5.04638671875, 5.72265625, 6.39892578125, 7.0751953125, 7.75146484375, 8.427734375, 9.10400390625, 9.7802734375, 10.45654296875, 11.1328125, 11.80908203125, 12.4853515625, 13.16162109375, 13.837890625, 14.51416015625, 15.1904296875, 15.86669921875, 16.54296875, 17.21923828125, 17.8955078125, 18.57177734375, 19.248046875, 19.92431640625, 20.6005859375, 21.27685546875, 21.953125]}, "gradients/decoder.roberta.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 8.0, 6.0, 9.0, 20.0, 27.0, 36.0, 56.0, 94.0, 134.0, 144.0, 141.0, 117.0, 79.0, 35.0, 27.0, 22.0, 17.0, 13.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001989603042602539, -0.00019093044102191925, -0.0001829005777835846, -0.00017487071454524994, -0.00016684085130691528, -0.00015881098806858063, -0.00015078112483024597, -0.00014275126159191132, -0.00013472139835357666, -0.000126691535115242, -0.00011866167187690735, -0.00011063180863857269, -0.00010260194540023804, -9.457208216190338e-05, -8.654221892356873e-05, -7.851235568523407e-05, -7.048249244689941e-05, -6.245262920856476e-05, -5.44227659702301e-05, -4.639290273189545e-05, -3.836303949356079e-05, -3.0333176255226135e-05, -2.230331301689148e-05, -1.4273449778556824e-05, -6.243586540222168e-06, 1.7862766981124878e-06, 9.816139936447144e-06, 1.78460031747818e-05, 2.5875866413116455e-05, 3.390572965145111e-05, 4.1935592889785767e-05, 4.996545612812042e-05, 5.799531936645508e-05, 6.602518260478973e-05, 7.405504584312439e-05, 8.208490908145905e-05, 9.01147723197937e-05, 9.814463555812836e-05, 0.00010617449879646301, 0.00011420436203479767, 0.00012223422527313232, 0.00013026408851146698, 0.00013829395174980164, 0.0001463238149881363, 0.00015435367822647095, 0.0001623835414648056, 0.00017041340470314026, 0.00017844326794147491, 0.00018647313117980957, 0.00019450299441814423, 0.00020253285765647888, 0.00021056272089481354, 0.0002185925841331482, 0.00022662244737148285, 0.0002346523106098175, 0.00024268217384815216, 0.0002507120370864868, 0.00025874190032482147, 0.00026677176356315613, 0.0002748016268014908, 0.00028283149003982544, 0.0002908613532781601, 0.00029889121651649475, 0.0003069210797548294, 0.00031495094299316406]}, "gradients/decoder.roberta.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 7.0, 22.0, 66.0, 279.0, 2374.0, 1042417.0, 3004.0, 262.0, 67.0, 21.0, 18.0, 9.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.71875, -32.886962890625, -32.05517578125, -31.223388671875, -30.3916015625, -29.559814453125, -28.72802734375, -27.896240234375, -27.064453125, -26.232666015625, -25.40087890625, -24.569091796875, -23.7373046875, -22.905517578125, -22.07373046875, -21.241943359375, -20.41015625, -19.578369140625, -18.74658203125, -17.914794921875, -17.0830078125, -16.251220703125, -15.41943359375, -14.587646484375, -13.755859375, -12.924072265625, -12.09228515625, -11.260498046875, -10.4287109375, -9.596923828125, -8.76513671875, -7.933349609375, -7.1015625, -6.269775390625, -5.43798828125, -4.606201171875, -3.7744140625, -2.942626953125, -2.11083984375, -1.279052734375, -0.447265625, 0.384521484375, 1.21630859375, 2.048095703125, 2.8798828125, 3.711669921875, 4.54345703125, 5.375244140625, 6.20703125, 7.038818359375, 7.87060546875, 8.702392578125, 9.5341796875, 10.365966796875, 11.19775390625, 12.029541015625, 12.861328125, 13.693115234375, 14.52490234375, 15.356689453125, 16.1884765625, 17.020263671875, 17.85205078125, 18.683837890625, 19.515625]}, "gradients/decoder.roberta.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 7.0, 16.0, 27.0, 75.0, 199.0, 374.0, 186.0, 66.0, 32.0, 13.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201171875, -1.1519775390625, -1.102783203125, -1.0535888671875, -1.00439453125, -0.9552001953125, -0.906005859375, -0.8568115234375, -0.8076171875, -0.7584228515625, -0.709228515625, -0.6600341796875, -0.61083984375, -0.5616455078125, -0.512451171875, -0.4632568359375, -0.4140625, -0.3648681640625, -0.315673828125, -0.2664794921875, -0.21728515625, -0.1680908203125, -0.118896484375, -0.0697021484375, -0.0205078125, 0.0286865234375, 0.077880859375, 0.1270751953125, 0.17626953125, 0.2254638671875, 0.274658203125, 0.3238525390625, 0.373046875, 0.4222412109375, 0.471435546875, 0.5206298828125, 0.56982421875, 0.6190185546875, 0.668212890625, 0.7174072265625, 0.7666015625, 0.8157958984375, 0.864990234375, 0.9141845703125, 0.96337890625, 1.0125732421875, 1.061767578125, 1.1109619140625, 1.16015625, 1.2093505859375, 1.258544921875, 1.3077392578125, 1.35693359375, 1.4061279296875, 1.455322265625, 1.5045166015625, 1.5537109375, 1.6029052734375, 1.652099609375, 1.7012939453125, 1.75048828125, 1.7996826171875, 1.848876953125, 1.8980712890625, 1.947265625]}, "gradients/decoder.roberta.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 6.0, 10.0, 34.0, 58.0, 143.0, 193.0, 203.0, 183.0, 92.0, 59.0, 24.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7119712829589844, -2.422975540161133, -2.1339797973632812, -1.8449838161468506, -1.555988073348999, -1.2669923305511475, -0.9779964685440063, -0.6890006065368652, -0.40000486373901367, -0.11100906133651733, 0.177986741065979, 0.46698254346847534, 0.7559783458709717, 1.0449740886688232, 1.3339699506759644, 1.6229658126831055, 1.911961555480957, 2.2009572982788086, 2.48995304107666, 2.778949022293091, 3.0679447650909424, 3.356940507888794, 3.6459364891052246, 3.934932231903076, 4.223927974700928, 4.512923717498779, 4.801919460296631, 5.090915203094482, 5.379911422729492, 5.668907165527344, 5.957902908325195, 6.246898651123047, 6.535894393920898, 6.82489013671875, 7.113885879516602, 7.402881622314453, 7.691877365112305, 7.980873107910156, 8.269868850708008, 8.55886459350586, 8.847860336303711, 9.136856079101562, 9.425851821899414, 9.714847564697266, 10.003843307495117, 10.292839050292969, 10.58183479309082, 10.870830535888672, 11.15982723236084, 11.448822975158691, 11.737818717956543, 12.026814460754395, 12.315810203552246, 12.604805946350098, 12.89380168914795, 13.182798385620117, 13.471794128417969, 13.76078987121582, 14.049785614013672, 14.338781356811523, 14.627777099609375, 14.916772842407227, 15.205768585205078, 15.49476432800293, 15.783760070800781]}, "gradients/decoder.roberta.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 13.0, 5.0, 10.0, 7.0, 12.0, 19.0, 21.0, 30.0, 26.0, 28.0, 32.0, 40.0, 29.0, 33.0, 42.0, 48.0, 38.0, 41.0, 45.0, 34.0, 59.0, 41.0, 38.0, 34.0, 34.0, 39.0, 30.0, 29.0, 27.0, 18.0, 13.0, 11.0, 16.0, 13.0, 12.0, 8.0, 5.0, 2.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.487273216247559, -4.345075607299805, -4.202877998352051, -4.060680866241455, -3.918483257293701, -3.7762856483459473, -3.6340880393981934, -3.4918904304504395, -3.3496930599212646, -3.2074954509735107, -3.065298080444336, -2.923100471496582, -2.780902862548828, -2.6387054920196533, -2.4965078830718994, -2.3543105125427246, -2.2121129035949707, -2.069915294647217, -1.927717924118042, -1.785520315170288, -1.6433228254318237, -1.5011253356933594, -1.3589277267456055, -1.2167302370071411, -1.0745327472686768, -0.9323352575302124, -0.7901377081871033, -0.6479401588439941, -0.5057426691055298, -0.36354517936706543, -0.2213476300239563, -0.07915008068084717, 0.06304740905761719, 0.20524492859840393, 0.3474424481391907, 0.4896399676799774, 0.6318374872207642, 0.7740349769592285, 0.9162325263023376, 1.0584300756454468, 1.2006275653839111, 1.3428250551223755, 1.4850225448608398, 1.6272201538085938, 1.769417643547058, 1.9116151332855225, 2.0538127422332764, 2.196010112762451, 2.338207721710205, 2.480405330657959, 2.622602701187134, 2.7648003101348877, 2.9069976806640625, 3.0491952896118164, 3.1913928985595703, 3.333590507507324, 3.475787878036499, 3.617985486984253, 3.7601828575134277, 3.9023804664611816, 4.0445780754089355, 4.186775207519531, 4.328972816467285, 4.471170425415039, 4.613368034362793]}, "gradients/decoder.roberta.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 2.0, 8.0, 15.0, 13.0, 16.0, 20.0, 22.0, 29.0, 59.0, 52.0, 70.0, 77.0, 116.0, 128.0, 179.0, 262.0, 521.0, 1891.0, 54549.0, 4011639.0, 120281.0, 2622.0, 553.0, 269.0, 181.0, 155.0, 105.0, 81.0, 66.0, 60.0, 41.0, 34.0, 34.0, 28.0, 11.0, 25.0, 12.0, 11.0, 6.0, 8.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-18.90625, -18.374755859375, -17.84326171875, -17.311767578125, -16.7802734375, -16.248779296875, -15.71728515625, -15.185791015625, -14.654296875, -14.122802734375, -13.59130859375, -13.059814453125, -12.5283203125, -11.996826171875, -11.46533203125, -10.933837890625, -10.40234375, -9.870849609375, -9.33935546875, -8.807861328125, -8.2763671875, -7.744873046875, -7.21337890625, -6.681884765625, -6.150390625, -5.618896484375, -5.08740234375, -4.555908203125, -4.0244140625, -3.492919921875, -2.96142578125, -2.429931640625, -1.8984375, -1.366943359375, -0.83544921875, -0.303955078125, 0.2275390625, 0.759033203125, 1.29052734375, 1.822021484375, 2.353515625, 2.885009765625, 3.41650390625, 3.947998046875, 4.4794921875, 5.010986328125, 5.54248046875, 6.073974609375, 6.60546875, 7.136962890625, 7.66845703125, 8.199951171875, 8.7314453125, 9.262939453125, 9.79443359375, 10.325927734375, 10.857421875, 11.388916015625, 11.92041015625, 12.451904296875, 12.9833984375, 13.514892578125, 14.04638671875, 14.577880859375, 15.109375]}, "gradients/decoder.roberta.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 2.0, 5.0, 6.0, 17.0, 14.0, 13.0, 16.0, 21.0, 34.0, 30.0, 27.0, 29.0, 36.0, 22.0, 40.0, 38.0, 39.0, 47.0, 60.0, 43.0, 41.0, 46.0, 52.0, 45.0, 19.0, 26.0, 38.0, 24.0, 23.0, 20.0, 17.0, 12.0, 15.0, 12.0, 15.0, 15.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.015625, -2.92938232421875, -2.8431396484375, -2.75689697265625, -2.670654296875, -2.58441162109375, -2.4981689453125, -2.41192626953125, -2.32568359375, -2.23944091796875, -2.1531982421875, -2.06695556640625, -1.980712890625, -1.89447021484375, -1.8082275390625, -1.72198486328125, -1.6357421875, -1.54949951171875, -1.4632568359375, -1.37701416015625, -1.290771484375, -1.20452880859375, -1.1182861328125, -1.03204345703125, -0.94580078125, -0.85955810546875, -0.7733154296875, -0.68707275390625, -0.600830078125, -0.51458740234375, -0.4283447265625, -0.34210205078125, -0.255859375, -0.16961669921875, -0.0833740234375, 0.00286865234375, 0.089111328125, 0.17535400390625, 0.2615966796875, 0.34783935546875, 0.43408203125, 0.52032470703125, 0.6065673828125, 0.69281005859375, 0.779052734375, 0.86529541015625, 0.9515380859375, 1.03778076171875, 1.1240234375, 1.21026611328125, 1.2965087890625, 1.38275146484375, 1.468994140625, 1.55523681640625, 1.6414794921875, 1.72772216796875, 1.81396484375, 1.90020751953125, 1.9864501953125, 2.07269287109375, 2.158935546875, 2.24517822265625, 2.3314208984375, 2.41766357421875, 2.50390625]}, "gradients/decoder.roberta.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 8.0, 21.0, 26.0, 33.0, 62.0, 86.0, 181.0, 252.0, 432.0, 1100.0, 10978.0, 4132655.0, 45608.0, 1517.0, 539.0, 286.0, 157.0, 92.0, 71.0, 55.0, 29.0, 18.0, 16.0, 12.0, 9.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-30.4375, -29.504638671875, -28.57177734375, -27.638916015625, -26.7060546875, -25.773193359375, -24.84033203125, -23.907470703125, -22.974609375, -22.041748046875, -21.10888671875, -20.176025390625, -19.2431640625, -18.310302734375, -17.37744140625, -16.444580078125, -15.51171875, -14.578857421875, -13.64599609375, -12.713134765625, -11.7802734375, -10.847412109375, -9.91455078125, -8.981689453125, -8.048828125, -7.115966796875, -6.18310546875, -5.250244140625, -4.3173828125, -3.384521484375, -2.45166015625, -1.518798828125, -0.5859375, 0.346923828125, 1.27978515625, 2.212646484375, 3.1455078125, 4.078369140625, 5.01123046875, 5.944091796875, 6.876953125, 7.809814453125, 8.74267578125, 9.675537109375, 10.6083984375, 11.541259765625, 12.47412109375, 13.406982421875, 14.33984375, 15.272705078125, 16.20556640625, 17.138427734375, 18.0712890625, 19.004150390625, 19.93701171875, 20.869873046875, 21.802734375, 22.735595703125, 23.66845703125, 24.601318359375, 25.5341796875, 26.467041015625, 27.39990234375, 28.332763671875, 29.265625]}, "gradients/decoder.roberta.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 11.0, 7.0, 8.0, 12.0, 14.0, 32.0, 27.0, 46.0, 55.0, 89.0, 147.0, 219.0, 349.0, 504.0, 601.0, 598.0, 462.0, 302.0, 208.0, 128.0, 73.0, 57.0, 37.0, 28.0, 18.0, 16.0, 6.0, 7.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4078521728515625, -1.360626220703125, -1.3134002685546875, -1.26617431640625, -1.2189483642578125, -1.171722412109375, -1.1244964599609375, -1.0772705078125, -1.0300445556640625, -0.982818603515625, -0.9355926513671875, -0.88836669921875, -0.8411407470703125, -0.793914794921875, -0.7466888427734375, -0.699462890625, -0.6522369384765625, -0.605010986328125, -0.5577850341796875, -0.51055908203125, -0.4633331298828125, -0.416107177734375, -0.3688812255859375, -0.3216552734375, -0.2744293212890625, -0.227203369140625, -0.1799774169921875, -0.13275146484375, -0.0855255126953125, -0.038299560546875, 0.0089263916015625, 0.05615234375, 0.1033782958984375, 0.150604248046875, 0.1978302001953125, 0.24505615234375, 0.2922821044921875, 0.339508056640625, 0.3867340087890625, 0.4339599609375, 0.4811859130859375, 0.528411865234375, 0.5756378173828125, 0.62286376953125, 0.6700897216796875, 0.717315673828125, 0.7645416259765625, 0.811767578125, 0.8589935302734375, 0.906219482421875, 0.9534454345703125, 1.00067138671875, 1.0478973388671875, 1.095123291015625, 1.1423492431640625, 1.1895751953125, 1.2368011474609375, 1.284027099609375, 1.3312530517578125, 1.37847900390625, 1.4257049560546875, 1.472930908203125, 1.5201568603515625, 1.5673828125]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 23.0, 37.0, 111.0, 220.0, 265.0, 177.0, 110.0, 49.0, 14.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5990474224090576, -2.2523324489593506, -1.9056177139282227, -1.5589027404785156, -1.2121878862380981, -0.8654730319976807, -0.5187580585479736, -0.1720433235168457, 0.17467164993286133, 0.5213865041732788, 0.8681014180183411, 1.2148163318634033, 1.5615311861038208, 1.9082460403442383, 2.2549610137939453, 2.6016757488250732, 2.9483907222747803, 3.2951056957244873, 3.6418204307556152, 3.9885354042053223, 4.335250377655029, 4.681964874267578, 5.028679847717285, 5.375394821166992, 5.722109794616699, 6.068824768066406, 6.415539741516113, 6.76225471496582, 7.108969211578369, 7.455684185028076, 7.802399158477783, 8.149113655090332, 8.495829582214355, 8.842544555664062, 9.18925952911377, 9.535974502563477, 9.882689476013184, 10.22940444946289, 10.576118469238281, 10.922833442687988, 11.269548416137695, 11.616263389587402, 11.96297836303711, 12.309693336486816, 12.656408309936523, 13.003122329711914, 13.349838256835938, 13.696552276611328, 14.043268203735352, 14.389983177185059, 14.736698150634766, 15.083413124084473, 15.43012809753418, 15.77684211730957, 16.123558044433594, 16.470272064208984, 16.816986083984375, 17.163700103759766, 17.51041603088379, 17.85713005065918, 18.203845977783203, 18.550559997558594, 18.897275924682617, 19.243989944458008, 19.59070587158203]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 6.0, 7.0, 11.0, 7.0, 16.0, 16.0, 17.0, 19.0, 22.0, 29.0, 28.0, 17.0, 25.0, 43.0, 43.0, 42.0, 42.0, 43.0, 36.0, 32.0, 47.0, 50.0, 43.0, 29.0, 36.0, 26.0, 31.0, 28.0, 22.0, 27.0, 30.0, 22.0, 22.0, 6.0, 13.0, 13.0, 9.0, 7.0, 8.0, 4.0, 9.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.850046396255493, -2.7553908824920654, -2.6607353687286377, -2.566079616546631, -2.471424102783203, -2.3767685890197754, -2.2821130752563477, -2.18745756149292, -2.092802047729492, -1.9981465339660645, -1.9034909009933472, -1.8088353872299194, -1.7141798734664917, -1.6195242404937744, -1.5248687267303467, -1.430213212966919, -1.3355575799942017, -1.240902066230774, -1.1462464332580566, -1.051590919494629, -0.9569354057312012, -0.8622798323631287, -0.7676242589950562, -0.6729687452316284, -0.5783131718635559, -0.4836576282978058, -0.38900208473205566, -0.29434651136398315, -0.19969096779823303, -0.10503542423248291, -0.0103798508644104, 0.08427566289901733, 0.17893123626708984, 0.27358677983283997, 0.3682423233985901, 0.4628978967666626, 0.5575534105300903, 0.6522089838981628, 0.7468645572662354, 0.8415200710296631, 0.9361756443977356, 1.030831217765808, 1.1254867315292358, 1.2201423645019531, 1.3147978782653809, 1.4094533920288086, 1.5041089057922363, 1.598764419555664, 1.6934200525283813, 1.788075566291809, 1.8827311992645264, 1.977386713027954, 2.072042226791382, 2.1666977405548096, 2.2613534927368164, 2.356009006500244, 2.450664520263672, 2.5453200340270996, 2.6399755477905273, 2.734631061553955, 2.829286813735962, 2.9239423274993896, 3.0185978412628174, 3.113253355026245, 3.207908868789673]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 19.0, 11.0, 24.0, 32.0, 51.0, 65.0, 88.0, 112.0, 164.0, 268.0, 339.0, 502.0, 698.0, 1064.0, 1586.0, 2251.0, 3294.0, 4833.0, 7591.0, 11479.0, 18127.0, 30110.0, 51776.0, 91735.0, 166063.0, 232243.0, 179124.0, 99985.0, 56103.0, 32453.0, 19631.0, 12596.0, 7789.0, 5176.0, 3529.0, 2333.0, 1574.0, 1152.0, 817.0, 475.0, 421.0, 275.0, 187.0, 125.0, 82.0, 67.0, 40.0, 31.0, 24.0, 13.0, 10.0, 5.0, 5.0, 4.0, 5.0, 0.0, 2.0, 1.0], "bins": [-0.50537109375, -0.4893646240234375, -0.473358154296875, -0.4573516845703125, -0.44134521484375, -0.4253387451171875, -0.409332275390625, -0.3933258056640625, -0.3773193359375, -0.3613128662109375, -0.345306396484375, -0.3292999267578125, -0.31329345703125, -0.2972869873046875, -0.281280517578125, -0.2652740478515625, -0.249267578125, -0.2332611083984375, -0.217254638671875, -0.2012481689453125, -0.18524169921875, -0.1692352294921875, -0.153228759765625, -0.1372222900390625, -0.1212158203125, -0.1052093505859375, -0.089202880859375, -0.0731964111328125, -0.05718994140625, -0.0411834716796875, -0.025177001953125, -0.0091705322265625, 0.0068359375, 0.0228424072265625, 0.038848876953125, 0.0548553466796875, 0.07086181640625, 0.0868682861328125, 0.102874755859375, 0.1188812255859375, 0.1348876953125, 0.1508941650390625, 0.166900634765625, 0.1829071044921875, 0.19891357421875, 0.2149200439453125, 0.230926513671875, 0.2469329833984375, 0.262939453125, 0.2789459228515625, 0.294952392578125, 0.3109588623046875, 0.32696533203125, 0.3429718017578125, 0.358978271484375, 0.3749847412109375, 0.3909912109375, 0.4069976806640625, 0.423004150390625, 0.4390106201171875, 0.45501708984375, 0.4710235595703125, 0.487030029296875, 0.5030364990234375, 0.51904296875]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 5.0, 7.0, 7.0, 9.0, 8.0, 19.0, 14.0, 15.0, 18.0, 23.0, 31.0, 27.0, 17.0, 26.0, 45.0, 42.0, 40.0, 41.0, 45.0, 34.0, 31.0, 51.0, 49.0, 43.0, 30.0, 34.0, 25.0, 32.0, 25.0, 26.0, 28.0, 29.0, 20.0, 24.0, 6.0, 12.0, 13.0, 10.0, 6.0, 9.0, 4.0, 8.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.841796875, -2.748779296875, -2.65576171875, -2.562744140625, -2.4697265625, -2.376708984375, -2.28369140625, -2.190673828125, -2.09765625, -2.004638671875, -1.91162109375, -1.818603515625, -1.7255859375, -1.632568359375, -1.53955078125, -1.446533203125, -1.353515625, -1.260498046875, -1.16748046875, -1.074462890625, -0.9814453125, -0.888427734375, -0.79541015625, -0.702392578125, -0.609375, -0.516357421875, -0.42333984375, -0.330322265625, -0.2373046875, -0.144287109375, -0.05126953125, 0.041748046875, 0.134765625, 0.227783203125, 0.32080078125, 0.413818359375, 0.5068359375, 0.599853515625, 0.69287109375, 0.785888671875, 0.87890625, 0.971923828125, 1.06494140625, 1.157958984375, 1.2509765625, 1.343994140625, 1.43701171875, 1.530029296875, 1.623046875, 1.716064453125, 1.80908203125, 1.902099609375, 1.9951171875, 2.088134765625, 2.18115234375, 2.274169921875, 2.3671875, 2.460205078125, 2.55322265625, 2.646240234375, 2.7392578125, 2.832275390625, 2.92529296875, 3.018310546875, 3.111328125]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 8.0, 10.0, 18.0, 18.0, 31.0, 29.0, 39.0, 57.0, 87.0, 155.0, 165.0, 248.0, 366.0, 594.0, 1011.0, 1846.0, 3936.0, 10608.0, 41569.0, 928833.0, 40139.0, 10328.0, 3887.0, 1758.0, 983.0, 564.0, 376.0, 252.0, 172.0, 114.0, 98.0, 64.0, 47.0, 36.0, 22.0, 24.0, 16.0, 12.0, 10.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9521484375, -1.892059326171875, -1.83197021484375, -1.771881103515625, -1.7117919921875, -1.651702880859375, -1.59161376953125, -1.531524658203125, -1.471435546875, -1.411346435546875, -1.35125732421875, -1.291168212890625, -1.2310791015625, -1.170989990234375, -1.11090087890625, -1.050811767578125, -0.99072265625, -0.930633544921875, -0.87054443359375, -0.810455322265625, -0.7503662109375, -0.690277099609375, -0.63018798828125, -0.570098876953125, -0.510009765625, -0.449920654296875, -0.38983154296875, -0.329742431640625, -0.2696533203125, -0.209564208984375, -0.14947509765625, -0.089385986328125, -0.029296875, 0.030792236328125, 0.09088134765625, 0.150970458984375, 0.2110595703125, 0.271148681640625, 0.33123779296875, 0.391326904296875, 0.451416015625, 0.511505126953125, 0.57159423828125, 0.631683349609375, 0.6917724609375, 0.751861572265625, 0.81195068359375, 0.872039794921875, 0.93212890625, 0.992218017578125, 1.05230712890625, 1.112396240234375, 1.1724853515625, 1.232574462890625, 1.29266357421875, 1.352752685546875, 1.412841796875, 1.472930908203125, 1.53302001953125, 1.593109130859375, 1.6531982421875, 1.713287353515625, 1.77337646484375, 1.833465576171875, 1.8935546875]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 7.0, 13.0, 10.0, 13.0, 19.0, 21.0, 27.0, 29.0, 23.0, 36.0, 30.0, 42.0, 30.0, 33.0, 33.0, 48.0, 51.0, 44.0, 46.0, 44.0, 48.0, 46.0, 30.0, 27.0, 30.0, 35.0, 32.0, 24.0, 23.0, 13.0, 19.0, 19.0, 10.0, 10.0, 8.0, 7.0, 2.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1328125, -2.0696258544921875, -2.006439208984375, -1.9432525634765625, -1.88006591796875, -1.8168792724609375, -1.753692626953125, -1.6905059814453125, -1.6273193359375, -1.5641326904296875, -1.500946044921875, -1.4377593994140625, -1.37457275390625, -1.3113861083984375, -1.248199462890625, -1.1850128173828125, -1.121826171875, -1.0586395263671875, -0.995452880859375, -0.9322662353515625, -0.86907958984375, -0.8058929443359375, -0.742706298828125, -0.6795196533203125, -0.6163330078125, -0.5531463623046875, -0.489959716796875, -0.4267730712890625, -0.36358642578125, -0.3003997802734375, -0.237213134765625, -0.1740264892578125, -0.11083984375, -0.0476531982421875, 0.015533447265625, 0.0787200927734375, 0.14190673828125, 0.2050933837890625, 0.268280029296875, 0.3314666748046875, 0.3946533203125, 0.4578399658203125, 0.521026611328125, 0.5842132568359375, 0.64739990234375, 0.7105865478515625, 0.773773193359375, 0.8369598388671875, 0.900146484375, 0.9633331298828125, 1.026519775390625, 1.0897064208984375, 1.15289306640625, 1.2160797119140625, 1.279266357421875, 1.3424530029296875, 1.4056396484375, 1.4688262939453125, 1.532012939453125, 1.5951995849609375, 1.65838623046875, 1.7215728759765625, 1.784759521484375, 1.8479461669921875, 1.9111328125]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 4.0, 6.0, 9.0, 9.0, 13.0, 25.0, 31.0, 36.0, 36.0, 72.0, 84.0, 142.0, 214.0, 316.0, 527.0, 949.0, 1632.0, 3531.0, 9808.0, 48539.0, 949083.0, 21583.0, 6132.0, 2566.0, 1239.0, 705.0, 385.0, 234.0, 204.0, 110.0, 89.0, 57.0, 48.0, 37.0, 22.0, 18.0, 13.0, 12.0, 8.0, 6.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.241455078125, -0.23348236083984375, -0.2255096435546875, -0.21753692626953125, -0.209564208984375, -0.20159149169921875, -0.1936187744140625, -0.18564605712890625, -0.17767333984375, -0.16970062255859375, -0.1617279052734375, -0.15375518798828125, -0.145782470703125, -0.13780975341796875, -0.1298370361328125, -0.12186431884765625, -0.1138916015625, -0.10591888427734375, -0.0979461669921875, -0.08997344970703125, -0.082000732421875, -0.07402801513671875, -0.0660552978515625, -0.05808258056640625, -0.05010986328125, -0.04213714599609375, -0.0341644287109375, -0.02619171142578125, -0.018218994140625, -0.01024627685546875, -0.0022735595703125, 0.00569915771484375, 0.013671875, 0.02164459228515625, 0.0296173095703125, 0.03759002685546875, 0.045562744140625, 0.05353546142578125, 0.0615081787109375, 0.06948089599609375, 0.07745361328125, 0.08542633056640625, 0.0933990478515625, 0.10137176513671875, 0.109344482421875, 0.11731719970703125, 0.1252899169921875, 0.13326263427734375, 0.1412353515625, 0.14920806884765625, 0.1571807861328125, 0.16515350341796875, 0.173126220703125, 0.18109893798828125, 0.1890716552734375, 0.19704437255859375, 0.20501708984375, 0.21298980712890625, 0.2209625244140625, 0.22893524169921875, 0.236907958984375, 0.24488067626953125, 0.2528533935546875, 0.26082611083984375, 0.268798828125]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 12.0, 15.0, 11.0, 13.0, 25.0, 22.0, 36.0, 33.0, 39.0, 50.0, 51.0, 55.0, 65.0, 87.0, 56.0, 75.0, 46.0, 51.0, 43.0, 49.0, 32.0, 22.0, 22.0, 29.0, 14.0, 9.0, 11.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1888484954833984e-05, -3.094784915447235e-05, -3.0007213354110718e-05, -2.9066577553749084e-05, -2.812594175338745e-05, -2.7185305953025818e-05, -2.6244670152664185e-05, -2.530403435230255e-05, -2.4363398551940918e-05, -2.3422762751579285e-05, -2.248212695121765e-05, -2.1541491150856018e-05, -2.0600855350494385e-05, -1.966021955013275e-05, -1.8719583749771118e-05, -1.7778947949409485e-05, -1.683831214904785e-05, -1.5897676348686218e-05, -1.4957040548324585e-05, -1.4016404747962952e-05, -1.3075768947601318e-05, -1.2135133147239685e-05, -1.1194497346878052e-05, -1.0253861546516418e-05, -9.313225746154785e-06, -8.372589945793152e-06, -7.4319541454315186e-06, -6.491318345069885e-06, -5.550682544708252e-06, -4.610046744346619e-06, -3.6694109439849854e-06, -2.728775143623352e-06, -1.7881393432617188e-06, -8.475035429000854e-07, 9.313225746154785e-08, 1.0337680578231812e-06, 1.9744038581848145e-06, 2.9150396585464478e-06, 3.855675458908081e-06, 4.796311259269714e-06, 5.736947059631348e-06, 6.677582859992981e-06, 7.618218660354614e-06, 8.558854460716248e-06, 9.499490261077881e-06, 1.0440126061439514e-05, 1.1380761861801147e-05, 1.232139766216278e-05, 1.3262033462524414e-05, 1.4202669262886047e-05, 1.514330506324768e-05, 1.6083940863609314e-05, 1.7024576663970947e-05, 1.796521246433258e-05, 1.8905848264694214e-05, 1.9846484065055847e-05, 2.078711986541748e-05, 2.1727755665779114e-05, 2.2668391466140747e-05, 2.360902726650238e-05, 2.4549663066864014e-05, 2.5490298867225647e-05, 2.643093466758728e-05, 2.7371570467948914e-05, 2.8312206268310547e-05]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 2.0, 7.0, 6.0, 8.0, 13.0, 17.0, 14.0, 23.0, 23.0, 41.0, 51.0, 97.0, 191.0, 918.0, 65169.0, 975982.0, 5238.0, 326.0, 142.0, 66.0, 51.0, 35.0, 34.0, 23.0, 19.0, 9.0, 17.0, 6.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.826171875, -0.8056564331054688, -0.7851409912109375, -0.7646255493164062, -0.744110107421875, -0.7235946655273438, -0.7030792236328125, -0.6825637817382812, -0.66204833984375, -0.6415328979492188, -0.6210174560546875, -0.6005020141601562, -0.579986572265625, -0.5594711303710938, -0.5389556884765625, -0.5184402465820312, -0.4979248046875, -0.47740936279296875, -0.4568939208984375, -0.43637847900390625, -0.415863037109375, -0.39534759521484375, -0.3748321533203125, -0.35431671142578125, -0.33380126953125, -0.31328582763671875, -0.2927703857421875, -0.27225494384765625, -0.251739501953125, -0.23122406005859375, -0.2107086181640625, -0.19019317626953125, -0.169677734375, -0.14916229248046875, -0.1286468505859375, -0.10813140869140625, -0.087615966796875, -0.06710052490234375, -0.0465850830078125, -0.02606964111328125, -0.00555419921875, 0.01496124267578125, 0.0354766845703125, 0.05599212646484375, 0.076507568359375, 0.09702301025390625, 0.1175384521484375, 0.13805389404296875, 0.1585693359375, 0.17908477783203125, 0.1996002197265625, 0.22011566162109375, 0.240631103515625, 0.26114654541015625, 0.2816619873046875, 0.30217742919921875, 0.32269287109375, 0.34320831298828125, 0.3637237548828125, 0.38423919677734375, 0.404754638671875, 0.42527008056640625, 0.4457855224609375, 0.46630096435546875, 0.48681640625]}, "gradients/decoder.roberta.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 14.0, 8.0, 8.0, 10.0, 19.0, 11.0, 20.0, 19.0, 25.0, 35.0, 48.0, 67.0, 109.0, 141.0, 133.0, 76.0, 72.0, 40.0, 29.0, 16.0, 12.0, 16.0, 5.0, 11.0, 16.0, 7.0, 4.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0242767333984375, -0.023250818252563477, -0.022224903106689453, -0.02119898796081543, -0.020173072814941406, -0.019147157669067383, -0.01812124252319336, -0.017095327377319336, -0.016069412231445312, -0.015043497085571289, -0.014017581939697266, -0.012991666793823242, -0.011965751647949219, -0.010939836502075195, -0.009913921356201172, -0.008888006210327148, -0.007862091064453125, -0.0068361759185791016, -0.005810260772705078, -0.004784345626831055, -0.0037584304809570312, -0.002732515335083008, -0.0017066001892089844, -0.0006806850433349609, 0.0003452301025390625, 0.001371145248413086, 0.0023970603942871094, 0.003422975540161133, 0.004448890686035156, 0.00547480583190918, 0.006500720977783203, 0.0075266361236572266, 0.00855255126953125, 0.009578466415405273, 0.010604381561279297, 0.01163029670715332, 0.012656211853027344, 0.013682126998901367, 0.01470804214477539, 0.015733957290649414, 0.016759872436523438, 0.01778578758239746, 0.018811702728271484, 0.019837617874145508, 0.02086353302001953, 0.021889448165893555, 0.022915363311767578, 0.0239412784576416, 0.024967193603515625, 0.02599310874938965, 0.027019023895263672, 0.028044939041137695, 0.02907085418701172, 0.030096769332885742, 0.031122684478759766, 0.03214859962463379, 0.03317451477050781, 0.034200429916381836, 0.03522634506225586, 0.03625226020812988, 0.037278175354003906, 0.03830409049987793, 0.03933000564575195, 0.04035592079162598, 0.0413818359375]}, "gradients/decoder.roberta.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 38.0, 52.0, 133.0, 240.0, 244.0, 159.0, 90.0, 37.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.741995334625244, -2.4080650806427, -2.0741348266601562, -1.7402044534683228, -1.4062741994857788, -1.0723439455032349, -0.7384135723114014, -0.4044833183288574, -0.07055306434631348, 0.26337721943855286, 0.5973075032234192, 0.9312378168106079, 1.2651680707931519, 1.5990983247756958, 1.9330286979675293, 2.2669589519500732, 2.600889205932617, 2.934819459915161, 3.268749713897705, 3.602680206298828, 3.936610221862793, 4.270540714263916, 4.604471206665039, 4.938401222229004, 5.272331237792969, 5.606261730194092, 5.940191745758057, 6.27412223815918, 6.6080522537231445, 6.941982746124268, 7.275913238525391, 7.6098432540893555, 7.943774223327637, 8.277704238891602, 8.611635208129883, 8.945565223693848, 9.279495239257812, 9.613425254821777, 9.947356224060059, 10.281286239624023, 10.615216255187988, 10.949146270751953, 11.283077239990234, 11.6170072555542, 11.950937271118164, 12.284867286682129, 12.61879825592041, 12.952728271484375, 13.286659240722656, 13.620589256286621, 13.954520225524902, 14.288450241088867, 14.622380256652832, 14.956310272216797, 15.290241241455078, 15.624171257019043, 15.958101272583008, 16.29203224182129, 16.625961303710938, 16.95989227294922, 17.2938232421875, 17.62775230407715, 17.96168327331543, 18.295612335205078, 18.62954330444336]}, "gradients/decoder.roberta.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 7.0, 10.0, 7.0, 20.0, 12.0, 17.0, 18.0, 22.0, 31.0, 27.0, 20.0, 22.0, 47.0, 41.0, 41.0, 41.0, 44.0, 35.0, 34.0, 48.0, 52.0, 40.0, 30.0, 34.0, 28.0, 31.0, 26.0, 23.0, 27.0, 30.0, 20.0, 23.0, 6.0, 15.0, 10.0, 11.0, 5.0, 9.0, 5.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.842822790145874, -2.7496328353881836, -2.656442880630493, -2.5632529258728027, -2.4700629711151123, -2.376873016357422, -2.2836830615997314, -2.190493106842041, -2.0973031520843506, -2.00411319732666, -1.9109232425689697, -1.8177332878112793, -1.7245433330535889, -1.6313533782958984, -1.538163423538208, -1.4449734687805176, -1.3517835140228271, -1.2585935592651367, -1.1654036045074463, -1.0722136497497559, -0.9790236949920654, -0.885833740234375, -0.7926437854766846, -0.6994538307189941, -0.6062638759613037, -0.5130739212036133, -0.41988396644592285, -0.3266940116882324, -0.233504056930542, -0.14031410217285156, -0.04712414741516113, 0.0460658073425293, 0.13925576210021973, 0.23244571685791016, 0.3256356716156006, 0.418825626373291, 0.5120155811309814, 0.6052055358886719, 0.6983954906463623, 0.7915854454040527, 0.8847754001617432, 0.9779653549194336, 1.071155309677124, 1.1643452644348145, 1.2575352191925049, 1.3507251739501953, 1.4439151287078857, 1.5371050834655762, 1.6302950382232666, 1.723484992980957, 1.8166749477386475, 1.909864902496338, 2.0030548572540283, 2.0962448120117188, 2.189434766769409, 2.2826247215270996, 2.37581467628479, 2.4690046310424805, 2.562194585800171, 2.6553845405578613, 2.7485744953155518, 2.841764450073242, 2.9349544048309326, 3.028144359588623, 3.1213343143463135]}, "gradients/decoder.roberta.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 5.0, 4.0, 6.0, 15.0, 15.0, 18.0, 24.0, 38.0, 59.0, 87.0, 127.0, 161.0, 271.0, 419.0, 600.0, 963.0, 1521.0, 2381.0, 4124.0, 7210.0, 14422.0, 30697.0, 70508.0, 182305.0, 402668.0, 191307.0, 73124.0, 31902.0, 15123.0, 7496.0, 4234.0, 2467.0, 1435.0, 917.0, 631.0, 415.0, 282.0, 189.0, 117.0, 72.0, 63.0, 39.0, 31.0, 23.0, 10.0, 10.0, 8.0, 7.0, 6.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-2.798828125, -2.7127685546875, -2.626708984375, -2.5406494140625, -2.45458984375, -2.3685302734375, -2.282470703125, -2.1964111328125, -2.1103515625, -2.0242919921875, -1.938232421875, -1.8521728515625, -1.76611328125, -1.6800537109375, -1.593994140625, -1.5079345703125, -1.421875, -1.3358154296875, -1.249755859375, -1.1636962890625, -1.07763671875, -0.9915771484375, -0.905517578125, -0.8194580078125, -0.7333984375, -0.6473388671875, -0.561279296875, -0.4752197265625, -0.38916015625, -0.3031005859375, -0.217041015625, -0.1309814453125, -0.044921875, 0.0411376953125, 0.127197265625, 0.2132568359375, 0.29931640625, 0.3853759765625, 0.471435546875, 0.5574951171875, 0.6435546875, 0.7296142578125, 0.815673828125, 0.9017333984375, 0.98779296875, 1.0738525390625, 1.159912109375, 1.2459716796875, 1.33203125, 1.4180908203125, 1.504150390625, 1.5902099609375, 1.67626953125, 1.7623291015625, 1.848388671875, 1.9344482421875, 2.0205078125, 2.1065673828125, 2.192626953125, 2.2786865234375, 2.36474609375, 2.4508056640625, 2.536865234375, 2.6229248046875, 2.708984375]}, "gradients/decoder.roberta.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 6.0, 7.0, 9.0, 8.0, 9.0, 16.0, 19.0, 12.0, 23.0, 22.0, 33.0, 24.0, 19.0, 31.0, 27.0, 51.0, 41.0, 44.0, 38.0, 36.0, 42.0, 45.0, 49.0, 42.0, 38.0, 32.0, 26.0, 21.0, 32.0, 24.0, 28.0, 29.0, 23.0, 15.0, 11.0, 12.0, 10.0, 9.0, 11.0, 3.0, 4.0, 8.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.55181884765625, -2.4649658203125, -2.37811279296875, -2.291259765625, -2.20440673828125, -2.1175537109375, -2.03070068359375, -1.94384765625, -1.85699462890625, -1.7701416015625, -1.68328857421875, -1.596435546875, -1.50958251953125, -1.4227294921875, -1.33587646484375, -1.2490234375, -1.16217041015625, -1.0753173828125, -0.98846435546875, -0.901611328125, -0.81475830078125, -0.7279052734375, -0.64105224609375, -0.55419921875, -0.46734619140625, -0.3804931640625, -0.29364013671875, -0.206787109375, -0.11993408203125, -0.0330810546875, 0.05377197265625, 0.140625, 0.22747802734375, 0.3143310546875, 0.40118408203125, 0.488037109375, 0.57489013671875, 0.6617431640625, 0.74859619140625, 0.83544921875, 0.92230224609375, 1.0091552734375, 1.09600830078125, 1.182861328125, 1.26971435546875, 1.3565673828125, 1.44342041015625, 1.5302734375, 1.61712646484375, 1.7039794921875, 1.79083251953125, 1.877685546875, 1.96453857421875, 2.0513916015625, 2.13824462890625, 2.22509765625, 2.31195068359375, 2.3988037109375, 2.48565673828125, 2.572509765625, 2.65936279296875, 2.7462158203125, 2.83306884765625, 2.919921875]}, "gradients/decoder.roberta.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 7.0, 6.0, 10.0, 4.0, 12.0, 20.0, 18.0, 26.0, 18.0, 27.0, 47.0, 40.0, 58.0, 92.0, 128.0, 185.0, 271.0, 462.0, 1045461.0, 643.0, 277.0, 187.0, 143.0, 72.0, 57.0, 48.0, 42.0, 33.0, 29.0, 22.0, 14.0, 12.0, 17.0, 4.0, 3.0, 6.0, 12.0, 6.0, 2.0, 4.0, 6.0, 5.0, 4.0, 1.0, 2.0], "bins": [-96.25, -93.6865234375, -91.123046875, -88.5595703125, -85.99609375, -83.4326171875, -80.869140625, -78.3056640625, -75.7421875, -73.1787109375, -70.615234375, -68.0517578125, -65.48828125, -62.9248046875, -60.361328125, -57.7978515625, -55.234375, -52.6708984375, -50.107421875, -47.5439453125, -44.98046875, -42.4169921875, -39.853515625, -37.2900390625, -34.7265625, -32.1630859375, -29.599609375, -27.0361328125, -24.47265625, -21.9091796875, -19.345703125, -16.7822265625, -14.21875, -11.6552734375, -9.091796875, -6.5283203125, -3.96484375, -1.4013671875, 1.162109375, 3.7255859375, 6.2890625, 8.8525390625, 11.416015625, 13.9794921875, 16.54296875, 19.1064453125, 21.669921875, 24.2333984375, 26.796875, 29.3603515625, 31.923828125, 34.4873046875, 37.05078125, 39.6142578125, 42.177734375, 44.7412109375, 47.3046875, 49.8681640625, 52.431640625, 54.9951171875, 57.55859375, 60.1220703125, 62.685546875, 65.2490234375, 67.8125]}, "gradients/decoder.roberta.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 2.0, 3.0, 9.0, 13.0, 5.0, 5.0, 8.0, 12.0, 10.0, 19.0, 18.0, 32.0, 23.0, 32.0, 35.0, 32.0, 28.0, 48.0, 60.0, 35.0, 41.0, 44.0, 44.0, 40.0, 41.0, 35.0, 41.0, 34.0, 32.0, 35.0, 19.0, 29.0, 19.0, 23.0, 20.0, 12.0, 9.0, 11.0, 6.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.587890625, -2.493865966796875, -2.39984130859375, -2.305816650390625, -2.2117919921875, -2.117767333984375, -2.02374267578125, -1.929718017578125, -1.835693359375, -1.741668701171875, -1.64764404296875, -1.553619384765625, -1.4595947265625, -1.365570068359375, -1.27154541015625, -1.177520751953125, -1.08349609375, -0.989471435546875, -0.89544677734375, -0.801422119140625, -0.7073974609375, -0.613372802734375, -0.51934814453125, -0.425323486328125, -0.331298828125, -0.237274169921875, -0.14324951171875, -0.049224853515625, 0.0447998046875, 0.138824462890625, 0.23284912109375, 0.326873779296875, 0.4208984375, 0.514923095703125, 0.60894775390625, 0.702972412109375, 0.7969970703125, 0.891021728515625, 0.98504638671875, 1.079071044921875, 1.173095703125, 1.267120361328125, 1.36114501953125, 1.455169677734375, 1.5491943359375, 1.643218994140625, 1.73724365234375, 1.831268310546875, 1.92529296875, 2.019317626953125, 2.11334228515625, 2.207366943359375, 2.3013916015625, 2.395416259765625, 2.48944091796875, 2.583465576171875, 2.677490234375, 2.771514892578125, 2.86553955078125, 2.959564208984375, 3.0535888671875, 3.147613525390625, 3.24163818359375, 3.335662841796875, 3.4296875]}, "gradients/decoder.roberta.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 8.0, 9.0, 21.0, 37.0, 79.0, 261.0, 1410.0, 1028445.0, 17503.0, 510.0, 157.0, 58.0, 20.0, 14.0, 8.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -11.8726806640625, -11.300048828125, -10.7274169921875, -10.15478515625, -9.5821533203125, -9.009521484375, -8.4368896484375, -7.8642578125, -7.2916259765625, -6.718994140625, -6.1463623046875, -5.57373046875, -5.0010986328125, -4.428466796875, -3.8558349609375, -3.283203125, -2.7105712890625, -2.137939453125, -1.5653076171875, -0.99267578125, -0.4200439453125, 0.152587890625, 0.7252197265625, 1.2978515625, 1.8704833984375, 2.443115234375, 3.0157470703125, 3.58837890625, 4.1610107421875, 4.733642578125, 5.3062744140625, 5.87890625, 6.4515380859375, 7.024169921875, 7.5968017578125, 8.16943359375, 8.7420654296875, 9.314697265625, 9.8873291015625, 10.4599609375, 11.0325927734375, 11.605224609375, 12.1778564453125, 12.75048828125, 13.3231201171875, 13.895751953125, 14.4683837890625, 15.041015625, 15.6136474609375, 16.186279296875, 16.7589111328125, 17.33154296875, 17.9041748046875, 18.476806640625, 19.0494384765625, 19.6220703125, 20.1947021484375, 20.767333984375, 21.3399658203125, 21.91259765625, 22.4852294921875, 23.057861328125, 23.6304931640625, 24.203125]}, "gradients/decoder.roberta.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 6.0, 15.0, 28.0, 24.0, 35.0, 68.0, 77.0, 120.0, 157.0, 140.0, 97.0, 72.0, 40.0, 25.0, 26.0, 16.0, 8.0, 8.0, 4.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016045570373535156, -0.0001541823148727417, -0.00014790892601013184, -0.00014163553714752197, -0.0001353621482849121, -0.00012908875942230225, -0.00012281537055969238, -0.00011654198169708252, -0.00011026859283447266, -0.00010399520397186279, -9.772181510925293e-05, -9.144842624664307e-05, -8.51750373840332e-05, -7.890164852142334e-05, -7.262825965881348e-05, -6.635487079620361e-05, -6.008148193359375e-05, -5.380809307098389e-05, -4.7534704208374023e-05, -4.126131534576416e-05, -3.49879264831543e-05, -2.8714537620544434e-05, -2.244114875793457e-05, -1.6167759895324707e-05, -9.894371032714844e-06, -3.6209821701049805e-06, 2.652406692504883e-06, 8.925795555114746e-06, 1.519918441772461e-05, 2.1472573280334473e-05, 2.7745962142944336e-05, 3.40193510055542e-05, 4.029273986816406e-05, 4.6566128730773926e-05, 5.283951759338379e-05, 5.911290645599365e-05, 6.538629531860352e-05, 7.165968418121338e-05, 7.793307304382324e-05, 8.42064619064331e-05, 9.047985076904297e-05, 9.675323963165283e-05, 0.0001030266284942627, 0.00010930001735687256, 0.00011557340621948242, 0.00012184679508209229, 0.00012812018394470215, 0.000134393572807312, 0.00014066696166992188, 0.00014694035053253174, 0.0001532137393951416, 0.00015948712825775146, 0.00016576051712036133, 0.0001720339059829712, 0.00017830729484558105, 0.00018458068370819092, 0.00019085407257080078, 0.00019712746143341064, 0.0002034008502960205, 0.00020967423915863037, 0.00021594762802124023, 0.0002222210168838501, 0.00022849440574645996, 0.00023476779460906982, 0.0002410411834716797]}, "gradients/decoder.roberta.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 10.0, 12.0, 25.0, 38.0, 102.0, 551.0, 14169.0, 1030828.0, 2362.0, 310.0, 77.0, 20.0, 20.0, 13.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.4305419921875, -12.900146484375, -12.3697509765625, -11.83935546875, -11.3089599609375, -10.778564453125, -10.2481689453125, -9.7177734375, -9.1873779296875, -8.656982421875, -8.1265869140625, -7.59619140625, -7.0657958984375, -6.535400390625, -6.0050048828125, -5.474609375, -4.9442138671875, -4.413818359375, -3.8834228515625, -3.35302734375, -2.8226318359375, -2.292236328125, -1.7618408203125, -1.2314453125, -0.7010498046875, -0.170654296875, 0.3597412109375, 0.89013671875, 1.4205322265625, 1.950927734375, 2.4813232421875, 3.01171875, 3.5421142578125, 4.072509765625, 4.6029052734375, 5.13330078125, 5.6636962890625, 6.194091796875, 6.7244873046875, 7.2548828125, 7.7852783203125, 8.315673828125, 8.8460693359375, 9.37646484375, 9.9068603515625, 10.437255859375, 10.9676513671875, 11.498046875, 12.0284423828125, 12.558837890625, 13.0892333984375, 13.61962890625, 14.1500244140625, 14.680419921875, 15.2108154296875, 15.7412109375, 16.2716064453125, 16.802001953125, 17.3323974609375, 17.86279296875, 18.3931884765625, 18.923583984375, 19.4539794921875, 19.984375]}, "gradients/decoder.roberta.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 10.0, 18.0, 21.0, 68.0, 95.0, 219.0, 260.0, 128.0, 81.0, 28.0, 21.0, 19.0, 10.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1025390625, -1.07366943359375, -1.0447998046875, -1.01593017578125, -0.987060546875, -0.95819091796875, -0.9293212890625, -0.90045166015625, -0.87158203125, -0.84271240234375, -0.8138427734375, -0.78497314453125, -0.756103515625, -0.72723388671875, -0.6983642578125, -0.66949462890625, -0.640625, -0.61175537109375, -0.5828857421875, -0.55401611328125, -0.525146484375, -0.49627685546875, -0.4674072265625, -0.43853759765625, -0.40966796875, -0.38079833984375, -0.3519287109375, -0.32305908203125, -0.294189453125, -0.26531982421875, -0.2364501953125, -0.20758056640625, -0.1787109375, -0.14984130859375, -0.1209716796875, -0.09210205078125, -0.063232421875, -0.03436279296875, -0.0054931640625, 0.02337646484375, 0.05224609375, 0.08111572265625, 0.1099853515625, 0.13885498046875, 0.167724609375, 0.19659423828125, 0.2254638671875, 0.25433349609375, 0.283203125, 0.31207275390625, 0.3409423828125, 0.36981201171875, 0.398681640625, 0.42755126953125, 0.4564208984375, 0.48529052734375, 0.51416015625, 0.54302978515625, 0.5718994140625, 0.60076904296875, 0.629638671875, 0.65850830078125, 0.6873779296875, 0.71624755859375, 0.7451171875]}, "gradients/decoder.roberta.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 5.0, 13.0, 43.0, 66.0, 142.0, 218.0, 186.0, 147.0, 112.0, 48.0, 24.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6835100650787354, -2.392770767211914, -2.1020312309265137, -1.8112918138504028, -1.520552396774292, -1.2298129796981812, -0.9390735626220703, -0.648334264755249, -0.35759472846984863, -0.06685531139373779, 0.22388410568237305, 0.5146235227584839, 0.8053629398345947, 1.0961023569107056, 1.3868417739868164, 1.6775810718536377, 1.968320608139038, 2.2590599060058594, 2.5497994422912598, 2.84053897857666, 3.1312782764434814, 3.4220175743103027, 3.712757110595703, 4.003496170043945, 4.294236183166504, 4.584975719451904, 4.875715255737305, 5.166454315185547, 5.457193851470947, 5.747933387756348, 6.03867244720459, 6.32941198348999, 6.620151519775391, 6.910891056060791, 7.201630592346191, 7.492369651794434, 7.783109188079834, 8.073848724365234, 8.364587783813477, 8.655326843261719, 8.946066856384277, 9.23680591583252, 9.527545928955078, 9.81828498840332, 10.109024047851562, 10.399764060974121, 10.690503120422363, 10.981243133544922, 11.271982192993164, 11.562721252441406, 11.853461265563965, 12.144200325012207, 12.434940338134766, 12.725679397583008, 13.01641845703125, 13.307157516479492, 13.59789752960205, 13.888636589050293, 14.179376602172852, 14.470115661621094, 14.760854721069336, 15.051594734191895, 15.342333793640137, 15.633073806762695, 15.923812866210938]}, "gradients/decoder.roberta.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 6.0, 5.0, 5.0, 5.0, 9.0, 22.0, 14.0, 16.0, 16.0, 27.0, 28.0, 24.0, 37.0, 32.0, 36.0, 28.0, 42.0, 43.0, 49.0, 39.0, 35.0, 37.0, 47.0, 43.0, 30.0, 35.0, 30.0, 33.0, 28.0, 32.0, 24.0, 26.0, 21.0, 22.0, 14.0, 11.0, 12.0, 10.0, 10.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.325441837310791, -3.222960948944092, -3.1204802989959717, -3.0179994106292725, -2.9155187606811523, -2.813037872314453, -2.710556983947754, -2.6080760955810547, -2.5055954456329346, -2.4031145572662354, -2.3006339073181152, -2.198153018951416, -2.095672130584717, -1.9931914806365967, -1.8907105922698975, -1.7882298231124878, -1.6857490539550781, -1.5832682847976685, -1.4807875156402588, -1.3783066272735596, -1.27582585811615, -1.1733450889587402, -1.070864200592041, -0.9683834314346313, -0.8659026622772217, -0.763421893119812, -0.6609410643577576, -0.5584602355957031, -0.45597946643829346, -0.3534986972808838, -0.25101786851882935, -0.1485370397567749, -0.04605603218078613, 0.05642476677894592, 0.15890556573867798, 0.26138636469841003, 0.3638671636581421, 0.46634793281555176, 0.5688287615776062, 0.6713095903396606, 0.7737903594970703, 0.87627112865448, 0.9787519574165344, 1.0812327861785889, 1.1837135553359985, 1.2861943244934082, 1.3886752128601074, 1.491155982017517, 1.5936367511749268, 1.6961175203323364, 1.798598289489746, 1.9010791778564453, 2.0035600662231445, 2.1060407161712646, 2.208521604537964, 2.311002254486084, 2.413483142852783, 2.5159640312194824, 2.6184446811676025, 2.7209255695343018, 2.823406219482422, 2.925887107849121, 3.0283679962158203, 3.1308488845825195, 3.2333295345306396]}, "gradients/decoder.roberta.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 4.0, 2.0, 6.0, 8.0, 13.0, 10.0, 11.0, 29.0, 38.0, 37.0, 59.0, 70.0, 86.0, 102.0, 151.0, 261.0, 325.0, 474.0, 692.0, 937.0, 1596.0, 2842.0, 5582.0, 12015.0, 29452.0, 87154.0, 294629.0, 1042664.0, 1788150.0, 650148.0, 180069.0, 55946.0, 20738.0, 9131.0, 4254.0, 2287.0, 1336.0, 888.0, 596.0, 406.0, 295.0, 198.0, 146.0, 114.0, 76.0, 56.0, 50.0, 45.0, 35.0, 25.0, 23.0, 17.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.693359375, -2.607330322265625, -2.52130126953125, -2.435272216796875, -2.3492431640625, -2.263214111328125, -2.17718505859375, -2.091156005859375, -2.005126953125, -1.919097900390625, -1.83306884765625, -1.747039794921875, -1.6610107421875, -1.574981689453125, -1.48895263671875, -1.402923583984375, -1.31689453125, -1.230865478515625, -1.14483642578125, -1.058807373046875, -0.9727783203125, -0.886749267578125, -0.80072021484375, -0.714691162109375, -0.628662109375, -0.542633056640625, -0.45660400390625, -0.370574951171875, -0.2845458984375, -0.198516845703125, -0.11248779296875, -0.026458740234375, 0.0595703125, 0.145599365234375, 0.23162841796875, 0.317657470703125, 0.4036865234375, 0.489715576171875, 0.57574462890625, 0.661773681640625, 0.747802734375, 0.833831787109375, 0.91986083984375, 1.005889892578125, 1.0919189453125, 1.177947998046875, 1.26397705078125, 1.350006103515625, 1.43603515625, 1.522064208984375, 1.60809326171875, 1.694122314453125, 1.7801513671875, 1.866180419921875, 1.95220947265625, 2.038238525390625, 2.124267578125, 2.210296630859375, 2.29632568359375, 2.382354736328125, 2.4683837890625, 2.554412841796875, 2.64044189453125, 2.726470947265625, 2.8125]}, "gradients/decoder.roberta.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 8.0, 11.0, 12.0, 8.0, 22.0, 22.0, 15.0, 21.0, 24.0, 29.0, 33.0, 33.0, 43.0, 44.0, 29.0, 48.0, 45.0, 40.0, 41.0, 34.0, 36.0, 31.0, 35.0, 31.0, 37.0, 38.0, 28.0, 20.0, 21.0, 16.0, 23.0, 16.0, 21.0, 12.0, 12.0, 8.0, 9.0, 6.0, 6.0, 1.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-2.48046875, -2.4075927734375, -2.334716796875, -2.2618408203125, -2.18896484375, -2.1160888671875, -2.043212890625, -1.9703369140625, -1.8974609375, -1.8245849609375, -1.751708984375, -1.6788330078125, -1.60595703125, -1.5330810546875, -1.460205078125, -1.3873291015625, -1.314453125, -1.2415771484375, -1.168701171875, -1.0958251953125, -1.02294921875, -0.9500732421875, -0.877197265625, -0.8043212890625, -0.7314453125, -0.6585693359375, -0.585693359375, -0.5128173828125, -0.43994140625, -0.3670654296875, -0.294189453125, -0.2213134765625, -0.1484375, -0.0755615234375, -0.002685546875, 0.0701904296875, 0.14306640625, 0.2159423828125, 0.288818359375, 0.3616943359375, 0.4345703125, 0.5074462890625, 0.580322265625, 0.6531982421875, 0.72607421875, 0.7989501953125, 0.871826171875, 0.9447021484375, 1.017578125, 1.0904541015625, 1.163330078125, 1.2362060546875, 1.30908203125, 1.3819580078125, 1.454833984375, 1.5277099609375, 1.6005859375, 1.6734619140625, 1.746337890625, 1.8192138671875, 1.89208984375, 1.9649658203125, 2.037841796875, 2.1107177734375, 2.18359375]}, "gradients/decoder.roberta.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 13.0, 18.0, 10.0, 23.0, 27.0, 30.0, 66.0, 94.0, 149.0, 287.0, 584.0, 3826.0, 4034244.0, 152486.0, 1417.0, 423.0, 214.0, 114.0, 70.0, 60.0, 37.0, 28.0, 16.0, 9.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -31.9892578125, -30.916015625, -29.8427734375, -28.76953125, -27.6962890625, -26.623046875, -25.5498046875, -24.4765625, -23.4033203125, -22.330078125, -21.2568359375, -20.18359375, -19.1103515625, -18.037109375, -16.9638671875, -15.890625, -14.8173828125, -13.744140625, -12.6708984375, -11.59765625, -10.5244140625, -9.451171875, -8.3779296875, -7.3046875, -6.2314453125, -5.158203125, -4.0849609375, -3.01171875, -1.9384765625, -0.865234375, 0.2080078125, 1.28125, 2.3544921875, 3.427734375, 4.5009765625, 5.57421875, 6.6474609375, 7.720703125, 8.7939453125, 9.8671875, 10.9404296875, 12.013671875, 13.0869140625, 14.16015625, 15.2333984375, 16.306640625, 17.3798828125, 18.453125, 19.5263671875, 20.599609375, 21.6728515625, 22.74609375, 23.8193359375, 24.892578125, 25.9658203125, 27.0390625, 28.1123046875, 29.185546875, 30.2587890625, 31.33203125, 32.4052734375, 33.478515625, 34.5517578125, 35.625]}, "gradients/decoder.roberta.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 10.0, 14.0, 27.0, 36.0, 50.0, 81.0, 121.0, 175.0, 347.0, 490.0, 695.0, 698.0, 471.0, 309.0, 200.0, 110.0, 71.0, 48.0, 33.0, 20.0, 22.0, 10.0, 6.0, 9.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7265625, -1.6741485595703125, -1.621734619140625, -1.5693206787109375, -1.51690673828125, -1.4644927978515625, -1.412078857421875, -1.3596649169921875, -1.3072509765625, -1.2548370361328125, -1.202423095703125, -1.1500091552734375, -1.09759521484375, -1.0451812744140625, -0.992767333984375, -0.9403533935546875, -0.887939453125, -0.8355255126953125, -0.783111572265625, -0.7306976318359375, -0.67828369140625, -0.6258697509765625, -0.573455810546875, -0.5210418701171875, -0.4686279296875, -0.4162139892578125, -0.363800048828125, -0.3113861083984375, -0.25897216796875, -0.2065582275390625, -0.154144287109375, -0.1017303466796875, -0.04931640625, 0.0030975341796875, 0.055511474609375, 0.1079254150390625, 0.16033935546875, 0.2127532958984375, 0.265167236328125, 0.3175811767578125, 0.3699951171875, 0.4224090576171875, 0.474822998046875, 0.5272369384765625, 0.57965087890625, 0.6320648193359375, 0.684478759765625, 0.7368927001953125, 0.789306640625, 0.8417205810546875, 0.894134521484375, 0.9465484619140625, 0.99896240234375, 1.0513763427734375, 1.103790283203125, 1.1562042236328125, 1.2086181640625, 1.2610321044921875, 1.313446044921875, 1.3658599853515625, 1.41827392578125, 1.4706878662109375, 1.523101806640625, 1.5755157470703125, 1.6279296875]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 13.0, 34.0, 63.0, 85.0, 145.0, 161.0, 182.0, 136.0, 95.0, 50.0, 23.0, 15.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6306469440460205, -2.3922266960144043, -2.153806447982788, -1.9153861999511719, -1.6769659519195557, -1.438545823097229, -1.2001255750656128, -0.9617053270339966, -0.7232850790023804, -0.48486483097076416, -0.24644461274147034, -0.008024394512176514, 0.2303958535194397, 0.46881604194641113, 0.7072362899780273, 0.9456565380096436, 1.1840767860412598, 1.422497034072876, 1.6609172821044922, 1.8993375301361084, 2.1377577781677246, 2.3761777877807617, 2.614598274230957, 2.853018283843994, 3.0914387702941895, 3.3298590183258057, 3.568279266357422, 3.806699514389038, 4.045119762420654, 4.283539772033691, 4.521960258483887, 4.760380268096924, 4.998800754547119, 5.237220764160156, 5.475641250610352, 5.714061260223389, 5.952481746673584, 6.190901756286621, 6.429322242736816, 6.6677422523498535, 6.906162738800049, 7.144582748413086, 7.383003234863281, 7.621423244476318, 7.859843730926514, 8.09826374053955, 8.336684226989746, 8.575104713439941, 8.81352424621582, 9.051944732666016, 9.290364265441895, 9.52878475189209, 9.767205238342285, 10.00562572479248, 10.24404525756836, 10.482465744018555, 10.72088623046875, 10.959306716918945, 11.197726249694824, 11.43614673614502, 11.674567222595215, 11.91298770904541, 12.151407241821289, 12.389827728271484, 12.62824821472168]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 6.0, 6.0, 9.0, 14.0, 12.0, 13.0, 14.0, 16.0, 17.0, 15.0, 26.0, 34.0, 22.0, 37.0, 34.0, 41.0, 34.0, 50.0, 41.0, 38.0, 30.0, 31.0, 37.0, 38.0, 28.0, 34.0, 41.0, 39.0, 27.0, 26.0, 28.0, 28.0, 23.0, 22.0, 13.0, 9.0, 10.0, 6.0, 6.0, 8.0, 11.0, 3.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.4835362434387207, -2.399184226989746, -2.3148324489593506, -2.230480432510376, -2.1461286544799805, -2.061776638031006, -1.9774247407913208, -1.8930728435516357, -1.8087209463119507, -1.7243690490722656, -1.6400171518325806, -1.5556652545928955, -1.471313238143921, -1.3869614601135254, -1.3026094436645508, -1.2182575464248657, -1.1339056491851807, -1.0495537519454956, -0.9652018547058105, -0.8808498978614807, -0.7964980006217957, -0.7121461033821106, -0.6277941465377808, -0.5434422492980957, -0.45909035205841064, -0.3747384548187256, -0.29038652777671814, -0.2060346007347107, -0.12168270349502563, -0.037330806255340576, 0.04702115058898926, 0.13137304782867432, 0.21572470664978027, 0.30007660388946533, 0.3844285309314728, 0.4687804579734802, 0.5531323552131653, 0.6374842524528503, 0.7218362092971802, 0.8061881065368652, 0.8905400037765503, 0.9748919010162354, 1.0592437982559204, 1.1435956954956055, 1.22794771194458, 1.3122994899749756, 1.3966515064239502, 1.4810034036636353, 1.5653553009033203, 1.6497071981430054, 1.7340590953826904, 1.818411111831665, 1.9027628898620605, 1.9871149063110352, 2.0714669227600098, 2.1558187007904053, 2.240170478820801, 2.3245224952697754, 2.408874273300171, 2.4932262897491455, 2.577578067779541, 2.6619300842285156, 2.7462821006774902, 2.8306338787078857, 2.9149858951568604]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 5.0, 5.0, 3.0, 4.0, 15.0, 20.0, 22.0, 33.0, 46.0, 74.0, 76.0, 121.0, 153.0, 219.0, 338.0, 509.0, 665.0, 1045.0, 1455.0, 2113.0, 3191.0, 5006.0, 7281.0, 11181.0, 17801.0, 28484.0, 46860.0, 80212.0, 141908.0, 218643.0, 194658.0, 115239.0, 65453.0, 38423.0, 23657.0, 14714.0, 9717.0, 6229.0, 4153.0, 2801.0, 1861.0, 1306.0, 864.0, 531.0, 414.0, 319.0, 215.0, 142.0, 94.0, 92.0, 57.0, 33.0, 33.0, 23.0, 23.0, 7.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.490966796875, -0.4750328063964844, -0.45909881591796875, -0.4431648254394531, -0.4272308349609375, -0.4112968444824219, -0.39536285400390625, -0.3794288635253906, -0.363494873046875, -0.3475608825683594, -0.33162689208984375, -0.3156929016113281, -0.2997589111328125, -0.2838249206542969, -0.26789093017578125, -0.2519569396972656, -0.23602294921875, -0.22008895874023438, -0.20415496826171875, -0.18822097778320312, -0.1722869873046875, -0.15635299682617188, -0.14041900634765625, -0.12448501586914062, -0.108551025390625, -0.09261703491210938, -0.07668304443359375, -0.060749053955078125, -0.0448150634765625, -0.028881072998046875, -0.01294708251953125, 0.002986907958984375, 0.0189208984375, 0.034854888916015625, 0.05078887939453125, 0.06672286987304688, 0.0826568603515625, 0.09859085083007812, 0.11452484130859375, 0.13045883178710938, 0.146392822265625, 0.16232681274414062, 0.17826080322265625, 0.19419479370117188, 0.2101287841796875, 0.22606277465820312, 0.24199676513671875, 0.2579307556152344, 0.27386474609375, 0.2897987365722656, 0.30573272705078125, 0.3216667175292969, 0.3376007080078125, 0.3535346984863281, 0.36946868896484375, 0.3854026794433594, 0.401336669921875, 0.4172706604003906, 0.43320465087890625, 0.4491386413574219, 0.4650726318359375, 0.4810066223144531, 0.49694061279296875, 0.5128746032714844, 0.52880859375]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 6.0, 7.0, 10.0, 12.0, 14.0, 10.0, 17.0, 15.0, 16.0, 16.0, 27.0, 33.0, 23.0, 35.0, 41.0, 33.0, 35.0, 51.0, 39.0, 41.0, 28.0, 35.0, 38.0, 34.0, 26.0, 35.0, 40.0, 41.0, 29.0, 28.0, 21.0, 30.0, 22.0, 22.0, 13.0, 10.0, 11.0, 4.0, 7.0, 7.0, 11.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.521484375, -2.438751220703125, -2.35601806640625, -2.273284912109375, -2.1905517578125, -2.107818603515625, -2.02508544921875, -1.942352294921875, -1.859619140625, -1.776885986328125, -1.69415283203125, -1.611419677734375, -1.5286865234375, -1.445953369140625, -1.36322021484375, -1.280487060546875, -1.19775390625, -1.115020751953125, -1.03228759765625, -0.949554443359375, -0.8668212890625, -0.784088134765625, -0.70135498046875, -0.618621826171875, -0.535888671875, -0.453155517578125, -0.37042236328125, -0.287689208984375, -0.2049560546875, -0.122222900390625, -0.03948974609375, 0.043243408203125, 0.1259765625, 0.208709716796875, 0.29144287109375, 0.374176025390625, 0.4569091796875, 0.539642333984375, 0.62237548828125, 0.705108642578125, 0.787841796875, 0.870574951171875, 0.95330810546875, 1.036041259765625, 1.1187744140625, 1.201507568359375, 1.28424072265625, 1.366973876953125, 1.44970703125, 1.532440185546875, 1.61517333984375, 1.697906494140625, 1.7806396484375, 1.863372802734375, 1.94610595703125, 2.028839111328125, 2.111572265625, 2.194305419921875, 2.27703857421875, 2.359771728515625, 2.4425048828125, 2.525238037109375, 2.60797119140625, 2.690704345703125, 2.7734375]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 7.0, 9.0, 22.0, 15.0, 15.0, 33.0, 45.0, 67.0, 77.0, 99.0, 142.0, 195.0, 316.0, 449.0, 649.0, 1106.0, 2083.0, 4420.0, 11960.0, 48789.0, 928104.0, 32521.0, 9093.0, 3589.0, 1783.0, 962.0, 612.0, 428.0, 267.0, 182.0, 128.0, 82.0, 81.0, 59.0, 45.0, 28.0, 19.0, 13.0, 15.0, 10.0, 6.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.955169677734375, -1.89080810546875, -1.826446533203125, -1.7620849609375, -1.697723388671875, -1.63336181640625, -1.569000244140625, -1.504638671875, -1.440277099609375, -1.37591552734375, -1.311553955078125, -1.2471923828125, -1.182830810546875, -1.11846923828125, -1.054107666015625, -0.98974609375, -0.925384521484375, -0.86102294921875, -0.796661376953125, -0.7322998046875, -0.667938232421875, -0.60357666015625, -0.539215087890625, -0.474853515625, -0.410491943359375, -0.34613037109375, -0.281768798828125, -0.2174072265625, -0.153045654296875, -0.08868408203125, -0.024322509765625, 0.0400390625, 0.104400634765625, 0.16876220703125, 0.233123779296875, 0.2974853515625, 0.361846923828125, 0.42620849609375, 0.490570068359375, 0.554931640625, 0.619293212890625, 0.68365478515625, 0.748016357421875, 0.8123779296875, 0.876739501953125, 0.94110107421875, 1.005462646484375, 1.06982421875, 1.134185791015625, 1.19854736328125, 1.262908935546875, 1.3272705078125, 1.391632080078125, 1.45599365234375, 1.520355224609375, 1.584716796875, 1.649078369140625, 1.71343994140625, 1.777801513671875, 1.8421630859375, 1.906524658203125, 1.97088623046875, 2.035247802734375, 2.099609375]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 4.0, 3.0, 8.0, 2.0, 5.0, 9.0, 9.0, 17.0, 17.0, 14.0, 21.0, 19.0, 25.0, 36.0, 25.0, 24.0, 33.0, 41.0, 31.0, 44.0, 32.0, 41.0, 45.0, 53.0, 44.0, 43.0, 39.0, 44.0, 33.0, 30.0, 35.0, 24.0, 22.0, 21.0, 25.0, 17.0, 15.0, 10.0, 5.0, 12.0, 6.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7958984375, -1.7402191162109375, -1.684539794921875, -1.6288604736328125, -1.57318115234375, -1.5175018310546875, -1.461822509765625, -1.4061431884765625, -1.3504638671875, -1.2947845458984375, -1.239105224609375, -1.1834259033203125, -1.12774658203125, -1.0720672607421875, -1.016387939453125, -0.9607086181640625, -0.905029296875, -0.8493499755859375, -0.793670654296875, -0.7379913330078125, -0.68231201171875, -0.6266326904296875, -0.570953369140625, -0.5152740478515625, -0.4595947265625, -0.4039154052734375, -0.348236083984375, -0.2925567626953125, -0.23687744140625, -0.1811981201171875, -0.125518798828125, -0.0698394775390625, -0.01416015625, 0.0415191650390625, 0.097198486328125, 0.1528778076171875, 0.20855712890625, 0.2642364501953125, 0.319915771484375, 0.3755950927734375, 0.4312744140625, 0.4869537353515625, 0.542633056640625, 0.5983123779296875, 0.65399169921875, 0.7096710205078125, 0.765350341796875, 0.8210296630859375, 0.876708984375, 0.9323883056640625, 0.988067626953125, 1.0437469482421875, 1.09942626953125, 1.1551055908203125, 1.210784912109375, 1.2664642333984375, 1.3221435546875, 1.3778228759765625, 1.433502197265625, 1.4891815185546875, 1.54486083984375, 1.6005401611328125, 1.656219482421875, 1.7118988037109375, 1.767578125]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 11.0, 16.0, 20.0, 19.0, 43.0, 68.0, 83.0, 128.0, 234.0, 337.0, 626.0, 1122.0, 2371.0, 6366.0, 26305.0, 957853.0, 38807.0, 8272.0, 2826.0, 1340.0, 642.0, 379.0, 238.0, 128.0, 97.0, 74.0, 42.0, 37.0, 20.0, 10.0, 11.0, 10.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.210205078125, -0.203948974609375, -0.19769287109375, -0.191436767578125, -0.1851806640625, -0.178924560546875, -0.17266845703125, -0.166412353515625, -0.16015625, -0.153900146484375, -0.14764404296875, -0.141387939453125, -0.1351318359375, -0.128875732421875, -0.12261962890625, -0.116363525390625, -0.110107421875, -0.103851318359375, -0.09759521484375, -0.091339111328125, -0.0850830078125, -0.078826904296875, -0.07257080078125, -0.066314697265625, -0.06005859375, -0.053802490234375, -0.04754638671875, -0.041290283203125, -0.0350341796875, -0.028778076171875, -0.02252197265625, -0.016265869140625, -0.010009765625, -0.003753662109375, 0.00250244140625, 0.008758544921875, 0.0150146484375, 0.021270751953125, 0.02752685546875, 0.033782958984375, 0.0400390625, 0.046295166015625, 0.05255126953125, 0.058807373046875, 0.0650634765625, 0.071319580078125, 0.07757568359375, 0.083831787109375, 0.090087890625, 0.096343994140625, 0.10260009765625, 0.108856201171875, 0.1151123046875, 0.121368408203125, 0.12762451171875, 0.133880615234375, 0.14013671875, 0.146392822265625, 0.15264892578125, 0.158905029296875, 0.1651611328125, 0.171417236328125, 0.17767333984375, 0.183929443359375, 0.190185546875]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 4.0, 7.0, 5.0, 12.0, 12.0, 19.0, 15.0, 25.0, 33.0, 38.0, 37.0, 56.0, 66.0, 56.0, 81.0, 65.0, 68.0, 59.0, 71.0, 48.0, 42.0, 27.0, 28.0, 25.0, 18.0, 14.0, 10.0, 13.0, 4.0, 10.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.291534423828125e-05, -4.162639379501343e-05, -4.0337443351745605e-05, -3.904849290847778e-05, -3.775954246520996e-05, -3.647059202194214e-05, -3.5181641578674316e-05, -3.3892691135406494e-05, -3.260374069213867e-05, -3.131479024887085e-05, -3.0025839805603027e-05, -2.8736889362335205e-05, -2.7447938919067383e-05, -2.615898847579956e-05, -2.4870038032531738e-05, -2.3581087589263916e-05, -2.2292137145996094e-05, -2.100318670272827e-05, -1.971423625946045e-05, -1.8425285816192627e-05, -1.7136335372924805e-05, -1.5847384929656982e-05, -1.455843448638916e-05, -1.3269484043121338e-05, -1.1980533599853516e-05, -1.0691583156585693e-05, -9.402632713317871e-06, -8.113682270050049e-06, -6.8247318267822266e-06, -5.535781383514404e-06, -4.246830940246582e-06, -2.9578804969787598e-06, -1.6689300537109375e-06, -3.7997961044311523e-07, 9.08970832824707e-07, 2.1979212760925293e-06, 3.4868717193603516e-06, 4.775822162628174e-06, 6.064772605895996e-06, 7.353723049163818e-06, 8.64267349243164e-06, 9.931623935699463e-06, 1.1220574378967285e-05, 1.2509524822235107e-05, 1.379847526550293e-05, 1.5087425708770752e-05, 1.6376376152038574e-05, 1.7665326595306396e-05, 1.895427703857422e-05, 2.024322748184204e-05, 2.1532177925109863e-05, 2.2821128368377686e-05, 2.4110078811645508e-05, 2.539902925491333e-05, 2.6687979698181152e-05, 2.7976930141448975e-05, 2.9265880584716797e-05, 3.055483102798462e-05, 3.184378147125244e-05, 3.3132731914520264e-05, 3.4421682357788086e-05, 3.571063280105591e-05, 3.699958324432373e-05, 3.828853368759155e-05, 3.9577484130859375e-05]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 2.0, 13.0, 13.0, 13.0, 21.0, 61.0, 90.0, 477.0, 33292.0, 1004195.0, 9851.0, 285.0, 101.0, 44.0, 20.0, 12.0, 14.0, 5.0, 3.0, 5.0, 6.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.488037109375, -0.4714317321777344, -0.45482635498046875, -0.4382209777832031, -0.4216156005859375, -0.4050102233886719, -0.38840484619140625, -0.3717994689941406, -0.355194091796875, -0.3385887145996094, -0.32198333740234375, -0.3053779602050781, -0.2887725830078125, -0.2721672058105469, -0.25556182861328125, -0.23895645141601562, -0.22235107421875, -0.20574569702148438, -0.18914031982421875, -0.17253494262695312, -0.1559295654296875, -0.13932418823242188, -0.12271881103515625, -0.10611343383789062, -0.089508056640625, -0.07290267944335938, -0.05629730224609375, -0.039691925048828125, -0.0230865478515625, -0.006481170654296875, 0.01012420654296875, 0.026729583740234375, 0.0433349609375, 0.059940338134765625, 0.07654571533203125, 0.09315109252929688, 0.1097564697265625, 0.12636184692382812, 0.14296722412109375, 0.15957260131835938, 0.176177978515625, 0.19278335571289062, 0.20938873291015625, 0.22599411010742188, 0.2425994873046875, 0.2592048645019531, 0.27581024169921875, 0.2924156188964844, 0.30902099609375, 0.3256263732910156, 0.34223175048828125, 0.3588371276855469, 0.3754425048828125, 0.3920478820800781, 0.40865325927734375, 0.4252586364746094, 0.441864013671875, 0.4584693908691406, 0.47507476806640625, 0.4916801452636719, 0.5082855224609375, 0.5248908996582031, 0.5414962768554688, 0.5581016540527344, 0.57470703125]}, "gradients/decoder.roberta.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 12.0, 5.0, 6.0, 7.0, 13.0, 28.0, 33.0, 37.0, 49.0, 76.0, 71.0, 123.0, 123.0, 100.0, 84.0, 56.0, 34.0, 28.0, 20.0, 18.0, 23.0, 12.0, 7.0, 6.0, 8.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01885986328125, -0.018309593200683594, -0.017759323120117188, -0.01720905303955078, -0.016658782958984375, -0.01610851287841797, -0.015558242797851562, -0.015007972717285156, -0.01445770263671875, -0.013907432556152344, -0.013357162475585938, -0.012806892395019531, -0.012256622314453125, -0.011706352233886719, -0.011156082153320312, -0.010605812072753906, -0.0100555419921875, -0.009505271911621094, -0.008955001831054688, -0.008404731750488281, -0.007854461669921875, -0.007304191589355469, -0.0067539215087890625, -0.006203651428222656, -0.00565338134765625, -0.005103111267089844, -0.0045528411865234375, -0.004002571105957031, -0.003452301025390625, -0.0029020309448242188, -0.0023517608642578125, -0.0018014907836914062, -0.001251220703125, -0.0007009506225585938, -0.0001506805419921875, 0.00039958953857421875, 0.000949859619140625, 0.0015001296997070312, 0.0020503997802734375, 0.0026006698608398438, 0.00315093994140625, 0.0037012100219726562, 0.0042514801025390625, 0.004801750183105469, 0.005352020263671875, 0.005902290344238281, 0.0064525604248046875, 0.007002830505371094, 0.0075531005859375, 0.008103370666503906, 0.008653640747070312, 0.009203910827636719, 0.009754180908203125, 0.010304450988769531, 0.010854721069335938, 0.011404991149902344, 0.01195526123046875, 0.012505531311035156, 0.013055801391601562, 0.013606071472167969, 0.014156341552734375, 0.014706611633300781, 0.015256881713867188, 0.015807151794433594, 0.016357421875]}, "gradients/decoder.roberta.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 13.0, 29.0, 71.0, 110.0, 212.0, 188.0, 189.0, 110.0, 54.0, 21.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6760406494140625, -2.3942885398864746, -2.1125364303588867, -1.8307842016220093, -1.5490320920944214, -1.2672799825668335, -0.985527753829956, -0.7037756443023682, -0.4220235347747803, -0.14027139544487, 0.14148074388504028, 0.42323291301727295, 0.7049850225448608, 0.9867371320724487, 1.2684893608093262, 1.550241470336914, 1.831993579864502, 2.11374568939209, 2.3954977989196777, 2.6772499084472656, 2.9590020179748535, 3.2407541275024414, 3.5225064754486084, 3.8042585849761963, 4.086010932922363, 4.367763042449951, 4.649515151977539, 4.931267261505127, 5.213019371032715, 5.494771480560303, 5.776523590087891, 6.058276176452637, 6.340027809143066, 6.621779918670654, 6.903532028198242, 7.18528413772583, 7.467036247253418, 7.748788356781006, 8.030540466308594, 8.31229305267334, 8.59404468536377, 8.875797271728516, 9.157548904418945, 9.439301490783691, 9.721053123474121, 10.002805709838867, 10.284557342529297, 10.566309928894043, 10.848062515258789, 11.129815101623535, 11.411566734313965, 11.693319320678711, 11.97507095336914, 12.256823539733887, 12.538575172424316, 12.820327758789062, 13.102079391479492, 13.383831977844238, 13.665583610534668, 13.947336196899414, 14.229087829589844, 14.51084041595459, 14.79259204864502, 15.074344635009766, 15.356096267700195]}, "gradients/decoder.roberta.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 6.0, 7.0, 10.0, 12.0, 14.0, 10.0, 17.0, 15.0, 16.0, 15.0, 28.0, 32.0, 23.0, 37.0, 40.0, 34.0, 35.0, 49.0, 40.0, 43.0, 25.0, 35.0, 39.0, 33.0, 27.0, 35.0, 41.0, 39.0, 31.0, 27.0, 21.0, 30.0, 22.0, 22.0, 13.0, 10.0, 11.0, 4.0, 7.0, 7.0, 11.0, 4.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.5205140113830566, -2.4378206729888916, -2.3551273345947266, -2.2724339962005615, -2.1897406578063965, -2.1070473194122314, -2.0243539810180664, -1.9416605234146118, -1.8589671850204468, -1.7762738466262817, -1.6935805082321167, -1.6108871698379517, -1.528193712234497, -1.445500373840332, -1.362807035446167, -1.280113697052002, -1.197420358657837, -1.1147270202636719, -1.0320336818695068, -0.949340283870697, -0.866646945476532, -0.7839536070823669, -0.7012602090835571, -0.6185668706893921, -0.535873532295227, -0.453180193901062, -0.3704868257045746, -0.28779345750808716, -0.20510011911392212, -0.12240678071975708, -0.03971341252326965, 0.04297995567321777, 0.1256730556488037, 0.20836640894412994, 0.2910597622394562, 0.3737531304359436, 0.45644646883010864, 0.5391398072242737, 0.6218332052230835, 0.7045265436172485, 0.7872198820114136, 0.8699132204055786, 0.9526065587997437, 1.0352998971939087, 1.1179933547973633, 1.2006866931915283, 1.2833800315856934, 1.3660733699798584, 1.4487667083740234, 1.5314600467681885, 1.6141533851623535, 1.6968467235565186, 1.7795400619506836, 1.8622334003448486, 1.9449268579483032, 2.027620315551758, 2.1103134155273438, 2.193006753921509, 2.275700092315674, 2.358393430709839, 2.441086769104004, 2.523780107498169, 2.606473445892334, 2.689167022705078, 2.771860361099243]}, "gradients/decoder.roberta.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 11.0, 7.0, 10.0, 7.0, 15.0, 14.0, 16.0, 18.0, 21.0, 36.0, 34.0, 53.0, 117.0, 135.0, 331.0, 704.0, 2563.0, 13802.0, 96376.0, 559573.0, 319773.0, 45235.0, 7011.0, 1493.0, 513.0, 226.0, 111.0, 73.0, 54.0, 53.0, 33.0, 21.0, 18.0, 19.0, 12.0, 7.0, 10.0, 11.0, 6.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.81640625, -5.62762451171875, -5.4388427734375, -5.25006103515625, -5.061279296875, -4.87249755859375, -4.6837158203125, -4.49493408203125, -4.30615234375, -4.11737060546875, -3.9285888671875, -3.73980712890625, -3.551025390625, -3.36224365234375, -3.1734619140625, -2.98468017578125, -2.7958984375, -2.60711669921875, -2.4183349609375, -2.22955322265625, -2.040771484375, -1.85198974609375, -1.6632080078125, -1.47442626953125, -1.28564453125, -1.09686279296875, -0.9080810546875, -0.71929931640625, -0.530517578125, -0.34173583984375, -0.1529541015625, 0.03582763671875, 0.224609375, 0.41339111328125, 0.6021728515625, 0.79095458984375, 0.979736328125, 1.16851806640625, 1.3572998046875, 1.54608154296875, 1.73486328125, 1.92364501953125, 2.1124267578125, 2.30120849609375, 2.489990234375, 2.67877197265625, 2.8675537109375, 3.05633544921875, 3.2451171875, 3.43389892578125, 3.6226806640625, 3.81146240234375, 4.000244140625, 4.18902587890625, 4.3778076171875, 4.56658935546875, 4.75537109375, 4.94415283203125, 5.1329345703125, 5.32171630859375, 5.510498046875, 5.69927978515625, 5.8880615234375, 6.07684326171875, 6.265625]}, "gradients/decoder.roberta.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 0.0, 7.0, 8.0, 10.0, 4.0, 15.0, 13.0, 12.0, 13.0, 16.0, 12.0, 21.0, 23.0, 36.0, 24.0, 30.0, 34.0, 43.0, 41.0, 52.0, 39.0, 38.0, 32.0, 32.0, 39.0, 34.0, 26.0, 36.0, 45.0, 35.0, 30.0, 26.0, 32.0, 22.0, 22.0, 25.0, 8.0, 14.0, 8.0, 4.0, 8.0, 9.0, 6.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.52734375, -2.4444580078125, -2.361572265625, -2.2786865234375, -2.19580078125, -2.1129150390625, -2.030029296875, -1.9471435546875, -1.8642578125, -1.7813720703125, -1.698486328125, -1.6156005859375, -1.53271484375, -1.4498291015625, -1.366943359375, -1.2840576171875, -1.201171875, -1.1182861328125, -1.035400390625, -0.9525146484375, -0.86962890625, -0.7867431640625, -0.703857421875, -0.6209716796875, -0.5380859375, -0.4552001953125, -0.372314453125, -0.2894287109375, -0.20654296875, -0.1236572265625, -0.040771484375, 0.0421142578125, 0.125, 0.2078857421875, 0.290771484375, 0.3736572265625, 0.45654296875, 0.5394287109375, 0.622314453125, 0.7052001953125, 0.7880859375, 0.8709716796875, 0.953857421875, 1.0367431640625, 1.11962890625, 1.2025146484375, 1.285400390625, 1.3682861328125, 1.451171875, 1.5340576171875, 1.616943359375, 1.6998291015625, 1.78271484375, 1.8656005859375, 1.948486328125, 2.0313720703125, 2.1142578125, 2.1971435546875, 2.280029296875, 2.3629150390625, 2.44580078125, 2.5286865234375, 2.611572265625, 2.6944580078125, 2.77734375]}, "gradients/decoder.roberta.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 4.0, 3.0, 7.0, 7.0, 11.0, 15.0, 13.0, 15.0, 19.0, 17.0, 26.0, 36.0, 55.0, 41.0, 52.0, 64.0, 91.0, 137.0, 172.0, 24981.0, 1021808.0, 208.0, 171.0, 112.0, 83.0, 70.0, 43.0, 44.0, 46.0, 31.0, 23.0, 20.0, 16.0, 18.0, 16.0, 15.0, 7.0, 8.0, 6.0, 4.0, 7.0, 5.0, 6.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-86.5625, -83.947265625, -81.33203125, -78.716796875, -76.1015625, -73.486328125, -70.87109375, -68.255859375, -65.640625, -63.025390625, -60.41015625, -57.794921875, -55.1796875, -52.564453125, -49.94921875, -47.333984375, -44.71875, -42.103515625, -39.48828125, -36.873046875, -34.2578125, -31.642578125, -29.02734375, -26.412109375, -23.796875, -21.181640625, -18.56640625, -15.951171875, -13.3359375, -10.720703125, -8.10546875, -5.490234375, -2.875, -0.259765625, 2.35546875, 4.970703125, 7.5859375, 10.201171875, 12.81640625, 15.431640625, 18.046875, 20.662109375, 23.27734375, 25.892578125, 28.5078125, 31.123046875, 33.73828125, 36.353515625, 38.96875, 41.583984375, 44.19921875, 46.814453125, 49.4296875, 52.044921875, 54.66015625, 57.275390625, 59.890625, 62.505859375, 65.12109375, 67.736328125, 70.3515625, 72.966796875, 75.58203125, 78.197265625, 80.8125]}, "gradients/decoder.roberta.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 6.0, 4.0, 5.0, 5.0, 10.0, 17.0, 17.0, 20.0, 13.0, 23.0, 31.0, 24.0, 34.0, 39.0, 33.0, 33.0, 45.0, 44.0, 49.0, 35.0, 40.0, 37.0, 32.0, 42.0, 29.0, 36.0, 31.0, 38.0, 34.0, 29.0, 21.0, 18.0, 23.0, 12.0, 10.0, 15.0, 14.0, 8.0, 3.0, 4.0, 5.0, 5.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.70745849609375, -2.6160888671875, -2.52471923828125, -2.433349609375, -2.34197998046875, -2.2506103515625, -2.15924072265625, -2.06787109375, -1.97650146484375, -1.8851318359375, -1.79376220703125, -1.702392578125, -1.61102294921875, -1.5196533203125, -1.42828369140625, -1.3369140625, -1.24554443359375, -1.1541748046875, -1.06280517578125, -0.971435546875, -0.88006591796875, -0.7886962890625, -0.69732666015625, -0.60595703125, -0.51458740234375, -0.4232177734375, -0.33184814453125, -0.240478515625, -0.14910888671875, -0.0577392578125, 0.03363037109375, 0.125, 0.21636962890625, 0.3077392578125, 0.39910888671875, 0.490478515625, 0.58184814453125, 0.6732177734375, 0.76458740234375, 0.85595703125, 0.94732666015625, 1.0386962890625, 1.13006591796875, 1.221435546875, 1.31280517578125, 1.4041748046875, 1.49554443359375, 1.5869140625, 1.67828369140625, 1.7696533203125, 1.86102294921875, 1.952392578125, 2.04376220703125, 2.1351318359375, 2.22650146484375, 2.31787109375, 2.40924072265625, 2.5006103515625, 2.59197998046875, 2.683349609375, 2.77471923828125, 2.8660888671875, 2.95745849609375, 3.048828125]}, "gradients/decoder.roberta.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 17.0, 38.0, 62.0, 176.0, 651.0, 4117.0, 951266.0, 90138.0, 1511.0, 367.0, 108.0, 57.0, 21.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.859375, -5.52978515625, -5.2001953125, -4.87060546875, -4.541015625, -4.21142578125, -3.8818359375, -3.55224609375, -3.22265625, -2.89306640625, -2.5634765625, -2.23388671875, -1.904296875, -1.57470703125, -1.2451171875, -0.91552734375, -0.5859375, -0.25634765625, 0.0732421875, 0.40283203125, 0.732421875, 1.06201171875, 1.3916015625, 1.72119140625, 2.05078125, 2.38037109375, 2.7099609375, 3.03955078125, 3.369140625, 3.69873046875, 4.0283203125, 4.35791015625, 4.6875, 5.01708984375, 5.3466796875, 5.67626953125, 6.005859375, 6.33544921875, 6.6650390625, 6.99462890625, 7.32421875, 7.65380859375, 7.9833984375, 8.31298828125, 8.642578125, 8.97216796875, 9.3017578125, 9.63134765625, 9.9609375, 10.29052734375, 10.6201171875, 10.94970703125, 11.279296875, 11.60888671875, 11.9384765625, 12.26806640625, 12.59765625, 12.92724609375, 13.2568359375, 13.58642578125, 13.916015625, 14.24560546875, 14.5751953125, 14.90478515625, 15.234375]}, "gradients/decoder.roberta.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 6.0, 9.0, 28.0, 43.0, 53.0, 113.0, 210.0, 229.0, 139.0, 71.0, 44.0, 27.0, 14.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031828880310058594, -0.0003050602972507477, -0.0002918317914009094, -0.00027860328555107117, -0.0002653747797012329, -0.00025214627385139465, -0.0002389177680015564, -0.00022568926215171814, -0.00021246075630187988, -0.00019923225045204163, -0.00018600374460220337, -0.0001727752387523651, -0.00015954673290252686, -0.0001463182270526886, -0.00013308972120285034, -0.00011986121535301208, -0.00010663270950317383, -9.340420365333557e-05, -8.017569780349731e-05, -6.694719195365906e-05, -5.37186861038208e-05, -4.0490180253982544e-05, -2.7261674404144287e-05, -1.403316855430603e-05, -8.046627044677734e-07, 1.2423843145370483e-05, 2.565234899520874e-05, 3.8880854845047e-05, 5.2109360694885254e-05, 6.533786654472351e-05, 7.856637239456177e-05, 9.179487824440002e-05, 0.00010502338409423828, 0.00011825188994407654, 0.0001314803957939148, 0.00014470890164375305, 0.0001579374074935913, 0.00017116591334342957, 0.00018439441919326782, 0.00019762292504310608, 0.00021085143089294434, 0.0002240799367427826, 0.00023730844259262085, 0.0002505369484424591, 0.00026376545429229736, 0.0002769939601421356, 0.0002902224659919739, 0.00030345097184181213, 0.0003166794776916504, 0.00032990798354148865, 0.0003431364893913269, 0.00035636499524116516, 0.0003695935010910034, 0.0003828220069408417, 0.00039605051279067993, 0.0004092790186405182, 0.00042250752449035645, 0.0004357360303401947, 0.00044896453619003296, 0.0004621930420398712, 0.00047542154788970947, 0.0004886500537395477, 0.000501878559589386, 0.0005151070654392242, 0.0005283355712890625]}, "gradients/decoder.roberta.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 14.0, 11.0, 12.0, 18.0, 24.0, 54.0, 134.0, 1060.0, 853502.0, 192693.0, 755.0, 115.0, 62.0, 38.0, 17.0, 11.0, 15.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9765625, -13.4158935546875, -12.855224609375, -12.2945556640625, -11.73388671875, -11.1732177734375, -10.612548828125, -10.0518798828125, -9.4912109375, -8.9305419921875, -8.369873046875, -7.8092041015625, -7.24853515625, -6.6878662109375, -6.127197265625, -5.5665283203125, -5.005859375, -4.4451904296875, -3.884521484375, -3.3238525390625, -2.76318359375, -2.2025146484375, -1.641845703125, -1.0811767578125, -0.5205078125, 0.0401611328125, 0.600830078125, 1.1614990234375, 1.72216796875, 2.2828369140625, 2.843505859375, 3.4041748046875, 3.96484375, 4.5255126953125, 5.086181640625, 5.6468505859375, 6.20751953125, 6.7681884765625, 7.328857421875, 7.8895263671875, 8.4501953125, 9.0108642578125, 9.571533203125, 10.1322021484375, 10.69287109375, 11.2535400390625, 11.814208984375, 12.3748779296875, 12.935546875, 13.4962158203125, 14.056884765625, 14.6175537109375, 15.17822265625, 15.7388916015625, 16.299560546875, 16.8602294921875, 17.4208984375, 17.9815673828125, 18.542236328125, 19.1029052734375, 19.66357421875, 20.2242431640625, 20.784912109375, 21.3455810546875, 21.90625]}, "gradients/decoder.roberta.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 9.0, 9.0, 9.0, 17.0, 33.0, 65.0, 66.0, 106.0, 165.0, 194.0, 116.0, 73.0, 52.0, 18.0, 18.0, 15.0, 9.0, 12.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0869140625, -1.0604476928710938, -1.0339813232421875, -1.0075149536132812, -0.981048583984375, -0.9545822143554688, -0.9281158447265625, -0.9016494750976562, -0.87518310546875, -0.8487167358398438, -0.8222503662109375, -0.7957839965820312, -0.769317626953125, -0.7428512573242188, -0.7163848876953125, -0.6899185180664062, -0.6634521484375, -0.6369857788085938, -0.6105194091796875, -0.5840530395507812, -0.557586669921875, -0.5311203002929688, -0.5046539306640625, -0.47818756103515625, -0.45172119140625, -0.42525482177734375, -0.3987884521484375, -0.37232208251953125, -0.345855712890625, -0.31938934326171875, -0.2929229736328125, -0.26645660400390625, -0.239990234375, -0.21352386474609375, -0.1870574951171875, -0.16059112548828125, -0.134124755859375, -0.10765838623046875, -0.0811920166015625, -0.05472564697265625, -0.02825927734375, -0.00179290771484375, 0.0246734619140625, 0.05113983154296875, 0.077606201171875, 0.10407257080078125, 0.1305389404296875, 0.15700531005859375, 0.1834716796875, 0.20993804931640625, 0.2364044189453125, 0.26287078857421875, 0.289337158203125, 0.31580352783203125, 0.3422698974609375, 0.36873626708984375, 0.39520263671875, 0.42166900634765625, 0.4481353759765625, 0.47460174560546875, 0.501068115234375, 0.5275344848632812, 0.5540008544921875, 0.5804672241210938, 0.60693359375]}, "gradients/decoder.roberta.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 4.0, 21.0, 32.0, 43.0, 65.0, 83.0, 93.0, 119.0, 116.0, 112.0, 97.0, 87.0, 47.0, 37.0, 25.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.102502822875977, -6.917678356170654, -6.732853412628174, -6.548028945922852, -6.363204002380371, -6.178379535675049, -5.993555068969727, -5.808730125427246, -5.623905181884766, -5.439080715179443, -5.254255771636963, -5.069431304931641, -4.88460636138916, -4.699781894683838, -4.514957427978516, -4.330132484436035, -4.145308017730713, -3.9604833126068115, -3.77565860748291, -3.590834140777588, -3.4060091972351074, -3.221184730529785, -3.036360025405884, -2.8515353202819824, -2.666710615158081, -2.4818859100341797, -2.2970612049102783, -2.112236499786377, -1.9274119138717651, -1.7425872087478638, -1.557762622833252, -1.3729379177093506, -1.188112735748291, -1.0032880306243896, -0.8184633851051331, -0.6336387395858765, -0.4488140344619751, -0.26398932933807373, -0.07916474342346191, 0.10565996170043945, 0.2904846668243408, 0.4753093421459198, 0.6601340174674988, 0.8449586629867554, 1.0297833681106567, 1.214608073234558, 1.39943265914917, 1.5842573642730713, 1.7690820693969727, 1.953906774520874, 2.1387314796447754, 2.3235559463500977, 2.508380889892578, 2.6932053565979004, 2.8780300617218018, 3.062854766845703, 3.2476794719696045, 3.432504177093506, 3.6173288822174072, 3.8021535873413086, 3.986978054046631, 4.171802997589111, 4.356627464294434, 4.541452407836914, 4.726276874542236]}, "gradients/decoder.roberta.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 7.0, 5.0, 8.0, 7.0, 9.0, 12.0, 13.0, 29.0, 21.0, 18.0, 26.0, 21.0, 18.0, 17.0, 22.0, 25.0, 37.0, 37.0, 42.0, 46.0, 38.0, 38.0, 37.0, 44.0, 32.0, 26.0, 50.0, 46.0, 27.0, 34.0, 25.0, 23.0, 26.0, 23.0, 11.0, 13.0, 16.0, 10.0, 14.0, 11.0, 7.0, 4.0, 9.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.668219804763794, -3.569429397583008, -3.4706389904022217, -3.3718485832214355, -3.2730584144592285, -3.1742680072784424, -3.0754776000976562, -2.97668719291687, -2.877896785736084, -2.779106378555298, -2.6803159713745117, -2.5815255641937256, -2.4827351570129395, -2.3839449882507324, -2.2851545810699463, -2.18636417388916, -2.087573766708374, -1.988783359527588, -1.8899929523468018, -1.7912026643753052, -1.692412257194519, -1.593621850013733, -1.4948315620422363, -1.3960411548614502, -1.297250747680664, -1.198460340499878, -1.0996699333190918, -1.0008796453475952, -0.9020892381668091, -0.803298830986023, -0.7045084834098816, -0.6057181358337402, -0.506927490234375, -0.40813711285591125, -0.3093467354774475, -0.21055635809898376, -0.11176598072052002, -0.012975603342056274, 0.08581477403640747, 0.18460512161254883, 0.28339552879333496, 0.3821859061717987, 0.48097628355026245, 0.5797666311264038, 0.6785570383071899, 0.7773474454879761, 0.8761377930641174, 0.9749281406402588, 1.073718547821045, 1.172508955001831, 1.2712993621826172, 1.3700896501541138, 1.4688800573349, 1.567670464515686, 1.6664607524871826, 1.7652511596679688, 1.8640415668487549, 1.962831974029541, 2.061622381210327, 2.1604127883911133, 2.2592029571533203, 2.3579933643341064, 2.4567837715148926, 2.5555741786956787, 2.654364585876465]}, "gradients/decoder.roberta.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 3.0, 6.0, 2.0, 6.0, 8.0, 3.0, 11.0, 14.0, 13.0, 22.0, 30.0, 47.0, 50.0, 66.0, 80.0, 112.0, 167.0, 211.0, 348.0, 694.0, 1866.0, 7545.0, 71314.0, 2066093.0, 1966783.0, 67762.0, 7393.0, 1701.0, 687.0, 357.0, 235.0, 144.0, 117.0, 89.0, 70.0, 56.0, 34.0, 31.0, 21.0, 23.0, 19.0, 16.0, 8.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 4.0], "bins": [-8.1171875, -7.87115478515625, -7.6251220703125, -7.37908935546875, -7.133056640625, -6.88702392578125, -6.6409912109375, -6.39495849609375, -6.14892578125, -5.90289306640625, -5.6568603515625, -5.41082763671875, -5.164794921875, -4.91876220703125, -4.6727294921875, -4.42669677734375, -4.1806640625, -3.93463134765625, -3.6885986328125, -3.44256591796875, -3.196533203125, -2.95050048828125, -2.7044677734375, -2.45843505859375, -2.21240234375, -1.96636962890625, -1.7203369140625, -1.47430419921875, -1.228271484375, -0.98223876953125, -0.7362060546875, -0.49017333984375, -0.244140625, 0.00189208984375, 0.2479248046875, 0.49395751953125, 0.739990234375, 0.98602294921875, 1.2320556640625, 1.47808837890625, 1.72412109375, 1.97015380859375, 2.2161865234375, 2.46221923828125, 2.708251953125, 2.95428466796875, 3.2003173828125, 3.44635009765625, 3.6923828125, 3.93841552734375, 4.1844482421875, 4.43048095703125, 4.676513671875, 4.92254638671875, 5.1685791015625, 5.41461181640625, 5.66064453125, 5.90667724609375, 6.1527099609375, 6.39874267578125, 6.644775390625, 6.89080810546875, 7.1368408203125, 7.38287353515625, 7.62890625]}, "gradients/decoder.roberta.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 6.0, 7.0, 5.0, 5.0, 10.0, 7.0, 14.0, 10.0, 6.0, 18.0, 23.0, 21.0, 16.0, 22.0, 32.0, 19.0, 21.0, 30.0, 38.0, 46.0, 42.0, 45.0, 34.0, 45.0, 38.0, 29.0, 40.0, 38.0, 37.0, 35.0, 30.0, 23.0, 32.0, 28.0, 18.0, 23.0, 19.0, 18.0, 16.0, 11.0, 9.0, 10.0, 3.0, 4.0, 6.0, 3.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 4.0], "bins": [-2.3203125, -2.2493896484375, -2.178466796875, -2.1075439453125, -2.03662109375, -1.9656982421875, -1.894775390625, -1.8238525390625, -1.7529296875, -1.6820068359375, -1.611083984375, -1.5401611328125, -1.46923828125, -1.3983154296875, -1.327392578125, -1.2564697265625, -1.185546875, -1.1146240234375, -1.043701171875, -0.9727783203125, -0.90185546875, -0.8309326171875, -0.760009765625, -0.6890869140625, -0.6181640625, -0.5472412109375, -0.476318359375, -0.4053955078125, -0.33447265625, -0.2635498046875, -0.192626953125, -0.1217041015625, -0.05078125, 0.0201416015625, 0.091064453125, 0.1619873046875, 0.23291015625, 0.3038330078125, 0.374755859375, 0.4456787109375, 0.5166015625, 0.5875244140625, 0.658447265625, 0.7293701171875, 0.80029296875, 0.8712158203125, 0.942138671875, 1.0130615234375, 1.083984375, 1.1549072265625, 1.225830078125, 1.2967529296875, 1.36767578125, 1.4385986328125, 1.509521484375, 1.5804443359375, 1.6513671875, 1.7222900390625, 1.793212890625, 1.8641357421875, 1.93505859375, 2.0059814453125, 2.076904296875, 2.1478271484375, 2.21875]}, "gradients/decoder.roberta.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 5.0, 9.0, 22.0, 21.0, 42.0, 64.0, 78.0, 123.0, 210.0, 368.0, 1229.0, 192330.0, 3996041.0, 2596.0, 464.0, 257.0, 145.0, 76.0, 68.0, 34.0, 26.0, 15.0, 13.0, 11.0, 7.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.453125, -28.282470703125, -27.11181640625, -25.941162109375, -24.7705078125, -23.599853515625, -22.42919921875, -21.258544921875, -20.087890625, -18.917236328125, -17.74658203125, -16.575927734375, -15.4052734375, -14.234619140625, -13.06396484375, -11.893310546875, -10.72265625, -9.552001953125, -8.38134765625, -7.210693359375, -6.0400390625, -4.869384765625, -3.69873046875, -2.528076171875, -1.357421875, -0.186767578125, 0.98388671875, 2.154541015625, 3.3251953125, 4.495849609375, 5.66650390625, 6.837158203125, 8.0078125, 9.178466796875, 10.34912109375, 11.519775390625, 12.6904296875, 13.861083984375, 15.03173828125, 16.202392578125, 17.373046875, 18.543701171875, 19.71435546875, 20.885009765625, 22.0556640625, 23.226318359375, 24.39697265625, 25.567626953125, 26.73828125, 27.908935546875, 29.07958984375, 30.250244140625, 31.4208984375, 32.591552734375, 33.76220703125, 34.932861328125, 36.103515625, 37.274169921875, 38.44482421875, 39.615478515625, 40.7861328125, 41.956787109375, 43.12744140625, 44.298095703125, 45.46875]}, "gradients/decoder.roberta.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 5.0, 6.0, 5.0, 10.0, 9.0, 16.0, 31.0, 54.0, 57.0, 99.0, 173.0, 274.0, 430.0, 672.0, 832.0, 518.0, 335.0, 194.0, 103.0, 92.0, 58.0, 45.0, 17.0, 12.0, 14.0, 3.0, 4.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1875, -2.1316070556640625, -2.075714111328125, -2.0198211669921875, -1.96392822265625, -1.9080352783203125, -1.852142333984375, -1.7962493896484375, -1.7403564453125, -1.6844635009765625, -1.628570556640625, -1.5726776123046875, -1.51678466796875, -1.4608917236328125, -1.404998779296875, -1.3491058349609375, -1.293212890625, -1.2373199462890625, -1.181427001953125, -1.1255340576171875, -1.06964111328125, -1.0137481689453125, -0.957855224609375, -0.9019622802734375, -0.8460693359375, -0.7901763916015625, -0.734283447265625, -0.6783905029296875, -0.62249755859375, -0.5666046142578125, -0.510711669921875, -0.4548187255859375, -0.39892578125, -0.3430328369140625, -0.287139892578125, -0.2312469482421875, -0.17535400390625, -0.1194610595703125, -0.063568115234375, -0.0076751708984375, 0.0482177734375, 0.1041107177734375, 0.160003662109375, 0.2158966064453125, 0.27178955078125, 0.3276824951171875, 0.383575439453125, 0.4394683837890625, 0.495361328125, 0.5512542724609375, 0.607147216796875, 0.6630401611328125, 0.71893310546875, 0.7748260498046875, 0.830718994140625, 0.8866119384765625, 0.9425048828125, 0.9983978271484375, 1.054290771484375, 1.1101837158203125, 1.16607666015625, 1.2219696044921875, 1.277862548828125, 1.3337554931640625, 1.3896484375]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 12.0, 17.0, 17.0, 26.0, 44.0, 48.0, 76.0, 68.0, 85.0, 73.0, 78.0, 113.0, 69.0, 81.0, 49.0, 33.0, 33.0, 19.0, 16.0, 16.0, 12.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8248233795166016, -2.7081105709075928, -2.591398000717163, -2.4746851921081543, -2.3579723834991455, -2.2412595748901367, -2.124547004699707, -2.0078341960906982, -1.8911213874816895, -1.7744086980819702, -1.6576958894729614, -1.5409832000732422, -1.4242703914642334, -1.3075577020645142, -1.190845012664795, -1.0741322040557861, -0.9574195146560669, -0.8407067656517029, -0.7239940166473389, -0.6072813272476196, -0.4905685484409332, -0.3738558292388916, -0.2571430802345276, -0.14043033123016357, -0.02371758222579956, 0.09299515932798386, 0.20970790088176727, 0.3264206349849701, 0.4431333839893341, 0.5598461031913757, 0.6765588521957397, 0.7932716012001038, 0.9099843502044678, 1.026697039604187, 1.1434098482131958, 1.260122537612915, 1.3768353462219238, 1.493548035621643, 1.6102607250213623, 1.726973533630371, 1.8436863422393799, 1.9603990316390991, 2.0771117210388184, 2.193824529647827, 2.310537338256836, 2.4272499084472656, 2.5439627170562744, 2.660675525665283, 2.777388095855713, 2.8941009044647217, 3.0108134746551514, 3.12752628326416, 3.244239091873169, 3.3609519004821777, 3.4776644706726074, 3.594377279281616, 3.711090087890625, 3.827802896499634, 3.9445154666900635, 4.061228275299072, 4.177940845489502, 4.29465389251709, 4.4113664627075195, 4.528079032897949, 4.644792079925537]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 9.0, 5.0, 8.0, 6.0, 9.0, 12.0, 10.0, 10.0, 17.0, 22.0, 21.0, 15.0, 27.0, 28.0, 22.0, 27.0, 36.0, 40.0, 40.0, 31.0, 43.0, 39.0, 51.0, 30.0, 44.0, 44.0, 43.0, 27.0, 26.0, 37.0, 38.0, 21.0, 25.0, 19.0, 24.0, 18.0, 6.0, 18.0, 9.0, 13.0, 8.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5537259578704834, -2.4678046703338623, -2.381883144378662, -2.295961856842041, -2.210040330886841, -2.1241190433502197, -2.0381975173950195, -1.9522762298583984, -1.8663547039031982, -1.7804332971572876, -1.694511890411377, -1.6085904836654663, -1.5226690769195557, -1.436747670173645, -1.3508262634277344, -1.2649049758911133, -1.1789835691452026, -1.093062162399292, -1.0071407556533813, -0.9212193489074707, -0.8352979421615601, -0.7493765354156494, -0.6634551882743835, -0.5775337815284729, -0.49161237478256226, -0.4056909680366516, -0.31976956129074097, -0.2338481843471527, -0.14792677760124207, -0.06200537085533142, 0.023916006088256836, 0.10983741283416748, 0.19575881958007812, 0.28168022632598877, 0.3676016330718994, 0.45352301001548767, 0.5394444465637207, 0.6253658533096313, 0.7112872004508972, 0.7972086071968079, 0.8831300139427185, 0.9690514206886292, 1.054972767829895, 1.1408941745758057, 1.2268155813217163, 1.312736988067627, 1.3986583948135376, 1.4845798015594482, 1.5705012083053589, 1.6564226150512695, 1.7423440217971802, 1.8282654285430908, 1.9141868352890015, 2.000108242034912, 2.086029529571533, 2.1719510555267334, 2.2578723430633545, 2.3437936305999756, 2.429715156555176, 2.515636444091797, 2.601557970046997, 2.687479257583618, 2.7734007835388184, 2.8593220710754395, 2.9452435970306396]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 8.0, 7.0, 14.0, 14.0, 14.0, 29.0, 49.0, 60.0, 95.0, 125.0, 186.0, 246.0, 318.0, 468.0, 708.0, 976.0, 1371.0, 1900.0, 2707.0, 3902.0, 5742.0, 8544.0, 12597.0, 19347.0, 30481.0, 49411.0, 83338.0, 137975.0, 197668.0, 182078.0, 118178.0, 69609.0, 41874.0, 26384.0, 16903.0, 10933.0, 7506.0, 4996.0, 3519.0, 2455.0, 1703.0, 1183.0, 855.0, 611.0, 445.0, 325.0, 226.0, 121.0, 101.0, 67.0, 67.0, 44.0, 37.0, 16.0, 10.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.397705078125, -0.3848075866699219, -0.37191009521484375, -0.3590126037597656, -0.3461151123046875, -0.3332176208496094, -0.32032012939453125, -0.3074226379394531, -0.294525146484375, -0.2816276550292969, -0.26873016357421875, -0.2558326721191406, -0.2429351806640625, -0.23003768920898438, -0.21714019775390625, -0.20424270629882812, -0.19134521484375, -0.17844772338867188, -0.16555023193359375, -0.15265274047851562, -0.1397552490234375, -0.12685775756835938, -0.11396026611328125, -0.10106277465820312, -0.088165283203125, -0.07526779174804688, -0.06237030029296875, -0.049472808837890625, -0.0365753173828125, -0.023677825927734375, -0.01078033447265625, 0.002117156982421875, 0.0150146484375, 0.027912139892578125, 0.04080963134765625, 0.053707122802734375, 0.0666046142578125, 0.07950210571289062, 0.09239959716796875, 0.10529708862304688, 0.118194580078125, 0.13109207153320312, 0.14398956298828125, 0.15688705444335938, 0.1697845458984375, 0.18268203735351562, 0.19557952880859375, 0.20847702026367188, 0.22137451171875, 0.23427200317382812, 0.24716949462890625, 0.2600669860839844, 0.2729644775390625, 0.2858619689941406, 0.29875946044921875, 0.3116569519042969, 0.324554443359375, 0.3374519348144531, 0.35034942626953125, 0.3632469177246094, 0.3761444091796875, 0.3890419006347656, 0.40193939208984375, 0.4148368835449219, 0.427734375]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 8.0, 6.0, 9.0, 12.0, 9.0, 12.0, 18.0, 20.0, 21.0, 14.0, 30.0, 26.0, 21.0, 28.0, 36.0, 39.0, 41.0, 32.0, 41.0, 40.0, 49.0, 30.0, 45.0, 43.0, 46.0, 26.0, 25.0, 38.0, 38.0, 19.0, 28.0, 18.0, 24.0, 16.0, 7.0, 18.0, 10.0, 12.0, 9.0, 7.0, 5.0, 8.0, 3.0, 1.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.640625, -2.5565185546875, -2.472412109375, -2.3883056640625, -2.30419921875, -2.2200927734375, -2.135986328125, -2.0518798828125, -1.9677734375, -1.8836669921875, -1.799560546875, -1.7154541015625, -1.63134765625, -1.5472412109375, -1.463134765625, -1.3790283203125, -1.294921875, -1.2108154296875, -1.126708984375, -1.0426025390625, -0.95849609375, -0.8743896484375, -0.790283203125, -0.7061767578125, -0.6220703125, -0.5379638671875, -0.453857421875, -0.3697509765625, -0.28564453125, -0.2015380859375, -0.117431640625, -0.0333251953125, 0.05078125, 0.1348876953125, 0.218994140625, 0.3031005859375, 0.38720703125, 0.4713134765625, 0.555419921875, 0.6395263671875, 0.7236328125, 0.8077392578125, 0.891845703125, 0.9759521484375, 1.06005859375, 1.1441650390625, 1.228271484375, 1.3123779296875, 1.396484375, 1.4805908203125, 1.564697265625, 1.6488037109375, 1.73291015625, 1.8170166015625, 1.901123046875, 1.9852294921875, 2.0693359375, 2.1534423828125, 2.237548828125, 2.3216552734375, 2.40576171875, 2.4898681640625, 2.573974609375, 2.6580810546875, 2.7421875]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 5.0, 9.0, 13.0, 15.0, 22.0, 19.0, 29.0, 39.0, 58.0, 84.0, 105.0, 145.0, 192.0, 282.0, 396.0, 596.0, 929.0, 1603.0, 3194.0, 7385.0, 21253.0, 95340.0, 878214.0, 22751.0, 7763.0, 3318.0, 1689.0, 976.0, 645.0, 420.0, 265.0, 202.0, 183.0, 106.0, 90.0, 55.0, 37.0, 29.0, 26.0, 11.0, 11.0, 16.0, 6.0, 8.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6181640625, -1.5676422119140625, -1.517120361328125, -1.4665985107421875, -1.41607666015625, -1.3655548095703125, -1.315032958984375, -1.2645111083984375, -1.2139892578125, -1.1634674072265625, -1.112945556640625, -1.0624237060546875, -1.01190185546875, -0.9613800048828125, -0.910858154296875, -0.8603363037109375, -0.809814453125, -0.7592926025390625, -0.708770751953125, -0.6582489013671875, -0.60772705078125, -0.5572052001953125, -0.506683349609375, -0.4561614990234375, -0.4056396484375, -0.3551177978515625, -0.304595947265625, -0.2540740966796875, -0.20355224609375, -0.1530303955078125, -0.102508544921875, -0.0519866943359375, -0.00146484375, 0.0490570068359375, 0.099578857421875, 0.1501007080078125, 0.20062255859375, 0.2511444091796875, 0.301666259765625, 0.3521881103515625, 0.4027099609375, 0.4532318115234375, 0.503753662109375, 0.5542755126953125, 0.60479736328125, 0.6553192138671875, 0.705841064453125, 0.7563629150390625, 0.806884765625, 0.8574066162109375, 0.907928466796875, 0.9584503173828125, 1.00897216796875, 1.0594940185546875, 1.110015869140625, 1.1605377197265625, 1.2110595703125, 1.2615814208984375, 1.312103271484375, 1.3626251220703125, 1.41314697265625, 1.4636688232421875, 1.514190673828125, 1.5647125244140625, 1.615234375]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 9.0, 10.0, 6.0, 10.0, 14.0, 16.0, 11.0, 19.0, 29.0, 16.0, 21.0, 28.0, 20.0, 32.0, 35.0, 34.0, 43.0, 42.0, 48.0, 44.0, 37.0, 37.0, 43.0, 33.0, 41.0, 25.0, 26.0, 22.0, 28.0, 22.0, 28.0, 29.0, 20.0, 17.0, 21.0, 13.0, 5.0, 10.0, 10.0, 8.0, 13.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4560546875, -1.4042816162109375, -1.352508544921875, -1.3007354736328125, -1.24896240234375, -1.1971893310546875, -1.145416259765625, -1.0936431884765625, -1.0418701171875, -0.9900970458984375, -0.938323974609375, -0.8865509033203125, -0.83477783203125, -0.7830047607421875, -0.731231689453125, -0.6794586181640625, -0.627685546875, -0.5759124755859375, -0.524139404296875, -0.4723663330078125, -0.42059326171875, -0.3688201904296875, -0.317047119140625, -0.2652740478515625, -0.2135009765625, -0.1617279052734375, -0.109954833984375, -0.0581817626953125, -0.00640869140625, 0.0453643798828125, 0.097137451171875, 0.1489105224609375, 0.20068359375, 0.2524566650390625, 0.304229736328125, 0.3560028076171875, 0.40777587890625, 0.4595489501953125, 0.511322021484375, 0.5630950927734375, 0.6148681640625, 0.6666412353515625, 0.718414306640625, 0.7701873779296875, 0.82196044921875, 0.8737335205078125, 0.925506591796875, 0.9772796630859375, 1.029052734375, 1.0808258056640625, 1.132598876953125, 1.1843719482421875, 1.23614501953125, 1.2879180908203125, 1.339691162109375, 1.3914642333984375, 1.4432373046875, 1.4950103759765625, 1.546783447265625, 1.5985565185546875, 1.65032958984375, 1.7021026611328125, 1.753875732421875, 1.8056488037109375, 1.857421875]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 5.0, 7.0, 5.0, 10.0, 12.0, 35.0, 29.0, 41.0, 47.0, 51.0, 83.0, 110.0, 154.0, 253.0, 322.0, 484.0, 807.0, 1363.0, 2456.0, 5469.0, 14652.0, 67044.0, 918221.0, 21927.0, 7298.0, 3233.0, 1599.0, 959.0, 584.0, 368.0, 255.0, 184.0, 140.0, 73.0, 62.0, 54.0, 37.0, 32.0, 20.0, 20.0, 14.0, 7.0, 8.0, 5.0, 1.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1749267578125, -0.1693134307861328, -0.16370010375976562, -0.15808677673339844, -0.15247344970703125, -0.14686012268066406, -0.14124679565429688, -0.1356334686279297, -0.1300201416015625, -0.12440681457519531, -0.11879348754882812, -0.11318016052246094, -0.10756683349609375, -0.10195350646972656, -0.09634017944335938, -0.09072685241699219, -0.085113525390625, -0.07950019836425781, -0.07388687133789062, -0.06827354431152344, -0.06266021728515625, -0.05704689025878906, -0.051433563232421875, -0.04582023620605469, -0.0402069091796875, -0.03459358215332031, -0.028980255126953125, -0.023366928100585938, -0.01775360107421875, -0.012140274047851562, -0.006526947021484375, -0.0009136199951171875, 0.00469970703125, 0.010313034057617188, 0.015926361083984375, 0.021539688110351562, 0.02715301513671875, 0.03276634216308594, 0.038379669189453125, 0.04399299621582031, 0.0496063232421875, 0.05521965026855469, 0.060832977294921875, 0.06644630432128906, 0.07205963134765625, 0.07767295837402344, 0.08328628540039062, 0.08889961242675781, 0.094512939453125, 0.10012626647949219, 0.10573959350585938, 0.11135292053222656, 0.11696624755859375, 0.12257957458496094, 0.12819290161132812, 0.1338062286376953, 0.1394195556640625, 0.1450328826904297, 0.15064620971679688, 0.15625953674316406, 0.16187286376953125, 0.16748619079589844, 0.17309951782226562, 0.1787128448486328, 0.184326171875]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 18.0, 18.0, 16.0, 23.0, 25.0, 34.0, 38.0, 49.0, 59.0, 67.0, 65.0, 70.0, 64.0, 74.0, 60.0, 57.0, 45.0, 43.0, 36.0, 27.0, 14.0, 15.0, 14.0, 8.0, 5.0, 9.0, 2.0, 10.0, 10.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.855062484741211e-05, -2.7531757950782776e-05, -2.6512891054153442e-05, -2.549402415752411e-05, -2.4475157260894775e-05, -2.3456290364265442e-05, -2.243742346763611e-05, -2.1418556571006775e-05, -2.039968967437744e-05, -1.9380822777748108e-05, -1.8361955881118774e-05, -1.734308898448944e-05, -1.6324222087860107e-05, -1.5305355191230774e-05, -1.428648829460144e-05, -1.3267621397972107e-05, -1.2248754501342773e-05, -1.122988760471344e-05, -1.0211020708084106e-05, -9.192153811454773e-06, -8.17328691482544e-06, -7.154420018196106e-06, -6.1355531215667725e-06, -5.116686224937439e-06, -4.0978193283081055e-06, -3.078952431678772e-06, -2.0600855350494385e-06, -1.041218638420105e-06, -2.2351741790771484e-08, 9.96515154838562e-07, 2.0153820514678955e-06, 3.034248948097229e-06, 4.0531158447265625e-06, 5.071982741355896e-06, 6.0908496379852295e-06, 7.109716534614563e-06, 8.128583431243896e-06, 9.14745032787323e-06, 1.0166317224502563e-05, 1.1185184121131897e-05, 1.220405101776123e-05, 1.3222917914390564e-05, 1.4241784811019897e-05, 1.526065170764923e-05, 1.6279518604278564e-05, 1.7298385500907898e-05, 1.831725239753723e-05, 1.9336119294166565e-05, 2.03549861907959e-05, 2.1373853087425232e-05, 2.2392719984054565e-05, 2.34115868806839e-05, 2.4430453777313232e-05, 2.5449320673942566e-05, 2.64681875705719e-05, 2.7487054467201233e-05, 2.8505921363830566e-05, 2.95247882604599e-05, 3.0543655157089233e-05, 3.156252205371857e-05, 3.25813889503479e-05, 3.3600255846977234e-05, 3.461912274360657e-05, 3.56379896402359e-05, 3.6656856536865234e-05]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 8.0, 6.0, 21.0, 18.0, 19.0, 38.0, 84.0, 106.0, 418.0, 8503.0, 1013664.0, 24759.0, 517.0, 149.0, 79.0, 36.0, 21.0, 23.0, 13.0, 11.0, 13.0, 2.0, 7.0, 5.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61083984375, -0.5915069580078125, -0.572174072265625, -0.5528411865234375, -0.53350830078125, -0.5141754150390625, -0.494842529296875, -0.4755096435546875, -0.4561767578125, -0.4368438720703125, -0.417510986328125, -0.3981781005859375, -0.37884521484375, -0.3595123291015625, -0.340179443359375, -0.3208465576171875, -0.301513671875, -0.2821807861328125, -0.262847900390625, -0.2435150146484375, -0.22418212890625, -0.2048492431640625, -0.185516357421875, -0.1661834716796875, -0.1468505859375, -0.1275177001953125, -0.108184814453125, -0.0888519287109375, -0.06951904296875, -0.0501861572265625, -0.030853271484375, -0.0115203857421875, 0.0078125, 0.0271453857421875, 0.046478271484375, 0.0658111572265625, 0.08514404296875, 0.1044769287109375, 0.123809814453125, 0.1431427001953125, 0.1624755859375, 0.1818084716796875, 0.201141357421875, 0.2204742431640625, 0.23980712890625, 0.2591400146484375, 0.278472900390625, 0.2978057861328125, 0.317138671875, 0.3364715576171875, 0.355804443359375, 0.3751373291015625, 0.39447021484375, 0.4138031005859375, 0.433135986328125, 0.4524688720703125, 0.4718017578125, 0.4911346435546875, 0.510467529296875, 0.5298004150390625, 0.54913330078125, 0.5684661865234375, 0.587799072265625, 0.6071319580078125, 0.62646484375]}, "gradients/decoder.roberta.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 4.0, 5.0, 8.0, 10.0, 6.0, 15.0, 22.0, 20.0, 26.0, 43.0, 57.0, 66.0, 154.0, 144.0, 125.0, 78.0, 53.0, 41.0, 32.0, 18.0, 19.0, 15.0, 10.0, 9.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0306396484375, -0.02969646453857422, -0.028753280639648438, -0.027810096740722656, -0.026866912841796875, -0.025923728942871094, -0.024980545043945312, -0.02403736114501953, -0.02309417724609375, -0.02215099334716797, -0.021207809448242188, -0.020264625549316406, -0.019321441650390625, -0.018378257751464844, -0.017435073852539062, -0.01649188995361328, -0.0155487060546875, -0.014605522155761719, -0.013662338256835938, -0.012719154357910156, -0.011775970458984375, -0.010832786560058594, -0.009889602661132812, -0.008946418762207031, -0.00800323486328125, -0.007060050964355469, -0.0061168670654296875, -0.005173683166503906, -0.004230499267578125, -0.0032873153686523438, -0.0023441314697265625, -0.0014009475708007812, -0.000457763671875, 0.00048542022705078125, 0.0014286041259765625, 0.0023717880249023438, 0.003314971923828125, 0.004258155822753906, 0.0052013397216796875, 0.006144523620605469, 0.00708770751953125, 0.008030891418457031, 0.008974075317382812, 0.009917259216308594, 0.010860443115234375, 0.011803627014160156, 0.012746810913085938, 0.013689994812011719, 0.0146331787109375, 0.015576362609863281, 0.016519546508789062, 0.017462730407714844, 0.018405914306640625, 0.019349098205566406, 0.020292282104492188, 0.02123546600341797, 0.02217864990234375, 0.02312183380126953, 0.024065017700195312, 0.025008201599121094, 0.025951385498046875, 0.026894569396972656, 0.027837753295898438, 0.02878093719482422, 0.02972412109375]}, "gradients/decoder.roberta.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 11.0, 15.0, 23.0, 32.0, 42.0, 43.0, 67.0, 63.0, 69.0, 82.0, 87.0, 75.0, 89.0, 64.0, 59.0, 44.0, 33.0, 21.0, 20.0, 15.0, 16.0, 7.0, 10.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2752368450164795, -2.169095516204834, -2.0629544258117676, -1.956813097000122, -1.8506718873977661, -1.7445306777954102, -1.6383893489837646, -1.5322481393814087, -1.4261069297790527, -1.3199657201766968, -1.2138245105743408, -1.1076831817626953, -1.0015419721603394, -0.8954007625579834, -0.7892594933509827, -0.6831182241439819, -0.576977014541626, -0.47083577513694763, -0.3646945357322693, -0.25855329632759094, -0.1524120569229126, -0.04627084732055664, 0.05987042188644409, 0.16601169109344482, 0.2721529006958008, 0.3782941401004791, 0.48443537950515747, 0.5905766487121582, 0.6967178583145142, 0.8028590679168701, 0.9090003371238708, 1.0151416063308716, 1.1212830543518066, 1.2274242639541626, 1.3335654735565186, 1.439706802368164, 1.54584801197052, 1.651989221572876, 1.7581305503845215, 1.8642717599868774, 1.9704129695892334, 2.076554298400879, 2.1826953887939453, 2.288836717605591, 2.3949780464172363, 2.5011191368103027, 2.6072604656219482, 2.7134017944335938, 2.81954288482666, 2.9256842136383057, 3.031825304031372, 3.1379666328430176, 3.244107723236084, 3.3502490520477295, 3.456390380859375, 3.5625314712524414, 3.668672800064087, 3.7748141288757324, 3.880955219268799, 3.9870965480804443, 4.09323787689209, 4.199378967285156, 4.305520057678223, 4.411661624908447, 4.517802715301514]}, "gradients/decoder.roberta.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 6.0, 8.0, 6.0, 9.0, 12.0, 9.0, 11.0, 19.0, 20.0, 21.0, 15.0, 31.0, 24.0, 21.0, 28.0, 38.0, 36.0, 41.0, 34.0, 39.0, 41.0, 51.0, 29.0, 43.0, 46.0, 44.0, 26.0, 27.0, 38.0, 36.0, 21.0, 27.0, 17.0, 24.0, 17.0, 8.0, 17.0, 9.0, 12.0, 9.0, 8.0, 4.0, 7.0, 4.0, 1.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6424121856689453, -2.558215379714966, -2.4740185737609863, -2.389821767807007, -2.3056249618530273, -2.221428155899048, -2.1372313499450684, -2.0530343055725098, -1.9688376188278198, -1.8846408128738403, -1.8004440069198608, -1.7162470817565918, -1.6320502758026123, -1.5478534698486328, -1.4636566638946533, -1.3794598579406738, -1.2952630519866943, -1.2110662460327148, -1.1268694400787354, -1.0426726341247559, -0.9584757685661316, -0.8742789626121521, -0.7900820970535278, -0.7058852910995483, -0.6216884851455688, -0.5374916791915894, -0.4532948434352875, -0.3690980076789856, -0.2849012017250061, -0.2007043957710266, -0.11650753021240234, -0.03231072425842285, 0.05188608169555664, 0.13608290255069733, 0.220279723405838, 0.3044765591621399, 0.3886733651161194, 0.4728701710700989, 0.5570670366287231, 0.6412638425827026, 0.7254606485366821, 0.8096574544906616, 0.8938542604446411, 0.9780511260032654, 1.0622479915618896, 1.1464447975158691, 1.2306416034698486, 1.3148384094238281, 1.3990352153778076, 1.483232021331787, 1.5674288272857666, 1.651625633239746, 1.7358224391937256, 1.820019245147705, 1.9042161703109741, 1.9884129762649536, 2.0726099014282227, 2.156806707382202, 2.2410035133361816, 2.325200319290161, 2.4093971252441406, 2.49359393119812, 2.5777907371520996, 2.661987781524658, 2.7461843490600586]}, "gradients/decoder.roberta.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 8.0, 10.0, 13.0, 14.0, 17.0, 21.0, 35.0, 66.0, 76.0, 112.0, 174.0, 290.0, 513.0, 852.0, 1466.0, 2788.0, 5194.0, 9844.0, 19020.0, 37909.0, 77971.0, 178956.0, 350953.0, 194542.0, 84311.0, 40455.0, 20198.0, 10535.0, 5471.0, 2878.0, 1574.0, 872.0, 528.0, 293.0, 199.0, 132.0, 78.0, 51.0, 40.0, 26.0, 24.0, 10.0, 7.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9921875, -1.926971435546875, -1.86175537109375, -1.796539306640625, -1.7313232421875, -1.666107177734375, -1.60089111328125, -1.535675048828125, -1.470458984375, -1.405242919921875, -1.34002685546875, -1.274810791015625, -1.2095947265625, -1.144378662109375, -1.07916259765625, -1.013946533203125, -0.94873046875, -0.883514404296875, -0.81829833984375, -0.753082275390625, -0.6878662109375, -0.622650146484375, -0.55743408203125, -0.492218017578125, -0.427001953125, -0.361785888671875, -0.29656982421875, -0.231353759765625, -0.1661376953125, -0.100921630859375, -0.03570556640625, 0.029510498046875, 0.0947265625, 0.159942626953125, 0.22515869140625, 0.290374755859375, 0.3555908203125, 0.420806884765625, 0.48602294921875, 0.551239013671875, 0.616455078125, 0.681671142578125, 0.74688720703125, 0.812103271484375, 0.8773193359375, 0.942535400390625, 1.00775146484375, 1.072967529296875, 1.13818359375, 1.203399658203125, 1.26861572265625, 1.333831787109375, 1.3990478515625, 1.464263916015625, 1.52947998046875, 1.594696044921875, 1.659912109375, 1.725128173828125, 1.79034423828125, 1.855560302734375, 1.9207763671875, 1.985992431640625, 2.05120849609375, 2.116424560546875, 2.181640625]}, "gradients/decoder.roberta.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 9.0, 9.0, 6.0, 9.0, 13.0, 6.0, 14.0, 22.0, 14.0, 25.0, 15.0, 27.0, 24.0, 26.0, 24.0, 37.0, 39.0, 37.0, 34.0, 42.0, 43.0, 39.0, 39.0, 44.0, 40.0, 44.0, 24.0, 36.0, 39.0, 31.0, 22.0, 28.0, 16.0, 23.0, 17.0, 10.0, 15.0, 10.0, 13.0, 11.0, 5.0, 4.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.462890625, -2.384490966796875, -2.30609130859375, -2.227691650390625, -2.1492919921875, -2.070892333984375, -1.99249267578125, -1.914093017578125, -1.835693359375, -1.757293701171875, -1.67889404296875, -1.600494384765625, -1.5220947265625, -1.443695068359375, -1.36529541015625, -1.286895751953125, -1.20849609375, -1.130096435546875, -1.05169677734375, -0.973297119140625, -0.8948974609375, -0.816497802734375, -0.73809814453125, -0.659698486328125, -0.581298828125, -0.502899169921875, -0.42449951171875, -0.346099853515625, -0.2677001953125, -0.189300537109375, -0.11090087890625, -0.032501220703125, 0.0458984375, 0.124298095703125, 0.20269775390625, 0.281097412109375, 0.3594970703125, 0.437896728515625, 0.51629638671875, 0.594696044921875, 0.673095703125, 0.751495361328125, 0.82989501953125, 0.908294677734375, 0.9866943359375, 1.065093994140625, 1.14349365234375, 1.221893310546875, 1.30029296875, 1.378692626953125, 1.45709228515625, 1.535491943359375, 1.6138916015625, 1.692291259765625, 1.77069091796875, 1.849090576171875, 1.927490234375, 2.005889892578125, 2.08428955078125, 2.162689208984375, 2.2410888671875, 2.319488525390625, 2.39788818359375, 2.476287841796875, 2.5546875]}, "gradients/decoder.roberta.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 6.0, 7.0, 4.0, 9.0, 15.0, 14.0, 15.0, 20.0, 32.0, 41.0, 55.0, 61.0, 76.0, 114.0, 132.0, 171.0, 480.0, 1046359.0, 234.0, 146.0, 137.0, 91.0, 69.0, 52.0, 46.0, 49.0, 33.0, 22.0, 14.0, 7.0, 11.0, 4.0, 5.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-104.1875, -101.15625, -98.125, -95.09375, -92.0625, -89.03125, -86.0, -82.96875, -79.9375, -76.90625, -73.875, -70.84375, -67.8125, -64.78125, -61.75, -58.71875, -55.6875, -52.65625, -49.625, -46.59375, -43.5625, -40.53125, -37.5, -34.46875, -31.4375, -28.40625, -25.375, -22.34375, -19.3125, -16.28125, -13.25, -10.21875, -7.1875, -4.15625, -1.125, 1.90625, 4.9375, 7.96875, 11.0, 14.03125, 17.0625, 20.09375, 23.125, 26.15625, 29.1875, 32.21875, 35.25, 38.28125, 41.3125, 44.34375, 47.375, 50.40625, 53.4375, 56.46875, 59.5, 62.53125, 65.5625, 68.59375, 71.625, 74.65625, 77.6875, 80.71875, 83.75, 86.78125, 89.8125]}, "gradients/decoder.roberta.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 8.0, 5.0, 6.0, 8.0, 11.0, 10.0, 23.0, 33.0, 44.0, 32.0, 40.0, 38.0, 49.0, 47.0, 48.0, 51.0, 60.0, 49.0, 58.0, 60.0, 47.0, 47.0, 36.0, 40.0, 32.0, 22.0, 20.0, 15.0, 17.0, 11.0, 6.0, 3.0, 8.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.40234375, -3.2906494140625, -3.178955078125, -3.0672607421875, -2.95556640625, -2.8438720703125, -2.732177734375, -2.6204833984375, -2.5087890625, -2.3970947265625, -2.285400390625, -2.1737060546875, -2.06201171875, -1.9503173828125, -1.838623046875, -1.7269287109375, -1.615234375, -1.5035400390625, -1.391845703125, -1.2801513671875, -1.16845703125, -1.0567626953125, -0.945068359375, -0.8333740234375, -0.7216796875, -0.6099853515625, -0.498291015625, -0.3865966796875, -0.27490234375, -0.1632080078125, -0.051513671875, 0.0601806640625, 0.171875, 0.2835693359375, 0.395263671875, 0.5069580078125, 0.61865234375, 0.7303466796875, 0.842041015625, 0.9537353515625, 1.0654296875, 1.1771240234375, 1.288818359375, 1.4005126953125, 1.51220703125, 1.6239013671875, 1.735595703125, 1.8472900390625, 1.958984375, 2.0706787109375, 2.182373046875, 2.2940673828125, 2.40576171875, 2.5174560546875, 2.629150390625, 2.7408447265625, 2.8525390625, 2.9642333984375, 3.075927734375, 3.1876220703125, 3.29931640625, 3.4110107421875, 3.522705078125, 3.6343994140625, 3.74609375]}, "gradients/decoder.roberta.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 6.0, 7.0, 15.0, 43.0, 65.0, 161.0, 345.0, 1190.0, 8001.0, 680144.0, 351049.0, 5927.0, 969.0, 333.0, 124.0, 81.0, 31.0, 23.0, 17.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7734375, -7.54443359375, -7.3154296875, -7.08642578125, -6.857421875, -6.62841796875, -6.3994140625, -6.17041015625, -5.94140625, -5.71240234375, -5.4833984375, -5.25439453125, -5.025390625, -4.79638671875, -4.5673828125, -4.33837890625, -4.109375, -3.88037109375, -3.6513671875, -3.42236328125, -3.193359375, -2.96435546875, -2.7353515625, -2.50634765625, -2.27734375, -2.04833984375, -1.8193359375, -1.59033203125, -1.361328125, -1.13232421875, -0.9033203125, -0.67431640625, -0.4453125, -0.21630859375, 0.0126953125, 0.24169921875, 0.470703125, 0.69970703125, 0.9287109375, 1.15771484375, 1.38671875, 1.61572265625, 1.8447265625, 2.07373046875, 2.302734375, 2.53173828125, 2.7607421875, 2.98974609375, 3.21875, 3.44775390625, 3.6767578125, 3.90576171875, 4.134765625, 4.36376953125, 4.5927734375, 4.82177734375, 5.05078125, 5.27978515625, 5.5087890625, 5.73779296875, 5.966796875, 6.19580078125, 6.4248046875, 6.65380859375, 6.8828125]}, "gradients/decoder.roberta.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 2.0, 6.0, 9.0, 12.0, 34.0, 38.0, 57.0, 116.0, 225.0, 224.0, 104.0, 76.0, 43.0, 19.0, 17.0, 11.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021529197692871094, -0.00020395591855049133, -0.00019261986017227173, -0.00018128380179405212, -0.00016994774341583252, -0.00015861168503761292, -0.0001472756266593933, -0.0001359395682811737, -0.0001246035099029541, -0.0001132674515247345, -0.00010193139314651489, -9.059533476829529e-05, -7.925927639007568e-05, -6.792321801185608e-05, -5.6587159633636475e-05, -4.525110125541687e-05, -3.3915042877197266e-05, -2.257898449897766e-05, -1.1242926120758057e-05, 9.313225746154785e-08, 1.1429190635681152e-05, 2.2765249013900757e-05, 3.410130739212036e-05, 4.5437365770339966e-05, 5.677342414855957e-05, 6.810948252677917e-05, 7.944554090499878e-05, 9.078159928321838e-05, 0.00010211765766143799, 0.00011345371603965759, 0.0001247897744178772, 0.0001361258327960968, 0.0001474618911743164, 0.000158797949552536, 0.00017013400793075562, 0.00018147006630897522, 0.00019280612468719482, 0.00020414218306541443, 0.00021547824144363403, 0.00022681429982185364, 0.00023815035820007324, 0.00024948641657829285, 0.00026082247495651245, 0.00027215853333473206, 0.00028349459171295166, 0.00029483065009117126, 0.00030616670846939087, 0.0003175027668476105, 0.0003288388252258301, 0.0003401748836040497, 0.0003515109419822693, 0.0003628470003604889, 0.0003741830587387085, 0.0003855191171169281, 0.0003968551754951477, 0.0004081912338733673, 0.0004195272922515869, 0.0004308633506298065, 0.0004421994090080261, 0.00045353546738624573, 0.00046487152576446533, 0.00047620758414268494, 0.00048754364252090454, 0.0004988797008991241, 0.0005102157592773438]}, "gradients/decoder.roberta.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 7.0, 4.0, 12.0, 13.0, 35.0, 41.0, 60.0, 216.0, 1482.0, 110616.0, 932190.0, 3250.0, 358.0, 95.0, 44.0, 30.0, 25.0, 14.0, 8.0, 11.0, 9.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.734375, -13.332275390625, -12.93017578125, -12.528076171875, -12.1259765625, -11.723876953125, -11.32177734375, -10.919677734375, -10.517578125, -10.115478515625, -9.71337890625, -9.311279296875, -8.9091796875, -8.507080078125, -8.10498046875, -7.702880859375, -7.30078125, -6.898681640625, -6.49658203125, -6.094482421875, -5.6923828125, -5.290283203125, -4.88818359375, -4.486083984375, -4.083984375, -3.681884765625, -3.27978515625, -2.877685546875, -2.4755859375, -2.073486328125, -1.67138671875, -1.269287109375, -0.8671875, -0.465087890625, -0.06298828125, 0.339111328125, 0.7412109375, 1.143310546875, 1.54541015625, 1.947509765625, 2.349609375, 2.751708984375, 3.15380859375, 3.555908203125, 3.9580078125, 4.360107421875, 4.76220703125, 5.164306640625, 5.56640625, 5.968505859375, 6.37060546875, 6.772705078125, 7.1748046875, 7.576904296875, 7.97900390625, 8.381103515625, 8.783203125, 9.185302734375, 9.58740234375, 9.989501953125, 10.3916015625, 10.793701171875, 11.19580078125, 11.597900390625, 12.0]}, "gradients/decoder.roberta.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 8.0, 8.0, 10.0, 9.0, 24.0, 31.0, 32.0, 47.0, 70.0, 114.0, 144.0, 133.0, 117.0, 67.0, 51.0, 35.0, 31.0, 14.0, 10.0, 7.0, 7.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64111328125, -0.6210861206054688, -0.6010589599609375, -0.5810317993164062, -0.561004638671875, -0.5409774780273438, -0.5209503173828125, -0.5009231567382812, -0.48089599609375, -0.46086883544921875, -0.4408416748046875, -0.42081451416015625, -0.400787353515625, -0.38076019287109375, -0.3607330322265625, -0.34070587158203125, -0.3206787109375, -0.30065155029296875, -0.2806243896484375, -0.26059722900390625, -0.240570068359375, -0.22054290771484375, -0.2005157470703125, -0.18048858642578125, -0.16046142578125, -0.14043426513671875, -0.1204071044921875, -0.10037994384765625, -0.080352783203125, -0.06032562255859375, -0.0402984619140625, -0.02027130126953125, -0.000244140625, 0.01978302001953125, 0.0398101806640625, 0.05983734130859375, 0.079864501953125, 0.09989166259765625, 0.1199188232421875, 0.13994598388671875, 0.15997314453125, 0.18000030517578125, 0.2000274658203125, 0.22005462646484375, 0.240081787109375, 0.26010894775390625, 0.2801361083984375, 0.30016326904296875, 0.3201904296875, 0.34021759033203125, 0.3602447509765625, 0.38027191162109375, 0.400299072265625, 0.42032623291015625, 0.4403533935546875, 0.46038055419921875, 0.48040771484375, 0.5004348754882812, 0.5204620361328125, 0.5404891967773438, 0.560516357421875, 0.5805435180664062, 0.6005706787109375, 0.6205978393554688, 0.640625]}, "gradients/decoder.roberta.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 11.0, 6.0, 19.0, 18.0, 29.0, 35.0, 53.0, 65.0, 76.0, 83.0, 81.0, 90.0, 79.0, 74.0, 73.0, 47.0, 47.0, 36.0, 21.0, 14.0, 17.0, 9.0, 10.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796326160430908, -2.6803855895996094, -2.5644447803497314, -2.4485042095184326, -2.3325634002685547, -2.216622829437256, -2.100682258605957, -1.9847415685653687, -1.8688008785247803, -1.752860188484192, -1.6369194984436035, -1.5209789276123047, -1.4050382375717163, -1.289097547531128, -1.173156976699829, -1.0572162866592407, -0.9412755966186523, -0.825334906578064, -0.7093942761421204, -0.5934536457061768, -0.4775129556655884, -0.361572265625, -0.2456316351890564, -0.1296910047531128, -0.013750314712524414, 0.10219034552574158, 0.21813100576400757, 0.33407166600227356, 0.45001232624053955, 0.5659530162811279, 0.6818936467170715, 0.7978342771530151, 0.9137749671936035, 1.029715657234192, 1.1456563472747803, 1.261596918106079, 1.3775376081466675, 1.4934782981872559, 1.6094188690185547, 1.725359559059143, 1.8413002490997314, 1.9572409391403198, 2.073181629180908, 2.189122200012207, 2.305062770843506, 2.421003580093384, 2.5369441509246826, 2.6528849601745605, 2.7688255310058594, 2.884766101837158, 3.000706911087036, 3.116647481918335, 3.232588291168213, 3.3485288619995117, 3.4644694328308105, 3.5804100036621094, 3.6963508129119873, 3.812291383743286, 3.928232192993164, 4.044172763824463, 4.160113334655762, 4.276054382324219, 4.391994953155518, 4.507935523986816, 4.623876094818115]}, "gradients/decoder.roberta.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 5.0, 3.0, 1.0, 5.0, 8.0, 8.0, 9.0, 13.0, 10.0, 10.0, 21.0, 12.0, 21.0, 27.0, 24.0, 21.0, 29.0, 27.0, 30.0, 36.0, 34.0, 28.0, 32.0, 37.0, 34.0, 36.0, 37.0, 40.0, 50.0, 33.0, 35.0, 31.0, 15.0, 20.0, 31.0, 28.0, 22.0, 20.0, 17.0, 12.0, 16.0, 22.0, 6.0, 8.0, 9.0, 7.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.8642399311065674, -2.7685136795043945, -2.672787666320801, -2.577061414718628, -2.481335163116455, -2.3856089115142822, -2.2898828983306885, -2.1941566467285156, -2.0984303951263428, -2.00270414352417, -1.9069780111312866, -1.8112518787384033, -1.7155256271362305, -1.6197994947433472, -1.5240733623504639, -1.428347110748291, -1.3326209783554077, -1.2368948459625244, -1.1411685943603516, -1.0454424619674683, -0.9497162103652954, -0.8539900779724121, -0.758263885974884, -0.662537693977356, -0.5668115019798279, -0.4710853099822998, -0.37535911798477173, -0.27963295578956604, -0.18390676379203796, -0.08818057179450989, 0.007545590400695801, 0.10327178239822388, 0.19899797439575195, 0.29472416639328003, 0.3904503583908081, 0.4861765205860138, 0.5819027423858643, 0.6776288747787476, 0.7733550667762756, 0.8690812587738037, 0.9648074507713318, 1.0605336427688599, 1.1562597751617432, 1.251986026763916, 1.3477121591567993, 1.4434384107589722, 1.5391645431518555, 1.6348907947540283, 1.7306169271469116, 1.826343059539795, 1.9220693111419678, 2.0177955627441406, 2.1135215759277344, 2.2092478275299072, 2.30497407913208, 2.400700092315674, 2.4964263439178467, 2.5921525955200195, 2.6878786087036133, 2.783604860305786, 2.879331111907959, 2.975057363510132, 3.0707833766937256, 3.1665096282958984, 3.2622358798980713]}, "gradients/decoder.roberta.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 8.0, 8.0, 8.0, 17.0, 19.0, 21.0, 49.0, 40.0, 48.0, 50.0, 64.0, 90.0, 119.0, 145.0, 198.0, 262.0, 418.0, 894.0, 2913.0, 17731.0, 261878.0, 3489522.0, 390482.0, 23207.0, 3487.0, 966.0, 463.0, 292.0, 173.0, 116.0, 116.0, 87.0, 77.0, 56.0, 55.0, 38.0, 51.0, 31.0, 18.0, 16.0, 9.0, 7.0, 7.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.63671875, -7.37835693359375, -7.1199951171875, -6.86163330078125, -6.603271484375, -6.34490966796875, -6.0865478515625, -5.82818603515625, -5.56982421875, -5.31146240234375, -5.0531005859375, -4.79473876953125, -4.536376953125, -4.27801513671875, -4.0196533203125, -3.76129150390625, -3.5029296875, -3.24456787109375, -2.9862060546875, -2.72784423828125, -2.469482421875, -2.21112060546875, -1.9527587890625, -1.69439697265625, -1.43603515625, -1.17767333984375, -0.9193115234375, -0.66094970703125, -0.402587890625, -0.14422607421875, 0.1141357421875, 0.37249755859375, 0.630859375, 0.88922119140625, 1.1475830078125, 1.40594482421875, 1.664306640625, 1.92266845703125, 2.1810302734375, 2.43939208984375, 2.69775390625, 2.95611572265625, 3.2144775390625, 3.47283935546875, 3.731201171875, 3.98956298828125, 4.2479248046875, 4.50628662109375, 4.7646484375, 5.02301025390625, 5.2813720703125, 5.53973388671875, 5.798095703125, 6.05645751953125, 6.3148193359375, 6.57318115234375, 6.83154296875, 7.08990478515625, 7.3482666015625, 7.60662841796875, 7.864990234375, 8.12335205078125, 8.3817138671875, 8.64007568359375, 8.8984375]}, "gradients/decoder.roberta.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 6.0, 7.0, 9.0, 7.0, 11.0, 9.0, 18.0, 17.0, 17.0, 29.0, 22.0, 34.0, 29.0, 24.0, 33.0, 37.0, 39.0, 41.0, 55.0, 35.0, 48.0, 42.0, 48.0, 40.0, 33.0, 31.0, 26.0, 28.0, 28.0, 27.0, 24.0, 23.0, 13.0, 19.0, 18.0, 14.0, 11.0, 9.0, 8.0, 3.0, 9.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.255859375, -2.18109130859375, -2.1063232421875, -2.03155517578125, -1.956787109375, -1.88201904296875, -1.8072509765625, -1.73248291015625, -1.65771484375, -1.58294677734375, -1.5081787109375, -1.43341064453125, -1.358642578125, -1.28387451171875, -1.2091064453125, -1.13433837890625, -1.0595703125, -0.98480224609375, -0.9100341796875, -0.83526611328125, -0.760498046875, -0.68572998046875, -0.6109619140625, -0.53619384765625, -0.46142578125, -0.38665771484375, -0.3118896484375, -0.23712158203125, -0.162353515625, -0.08758544921875, -0.0128173828125, 0.06195068359375, 0.13671875, 0.21148681640625, 0.2862548828125, 0.36102294921875, 0.435791015625, 0.51055908203125, 0.5853271484375, 0.66009521484375, 0.73486328125, 0.80963134765625, 0.8843994140625, 0.95916748046875, 1.033935546875, 1.10870361328125, 1.1834716796875, 1.25823974609375, 1.3330078125, 1.40777587890625, 1.4825439453125, 1.55731201171875, 1.632080078125, 1.70684814453125, 1.7816162109375, 1.85638427734375, 1.93115234375, 2.00592041015625, 2.0806884765625, 2.15545654296875, 2.230224609375, 2.30499267578125, 2.3797607421875, 2.45452880859375, 2.529296875]}, "gradients/decoder.roberta.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 17.0, 26.0, 36.0, 46.0, 73.0, 121.0, 207.0, 459.0, 1562.0, 283637.0, 3903733.0, 3101.0, 558.0, 263.0, 145.0, 86.0, 50.0, 49.0, 28.0, 20.0, 17.0, 8.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.42041015625, -33.2783203125, -32.13623046875, -30.994140625, -29.85205078125, -28.7099609375, -27.56787109375, -26.42578125, -25.28369140625, -24.1416015625, -22.99951171875, -21.857421875, -20.71533203125, -19.5732421875, -18.43115234375, -17.2890625, -16.14697265625, -15.0048828125, -13.86279296875, -12.720703125, -11.57861328125, -10.4365234375, -9.29443359375, -8.15234375, -7.01025390625, -5.8681640625, -4.72607421875, -3.583984375, -2.44189453125, -1.2998046875, -0.15771484375, 0.984375, 2.12646484375, 3.2685546875, 4.41064453125, 5.552734375, 6.69482421875, 7.8369140625, 8.97900390625, 10.12109375, 11.26318359375, 12.4052734375, 13.54736328125, 14.689453125, 15.83154296875, 16.9736328125, 18.11572265625, 19.2578125, 20.39990234375, 21.5419921875, 22.68408203125, 23.826171875, 24.96826171875, 26.1103515625, 27.25244140625, 28.39453125, 29.53662109375, 30.6787109375, 31.82080078125, 32.962890625, 34.10498046875, 35.2470703125, 36.38916015625, 37.53125]}, "gradients/decoder.roberta.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 4.0, 8.0, 17.0, 19.0, 31.0, 38.0, 57.0, 70.0, 126.0, 181.0, 266.0, 434.0, 627.0, 718.0, 530.0, 346.0, 193.0, 127.0, 94.0, 59.0, 37.0, 23.0, 19.0, 11.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.375, -1.32440185546875, -1.2738037109375, -1.22320556640625, -1.172607421875, -1.12200927734375, -1.0714111328125, -1.02081298828125, -0.97021484375, -0.91961669921875, -0.8690185546875, -0.81842041015625, -0.767822265625, -0.71722412109375, -0.6666259765625, -0.61602783203125, -0.5654296875, -0.51483154296875, -0.4642333984375, -0.41363525390625, -0.363037109375, -0.31243896484375, -0.2618408203125, -0.21124267578125, -0.16064453125, -0.11004638671875, -0.0594482421875, -0.00885009765625, 0.041748046875, 0.09234619140625, 0.1429443359375, 0.19354248046875, 0.244140625, 0.29473876953125, 0.3453369140625, 0.39593505859375, 0.446533203125, 0.49713134765625, 0.5477294921875, 0.59832763671875, 0.64892578125, 0.69952392578125, 0.7501220703125, 0.80072021484375, 0.851318359375, 0.90191650390625, 0.9525146484375, 1.00311279296875, 1.0537109375, 1.10430908203125, 1.1549072265625, 1.20550537109375, 1.256103515625, 1.30670166015625, 1.3572998046875, 1.40789794921875, 1.45849609375, 1.50909423828125, 1.5596923828125, 1.61029052734375, 1.660888671875, 1.71148681640625, 1.7620849609375, 1.81268310546875, 1.86328125]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 7.0, 17.0, 20.0, 46.0, 63.0, 87.0, 91.0, 132.0, 136.0, 112.0, 96.0, 66.0, 56.0, 32.0, 15.0, 13.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.446404218673706, -3.283931016921997, -3.121457815170288, -2.958984375, -2.796511173248291, -2.634037971496582, -2.471564769744873, -2.309091567993164, -2.146618366241455, -1.984145164489746, -1.8216718435287476, -1.6591986417770386, -1.49672532081604, -1.334252119064331, -1.171778917312622, -1.0093055963516235, -0.846832275390625, -0.6843590140342712, -0.5218857526779175, -0.3594125509262085, -0.19693928956985474, -0.03446602821350098, 0.128007173538208, 0.29048049449920654, 0.4529536962509155, 0.6154269576072693, 0.777900218963623, 0.940373420715332, 1.102846622467041, 1.2653199434280396, 1.4277931451797485, 1.590266466140747, 1.7527399063110352, 1.9152131080627441, 2.077686309814453, 2.240159511566162, 2.40263295173645, 2.565106153488159, 2.727579355239868, 2.8900527954101562, 3.0525259971618652, 3.214999198913574, 3.377472400665283, 3.539945602416992, 3.7024190425872803, 3.8648922443389893, 4.027365684509277, 4.189838886260986, 4.352312088012695, 4.514785289764404, 4.677258491516113, 4.839731693267822, 5.002204895019531, 5.164678573608398, 5.327151298522949, 5.489624977111816, 5.652097702026367, 5.814570903778076, 5.977044105529785, 6.139517307281494, 6.301990509033203, 6.46446418762207, 6.626936912536621, 6.789410591125488, 6.951883792877197]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 8.0, 15.0, 8.0, 14.0, 24.0, 14.0, 25.0, 28.0, 17.0, 33.0, 31.0, 41.0, 38.0, 41.0, 41.0, 41.0, 48.0, 43.0, 41.0, 39.0, 42.0, 41.0, 34.0, 39.0, 31.0, 33.0, 32.0, 30.0, 30.0, 12.0, 8.0, 14.0, 13.0, 11.0, 11.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.144338846206665, -3.0519158840179443, -2.9594931602478027, -2.867070198059082, -2.7746472358703613, -2.6822245121002197, -2.589801549911499, -2.4973788261413574, -2.4049558639526367, -2.312532901763916, -2.2201101779937744, -2.1276872158050537, -2.035264492034912, -1.9428415298461914, -1.8504185676574707, -1.7579957246780396, -1.6655728816986084, -1.5731500387191772, -1.480727195739746, -1.3883042335510254, -1.2958813905715942, -1.203458547592163, -1.1110355854034424, -1.0186127424240112, -0.9261898994445801, -0.8337670564651489, -0.741344153881073, -0.6489212512969971, -0.5564984083175659, -0.4640755355358124, -0.37165266275405884, -0.2792297601699829, -0.18680691719055176, -0.09438404440879822, -0.0019611716270446777, 0.09046170115470886, 0.1828845739364624, 0.27530744671821594, 0.3677303194999695, 0.4601532220840454, 0.5525760650634766, 0.6449989080429077, 0.7374218106269836, 0.8298447132110596, 0.9222675561904907, 1.0146903991699219, 1.1071133613586426, 1.1995362043380737, 1.2919590473175049, 1.384381890296936, 1.4768047332763672, 1.569227695465088, 1.661650538444519, 1.7540733814239502, 1.846496343612671, 1.938919186592102, 2.031342029571533, 2.123764991760254, 2.2161877155303955, 2.308610677719116, 2.401033401489258, 2.4934563636779785, 2.585879325866699, 2.67830228805542, 2.7707250118255615]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 12.0, 16.0, 20.0, 43.0, 54.0, 77.0, 115.0, 176.0, 247.0, 360.0, 606.0, 793.0, 1289.0, 2080.0, 3085.0, 4878.0, 7971.0, 12936.0, 21542.0, 36787.0, 65339.0, 122146.0, 213446.0, 231987.0, 141978.0, 75785.0, 42065.0, 23952.0, 14363.0, 8763.0, 5517.0, 3445.0, 2303.0, 1457.0, 984.0, 669.0, 433.0, 301.0, 183.0, 133.0, 73.0, 48.0, 33.0, 20.0, 21.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4543952941894531, -0.43930816650390625, -0.4242210388183594, -0.4091339111328125, -0.3940467834472656, -0.37895965576171875, -0.3638725280761719, -0.348785400390625, -0.3336982727050781, -0.31861114501953125, -0.3035240173339844, -0.2884368896484375, -0.2733497619628906, -0.25826263427734375, -0.24317550659179688, -0.22808837890625, -0.21300125122070312, -0.19791412353515625, -0.18282699584960938, -0.1677398681640625, -0.15265274047851562, -0.13756561279296875, -0.12247848510742188, -0.107391357421875, -0.09230422973632812, -0.07721710205078125, -0.062129974365234375, -0.0470428466796875, -0.031955718994140625, -0.01686859130859375, -0.001781463623046875, 0.0133056640625, 0.028392791748046875, 0.04347991943359375, 0.058567047119140625, 0.0736541748046875, 0.08874130249023438, 0.10382843017578125, 0.11891555786132812, 0.134002685546875, 0.14908981323242188, 0.16417694091796875, 0.17926406860351562, 0.1943511962890625, 0.20943832397460938, 0.22452545166015625, 0.23961257934570312, 0.25469970703125, 0.2697868347167969, 0.28487396240234375, 0.2999610900878906, 0.3150482177734375, 0.3301353454589844, 0.34522247314453125, 0.3603096008300781, 0.375396728515625, 0.3904838562011719, 0.40557098388671875, 0.4206581115722656, 0.4357452392578125, 0.4508323669433594, 0.46591949462890625, 0.4810066223144531, 0.49609375]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 8.0, 16.0, 7.0, 16.0, 21.0, 15.0, 25.0, 28.0, 16.0, 35.0, 31.0, 40.0, 38.0, 43.0, 37.0, 47.0, 45.0, 45.0, 34.0, 43.0, 43.0, 39.0, 34.0, 40.0, 30.0, 34.0, 35.0, 28.0, 30.0, 10.0, 9.0, 15.0, 12.0, 12.0, 10.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.138671875, -3.047882080078125, -2.95709228515625, -2.866302490234375, -2.7755126953125, -2.684722900390625, -2.59393310546875, -2.503143310546875, -2.412353515625, -2.321563720703125, -2.23077392578125, -2.139984130859375, -2.0491943359375, -1.958404541015625, -1.86761474609375, -1.776824951171875, -1.68603515625, -1.595245361328125, -1.50445556640625, -1.413665771484375, -1.3228759765625, -1.232086181640625, -1.14129638671875, -1.050506591796875, -0.959716796875, -0.868927001953125, -0.77813720703125, -0.687347412109375, -0.5965576171875, -0.505767822265625, -0.41497802734375, -0.324188232421875, -0.2333984375, -0.142608642578125, -0.05181884765625, 0.038970947265625, 0.1297607421875, 0.220550537109375, 0.31134033203125, 0.402130126953125, 0.492919921875, 0.583709716796875, 0.67449951171875, 0.765289306640625, 0.8560791015625, 0.946868896484375, 1.03765869140625, 1.128448486328125, 1.21923828125, 1.310028076171875, 1.40081787109375, 1.491607666015625, 1.5823974609375, 1.673187255859375, 1.76397705078125, 1.854766845703125, 1.945556640625, 2.036346435546875, 2.12713623046875, 2.217926025390625, 2.3087158203125, 2.399505615234375, 2.49029541015625, 2.581085205078125, 2.671875]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 17.0, 12.0, 17.0, 23.0, 31.0, 31.0, 45.0, 84.0, 105.0, 158.0, 205.0, 310.0, 415.0, 833.0, 1269.0, 2599.0, 6378.0, 19977.0, 99095.0, 882223.0, 21577.0, 6704.0, 2783.0, 1346.0, 788.0, 459.0, 329.0, 209.0, 143.0, 102.0, 78.0, 38.0, 41.0, 33.0, 27.0, 16.0, 14.0, 11.0, 5.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5986328125, -1.5471038818359375, -1.495574951171875, -1.4440460205078125, -1.39251708984375, -1.3409881591796875, -1.289459228515625, -1.2379302978515625, -1.1864013671875, -1.1348724365234375, -1.083343505859375, -1.0318145751953125, -0.98028564453125, -0.9287567138671875, -0.877227783203125, -0.8256988525390625, -0.774169921875, -0.7226409912109375, -0.671112060546875, -0.6195831298828125, -0.56805419921875, -0.5165252685546875, -0.464996337890625, -0.4134674072265625, -0.3619384765625, -0.3104095458984375, -0.258880615234375, -0.2073516845703125, -0.15582275390625, -0.1042938232421875, -0.052764892578125, -0.0012359619140625, 0.05029296875, 0.1018218994140625, 0.153350830078125, 0.2048797607421875, 0.25640869140625, 0.3079376220703125, 0.359466552734375, 0.4109954833984375, 0.4625244140625, 0.5140533447265625, 0.565582275390625, 0.6171112060546875, 0.66864013671875, 0.7201690673828125, 0.771697998046875, 0.8232269287109375, 0.874755859375, 0.9262847900390625, 0.977813720703125, 1.0293426513671875, 1.08087158203125, 1.1324005126953125, 1.183929443359375, 1.2354583740234375, 1.2869873046875, 1.3385162353515625, 1.390045166015625, 1.4415740966796875, 1.49310302734375, 1.5446319580078125, 1.596160888671875, 1.6476898193359375, 1.69921875]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 4.0, 8.0, 10.0, 10.0, 14.0, 21.0, 18.0, 17.0, 18.0, 22.0, 28.0, 34.0, 31.0, 39.0, 31.0, 38.0, 43.0, 46.0, 35.0, 44.0, 34.0, 26.0, 38.0, 28.0, 39.0, 27.0, 25.0, 37.0, 25.0, 33.0, 24.0, 17.0, 12.0, 13.0, 14.0, 14.0, 16.0, 9.0, 14.0, 6.0, 9.0, 7.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.7587890625, -1.709320068359375, -1.65985107421875, -1.610382080078125, -1.5609130859375, -1.511444091796875, -1.46197509765625, -1.412506103515625, -1.363037109375, -1.313568115234375, -1.26409912109375, -1.214630126953125, -1.1651611328125, -1.115692138671875, -1.06622314453125, -1.016754150390625, -0.96728515625, -0.917816162109375, -0.86834716796875, -0.818878173828125, -0.7694091796875, -0.719940185546875, -0.67047119140625, -0.621002197265625, -0.571533203125, -0.522064208984375, -0.47259521484375, -0.423126220703125, -0.3736572265625, -0.324188232421875, -0.27471923828125, -0.225250244140625, -0.17578125, -0.126312255859375, -0.07684326171875, -0.027374267578125, 0.0220947265625, 0.071563720703125, 0.12103271484375, 0.170501708984375, 0.219970703125, 0.269439697265625, 0.31890869140625, 0.368377685546875, 0.4178466796875, 0.467315673828125, 0.51678466796875, 0.566253662109375, 0.61572265625, 0.665191650390625, 0.71466064453125, 0.764129638671875, 0.8135986328125, 0.863067626953125, 0.91253662109375, 0.962005615234375, 1.011474609375, 1.060943603515625, 1.11041259765625, 1.159881591796875, 1.2093505859375, 1.258819580078125, 1.30828857421875, 1.357757568359375, 1.4072265625]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 5.0, 3.0, 11.0, 15.0, 24.0, 25.0, 29.0, 47.0, 62.0, 64.0, 89.0, 171.0, 233.0, 381.0, 610.0, 1093.0, 2092.0, 4530.0, 13273.0, 78338.0, 918845.0, 17525.0, 5445.0, 2422.0, 1250.0, 651.0, 402.0, 274.0, 189.0, 141.0, 87.0, 43.0, 43.0, 42.0, 33.0, 14.0, 8.0, 6.0, 10.0, 8.0, 6.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.2255859375, -0.21897125244140625, -0.2123565673828125, -0.20574188232421875, -0.199127197265625, -0.19251251220703125, -0.1858978271484375, -0.17928314208984375, -0.17266845703125, -0.16605377197265625, -0.1594390869140625, -0.15282440185546875, -0.146209716796875, -0.13959503173828125, -0.1329803466796875, -0.12636566162109375, -0.1197509765625, -0.11313629150390625, -0.1065216064453125, -0.09990692138671875, -0.093292236328125, -0.08667755126953125, -0.0800628662109375, -0.07344818115234375, -0.06683349609375, -0.06021881103515625, -0.0536041259765625, -0.04698944091796875, -0.040374755859375, -0.03376007080078125, -0.0271453857421875, -0.02053070068359375, -0.013916015625, -0.00730133056640625, -0.0006866455078125, 0.00592803955078125, 0.012542724609375, 0.01915740966796875, 0.0257720947265625, 0.03238677978515625, 0.03900146484375, 0.04561614990234375, 0.0522308349609375, 0.05884552001953125, 0.065460205078125, 0.07207489013671875, 0.0786895751953125, 0.08530426025390625, 0.0919189453125, 0.09853363037109375, 0.1051483154296875, 0.11176300048828125, 0.118377685546875, 0.12499237060546875, 0.1316070556640625, 0.13822174072265625, 0.14483642578125, 0.15145111083984375, 0.1580657958984375, 0.16468048095703125, 0.171295166015625, 0.17790985107421875, 0.1845245361328125, 0.19113922119140625, 0.19775390625]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 12.0, 19.0, 21.0, 33.0, 26.0, 37.0, 53.0, 62.0, 79.0, 76.0, 80.0, 88.0, 75.0, 65.0, 57.0, 64.0, 25.0, 27.0, 26.0, 17.0, 9.0, 10.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.398822784423828e-05, -4.264805465936661e-05, -4.1307881474494934e-05, -3.996770828962326e-05, -3.862753510475159e-05, -3.728736191987991e-05, -3.594718873500824e-05, -3.4607015550136566e-05, -3.326684236526489e-05, -3.192666918039322e-05, -3.0586495995521545e-05, -2.9246322810649872e-05, -2.7906149625778198e-05, -2.6565976440906525e-05, -2.522580325603485e-05, -2.3885630071163177e-05, -2.2545456886291504e-05, -2.120528370141983e-05, -1.9865110516548157e-05, -1.8524937331676483e-05, -1.718476414680481e-05, -1.5844590961933136e-05, -1.4504417777061462e-05, -1.3164244592189789e-05, -1.1824071407318115e-05, -1.0483898222446442e-05, -9.143725037574768e-06, -7.803551852703094e-06, -6.463378667831421e-06, -5.123205482959747e-06, -3.7830322980880737e-06, -2.4428591132164e-06, -1.1026859283447266e-06, 2.3748725652694702e-07, 1.5776604413986206e-06, 2.917833626270294e-06, 4.258006811141968e-06, 5.598179996013641e-06, 6.938353180885315e-06, 8.278526365756989e-06, 9.618699550628662e-06, 1.0958872735500336e-05, 1.229904592037201e-05, 1.3639219105243683e-05, 1.4979392290115356e-05, 1.631956547498703e-05, 1.7659738659858704e-05, 1.8999911844730377e-05, 2.034008502960205e-05, 2.1680258214473724e-05, 2.3020431399345398e-05, 2.436060458421707e-05, 2.5700777769088745e-05, 2.704095095396042e-05, 2.8381124138832092e-05, 2.9721297323703766e-05, 3.106147050857544e-05, 3.240164369344711e-05, 3.374181687831879e-05, 3.508199006319046e-05, 3.6422163248062134e-05, 3.776233643293381e-05, 3.910250961780548e-05, 4.0442682802677155e-05, 4.178285598754883e-05]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 7.0, 4.0, 4.0, 6.0, 9.0, 12.0, 11.0, 15.0, 18.0, 24.0, 41.0, 66.0, 103.0, 298.0, 3618.0, 901381.0, 141132.0, 1316.0, 209.0, 86.0, 52.0, 33.0, 20.0, 33.0, 15.0, 7.0, 6.0, 7.0, 5.0, 2.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.601715087890625, -0.58282470703125, -0.563934326171875, -0.5450439453125, -0.526153564453125, -0.50726318359375, -0.488372802734375, -0.469482421875, -0.450592041015625, -0.43170166015625, -0.412811279296875, -0.3939208984375, -0.375030517578125, -0.35614013671875, -0.337249755859375, -0.318359375, -0.299468994140625, -0.28057861328125, -0.261688232421875, -0.2427978515625, -0.223907470703125, -0.20501708984375, -0.186126708984375, -0.167236328125, -0.148345947265625, -0.12945556640625, -0.110565185546875, -0.0916748046875, -0.072784423828125, -0.05389404296875, -0.035003662109375, -0.01611328125, 0.002777099609375, 0.02166748046875, 0.040557861328125, 0.0594482421875, 0.078338623046875, 0.09722900390625, 0.116119384765625, 0.135009765625, 0.153900146484375, 0.17279052734375, 0.191680908203125, 0.2105712890625, 0.229461669921875, 0.24835205078125, 0.267242431640625, 0.2861328125, 0.305023193359375, 0.32391357421875, 0.342803955078125, 0.3616943359375, 0.380584716796875, 0.39947509765625, 0.418365478515625, 0.437255859375, 0.456146240234375, 0.47503662109375, 0.493927001953125, 0.5128173828125, 0.531707763671875, 0.55059814453125, 0.569488525390625, 0.58837890625]}, "gradients/decoder.roberta.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 8.0, 10.0, 22.0, 18.0, 25.0, 23.0, 44.0, 48.0, 71.0, 113.0, 155.0, 129.0, 88.0, 44.0, 32.0, 33.0, 27.0, 20.0, 20.0, 9.0, 12.0, 5.0, 3.0, 10.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.032562255859375, -0.03159189224243164, -0.03062152862548828, -0.029651165008544922, -0.028680801391601562, -0.027710437774658203, -0.026740074157714844, -0.025769710540771484, -0.024799346923828125, -0.023828983306884766, -0.022858619689941406, -0.021888256072998047, -0.020917892456054688, -0.019947528839111328, -0.01897716522216797, -0.01800680160522461, -0.01703643798828125, -0.01606607437133789, -0.015095710754394531, -0.014125347137451172, -0.013154983520507812, -0.012184619903564453, -0.011214256286621094, -0.010243892669677734, -0.009273529052734375, -0.008303165435791016, -0.007332801818847656, -0.006362438201904297, -0.0053920745849609375, -0.004421710968017578, -0.0034513473510742188, -0.0024809837341308594, -0.0015106201171875, -0.0005402565002441406, 0.00043010711669921875, 0.0014004707336425781, 0.0023708343505859375, 0.003341197967529297, 0.004311561584472656, 0.005281925201416016, 0.006252288818359375, 0.007222652435302734, 0.008193016052246094, 0.009163379669189453, 0.010133743286132812, 0.011104106903076172, 0.012074470520019531, 0.01304483413696289, 0.01401519775390625, 0.01498556137084961, 0.01595592498779297, 0.016926288604736328, 0.017896652221679688, 0.018867015838623047, 0.019837379455566406, 0.020807743072509766, 0.021778106689453125, 0.022748470306396484, 0.023718833923339844, 0.024689197540283203, 0.025659561157226562, 0.026629924774169922, 0.02760028839111328, 0.02857065200805664, 0.029541015625]}, "gradients/decoder.roberta.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 10.0, 24.0, 45.0, 54.0, 99.0, 109.0, 153.0, 149.0, 109.0, 100.0, 71.0, 35.0, 19.0, 15.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.880477428436279, -5.697067737579346, -5.513658046722412, -5.3302483558654785, -5.146838188171387, -4.963428497314453, -4.7800188064575195, -4.596609115600586, -4.413199424743652, -4.229789733886719, -4.046380043029785, -3.8629701137542725, -3.679560422897339, -3.4961507320404053, -3.3127408027648926, -3.129331111907959, -2.9459214210510254, -2.762511730194092, -2.579102039337158, -2.3956921100616455, -2.212282419204712, -2.0288727283477783, -1.8454629182815552, -1.662053108215332, -1.4786434173583984, -1.2952337265014648, -1.1118239164352417, -0.9284141659736633, -0.745004415512085, -0.5615946650505066, -0.3781849145889282, -0.19477510452270508, -0.011365413665771484, 0.17204433679580688, 0.35545408725738525, 0.5388638377189636, 0.722273588180542, 0.9056833386421204, 1.0890930891036987, 1.2725028991699219, 1.4559125900268555, 1.639322280883789, 1.8227320909500122, 2.0061419010162354, 2.189551591873169, 2.3729612827301025, 2.5563712120056152, 2.739780902862549, 2.9231905937194824, 3.106600284576416, 3.2900099754333496, 3.4734199047088623, 3.656829595565796, 3.8402392864227295, 4.023649215698242, 4.207058906555176, 4.390468597412109, 4.573878288269043, 4.757287979125977, 4.94069766998291, 5.124107360839844, 5.3075175285339355, 5.490927219390869, 5.674336910247803, 5.857746601104736]}, "gradients/decoder.roberta.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 9.0, 13.0, 8.0, 15.0, 23.0, 14.0, 26.0, 27.0, 16.0, 35.0, 31.0, 39.0, 38.0, 43.0, 37.0, 46.0, 47.0, 44.0, 35.0, 43.0, 39.0, 41.0, 35.0, 40.0, 31.0, 34.0, 33.0, 29.0, 31.0, 11.0, 10.0, 14.0, 12.0, 12.0, 10.0, 6.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.1424784660339355, -3.051708936691284, -2.960939645767212, -2.8701701164245605, -2.7794008255004883, -2.688631296157837, -2.5978617668151855, -2.5070924758911133, -2.416322946548462, -2.3255534172058105, -2.2347841262817383, -2.144014596939087, -2.0532450675964355, -1.9624757766723633, -1.871706247329712, -1.78093683719635, -1.6901674270629883, -1.5993980169296265, -1.5086286067962646, -1.4178590774536133, -1.3270896673202515, -1.2363202571868896, -1.1455507278442383, -1.0547813177108765, -0.9640119075775146, -0.8732424974441528, -0.7824730277061462, -0.6917035579681396, -0.6009341478347778, -0.510164737701416, -0.4193952679634094, -0.32862579822540283, -0.23785638809204102, -0.1470869481563568, -0.05631750822067261, 0.0344519317150116, 0.1252213716506958, 0.21599081158638, 0.3067602515220642, 0.3975297212600708, 0.4882991313934326, 0.5790685415267944, 0.669838011264801, 0.7606074810028076, 0.8513768911361694, 0.9421463012695312, 1.0329158306121826, 1.1236852407455444, 1.2144546508789062, 1.305224061012268, 1.3959934711456299, 1.4867630004882812, 1.577532410621643, 1.6683018207550049, 1.7590713500976562, 1.849840760231018, 1.9406101703643799, 2.0313796997070312, 2.1221489906311035, 2.212918519973755, 2.3036880493164062, 2.3944573402404785, 2.48522686958313, 2.5759963989257812, 2.6667656898498535]}, "gradients/decoder.roberta.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 3.0, 3.0, 5.0, 8.0, 16.0, 14.0, 26.0, 34.0, 37.0, 69.0, 104.0, 171.0, 301.0, 668.0, 1420.0, 3487.0, 8847.0, 24161.0, 69007.0, 210408.0, 456619.0, 179274.0, 59487.0, 21097.0, 7614.0, 2990.0, 1303.0, 596.0, 282.0, 189.0, 100.0, 67.0, 41.0, 26.0, 25.0, 12.0, 17.0, 4.0, 7.0, 6.0, 3.0, 1.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.125, -4.008575439453125, -3.89215087890625, -3.775726318359375, -3.6593017578125, -3.542877197265625, -3.42645263671875, -3.310028076171875, -3.193603515625, -3.077178955078125, -2.96075439453125, -2.844329833984375, -2.7279052734375, -2.611480712890625, -2.49505615234375, -2.378631591796875, -2.26220703125, -2.145782470703125, -2.02935791015625, -1.912933349609375, -1.7965087890625, -1.680084228515625, -1.56365966796875, -1.447235107421875, -1.330810546875, -1.214385986328125, -1.09796142578125, -0.981536865234375, -0.8651123046875, -0.748687744140625, -0.63226318359375, -0.515838623046875, -0.3994140625, -0.282989501953125, -0.16656494140625, -0.050140380859375, 0.0662841796875, 0.182708740234375, 0.29913330078125, 0.415557861328125, 0.531982421875, 0.648406982421875, 0.76483154296875, 0.881256103515625, 0.9976806640625, 1.114105224609375, 1.23052978515625, 1.346954345703125, 1.46337890625, 1.579803466796875, 1.69622802734375, 1.812652587890625, 1.9290771484375, 2.045501708984375, 2.16192626953125, 2.278350830078125, 2.394775390625, 2.511199951171875, 2.62762451171875, 2.744049072265625, 2.8604736328125, 2.976898193359375, 3.09332275390625, 3.209747314453125, 3.326171875]}, "gradients/decoder.roberta.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 11.0, 10.0, 13.0, 19.0, 21.0, 22.0, 25.0, 21.0, 31.0, 31.0, 41.0, 38.0, 37.0, 40.0, 54.0, 44.0, 36.0, 46.0, 36.0, 42.0, 41.0, 49.0, 40.0, 29.0, 32.0, 34.0, 27.0, 29.0, 13.0, 10.0, 14.0, 12.0, 12.0, 6.0, 8.0, 3.0, 4.0, 1.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.330078125, -3.2366943359375, -3.143310546875, -3.0499267578125, -2.95654296875, -2.8631591796875, -2.769775390625, -2.6763916015625, -2.5830078125, -2.4896240234375, -2.396240234375, -2.3028564453125, -2.20947265625, -2.1160888671875, -2.022705078125, -1.9293212890625, -1.8359375, -1.7425537109375, -1.649169921875, -1.5557861328125, -1.46240234375, -1.3690185546875, -1.275634765625, -1.1822509765625, -1.0888671875, -0.9954833984375, -0.902099609375, -0.8087158203125, -0.71533203125, -0.6219482421875, -0.528564453125, -0.4351806640625, -0.341796875, -0.2484130859375, -0.155029296875, -0.0616455078125, 0.03173828125, 0.1251220703125, 0.218505859375, 0.3118896484375, 0.4052734375, 0.4986572265625, 0.592041015625, 0.6854248046875, 0.77880859375, 0.8721923828125, 0.965576171875, 1.0589599609375, 1.15234375, 1.2457275390625, 1.339111328125, 1.4324951171875, 1.52587890625, 1.6192626953125, 1.712646484375, 1.8060302734375, 1.8994140625, 1.9927978515625, 2.086181640625, 2.1795654296875, 2.27294921875, 2.3663330078125, 2.459716796875, 2.5531005859375, 2.646484375]}, "gradients/decoder.roberta.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 13.0, 5.0, 12.0, 5.0, 9.0, 22.0, 19.0, 18.0, 26.0, 35.0, 42.0, 63.0, 55.0, 68.0, 98.0, 125.0, 129.0, 329.0, 1045171.0, 1500.0, 171.0, 129.0, 107.0, 87.0, 49.0, 49.0, 37.0, 43.0, 23.0, 23.0, 16.0, 20.0, 11.0, 8.0, 9.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.1875, -81.5322265625, -78.876953125, -76.2216796875, -73.56640625, -70.9111328125, -68.255859375, -65.6005859375, -62.9453125, -60.2900390625, -57.634765625, -54.9794921875, -52.32421875, -49.6689453125, -47.013671875, -44.3583984375, -41.703125, -39.0478515625, -36.392578125, -33.7373046875, -31.08203125, -28.4267578125, -25.771484375, -23.1162109375, -20.4609375, -17.8056640625, -15.150390625, -12.4951171875, -9.83984375, -7.1845703125, -4.529296875, -1.8740234375, 0.78125, 3.4365234375, 6.091796875, 8.7470703125, 11.40234375, 14.0576171875, 16.712890625, 19.3681640625, 22.0234375, 24.6787109375, 27.333984375, 29.9892578125, 32.64453125, 35.2998046875, 37.955078125, 40.6103515625, 43.265625, 45.9208984375, 48.576171875, 51.2314453125, 53.88671875, 56.5419921875, 59.197265625, 61.8525390625, 64.5078125, 67.1630859375, 69.818359375, 72.4736328125, 75.12890625, 77.7841796875, 80.439453125, 83.0947265625, 85.75]}, "gradients/decoder.roberta.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 0.0, 3.0, 5.0, 4.0, 3.0, 10.0, 7.0, 14.0, 13.0, 16.0, 15.0, 26.0, 28.0, 36.0, 27.0, 46.0, 35.0, 32.0, 52.0, 48.0, 40.0, 54.0, 47.0, 36.0, 42.0, 34.0, 31.0, 41.0, 45.0, 37.0, 26.0, 35.0, 16.0, 21.0, 22.0, 6.0, 11.0, 10.0, 6.0, 14.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.310546875, -3.212493896484375, -3.11444091796875, -3.016387939453125, -2.9183349609375, -2.820281982421875, -2.72222900390625, -2.624176025390625, -2.526123046875, -2.428070068359375, -2.33001708984375, -2.231964111328125, -2.1339111328125, -2.035858154296875, -1.93780517578125, -1.839752197265625, -1.74169921875, -1.643646240234375, -1.54559326171875, -1.447540283203125, -1.3494873046875, -1.251434326171875, -1.15338134765625, -1.055328369140625, -0.957275390625, -0.859222412109375, -0.76116943359375, -0.663116455078125, -0.5650634765625, -0.467010498046875, -0.36895751953125, -0.270904541015625, -0.1728515625, -0.074798583984375, 0.02325439453125, 0.121307373046875, 0.2193603515625, 0.317413330078125, 0.41546630859375, 0.513519287109375, 0.611572265625, 0.709625244140625, 0.80767822265625, 0.905731201171875, 1.0037841796875, 1.101837158203125, 1.19989013671875, 1.297943115234375, 1.39599609375, 1.494049072265625, 1.59210205078125, 1.690155029296875, 1.7882080078125, 1.886260986328125, 1.98431396484375, 2.082366943359375, 2.180419921875, 2.278472900390625, 2.37652587890625, 2.474578857421875, 2.5726318359375, 2.670684814453125, 2.76873779296875, 2.866790771484375, 2.96484375]}, "gradients/decoder.roberta.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 5.0, 11.0, 23.0, 40.0, 159.0, 493.0, 2043.0, 132120.0, 907334.0, 5277.0, 714.0, 217.0, 78.0, 19.0, 14.0, 5.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.71484375, -7.39581298828125, -7.0767822265625, -6.75775146484375, -6.438720703125, -6.11968994140625, -5.8006591796875, -5.48162841796875, -5.16259765625, -4.84356689453125, -4.5245361328125, -4.20550537109375, -3.886474609375, -3.56744384765625, -3.2484130859375, -2.92938232421875, -2.6103515625, -2.29132080078125, -1.9722900390625, -1.65325927734375, -1.334228515625, -1.01519775390625, -0.6961669921875, -0.37713623046875, -0.05810546875, 0.26092529296875, 0.5799560546875, 0.89898681640625, 1.218017578125, 1.53704833984375, 1.8560791015625, 2.17510986328125, 2.494140625, 2.81317138671875, 3.1322021484375, 3.45123291015625, 3.770263671875, 4.08929443359375, 4.4083251953125, 4.72735595703125, 5.04638671875, 5.36541748046875, 5.6844482421875, 6.00347900390625, 6.322509765625, 6.64154052734375, 6.9605712890625, 7.27960205078125, 7.5986328125, 7.91766357421875, 8.2366943359375, 8.55572509765625, 8.874755859375, 9.19378662109375, 9.5128173828125, 9.83184814453125, 10.15087890625, 10.46990966796875, 10.7889404296875, 11.10797119140625, 11.427001953125, 11.74603271484375, 12.0650634765625, 12.38409423828125, 12.703125]}, "gradients/decoder.roberta.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 8.0, 5.0, 17.0, 23.0, 29.0, 55.0, 74.0, 96.0, 199.0, 183.0, 98.0, 75.0, 51.0, 32.0, 30.0, 10.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00024437904357910156, -0.00023375079035758972, -0.00022312253713607788, -0.00021249428391456604, -0.0002018660306930542, -0.00019123777747154236, -0.00018060952425003052, -0.00016998127102851868, -0.00015935301780700684, -0.000148724764585495, -0.00013809651136398315, -0.0001274682581424713, -0.00011684000492095947, -0.00010621175169944763, -9.558349847793579e-05, -8.495524525642395e-05, -7.432699203491211e-05, -6.369873881340027e-05, -5.307048559188843e-05, -4.244223237037659e-05, -3.1813979148864746e-05, -2.1185725927352905e-05, -1.0557472705841064e-05, 7.078051567077637e-08, 1.0699033737182617e-05, 2.1327286958694458e-05, 3.19555401802063e-05, 4.258379340171814e-05, 5.321204662322998e-05, 6.384029984474182e-05, 7.446855306625366e-05, 8.50968062877655e-05, 9.572505950927734e-05, 0.00010635331273078918, 0.00011698156595230103, 0.00012760981917381287, 0.0001382380723953247, 0.00014886632561683655, 0.0001594945788383484, 0.00017012283205986023, 0.00018075108528137207, 0.0001913793385028839, 0.00020200759172439575, 0.0002126358449459076, 0.00022326409816741943, 0.00023389235138893127, 0.0002445206046104431, 0.00025514885783195496, 0.0002657771110534668, 0.00027640536427497864, 0.0002870336174964905, 0.0002976618707180023, 0.00030829012393951416, 0.000318918377161026, 0.00032954663038253784, 0.0003401748836040497, 0.0003508031368255615, 0.00036143139004707336, 0.0003720596432685852, 0.00038268789649009705, 0.0003933161497116089, 0.00040394440293312073, 0.00041457265615463257, 0.0004252009093761444, 0.00043582916259765625]}, "gradients/decoder.roberta.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 22.0, 24.0, 89.0, 537.0, 1029004.0, 18543.0, 200.0, 61.0, 32.0, 17.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.3125, -23.3330078125, -22.353515625, -21.3740234375, -20.39453125, -19.4150390625, -18.435546875, -17.4560546875, -16.4765625, -15.4970703125, -14.517578125, -13.5380859375, -12.55859375, -11.5791015625, -10.599609375, -9.6201171875, -8.640625, -7.6611328125, -6.681640625, -5.7021484375, -4.72265625, -3.7431640625, -2.763671875, -1.7841796875, -0.8046875, 0.1748046875, 1.154296875, 2.1337890625, 3.11328125, 4.0927734375, 5.072265625, 6.0517578125, 7.03125, 8.0107421875, 8.990234375, 9.9697265625, 10.94921875, 11.9287109375, 12.908203125, 13.8876953125, 14.8671875, 15.8466796875, 16.826171875, 17.8056640625, 18.78515625, 19.7646484375, 20.744140625, 21.7236328125, 22.703125, 23.6826171875, 24.662109375, 25.6416015625, 26.62109375, 27.6005859375, 28.580078125, 29.5595703125, 30.5390625, 31.5185546875, 32.498046875, 33.4775390625, 34.45703125, 35.4365234375, 36.416015625, 37.3955078125, 38.375]}, "gradients/decoder.roberta.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 10.0, 18.0, 34.0, 80.0, 136.0, 331.0, 207.0, 99.0, 42.0, 18.0, 16.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.775360107421875, -1.72943115234375, -1.683502197265625, -1.6375732421875, -1.591644287109375, -1.54571533203125, -1.499786376953125, -1.453857421875, -1.407928466796875, -1.36199951171875, -1.316070556640625, -1.2701416015625, -1.224212646484375, -1.17828369140625, -1.132354736328125, -1.08642578125, -1.040496826171875, -0.99456787109375, -0.948638916015625, -0.9027099609375, -0.856781005859375, -0.81085205078125, -0.764923095703125, -0.718994140625, -0.673065185546875, -0.62713623046875, -0.581207275390625, -0.5352783203125, -0.489349365234375, -0.44342041015625, -0.397491455078125, -0.3515625, -0.305633544921875, -0.25970458984375, -0.213775634765625, -0.1678466796875, -0.121917724609375, -0.07598876953125, -0.030059814453125, 0.015869140625, 0.061798095703125, 0.10772705078125, 0.153656005859375, 0.1995849609375, 0.245513916015625, 0.29144287109375, 0.337371826171875, 0.38330078125, 0.429229736328125, 0.47515869140625, 0.521087646484375, 0.5670166015625, 0.612945556640625, 0.65887451171875, 0.704803466796875, 0.750732421875, 0.796661376953125, 0.84259033203125, 0.888519287109375, 0.9344482421875, 0.980377197265625, 1.02630615234375, 1.072235107421875, 1.1181640625]}, "gradients/decoder.roberta.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 23.0, 32.0, 72.0, 101.0, 124.0, 155.0, 148.0, 131.0, 91.0, 57.0, 38.0, 14.0, 9.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.661076545715332, -10.438068389892578, -10.215060234069824, -9.99205207824707, -9.769043922424316, -9.546035766601562, -9.323027610778809, -9.100019454956055, -8.8770112991333, -8.654003143310547, -8.430994987487793, -8.207986831665039, -7.984978675842285, -7.761970520019531, -7.538962364196777, -7.315954208374023, -7.092946529388428, -6.869938373565674, -6.64693021774292, -6.423922061920166, -6.200913906097412, -5.977905750274658, -5.7548980712890625, -5.531889915466309, -5.308881759643555, -5.085873603820801, -4.862865447998047, -4.639857292175293, -4.416849136352539, -4.193840980529785, -3.9708330631256104, -3.7478249073028564, -3.5248165130615234, -3.3018083572387695, -3.0788002014160156, -2.8557920455932617, -2.632783889770508, -2.409775733947754, -2.186767816543579, -1.9637596607208252, -1.7407515048980713, -1.5177433490753174, -1.2947351932525635, -1.0717271566390991, -0.8487190008163452, -0.6257108449935913, -0.40270280838012695, -0.17969465255737305, 0.04331350326538086, 0.2663216292858124, 0.4893297553062439, 0.712337851524353, 0.9353460073471069, 1.1583541631698608, 1.3813621997833252, 1.604370355606079, 1.827378511428833, 2.050386667251587, 2.273394823074341, 2.4964027404785156, 2.7194108963012695, 2.9424190521240234, 3.1654272079467773, 3.3884353637695312, 3.611443519592285]}, "gradients/decoder.roberta.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 11.0, 12.0, 10.0, 11.0, 16.0, 20.0, 24.0, 21.0, 24.0, 26.0, 33.0, 27.0, 40.0, 41.0, 29.0, 38.0, 36.0, 49.0, 38.0, 39.0, 47.0, 45.0, 38.0, 33.0, 33.0, 34.0, 33.0, 21.0, 15.0, 21.0, 15.0, 25.0, 11.0, 18.0, 7.0, 8.0, 10.0, 8.0, 8.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.382699489593506, -3.266721487045288, -3.1507437229156494, -3.0347657203674316, -2.918787956237793, -2.802809953689575, -2.6868321895599365, -2.5708541870117188, -2.45487642288208, -2.3388984203338623, -2.2229206562042236, -2.106942653656006, -1.9909648895263672, -1.8749868869781494, -1.7590091228485107, -1.643031120300293, -1.5270532369613647, -1.4110753536224365, -1.2950974702835083, -1.17911958694458, -1.0631417036056519, -0.9471637606620789, -0.8311858773231506, -0.7152079939842224, -0.5992301106452942, -0.48325222730636597, -0.36727434396743774, -0.25129643082618713, -0.1353185474872589, -0.0193406343460083, 0.09663724899291992, 0.21261513233184814, 0.32859301567077637, 0.4445708990097046, 0.5605487823486328, 0.676526665687561, 0.7925045490264893, 0.9084824919700623, 1.0244603157043457, 1.1404383182525635, 1.2564160823822021, 1.3723939657211304, 1.4883718490600586, 1.6043497323989868, 1.720327615737915, 1.8363056182861328, 1.9522833824157715, 2.0682613849639893, 2.184239387512207, 2.300217390060425, 2.4161951541900635, 2.5321731567382812, 2.64815092086792, 2.7641289234161377, 2.8801066875457764, 2.996084690093994, 3.112062454223633, 3.2280404567718506, 3.3440182209014893, 3.459996223449707, 3.5759739875793457, 3.6919519901275635, 3.807929754257202, 3.92390775680542, 4.039885520935059]}, "gradients/decoder.roberta.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 10.0, 16.0, 17.0, 27.0, 37.0, 42.0, 68.0, 84.0, 90.0, 109.0, 151.0, 169.0, 253.0, 390.0, 886.0, 2962.0, 20524.0, 424570.0, 3507967.0, 218091.0, 13435.0, 2230.0, 706.0, 361.0, 239.0, 175.0, 129.0, 100.0, 101.0, 67.0, 56.0, 49.0, 40.0, 22.0, 22.0, 23.0, 14.0, 14.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.0, -8.7222900390625, -8.444580078125, -8.1668701171875, -7.88916015625, -7.6114501953125, -7.333740234375, -7.0560302734375, -6.7783203125, -6.5006103515625, -6.222900390625, -5.9451904296875, -5.66748046875, -5.3897705078125, -5.112060546875, -4.8343505859375, -4.556640625, -4.2789306640625, -4.001220703125, -3.7235107421875, -3.44580078125, -3.1680908203125, -2.890380859375, -2.6126708984375, -2.3349609375, -2.0572509765625, -1.779541015625, -1.5018310546875, -1.22412109375, -0.9464111328125, -0.668701171875, -0.3909912109375, -0.11328125, 0.1644287109375, 0.442138671875, 0.7198486328125, 0.99755859375, 1.2752685546875, 1.552978515625, 1.8306884765625, 2.1083984375, 2.3861083984375, 2.663818359375, 2.9415283203125, 3.21923828125, 3.4969482421875, 3.774658203125, 4.0523681640625, 4.330078125, 4.6077880859375, 4.885498046875, 5.1632080078125, 5.44091796875, 5.7186279296875, 5.996337890625, 6.2740478515625, 6.5517578125, 6.8294677734375, 7.107177734375, 7.3848876953125, 7.66259765625, 7.9403076171875, 8.218017578125, 8.4957275390625, 8.7734375]}, "gradients/decoder.roberta.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 7.0, 8.0, 8.0, 15.0, 25.0, 17.0, 20.0, 23.0, 28.0, 27.0, 30.0, 37.0, 40.0, 37.0, 41.0, 36.0, 58.0, 45.0, 52.0, 38.0, 50.0, 42.0, 42.0, 31.0, 39.0, 28.0, 24.0, 23.0, 24.0, 15.0, 18.0, 17.0, 11.0, 11.0, 6.0, 6.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.947265625, -2.85723876953125, -2.7672119140625, -2.67718505859375, -2.587158203125, -2.49713134765625, -2.4071044921875, -2.31707763671875, -2.22705078125, -2.13702392578125, -2.0469970703125, -1.95697021484375, -1.866943359375, -1.77691650390625, -1.6868896484375, -1.59686279296875, -1.5068359375, -1.41680908203125, -1.3267822265625, -1.23675537109375, -1.146728515625, -1.05670166015625, -0.9666748046875, -0.87664794921875, -0.78662109375, -0.69659423828125, -0.6065673828125, -0.51654052734375, -0.426513671875, -0.33648681640625, -0.2464599609375, -0.15643310546875, -0.06640625, 0.02362060546875, 0.1136474609375, 0.20367431640625, 0.293701171875, 0.38372802734375, 0.4737548828125, 0.56378173828125, 0.65380859375, 0.74383544921875, 0.8338623046875, 0.92388916015625, 1.013916015625, 1.10394287109375, 1.1939697265625, 1.28399658203125, 1.3740234375, 1.46405029296875, 1.5540771484375, 1.64410400390625, 1.734130859375, 1.82415771484375, 1.9141845703125, 2.00421142578125, 2.09423828125, 2.18426513671875, 2.2742919921875, 2.36431884765625, 2.454345703125, 2.54437255859375, 2.6343994140625, 2.72442626953125, 2.814453125]}, "gradients/decoder.roberta.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 13.0, 8.0, 20.0, 23.0, 46.0, 77.0, 119.0, 244.0, 485.0, 3275.0, 4091187.0, 96884.0, 1079.0, 334.0, 178.0, 119.0, 59.0, 36.0, 17.0, 22.0, 13.0, 9.0, 8.0, 8.0, 1.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.3681640625, -37.080078125, -35.7919921875, -34.50390625, -33.2158203125, -31.927734375, -30.6396484375, -29.3515625, -28.0634765625, -26.775390625, -25.4873046875, -24.19921875, -22.9111328125, -21.623046875, -20.3349609375, -19.046875, -17.7587890625, -16.470703125, -15.1826171875, -13.89453125, -12.6064453125, -11.318359375, -10.0302734375, -8.7421875, -7.4541015625, -6.166015625, -4.8779296875, -3.58984375, -2.3017578125, -1.013671875, 0.2744140625, 1.5625, 2.8505859375, 4.138671875, 5.4267578125, 6.71484375, 8.0029296875, 9.291015625, 10.5791015625, 11.8671875, 13.1552734375, 14.443359375, 15.7314453125, 17.01953125, 18.3076171875, 19.595703125, 20.8837890625, 22.171875, 23.4599609375, 24.748046875, 26.0361328125, 27.32421875, 28.6123046875, 29.900390625, 31.1884765625, 32.4765625, 33.7646484375, 35.052734375, 36.3408203125, 37.62890625, 38.9169921875, 40.205078125, 41.4931640625, 42.78125]}, "gradients/decoder.roberta.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 5.0, 5.0, 11.0, 10.0, 14.0, 22.0, 30.0, 46.0, 108.0, 127.0, 238.0, 367.0, 627.0, 806.0, 683.0, 390.0, 220.0, 128.0, 90.0, 57.0, 27.0, 15.0, 16.0, 8.0, 9.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9261474609375, -1.866943359375, -1.8077392578125, -1.74853515625, -1.6893310546875, -1.630126953125, -1.5709228515625, -1.51171875, -1.4525146484375, -1.393310546875, -1.3341064453125, -1.27490234375, -1.2156982421875, -1.156494140625, -1.0972900390625, -1.0380859375, -0.9788818359375, -0.919677734375, -0.8604736328125, -0.80126953125, -0.7420654296875, -0.682861328125, -0.6236572265625, -0.564453125, -0.5052490234375, -0.446044921875, -0.3868408203125, -0.32763671875, -0.2684326171875, -0.209228515625, -0.1500244140625, -0.0908203125, -0.0316162109375, 0.027587890625, 0.0867919921875, 0.14599609375, 0.2052001953125, 0.264404296875, 0.3236083984375, 0.3828125, 0.4420166015625, 0.501220703125, 0.5604248046875, 0.61962890625, 0.6788330078125, 0.738037109375, 0.7972412109375, 0.8564453125, 0.9156494140625, 0.974853515625, 1.0340576171875, 1.09326171875, 1.1524658203125, 1.211669921875, 1.2708740234375, 1.330078125, 1.3892822265625, 1.448486328125, 1.5076904296875, 1.56689453125, 1.6260986328125, 1.685302734375, 1.7445068359375, 1.8037109375]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 11.0, 10.0, 14.0, 18.0, 24.0, 31.0, 47.0, 66.0, 65.0, 82.0, 97.0, 78.0, 73.0, 78.0, 74.0, 62.0, 36.0, 36.0, 24.0, 21.0, 14.0, 8.0, 11.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.080933570861816, -3.9749772548675537, -3.869020938873291, -3.7630646228790283, -3.6571083068847656, -3.551151752471924, -3.445195436477661, -3.3392391204833984, -3.2332828044891357, -3.127326488494873, -3.0213701725006104, -2.9154138565063477, -2.809457302093506, -2.7035012245178223, -2.5975446701049805, -2.4915883541107178, -2.385632038116455, -2.2796757221221924, -2.1737194061279297, -2.067763090133667, -1.9618066549301147, -1.855850338935852, -1.7498939037322998, -1.643937587738037, -1.5379812717437744, -1.4320249557495117, -1.326068639755249, -1.2201122045516968, -1.114155888557434, -1.0081995725631714, -0.9022431969642639, -0.7962868213653564, -0.6903302669525146, -0.584373950958252, -0.4784175753593445, -0.3724612295627594, -0.2665048837661743, -0.16054856777191162, -0.05459219217300415, 0.05136418342590332, 0.15732049942016602, 0.2632768452167511, 0.3692331910133362, 0.47518953680992126, 0.5811458826065063, 0.687102198600769, 0.7930585741996765, 0.899014949798584, 1.0049712657928467, 1.1109275817871094, 1.216883897781372, 1.3228403329849243, 1.428796648979187, 1.5347529649734497, 1.640709400177002, 1.7466657161712646, 1.8526220321655273, 1.95857834815979, 2.0645346641540527, 2.1704909801483154, 2.276447296142578, 2.38240385055542, 2.4883601665496826, 2.5943164825439453, 2.700272798538208]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 12.0, 8.0, 4.0, 19.0, 20.0, 19.0, 13.0, 27.0, 20.0, 35.0, 28.0, 34.0, 30.0, 41.0, 36.0, 33.0, 35.0, 54.0, 54.0, 49.0, 40.0, 37.0, 46.0, 40.0, 32.0, 21.0, 25.0, 23.0, 25.0, 18.0, 17.0, 16.0, 21.0, 10.0, 9.0, 11.0, 9.0, 6.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.7628726959228516, -2.6665525436401367, -2.570232391357422, -2.473912239074707, -2.377592086791992, -2.2812716960906982, -2.1849515438079834, -2.0886313915252686, -1.9923112392425537, -1.8959910869598389, -1.799670934677124, -1.7033506631851196, -1.6070305109024048, -1.51071035861969, -1.4143900871276855, -1.3180699348449707, -1.2217497825622559, -1.125429630279541, -1.0291094779968262, -0.9327892065048218, -0.8364690542221069, -0.7401489019393921, -0.6438286900520325, -0.5475084781646729, -0.451188325881958, -0.3548681437969208, -0.25854796171188354, -0.1622277796268463, -0.06590759754180908, 0.03041258454322815, 0.12673276662826538, 0.223052978515625, 0.31937313079833984, 0.4156933128833771, 0.5120134949684143, 0.6083337068557739, 0.7046538591384888, 0.8009740114212036, 0.8972942233085632, 0.9936144351959229, 1.0899345874786377, 1.1862547397613525, 1.2825748920440674, 1.3788951635360718, 1.4752153158187866, 1.5715354681015015, 1.6678557395935059, 1.7641758918762207, 1.8604960441589355, 1.9568161964416504, 2.0531363487243652, 2.14945650100708, 2.245776653289795, 2.342097043991089, 2.4384171962738037, 2.5347373485565186, 2.6310575008392334, 2.7273776531219482, 2.823697805404663, 2.920017957687378, 3.016338348388672, 3.1126585006713867, 3.2089786529541016, 3.3052988052368164, 3.4016189575195312]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 7.0, 3.0, 6.0, 15.0, 24.0, 24.0, 31.0, 57.0, 84.0, 123.0, 195.0, 296.0, 392.0, 669.0, 1011.0, 1493.0, 2294.0, 3747.0, 5969.0, 9714.0, 15852.0, 26180.0, 45045.0, 82398.0, 152489.0, 235024.0, 199965.0, 114316.0, 61737.0, 35191.0, 20696.0, 12382.0, 7787.0, 4938.0, 3074.0, 1834.0, 1271.0, 775.0, 499.0, 327.0, 207.0, 161.0, 77.0, 72.0, 43.0, 27.0, 5.0, 12.0, 8.0, 7.0, 5.0], "bins": [-0.619140625, -0.6031684875488281, -0.5871963500976562, -0.5712242126464844, -0.5552520751953125, -0.5392799377441406, -0.5233078002929688, -0.5073356628417969, -0.491363525390625, -0.4753913879394531, -0.45941925048828125, -0.4434471130371094, -0.4274749755859375, -0.4115028381347656, -0.39553070068359375, -0.3795585632324219, -0.36358642578125, -0.3476142883300781, -0.33164215087890625, -0.3156700134277344, -0.2996978759765625, -0.2837257385253906, -0.26775360107421875, -0.2517814636230469, -0.235809326171875, -0.21983718872070312, -0.20386505126953125, -0.18789291381835938, -0.1719207763671875, -0.15594863891601562, -0.13997650146484375, -0.12400436401367188, -0.1080322265625, -0.09206008911132812, -0.07608795166015625, -0.060115814208984375, -0.0441436767578125, -0.028171539306640625, -0.01219940185546875, 0.003772735595703125, 0.019744873046875, 0.035717010498046875, 0.05168914794921875, 0.06766128540039062, 0.0836334228515625, 0.09960556030273438, 0.11557769775390625, 0.13154983520507812, 0.14752197265625, 0.16349411010742188, 0.17946624755859375, 0.19543838500976562, 0.2114105224609375, 0.22738265991210938, 0.24335479736328125, 0.2593269348144531, 0.275299072265625, 0.2912712097167969, 0.30724334716796875, 0.3232154846191406, 0.3391876220703125, 0.3551597595214844, 0.37113189697265625, 0.3871040344238281, 0.403076171875]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 12.0, 8.0, 4.0, 19.0, 20.0, 20.0, 13.0, 24.0, 23.0, 34.0, 30.0, 29.0, 34.0, 40.0, 35.0, 35.0, 35.0, 55.0, 51.0, 49.0, 42.0, 39.0, 44.0, 39.0, 32.0, 22.0, 24.0, 26.0, 23.0, 18.0, 17.0, 16.0, 21.0, 10.0, 8.0, 12.0, 9.0, 6.0, 6.0, 6.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.66015625, -2.56658935546875, -2.4730224609375, -2.37945556640625, -2.285888671875, -2.19232177734375, -2.0987548828125, -2.00518798828125, -1.91162109375, -1.81805419921875, -1.7244873046875, -1.63092041015625, -1.537353515625, -1.44378662109375, -1.3502197265625, -1.25665283203125, -1.1630859375, -1.06951904296875, -0.9759521484375, -0.88238525390625, -0.788818359375, -0.69525146484375, -0.6016845703125, -0.50811767578125, -0.41455078125, -0.32098388671875, -0.2274169921875, -0.13385009765625, -0.040283203125, 0.05328369140625, 0.1468505859375, 0.24041748046875, 0.333984375, 0.42755126953125, 0.5211181640625, 0.61468505859375, 0.708251953125, 0.80181884765625, 0.8953857421875, 0.98895263671875, 1.08251953125, 1.17608642578125, 1.2696533203125, 1.36322021484375, 1.456787109375, 1.55035400390625, 1.6439208984375, 1.73748779296875, 1.8310546875, 1.92462158203125, 2.0181884765625, 2.11175537109375, 2.205322265625, 2.29888916015625, 2.3924560546875, 2.48602294921875, 2.57958984375, 2.67315673828125, 2.7667236328125, 2.86029052734375, 2.953857421875, 3.04742431640625, 3.1409912109375, 3.23455810546875, 3.328125]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 8.0, 8.0, 8.0, 14.0, 22.0, 15.0, 29.0, 36.0, 43.0, 56.0, 83.0, 111.0, 146.0, 185.0, 244.0, 407.0, 543.0, 843.0, 1292.0, 2501.0, 5318.0, 13054.0, 44844.0, 912504.0, 42147.0, 12579.0, 5030.0, 2432.0, 1328.0, 805.0, 547.0, 355.0, 242.0, 198.0, 142.0, 87.0, 81.0, 65.0, 43.0, 36.0, 22.0, 26.0, 18.0, 13.0, 11.0, 11.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0], "bins": [-1.5087890625, -1.4608612060546875, -1.412933349609375, -1.3650054931640625, -1.31707763671875, -1.2691497802734375, -1.221221923828125, -1.1732940673828125, -1.1253662109375, -1.0774383544921875, -1.029510498046875, -0.9815826416015625, -0.93365478515625, -0.8857269287109375, -0.837799072265625, -0.7898712158203125, -0.741943359375, -0.6940155029296875, -0.646087646484375, -0.5981597900390625, -0.55023193359375, -0.5023040771484375, -0.454376220703125, -0.4064483642578125, -0.3585205078125, -0.3105926513671875, -0.262664794921875, -0.2147369384765625, -0.16680908203125, -0.1188812255859375, -0.070953369140625, -0.0230255126953125, 0.02490234375, 0.0728302001953125, 0.120758056640625, 0.1686859130859375, 0.21661376953125, 0.2645416259765625, 0.312469482421875, 0.3603973388671875, 0.4083251953125, 0.4562530517578125, 0.504180908203125, 0.5521087646484375, 0.60003662109375, 0.6479644775390625, 0.695892333984375, 0.7438201904296875, 0.791748046875, 0.8396759033203125, 0.887603759765625, 0.9355316162109375, 0.98345947265625, 1.0313873291015625, 1.079315185546875, 1.1272430419921875, 1.1751708984375, 1.2230987548828125, 1.271026611328125, 1.3189544677734375, 1.36688232421875, 1.4148101806640625, 1.462738037109375, 1.5106658935546875, 1.55859375]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 4.0, 12.0, 9.0, 8.0, 7.0, 17.0, 20.0, 18.0, 25.0, 26.0, 17.0, 23.0, 25.0, 33.0, 25.0, 30.0, 49.0, 45.0, 48.0, 37.0, 45.0, 49.0, 41.0, 54.0, 32.0, 41.0, 29.0, 30.0, 35.0, 36.0, 13.0, 19.0, 15.0, 12.0, 19.0, 11.0, 6.0, 13.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.84375, -1.784393310546875, -1.72503662109375, -1.665679931640625, -1.6063232421875, -1.546966552734375, -1.48760986328125, -1.428253173828125, -1.368896484375, -1.309539794921875, -1.25018310546875, -1.190826416015625, -1.1314697265625, -1.072113037109375, -1.01275634765625, -0.953399658203125, -0.89404296875, -0.834686279296875, -0.77532958984375, -0.715972900390625, -0.6566162109375, -0.597259521484375, -0.53790283203125, -0.478546142578125, -0.419189453125, -0.359832763671875, -0.30047607421875, -0.241119384765625, -0.1817626953125, -0.122406005859375, -0.06304931640625, -0.003692626953125, 0.0556640625, 0.115020751953125, 0.17437744140625, 0.233734130859375, 0.2930908203125, 0.352447509765625, 0.41180419921875, 0.471160888671875, 0.530517578125, 0.589874267578125, 0.64923095703125, 0.708587646484375, 0.7679443359375, 0.827301025390625, 0.88665771484375, 0.946014404296875, 1.00537109375, 1.064727783203125, 1.12408447265625, 1.183441162109375, 1.2427978515625, 1.302154541015625, 1.36151123046875, 1.420867919921875, 1.480224609375, 1.539581298828125, 1.59893798828125, 1.658294677734375, 1.7176513671875, 1.777008056640625, 1.83636474609375, 1.895721435546875, 1.955078125]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 8.0, 7.0, 3.0, 10.0, 9.0, 24.0, 28.0, 31.0, 61.0, 76.0, 104.0, 138.0, 187.0, 328.0, 451.0, 774.0, 1396.0, 2947.0, 7157.0, 25893.0, 947521.0, 43288.0, 10066.0, 3695.0, 1714.0, 950.0, 556.0, 365.0, 207.0, 150.0, 96.0, 66.0, 53.0, 46.0, 36.0, 29.0, 12.0, 13.0, 16.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1788330078125, -0.17280006408691406, -0.16676712036132812, -0.1607341766357422, -0.15470123291015625, -0.1486682891845703, -0.14263534545898438, -0.13660240173339844, -0.1305694580078125, -0.12453651428222656, -0.11850357055664062, -0.11247062683105469, -0.10643768310546875, -0.10040473937988281, -0.09437179565429688, -0.08833885192871094, -0.082305908203125, -0.07627296447753906, -0.07024002075195312, -0.06420707702636719, -0.05817413330078125, -0.05214118957519531, -0.046108245849609375, -0.04007530212402344, -0.0340423583984375, -0.028009414672851562, -0.021976470947265625, -0.015943527221679688, -0.00991058349609375, -0.0038776397705078125, 0.002155303955078125, 0.008188247680664062, 0.01422119140625, 0.020254135131835938, 0.026287078857421875, 0.03232002258300781, 0.03835296630859375, 0.04438591003417969, 0.050418853759765625, 0.05645179748535156, 0.0624847412109375, 0.06851768493652344, 0.07455062866210938, 0.08058357238769531, 0.08661651611328125, 0.09264945983886719, 0.09868240356445312, 0.10471534729003906, 0.110748291015625, 0.11678123474121094, 0.12281417846679688, 0.1288471221923828, 0.13488006591796875, 0.1409130096435547, 0.14694595336914062, 0.15297889709472656, 0.1590118408203125, 0.16504478454589844, 0.17107772827148438, 0.1771106719970703, 0.18314361572265625, 0.1891765594482422, 0.19520950317382812, 0.20124244689941406, 0.207275390625]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 8.0, 9.0, 15.0, 12.0, 19.0, 23.0, 30.0, 25.0, 52.0, 35.0, 54.0, 58.0, 49.0, 71.0, 51.0, 52.0, 60.0, 50.0, 43.0, 52.0, 42.0, 34.0, 35.0, 22.0, 8.0, 11.0, 15.0, 7.0, 8.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.159046173095703e-05, -3.064796328544617e-05, -2.9705464839935303e-05, -2.876296639442444e-05, -2.7820467948913574e-05, -2.687796950340271e-05, -2.5935471057891846e-05, -2.499297261238098e-05, -2.4050474166870117e-05, -2.3107975721359253e-05, -2.216547727584839e-05, -2.1222978830337524e-05, -2.028048038482666e-05, -1.9337981939315796e-05, -1.839548349380493e-05, -1.7452985048294067e-05, -1.6510486602783203e-05, -1.556798815727234e-05, -1.4625489711761475e-05, -1.368299126625061e-05, -1.2740492820739746e-05, -1.1797994375228882e-05, -1.0855495929718018e-05, -9.912997484207153e-06, -8.970499038696289e-06, -8.028000593185425e-06, -7.0855021476745605e-06, -6.143003702163696e-06, -5.200505256652832e-06, -4.258006811141968e-06, -3.3155083656311035e-06, -2.3730099201202393e-06, -1.430511474609375e-06, -4.880130290985107e-07, 4.544854164123535e-07, 1.3969838619232178e-06, 2.339482307434082e-06, 3.2819807529449463e-06, 4.2244791984558105e-06, 5.166977643966675e-06, 6.109476089477539e-06, 7.051974534988403e-06, 7.994472980499268e-06, 8.936971426010132e-06, 9.879469871520996e-06, 1.082196831703186e-05, 1.1764466762542725e-05, 1.2706965208053589e-05, 1.3649463653564453e-05, 1.4591962099075317e-05, 1.553446054458618e-05, 1.6476958990097046e-05, 1.741945743560791e-05, 1.8361955881118774e-05, 1.930445432662964e-05, 2.0246952772140503e-05, 2.1189451217651367e-05, 2.213194966316223e-05, 2.3074448108673096e-05, 2.401694655418396e-05, 2.4959444999694824e-05, 2.590194344520569e-05, 2.6844441890716553e-05, 2.7786940336227417e-05, 2.872943878173828e-05]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 6.0, 8.0, 16.0, 15.0, 17.0, 16.0, 32.0, 47.0, 48.0, 199.0, 772.0, 25977.0, 977397.0, 42369.0, 1106.0, 211.0, 78.0, 53.0, 33.0, 26.0, 21.0, 13.0, 12.0, 11.0, 9.0, 7.0, 6.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.431884765625, -0.41901397705078125, -0.4061431884765625, -0.39327239990234375, -0.380401611328125, -0.36753082275390625, -0.3546600341796875, -0.34178924560546875, -0.32891845703125, -0.31604766845703125, -0.3031768798828125, -0.29030609130859375, -0.277435302734375, -0.26456451416015625, -0.2516937255859375, -0.23882293701171875, -0.2259521484375, -0.21308135986328125, -0.2002105712890625, -0.18733978271484375, -0.174468994140625, -0.16159820556640625, -0.1487274169921875, -0.13585662841796875, -0.12298583984375, -0.11011505126953125, -0.0972442626953125, -0.08437347412109375, -0.071502685546875, -0.05863189697265625, -0.0457611083984375, -0.03289031982421875, -0.02001953125, -0.00714874267578125, 0.0057220458984375, 0.01859283447265625, 0.031463623046875, 0.04433441162109375, 0.0572052001953125, 0.07007598876953125, 0.08294677734375, 0.09581756591796875, 0.1086883544921875, 0.12155914306640625, 0.134429931640625, 0.14730072021484375, 0.1601715087890625, 0.17304229736328125, 0.1859130859375, 0.19878387451171875, 0.2116546630859375, 0.22452545166015625, 0.237396240234375, 0.25026702880859375, 0.2631378173828125, 0.27600860595703125, 0.28887939453125, 0.30175018310546875, 0.3146209716796875, 0.32749176025390625, 0.340362548828125, 0.35323333740234375, 0.3661041259765625, 0.37897491455078125, 0.391845703125]}, "gradients/decoder.roberta.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 6.0, 3.0, 9.0, 10.0, 13.0, 21.0, 15.0, 23.0, 33.0, 32.0, 74.0, 78.0, 128.0, 149.0, 123.0, 76.0, 35.0, 28.0, 27.0, 16.0, 12.0, 12.0, 14.0, 6.0, 6.0, 7.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0185089111328125, -0.017918109893798828, -0.017327308654785156, -0.016736507415771484, -0.016145706176757812, -0.01555490493774414, -0.014964103698730469, -0.014373302459716797, -0.013782501220703125, -0.013191699981689453, -0.012600898742675781, -0.01201009750366211, -0.011419296264648438, -0.010828495025634766, -0.010237693786621094, -0.009646892547607422, -0.00905609130859375, -0.008465290069580078, -0.007874488830566406, -0.007283687591552734, -0.0066928863525390625, -0.006102085113525391, -0.005511283874511719, -0.004920482635498047, -0.004329681396484375, -0.003738880157470703, -0.0031480789184570312, -0.0025572776794433594, -0.0019664764404296875, -0.0013756752014160156, -0.0007848739624023438, -0.00019407272338867188, 0.000396728515625, 0.0009875297546386719, 0.0015783309936523438, 0.0021691322326660156, 0.0027599334716796875, 0.0033507347106933594, 0.003941535949707031, 0.004532337188720703, 0.005123138427734375, 0.005713939666748047, 0.006304740905761719, 0.006895542144775391, 0.0074863433837890625, 0.008077144622802734, 0.008667945861816406, 0.009258747100830078, 0.00984954833984375, 0.010440349578857422, 0.011031150817871094, 0.011621952056884766, 0.012212753295898438, 0.01280355453491211, 0.013394355773925781, 0.013985157012939453, 0.014575958251953125, 0.015166759490966797, 0.01575756072998047, 0.01634836196899414, 0.016939163208007812, 0.017529964447021484, 0.018120765686035156, 0.018711566925048828, 0.0193023681640625]}, "gradients/decoder.roberta.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 11.0, 10.0, 15.0, 19.0, 22.0, 34.0, 50.0, 56.0, 61.0, 89.0, 75.0, 75.0, 70.0, 80.0, 50.0, 75.0, 45.0, 36.0, 32.0, 23.0, 19.0, 15.0, 5.0, 12.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6910080909729004, -3.5934150218963623, -3.495821714401245, -3.398228645324707, -3.30063533782959, -3.2030422687530518, -3.1054491996765137, -3.0078558921813965, -2.9102625846862793, -2.812669515609741, -2.715076208114624, -2.617483139038086, -2.5198898315429688, -2.4222967624664307, -2.3247036933898926, -2.2271103858947754, -2.1295173168182373, -2.031924247741699, -1.934330940246582, -1.836737871170044, -1.7391445636749268, -1.6415514945983887, -1.543958306312561, -1.4463651180267334, -1.3487719297409058, -1.2511787414550781, -1.1535855531692505, -1.0559923648834229, -0.95839923620224, -0.8608060479164124, -0.7632129192352295, -0.6656197309494019, -0.5680263042449951, -0.4704331159591675, -0.37283995747566223, -0.275246798992157, -0.17765361070632935, -0.08006042242050171, 0.017532706260681152, 0.11512589454650879, 0.21271908283233643, 0.31031227111816406, 0.4079054296016693, 0.5054985880851746, 0.6030917763710022, 0.7006849646568298, 0.7982780933380127, 0.8958712816238403, 0.993464469909668, 1.0910576581954956, 1.1886508464813232, 1.2862439155578613, 1.3838372230529785, 1.4814302921295166, 1.5790234804153442, 1.6766166687011719, 1.7742098569869995, 1.8718030452728271, 1.9693962335586548, 2.0669894218444824, 2.1645824909210205, 2.2621757984161377, 2.359768867492676, 2.457362174987793, 2.554955244064331]}, "gradients/decoder.roberta.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 10.0, 9.0, 5.0, 19.0, 19.0, 20.0, 14.0, 25.0, 21.0, 34.0, 30.0, 32.0, 31.0, 41.0, 37.0, 32.0, 39.0, 52.0, 50.0, 51.0, 42.0, 37.0, 45.0, 38.0, 33.0, 22.0, 23.0, 26.0, 24.0, 17.0, 17.0, 16.0, 21.0, 11.0, 8.0, 11.0, 9.0, 6.0, 6.0, 6.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.656170606613159, -2.562673568725586, -2.4691762924194336, -2.3756792545318604, -2.282181978225708, -2.1886849403381348, -2.0951876640319824, -2.001690626144409, -1.908193588256836, -1.8146964311599731, -1.7211992740631104, -1.627702236175537, -1.5342050790786743, -1.4407079219818115, -1.3472107648849487, -1.253713607788086, -1.1602164506912231, -1.0667192935943604, -0.9732221961021423, -0.8797250390052795, -0.7862279415130615, -0.6927307844161987, -0.5992336273193359, -0.5057365298271179, -0.4122393727302551, -0.3187422454357147, -0.22524510324001312, -0.13174796104431152, -0.03825083374977112, 0.05524629354476929, 0.14874345064163208, 0.2422405481338501, 0.3357377052307129, 0.4292348325252533, 0.5227319598197937, 0.6162291169166565, 0.7097262144088745, 0.8032233715057373, 0.8967205286026001, 0.9902176260948181, 1.0837147235870361, 1.177211880683899, 1.2707090377807617, 1.364206075668335, 1.4577032327651978, 1.5512003898620605, 1.6446975469589233, 1.7381947040557861, 1.831691861152649, 1.9251890182495117, 2.018686056137085, 2.1121833324432373, 2.2056803703308105, 2.299177646636963, 2.392674684524536, 2.4861717224121094, 2.5796689987182617, 2.673166036605835, 2.7666633129119873, 2.8601603507995605, 2.953657627105713, 3.047154664993286, 3.1406517028808594, 3.2341489791870117, 3.327646017074585]}, "gradients/decoder.roberta.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 9.0, 10.0, 15.0, 17.0, 20.0, 34.0, 32.0, 47.0, 67.0, 95.0, 111.0, 136.0, 227.0, 282.0, 430.0, 838.0, 1821.0, 4499.0, 12109.0, 32947.0, 92257.0, 295498.0, 404149.0, 129831.0, 44932.0, 16714.0, 6153.0, 2448.0, 1050.0, 552.0, 322.0, 244.0, 155.0, 132.0, 102.0, 56.0, 57.0, 35.0, 28.0, 29.0, 25.0, 10.0, 5.0, 7.0, 4.0, 2.0, 8.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.728515625, -3.619354248046875, -3.51019287109375, -3.401031494140625, -3.2918701171875, -3.182708740234375, -3.07354736328125, -2.964385986328125, -2.855224609375, -2.746063232421875, -2.63690185546875, -2.527740478515625, -2.4185791015625, -2.309417724609375, -2.20025634765625, -2.091094970703125, -1.98193359375, -1.872772216796875, -1.76361083984375, -1.654449462890625, -1.5452880859375, -1.436126708984375, -1.32696533203125, -1.217803955078125, -1.108642578125, -0.999481201171875, -0.89031982421875, -0.781158447265625, -0.6719970703125, -0.562835693359375, -0.45367431640625, -0.344512939453125, -0.2353515625, -0.126190185546875, -0.01702880859375, 0.092132568359375, 0.2012939453125, 0.310455322265625, 0.41961669921875, 0.528778076171875, 0.637939453125, 0.747100830078125, 0.85626220703125, 0.965423583984375, 1.0745849609375, 1.183746337890625, 1.29290771484375, 1.402069091796875, 1.51123046875, 1.620391845703125, 1.72955322265625, 1.838714599609375, 1.9478759765625, 2.057037353515625, 2.16619873046875, 2.275360107421875, 2.384521484375, 2.493682861328125, 2.60284423828125, 2.712005615234375, 2.8211669921875, 2.930328369140625, 3.03948974609375, 3.148651123046875, 3.2578125]}, "gradients/decoder.roberta.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 15.0, 3.0, 5.0, 16.0, 23.0, 20.0, 12.0, 23.0, 30.0, 21.0, 33.0, 38.0, 34.0, 38.0, 35.0, 32.0, 46.0, 45.0, 52.0, 48.0, 40.0, 41.0, 43.0, 39.0, 32.0, 23.0, 25.0, 18.0, 30.0, 20.0, 15.0, 20.0, 17.0, 11.0, 14.0, 7.0, 9.0, 7.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.69140625, -2.5966796875, -2.501953125, -2.4072265625, -2.3125, -2.2177734375, -2.123046875, -2.0283203125, -1.93359375, -1.8388671875, -1.744140625, -1.6494140625, -1.5546875, -1.4599609375, -1.365234375, -1.2705078125, -1.17578125, -1.0810546875, -0.986328125, -0.8916015625, -0.796875, -0.7021484375, -0.607421875, -0.5126953125, -0.41796875, -0.3232421875, -0.228515625, -0.1337890625, -0.0390625, 0.0556640625, 0.150390625, 0.2451171875, 0.33984375, 0.4345703125, 0.529296875, 0.6240234375, 0.71875, 0.8134765625, 0.908203125, 1.0029296875, 1.09765625, 1.1923828125, 1.287109375, 1.3818359375, 1.4765625, 1.5712890625, 1.666015625, 1.7607421875, 1.85546875, 1.9501953125, 2.044921875, 2.1396484375, 2.234375, 2.3291015625, 2.423828125, 2.5185546875, 2.61328125, 2.7080078125, 2.802734375, 2.8974609375, 2.9921875, 3.0869140625, 3.181640625, 3.2763671875, 3.37109375]}, "gradients/decoder.roberta.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 9.0, 9.0, 12.0, 19.0, 22.0, 24.0, 34.0, 28.0, 56.0, 66.0, 75.0, 112.0, 163.0, 251.0, 1039227.0, 7685.0, 181.0, 144.0, 82.0, 71.0, 59.0, 51.0, 37.0, 26.0, 18.0, 15.0, 12.0, 9.0, 13.0, 11.0, 9.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.5, -82.4306640625, -79.361328125, -76.2919921875, -73.22265625, -70.1533203125, -67.083984375, -64.0146484375, -60.9453125, -57.8759765625, -54.806640625, -51.7373046875, -48.66796875, -45.5986328125, -42.529296875, -39.4599609375, -36.390625, -33.3212890625, -30.251953125, -27.1826171875, -24.11328125, -21.0439453125, -17.974609375, -14.9052734375, -11.8359375, -8.7666015625, -5.697265625, -2.6279296875, 0.44140625, 3.5107421875, 6.580078125, 9.6494140625, 12.71875, 15.7880859375, 18.857421875, 21.9267578125, 24.99609375, 28.0654296875, 31.134765625, 34.2041015625, 37.2734375, 40.3427734375, 43.412109375, 46.4814453125, 49.55078125, 52.6201171875, 55.689453125, 58.7587890625, 61.828125, 64.8974609375, 67.966796875, 71.0361328125, 74.10546875, 77.1748046875, 80.244140625, 83.3134765625, 86.3828125, 89.4521484375, 92.521484375, 95.5908203125, 98.66015625, 101.7294921875, 104.798828125, 107.8681640625, 110.9375]}, "gradients/decoder.roberta.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 13.0, 11.0, 11.0, 11.0, 10.0, 17.0, 21.0, 32.0, 29.0, 48.0, 41.0, 40.0, 43.0, 51.0, 45.0, 58.0, 65.0, 48.0, 52.0, 40.0, 50.0, 50.0, 42.0, 23.0, 30.0, 21.0, 22.0, 10.0, 20.0, 14.0, 7.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.935546875, -3.82623291015625, -3.7169189453125, -3.60760498046875, -3.498291015625, -3.38897705078125, -3.2796630859375, -3.17034912109375, -3.06103515625, -2.95172119140625, -2.8424072265625, -2.73309326171875, -2.623779296875, -2.51446533203125, -2.4051513671875, -2.29583740234375, -2.1865234375, -2.07720947265625, -1.9678955078125, -1.85858154296875, -1.749267578125, -1.63995361328125, -1.5306396484375, -1.42132568359375, -1.31201171875, -1.20269775390625, -1.0933837890625, -0.98406982421875, -0.874755859375, -0.76544189453125, -0.6561279296875, -0.54681396484375, -0.4375, -0.32818603515625, -0.2188720703125, -0.10955810546875, -0.000244140625, 0.10906982421875, 0.2183837890625, 0.32769775390625, 0.43701171875, 0.54632568359375, 0.6556396484375, 0.76495361328125, 0.874267578125, 0.98358154296875, 1.0928955078125, 1.20220947265625, 1.3115234375, 1.42083740234375, 1.5301513671875, 1.63946533203125, 1.748779296875, 1.85809326171875, 1.9674072265625, 2.07672119140625, 2.18603515625, 2.29534912109375, 2.4046630859375, 2.51397705078125, 2.623291015625, 2.73260498046875, 2.8419189453125, 2.95123291015625, 3.060546875]}, "gradients/decoder.roberta.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 6.0, 4.0, 10.0, 8.0, 12.0, 16.0, 28.0, 39.0, 59.0, 95.0, 237.0, 403.0, 825.0, 2195.0, 11507.0, 171887.0, 811753.0, 42265.0, 4640.0, 1244.0, 608.0, 299.0, 155.0, 87.0, 59.0, 28.0, 23.0, 18.0, 6.0, 8.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6796875, -4.519775390625, -4.35986328125, -4.199951171875, -4.0400390625, -3.880126953125, -3.72021484375, -3.560302734375, -3.400390625, -3.240478515625, -3.08056640625, -2.920654296875, -2.7607421875, -2.600830078125, -2.44091796875, -2.281005859375, -2.12109375, -1.961181640625, -1.80126953125, -1.641357421875, -1.4814453125, -1.321533203125, -1.16162109375, -1.001708984375, -0.841796875, -0.681884765625, -0.52197265625, -0.362060546875, -0.2021484375, -0.042236328125, 0.11767578125, 0.277587890625, 0.4375, 0.597412109375, 0.75732421875, 0.917236328125, 1.0771484375, 1.237060546875, 1.39697265625, 1.556884765625, 1.716796875, 1.876708984375, 2.03662109375, 2.196533203125, 2.3564453125, 2.516357421875, 2.67626953125, 2.836181640625, 2.99609375, 3.156005859375, 3.31591796875, 3.475830078125, 3.6357421875, 3.795654296875, 3.95556640625, 4.115478515625, 4.275390625, 4.435302734375, 4.59521484375, 4.755126953125, 4.9150390625, 5.074951171875, 5.23486328125, 5.394775390625, 5.5546875]}, "gradients/decoder.roberta.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 7.0, 7.0, 12.0, 19.0, 28.0, 52.0, 91.0, 149.0, 253.0, 175.0, 86.0, 45.0, 31.0, 21.0, 13.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033783912658691406, -0.0003234781324863434, -0.0003091171383857727, -0.000294756144285202, -0.00028039515018463135, -0.00026603415608406067, -0.00025167316198349, -0.0002373121678829193, -0.00022295117378234863, -0.00020859017968177795, -0.00019422918558120728, -0.0001798681914806366, -0.00016550719738006592, -0.00015114620327949524, -0.00013678520917892456, -0.00012242421507835388, -0.0001080632209777832, -9.370222687721252e-05, -7.934123277664185e-05, -6.498023867607117e-05, -5.061924457550049e-05, -3.625825047492981e-05, -2.189725637435913e-05, -7.536262273788452e-06, 6.8247318267822266e-06, 2.1185725927352905e-05, 3.5546720027923584e-05, 4.990771412849426e-05, 6.426870822906494e-05, 7.862970232963562e-05, 9.29906964302063e-05, 0.00010735169053077698, 0.00012171268463134766, 0.00013607367873191833, 0.00015043467283248901, 0.0001647956669330597, 0.00017915666103363037, 0.00019351765513420105, 0.00020787864923477173, 0.0002222396433353424, 0.00023660063743591309, 0.00025096163153648376, 0.00026532262563705444, 0.0002796836197376251, 0.0002940446138381958, 0.0003084056079387665, 0.00032276660203933716, 0.00033712759613990784, 0.0003514885902404785, 0.0003658495843410492, 0.0003802105784416199, 0.00039457157254219055, 0.00040893256664276123, 0.0004232935607433319, 0.0004376545548439026, 0.00045201554894447327, 0.00046637654304504395, 0.0004807375371456146, 0.0004950985312461853, 0.000509459525346756, 0.0005238205194473267, 0.0005381815135478973, 0.000552542507648468, 0.0005669035017490387, 0.0005812644958496094]}, "gradients/decoder.roberta.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 10.0, 1.0, 5.0, 9.0, 4.0, 9.0, 18.0, 18.0, 28.0, 57.0, 125.0, 362.0, 1777.0, 40389.0, 995557.0, 8753.0, 972.0, 238.0, 87.0, 49.0, 22.0, 15.0, 21.0, 11.0, 6.0, 5.0, 5.0, 7.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-17.03125, -16.619140625, -16.20703125, -15.794921875, -15.3828125, -14.970703125, -14.55859375, -14.146484375, -13.734375, -13.322265625, -12.91015625, -12.498046875, -12.0859375, -11.673828125, -11.26171875, -10.849609375, -10.4375, -10.025390625, -9.61328125, -9.201171875, -8.7890625, -8.376953125, -7.96484375, -7.552734375, -7.140625, -6.728515625, -6.31640625, -5.904296875, -5.4921875, -5.080078125, -4.66796875, -4.255859375, -3.84375, -3.431640625, -3.01953125, -2.607421875, -2.1953125, -1.783203125, -1.37109375, -0.958984375, -0.546875, -0.134765625, 0.27734375, 0.689453125, 1.1015625, 1.513671875, 1.92578125, 2.337890625, 2.75, 3.162109375, 3.57421875, 3.986328125, 4.3984375, 4.810546875, 5.22265625, 5.634765625, 6.046875, 6.458984375, 6.87109375, 7.283203125, 7.6953125, 8.107421875, 8.51953125, 8.931640625, 9.34375]}, "gradients/decoder.roberta.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 3.0, 5.0, 4.0, 9.0, 10.0, 20.0, 18.0, 28.0, 38.0, 39.0, 70.0, 99.0, 142.0, 150.0, 102.0, 81.0, 45.0, 36.0, 26.0, 22.0, 15.0, 8.0, 7.0, 11.0, 0.0, 4.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.513671875, -0.49309539794921875, -0.4725189208984375, -0.45194244384765625, -0.431365966796875, -0.41078948974609375, -0.3902130126953125, -0.36963653564453125, -0.34906005859375, -0.32848358154296875, -0.3079071044921875, -0.28733062744140625, -0.266754150390625, -0.24617767333984375, -0.2256011962890625, -0.20502471923828125, -0.1844482421875, -0.16387176513671875, -0.1432952880859375, -0.12271881103515625, -0.102142333984375, -0.08156585693359375, -0.0609893798828125, -0.04041290283203125, -0.01983642578125, 0.00074005126953125, 0.0213165283203125, 0.04189300537109375, 0.062469482421875, 0.08304595947265625, 0.1036224365234375, 0.12419891357421875, 0.144775390625, 0.16535186767578125, 0.1859283447265625, 0.20650482177734375, 0.227081298828125, 0.24765777587890625, 0.2682342529296875, 0.28881072998046875, 0.30938720703125, 0.32996368408203125, 0.3505401611328125, 0.37111663818359375, 0.391693115234375, 0.41226959228515625, 0.4328460693359375, 0.45342254638671875, 0.4739990234375, 0.49457550048828125, 0.5151519775390625, 0.5357284545898438, 0.556304931640625, 0.5768814086914062, 0.5974578857421875, 0.6180343627929688, 0.63861083984375, 0.6591873168945312, 0.6797637939453125, 0.7003402709960938, 0.720916748046875, 0.7414932250976562, 0.7620697021484375, 0.7826461791992188, 0.80322265625]}, "gradients/decoder.roberta.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 14.0, 17.0, 29.0, 47.0, 75.0, 90.0, 107.0, 129.0, 107.0, 101.0, 97.0, 84.0, 38.0, 28.0, 14.0, 9.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953302383422852, -4.788397789001465, -4.62349271774292, -4.458588123321533, -4.2936835289001465, -4.128778457641602, -3.963873863220215, -3.798969268798828, -3.6340644359588623, -3.4691596031188965, -3.3042550086975098, -3.139350175857544, -2.974445343017578, -2.8095407485961914, -2.6446359157562256, -2.4797310829162598, -2.314826488494873, -2.1499216556549072, -1.9850170612335205, -1.8201122283935547, -1.6552075147628784, -1.4903028011322021, -1.3253979682922363, -1.16049325466156, -0.9955885410308838, -0.8306838274002075, -0.6657790541648865, -0.5008742809295654, -0.33596956729888916, -0.1710648536682129, -0.006160080432891846, 0.1587446928024292, 0.32364988327026367, 0.48855462670326233, 0.653459370136261, 0.818364143371582, 0.9832688570022583, 1.1481735706329346, 1.3130784034729004, 1.4779831171035767, 1.642887830734253, 1.8077925443649292, 1.9726972579956055, 2.1376020908355713, 2.302506923675537, 2.467411518096924, 2.6323163509368896, 2.7972211837768555, 2.962125778198242, 3.127030611038208, 3.2919352054595947, 3.4568400382995605, 3.6217446327209473, 3.786649465560913, 3.951554298400879, 4.116458892822266, 4.281363487243652, 4.446268081665039, 4.611173152923584, 4.776077747344971, 4.940982341766357, 5.105887413024902, 5.270792007446289, 5.435696601867676, 5.600601673126221]}, "gradients/decoder.roberta.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 8.0, 3.0, 4.0, 8.0, 14.0, 14.0, 9.0, 22.0, 17.0, 10.0, 23.0, 22.0, 16.0, 23.0, 27.0, 25.0, 41.0, 31.0, 42.0, 42.0, 44.0, 40.0, 45.0, 34.0, 34.0, 36.0, 38.0, 42.0, 28.0, 27.0, 25.0, 26.0, 22.0, 31.0, 12.0, 18.0, 19.0, 14.0, 12.0, 18.0, 9.0, 5.0, 6.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.532188653945923, -3.4250974655151367, -3.3180062770843506, -3.2109150886535645, -3.103823661804199, -2.996732711791992, -2.889641284942627, -2.782550096511841, -2.6754589080810547, -2.5683677196502686, -2.4612765312194824, -2.3541853427886963, -2.24709415435791, -2.140002727508545, -2.032911539077759, -1.9258203506469727, -1.8187291622161865, -1.7116379737854004, -1.6045467853546143, -1.4974554777145386, -1.3903642892837524, -1.2832731008529663, -1.1761817932128906, -1.0690906047821045, -0.9619994163513184, -0.8549082279205322, -0.7478169798851013, -0.6407257318496704, -0.5336345434188843, -0.42654335498809814, -0.31945210695266724, -0.21236085891723633, -0.1052694320678711, 0.0018217861652374268, 0.10891300439834595, 0.21600422263145447, 0.323095440864563, 0.4301866292953491, 0.53727787733078, 0.6443691253662109, 0.7514603137969971, 0.8585515022277832, 0.9656427502632141, 1.072733998298645, 1.1798251867294312, 1.2869163751602173, 1.394007682800293, 1.501098871231079, 1.6081900596618652, 1.7152812480926514, 1.8223724365234375, 1.9294637441635132, 2.0365548133850098, 2.143646240234375, 2.250737428665161, 2.3578286170959473, 2.4649198055267334, 2.5720109939575195, 2.6791021823883057, 2.786193370819092, 2.893284797668457, 3.000375747680664, 3.1074671745300293, 3.2145583629608154, 3.3216495513916016]}, "gradients/decoder.roberta.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 10.0, 7.0, 13.0, 20.0, 27.0, 29.0, 38.0, 51.0, 63.0, 79.0, 86.0, 125.0, 147.0, 244.0, 354.0, 769.0, 3015.0, 26701.0, 1126499.0, 2977284.0, 51642.0, 4707.0, 986.0, 399.0, 259.0, 162.0, 102.0, 105.0, 93.0, 54.0, 46.0, 37.0, 26.0, 23.0, 26.0, 16.0, 12.0, 6.0, 10.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.484375, -11.1375732421875, -10.790771484375, -10.4439697265625, -10.09716796875, -9.7503662109375, -9.403564453125, -9.0567626953125, -8.7099609375, -8.3631591796875, -8.016357421875, -7.6695556640625, -7.32275390625, -6.9759521484375, -6.629150390625, -6.2823486328125, -5.935546875, -5.5887451171875, -5.241943359375, -4.8951416015625, -4.54833984375, -4.2015380859375, -3.854736328125, -3.5079345703125, -3.1611328125, -2.8143310546875, -2.467529296875, -2.1207275390625, -1.77392578125, -1.4271240234375, -1.080322265625, -0.7335205078125, -0.38671875, -0.0399169921875, 0.306884765625, 0.6536865234375, 1.00048828125, 1.3472900390625, 1.694091796875, 2.0408935546875, 2.3876953125, 2.7344970703125, 3.081298828125, 3.4281005859375, 3.77490234375, 4.1217041015625, 4.468505859375, 4.8153076171875, 5.162109375, 5.5089111328125, 5.855712890625, 6.2025146484375, 6.54931640625, 6.8961181640625, 7.242919921875, 7.5897216796875, 7.9365234375, 8.2833251953125, 8.630126953125, 8.9769287109375, 9.32373046875, 9.6705322265625, 10.017333984375, 10.3641357421875, 10.7109375]}, "gradients/decoder.roberta.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 2.0, 9.0, 9.0, 13.0, 8.0, 10.0, 12.0, 15.0, 12.0, 34.0, 28.0, 24.0, 22.0, 24.0, 40.0, 39.0, 43.0, 32.0, 39.0, 43.0, 46.0, 40.0, 45.0, 33.0, 36.0, 47.0, 28.0, 26.0, 23.0, 31.0, 22.0, 21.0, 23.0, 18.0, 15.0, 20.0, 14.0, 9.0, 8.0, 7.0, 5.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.138885498046875, -2.06488037109375, -1.990875244140625, -1.9168701171875, -1.842864990234375, -1.76885986328125, -1.694854736328125, -1.620849609375, -1.546844482421875, -1.47283935546875, -1.398834228515625, -1.3248291015625, -1.250823974609375, -1.17681884765625, -1.102813720703125, -1.02880859375, -0.954803466796875, -0.88079833984375, -0.806793212890625, -0.7327880859375, -0.658782958984375, -0.58477783203125, -0.510772705078125, -0.436767578125, -0.362762451171875, -0.28875732421875, -0.214752197265625, -0.1407470703125, -0.066741943359375, 0.00726318359375, 0.081268310546875, 0.1552734375, 0.229278564453125, 0.30328369140625, 0.377288818359375, 0.4512939453125, 0.525299072265625, 0.59930419921875, 0.673309326171875, 0.747314453125, 0.821319580078125, 0.89532470703125, 0.969329833984375, 1.0433349609375, 1.117340087890625, 1.19134521484375, 1.265350341796875, 1.33935546875, 1.413360595703125, 1.48736572265625, 1.561370849609375, 1.6353759765625, 1.709381103515625, 1.78338623046875, 1.857391357421875, 1.931396484375, 2.005401611328125, 2.07940673828125, 2.153411865234375, 2.2274169921875, 2.301422119140625, 2.37542724609375, 2.449432373046875, 2.5234375]}, "gradients/decoder.roberta.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 11.0, 8.0, 18.0, 24.0, 35.0, 37.0, 55.0, 80.0, 149.0, 253.0, 630.0, 3716.0, 1592589.0, 2591124.0, 4150.0, 675.0, 264.0, 145.0, 93.0, 59.0, 39.0, 30.0, 30.0, 18.0, 12.0, 6.0, 10.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.765625, -26.808837890625, -25.85205078125, -24.895263671875, -23.9384765625, -22.981689453125, -22.02490234375, -21.068115234375, -20.111328125, -19.154541015625, -18.19775390625, -17.240966796875, -16.2841796875, -15.327392578125, -14.37060546875, -13.413818359375, -12.45703125, -11.500244140625, -10.54345703125, -9.586669921875, -8.6298828125, -7.673095703125, -6.71630859375, -5.759521484375, -4.802734375, -3.845947265625, -2.88916015625, -1.932373046875, -0.9755859375, -0.018798828125, 0.93798828125, 1.894775390625, 2.8515625, 3.808349609375, 4.76513671875, 5.721923828125, 6.6787109375, 7.635498046875, 8.59228515625, 9.549072265625, 10.505859375, 11.462646484375, 12.41943359375, 13.376220703125, 14.3330078125, 15.289794921875, 16.24658203125, 17.203369140625, 18.16015625, 19.116943359375, 20.07373046875, 21.030517578125, 21.9873046875, 22.944091796875, 23.90087890625, 24.857666015625, 25.814453125, 26.771240234375, 27.72802734375, 28.684814453125, 29.6416015625, 30.598388671875, 31.55517578125, 32.511962890625, 33.46875]}, "gradients/decoder.roberta.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 7.0, 7.0, 17.0, 21.0, 35.0, 35.0, 55.0, 87.0, 126.0, 232.0, 355.0, 576.0, 822.0, 650.0, 387.0, 228.0, 150.0, 86.0, 61.0, 44.0, 25.0, 22.0, 14.0, 11.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.8818359375, -1.8289794921875, -1.776123046875, -1.7232666015625, -1.67041015625, -1.6175537109375, -1.564697265625, -1.5118408203125, -1.458984375, -1.4061279296875, -1.353271484375, -1.3004150390625, -1.24755859375, -1.1947021484375, -1.141845703125, -1.0889892578125, -1.0361328125, -0.9832763671875, -0.930419921875, -0.8775634765625, -0.82470703125, -0.7718505859375, -0.718994140625, -0.6661376953125, -0.61328125, -0.5604248046875, -0.507568359375, -0.4547119140625, -0.40185546875, -0.3489990234375, -0.296142578125, -0.2432861328125, -0.1904296875, -0.1375732421875, -0.084716796875, -0.0318603515625, 0.02099609375, 0.0738525390625, 0.126708984375, 0.1795654296875, 0.232421875, 0.2852783203125, 0.338134765625, 0.3909912109375, 0.44384765625, 0.4967041015625, 0.549560546875, 0.6024169921875, 0.6552734375, 0.7081298828125, 0.760986328125, 0.8138427734375, 0.86669921875, 0.9195556640625, 0.972412109375, 1.0252685546875, 1.078125, 1.1309814453125, 1.183837890625, 1.2366943359375, 1.28955078125, 1.3424072265625, 1.395263671875, 1.4481201171875, 1.5009765625]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 4.0, 11.0, 21.0, 26.0, 55.0, 68.0, 92.0, 149.0, 147.0, 129.0, 106.0, 73.0, 48.0, 37.0, 11.0, 20.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1458141803741455, -1.975105881690979, -1.8043975830078125, -1.6336894035339355, -1.462981104850769, -1.2922728061676025, -1.1215646266937256, -0.9508563280105591, -0.7801480293273926, -0.6094397306442261, -0.43873149156570435, -0.2680232524871826, -0.09731495380401611, 0.07339334487915039, 0.24410152435302734, 0.41480982303619385, 0.5855181217193604, 0.7562264204025269, 0.9269346594810486, 1.0976428985595703, 1.2683511972427368, 1.4390594959259033, 1.6097676753997803, 1.7804759740829468, 1.9511842727661133, 2.1218924522399902, 2.2926008701324463, 2.4633090496063232, 2.6340174674987793, 2.8047256469726562, 2.975433826446533, 3.14614200592041, 3.3168506622314453, 3.4875588417053223, 3.6582672595977783, 3.8289754390716553, 3.9996838569641113, 4.170392036437988, 4.341100215911865, 4.511808395385742, 4.682517051696777, 4.853225231170654, 5.023933410644531, 5.194642066955566, 5.365350246429443, 5.53605842590332, 5.706766605377197, 5.877474784851074, 6.048182964324951, 6.218891143798828, 6.389599323272705, 6.560307502746582, 6.731016159057617, 6.901724338531494, 7.072432518005371, 7.243140697479248, 7.413848876953125, 7.584557056427002, 7.755265235900879, 7.925973892211914, 8.096681594848633, 8.267390251159668, 8.438098907470703, 8.608806610107422, 8.779515266418457]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 6.0, 6.0, 7.0, 7.0, 9.0, 11.0, 12.0, 14.0, 14.0, 14.0, 18.0, 22.0, 23.0, 26.0, 30.0, 44.0, 35.0, 38.0, 32.0, 45.0, 29.0, 42.0, 44.0, 34.0, 37.0, 41.0, 39.0, 35.0, 29.0, 23.0, 19.0, 21.0, 33.0, 19.0, 17.0, 21.0, 10.0, 13.0, 16.0, 11.0, 9.0, 5.0, 9.0, 4.0, 8.0, 6.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.2370152473449707, -2.1595730781555176, -2.0821306705474854, -2.004688262939453, -1.92724609375, -1.8498038053512573, -1.7723615169525146, -1.694919228553772, -1.6174769401550293, -1.5400346517562866, -1.462592363357544, -1.3851500749588013, -1.3077077865600586, -1.230265498161316, -1.1528232097625732, -1.0753809213638306, -0.9979386329650879, -0.9204963445663452, -0.8430540561676025, -0.7656117677688599, -0.6881694793701172, -0.6107271909713745, -0.5332849025726318, -0.45584261417388916, -0.3784003257751465, -0.3009580373764038, -0.22351574897766113, -0.14607346057891846, -0.06863117218017578, 0.008811116218566895, 0.08625340461730957, 0.16369569301605225, 0.24113774299621582, 0.3185800313949585, 0.39602231979370117, 0.47346460819244385, 0.5509068965911865, 0.6283491849899292, 0.7057914733886719, 0.7832337617874146, 0.8606760501861572, 0.9381183385848999, 1.0155606269836426, 1.0930029153823853, 1.170445203781128, 1.2478874921798706, 1.3253297805786133, 1.402772068977356, 1.4802143573760986, 1.5576566457748413, 1.635098934173584, 1.7125412225723267, 1.7899835109710693, 1.867425799369812, 1.9448680877685547, 2.022310256958008, 2.09975266456604, 2.1771950721740723, 2.2546372413635254, 2.3320794105529785, 2.4095218181610107, 2.486964225769043, 2.564406394958496, 2.641848564147949, 2.7192909717559814]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [5.0, 3.0, 6.0, 3.0, 13.0, 15.0, 26.0, 30.0, 52.0, 77.0, 130.0, 181.0, 276.0, 397.0, 585.0, 860.0, 1308.0, 1873.0, 2805.0, 4279.0, 6827.0, 10182.0, 16599.0, 27411.0, 48016.0, 85246.0, 155569.0, 232112.0, 192348.0, 110307.0, 60362.0, 34342.0, 20759.0, 12408.0, 7877.0, 5070.0, 3370.0, 2237.0, 1502.0, 1009.0, 677.0, 430.0, 319.0, 216.0, 146.0, 88.0, 58.0, 41.0, 36.0, 26.0, 15.0, 18.0, 9.0, 5.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40966796875, -0.3948822021484375, -0.380096435546875, -0.3653106689453125, -0.35052490234375, -0.3357391357421875, -0.320953369140625, -0.3061676025390625, -0.2913818359375, -0.2765960693359375, -0.261810302734375, -0.2470245361328125, -0.23223876953125, -0.2174530029296875, -0.202667236328125, -0.1878814697265625, -0.173095703125, -0.1583099365234375, -0.143524169921875, -0.1287384033203125, -0.11395263671875, -0.0991668701171875, -0.084381103515625, -0.0695953369140625, -0.0548095703125, -0.0400238037109375, -0.025238037109375, -0.0104522705078125, 0.00433349609375, 0.0191192626953125, 0.033905029296875, 0.0486907958984375, 0.0634765625, 0.0782623291015625, 0.093048095703125, 0.1078338623046875, 0.12261962890625, 0.1374053955078125, 0.152191162109375, 0.1669769287109375, 0.1817626953125, 0.1965484619140625, 0.211334228515625, 0.2261199951171875, 0.24090576171875, 0.2556915283203125, 0.270477294921875, 0.2852630615234375, 0.300048828125, 0.3148345947265625, 0.329620361328125, 0.3444061279296875, 0.35919189453125, 0.3739776611328125, 0.388763427734375, 0.4035491943359375, 0.4183349609375, 0.4331207275390625, 0.447906494140625, 0.4626922607421875, 0.47747802734375, 0.4922637939453125, 0.507049560546875, 0.5218353271484375, 0.53662109375]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 7.0, 7.0, 14.0, 10.0, 13.0, 16.0, 14.0, 18.0, 23.0, 24.0, 29.0, 28.0, 41.0, 34.0, 38.0, 36.0, 38.0, 36.0, 43.0, 38.0, 37.0, 34.0, 43.0, 37.0, 36.0, 31.0, 21.0, 19.0, 19.0, 35.0, 21.0, 13.0, 22.0, 10.0, 13.0, 16.0, 12.0, 9.0, 5.0, 10.0, 4.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.126953125, -2.052001953125, -1.97705078125, -1.902099609375, -1.8271484375, -1.752197265625, -1.67724609375, -1.602294921875, -1.52734375, -1.452392578125, -1.37744140625, -1.302490234375, -1.2275390625, -1.152587890625, -1.07763671875, -1.002685546875, -0.927734375, -0.852783203125, -0.77783203125, -0.702880859375, -0.6279296875, -0.552978515625, -0.47802734375, -0.403076171875, -0.328125, -0.253173828125, -0.17822265625, -0.103271484375, -0.0283203125, 0.046630859375, 0.12158203125, 0.196533203125, 0.271484375, 0.346435546875, 0.42138671875, 0.496337890625, 0.5712890625, 0.646240234375, 0.72119140625, 0.796142578125, 0.87109375, 0.946044921875, 1.02099609375, 1.095947265625, 1.1708984375, 1.245849609375, 1.32080078125, 1.395751953125, 1.470703125, 1.545654296875, 1.62060546875, 1.695556640625, 1.7705078125, 1.845458984375, 1.92041015625, 1.995361328125, 2.0703125, 2.145263671875, 2.22021484375, 2.295166015625, 2.3701171875, 2.445068359375, 2.52001953125, 2.594970703125, 2.669921875]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 9.0, 12.0, 28.0, 17.0, 34.0, 43.0, 66.0, 102.0, 137.0, 249.0, 285.0, 467.0, 826.0, 1493.0, 3165.0, 8662.0, 33295.0, 931133.0, 49104.0, 11270.0, 3883.0, 1733.0, 926.0, 540.0, 349.0, 211.0, 178.0, 77.0, 75.0, 42.0, 34.0, 43.0, 24.0, 18.0, 3.0, 4.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9462890625, -1.8866119384765625, -1.826934814453125, -1.7672576904296875, -1.70758056640625, -1.6479034423828125, -1.588226318359375, -1.5285491943359375, -1.4688720703125, -1.4091949462890625, -1.349517822265625, -1.2898406982421875, -1.23016357421875, -1.1704864501953125, -1.110809326171875, -1.0511322021484375, -0.991455078125, -0.9317779541015625, -0.872100830078125, -0.8124237060546875, -0.75274658203125, -0.6930694580078125, -0.633392333984375, -0.5737152099609375, -0.5140380859375, -0.4543609619140625, -0.394683837890625, -0.3350067138671875, -0.27532958984375, -0.2156524658203125, -0.155975341796875, -0.0962982177734375, -0.03662109375, 0.0230560302734375, 0.082733154296875, 0.1424102783203125, 0.20208740234375, 0.2617645263671875, 0.321441650390625, 0.3811187744140625, 0.4407958984375, 0.5004730224609375, 0.560150146484375, 0.6198272705078125, 0.67950439453125, 0.7391815185546875, 0.798858642578125, 0.8585357666015625, 0.918212890625, 0.9778900146484375, 1.037567138671875, 1.0972442626953125, 1.15692138671875, 1.2165985107421875, 1.276275634765625, 1.3359527587890625, 1.3956298828125, 1.4553070068359375, 1.514984130859375, 1.5746612548828125, 1.63433837890625, 1.6940155029296875, 1.753692626953125, 1.8133697509765625, 1.873046875]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 8.0, 6.0, 7.0, 8.0, 6.0, 12.0, 9.0, 20.0, 22.0, 18.0, 22.0, 25.0, 20.0, 19.0, 20.0, 32.0, 43.0, 37.0, 34.0, 37.0, 49.0, 41.0, 43.0, 42.0, 41.0, 27.0, 33.0, 33.0, 32.0, 28.0, 34.0, 27.0, 29.0, 15.0, 20.0, 14.0, 16.0, 25.0, 10.0, 11.0, 7.0, 9.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.728515625, -1.6769561767578125, -1.625396728515625, -1.5738372802734375, -1.52227783203125, -1.4707183837890625, -1.419158935546875, -1.3675994873046875, -1.3160400390625, -1.2644805908203125, -1.212921142578125, -1.1613616943359375, -1.10980224609375, -1.0582427978515625, -1.006683349609375, -0.9551239013671875, -0.903564453125, -0.8520050048828125, -0.800445556640625, -0.7488861083984375, -0.69732666015625, -0.6457672119140625, -0.594207763671875, -0.5426483154296875, -0.4910888671875, -0.4395294189453125, -0.387969970703125, -0.3364105224609375, -0.28485107421875, -0.2332916259765625, -0.181732177734375, -0.1301727294921875, -0.07861328125, -0.0270538330078125, 0.024505615234375, 0.0760650634765625, 0.12762451171875, 0.1791839599609375, 0.230743408203125, 0.2823028564453125, 0.3338623046875, 0.3854217529296875, 0.436981201171875, 0.4885406494140625, 0.54010009765625, 0.5916595458984375, 0.643218994140625, 0.6947784423828125, 0.746337890625, 0.7978973388671875, 0.849456787109375, 0.9010162353515625, 0.95257568359375, 1.0041351318359375, 1.055694580078125, 1.1072540283203125, 1.1588134765625, 1.2103729248046875, 1.261932373046875, 1.3134918212890625, 1.36505126953125, 1.4166107177734375, 1.468170166015625, 1.5197296142578125, 1.5712890625]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 8.0, 12.0, 7.0, 21.0, 28.0, 43.0, 56.0, 105.0, 146.0, 258.0, 531.0, 1161.0, 3346.0, 16727.0, 990903.0, 28080.0, 4318.0, 1369.0, 655.0, 305.0, 165.0, 102.0, 48.0, 38.0, 26.0, 14.0, 16.0, 13.0, 8.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.407958984375, -0.39544677734375, -0.3829345703125, -0.37042236328125, -0.35791015625, -0.34539794921875, -0.3328857421875, -0.32037353515625, -0.307861328125, -0.29534912109375, -0.2828369140625, -0.27032470703125, -0.2578125, -0.24530029296875, -0.2327880859375, -0.22027587890625, -0.207763671875, -0.19525146484375, -0.1827392578125, -0.17022705078125, -0.15771484375, -0.14520263671875, -0.1326904296875, -0.12017822265625, -0.107666015625, -0.09515380859375, -0.0826416015625, -0.07012939453125, -0.0576171875, -0.04510498046875, -0.0325927734375, -0.02008056640625, -0.007568359375, 0.00494384765625, 0.0174560546875, 0.02996826171875, 0.04248046875, 0.05499267578125, 0.0675048828125, 0.08001708984375, 0.092529296875, 0.10504150390625, 0.1175537109375, 0.13006591796875, 0.142578125, 0.15509033203125, 0.1676025390625, 0.18011474609375, 0.192626953125, 0.20513916015625, 0.2176513671875, 0.23016357421875, 0.24267578125, 0.25518798828125, 0.2677001953125, 0.28021240234375, 0.292724609375, 0.30523681640625, 0.3177490234375, 0.33026123046875, 0.3427734375, 0.35528564453125, 0.3677978515625, 0.38031005859375, 0.392822265625]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 6.0, 6.0, 8.0, 10.0, 10.0, 6.0, 10.0, 17.0, 18.0, 23.0, 18.0, 35.0, 40.0, 38.0, 41.0, 37.0, 43.0, 43.0, 68.0, 57.0, 48.0, 41.0, 48.0, 48.0, 37.0, 30.0, 22.0, 28.0, 23.0, 18.0, 22.0, 16.0, 17.0, 9.0, 9.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2411346435546875e-05, -2.1647661924362183e-05, -2.088397741317749e-05, -2.0120292901992798e-05, -1.9356608390808105e-05, -1.8592923879623413e-05, -1.782923936843872e-05, -1.706555485725403e-05, -1.6301870346069336e-05, -1.5538185834884644e-05, -1.4774501323699951e-05, -1.4010816812515259e-05, -1.3247132301330566e-05, -1.2483447790145874e-05, -1.1719763278961182e-05, -1.095607876777649e-05, -1.0192394256591797e-05, -9.428709745407104e-06, -8.665025234222412e-06, -7.90134072303772e-06, -7.137656211853027e-06, -6.373971700668335e-06, -5.610287189483643e-06, -4.84660267829895e-06, -4.082918167114258e-06, -3.3192336559295654e-06, -2.555549144744873e-06, -1.7918646335601807e-06, -1.0281801223754883e-06, -2.644956111907959e-07, 4.991888999938965e-07, 1.2628734111785889e-06, 2.0265579223632812e-06, 2.7902424335479736e-06, 3.553926944732666e-06, 4.317611455917358e-06, 5.081295967102051e-06, 5.844980478286743e-06, 6.6086649894714355e-06, 7.372349500656128e-06, 8.13603401184082e-06, 8.899718523025513e-06, 9.663403034210205e-06, 1.0427087545394897e-05, 1.119077205657959e-05, 1.1954456567764282e-05, 1.2718141078948975e-05, 1.3481825590133667e-05, 1.424551010131836e-05, 1.5009194612503052e-05, 1.5772879123687744e-05, 1.6536563634872437e-05, 1.730024814605713e-05, 1.806393265724182e-05, 1.8827617168426514e-05, 1.9591301679611206e-05, 2.03549861907959e-05, 2.111867070198059e-05, 2.1882355213165283e-05, 2.2646039724349976e-05, 2.3409724235534668e-05, 2.417340874671936e-05, 2.4937093257904053e-05, 2.5700777769088745e-05, 2.6464462280273438e-05]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 9.0, 7.0, 15.0, 26.0, 53.0, 112.0, 234.0, 5616.0, 1033843.0, 8096.0, 261.0, 103.0, 51.0, 31.0, 18.0, 18.0, 13.0, 14.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63916015625, -0.6119918823242188, -0.5848236083984375, -0.5576553344726562, -0.530487060546875, -0.5033187866210938, -0.4761505126953125, -0.44898223876953125, -0.42181396484375, -0.39464569091796875, -0.3674774169921875, -0.34030914306640625, -0.313140869140625, -0.28597259521484375, -0.2588043212890625, -0.23163604736328125, -0.2044677734375, -0.17729949951171875, -0.1501312255859375, -0.12296295166015625, -0.095794677734375, -0.06862640380859375, -0.0414581298828125, -0.01428985595703125, 0.01287841796875, 0.04004669189453125, 0.0672149658203125, 0.09438323974609375, 0.121551513671875, 0.14871978759765625, 0.1758880615234375, 0.20305633544921875, 0.230224609375, 0.25739288330078125, 0.2845611572265625, 0.31172943115234375, 0.338897705078125, 0.36606597900390625, 0.3932342529296875, 0.42040252685546875, 0.44757080078125, 0.47473907470703125, 0.5019073486328125, 0.5290756225585938, 0.556243896484375, 0.5834121704101562, 0.6105804443359375, 0.6377487182617188, 0.6649169921875, 0.6920852661132812, 0.7192535400390625, 0.7464218139648438, 0.773590087890625, 0.8007583618164062, 0.8279266357421875, 0.8550949096679688, 0.88226318359375, 0.9094314575195312, 0.9365997314453125, 0.9637680053710938, 0.990936279296875, 1.0181045532226562, 1.0452728271484375, 1.0724411010742188, 1.099609375]}, "gradients/decoder.roberta.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 10.0, 7.0, 12.0, 8.0, 22.0, 24.0, 35.0, 53.0, 84.0, 154.0, 172.0, 158.0, 86.0, 59.0, 46.0, 18.0, 14.0, 9.0, 8.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.049468994140625, -0.048247337341308594, -0.04702568054199219, -0.04580402374267578, -0.044582366943359375, -0.04336071014404297, -0.04213905334472656, -0.040917396545410156, -0.03969573974609375, -0.038474082946777344, -0.03725242614746094, -0.03603076934814453, -0.034809112548828125, -0.03358745574951172, -0.03236579895019531, -0.031144142150878906, -0.0299224853515625, -0.028700828552246094, -0.027479171752929688, -0.02625751495361328, -0.025035858154296875, -0.02381420135498047, -0.022592544555664062, -0.021370887756347656, -0.02014923095703125, -0.018927574157714844, -0.017705917358398438, -0.01648426055908203, -0.015262603759765625, -0.014040946960449219, -0.012819290161132812, -0.011597633361816406, -0.0103759765625, -0.009154319763183594, -0.007932662963867188, -0.006711006164550781, -0.005489349365234375, -0.004267692565917969, -0.0030460357666015625, -0.0018243789672851562, -0.00060272216796875, 0.0006189346313476562, 0.0018405914306640625, 0.0030622482299804688, 0.004283905029296875, 0.005505561828613281, 0.0067272186279296875, 0.007948875427246094, 0.0091705322265625, 0.010392189025878906, 0.011613845825195312, 0.012835502624511719, 0.014057159423828125, 0.015278816223144531, 0.016500473022460938, 0.017722129821777344, 0.01894378662109375, 0.020165443420410156, 0.021387100219726562, 0.02260875701904297, 0.023830413818359375, 0.02505207061767578, 0.026273727416992188, 0.027495384216308594, 0.028717041015625]}, "gradients/decoder.roberta.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 11.0, 37.0, 88.0, 131.0, 215.0, 203.0, 146.0, 97.0, 43.0, 23.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.748126983642578, -9.485807418823242, -9.223488807678223, -8.961170196533203, -8.698850631713867, -8.436531066894531, -8.174212455749512, -7.911893367767334, -7.649574279785156, -7.3872551918029785, -7.124936103820801, -6.862617015838623, -6.600297927856445, -6.337978839874268, -6.07565975189209, -5.813340663909912, -5.551021575927734, -5.288702487945557, -5.026383399963379, -4.764064311981201, -4.501745223999023, -4.239426136016846, -3.977107048034668, -3.7147879600524902, -3.4524688720703125, -3.1901497840881348, -2.927830696105957, -2.6655116081237793, -2.4031925201416016, -2.140873432159424, -1.878554344177246, -1.6162352561950684, -1.353917121887207, -1.0915980339050293, -0.8292789459228516, -0.5669598579406738, -0.3046407699584961, -0.04232168197631836, 0.21999740600585938, 0.4823164939880371, 0.7446355819702148, 1.0069546699523926, 1.2692737579345703, 1.531592845916748, 1.7939119338989258, 2.0562310218811035, 2.3185501098632812, 2.580869197845459, 2.8431882858276367, 3.1055073738098145, 3.367826461791992, 3.63014554977417, 3.8924646377563477, 4.154783725738525, 4.417102813720703, 4.679421901702881, 4.941740989685059, 5.204060077667236, 5.466379165649414, 5.728698253631592, 5.9910173416137695, 6.253336429595947, 6.515655517578125, 6.777974605560303, 7.0402936935424805]}, "gradients/decoder.roberta.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 7.0, 8.0, 7.0, 6.0, 12.0, 13.0, 13.0, 15.0, 15.0, 18.0, 23.0, 23.0, 27.0, 31.0, 39.0, 34.0, 39.0, 35.0, 39.0, 35.0, 41.0, 39.0, 40.0, 33.0, 41.0, 38.0, 38.0, 31.0, 20.0, 19.0, 18.0, 35.0, 21.0, 15.0, 21.0, 10.0, 14.0, 16.0, 12.0, 9.0, 5.0, 10.0, 3.0, 8.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1320836544036865, -2.057063102722168, -1.982042670249939, -1.90702223777771, -1.8320016860961914, -1.7569812536239624, -1.6819608211517334, -1.6069402694702148, -1.5319198369979858, -1.4568994045257568, -1.3818788528442383, -1.3068584203720093, -1.2318379878997803, -1.1568174362182617, -1.0817970037460327, -1.0067765712738037, -0.9317560195922852, -0.8567355275154114, -0.7817150354385376, -0.7066946029663086, -0.6316741108894348, -0.556653618812561, -0.48163315653800964, -0.40661269426345825, -0.3315922021865845, -0.2565717101097107, -0.1815512478351593, -0.10653077065944672, -0.03151029348373413, 0.04351019859313965, 0.11853066086769104, 0.19355112314224243, 0.2685718536376953, 0.3435923457145691, 0.4186128079891205, 0.4936332702636719, 0.5686537623405457, 0.6436742544174194, 0.7186946868896484, 0.7937151789665222, 0.868735671043396, 0.9437561631202698, 1.0187766551971436, 1.0937970876693726, 1.1688175201416016, 1.2438380718231201, 1.3188585042953491, 1.3938789367675781, 1.4688994884490967, 1.5439199209213257, 1.6189404726028442, 1.6939609050750732, 1.7689814567565918, 1.8440018892288208, 1.9190223217010498, 1.9940428733825684, 2.069063186645508, 2.1440837383270264, 2.219104051589966, 2.2941246032714844, 2.369145154953003, 2.4441657066345215, 2.519186019897461, 2.5942065715789795, 2.669227123260498]}, "gradients/decoder.roberta.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 2.0, 10.0, 8.0, 13.0, 14.0, 19.0, 26.0, 29.0, 32.0, 58.0, 78.0, 84.0, 118.0, 185.0, 274.0, 445.0, 781.0, 1223.0, 2340.0, 4455.0, 9909.0, 22894.0, 59138.0, 177089.0, 418008.0, 225045.0, 74320.0, 28277.0, 11818.0, 5476.0, 2638.0, 1420.0, 813.0, 480.0, 322.0, 193.0, 146.0, 102.0, 68.0, 56.0, 32.0, 32.0, 27.0, 16.0, 10.0, 11.0, 6.0, 8.0, 5.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.486328125, -3.364471435546875, -3.24261474609375, -3.120758056640625, -2.9989013671875, -2.877044677734375, -2.75518798828125, -2.633331298828125, -2.511474609375, -2.389617919921875, -2.26776123046875, -2.145904541015625, -2.0240478515625, -1.902191162109375, -1.78033447265625, -1.658477783203125, -1.53662109375, -1.414764404296875, -1.29290771484375, -1.171051025390625, -1.0491943359375, -0.927337646484375, -0.80548095703125, -0.683624267578125, -0.561767578125, -0.439910888671875, -0.31805419921875, -0.196197509765625, -0.0743408203125, 0.047515869140625, 0.16937255859375, 0.291229248046875, 0.4130859375, 0.534942626953125, 0.65679931640625, 0.778656005859375, 0.9005126953125, 1.022369384765625, 1.14422607421875, 1.266082763671875, 1.387939453125, 1.509796142578125, 1.63165283203125, 1.753509521484375, 1.8753662109375, 1.997222900390625, 2.11907958984375, 2.240936279296875, 2.36279296875, 2.484649658203125, 2.60650634765625, 2.728363037109375, 2.8502197265625, 2.972076416015625, 3.09393310546875, 3.215789794921875, 3.337646484375, 3.459503173828125, 3.58135986328125, 3.703216552734375, 3.8250732421875, 3.946929931640625, 4.06878662109375, 4.190643310546875, 4.3125]}, "gradients/decoder.roberta.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 7.0, 4.0, 13.0, 6.0, 10.0, 13.0, 9.0, 15.0, 12.0, 19.0, 16.0, 27.0, 26.0, 27.0, 39.0, 36.0, 39.0, 39.0, 37.0, 30.0, 51.0, 33.0, 35.0, 42.0, 35.0, 39.0, 48.0, 27.0, 20.0, 25.0, 23.0, 31.0, 23.0, 14.0, 19.0, 15.0, 14.0, 14.0, 11.0, 6.0, 9.0, 9.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.240234375, -2.162322998046875, -2.08441162109375, -2.006500244140625, -1.9285888671875, -1.850677490234375, -1.77276611328125, -1.694854736328125, -1.616943359375, -1.539031982421875, -1.46112060546875, -1.383209228515625, -1.3052978515625, -1.227386474609375, -1.14947509765625, -1.071563720703125, -0.99365234375, -0.915740966796875, -0.83782958984375, -0.759918212890625, -0.6820068359375, -0.604095458984375, -0.52618408203125, -0.448272705078125, -0.370361328125, -0.292449951171875, -0.21453857421875, -0.136627197265625, -0.0587158203125, 0.019195556640625, 0.09710693359375, 0.175018310546875, 0.2529296875, 0.330841064453125, 0.40875244140625, 0.486663818359375, 0.5645751953125, 0.642486572265625, 0.72039794921875, 0.798309326171875, 0.876220703125, 0.954132080078125, 1.03204345703125, 1.109954833984375, 1.1878662109375, 1.265777587890625, 1.34368896484375, 1.421600341796875, 1.49951171875, 1.577423095703125, 1.65533447265625, 1.733245849609375, 1.8111572265625, 1.889068603515625, 1.96697998046875, 2.044891357421875, 2.122802734375, 2.200714111328125, 2.27862548828125, 2.356536865234375, 2.4344482421875, 2.512359619140625, 2.59027099609375, 2.668182373046875, 2.74609375]}, "gradients/decoder.roberta.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 4.0, 10.0, 10.0, 8.0, 19.0, 13.0, 15.0, 16.0, 28.0, 36.0, 39.0, 60.0, 62.0, 92.0, 115.0, 258.0, 2599.0, 1043934.0, 490.0, 210.0, 105.0, 82.0, 59.0, 45.0, 46.0, 32.0, 32.0, 12.0, 16.0, 16.0, 14.0, 19.0, 5.0, 11.0, 4.0, 3.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-90.6875, -88.044921875, -85.40234375, -82.759765625, -80.1171875, -77.474609375, -74.83203125, -72.189453125, -69.546875, -66.904296875, -64.26171875, -61.619140625, -58.9765625, -56.333984375, -53.69140625, -51.048828125, -48.40625, -45.763671875, -43.12109375, -40.478515625, -37.8359375, -35.193359375, -32.55078125, -29.908203125, -27.265625, -24.623046875, -21.98046875, -19.337890625, -16.6953125, -14.052734375, -11.41015625, -8.767578125, -6.125, -3.482421875, -0.83984375, 1.802734375, 4.4453125, 7.087890625, 9.73046875, 12.373046875, 15.015625, 17.658203125, 20.30078125, 22.943359375, 25.5859375, 28.228515625, 30.87109375, 33.513671875, 36.15625, 38.798828125, 41.44140625, 44.083984375, 46.7265625, 49.369140625, 52.01171875, 54.654296875, 57.296875, 59.939453125, 62.58203125, 65.224609375, 67.8671875, 70.509765625, 73.15234375, 75.794921875, 78.4375]}, "gradients/decoder.roberta.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 6.0, 7.0, 7.0, 16.0, 15.0, 17.0, 17.0, 12.0, 28.0, 36.0, 40.0, 42.0, 40.0, 35.0, 51.0, 38.0, 47.0, 53.0, 53.0, 45.0, 42.0, 45.0, 42.0, 35.0, 35.0, 36.0, 31.0, 21.0, 9.0, 17.0, 13.0, 9.0, 14.0, 7.0, 6.0, 7.0, 8.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.75860595703125, -2.6656494140625, -2.57269287109375, -2.479736328125, -2.38677978515625, -2.2938232421875, -2.20086669921875, -2.10791015625, -2.01495361328125, -1.9219970703125, -1.82904052734375, -1.736083984375, -1.64312744140625, -1.5501708984375, -1.45721435546875, -1.3642578125, -1.27130126953125, -1.1783447265625, -1.08538818359375, -0.992431640625, -0.89947509765625, -0.8065185546875, -0.71356201171875, -0.62060546875, -0.52764892578125, -0.4346923828125, -0.34173583984375, -0.248779296875, -0.15582275390625, -0.0628662109375, 0.03009033203125, 0.123046875, 0.21600341796875, 0.3089599609375, 0.40191650390625, 0.494873046875, 0.58782958984375, 0.6807861328125, 0.77374267578125, 0.86669921875, 0.95965576171875, 1.0526123046875, 1.14556884765625, 1.238525390625, 1.33148193359375, 1.4244384765625, 1.51739501953125, 1.6103515625, 1.70330810546875, 1.7962646484375, 1.88922119140625, 1.982177734375, 2.07513427734375, 2.1680908203125, 2.26104736328125, 2.35400390625, 2.44696044921875, 2.5399169921875, 2.63287353515625, 2.725830078125, 2.81878662109375, 2.9117431640625, 3.00469970703125, 3.09765625]}, "gradients/decoder.roberta.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 9.0, 9.0, 12.0, 30.0, 65.0, 110.0, 258.0, 563.0, 1404.0, 7591.0, 296514.0, 723183.0, 15484.0, 2013.0, 674.0, 309.0, 135.0, 73.0, 48.0, 22.0, 15.0, 8.0, 4.0, 3.0, 8.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3046875, -5.12255859375, -4.9404296875, -4.75830078125, -4.576171875, -4.39404296875, -4.2119140625, -4.02978515625, -3.84765625, -3.66552734375, -3.4833984375, -3.30126953125, -3.119140625, -2.93701171875, -2.7548828125, -2.57275390625, -2.390625, -2.20849609375, -2.0263671875, -1.84423828125, -1.662109375, -1.47998046875, -1.2978515625, -1.11572265625, -0.93359375, -0.75146484375, -0.5693359375, -0.38720703125, -0.205078125, -0.02294921875, 0.1591796875, 0.34130859375, 0.5234375, 0.70556640625, 0.8876953125, 1.06982421875, 1.251953125, 1.43408203125, 1.6162109375, 1.79833984375, 1.98046875, 2.16259765625, 2.3447265625, 2.52685546875, 2.708984375, 2.89111328125, 3.0732421875, 3.25537109375, 3.4375, 3.61962890625, 3.8017578125, 3.98388671875, 4.166015625, 4.34814453125, 4.5302734375, 4.71240234375, 4.89453125, 5.07666015625, 5.2587890625, 5.44091796875, 5.623046875, 5.80517578125, 5.9873046875, 6.16943359375, 6.3515625]}, "gradients/decoder.roberta.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 7.0, 7.0, 14.0, 25.0, 40.0, 50.0, 91.0, 150.0, 210.0, 142.0, 90.0, 66.0, 45.0, 32.0, 13.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003094673156738281, -0.0002973601222038269, -0.0002852529287338257, -0.00027314573526382446, -0.00026103854179382324, -0.000248931348323822, -0.0002368241548538208, -0.00022471696138381958, -0.00021260976791381836, -0.00020050257444381714, -0.00018839538097381592, -0.0001762881875038147, -0.00016418099403381348, -0.00015207380056381226, -0.00013996660709381104, -0.00012785941362380981, -0.0001157522201538086, -0.00010364502668380737, -9.153783321380615e-05, -7.943063974380493e-05, -6.732344627380371e-05, -5.521625280380249e-05, -4.310905933380127e-05, -3.100186586380005e-05, -1.8894672393798828e-05, -6.787478923797607e-06, 5.319714546203613e-06, 1.7426908016204834e-05, 2.9534101486206055e-05, 4.1641294956207275e-05, 5.3748488426208496e-05, 6.585568189620972e-05, 7.796287536621094e-05, 9.007006883621216e-05, 0.00010217726230621338, 0.0001142844557762146, 0.00012639164924621582, 0.00013849884271621704, 0.00015060603618621826, 0.00016271322965621948, 0.0001748204231262207, 0.00018692761659622192, 0.00019903481006622314, 0.00021114200353622437, 0.00022324919700622559, 0.0002353563904762268, 0.00024746358394622803, 0.00025957077741622925, 0.00027167797088623047, 0.0002837851643562317, 0.0002958923578262329, 0.00030799955129623413, 0.00032010674476623535, 0.00033221393823623657, 0.0003443211317062378, 0.000356428325176239, 0.00036853551864624023, 0.00038064271211624146, 0.0003927499055862427, 0.0004048570990562439, 0.0004169642925262451, 0.00042907148599624634, 0.00044117867946624756, 0.0004532858729362488, 0.00046539306640625]}, "gradients/decoder.roberta.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 13.0, 19.0, 13.0, 35.0, 48.0, 68.0, 116.0, 498.0, 4458.0, 986961.0, 54523.0, 1323.0, 210.0, 83.0, 63.0, 46.0, 25.0, 13.0, 10.0, 10.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.35498046875, -9.9677734375, -9.58056640625, -9.193359375, -8.80615234375, -8.4189453125, -8.03173828125, -7.64453125, -7.25732421875, -6.8701171875, -6.48291015625, -6.095703125, -5.70849609375, -5.3212890625, -4.93408203125, -4.546875, -4.15966796875, -3.7724609375, -3.38525390625, -2.998046875, -2.61083984375, -2.2236328125, -1.83642578125, -1.44921875, -1.06201171875, -0.6748046875, -0.28759765625, 0.099609375, 0.48681640625, 0.8740234375, 1.26123046875, 1.6484375, 2.03564453125, 2.4228515625, 2.81005859375, 3.197265625, 3.58447265625, 3.9716796875, 4.35888671875, 4.74609375, 5.13330078125, 5.5205078125, 5.90771484375, 6.294921875, 6.68212890625, 7.0693359375, 7.45654296875, 7.84375, 8.23095703125, 8.6181640625, 9.00537109375, 9.392578125, 9.77978515625, 10.1669921875, 10.55419921875, 10.94140625, 11.32861328125, 11.7158203125, 12.10302734375, 12.490234375, 12.87744140625, 13.2646484375, 13.65185546875, 14.0390625]}, "gradients/decoder.roberta.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 6.0, 14.0, 18.0, 21.0, 38.0, 47.0, 44.0, 43.0, 72.0, 105.0, 114.0, 97.0, 91.0, 67.0, 41.0, 42.0, 42.0, 29.0, 12.0, 18.0, 11.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.67529296875, -0.6591148376464844, -0.6429367065429688, -0.6267585754394531, -0.6105804443359375, -0.5944023132324219, -0.5782241821289062, -0.5620460510253906, -0.545867919921875, -0.5296897888183594, -0.5135116577148438, -0.4973335266113281, -0.4811553955078125, -0.4649772644042969, -0.44879913330078125, -0.4326210021972656, -0.41644287109375, -0.4002647399902344, -0.38408660888671875, -0.3679084777832031, -0.3517303466796875, -0.3355522155761719, -0.31937408447265625, -0.3031959533691406, -0.287017822265625, -0.2708396911621094, -0.25466156005859375, -0.23848342895507812, -0.2223052978515625, -0.20612716674804688, -0.18994903564453125, -0.17377090454101562, -0.1575927734375, -0.14141464233398438, -0.12523651123046875, -0.10905838012695312, -0.0928802490234375, -0.07670211791992188, -0.06052398681640625, -0.044345855712890625, -0.028167724609375, -0.011989593505859375, 0.00418853759765625, 0.020366668701171875, 0.0365447998046875, 0.052722930908203125, 0.06890106201171875, 0.08507919311523438, 0.10125732421875, 0.11743545532226562, 0.13361358642578125, 0.14979171752929688, 0.1659698486328125, 0.18214797973632812, 0.19832611083984375, 0.21450424194335938, 0.230682373046875, 0.24686050415039062, 0.26303863525390625, 0.2792167663574219, 0.2953948974609375, 0.3115730285644531, 0.32775115966796875, 0.3439292907714844, 0.360107421875]}, "gradients/decoder.roberta.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 10.0, 10.0, 10.0, 15.0, 21.0, 32.0, 34.0, 38.0, 50.0, 60.0, 84.0, 78.0, 69.0, 82.0, 68.0, 59.0, 65.0, 54.0, 44.0, 24.0, 27.0, 25.0, 12.0, 4.0, 14.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1970772743225098, -2.096527338027954, -1.9959772825241089, -1.8954273462295532, -1.794877290725708, -1.6943273544311523, -1.5937774181365967, -1.4932273626327515, -1.3926773071289062, -1.2921273708343506, -1.1915773153305054, -1.0910273790359497, -0.9904773235321045, -0.8899273872375488, -0.7893773913383484, -0.688827395439148, -0.5882774591445923, -0.48772746324539185, -0.3871774673461914, -0.28662750124931335, -0.18607750535011292, -0.08552753925323486, 0.015022456645965576, 0.11557245254516602, 0.21612244844436646, 0.3166724443435669, 0.41722244024276733, 0.5177724361419678, 0.6183223724365234, 0.7188723683357239, 0.8194223642349243, 0.9199723601341248, 1.0205223560333252, 1.1210722923278809, 1.221622347831726, 1.3221722841262817, 1.422722339630127, 1.5232722759246826, 1.6238222122192383, 1.7243722677230835, 1.8249223232269287, 1.9254722595214844, 2.02602219581604, 2.126572370529175, 2.2271223068237305, 2.327672243118286, 2.428222179412842, 2.5287723541259766, 2.629322052001953, 2.729871988296509, 2.8304219245910645, 2.930972099304199, 3.031522035598755, 3.1320719718933105, 3.232621908187866, 3.333171844482422, 3.4337220191955566, 3.5342719554901123, 3.634821891784668, 3.7353720664978027, 3.8359220027923584, 3.936471939086914, 4.037022113800049, 4.137571811676025, 4.23812198638916]}, "gradients/decoder.roberta.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 6.0, 4.0, 3.0, 12.0, 14.0, 18.0, 17.0, 29.0, 33.0, 29.0, 19.0, 23.0, 30.0, 34.0, 32.0, 33.0, 55.0, 35.0, 34.0, 50.0, 43.0, 36.0, 39.0, 42.0, 27.0, 39.0, 31.0, 43.0, 22.0, 28.0, 21.0, 18.0, 11.0, 8.0, 11.0, 12.0, 8.0, 14.0, 3.0, 7.0, 4.0, 7.0, 1.0, 3.0, 3.0, 2.0], "bins": [-3.770637273788452, -3.6685822010040283, -3.5665273666381836, -3.4644722938537598, -3.362417221069336, -3.260362148284912, -3.1583073139190674, -3.0562522411346436, -2.954197406768799, -2.852142333984375, -2.7500874996185303, -2.6480324268341064, -2.5459773540496826, -2.443922519683838, -2.341867446899414, -2.2398123741149902, -2.1377573013305664, -2.0357022285461426, -1.9336472749710083, -1.831592321395874, -1.7295372486114502, -1.627482295036316, -1.5254273414611816, -1.4233722686767578, -1.3213173151016235, -1.2192623615264893, -1.1172072887420654, -1.0151523351669312, -0.9130973219871521, -0.811042308807373, -0.7089873552322388, -0.6069323420524597, -0.5048770904541016, -0.4028220772743225, -0.30076709389686584, -0.19871211051940918, -0.09665709733963013, 0.005397915840148926, 0.1074528694152832, 0.20950788259506226, 0.3115628957748413, 0.41361790895462036, 0.5156729221343994, 0.6177278757095337, 0.7197828888893127, 0.8218379020690918, 0.9238928556442261, 1.0259478092193604, 1.1280028820037842, 1.2300578355789185, 1.3321129083633423, 1.4341678619384766, 1.5362229347229004, 1.6382778882980347, 1.740332841873169, 1.8423879146575928, 1.944442868232727, 2.0464978218078613, 2.148552894592285, 2.250607967376709, 2.3526628017425537, 2.4547178745269775, 2.5567727088928223, 2.658827781677246, 2.76088285446167]}, "gradients/decoder.roberta.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 13.0, 9.0, 11.0, 11.0, 12.0, 22.0, 29.0, 48.0, 53.0, 66.0, 107.0, 135.0, 198.0, 272.0, 410.0, 569.0, 891.0, 1998.0, 6592.0, 33533.0, 311407.0, 3304257.0, 475388.0, 44721.0, 8084.0, 2335.0, 1029.0, 601.0, 396.0, 286.0, 202.0, 147.0, 132.0, 91.0, 48.0, 51.0, 30.0, 15.0, 27.0, 15.0, 16.0, 5.0, 6.0, 11.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.07421875, -6.863525390625, -6.65283203125, -6.442138671875, -6.2314453125, -6.020751953125, -5.81005859375, -5.599365234375, -5.388671875, -5.177978515625, -4.96728515625, -4.756591796875, -4.5458984375, -4.335205078125, -4.12451171875, -3.913818359375, -3.703125, -3.492431640625, -3.28173828125, -3.071044921875, -2.8603515625, -2.649658203125, -2.43896484375, -2.228271484375, -2.017578125, -1.806884765625, -1.59619140625, -1.385498046875, -1.1748046875, -0.964111328125, -0.75341796875, -0.542724609375, -0.33203125, -0.121337890625, 0.08935546875, 0.300048828125, 0.5107421875, 0.721435546875, 0.93212890625, 1.142822265625, 1.353515625, 1.564208984375, 1.77490234375, 1.985595703125, 2.1962890625, 2.406982421875, 2.61767578125, 2.828369140625, 3.0390625, 3.249755859375, 3.46044921875, 3.671142578125, 3.8818359375, 4.092529296875, 4.30322265625, 4.513916015625, 4.724609375, 4.935302734375, 5.14599609375, 5.356689453125, 5.5673828125, 5.778076171875, 5.98876953125, 6.199462890625, 6.41015625]}, "gradients/decoder.roberta.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 7.0, 11.0, 19.0, 9.0, 20.0, 24.0, 33.0, 30.0, 28.0, 31.0, 37.0, 39.0, 31.0, 40.0, 45.0, 50.0, 38.0, 45.0, 38.0, 44.0, 43.0, 34.0, 36.0, 26.0, 26.0, 30.0, 16.0, 29.0, 16.0, 13.0, 16.0, 13.0, 10.0, 7.0, 13.0, 7.0, 9.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.416015625, -2.347869873046875, -2.27972412109375, -2.211578369140625, -2.1434326171875, -2.075286865234375, -2.00714111328125, -1.938995361328125, -1.870849609375, -1.802703857421875, -1.73455810546875, -1.666412353515625, -1.5982666015625, -1.530120849609375, -1.46197509765625, -1.393829345703125, -1.32568359375, -1.257537841796875, -1.18939208984375, -1.121246337890625, -1.0531005859375, -0.984954833984375, -0.91680908203125, -0.848663330078125, -0.780517578125, -0.712371826171875, -0.64422607421875, -0.576080322265625, -0.5079345703125, -0.439788818359375, -0.37164306640625, -0.303497314453125, -0.2353515625, -0.167205810546875, -0.09906005859375, -0.030914306640625, 0.0372314453125, 0.105377197265625, 0.17352294921875, 0.241668701171875, 0.309814453125, 0.377960205078125, 0.44610595703125, 0.514251708984375, 0.5823974609375, 0.650543212890625, 0.71868896484375, 0.786834716796875, 0.85498046875, 0.923126220703125, 0.99127197265625, 1.059417724609375, 1.1275634765625, 1.195709228515625, 1.26385498046875, 1.332000732421875, 1.400146484375, 1.468292236328125, 1.53643798828125, 1.604583740234375, 1.6727294921875, 1.740875244140625, 1.80902099609375, 1.877166748046875, 1.9453125]}, "gradients/decoder.roberta.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 6.0, 8.0, 9.0, 14.0, 17.0, 28.0, 19.0, 38.0, 40.0, 75.0, 91.0, 155.0, 279.0, 579.0, 2687.0, 49602.0, 4050544.0, 85059.0, 3492.0, 666.0, 292.0, 185.0, 95.0, 70.0, 58.0, 38.0, 35.0, 14.0, 15.0, 14.0, 8.0, 10.0, 10.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-21.890625, -21.23828125, -20.5859375, -19.93359375, -19.28125, -18.62890625, -17.9765625, -17.32421875, -16.671875, -16.01953125, -15.3671875, -14.71484375, -14.0625, -13.41015625, -12.7578125, -12.10546875, -11.453125, -10.80078125, -10.1484375, -9.49609375, -8.84375, -8.19140625, -7.5390625, -6.88671875, -6.234375, -5.58203125, -4.9296875, -4.27734375, -3.625, -2.97265625, -2.3203125, -1.66796875, -1.015625, -0.36328125, 0.2890625, 0.94140625, 1.59375, 2.24609375, 2.8984375, 3.55078125, 4.203125, 4.85546875, 5.5078125, 6.16015625, 6.8125, 7.46484375, 8.1171875, 8.76953125, 9.421875, 10.07421875, 10.7265625, 11.37890625, 12.03125, 12.68359375, 13.3359375, 13.98828125, 14.640625, 15.29296875, 15.9453125, 16.59765625, 17.25, 17.90234375, 18.5546875, 19.20703125, 19.859375]}, "gradients/decoder.roberta.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 6.0, 10.0, 5.0, 8.0, 14.0, 13.0, 16.0, 27.0, 29.0, 48.0, 57.0, 99.0, 118.0, 158.0, 252.0, 361.0, 515.0, 652.0, 479.0, 365.0, 241.0, 156.0, 116.0, 78.0, 57.0, 41.0, 33.0, 27.0, 13.0, 25.0, 5.0, 8.0, 7.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9765625, -0.9410552978515625, -0.905548095703125, -0.8700408935546875, -0.83453369140625, -0.7990264892578125, -0.763519287109375, -0.7280120849609375, -0.6925048828125, -0.6569976806640625, -0.621490478515625, -0.5859832763671875, -0.55047607421875, -0.5149688720703125, -0.479461669921875, -0.4439544677734375, -0.408447265625, -0.3729400634765625, -0.337432861328125, -0.3019256591796875, -0.26641845703125, -0.2309112548828125, -0.195404052734375, -0.1598968505859375, -0.1243896484375, -0.0888824462890625, -0.053375244140625, -0.0178680419921875, 0.01763916015625, 0.0531463623046875, 0.088653564453125, 0.1241607666015625, 0.15966796875, 0.1951751708984375, 0.230682373046875, 0.2661895751953125, 0.30169677734375, 0.3372039794921875, 0.372711181640625, 0.4082183837890625, 0.4437255859375, 0.4792327880859375, 0.514739990234375, 0.5502471923828125, 0.58575439453125, 0.6212615966796875, 0.656768798828125, 0.6922760009765625, 0.727783203125, 0.7632904052734375, 0.798797607421875, 0.8343048095703125, 0.86981201171875, 0.9053192138671875, 0.940826416015625, 0.9763336181640625, 1.0118408203125, 1.0473480224609375, 1.082855224609375, 1.1183624267578125, 1.15386962890625, 1.1893768310546875, 1.224884033203125, 1.2603912353515625, 1.2958984375]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 8.0, 13.0, 16.0, 14.0, 23.0, 34.0, 29.0, 54.0, 52.0, 68.0, 76.0, 72.0, 75.0, 77.0, 87.0, 59.0, 58.0, 45.0, 38.0, 29.0, 19.0, 9.0, 11.0, 6.0, 11.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.862617015838623, -3.7592320442199707, -3.6558470726013184, -3.552462100982666, -3.4490768909454346, -3.3456919193267822, -3.24230694770813, -3.1389219760894775, -3.035536766052246, -2.9321517944335938, -2.8287668228149414, -2.725381851196289, -2.6219966411590576, -2.5186116695404053, -2.415226697921753, -2.3118417263031006, -2.2084567546844482, -2.105071783065796, -2.0016868114471436, -1.8983017206192017, -1.7949166297912598, -1.6915316581726074, -1.588146686553955, -1.4847617149353027, -1.3813766241073608, -1.2779916524887085, -1.1746065616607666, -1.0712215900421143, -0.9678365588188171, -0.86445152759552, -0.7610665559768677, -0.6576815247535706, -0.5542964935302734, -0.4509114623069763, -0.3475264608860016, -0.24414145946502686, -0.14075642824172974, -0.03737139701843262, 0.06601357460021973, 0.16939860582351685, 0.27278363704681396, 0.3761686682701111, 0.4795536696910858, 0.5829386711120605, 0.6863237023353577, 0.7897087335586548, 0.8930937051773071, 0.9964787364006042, 1.0998637676239014, 1.2032487392425537, 1.3066338300704956, 1.410018801689148, 1.5134038925170898, 1.6167888641357422, 1.7201738357543945, 1.8235588073730469, 1.9269438982009888, 2.0303289890289307, 2.133713960647583, 2.2370989322662354, 2.3404839038848877, 2.443869113922119, 2.5472540855407715, 2.650639057159424, 2.754024028778076]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 17.0, 11.0, 14.0, 18.0, 25.0, 25.0, 24.0, 29.0, 24.0, 27.0, 41.0, 39.0, 37.0, 35.0, 44.0, 51.0, 43.0, 45.0, 46.0, 34.0, 33.0, 31.0, 41.0, 34.0, 40.0, 21.0, 12.0, 31.0, 18.0, 8.0, 11.0, 12.0, 14.0, 9.0, 5.0, 9.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.600794553756714, -2.519680976867676, -2.4385673999786377, -2.3574538230895996, -2.2763402462005615, -2.1952266693115234, -2.1141130924224854, -2.0329995155334473, -1.9518860578536987, -1.8707724809646606, -1.7896589040756226, -1.7085453271865845, -1.627431869506836, -1.5463182926177979, -1.4652047157287598, -1.3840911388397217, -1.3029775619506836, -1.2218639850616455, -1.1407504081726074, -1.0596368312835693, -0.978523313999176, -0.8974097371101379, -0.8162962198257446, -0.7351826429367065, -0.6540690660476685, -0.5729554891586304, -0.4918419420719147, -0.410728394985199, -0.3296148180961609, -0.2485012412071228, -0.1673876941204071, -0.0862741470336914, -0.00516057014465332, 0.07595299184322357, 0.15706655383110046, 0.23818011581897736, 0.31929367780685425, 0.40040725469589233, 0.48152080178260803, 0.5626343488693237, 0.6437479257583618, 0.7248615026473999, 0.805975079536438, 0.8870885968208313, 0.9682021737098694, 1.0493156909942627, 1.1304292678833008, 1.2115428447723389, 1.292656421661377, 1.373769998550415, 1.4548835754394531, 1.5359971523284912, 1.6171107292175293, 1.6982243061065674, 1.779337763786316, 1.860451340675354, 1.941564917564392, 2.0226783752441406, 2.1037919521331787, 2.184905529022217, 2.266019105911255, 2.347132682800293, 2.428246259689331, 2.509359836578369, 2.5904734134674072]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 4.0, 9.0, 14.0, 15.0, 28.0, 29.0, 42.0, 59.0, 90.0, 131.0, 161.0, 286.0, 334.0, 518.0, 770.0, 1183.0, 1715.0, 2627.0, 4142.0, 6469.0, 10592.0, 17886.0, 31506.0, 58711.0, 116233.0, 226118.0, 258675.0, 144965.0, 72304.0, 38024.0, 21241.0, 12509.0, 7434.0, 4706.0, 2975.0, 1881.0, 1360.0, 838.0, 617.0, 407.0, 292.0, 190.0, 134.0, 85.0, 70.0, 50.0, 28.0, 36.0, 23.0, 16.0, 6.0, 9.0, 3.0, 3.0, 0.0, 4.0, 3.0], "bins": [-0.53955078125, -0.5232772827148438, -0.5070037841796875, -0.49073028564453125, -0.474456787109375, -0.45818328857421875, -0.4419097900390625, -0.42563629150390625, -0.40936279296875, -0.39308929443359375, -0.3768157958984375, -0.36054229736328125, -0.344268798828125, -0.32799530029296875, -0.3117218017578125, -0.29544830322265625, -0.2791748046875, -0.26290130615234375, -0.2466278076171875, -0.23035430908203125, -0.214080810546875, -0.19780731201171875, -0.1815338134765625, -0.16526031494140625, -0.14898681640625, -0.13271331787109375, -0.1164398193359375, -0.10016632080078125, -0.083892822265625, -0.06761932373046875, -0.0513458251953125, -0.03507232666015625, -0.018798828125, -0.00252532958984375, 0.0137481689453125, 0.03002166748046875, 0.046295166015625, 0.06256866455078125, 0.0788421630859375, 0.09511566162109375, 0.11138916015625, 0.12766265869140625, 0.1439361572265625, 0.16020965576171875, 0.176483154296875, 0.19275665283203125, 0.2090301513671875, 0.22530364990234375, 0.2415771484375, 0.25785064697265625, 0.2741241455078125, 0.29039764404296875, 0.306671142578125, 0.32294464111328125, 0.3392181396484375, 0.35549163818359375, 0.37176513671875, 0.38803863525390625, 0.4043121337890625, 0.42058563232421875, 0.436859130859375, 0.45313262939453125, 0.4694061279296875, 0.48567962646484375, 0.501953125]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 15.0, 9.0, 15.0, 20.0, 23.0, 24.0, 24.0, 29.0, 26.0, 28.0, 39.0, 40.0, 35.0, 31.0, 46.0, 50.0, 41.0, 48.0, 40.0, 39.0, 32.0, 32.0, 38.0, 39.0, 35.0, 27.0, 13.0, 28.0, 16.0, 11.0, 11.0, 13.0, 12.0, 10.0, 7.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.486328125, -2.40789794921875, -2.3294677734375, -2.25103759765625, -2.172607421875, -2.09417724609375, -2.0157470703125, -1.93731689453125, -1.85888671875, -1.78045654296875, -1.7020263671875, -1.62359619140625, -1.545166015625, -1.46673583984375, -1.3883056640625, -1.30987548828125, -1.2314453125, -1.15301513671875, -1.0745849609375, -0.99615478515625, -0.917724609375, -0.83929443359375, -0.7608642578125, -0.68243408203125, -0.60400390625, -0.52557373046875, -0.4471435546875, -0.36871337890625, -0.290283203125, -0.21185302734375, -0.1334228515625, -0.05499267578125, 0.0234375, 0.10186767578125, 0.1802978515625, 0.25872802734375, 0.337158203125, 0.41558837890625, 0.4940185546875, 0.57244873046875, 0.65087890625, 0.72930908203125, 0.8077392578125, 0.88616943359375, 0.964599609375, 1.04302978515625, 1.1214599609375, 1.19989013671875, 1.2783203125, 1.35675048828125, 1.4351806640625, 1.51361083984375, 1.592041015625, 1.67047119140625, 1.7489013671875, 1.82733154296875, 1.90576171875, 1.98419189453125, 2.0626220703125, 2.14105224609375, 2.219482421875, 2.29791259765625, 2.3763427734375, 2.45477294921875, 2.533203125]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 8.0, 1.0, 2.0, 3.0, 4.0, 10.0, 11.0, 12.0, 16.0, 22.0, 23.0, 23.0, 33.0, 66.0, 62.0, 70.0, 134.0, 149.0, 203.0, 283.0, 420.0, 621.0, 968.0, 1536.0, 2838.0, 6031.0, 16432.0, 68776.0, 905117.0, 26688.0, 8818.0, 3666.0, 1962.0, 1130.0, 689.0, 438.0, 334.0, 221.0, 180.0, 124.0, 87.0, 69.0, 58.0, 42.0, 47.0, 30.0, 21.0, 16.0, 17.0, 14.0, 7.0, 5.0, 7.0, 7.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.5205078125, -1.471771240234375, -1.42303466796875, -1.374298095703125, -1.3255615234375, -1.276824951171875, -1.22808837890625, -1.179351806640625, -1.130615234375, -1.081878662109375, -1.03314208984375, -0.984405517578125, -0.9356689453125, -0.886932373046875, -0.83819580078125, -0.789459228515625, -0.74072265625, -0.691986083984375, -0.64324951171875, -0.594512939453125, -0.5457763671875, -0.497039794921875, -0.44830322265625, -0.399566650390625, -0.350830078125, -0.302093505859375, -0.25335693359375, -0.204620361328125, -0.1558837890625, -0.107147216796875, -0.05841064453125, -0.009674072265625, 0.0390625, 0.087799072265625, 0.13653564453125, 0.185272216796875, 0.2340087890625, 0.282745361328125, 0.33148193359375, 0.380218505859375, 0.428955078125, 0.477691650390625, 0.52642822265625, 0.575164794921875, 0.6239013671875, 0.672637939453125, 0.72137451171875, 0.770111083984375, 0.81884765625, 0.867584228515625, 0.91632080078125, 0.965057373046875, 1.0137939453125, 1.062530517578125, 1.11126708984375, 1.160003662109375, 1.208740234375, 1.257476806640625, 1.30621337890625, 1.354949951171875, 1.4036865234375, 1.452423095703125, 1.50115966796875, 1.549896240234375, 1.5986328125]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 10.0, 8.0, 13.0, 11.0, 18.0, 16.0, 13.0, 14.0, 17.0, 16.0, 27.0, 28.0, 28.0, 41.0, 26.0, 30.0, 28.0, 39.0, 34.0, 38.0, 37.0, 37.0, 39.0, 37.0, 41.0, 33.0, 53.0, 33.0, 28.0, 25.0, 28.0, 21.0, 27.0, 14.0, 9.0, 14.0, 11.0, 8.0, 9.0, 8.0, 4.0, 12.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.4921875, -1.4439544677734375, -1.395721435546875, -1.3474884033203125, -1.29925537109375, -1.2510223388671875, -1.202789306640625, -1.1545562744140625, -1.1063232421875, -1.0580902099609375, -1.009857177734375, -0.9616241455078125, -0.91339111328125, -0.8651580810546875, -0.816925048828125, -0.7686920166015625, -0.720458984375, -0.6722259521484375, -0.623992919921875, -0.5757598876953125, -0.52752685546875, -0.4792938232421875, -0.431060791015625, -0.3828277587890625, -0.3345947265625, -0.2863616943359375, -0.238128662109375, -0.1898956298828125, -0.14166259765625, -0.0934295654296875, -0.045196533203125, 0.0030364990234375, 0.05126953125, 0.0995025634765625, 0.147735595703125, 0.1959686279296875, 0.24420166015625, 0.2924346923828125, 0.340667724609375, 0.3889007568359375, 0.4371337890625, 0.4853668212890625, 0.533599853515625, 0.5818328857421875, 0.63006591796875, 0.6782989501953125, 0.726531982421875, 0.7747650146484375, 0.822998046875, 0.8712310791015625, 0.919464111328125, 0.9676971435546875, 1.01593017578125, 1.0641632080078125, 1.112396240234375, 1.1606292724609375, 1.2088623046875, 1.2570953369140625, 1.305328369140625, 1.3535614013671875, 1.40179443359375, 1.4500274658203125, 1.498260498046875, 1.5464935302734375, 1.5947265625]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 2.0, 5.0, 13.0, 26.0, 26.0, 32.0, 28.0, 33.0, 63.0, 90.0, 134.0, 178.0, 271.0, 376.0, 570.0, 1045.0, 1702.0, 3420.0, 8199.0, 26403.0, 928681.0, 53482.0, 12964.0, 5024.0, 2338.0, 1188.0, 757.0, 457.0, 279.0, 235.0, 152.0, 96.0, 74.0, 53.0, 41.0, 35.0, 25.0, 14.0, 11.0, 14.0, 9.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1640625, -0.1591968536376953, -0.15433120727539062, -0.14946556091308594, -0.14459991455078125, -0.13973426818847656, -0.13486862182617188, -0.1300029754638672, -0.1251373291015625, -0.12027168273925781, -0.11540603637695312, -0.11054039001464844, -0.10567474365234375, -0.10080909729003906, -0.09594345092773438, -0.09107780456542969, -0.086212158203125, -0.08134651184082031, -0.07648086547851562, -0.07161521911621094, -0.06674957275390625, -0.06188392639160156, -0.057018280029296875, -0.05215263366699219, -0.0472869873046875, -0.04242134094238281, -0.037555694580078125, -0.03269004821777344, -0.02782440185546875, -0.022958755493164062, -0.018093109130859375, -0.013227462768554688, -0.00836181640625, -0.0034961700439453125, 0.001369476318359375, 0.0062351226806640625, 0.01110076904296875, 0.015966415405273438, 0.020832061767578125, 0.025697708129882812, 0.0305633544921875, 0.03542900085449219, 0.040294647216796875, 0.04516029357910156, 0.05002593994140625, 0.05489158630371094, 0.059757232666015625, 0.06462287902832031, 0.069488525390625, 0.07435417175292969, 0.07921981811523438, 0.08408546447753906, 0.08895111083984375, 0.09381675720214844, 0.09868240356445312, 0.10354804992675781, 0.1084136962890625, 0.11327934265136719, 0.11814498901367188, 0.12301063537597656, 0.12787628173828125, 0.13274192810058594, 0.13760757446289062, 0.1424732208251953, 0.1473388671875]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 2.0, 10.0, 9.0, 2.0, 13.0, 14.0, 15.0, 14.0, 23.0, 32.0, 26.0, 36.0, 32.0, 32.0, 41.0, 40.0, 33.0, 44.0, 56.0, 59.0, 61.0, 49.0, 45.0, 30.0, 37.0, 33.0, 26.0, 24.0, 29.0, 28.0, 19.0, 17.0, 13.0, 11.0, 9.0, 9.0, 10.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5451183319091797e-05, -2.4660490453243256e-05, -2.3869797587394714e-05, -2.3079104721546173e-05, -2.2288411855697632e-05, -2.149771898984909e-05, -2.070702612400055e-05, -1.9916333258152008e-05, -1.9125640392303467e-05, -1.8334947526454926e-05, -1.7544254660606384e-05, -1.6753561794757843e-05, -1.5962868928909302e-05, -1.517217606306076e-05, -1.438148319721222e-05, -1.3590790331363678e-05, -1.2800097465515137e-05, -1.2009404599666595e-05, -1.1218711733818054e-05, -1.0428018867969513e-05, -9.637326002120972e-06, -8.84663313627243e-06, -8.05594027042389e-06, -7.265247404575348e-06, -6.474554538726807e-06, -5.683861672878265e-06, -4.893168807029724e-06, -4.102475941181183e-06, -3.3117830753326416e-06, -2.5210902094841003e-06, -1.730397343635559e-06, -9.397044777870178e-07, -1.4901161193847656e-07, 6.416812539100647e-07, 1.432374119758606e-06, 2.2230669856071472e-06, 3.0137598514556885e-06, 3.8044527173042297e-06, 4.595145583152771e-06, 5.385838449001312e-06, 6.1765313148498535e-06, 6.967224180698395e-06, 7.757917046546936e-06, 8.548609912395477e-06, 9.339302778244019e-06, 1.012999564409256e-05, 1.0920688509941101e-05, 1.1711381375789642e-05, 1.2502074241638184e-05, 1.3292767107486725e-05, 1.4083459973335266e-05, 1.4874152839183807e-05, 1.566484570503235e-05, 1.645553857088089e-05, 1.724623143672943e-05, 1.8036924302577972e-05, 1.8827617168426514e-05, 1.9618310034275055e-05, 2.0409002900123596e-05, 2.1199695765972137e-05, 2.199038863182068e-05, 2.278108149766922e-05, 2.357177436351776e-05, 2.4362467229366302e-05, 2.5153160095214844e-05]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 2.0, 9.0, 6.0, 5.0, 14.0, 23.0, 14.0, 29.0, 39.0, 45.0, 79.0, 111.0, 331.0, 2025.0, 62131.0, 936565.0, 44920.0, 1633.0, 243.0, 104.0, 49.0, 52.0, 24.0, 20.0, 14.0, 11.0, 8.0, 12.0, 3.0, 1.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32666015625, -0.3151817321777344, -0.30370330810546875, -0.2922248840332031, -0.2807464599609375, -0.2692680358886719, -0.25778961181640625, -0.24631118774414062, -0.234832763671875, -0.22335433959960938, -0.21187591552734375, -0.20039749145507812, -0.1889190673828125, -0.17744064331054688, -0.16596221923828125, -0.15448379516601562, -0.14300537109375, -0.13152694702148438, -0.12004852294921875, -0.10857009887695312, -0.0970916748046875, -0.08561325073242188, -0.07413482666015625, -0.06265640258789062, -0.051177978515625, -0.039699554443359375, -0.02822113037109375, -0.016742706298828125, -0.0052642822265625, 0.006214141845703125, 0.01769256591796875, 0.029170989990234375, 0.0406494140625, 0.052127838134765625, 0.06360626220703125, 0.07508468627929688, 0.0865631103515625, 0.09804153442382812, 0.10951995849609375, 0.12099838256835938, 0.132476806640625, 0.14395523071289062, 0.15543365478515625, 0.16691207885742188, 0.1783905029296875, 0.18986892700195312, 0.20134735107421875, 0.21282577514648438, 0.22430419921875, 0.23578262329101562, 0.24726104736328125, 0.2587394714355469, 0.2702178955078125, 0.2816963195800781, 0.29317474365234375, 0.3046531677246094, 0.316131591796875, 0.3276100158691406, 0.33908843994140625, 0.3505668640136719, 0.3620452880859375, 0.3735237121582031, 0.38500213623046875, 0.3964805603027344, 0.407958984375]}, "gradients/decoder.roberta.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 3.0, 6.0, 6.0, 10.0, 9.0, 9.0, 17.0, 15.0, 23.0, 23.0, 24.0, 41.0, 55.0, 61.0, 89.0, 115.0, 101.0, 78.0, 49.0, 50.0, 38.0, 31.0, 27.0, 17.0, 21.0, 17.0, 9.0, 10.0, 8.0, 8.0, 3.0, 4.0, 8.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.020751953125, -0.02016758918762207, -0.01958322525024414, -0.01899886131286621, -0.01841449737548828, -0.01783013343811035, -0.017245769500732422, -0.016661405563354492, -0.016077041625976562, -0.015492677688598633, -0.014908313751220703, -0.014323949813842773, -0.013739585876464844, -0.013155221939086914, -0.012570858001708984, -0.011986494064331055, -0.011402130126953125, -0.010817766189575195, -0.010233402252197266, -0.009649038314819336, -0.009064674377441406, -0.008480310440063477, -0.007895946502685547, -0.007311582565307617, -0.0067272186279296875, -0.006142854690551758, -0.005558490753173828, -0.0049741268157958984, -0.004389762878417969, -0.003805398941040039, -0.0032210350036621094, -0.0026366710662841797, -0.00205230712890625, -0.0014679431915283203, -0.0008835792541503906, -0.00029921531677246094, 0.00028514862060546875, 0.0008695125579833984, 0.0014538764953613281, 0.002038240432739258, 0.0026226043701171875, 0.003206968307495117, 0.003791332244873047, 0.0043756961822509766, 0.004960060119628906, 0.005544424057006836, 0.006128787994384766, 0.006713151931762695, 0.007297515869140625, 0.007881879806518555, 0.008466243743896484, 0.009050607681274414, 0.009634971618652344, 0.010219335556030273, 0.010803699493408203, 0.011388063430786133, 0.011972427368164062, 0.012556791305541992, 0.013141155242919922, 0.013725519180297852, 0.014309883117675781, 0.014894247055053711, 0.01547861099243164, 0.01606297492980957, 0.0166473388671875]}, "gradients/decoder.roberta.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 16.0, 17.0, 31.0, 34.0, 48.0, 47.0, 70.0, 100.0, 70.0, 93.0, 89.0, 86.0, 76.0, 59.0, 42.0, 33.0, 27.0, 12.0, 13.0, 7.0, 6.0, 8.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.446108818054199, -4.327529430389404, -4.208950042724609, -4.090371131896973, -3.9717915058135986, -3.853212356567383, -3.734632968902588, -3.616053581237793, -3.497474193572998, -3.378894805908203, -3.2603156566619873, -3.1417362689971924, -3.0231568813323975, -2.9045777320861816, -2.7859983444213867, -2.667418956756592, -2.548839807510376, -2.430260419845581, -2.3116812705993652, -2.1931018829345703, -2.0745224952697754, -1.95594322681427, -1.8373639583587646, -1.7187845706939697, -1.6002053022384644, -1.481626033782959, -1.363046646118164, -1.2444673776626587, -1.1258881092071533, -1.0073087215423584, -0.888729453086853, -0.7701501250267029, -0.6515707969665527, -0.5329914689064026, -0.41441217064857483, -0.29583287239074707, -0.17725354433059692, -0.05867421627044678, 0.059905052185058594, 0.17848438024520874, 0.2970637083053589, 0.41564303636550903, 0.5342223644256592, 0.6528016328811646, 0.7713809609413147, 0.8899602890014648, 1.0085395574569702, 1.1271188259124756, 1.2456982135772705, 1.3642774820327759, 1.4828568696975708, 1.6014361381530762, 1.720015525817871, 1.8385947942733765, 1.9571740627288818, 2.0757534503936768, 2.1943325996398926, 2.3129119873046875, 2.4314911365509033, 2.5500705242156982, 2.668649911880493, 2.787229061126709, 2.905808448791504, 3.024387836456299, 3.1429672241210938]}, "gradients/decoder.roberta.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 10.0, 15.0, 10.0, 14.0, 19.0, 24.0, 24.0, 27.0, 27.0, 25.0, 28.0, 39.0, 39.0, 33.0, 34.0, 45.0, 51.0, 41.0, 48.0, 41.0, 38.0, 31.0, 31.0, 40.0, 39.0, 36.0, 25.0, 13.0, 28.0, 17.0, 11.0, 10.0, 13.0, 13.0, 10.0, 7.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.486125946044922, -2.4077281951904297, -2.3293304443359375, -2.250932455062866, -2.172534704208374, -2.094136953353882, -2.0157389640808105, -1.9373412132263184, -1.8589434623718262, -1.780545711517334, -1.7021478414535522, -1.6237499713897705, -1.5453522205352783, -1.4669544696807861, -1.3885565996170044, -1.3101587295532227, -1.2317609786987305, -1.1533632278442383, -1.0749653577804565, -0.9965675473213196, -0.9181697368621826, -0.8397719264030457, -0.7613741159439087, -0.6829763054847717, -0.6045784950256348, -0.5261806845664978, -0.44778287410736084, -0.3693850636482239, -0.2909872531890869, -0.21258944272994995, -0.134191632270813, -0.055793821811676025, 0.02260422706604004, 0.101002037525177, 0.17939984798431396, 0.2577976584434509, 0.3361954689025879, 0.41459327936172485, 0.4929910898208618, 0.5713889002799988, 0.6497867107391357, 0.7281845211982727, 0.8065823316574097, 0.8849801421165466, 0.9633779525756836, 1.0417757034301758, 1.1201735734939575, 1.1985714435577393, 1.2769691944122314, 1.3553669452667236, 1.4337648153305054, 1.512162685394287, 1.5905604362487793, 1.6689581871032715, 1.7473560571670532, 1.825753927230835, 1.9041516780853271, 1.9825494289398193, 2.0609474182128906, 2.139345169067383, 2.217742919921875, 2.296140670776367, 2.3745384216308594, 2.4529364109039307, 2.531334161758423]}, "gradients/decoder.roberta.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 4.0, 4.0, 8.0, 8.0, 22.0, 19.0, 26.0, 46.0, 48.0, 90.0, 118.0, 173.0, 278.0, 437.0, 710.0, 1239.0, 2122.0, 4022.0, 7769.0, 15728.0, 32098.0, 67076.0, 134591.0, 231988.0, 247251.0, 152123.0, 76396.0, 36676.0, 17910.0, 9057.0, 4540.0, 2444.0, 1341.0, 783.0, 468.0, 302.0, 185.0, 141.0, 106.0, 58.0, 40.0, 32.0, 32.0, 15.0, 12.0, 6.0, 3.0, 7.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.835479736328125, -2.74713134765625, -2.658782958984375, -2.5704345703125, -2.482086181640625, -2.39373779296875, -2.305389404296875, -2.217041015625, -2.128692626953125, -2.04034423828125, -1.951995849609375, -1.8636474609375, -1.775299072265625, -1.68695068359375, -1.598602294921875, -1.51025390625, -1.421905517578125, -1.33355712890625, -1.245208740234375, -1.1568603515625, -1.068511962890625, -0.98016357421875, -0.891815185546875, -0.803466796875, -0.715118408203125, -0.62677001953125, -0.538421630859375, -0.4500732421875, -0.361724853515625, -0.27337646484375, -0.185028076171875, -0.0966796875, -0.008331298828125, 0.08001708984375, 0.168365478515625, 0.2567138671875, 0.345062255859375, 0.43341064453125, 0.521759033203125, 0.610107421875, 0.698455810546875, 0.78680419921875, 0.875152587890625, 0.9635009765625, 1.051849365234375, 1.14019775390625, 1.228546142578125, 1.31689453125, 1.405242919921875, 1.49359130859375, 1.581939697265625, 1.6702880859375, 1.758636474609375, 1.84698486328125, 1.935333251953125, 2.023681640625, 2.112030029296875, 2.20037841796875, 2.288726806640625, 2.3770751953125, 2.465423583984375, 2.55377197265625, 2.642120361328125, 2.73046875]}, "gradients/decoder.roberta.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 11.0, 8.0, 11.0, 17.0, 15.0, 20.0, 22.0, 29.0, 23.0, 22.0, 36.0, 34.0, 39.0, 30.0, 44.0, 34.0, 60.0, 47.0, 48.0, 36.0, 42.0, 34.0, 39.0, 39.0, 33.0, 35.0, 34.0, 18.0, 22.0, 19.0, 11.0, 11.0, 15.0, 12.0, 7.0, 9.0, 8.0, 7.0, 2.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.775390625, -2.68597412109375, -2.5965576171875, -2.50714111328125, -2.417724609375, -2.32830810546875, -2.2388916015625, -2.14947509765625, -2.06005859375, -1.97064208984375, -1.8812255859375, -1.79180908203125, -1.702392578125, -1.61297607421875, -1.5235595703125, -1.43414306640625, -1.3447265625, -1.25531005859375, -1.1658935546875, -1.07647705078125, -0.987060546875, -0.89764404296875, -0.8082275390625, -0.71881103515625, -0.62939453125, -0.53997802734375, -0.4505615234375, -0.36114501953125, -0.271728515625, -0.18231201171875, -0.0928955078125, -0.00347900390625, 0.0859375, 0.17535400390625, 0.2647705078125, 0.35418701171875, 0.443603515625, 0.53302001953125, 0.6224365234375, 0.71185302734375, 0.80126953125, 0.89068603515625, 0.9801025390625, 1.06951904296875, 1.158935546875, 1.24835205078125, 1.3377685546875, 1.42718505859375, 1.5166015625, 1.60601806640625, 1.6954345703125, 1.78485107421875, 1.874267578125, 1.96368408203125, 2.0531005859375, 2.14251708984375, 2.23193359375, 2.32135009765625, 2.4107666015625, 2.50018310546875, 2.589599609375, 2.67901611328125, 2.7684326171875, 2.85784912109375, 2.947265625]}, "gradients/decoder.roberta.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 14.0, 7.0, 8.0, 7.0, 7.0, 15.0, 19.0, 30.0, 23.0, 23.0, 36.0, 42.0, 65.0, 80.0, 120.0, 255.0, 956.0, 1045376.0, 737.0, 200.0, 119.0, 74.0, 55.0, 42.0, 26.0, 31.0, 24.0, 27.0, 24.0, 17.0, 15.0, 15.0, 12.0, 13.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-90.3125, -87.833984375, -85.35546875, -82.876953125, -80.3984375, -77.919921875, -75.44140625, -72.962890625, -70.484375, -68.005859375, -65.52734375, -63.048828125, -60.5703125, -58.091796875, -55.61328125, -53.134765625, -50.65625, -48.177734375, -45.69921875, -43.220703125, -40.7421875, -38.263671875, -35.78515625, -33.306640625, -30.828125, -28.349609375, -25.87109375, -23.392578125, -20.9140625, -18.435546875, -15.95703125, -13.478515625, -11.0, -8.521484375, -6.04296875, -3.564453125, -1.0859375, 1.392578125, 3.87109375, 6.349609375, 8.828125, 11.306640625, 13.78515625, 16.263671875, 18.7421875, 21.220703125, 23.69921875, 26.177734375, 28.65625, 31.134765625, 33.61328125, 36.091796875, 38.5703125, 41.048828125, 43.52734375, 46.005859375, 48.484375, 50.962890625, 53.44140625, 55.919921875, 58.3984375, 60.876953125, 63.35546875, 65.833984375, 68.3125]}, "gradients/decoder.roberta.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 11.0, 9.0, 12.0, 15.0, 18.0, 14.0, 22.0, 30.0, 25.0, 20.0, 29.0, 38.0, 37.0, 48.0, 48.0, 36.0, 44.0, 58.0, 37.0, 30.0, 56.0, 47.0, 48.0, 43.0, 38.0, 21.0, 30.0, 23.0, 26.0, 13.0, 10.0, 7.0, 7.0, 8.0, 9.0, 9.0, 10.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.533203125, -2.44549560546875, -2.3577880859375, -2.27008056640625, -2.182373046875, -2.09466552734375, -2.0069580078125, -1.91925048828125, -1.83154296875, -1.74383544921875, -1.6561279296875, -1.56842041015625, -1.480712890625, -1.39300537109375, -1.3052978515625, -1.21759033203125, -1.1298828125, -1.04217529296875, -0.9544677734375, -0.86676025390625, -0.779052734375, -0.69134521484375, -0.6036376953125, -0.51593017578125, -0.42822265625, -0.34051513671875, -0.2528076171875, -0.16510009765625, -0.077392578125, 0.01031494140625, 0.0980224609375, 0.18572998046875, 0.2734375, 0.36114501953125, 0.4488525390625, 0.53656005859375, 0.624267578125, 0.71197509765625, 0.7996826171875, 0.88739013671875, 0.97509765625, 1.06280517578125, 1.1505126953125, 1.23822021484375, 1.325927734375, 1.41363525390625, 1.5013427734375, 1.58905029296875, 1.6767578125, 1.76446533203125, 1.8521728515625, 1.93988037109375, 2.027587890625, 2.11529541015625, 2.2030029296875, 2.29071044921875, 2.37841796875, 2.46612548828125, 2.5538330078125, 2.64154052734375, 2.729248046875, 2.81695556640625, 2.9046630859375, 2.99237060546875, 3.080078125]}, "gradients/decoder.roberta.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 10.0, 10.0, 26.0, 40.0, 55.0, 127.0, 279.0, 478.0, 1174.0, 4489.0, 85431.0, 834497.0, 114210.0, 5341.0, 1290.0, 521.0, 259.0, 131.0, 76.0, 43.0, 23.0, 12.0, 10.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.22265625, -5.05706787109375, -4.8914794921875, -4.72589111328125, -4.560302734375, -4.39471435546875, -4.2291259765625, -4.06353759765625, -3.89794921875, -3.73236083984375, -3.5667724609375, -3.40118408203125, -3.235595703125, -3.07000732421875, -2.9044189453125, -2.73883056640625, -2.5732421875, -2.40765380859375, -2.2420654296875, -2.07647705078125, -1.910888671875, -1.74530029296875, -1.5797119140625, -1.41412353515625, -1.24853515625, -1.08294677734375, -0.9173583984375, -0.75177001953125, -0.586181640625, -0.42059326171875, -0.2550048828125, -0.08941650390625, 0.076171875, 0.24176025390625, 0.4073486328125, 0.57293701171875, 0.738525390625, 0.90411376953125, 1.0697021484375, 1.23529052734375, 1.40087890625, 1.56646728515625, 1.7320556640625, 1.89764404296875, 2.063232421875, 2.22882080078125, 2.3944091796875, 2.55999755859375, 2.7255859375, 2.89117431640625, 3.0567626953125, 3.22235107421875, 3.387939453125, 3.55352783203125, 3.7191162109375, 3.88470458984375, 4.05029296875, 4.21588134765625, 4.3814697265625, 4.54705810546875, 4.712646484375, 4.87823486328125, 5.0438232421875, 5.20941162109375, 5.375]}, "gradients/decoder.roberta.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 13.0, 18.0, 25.0, 39.0, 51.0, 68.0, 82.0, 104.0, 110.0, 144.0, 93.0, 79.0, 58.0, 31.0, 37.0, 9.0, 10.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003294944763183594, -0.00031901895999908447, -0.00030854344367980957, -0.00029806792736053467, -0.00028759241104125977, -0.00027711689472198486, -0.00026664137840270996, -0.00025616586208343506, -0.00024569034576416016, -0.00023521482944488525, -0.00022473931312561035, -0.00021426379680633545, -0.00020378828048706055, -0.00019331276416778564, -0.00018283724784851074, -0.00017236173152923584, -0.00016188621520996094, -0.00015141069889068604, -0.00014093518257141113, -0.00013045966625213623, -0.00011998414993286133, -0.00010950863361358643, -9.903311729431152e-05, -8.855760097503662e-05, -7.808208465576172e-05, -6.760656833648682e-05, -5.7131052017211914e-05, -4.665553569793701e-05, -3.618001937866211e-05, -2.5704503059387207e-05, -1.5228986740112305e-05, -4.753470420837402e-06, 5.7220458984375e-06, 1.6197562217712402e-05, 2.6673078536987305e-05, 3.714859485626221e-05, 4.762411117553711e-05, 5.809962749481201e-05, 6.857514381408691e-05, 7.905066013336182e-05, 8.952617645263672e-05, 0.00010000169277191162, 0.00011047720909118652, 0.00012095272541046143, 0.00013142824172973633, 0.00014190375804901123, 0.00015237927436828613, 0.00016285479068756104, 0.00017333030700683594, 0.00018380582332611084, 0.00019428133964538574, 0.00020475685596466064, 0.00021523237228393555, 0.00022570788860321045, 0.00023618340492248535, 0.00024665892124176025, 0.00025713443756103516, 0.00026760995388031006, 0.00027808547019958496, 0.00028856098651885986, 0.00029903650283813477, 0.00030951201915740967, 0.00031998753547668457, 0.00033046305179595947, 0.0003409385681152344]}, "gradients/decoder.roberta.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 10.0, 17.0, 20.0, 34.0, 56.0, 67.0, 123.0, 989.0, 307067.0, 738507.0, 1264.0, 156.0, 84.0, 60.0, 26.0, 26.0, 17.0, 10.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.6396484375, -17.998046875, -17.3564453125, -16.71484375, -16.0732421875, -15.431640625, -14.7900390625, -14.1484375, -13.5068359375, -12.865234375, -12.2236328125, -11.58203125, -10.9404296875, -10.298828125, -9.6572265625, -9.015625, -8.3740234375, -7.732421875, -7.0908203125, -6.44921875, -5.8076171875, -5.166015625, -4.5244140625, -3.8828125, -3.2412109375, -2.599609375, -1.9580078125, -1.31640625, -0.6748046875, -0.033203125, 0.6083984375, 1.25, 1.8916015625, 2.533203125, 3.1748046875, 3.81640625, 4.4580078125, 5.099609375, 5.7412109375, 6.3828125, 7.0244140625, 7.666015625, 8.3076171875, 8.94921875, 9.5908203125, 10.232421875, 10.8740234375, 11.515625, 12.1572265625, 12.798828125, 13.4404296875, 14.08203125, 14.7236328125, 15.365234375, 16.0068359375, 16.6484375, 17.2900390625, 17.931640625, 18.5732421875, 19.21484375, 19.8564453125, 20.498046875, 21.1396484375, 21.78125]}, "gradients/decoder.roberta.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 12.0, 19.0, 26.0, 31.0, 67.0, 63.0, 82.0, 101.0, 135.0, 123.0, 81.0, 68.0, 68.0, 37.0, 29.0, 17.0, 16.0, 5.0, 6.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9755859375, -0.9465255737304688, -0.9174652099609375, -0.8884048461914062, -0.859344482421875, -0.8302841186523438, -0.8012237548828125, -0.7721633911132812, -0.74310302734375, -0.7140426635742188, -0.6849822998046875, -0.6559219360351562, -0.626861572265625, -0.5978012084960938, -0.5687408447265625, -0.5396804809570312, -0.5106201171875, -0.48155975341796875, -0.4524993896484375, -0.42343902587890625, -0.394378662109375, -0.36531829833984375, -0.3362579345703125, -0.30719757080078125, -0.27813720703125, -0.24907684326171875, -0.2200164794921875, -0.19095611572265625, -0.161895751953125, -0.13283538818359375, -0.1037750244140625, -0.07471466064453125, -0.045654296875, -0.01659393310546875, 0.0124664306640625, 0.04152679443359375, 0.070587158203125, 0.09964752197265625, 0.1287078857421875, 0.15776824951171875, 0.18682861328125, 0.21588897705078125, 0.2449493408203125, 0.27400970458984375, 0.303070068359375, 0.33213043212890625, 0.3611907958984375, 0.39025115966796875, 0.4193115234375, 0.44837188720703125, 0.4774322509765625, 0.5064926147460938, 0.535552978515625, 0.5646133422851562, 0.5936737060546875, 0.6227340698242188, 0.65179443359375, 0.6808547973632812, 0.7099151611328125, 0.7389755249023438, 0.768035888671875, 0.7970962524414062, 0.8261566162109375, 0.8552169799804688, 0.88427734375]}, "gradients/decoder.roberta.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 13.0, 17.0, 35.0, 39.0, 55.0, 82.0, 106.0, 119.0, 113.0, 122.0, 106.0, 67.0, 53.0, 32.0, 23.0, 9.0, 5.0, 6.0, 4.0, 0.0, 3.0, 1.0], "bins": [-9.81706714630127, -9.621916770935059, -9.426767349243164, -9.231616973876953, -9.036466598510742, -8.841316223144531, -8.646166801452637, -8.451016426086426, -8.255866050720215, -8.060715675354004, -7.865565776824951, -7.670415878295898, -7.4752655029296875, -7.280115604400635, -7.084965705871582, -6.889815330505371, -6.694665908813477, -6.499516010284424, -6.304365634918213, -6.10921573638916, -5.914065361022949, -5.7189154624938965, -5.523765563964844, -5.328615188598633, -5.133464813232422, -4.938314914703369, -4.743164539337158, -4.5480146408081055, -4.3528642654418945, -4.157714366912842, -3.96256422996521, -3.767414093017578, -3.5722641944885254, -3.3771140575408936, -3.1819639205932617, -2.986814022064209, -2.791663885116577, -2.5965137481689453, -2.4013636112213135, -2.2062134742736816, -2.011063575744629, -1.815913438796997, -1.6207634210586548, -1.425613284111023, -1.2304632663726807, -1.0353131294250488, -0.840162992477417, -0.6450129747390747, -0.4498627185821533, -0.25471264123916626, -0.05956253409385681, 0.13558757305145264, 0.3307376503944397, 0.5258877277374268, 0.7210378646850586, 0.9161878824234009, 1.1113380193710327, 1.3064881563186646, 1.5016381740570068, 1.6967883110046387, 1.8919384479522705, 2.0870885848999023, 2.282238483428955, 2.477388620376587, 2.6725387573242188]}, "gradients/decoder.roberta.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 7.0, 2.0, 11.0, 9.0, 17.0, 17.0, 12.0, 18.0, 21.0, 29.0, 24.0, 21.0, 30.0, 23.0, 35.0, 46.0, 44.0, 58.0, 36.0, 40.0, 50.0, 35.0, 33.0, 46.0, 46.0, 30.0, 34.0, 24.0, 25.0, 20.0, 28.0, 24.0, 18.0, 10.0, 19.0, 9.0, 11.0, 5.0, 8.0, 8.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34708833694458, -4.2330756187438965, -4.119062900543213, -4.005050182342529, -3.8910374641418457, -3.777024745941162, -3.6630120277404785, -3.548999309539795, -3.4349865913391113, -3.3209738731384277, -3.206961154937744, -3.0929484367370605, -2.978935718536377, -2.8649230003356934, -2.7509102821350098, -2.636897563934326, -2.5228848457336426, -2.408872127532959, -2.2948594093322754, -2.180846691131592, -2.066833972930908, -1.9528212547302246, -1.838808536529541, -1.7247958183288574, -1.6107831001281738, -1.4967703819274902, -1.3827576637268066, -1.268744945526123, -1.1547322273254395, -1.0407195091247559, -0.9267067909240723, -0.8126940727233887, -0.698681116104126, -0.5846683979034424, -0.4706556797027588, -0.3566429615020752, -0.2426302433013916, -0.128617525100708, -0.014604806900024414, 0.09940791130065918, 0.21342062950134277, 0.32743334770202637, 0.44144606590270996, 0.5554587841033936, 0.6694715023040771, 0.7834842205047607, 0.8974969387054443, 1.011509656906128, 1.1255223751068115, 1.2395350933074951, 1.3535478115081787, 1.4675605297088623, 1.581573247909546, 1.6955859661102295, 1.809598684310913, 1.9236114025115967, 2.0376241207122803, 2.151636838912964, 2.2656495571136475, 2.379662275314331, 2.4936749935150146, 2.6076877117156982, 2.721700429916382, 2.8357131481170654, 2.949725866317749]}, "gradients/decoder.roberta.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 8.0, 12.0, 11.0, 23.0, 20.0, 26.0, 41.0, 53.0, 78.0, 107.0, 153.0, 207.0, 308.0, 431.0, 718.0, 1203.0, 2606.0, 7549.0, 29492.0, 185689.0, 2471239.0, 1351204.0, 111844.0, 20333.0, 5778.0, 2197.0, 1049.0, 555.0, 396.0, 254.0, 177.0, 121.0, 84.0, 79.0, 60.0, 36.0, 38.0, 18.0, 12.0, 15.0, 17.0, 12.0, 10.0, 3.0, 3.0, 7.0, 2.0, 4.0, 2.0, 1.0], "bins": [-6.3828125, -6.1998291015625, -6.016845703125, -5.8338623046875, -5.65087890625, -5.4678955078125, -5.284912109375, -5.1019287109375, -4.9189453125, -4.7359619140625, -4.552978515625, -4.3699951171875, -4.18701171875, -4.0040283203125, -3.821044921875, -3.6380615234375, -3.455078125, -3.2720947265625, -3.089111328125, -2.9061279296875, -2.72314453125, -2.5401611328125, -2.357177734375, -2.1741943359375, -1.9912109375, -1.8082275390625, -1.625244140625, -1.4422607421875, -1.25927734375, -1.0762939453125, -0.893310546875, -0.7103271484375, -0.52734375, -0.3443603515625, -0.161376953125, 0.0216064453125, 0.20458984375, 0.3875732421875, 0.570556640625, 0.7535400390625, 0.9365234375, 1.1195068359375, 1.302490234375, 1.4854736328125, 1.66845703125, 1.8514404296875, 2.034423828125, 2.2174072265625, 2.400390625, 2.5833740234375, 2.766357421875, 2.9493408203125, 3.13232421875, 3.3153076171875, 3.498291015625, 3.6812744140625, 3.8642578125, 4.0472412109375, 4.230224609375, 4.4132080078125, 4.59619140625, 4.7791748046875, 4.962158203125, 5.1451416015625, 5.328125]}, "gradients/decoder.roberta.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 1.0, 7.0, 7.0, 3.0, 10.0, 20.0, 13.0, 19.0, 23.0, 13.0, 20.0, 31.0, 25.0, 34.0, 36.0, 40.0, 45.0, 37.0, 51.0, 45.0, 35.0, 55.0, 29.0, 46.0, 37.0, 36.0, 31.0, 28.0, 35.0, 22.0, 28.0, 22.0, 21.0, 12.0, 17.0, 10.0, 13.0, 8.0, 6.0, 6.0, 7.0, 8.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3359375, -2.2623291015625, -2.188720703125, -2.1151123046875, -2.04150390625, -1.9678955078125, -1.894287109375, -1.8206787109375, -1.7470703125, -1.6734619140625, -1.599853515625, -1.5262451171875, -1.45263671875, -1.3790283203125, -1.305419921875, -1.2318115234375, -1.158203125, -1.0845947265625, -1.010986328125, -0.9373779296875, -0.86376953125, -0.7901611328125, -0.716552734375, -0.6429443359375, -0.5693359375, -0.4957275390625, -0.422119140625, -0.3485107421875, -0.27490234375, -0.2012939453125, -0.127685546875, -0.0540771484375, 0.01953125, 0.0931396484375, 0.166748046875, 0.2403564453125, 0.31396484375, 0.3875732421875, 0.461181640625, 0.5347900390625, 0.6083984375, 0.6820068359375, 0.755615234375, 0.8292236328125, 0.90283203125, 0.9764404296875, 1.050048828125, 1.1236572265625, 1.197265625, 1.2708740234375, 1.344482421875, 1.4180908203125, 1.49169921875, 1.5653076171875, 1.638916015625, 1.7125244140625, 1.7861328125, 1.8597412109375, 1.933349609375, 2.0069580078125, 2.08056640625, 2.1541748046875, 2.227783203125, 2.3013916015625, 2.375]}, "gradients/decoder.roberta.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 9.0, 11.0, 7.0, 4.0, 12.0, 16.0, 37.0, 41.0, 61.0, 93.0, 126.0, 195.0, 356.0, 954.0, 16242.0, 4027147.0, 145044.0, 2686.0, 499.0, 221.0, 141.0, 108.0, 56.0, 46.0, 33.0, 26.0, 21.0, 11.0, 11.0, 6.0, 11.0, 15.0, 10.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-27.671875, -26.874755859375, -26.07763671875, -25.280517578125, -24.4833984375, -23.686279296875, -22.88916015625, -22.092041015625, -21.294921875, -20.497802734375, -19.70068359375, -18.903564453125, -18.1064453125, -17.309326171875, -16.51220703125, -15.715087890625, -14.91796875, -14.120849609375, -13.32373046875, -12.526611328125, -11.7294921875, -10.932373046875, -10.13525390625, -9.338134765625, -8.541015625, -7.743896484375, -6.94677734375, -6.149658203125, -5.3525390625, -4.555419921875, -3.75830078125, -2.961181640625, -2.1640625, -1.366943359375, -0.56982421875, 0.227294921875, 1.0244140625, 1.821533203125, 2.61865234375, 3.415771484375, 4.212890625, 5.010009765625, 5.80712890625, 6.604248046875, 7.4013671875, 8.198486328125, 8.99560546875, 9.792724609375, 10.58984375, 11.386962890625, 12.18408203125, 12.981201171875, 13.7783203125, 14.575439453125, 15.37255859375, 16.169677734375, 16.966796875, 17.763916015625, 18.56103515625, 19.358154296875, 20.1552734375, 20.952392578125, 21.74951171875, 22.546630859375, 23.34375]}, "gradients/decoder.roberta.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 9.0, 6.0, 7.0, 7.0, 8.0, 11.0, 15.0, 22.0, 22.0, 23.0, 37.0, 54.0, 83.0, 116.0, 134.0, 225.0, 348.0, 479.0, 670.0, 531.0, 366.0, 254.0, 172.0, 119.0, 102.0, 71.0, 53.0, 28.0, 30.0, 16.0, 5.0, 11.0, 9.0, 8.0, 4.0, 6.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.18359375, -1.14508056640625, -1.1065673828125, -1.06805419921875, -1.029541015625, -0.99102783203125, -0.9525146484375, -0.91400146484375, -0.87548828125, -0.83697509765625, -0.7984619140625, -0.75994873046875, -0.721435546875, -0.68292236328125, -0.6444091796875, -0.60589599609375, -0.5673828125, -0.52886962890625, -0.4903564453125, -0.45184326171875, -0.413330078125, -0.37481689453125, -0.3363037109375, -0.29779052734375, -0.25927734375, -0.22076416015625, -0.1822509765625, -0.14373779296875, -0.105224609375, -0.06671142578125, -0.0281982421875, 0.01031494140625, 0.048828125, 0.08734130859375, 0.1258544921875, 0.16436767578125, 0.202880859375, 0.24139404296875, 0.2799072265625, 0.31842041015625, 0.35693359375, 0.39544677734375, 0.4339599609375, 0.47247314453125, 0.510986328125, 0.54949951171875, 0.5880126953125, 0.62652587890625, 0.6650390625, 0.70355224609375, 0.7420654296875, 0.78057861328125, 0.819091796875, 0.85760498046875, 0.8961181640625, 0.93463134765625, 0.97314453125, 1.01165771484375, 1.0501708984375, 1.08868408203125, 1.127197265625, 1.16571044921875, 1.2042236328125, 1.24273681640625, 1.28125]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 8.0, 28.0, 29.0, 50.0, 60.0, 82.0, 79.0, 117.0, 120.0, 109.0, 83.0, 71.0, 52.0, 40.0, 21.0, 15.0, 15.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1786885261535645, -7.029301643371582, -6.879915237426758, -6.730528354644775, -6.581141948699951, -6.431755065917969, -6.2823686599731445, -6.132981777191162, -5.983595371246338, -5.8342084884643555, -5.684822082519531, -5.535435199737549, -5.386048793792725, -5.236661911010742, -5.087275505065918, -4.9378886222839355, -4.788501739501953, -4.639114856719971, -4.4897284507751465, -4.340341567993164, -4.19095516204834, -4.041568279266357, -3.892181873321533, -3.742794990539551, -3.5934085845947266, -3.4440219402313232, -3.29463529586792, -3.1452486515045166, -2.9958620071411133, -2.84647536277771, -2.6970887184143066, -2.547701835632324, -2.3983154296875, -2.2489287853240967, -2.0995421409606934, -1.95015549659729, -1.8007688522338867, -1.6513822078704834, -1.5019954442977905, -1.3526087999343872, -1.2032221555709839, -1.0538355112075806, -0.9044488668441772, -0.7550621628761292, -0.6056755185127258, -0.4562888741493225, -0.3069021701812744, -0.1575155258178711, -0.008128881454467773, 0.14125777781009674, 0.29064443707466125, 0.44003111124038696, 0.5894177556037903, 0.7388043999671936, 0.8881911039352417, 1.037577748298645, 1.1869643926620483, 1.3363510370254517, 1.485737681388855, 1.6351244449615479, 1.7845110893249512, 1.9338977336883545, 2.083284378051758, 2.232671022415161, 2.3820576667785645]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 10.0, 5.0, 5.0, 6.0, 12.0, 13.0, 11.0, 15.0, 20.0, 23.0, 22.0, 25.0, 28.0, 45.0, 41.0, 40.0, 55.0, 46.0, 56.0, 54.0, 43.0, 43.0, 46.0, 43.0, 37.0, 39.0, 35.0, 24.0, 30.0, 27.0, 19.0, 17.0, 16.0, 13.0, 11.0, 9.0, 10.0, 4.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.17228627204895, -3.0710408687591553, -2.9697954654693604, -2.8685503005981445, -2.7673048973083496, -2.6660594940185547, -2.5648140907287598, -2.463568687438965, -2.36232328414917, -2.261077880859375, -2.15983247756958, -2.058587074279785, -1.9573419094085693, -1.8560965061187744, -1.7548511028289795, -1.6536056995391846, -1.5523605346679688, -1.4511151313781738, -1.3498698472976685, -1.2486244440078735, -1.1473791599273682, -1.0461337566375732, -0.9448883533477783, -0.8436430096626282, -0.742397665977478, -0.6411523222923279, -0.5399069786071777, -0.4386615753173828, -0.33741623163223267, -0.23617088794708252, -0.1349254846572876, -0.03368014097213745, 0.0675654411315918, 0.16881079971790314, 0.2700561583042145, 0.371301531791687, 0.47254687547683716, 0.5737922191619873, 0.6750376224517822, 0.7762829661369324, 0.8775283098220825, 0.9787736535072327, 1.0800189971923828, 1.1812644004821777, 1.2825098037719727, 1.383755087852478, 1.485000491142273, 1.5862457752227783, 1.6874911785125732, 1.7887365818023682, 1.8899818658828735, 1.9912272691726685, 2.092472553253174, 2.1937179565429688, 2.2949633598327637, 2.3962087631225586, 2.4974541664123535, 2.5986995697021484, 2.6999449729919434, 2.8011903762817383, 2.902435541152954, 3.003680944442749, 3.104926347732544, 3.206171751022339, 3.3074169158935547]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 17.0, 19.0, 34.0, 62.0, 63.0, 114.0, 194.0, 274.0, 437.0, 641.0, 1055.0, 1614.0, 2528.0, 4304.0, 7219.0, 12864.0, 23898.0, 47066.0, 101460.0, 234281.0, 314339.0, 153416.0, 68076.0, 33088.0, 17314.0, 9785.0, 5642.0, 3180.0, 1994.0, 1189.0, 791.0, 558.0, 334.0, 219.0, 143.0, 98.0, 70.0, 50.0, 40.0, 22.0, 22.0, 12.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.6796875, -0.6579360961914062, -0.6361846923828125, -0.6144332885742188, -0.592681884765625, -0.5709304809570312, -0.5491790771484375, -0.5274276733398438, -0.50567626953125, -0.48392486572265625, -0.4621734619140625, -0.44042205810546875, -0.418670654296875, -0.39691925048828125, -0.3751678466796875, -0.35341644287109375, -0.3316650390625, -0.30991363525390625, -0.2881622314453125, -0.26641082763671875, -0.244659423828125, -0.22290802001953125, -0.2011566162109375, -0.17940521240234375, -0.15765380859375, -0.13590240478515625, -0.1141510009765625, -0.09239959716796875, -0.070648193359375, -0.04889678955078125, -0.0271453857421875, -0.00539398193359375, 0.016357421875, 0.03810882568359375, 0.0598602294921875, 0.08161163330078125, 0.103363037109375, 0.12511444091796875, 0.1468658447265625, 0.16861724853515625, 0.19036865234375, 0.21212005615234375, 0.2338714599609375, 0.25562286376953125, 0.277374267578125, 0.29912567138671875, 0.3208770751953125, 0.34262847900390625, 0.3643798828125, 0.38613128662109375, 0.4078826904296875, 0.42963409423828125, 0.451385498046875, 0.47313690185546875, 0.4948883056640625, 0.5166397094726562, 0.53839111328125, 0.5601425170898438, 0.5818939208984375, 0.6036453247070312, 0.625396728515625, 0.6471481323242188, 0.6688995361328125, 0.6906509399414062, 0.71240234375]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 10.0, 4.0, 6.0, 5.0, 12.0, 12.0, 14.0, 14.0, 22.0, 20.0, 24.0, 26.0, 36.0, 40.0, 40.0, 42.0, 53.0, 49.0, 61.0, 46.0, 44.0, 45.0, 47.0, 36.0, 41.0, 36.0, 33.0, 24.0, 34.0, 23.0, 20.0, 17.0, 16.0, 16.0, 7.0, 8.0, 10.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03515625, -2.9365234375, -2.837890625, -2.7392578125, -2.640625, -2.5419921875, -2.443359375, -2.3447265625, -2.24609375, -2.1474609375, -2.048828125, -1.9501953125, -1.8515625, -1.7529296875, -1.654296875, -1.5556640625, -1.45703125, -1.3583984375, -1.259765625, -1.1611328125, -1.0625, -0.9638671875, -0.865234375, -0.7666015625, -0.66796875, -0.5693359375, -0.470703125, -0.3720703125, -0.2734375, -0.1748046875, -0.076171875, 0.0224609375, 0.12109375, 0.2197265625, 0.318359375, 0.4169921875, 0.515625, 0.6142578125, 0.712890625, 0.8115234375, 0.91015625, 1.0087890625, 1.107421875, 1.2060546875, 1.3046875, 1.4033203125, 1.501953125, 1.6005859375, 1.69921875, 1.7978515625, 1.896484375, 1.9951171875, 2.09375, 2.1923828125, 2.291015625, 2.3896484375, 2.48828125, 2.5869140625, 2.685546875, 2.7841796875, 2.8828125, 2.9814453125, 3.080078125, 3.1787109375, 3.27734375]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 7.0, 9.0, 20.0, 15.0, 21.0, 23.0, 33.0, 41.0, 53.0, 76.0, 118.0, 108.0, 188.0, 232.0, 349.0, 452.0, 701.0, 1074.0, 1923.0, 3634.0, 8239.0, 23518.0, 884344.0, 87264.0, 20228.0, 7360.0, 3304.0, 1860.0, 990.0, 674.0, 457.0, 300.0, 225.0, 170.0, 144.0, 92.0, 64.0, 54.0, 36.0, 35.0, 30.0, 17.0, 19.0, 9.0, 9.0, 10.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6650390625, -1.6128997802734375, -1.560760498046875, -1.5086212158203125, -1.45648193359375, -1.4043426513671875, -1.352203369140625, -1.3000640869140625, -1.2479248046875, -1.1957855224609375, -1.143646240234375, -1.0915069580078125, -1.03936767578125, -0.9872283935546875, -0.935089111328125, -0.8829498291015625, -0.830810546875, -0.7786712646484375, -0.726531982421875, -0.6743927001953125, -0.62225341796875, -0.5701141357421875, -0.517974853515625, -0.4658355712890625, -0.4136962890625, -0.3615570068359375, -0.309417724609375, -0.2572784423828125, -0.20513916015625, -0.1529998779296875, -0.100860595703125, -0.0487213134765625, 0.00341796875, 0.0555572509765625, 0.107696533203125, 0.1598358154296875, 0.21197509765625, 0.2641143798828125, 0.316253662109375, 0.3683929443359375, 0.4205322265625, 0.4726715087890625, 0.524810791015625, 0.5769500732421875, 0.62908935546875, 0.6812286376953125, 0.733367919921875, 0.7855072021484375, 0.837646484375, 0.8897857666015625, 0.941925048828125, 0.9940643310546875, 1.04620361328125, 1.0983428955078125, 1.150482177734375, 1.2026214599609375, 1.2547607421875, 1.3069000244140625, 1.359039306640625, 1.4111785888671875, 1.46331787109375, 1.5154571533203125, 1.567596435546875, 1.6197357177734375, 1.671875]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 12.0, 13.0, 6.0, 11.0, 10.0, 21.0, 19.0, 19.0, 19.0, 26.0, 33.0, 27.0, 34.0, 25.0, 35.0, 39.0, 42.0, 42.0, 52.0, 42.0, 45.0, 48.0, 44.0, 33.0, 41.0, 34.0, 31.0, 26.0, 31.0, 14.0, 24.0, 13.0, 16.0, 16.0, 10.0, 10.0, 10.0, 10.0, 0.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.759765625, -1.702728271484375, -1.64569091796875, -1.588653564453125, -1.5316162109375, -1.474578857421875, -1.41754150390625, -1.360504150390625, -1.303466796875, -1.246429443359375, -1.18939208984375, -1.132354736328125, -1.0753173828125, -1.018280029296875, -0.96124267578125, -0.904205322265625, -0.84716796875, -0.790130615234375, -0.73309326171875, -0.676055908203125, -0.6190185546875, -0.561981201171875, -0.50494384765625, -0.447906494140625, -0.390869140625, -0.333831787109375, -0.27679443359375, -0.219757080078125, -0.1627197265625, -0.105682373046875, -0.04864501953125, 0.008392333984375, 0.0654296875, 0.122467041015625, 0.17950439453125, 0.236541748046875, 0.2935791015625, 0.350616455078125, 0.40765380859375, 0.464691162109375, 0.521728515625, 0.578765869140625, 0.63580322265625, 0.692840576171875, 0.7498779296875, 0.806915283203125, 0.86395263671875, 0.920989990234375, 0.97802734375, 1.035064697265625, 1.09210205078125, 1.149139404296875, 1.2061767578125, 1.263214111328125, 1.32025146484375, 1.377288818359375, 1.434326171875, 1.491363525390625, 1.54840087890625, 1.605438232421875, 1.6624755859375, 1.719512939453125, 1.77655029296875, 1.833587646484375, 1.890625]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 1.0, 9.0, 24.0, 21.0, 31.0, 56.0, 117.0, 128.0, 262.0, 434.0, 938.0, 2037.0, 6003.0, 33534.0, 974337.0, 22251.0, 4867.0, 1747.0, 747.0, 422.0, 203.0, 158.0, 70.0, 42.0, 37.0, 28.0, 9.0, 10.0, 14.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25146484375, -0.243194580078125, -0.23492431640625, -0.226654052734375, -0.2183837890625, -0.210113525390625, -0.20184326171875, -0.193572998046875, -0.185302734375, -0.177032470703125, -0.16876220703125, -0.160491943359375, -0.1522216796875, -0.143951416015625, -0.13568115234375, -0.127410888671875, -0.119140625, -0.110870361328125, -0.10260009765625, -0.094329833984375, -0.0860595703125, -0.077789306640625, -0.06951904296875, -0.061248779296875, -0.052978515625, -0.044708251953125, -0.03643798828125, -0.028167724609375, -0.0198974609375, -0.011627197265625, -0.00335693359375, 0.004913330078125, 0.01318359375, 0.021453857421875, 0.02972412109375, 0.037994384765625, 0.0462646484375, 0.054534912109375, 0.06280517578125, 0.071075439453125, 0.079345703125, 0.087615966796875, 0.09588623046875, 0.104156494140625, 0.1124267578125, 0.120697021484375, 0.12896728515625, 0.137237548828125, 0.1455078125, 0.153778076171875, 0.16204833984375, 0.170318603515625, 0.1785888671875, 0.186859130859375, 0.19512939453125, 0.203399658203125, 0.211669921875, 0.219940185546875, 0.22821044921875, 0.236480712890625, 0.2447509765625, 0.253021240234375, 0.26129150390625, 0.269561767578125, 0.27783203125]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 3.0, 2.0, 9.0, 6.0, 9.0, 10.0, 13.0, 9.0, 10.0, 21.0, 27.0, 35.0, 27.0, 39.0, 35.0, 52.0, 51.0, 47.0, 55.0, 61.0, 45.0, 45.0, 73.0, 46.0, 43.0, 41.0, 33.0, 37.0, 29.0, 14.0, 10.0, 14.0, 7.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.872943878173828e-05, -2.7846544981002808e-05, -2.6963651180267334e-05, -2.608075737953186e-05, -2.5197863578796387e-05, -2.4314969778060913e-05, -2.343207597732544e-05, -2.2549182176589966e-05, -2.1666288375854492e-05, -2.078339457511902e-05, -1.9900500774383545e-05, -1.901760697364807e-05, -1.8134713172912598e-05, -1.7251819372177124e-05, -1.636892557144165e-05, -1.5486031770706177e-05, -1.4603137969970703e-05, -1.372024416923523e-05, -1.2837350368499756e-05, -1.1954456567764282e-05, -1.1071562767028809e-05, -1.0188668966293335e-05, -9.305775165557861e-06, -8.422881364822388e-06, -7.539987564086914e-06, -6.6570937633514404e-06, -5.774199962615967e-06, -4.891306161880493e-06, -4.0084123611450195e-06, -3.125518560409546e-06, -2.2426247596740723e-06, -1.3597309589385986e-06, -4.76837158203125e-07, 4.0605664253234863e-07, 1.2889504432678223e-06, 2.171844244003296e-06, 3.0547380447387695e-06, 3.937631845474243e-06, 4.820525646209717e-06, 5.7034194469451904e-06, 6.586313247680664e-06, 7.469207048416138e-06, 8.352100849151611e-06, 9.234994649887085e-06, 1.0117888450622559e-05, 1.1000782251358032e-05, 1.1883676052093506e-05, 1.276656985282898e-05, 1.3649463653564453e-05, 1.4532357454299927e-05, 1.54152512550354e-05, 1.6298145055770874e-05, 1.7181038856506348e-05, 1.806393265724182e-05, 1.8946826457977295e-05, 1.982972025871277e-05, 2.0712614059448242e-05, 2.1595507860183716e-05, 2.247840166091919e-05, 2.3361295461654663e-05, 2.4244189262390137e-05, 2.512708306312561e-05, 2.6009976863861084e-05, 2.6892870664596558e-05, 2.777576446533203e-05]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 8.0, 2.0, 7.0, 15.0, 9.0, 14.0, 18.0, 28.0, 46.0, 77.0, 174.0, 898.0, 44630.0, 985183.0, 16557.0, 526.0, 141.0, 65.0, 44.0, 24.0, 18.0, 12.0, 12.0, 8.0, 5.0, 8.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.450927734375, -0.4360923767089844, -0.42125701904296875, -0.4064216613769531, -0.3915863037109375, -0.3767509460449219, -0.36191558837890625, -0.3470802307128906, -0.332244873046875, -0.3174095153808594, -0.30257415771484375, -0.2877388000488281, -0.2729034423828125, -0.2580680847167969, -0.24323272705078125, -0.22839736938476562, -0.21356201171875, -0.19872665405273438, -0.18389129638671875, -0.16905593872070312, -0.1542205810546875, -0.13938522338867188, -0.12454986572265625, -0.10971450805664062, -0.094879150390625, -0.08004379272460938, -0.06520843505859375, -0.050373077392578125, -0.0355377197265625, -0.020702362060546875, -0.00586700439453125, 0.008968353271484375, 0.0238037109375, 0.038639068603515625, 0.05347442626953125, 0.06830978393554688, 0.0831451416015625, 0.09798049926757812, 0.11281585693359375, 0.12765121459960938, 0.142486572265625, 0.15732192993164062, 0.17215728759765625, 0.18699264526367188, 0.2018280029296875, 0.21666336059570312, 0.23149871826171875, 0.24633407592773438, 0.26116943359375, 0.2760047912597656, 0.29084014892578125, 0.3056755065917969, 0.3205108642578125, 0.3353462219238281, 0.35018157958984375, 0.3650169372558594, 0.379852294921875, 0.3946876525878906, 0.40952301025390625, 0.4243583679199219, 0.4391937255859375, 0.4540290832519531, 0.46886444091796875, 0.4836997985839844, 0.49853515625]}, "gradients/decoder.roberta.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 8.0, 4.0, 9.0, 6.0, 10.0, 24.0, 24.0, 26.0, 47.0, 50.0, 64.0, 97.0, 158.0, 132.0, 90.0, 56.0, 44.0, 38.0, 18.0, 19.0, 11.0, 8.0, 16.0, 9.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0251312255859375, -0.024386882781982422, -0.023642539978027344, -0.022898197174072266, -0.022153854370117188, -0.02140951156616211, -0.02066516876220703, -0.019920825958251953, -0.019176483154296875, -0.018432140350341797, -0.01768779754638672, -0.01694345474243164, -0.016199111938476562, -0.015454769134521484, -0.014710426330566406, -0.013966083526611328, -0.01322174072265625, -0.012477397918701172, -0.011733055114746094, -0.010988712310791016, -0.010244369506835938, -0.00950002670288086, -0.008755683898925781, -0.008011341094970703, -0.007266998291015625, -0.006522655487060547, -0.005778312683105469, -0.005033969879150391, -0.0042896270751953125, -0.0035452842712402344, -0.0028009414672851562, -0.002056598663330078, -0.001312255859375, -0.0005679130554199219, 0.00017642974853515625, 0.0009207725524902344, 0.0016651153564453125, 0.0024094581604003906, 0.0031538009643554688, 0.003898143768310547, 0.004642486572265625, 0.005386829376220703, 0.006131172180175781, 0.006875514984130859, 0.0076198577880859375, 0.008364200592041016, 0.009108543395996094, 0.009852886199951172, 0.01059722900390625, 0.011341571807861328, 0.012085914611816406, 0.012830257415771484, 0.013574600219726562, 0.01431894302368164, 0.015063285827636719, 0.015807628631591797, 0.016551971435546875, 0.017296314239501953, 0.01804065704345703, 0.01878499984741211, 0.019529342651367188, 0.020273685455322266, 0.021018028259277344, 0.021762371063232422, 0.0225067138671875]}, "gradients/decoder.roberta.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 5.0, 16.0, 32.0, 44.0, 50.0, 71.0, 92.0, 98.0, 118.0, 122.0, 93.0, 74.0, 61.0, 50.0, 27.0, 16.0, 17.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.05853271484375, -6.906725883483887, -6.754919052124023, -6.60311222076416, -6.451304912567139, -6.299498081207275, -6.147691249847412, -5.995884418487549, -5.8440775871276855, -5.692270755767822, -5.540463924407959, -5.3886566162109375, -5.236849784851074, -5.085042953491211, -4.933236122131348, -4.781429290771484, -4.629622459411621, -4.477815628051758, -4.3260087966918945, -4.174201965332031, -4.02239465713501, -3.8705878257751465, -3.718780994415283, -3.56697416305542, -3.4151668548583984, -3.263360023498535, -3.1115529537200928, -2.9597461223602295, -2.807939291000366, -2.656132221221924, -2.5043253898620605, -2.3525185585021973, -2.200711488723755, -2.0489046573638916, -1.8970977067947388, -1.745290756225586, -1.5934839248657227, -1.4416769742965698, -1.289870023727417, -1.1380631923675537, -0.9862562417984009, -0.8344493508338928, -0.6826424598693848, -0.5308355093002319, -0.3790286183357239, -0.22722172737121582, -0.07541477680206299, 0.07639205455780029, 0.22819900512695312, 0.3800058960914612, 0.5318127870559692, 0.6836197376251221, 0.8354266285896301, 0.9872335195541382, 1.139040470123291, 1.2908473014831543, 1.4426542520523071, 1.59446120262146, 1.7462680339813232, 1.898074984550476, 2.049881935119629, 2.201688766479492, 2.3534955978393555, 2.5053024291992188, 2.657109498977661]}, "gradients/decoder.roberta.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 9.0, 6.0, 6.0, 5.0, 11.0, 13.0, 13.0, 14.0, 22.0, 20.0, 24.0, 25.0, 34.0, 41.0, 40.0, 41.0, 55.0, 46.0, 62.0, 47.0, 45.0, 46.0, 46.0, 37.0, 40.0, 37.0, 32.0, 26.0, 32.0, 24.0, 20.0, 18.0, 16.0, 16.0, 5.0, 9.0, 10.0, 4.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0432896614074707, -2.944566249847412, -2.8458428382873535, -2.747119426727295, -2.6483960151672363, -2.5496723651885986, -2.45094895362854, -2.3522255420684814, -2.253502130508423, -2.1547787189483643, -2.0560553073883057, -1.9573317766189575, -1.858608365058899, -1.7598849534988403, -1.6611614227294922, -1.5624380111694336, -1.463714599609375, -1.3649911880493164, -1.2662677764892578, -1.1675442457199097, -1.068820834159851, -0.9700974225997925, -0.8713739514350891, -0.7726504802703857, -0.6739270687103271, -0.5752036571502686, -0.4764801859855652, -0.3777567446231842, -0.2790333032608032, -0.18030986189842224, -0.08158642053604126, 0.01713705062866211, 0.1158607006072998, 0.2145841419696808, 0.31330758333206177, 0.41203102469444275, 0.5107544660568237, 0.6094778776168823, 0.7082013487815857, 0.8069248199462891, 0.9056482315063477, 1.0043716430664062, 1.1030950546264648, 1.201818585395813, 1.3005419969558716, 1.3992654085159302, 1.4979889392852783, 1.596712350845337, 1.6954357624053955, 1.794159173965454, 1.8928825855255127, 1.9916061162948608, 2.090329647064209, 2.1890530586242676, 2.287776470184326, 2.3864998817443848, 2.4852232933044434, 2.583946704864502, 2.6826701164245605, 2.781393527984619, 2.8801169395446777, 2.9788405895233154, 3.077564001083374, 3.1762874126434326, 3.275010824203491]}, "gradients/decoder.roberta.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 9.0, 10.0, 12.0, 14.0, 13.0, 24.0, 30.0, 48.0, 57.0, 96.0, 116.0, 241.0, 430.0, 832.0, 1825.0, 4400.0, 11056.0, 31022.0, 97892.0, 327274.0, 390691.0, 121808.0, 37703.0, 13466.0, 5166.0, 2131.0, 943.0, 515.0, 261.0, 153.0, 102.0, 65.0, 41.0, 30.0, 26.0, 17.0, 11.0, 11.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.67767333984375, -4.5272216796875, -4.37677001953125, -4.226318359375, -4.07586669921875, -3.9254150390625, -3.77496337890625, -3.62451171875, -3.47406005859375, -3.3236083984375, -3.17315673828125, -3.022705078125, -2.87225341796875, -2.7218017578125, -2.57135009765625, -2.4208984375, -2.27044677734375, -2.1199951171875, -1.96954345703125, -1.819091796875, -1.66864013671875, -1.5181884765625, -1.36773681640625, -1.21728515625, -1.06683349609375, -0.9163818359375, -0.76593017578125, -0.615478515625, -0.46502685546875, -0.3145751953125, -0.16412353515625, -0.013671875, 0.13677978515625, 0.2872314453125, 0.43768310546875, 0.588134765625, 0.73858642578125, 0.8890380859375, 1.03948974609375, 1.18994140625, 1.34039306640625, 1.4908447265625, 1.64129638671875, 1.791748046875, 1.94219970703125, 2.0926513671875, 2.24310302734375, 2.3935546875, 2.54400634765625, 2.6944580078125, 2.84490966796875, 2.995361328125, 3.14581298828125, 3.2962646484375, 3.44671630859375, 3.59716796875, 3.74761962890625, 3.8980712890625, 4.04852294921875, 4.198974609375, 4.34942626953125, 4.4998779296875, 4.65032958984375, 4.80078125]}, "gradients/decoder.roberta.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 9.0, 3.0, 7.0, 8.0, 16.0, 16.0, 16.0, 17.0, 26.0, 24.0, 29.0, 34.0, 41.0, 40.0, 43.0, 57.0, 53.0, 46.0, 57.0, 48.0, 48.0, 47.0, 36.0, 42.0, 36.0, 25.0, 35.0, 27.0, 14.0, 16.0, 21.0, 19.0, 10.0, 7.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15625, -3.055755615234375, -2.95526123046875, -2.854766845703125, -2.7542724609375, -2.653778076171875, -2.55328369140625, -2.452789306640625, -2.352294921875, -2.251800537109375, -2.15130615234375, -2.050811767578125, -1.9503173828125, -1.849822998046875, -1.74932861328125, -1.648834228515625, -1.54833984375, -1.447845458984375, -1.34735107421875, -1.246856689453125, -1.1463623046875, -1.045867919921875, -0.94537353515625, -0.844879150390625, -0.744384765625, -0.643890380859375, -0.54339599609375, -0.442901611328125, -0.3424072265625, -0.241912841796875, -0.14141845703125, -0.040924072265625, 0.0595703125, 0.160064697265625, 0.26055908203125, 0.361053466796875, 0.4615478515625, 0.562042236328125, 0.66253662109375, 0.763031005859375, 0.863525390625, 0.964019775390625, 1.06451416015625, 1.165008544921875, 1.2655029296875, 1.365997314453125, 1.46649169921875, 1.566986083984375, 1.66748046875, 1.767974853515625, 1.86846923828125, 1.968963623046875, 2.0694580078125, 2.169952392578125, 2.27044677734375, 2.370941162109375, 2.471435546875, 2.571929931640625, 2.67242431640625, 2.772918701171875, 2.8734130859375, 2.973907470703125, 3.07440185546875, 3.174896240234375, 3.275390625]}, "gradients/decoder.roberta.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 8.0, 6.0, 8.0, 10.0, 11.0, 17.0, 18.0, 24.0, 22.0, 28.0, 24.0, 30.0, 45.0, 63.0, 123.0, 256.0, 650.0, 1042407.0, 3822.0, 397.0, 168.0, 83.0, 57.0, 35.0, 45.0, 28.0, 33.0, 19.0, 21.0, 15.0, 15.0, 11.0, 9.0, 12.0, 6.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.3125, -74.6220703125, -71.931640625, -69.2412109375, -66.55078125, -63.8603515625, -61.169921875, -58.4794921875, -55.7890625, -53.0986328125, -50.408203125, -47.7177734375, -45.02734375, -42.3369140625, -39.646484375, -36.9560546875, -34.265625, -31.5751953125, -28.884765625, -26.1943359375, -23.50390625, -20.8134765625, -18.123046875, -15.4326171875, -12.7421875, -10.0517578125, -7.361328125, -4.6708984375, -1.98046875, 0.7099609375, 3.400390625, 6.0908203125, 8.78125, 11.4716796875, 14.162109375, 16.8525390625, 19.54296875, 22.2333984375, 24.923828125, 27.6142578125, 30.3046875, 32.9951171875, 35.685546875, 38.3759765625, 41.06640625, 43.7568359375, 46.447265625, 49.1376953125, 51.828125, 54.5185546875, 57.208984375, 59.8994140625, 62.58984375, 65.2802734375, 67.970703125, 70.6611328125, 73.3515625, 76.0419921875, 78.732421875, 81.4228515625, 84.11328125, 86.8037109375, 89.494140625, 92.1845703125, 94.875]}, "gradients/decoder.roberta.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 9.0, 10.0, 9.0, 16.0, 18.0, 17.0, 24.0, 28.0, 33.0, 41.0, 32.0, 36.0, 50.0, 47.0, 59.0, 37.0, 44.0, 47.0, 58.0, 51.0, 39.0, 48.0, 26.0, 25.0, 29.0, 23.0, 24.0, 20.0, 19.0, 12.0, 8.0, 9.0, 7.0, 10.0, 6.0, 0.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.275390625, -3.18304443359375, -3.0906982421875, -2.99835205078125, -2.906005859375, -2.81365966796875, -2.7213134765625, -2.62896728515625, -2.53662109375, -2.44427490234375, -2.3519287109375, -2.25958251953125, -2.167236328125, -2.07489013671875, -1.9825439453125, -1.89019775390625, -1.7978515625, -1.70550537109375, -1.6131591796875, -1.52081298828125, -1.428466796875, -1.33612060546875, -1.2437744140625, -1.15142822265625, -1.05908203125, -0.96673583984375, -0.8743896484375, -0.78204345703125, -0.689697265625, -0.59735107421875, -0.5050048828125, -0.41265869140625, -0.3203125, -0.22796630859375, -0.1356201171875, -0.04327392578125, 0.049072265625, 0.14141845703125, 0.2337646484375, 0.32611083984375, 0.41845703125, 0.51080322265625, 0.6031494140625, 0.69549560546875, 0.787841796875, 0.88018798828125, 0.9725341796875, 1.06488037109375, 1.1572265625, 1.24957275390625, 1.3419189453125, 1.43426513671875, 1.526611328125, 1.61895751953125, 1.7113037109375, 1.80364990234375, 1.89599609375, 1.98834228515625, 2.0806884765625, 2.17303466796875, 2.265380859375, 2.35772705078125, 2.4500732421875, 2.54241943359375, 2.634765625]}, "gradients/decoder.roberta.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 4.0, 13.0, 19.0, 46.0, 88.0, 276.0, 996.0, 7529.0, 882246.0, 153740.0, 2696.0, 582.0, 183.0, 63.0, 23.0, 17.0, 8.0, 7.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5546875, -11.271484375, -10.98828125, -10.705078125, -10.421875, -10.138671875, -9.85546875, -9.572265625, -9.2890625, -9.005859375, -8.72265625, -8.439453125, -8.15625, -7.873046875, -7.58984375, -7.306640625, -7.0234375, -6.740234375, -6.45703125, -6.173828125, -5.890625, -5.607421875, -5.32421875, -5.041015625, -4.7578125, -4.474609375, -4.19140625, -3.908203125, -3.625, -3.341796875, -3.05859375, -2.775390625, -2.4921875, -2.208984375, -1.92578125, -1.642578125, -1.359375, -1.076171875, -0.79296875, -0.509765625, -0.2265625, 0.056640625, 0.33984375, 0.623046875, 0.90625, 1.189453125, 1.47265625, 1.755859375, 2.0390625, 2.322265625, 2.60546875, 2.888671875, 3.171875, 3.455078125, 3.73828125, 4.021484375, 4.3046875, 4.587890625, 4.87109375, 5.154296875, 5.4375, 5.720703125, 6.00390625, 6.287109375, 6.5703125]}, "gradients/decoder.roberta.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 2.0, 7.0, 2.0, 14.0, 28.0, 38.0, 41.0, 60.0, 80.0, 121.0, 138.0, 105.0, 112.0, 74.0, 57.0, 38.0, 29.0, 16.0, 13.0, 8.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002510547637939453, -0.00024165213108062744, -0.00023224949836730957, -0.0002228468656539917, -0.00021344423294067383, -0.00020404160022735596, -0.00019463896751403809, -0.00018523633480072021, -0.00017583370208740234, -0.00016643106937408447, -0.0001570284366607666, -0.00014762580394744873, -0.00013822317123413086, -0.000128820538520813, -0.00011941790580749512, -0.00011001527309417725, -0.00010061264038085938, -9.12100076675415e-05, -8.180737495422363e-05, -7.240474224090576e-05, -6.300210952758789e-05, -5.359947681427002e-05, -4.419684410095215e-05, -3.479421138763428e-05, -2.5391578674316406e-05, -1.5988945960998535e-05, -6.586313247680664e-06, 2.816319465637207e-06, 1.2218952178955078e-05, 2.162158489227295e-05, 3.102421760559082e-05, 4.042685031890869e-05, 4.982948303222656e-05, 5.9232115745544434e-05, 6.86347484588623e-05, 7.803738117218018e-05, 8.744001388549805e-05, 9.684264659881592e-05, 0.00010624527931213379, 0.00011564791202545166, 0.00012505054473876953, 0.0001344531774520874, 0.00014385581016540527, 0.00015325844287872314, 0.00016266107559204102, 0.0001720637083053589, 0.00018146634101867676, 0.00019086897373199463, 0.0002002716064453125, 0.00020967423915863037, 0.00021907687187194824, 0.0002284795045852661, 0.00023788213729858398, 0.00024728477001190186, 0.0002566874027252197, 0.0002660900354385376, 0.00027549266815185547, 0.00028489530086517334, 0.0002942979335784912, 0.0003037005662918091, 0.00031310319900512695, 0.0003225058317184448, 0.0003319084644317627, 0.00034131109714508057, 0.00035071372985839844]}, "gradients/decoder.roberta.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 27.0, 22.0, 48.0, 109.0, 524.0, 127236.0, 919424.0, 911.0, 118.0, 52.0, 35.0, 19.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.984375, -28.223388671875, -27.46240234375, -26.701416015625, -25.9404296875, -25.179443359375, -24.41845703125, -23.657470703125, -22.896484375, -22.135498046875, -21.37451171875, -20.613525390625, -19.8525390625, -19.091552734375, -18.33056640625, -17.569580078125, -16.80859375, -16.047607421875, -15.28662109375, -14.525634765625, -13.7646484375, -13.003662109375, -12.24267578125, -11.481689453125, -10.720703125, -9.959716796875, -9.19873046875, -8.437744140625, -7.6767578125, -6.915771484375, -6.15478515625, -5.393798828125, -4.6328125, -3.871826171875, -3.11083984375, -2.349853515625, -1.5888671875, -0.827880859375, -0.06689453125, 0.694091796875, 1.455078125, 2.216064453125, 2.97705078125, 3.738037109375, 4.4990234375, 5.260009765625, 6.02099609375, 6.781982421875, 7.54296875, 8.303955078125, 9.06494140625, 9.825927734375, 10.5869140625, 11.347900390625, 12.10888671875, 12.869873046875, 13.630859375, 14.391845703125, 15.15283203125, 15.913818359375, 16.6748046875, 17.435791015625, 18.19677734375, 18.957763671875, 19.71875]}, "gradients/decoder.roberta.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 18.0, 34.0, 39.0, 87.0, 126.0, 179.0, 194.0, 125.0, 85.0, 41.0, 24.0, 20.0, 5.0, 7.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91162109375, -0.8764724731445312, -0.8413238525390625, -0.8061752319335938, -0.771026611328125, -0.7358779907226562, -0.7007293701171875, -0.6655807495117188, -0.63043212890625, -0.5952835083007812, -0.5601348876953125, -0.5249862670898438, -0.489837646484375, -0.45468902587890625, -0.4195404052734375, -0.38439178466796875, -0.3492431640625, -0.31409454345703125, -0.2789459228515625, -0.24379730224609375, -0.208648681640625, -0.17350006103515625, -0.1383514404296875, -0.10320281982421875, -0.06805419921875, -0.03290557861328125, 0.0022430419921875, 0.03739166259765625, 0.072540283203125, 0.10768890380859375, 0.1428375244140625, 0.17798614501953125, 0.213134765625, 0.24828338623046875, 0.2834320068359375, 0.31858062744140625, 0.353729248046875, 0.38887786865234375, 0.4240264892578125, 0.45917510986328125, 0.49432373046875, 0.5294723510742188, 0.5646209716796875, 0.5997695922851562, 0.634918212890625, 0.6700668334960938, 0.7052154541015625, 0.7403640747070312, 0.7755126953125, 0.8106613159179688, 0.8458099365234375, 0.8809585571289062, 0.916107177734375, 0.9512557983398438, 0.9864044189453125, 1.0215530395507812, 1.05670166015625, 1.0918502807617188, 1.1269989013671875, 1.1621475219726562, 1.197296142578125, 1.2324447631835938, 1.2675933837890625, 1.3027420043945312, 1.337890625]}, "gradients/decoder.roberta.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 9.0, 7.0, 14.0, 21.0, 35.0, 59.0, 85.0, 88.0, 100.0, 118.0, 122.0, 97.0, 76.0, 72.0, 33.0, 26.0, 24.0, 13.0, 5.0, 5.0, 4.0, 1.0, 1.0], "bins": [-8.373887062072754, -8.208505630493164, -8.04312515258789, -7.877743721008301, -7.712362289428711, -7.546980857849121, -7.3815999031066895, -7.216218948364258, -7.050837516784668, -6.885456085205078, -6.7200751304626465, -6.554694175720215, -6.389312744140625, -6.223931312561035, -6.0585503578186035, -5.893169403076172, -5.727787971496582, -5.562406539916992, -5.3970255851745605, -5.231644630432129, -5.066263198852539, -4.900881767272949, -4.735500812530518, -4.570119857788086, -4.404738426208496, -4.239356994628906, -4.073976039886475, -3.908594846725464, -3.743213653564453, -3.5778324604034424, -3.4124512672424316, -3.247070074081421, -3.081688404083252, -2.916307210922241, -2.7509260177612305, -2.5855448246002197, -2.420163631439209, -2.2547824382781982, -2.0894012451171875, -1.9240200519561768, -1.758638858795166, -1.5932576656341553, -1.4278764724731445, -1.2624952793121338, -1.097114086151123, -0.9317328929901123, -0.7663516998291016, -0.6009705066680908, -0.4355893135070801, -0.27020812034606934, -0.1048269271850586, 0.06055426597595215, 0.2259354591369629, 0.39131665229797363, 0.5566978454589844, 0.7220790386199951, 0.8874602317810059, 1.0528414249420166, 1.2182226181030273, 1.383603811264038, 1.5489850044250488, 1.7143661975860596, 1.8797473907470703, 2.045128583908081, 2.210509777069092]}, "gradients/decoder.roberta.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 9.0, 9.0, 15.0, 11.0, 19.0, 23.0, 26.0, 26.0, 18.0, 40.0, 29.0, 31.0, 34.0, 32.0, 47.0, 35.0, 56.0, 37.0, 42.0, 49.0, 37.0, 32.0, 32.0, 37.0, 31.0, 29.0, 37.0, 26.0, 24.0, 23.0, 15.0, 14.0, 8.0, 12.0, 3.0, 8.0, 10.0, 6.0, 6.0, 0.0, 7.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-3.8999927043914795, -3.7909841537475586, -3.6819753646850586, -3.5729668140411377, -3.4639580249786377, -3.354949474334717, -3.245940685272217, -3.136932134628296, -3.027923583984375, -2.918915033340454, -2.809906244277954, -2.700897693634033, -2.591888904571533, -2.4828803539276123, -2.3738718032836914, -2.2648630142211914, -2.1558542251586914, -2.0468456745147705, -1.9378368854522705, -1.8288283348083496, -1.7198195457458496, -1.6108109951019287, -1.5018023252487183, -1.3927936553955078, -1.2837849855422974, -1.174776315689087, -1.0657676458358765, -0.9567590355873108, -0.8477503657341003, -0.7387416958808899, -0.6297330856323242, -0.5207244157791138, -0.4117159843444824, -0.302707314491272, -0.1936986744403839, -0.08469003438949585, 0.0243186354637146, 0.13332730531692505, 0.24233591556549072, 0.35134458541870117, 0.4603532552719116, 0.5693619251251221, 0.6783705949783325, 0.7873792052268982, 0.8963878750801086, 1.0053966045379639, 1.1144051551818848, 1.2234138250350952, 1.3324224948883057, 1.4414311647415161, 1.5504398345947266, 1.6594483852386475, 1.7684571743011475, 1.8774657249450684, 1.9864743947982788, 2.0954830646514893, 2.20449161529541, 2.313500165939331, 2.422508955001831, 2.531517505645752, 2.640526294708252, 2.749534845352173, 2.8585433959960938, 2.9675521850585938, 3.0765609741210938]}, "gradients/decoder.roberta.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 7.0, 9.0, 18.0, 26.0, 31.0, 45.0, 54.0, 76.0, 85.0, 137.0, 207.0, 268.0, 439.0, 703.0, 1240.0, 2722.0, 9639.0, 60839.0, 986913.0, 2976808.0, 129352.0, 16597.0, 4067.0, 1615.0, 798.0, 480.0, 316.0, 216.0, 146.0, 111.0, 75.0, 56.0, 46.0, 34.0, 27.0, 13.0, 17.0, 15.0, 7.0, 5.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.06640625, -6.8321533203125, -6.597900390625, -6.3636474609375, -6.12939453125, -5.8951416015625, -5.660888671875, -5.4266357421875, -5.1923828125, -4.9581298828125, -4.723876953125, -4.4896240234375, -4.25537109375, -4.0211181640625, -3.786865234375, -3.5526123046875, -3.318359375, -3.0841064453125, -2.849853515625, -2.6156005859375, -2.38134765625, -2.1470947265625, -1.912841796875, -1.6785888671875, -1.4443359375, -1.2100830078125, -0.975830078125, -0.7415771484375, -0.50732421875, -0.2730712890625, -0.038818359375, 0.1954345703125, 0.4296875, 0.6639404296875, 0.898193359375, 1.1324462890625, 1.36669921875, 1.6009521484375, 1.835205078125, 2.0694580078125, 2.3037109375, 2.5379638671875, 2.772216796875, 3.0064697265625, 3.24072265625, 3.4749755859375, 3.709228515625, 3.9434814453125, 4.177734375, 4.4119873046875, 4.646240234375, 4.8804931640625, 5.11474609375, 5.3489990234375, 5.583251953125, 5.8175048828125, 6.0517578125, 6.2860107421875, 6.520263671875, 6.7545166015625, 6.98876953125, 7.2230224609375, 7.457275390625, 7.6915283203125, 7.92578125]}, "gradients/decoder.roberta.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 8.0, 3.0, 10.0, 4.0, 12.0, 9.0, 13.0, 22.0, 21.0, 20.0, 17.0, 21.0, 23.0, 29.0, 19.0, 36.0, 35.0, 30.0, 37.0, 39.0, 37.0, 46.0, 27.0, 47.0, 45.0, 30.0, 39.0, 34.0, 27.0, 36.0, 22.0, 34.0, 21.0, 28.0, 14.0, 11.0, 15.0, 12.0, 14.0, 7.0, 9.0, 4.0, 9.0, 7.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.8876953125, -1.8275146484375, -1.767333984375, -1.7071533203125, -1.64697265625, -1.5867919921875, -1.526611328125, -1.4664306640625, -1.40625, -1.3460693359375, -1.285888671875, -1.2257080078125, -1.16552734375, -1.1053466796875, -1.045166015625, -0.9849853515625, -0.9248046875, -0.8646240234375, -0.804443359375, -0.7442626953125, -0.68408203125, -0.6239013671875, -0.563720703125, -0.5035400390625, -0.443359375, -0.3831787109375, -0.322998046875, -0.2628173828125, -0.20263671875, -0.1424560546875, -0.082275390625, -0.0220947265625, 0.0380859375, 0.0982666015625, 0.158447265625, 0.2186279296875, 0.27880859375, 0.3389892578125, 0.399169921875, 0.4593505859375, 0.51953125, 0.5797119140625, 0.639892578125, 0.7000732421875, 0.76025390625, 0.8204345703125, 0.880615234375, 0.9407958984375, 1.0009765625, 1.0611572265625, 1.121337890625, 1.1815185546875, 1.24169921875, 1.3018798828125, 1.362060546875, 1.4222412109375, 1.482421875, 1.5426025390625, 1.602783203125, 1.6629638671875, 1.72314453125, 1.7833251953125, 1.843505859375, 1.9036865234375, 1.9638671875]}, "gradients/decoder.roberta.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 0.0, 0.0, 1.0, 5.0, 11.0, 9.0, 17.0, 21.0, 31.0, 59.0, 69.0, 115.0, 236.0, 729.0, 5696.0, 2952949.0, 1228589.0, 4595.0, 661.0, 186.0, 102.0, 73.0, 36.0, 23.0, 25.0, 10.0, 14.0, 9.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.380859375, -31.48046875, -30.580078125, -29.6796875, -28.779296875, -27.87890625, -26.978515625, -26.078125, -25.177734375, -24.27734375, -23.376953125, -22.4765625, -21.576171875, -20.67578125, -19.775390625, -18.875, -17.974609375, -17.07421875, -16.173828125, -15.2734375, -14.373046875, -13.47265625, -12.572265625, -11.671875, -10.771484375, -9.87109375, -8.970703125, -8.0703125, -7.169921875, -6.26953125, -5.369140625, -4.46875, -3.568359375, -2.66796875, -1.767578125, -0.8671875, 0.033203125, 0.93359375, 1.833984375, 2.734375, 3.634765625, 4.53515625, 5.435546875, 6.3359375, 7.236328125, 8.13671875, 9.037109375, 9.9375, 10.837890625, 11.73828125, 12.638671875, 13.5390625, 14.439453125, 15.33984375, 16.240234375, 17.140625, 18.041015625, 18.94140625, 19.841796875, 20.7421875, 21.642578125, 22.54296875, 23.443359375, 24.34375]}, "gradients/decoder.roberta.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 10.0, 11.0, 17.0, 11.0, 20.0, 30.0, 50.0, 65.0, 97.0, 123.0, 195.0, 359.0, 531.0, 712.0, 600.0, 378.0, 296.0, 149.0, 108.0, 72.0, 53.0, 42.0, 30.0, 28.0, 17.0, 13.0, 9.0, 11.0, 9.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.107421875, -1.068817138671875, -1.03021240234375, -0.991607666015625, -0.9530029296875, -0.914398193359375, -0.87579345703125, -0.837188720703125, -0.798583984375, -0.759979248046875, -0.72137451171875, -0.682769775390625, -0.6441650390625, -0.605560302734375, -0.56695556640625, -0.528350830078125, -0.48974609375, -0.451141357421875, -0.41253662109375, -0.373931884765625, -0.3353271484375, -0.296722412109375, -0.25811767578125, -0.219512939453125, -0.180908203125, -0.142303466796875, -0.10369873046875, -0.065093994140625, -0.0264892578125, 0.012115478515625, 0.05072021484375, 0.089324951171875, 0.1279296875, 0.166534423828125, 0.20513916015625, 0.243743896484375, 0.2823486328125, 0.320953369140625, 0.35955810546875, 0.398162841796875, 0.436767578125, 0.475372314453125, 0.51397705078125, 0.552581787109375, 0.5911865234375, 0.629791259765625, 0.66839599609375, 0.707000732421875, 0.74560546875, 0.784210205078125, 0.82281494140625, 0.861419677734375, 0.9000244140625, 0.938629150390625, 0.97723388671875, 1.015838623046875, 1.054443359375, 1.093048095703125, 1.13165283203125, 1.170257568359375, 1.2088623046875, 1.247467041015625, 1.28607177734375, 1.324676513671875, 1.36328125]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 7.0, 26.0, 52.0, 106.0, 158.0, 209.0, 169.0, 133.0, 77.0, 54.0, 14.0, 5.0, 2.0, 1.0], "bins": [-14.453320503234863, -14.194056510925293, -13.934793472290039, -13.675529479980469, -13.416265487670898, -13.157002449035645, -12.897738456726074, -12.63847541809082, -12.37921142578125, -12.11994743347168, -11.860684394836426, -11.601420402526855, -11.342157363891602, -11.082893371582031, -10.823629379272461, -10.564366340637207, -10.305102348327637, -10.045838356018066, -9.786575317382812, -9.527311325073242, -9.268047332763672, -9.008784294128418, -8.749520301818848, -8.490257263183594, -8.230993270874023, -7.971729755401611, -7.712466239929199, -7.453202247619629, -7.193938732147217, -6.934675216674805, -6.675411224365234, -6.416147708892822, -6.15688419342041, -5.897620677947998, -5.638357162475586, -5.379093170166016, -5.1198296546936035, -4.860566139221191, -4.601302146911621, -4.342038631439209, -4.082775115966797, -3.8235116004943848, -3.5642478466033936, -3.3049840927124023, -3.0457205772399902, -2.786457061767578, -2.527193307876587, -2.2679295539855957, -2.0086660385131836, -1.749402403831482, -1.4901387691497803, -1.2308751344680786, -0.971611499786377, -0.7123478651046753, -0.45308423042297363, -0.19382059574127197, 0.06544303894042969, 0.32470667362213135, 0.583970308303833, 0.8432339429855347, 1.1024975776672363, 1.361761212348938, 1.6210248470306396, 1.8802884817123413, 2.139552116394043]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 12.0, 16.0, 17.0, 19.0, 15.0, 28.0, 25.0, 34.0, 28.0, 36.0, 32.0, 37.0, 39.0, 37.0, 42.0, 41.0, 43.0, 36.0, 46.0, 46.0, 41.0, 44.0, 42.0, 25.0, 32.0, 28.0, 26.0, 22.0, 13.0, 19.0, 12.0, 19.0, 7.0, 4.0, 9.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5005202293395996, -2.4161431789398193, -2.331766128540039, -2.247389078140259, -2.1630120277404785, -2.0786352157592773, -1.994258165359497, -1.9098811149597168, -1.8255040645599365, -1.7411270141601562, -1.656749963760376, -1.5723730325698853, -1.487995982170105, -1.4036189317703247, -1.319242000579834, -1.2348649501800537, -1.1504878997802734, -1.0661108493804932, -0.9817338585853577, -0.8973568677902222, -0.8129798173904419, -0.7286027669906616, -0.6442257761955261, -0.5598487854003906, -0.47547173500061035, -0.39109471440315247, -0.3067176938056946, -0.2223406732082367, -0.1379636526107788, -0.05358663201332092, 0.030790388584136963, 0.11516737937927246, 0.19954419136047363, 0.2839212119579315, 0.3682982325553894, 0.4526752531528473, 0.5370522737503052, 0.6214293241500854, 0.705806314945221, 0.7901833057403564, 0.8745603561401367, 0.958937406539917, 1.0433144569396973, 1.127691388130188, 1.2120684385299683, 1.2964454889297485, 1.3808224201202393, 1.4651994705200195, 1.5495765209197998, 1.63395357131958, 1.7183306217193604, 1.802707552909851, 1.8870846033096313, 1.9714616537094116, 2.0558385848999023, 2.1402156352996826, 2.224592685699463, 2.308969736099243, 2.3933467864990234, 2.4777238368988037, 2.562100887298584, 2.646477699279785, 2.7308547496795654, 2.8152318000793457, 2.899608850479126]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 6.0, 11.0, 17.0, 26.0, 28.0, 48.0, 69.0, 102.0, 164.0, 225.0, 342.0, 546.0, 845.0, 1358.0, 2285.0, 3681.0, 6118.0, 10093.0, 17354.0, 31341.0, 57522.0, 112176.0, 224460.0, 267201.0, 147463.0, 72994.0, 38770.0, 21872.0, 12484.0, 7274.0, 4412.0, 2705.0, 1673.0, 1048.0, 647.0, 389.0, 255.0, 185.0, 105.0, 84.0, 61.0, 43.0, 25.0, 18.0, 15.0, 4.0, 7.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55322265625, -0.5354843139648438, -0.5177459716796875, -0.5000076293945312, -0.482269287109375, -0.46453094482421875, -0.4467926025390625, -0.42905426025390625, -0.41131591796875, -0.39357757568359375, -0.3758392333984375, -0.35810089111328125, -0.340362548828125, -0.32262420654296875, -0.3048858642578125, -0.28714752197265625, -0.2694091796875, -0.25167083740234375, -0.2339324951171875, -0.21619415283203125, -0.198455810546875, -0.18071746826171875, -0.1629791259765625, -0.14524078369140625, -0.12750244140625, -0.10976409912109375, -0.0920257568359375, -0.07428741455078125, -0.056549072265625, -0.03881072998046875, -0.0210723876953125, -0.00333404541015625, 0.014404296875, 0.03214263916015625, 0.0498809814453125, 0.06761932373046875, 0.085357666015625, 0.10309600830078125, 0.1208343505859375, 0.13857269287109375, 0.15631103515625, 0.17404937744140625, 0.1917877197265625, 0.20952606201171875, 0.227264404296875, 0.24500274658203125, 0.2627410888671875, 0.28047943115234375, 0.2982177734375, 0.31595611572265625, 0.3336944580078125, 0.35143280029296875, 0.369171142578125, 0.38690948486328125, 0.4046478271484375, 0.42238616943359375, 0.44012451171875, 0.45786285400390625, 0.4756011962890625, 0.49333953857421875, 0.511077880859375, 0.5288162231445312, 0.5465545654296875, 0.5642929077148438, 0.58203125]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 12.0, 14.0, 18.0, 16.0, 20.0, 26.0, 22.0, 39.0, 22.0, 39.0, 30.0, 40.0, 39.0, 36.0, 40.0, 43.0, 40.0, 38.0, 47.0, 44.0, 41.0, 44.0, 38.0, 29.0, 35.0, 29.0, 24.0, 24.0, 14.0, 17.0, 12.0, 16.0, 10.0, 6.0, 7.0, 10.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.607421875, -2.525299072265625, -2.44317626953125, -2.361053466796875, -2.2789306640625, -2.196807861328125, -2.11468505859375, -2.032562255859375, -1.950439453125, -1.868316650390625, -1.78619384765625, -1.704071044921875, -1.6219482421875, -1.539825439453125, -1.45770263671875, -1.375579833984375, -1.29345703125, -1.211334228515625, -1.12921142578125, -1.047088623046875, -0.9649658203125, -0.882843017578125, -0.80072021484375, -0.718597412109375, -0.636474609375, -0.554351806640625, -0.47222900390625, -0.390106201171875, -0.3079833984375, -0.225860595703125, -0.14373779296875, -0.061614990234375, 0.0205078125, 0.102630615234375, 0.18475341796875, 0.266876220703125, 0.3489990234375, 0.431121826171875, 0.51324462890625, 0.595367431640625, 0.677490234375, 0.759613037109375, 0.84173583984375, 0.923858642578125, 1.0059814453125, 1.088104248046875, 1.17022705078125, 1.252349853515625, 1.33447265625, 1.416595458984375, 1.49871826171875, 1.580841064453125, 1.6629638671875, 1.745086669921875, 1.82720947265625, 1.909332275390625, 1.991455078125, 2.073577880859375, 2.15570068359375, 2.237823486328125, 2.3199462890625, 2.402069091796875, 2.48419189453125, 2.566314697265625, 2.6484375]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 3.0, 6.0, 12.0, 21.0, 22.0, 29.0, 45.0, 73.0, 83.0, 120.0, 196.0, 323.0, 512.0, 787.0, 1575.0, 3482.0, 10299.0, 50406.0, 939237.0, 28286.0, 7109.0, 2711.0, 1280.0, 644.0, 426.0, 303.0, 177.0, 94.0, 82.0, 67.0, 46.0, 29.0, 26.0, 17.0, 8.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.11328125, -2.047943115234375, -1.98260498046875, -1.917266845703125, -1.8519287109375, -1.786590576171875, -1.72125244140625, -1.655914306640625, -1.590576171875, -1.525238037109375, -1.45989990234375, -1.394561767578125, -1.3292236328125, -1.263885498046875, -1.19854736328125, -1.133209228515625, -1.06787109375, -1.002532958984375, -0.93719482421875, -0.871856689453125, -0.8065185546875, -0.741180419921875, -0.67584228515625, -0.610504150390625, -0.545166015625, -0.479827880859375, -0.41448974609375, -0.349151611328125, -0.2838134765625, -0.218475341796875, -0.15313720703125, -0.087799072265625, -0.0224609375, 0.042877197265625, 0.10821533203125, 0.173553466796875, 0.2388916015625, 0.304229736328125, 0.36956787109375, 0.434906005859375, 0.500244140625, 0.565582275390625, 0.63092041015625, 0.696258544921875, 0.7615966796875, 0.826934814453125, 0.89227294921875, 0.957611083984375, 1.02294921875, 1.088287353515625, 1.15362548828125, 1.218963623046875, 1.2843017578125, 1.349639892578125, 1.41497802734375, 1.480316162109375, 1.545654296875, 1.610992431640625, 1.67633056640625, 1.741668701171875, 1.8070068359375, 1.872344970703125, 1.93768310546875, 2.003021240234375, 2.068359375]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 4.0, 8.0, 18.0, 16.0, 19.0, 20.0, 17.0, 20.0, 29.0, 32.0, 44.0, 45.0, 50.0, 36.0, 33.0, 56.0, 59.0, 40.0, 48.0, 49.0, 35.0, 45.0, 28.0, 39.0, 23.0, 24.0, 28.0, 25.0, 22.0, 22.0, 11.0, 17.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.31640625, -1.260345458984375, -1.20428466796875, -1.148223876953125, -1.0921630859375, -1.036102294921875, -0.98004150390625, -0.923980712890625, -0.867919921875, -0.811859130859375, -0.75579833984375, -0.699737548828125, -0.6436767578125, -0.587615966796875, -0.53155517578125, -0.475494384765625, -0.41943359375, -0.363372802734375, -0.30731201171875, -0.251251220703125, -0.1951904296875, -0.139129638671875, -0.08306884765625, -0.027008056640625, 0.029052734375, 0.085113525390625, 0.14117431640625, 0.197235107421875, 0.2532958984375, 0.309356689453125, 0.36541748046875, 0.421478271484375, 0.4775390625, 0.533599853515625, 0.58966064453125, 0.645721435546875, 0.7017822265625, 0.757843017578125, 0.81390380859375, 0.869964599609375, 0.926025390625, 0.982086181640625, 1.03814697265625, 1.094207763671875, 1.1502685546875, 1.206329345703125, 1.26239013671875, 1.318450927734375, 1.37451171875, 1.430572509765625, 1.48663330078125, 1.542694091796875, 1.5987548828125, 1.654815673828125, 1.71087646484375, 1.766937255859375, 1.822998046875, 1.879058837890625, 1.93511962890625, 1.991180419921875, 2.0472412109375, 2.103302001953125, 2.15936279296875, 2.215423583984375, 2.271484375]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 10.0, 19.0, 17.0, 27.0, 25.0, 33.0, 50.0, 63.0, 88.0, 132.0, 178.0, 250.0, 369.0, 599.0, 1031.0, 1929.0, 3825.0, 9940.0, 39192.0, 940786.0, 32791.0, 8824.0, 3781.0, 1749.0, 1003.0, 608.0, 338.0, 254.0, 181.0, 127.0, 78.0, 52.0, 44.0, 39.0, 28.0, 25.0, 14.0, 13.0, 5.0, 11.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.1890869140625, -0.18343353271484375, -0.1777801513671875, -0.17212677001953125, -0.166473388671875, -0.16082000732421875, -0.1551666259765625, -0.14951324462890625, -0.14385986328125, -0.13820648193359375, -0.1325531005859375, -0.12689971923828125, -0.121246337890625, -0.11559295654296875, -0.1099395751953125, -0.10428619384765625, -0.0986328125, -0.09297943115234375, -0.0873260498046875, -0.08167266845703125, -0.076019287109375, -0.07036590576171875, -0.0647125244140625, -0.05905914306640625, -0.05340576171875, -0.04775238037109375, -0.0420989990234375, -0.03644561767578125, -0.030792236328125, -0.02513885498046875, -0.0194854736328125, -0.01383209228515625, -0.0081787109375, -0.00252532958984375, 0.0031280517578125, 0.00878143310546875, 0.014434814453125, 0.02008819580078125, 0.0257415771484375, 0.03139495849609375, 0.03704833984375, 0.04270172119140625, 0.0483551025390625, 0.05400848388671875, 0.059661865234375, 0.06531524658203125, 0.0709686279296875, 0.07662200927734375, 0.082275390625, 0.08792877197265625, 0.0935821533203125, 0.09923553466796875, 0.104888916015625, 0.11054229736328125, 0.1161956787109375, 0.12184906005859375, 0.12750244140625, 0.13315582275390625, 0.1388092041015625, 0.14446258544921875, 0.150115966796875, 0.15576934814453125, 0.1614227294921875, 0.16707611083984375, 0.1727294921875]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 6.0, 5.0, 6.0, 13.0, 12.0, 20.0, 16.0, 29.0, 25.0, 41.0, 46.0, 45.0, 43.0, 60.0, 66.0, 63.0, 77.0, 53.0, 53.0, 53.0, 22.0, 49.0, 53.0, 41.0, 26.0, 14.0, 10.0, 9.0, 3.0, 6.0, 2.0, 7.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.4332275390625e-05, -3.3311545848846436e-05, -3.229081630706787e-05, -3.127008676528931e-05, -3.0249357223510742e-05, -2.9228627681732178e-05, -2.8207898139953613e-05, -2.718716859817505e-05, -2.6166439056396484e-05, -2.514570951461792e-05, -2.4124979972839355e-05, -2.310425043106079e-05, -2.2083520889282227e-05, -2.1062791347503662e-05, -2.0042061805725098e-05, -1.9021332263946533e-05, -1.800060272216797e-05, -1.6979873180389404e-05, -1.595914363861084e-05, -1.4938414096832275e-05, -1.3917684555053711e-05, -1.2896955013275146e-05, -1.1876225471496582e-05, -1.0855495929718018e-05, -9.834766387939453e-06, -8.814036846160889e-06, -7.793307304382324e-06, -6.77257776260376e-06, -5.751848220825195e-06, -4.731118679046631e-06, -3.7103891372680664e-06, -2.689659595489502e-06, -1.6689300537109375e-06, -6.48200511932373e-07, 3.725290298461914e-07, 1.3932585716247559e-06, 2.4139881134033203e-06, 3.4347176551818848e-06, 4.455447196960449e-06, 5.476176738739014e-06, 6.496906280517578e-06, 7.517635822296143e-06, 8.538365364074707e-06, 9.559094905853271e-06, 1.0579824447631836e-05, 1.16005539894104e-05, 1.2621283531188965e-05, 1.364201307296753e-05, 1.4662742614746094e-05, 1.5683472156524658e-05, 1.6704201698303223e-05, 1.7724931240081787e-05, 1.874566078186035e-05, 1.9766390323638916e-05, 2.078711986541748e-05, 2.1807849407196045e-05, 2.282857894897461e-05, 2.3849308490753174e-05, 2.4870038032531738e-05, 2.5890767574310303e-05, 2.6911497116088867e-05, 2.793222665786743e-05, 2.8952956199645996e-05, 2.997368574142456e-05, 3.0994415283203125e-05]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 8.0, 10.0, 6.0, 19.0, 15.0, 14.0, 24.0, 28.0, 52.0, 62.0, 164.0, 634.0, 5440.0, 120398.0, 888211.0, 30779.0, 1984.0, 341.0, 115.0, 58.0, 34.0, 28.0, 16.0, 20.0, 21.0, 12.0, 4.0, 9.0, 10.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32373046875, -0.31268310546875, -0.3016357421875, -0.29058837890625, -0.279541015625, -0.26849365234375, -0.2574462890625, -0.24639892578125, -0.2353515625, -0.22430419921875, -0.2132568359375, -0.20220947265625, -0.191162109375, -0.18011474609375, -0.1690673828125, -0.15802001953125, -0.14697265625, -0.13592529296875, -0.1248779296875, -0.11383056640625, -0.102783203125, -0.09173583984375, -0.0806884765625, -0.06964111328125, -0.05859375, -0.04754638671875, -0.0364990234375, -0.02545166015625, -0.014404296875, -0.00335693359375, 0.0076904296875, 0.01873779296875, 0.02978515625, 0.04083251953125, 0.0518798828125, 0.06292724609375, 0.073974609375, 0.08502197265625, 0.0960693359375, 0.10711669921875, 0.1181640625, 0.12921142578125, 0.1402587890625, 0.15130615234375, 0.162353515625, 0.17340087890625, 0.1844482421875, 0.19549560546875, 0.20654296875, 0.21759033203125, 0.2286376953125, 0.23968505859375, 0.250732421875, 0.26177978515625, 0.2728271484375, 0.28387451171875, 0.294921875, 0.30596923828125, 0.3170166015625, 0.32806396484375, 0.339111328125, 0.35015869140625, 0.3612060546875, 0.37225341796875, 0.38330078125]}, "gradients/decoder.roberta.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 8.0, 8.0, 6.0, 15.0, 14.0, 18.0, 12.0, 22.0, 24.0, 22.0, 42.0, 52.0, 84.0, 97.0, 127.0, 107.0, 97.0, 48.0, 39.0, 30.0, 18.0, 22.0, 14.0, 18.0, 7.0, 8.0, 8.0, 9.0, 7.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0224151611328125, -0.02176499366760254, -0.021114826202392578, -0.020464658737182617, -0.019814491271972656, -0.019164323806762695, -0.018514156341552734, -0.017863988876342773, -0.017213821411132812, -0.01656365394592285, -0.01591348648071289, -0.01526331901550293, -0.014613151550292969, -0.013962984085083008, -0.013312816619873047, -0.012662649154663086, -0.012012481689453125, -0.011362314224243164, -0.010712146759033203, -0.010061979293823242, -0.009411811828613281, -0.00876164436340332, -0.00811147689819336, -0.0074613094329833984, -0.0068111419677734375, -0.0061609745025634766, -0.005510807037353516, -0.004860639572143555, -0.004210472106933594, -0.003560304641723633, -0.002910137176513672, -0.002259969711303711, -0.00160980224609375, -0.0009596347808837891, -0.0003094673156738281, 0.0003407001495361328, 0.0009908676147460938, 0.0016410350799560547, 0.0022912025451660156, 0.0029413700103759766, 0.0035915374755859375, 0.0042417049407958984, 0.004891872406005859, 0.00554203987121582, 0.006192207336425781, 0.006842374801635742, 0.007492542266845703, 0.008142709732055664, 0.008792877197265625, 0.009443044662475586, 0.010093212127685547, 0.010743379592895508, 0.011393547058105469, 0.01204371452331543, 0.01269388198852539, 0.013344049453735352, 0.013994216918945312, 0.014644384384155273, 0.015294551849365234, 0.015944719314575195, 0.016594886779785156, 0.017245054244995117, 0.017895221710205078, 0.01854538917541504, 0.019195556640625]}, "gradients/decoder.roberta.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 13.0, 41.0, 111.0, 220.0, 278.0, 189.0, 109.0, 47.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4854736328125, -11.131376266479492, -10.777278900146484, -10.423181533813477, -10.069085121154785, -9.714987754821777, -9.36089038848877, -9.006793022155762, -8.65269660949707, -8.298599243164062, -7.944502353668213, -7.590404987335205, -7.2363080978393555, -6.882210731506348, -6.52811336517334, -6.174015998840332, -5.819918632507324, -5.465821266174316, -5.111724376678467, -4.757627010345459, -4.403530120849609, -4.049432754516602, -3.6953353881835938, -3.341238260269165, -2.9871411323547363, -2.6330440044403076, -2.278946876525879, -1.924849510192871, -1.5707523822784424, -1.2166552543640137, -0.8625578880310059, -0.5084607601165771, -0.15436458587646484, 0.19973260164260864, 0.5538297891616821, 0.9079270362854004, 1.262024164199829, 1.6161212921142578, 1.9702186584472656, 2.3243157863616943, 2.678412914276123, 3.0325100421905518, 3.3866071701049805, 3.7407045364379883, 4.094801902770996, 4.448898792266846, 4.8029961585998535, 5.157093048095703, 5.511190414428711, 5.865287780761719, 6.219384670257568, 6.573482036590576, 6.927578926086426, 7.281676292419434, 7.635773658752441, 7.989871025085449, 8.34396743774414, 8.698064804077148, 9.052162170410156, 9.406259536743164, 9.760355949401855, 10.114453315734863, 10.468550682067871, 10.822648048400879, 11.176745414733887]}, "gradients/decoder.roberta.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 12.0, 15.0, 17.0, 16.0, 20.0, 26.0, 22.0, 38.0, 24.0, 38.0, 32.0, 38.0, 39.0, 37.0, 39.0, 42.0, 43.0, 37.0, 47.0, 43.0, 42.0, 44.0, 38.0, 28.0, 34.0, 30.0, 24.0, 23.0, 15.0, 17.0, 13.0, 17.0, 9.0, 5.0, 7.0, 10.0, 3.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6092982292175293, -2.5270636081695557, -2.444828987121582, -2.3625946044921875, -2.280359983444214, -2.1981253623962402, -2.1158909797668457, -2.033656358718872, -1.9514217376708984, -1.8691871166229248, -1.7869526147842407, -1.7047181129455566, -1.622483491897583, -1.5402488708496094, -1.4580143690109253, -1.3757798671722412, -1.2935452461242676, -1.211310625076294, -1.1290761232376099, -1.0468416213989258, -0.9646070003509521, -0.8823724389076233, -0.8001378774642944, -0.7179033160209656, -0.6356687545776367, -0.5534341931343079, -0.471199631690979, -0.38896507024765015, -0.3067305088043213, -0.22449594736099243, -0.14226138591766357, -0.06002682447433472, 0.02220749855041504, 0.1044420599937439, 0.18667662143707275, 0.2689111828804016, 0.35114574432373047, 0.4333803057670593, 0.5156148672103882, 0.597849428653717, 0.6800839900970459, 0.7623185515403748, 0.8445531129837036, 0.9267876744270325, 1.0090222358703613, 1.091256856918335, 1.173491358757019, 1.2557258605957031, 1.3379604816436768, 1.4201951026916504, 1.5024296045303345, 1.5846641063690186, 1.6668987274169922, 1.7491333484649658, 1.83136785030365, 1.913602352142334, 1.9958369731903076, 2.0780715942382812, 2.160305976867676, 2.2425405979156494, 2.324775218963623, 2.4070098400115967, 2.4892444610595703, 2.571478843688965, 2.6537134647369385]}, "gradients/decoder.roberta.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 10.0, 13.0, 27.0, 31.0, 45.0, 82.0, 128.0, 221.0, 360.0, 672.0, 1210.0, 2257.0, 4217.0, 8556.0, 18351.0, 45511.0, 138644.0, 404942.0, 279863.0, 85940.0, 30451.0, 13395.0, 6373.0, 3169.0, 1749.0, 980.0, 560.0, 309.0, 158.0, 110.0, 63.0, 52.0, 32.0, 22.0, 10.0, 13.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.189453125, -3.089141845703125, -2.98883056640625, -2.888519287109375, -2.7882080078125, -2.687896728515625, -2.58758544921875, -2.487274169921875, -2.386962890625, -2.286651611328125, -2.18634033203125, -2.086029052734375, -1.9857177734375, -1.885406494140625, -1.78509521484375, -1.684783935546875, -1.58447265625, -1.484161376953125, -1.38385009765625, -1.283538818359375, -1.1832275390625, -1.082916259765625, -0.98260498046875, -0.882293701171875, -0.781982421875, -0.681671142578125, -0.58135986328125, -0.481048583984375, -0.3807373046875, -0.280426025390625, -0.18011474609375, -0.079803466796875, 0.0205078125, 0.120819091796875, 0.22113037109375, 0.321441650390625, 0.4217529296875, 0.522064208984375, 0.62237548828125, 0.722686767578125, 0.822998046875, 0.923309326171875, 1.02362060546875, 1.123931884765625, 1.2242431640625, 1.324554443359375, 1.42486572265625, 1.525177001953125, 1.62548828125, 1.725799560546875, 1.82611083984375, 1.926422119140625, 2.0267333984375, 2.127044677734375, 2.22735595703125, 2.327667236328125, 2.427978515625, 2.528289794921875, 2.62860107421875, 2.728912353515625, 2.8292236328125, 2.929534912109375, 3.02984619140625, 3.130157470703125, 3.23046875]}, "gradients/decoder.roberta.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 11.0, 14.0, 12.0, 20.0, 20.0, 17.0, 25.0, 32.0, 31.0, 25.0, 34.0, 35.0, 39.0, 41.0, 33.0, 42.0, 50.0, 40.0, 37.0, 46.0, 46.0, 38.0, 43.0, 37.0, 36.0, 20.0, 32.0, 23.0, 20.0, 16.0, 15.0, 12.0, 18.0, 7.0, 6.0, 8.0, 7.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.716796875, -2.63018798828125, -2.5435791015625, -2.45697021484375, -2.370361328125, -2.28375244140625, -2.1971435546875, -2.11053466796875, -2.02392578125, -1.93731689453125, -1.8507080078125, -1.76409912109375, -1.677490234375, -1.59088134765625, -1.5042724609375, -1.41766357421875, -1.3310546875, -1.24444580078125, -1.1578369140625, -1.07122802734375, -0.984619140625, -0.89801025390625, -0.8114013671875, -0.72479248046875, -0.63818359375, -0.55157470703125, -0.4649658203125, -0.37835693359375, -0.291748046875, -0.20513916015625, -0.1185302734375, -0.03192138671875, 0.0546875, 0.14129638671875, 0.2279052734375, 0.31451416015625, 0.401123046875, 0.48773193359375, 0.5743408203125, 0.66094970703125, 0.74755859375, 0.83416748046875, 0.9207763671875, 1.00738525390625, 1.093994140625, 1.18060302734375, 1.2672119140625, 1.35382080078125, 1.4404296875, 1.52703857421875, 1.6136474609375, 1.70025634765625, 1.786865234375, 1.87347412109375, 1.9600830078125, 2.04669189453125, 2.13330078125, 2.21990966796875, 2.3065185546875, 2.39312744140625, 2.479736328125, 2.56634521484375, 2.6529541015625, 2.73956298828125, 2.826171875]}, "gradients/decoder.roberta.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 3.0, 4.0, 9.0, 6.0, 7.0, 16.0, 13.0, 20.0, 22.0, 29.0, 30.0, 43.0, 52.0, 53.0, 95.0, 138.0, 258.0, 768.0, 1044569.0, 1462.0, 332.0, 151.0, 114.0, 64.0, 48.0, 45.0, 31.0, 25.0, 32.0, 20.0, 24.0, 16.0, 8.0, 2.0, 7.0, 7.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.5, -79.806640625, -77.11328125, -74.419921875, -71.7265625, -69.033203125, -66.33984375, -63.646484375, -60.953125, -58.259765625, -55.56640625, -52.873046875, -50.1796875, -47.486328125, -44.79296875, -42.099609375, -39.40625, -36.712890625, -34.01953125, -31.326171875, -28.6328125, -25.939453125, -23.24609375, -20.552734375, -17.859375, -15.166015625, -12.47265625, -9.779296875, -7.0859375, -4.392578125, -1.69921875, 0.994140625, 3.6875, 6.380859375, 9.07421875, 11.767578125, 14.4609375, 17.154296875, 19.84765625, 22.541015625, 25.234375, 27.927734375, 30.62109375, 33.314453125, 36.0078125, 38.701171875, 41.39453125, 44.087890625, 46.78125, 49.474609375, 52.16796875, 54.861328125, 57.5546875, 60.248046875, 62.94140625, 65.634765625, 68.328125, 71.021484375, 73.71484375, 76.408203125, 79.1015625, 81.794921875, 84.48828125, 87.181640625, 89.875]}, "gradients/decoder.roberta.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 5.0, 7.0, 4.0, 11.0, 15.0, 20.0, 22.0, 30.0, 25.0, 26.0, 37.0, 38.0, 44.0, 40.0, 48.0, 56.0, 43.0, 43.0, 44.0, 42.0, 51.0, 40.0, 42.0, 31.0, 38.0, 26.0, 31.0, 25.0, 20.0, 12.0, 16.0, 8.0, 9.0, 9.0, 5.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.12890625, -3.03546142578125, -2.9420166015625, -2.84857177734375, -2.755126953125, -2.66168212890625, -2.5682373046875, -2.47479248046875, -2.38134765625, -2.28790283203125, -2.1944580078125, -2.10101318359375, -2.007568359375, -1.91412353515625, -1.8206787109375, -1.72723388671875, -1.6337890625, -1.54034423828125, -1.4468994140625, -1.35345458984375, -1.260009765625, -1.16656494140625, -1.0731201171875, -0.97967529296875, -0.88623046875, -0.79278564453125, -0.6993408203125, -0.60589599609375, -0.512451171875, -0.41900634765625, -0.3255615234375, -0.23211669921875, -0.138671875, -0.04522705078125, 0.0482177734375, 0.14166259765625, 0.235107421875, 0.32855224609375, 0.4219970703125, 0.51544189453125, 0.60888671875, 0.70233154296875, 0.7957763671875, 0.88922119140625, 0.982666015625, 1.07611083984375, 1.1695556640625, 1.26300048828125, 1.3564453125, 1.44989013671875, 1.5433349609375, 1.63677978515625, 1.730224609375, 1.82366943359375, 1.9171142578125, 2.01055908203125, 2.10400390625, 2.19744873046875, 2.2908935546875, 2.38433837890625, 2.477783203125, 2.57122802734375, 2.6646728515625, 2.75811767578125, 2.8515625]}, "gradients/decoder.roberta.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 9.0, 8.0, 15.0, 26.0, 41.0, 83.0, 210.0, 471.0, 1452.0, 13098.0, 779962.0, 245522.0, 5916.0, 1015.0, 382.0, 175.0, 82.0, 38.0, 15.0, 10.0, 9.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53515625, -6.3363037109375, -6.137451171875, -5.9385986328125, -5.73974609375, -5.5408935546875, -5.342041015625, -5.1431884765625, -4.9443359375, -4.7454833984375, -4.546630859375, -4.3477783203125, -4.14892578125, -3.9500732421875, -3.751220703125, -3.5523681640625, -3.353515625, -3.1546630859375, -2.955810546875, -2.7569580078125, -2.55810546875, -2.3592529296875, -2.160400390625, -1.9615478515625, -1.7626953125, -1.5638427734375, -1.364990234375, -1.1661376953125, -0.96728515625, -0.7684326171875, -0.569580078125, -0.3707275390625, -0.171875, 0.0269775390625, 0.225830078125, 0.4246826171875, 0.62353515625, 0.8223876953125, 1.021240234375, 1.2200927734375, 1.4189453125, 1.6177978515625, 1.816650390625, 2.0155029296875, 2.21435546875, 2.4132080078125, 2.612060546875, 2.8109130859375, 3.009765625, 3.2086181640625, 3.407470703125, 3.6063232421875, 3.80517578125, 4.0040283203125, 4.202880859375, 4.4017333984375, 4.6005859375, 4.7994384765625, 4.998291015625, 5.1971435546875, 5.39599609375, 5.5948486328125, 5.793701171875, 5.9925537109375, 6.19140625]}, "gradients/decoder.roberta.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 11.0, 11.0, 11.0, 14.0, 28.0, 31.0, 57.0, 76.0, 101.0, 171.0, 161.0, 115.0, 72.0, 47.0, 31.0, 18.0, 8.0, 16.0, 11.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00040602684020996094, -0.0003967583179473877, -0.00038748979568481445, -0.0003782212734222412, -0.00036895275115966797, -0.0003596842288970947, -0.0003504157066345215, -0.00034114718437194824, -0.000331878662109375, -0.00032261013984680176, -0.0003133416175842285, -0.0003040730953216553, -0.00029480457305908203, -0.0002855360507965088, -0.00027626752853393555, -0.0002669990062713623, -0.00025773048400878906, -0.0002484619617462158, -0.00023919343948364258, -0.00022992491722106934, -0.0002206563949584961, -0.00021138787269592285, -0.0002021193504333496, -0.00019285082817077637, -0.00018358230590820312, -0.00017431378364562988, -0.00016504526138305664, -0.0001557767391204834, -0.00014650821685791016, -0.00013723969459533691, -0.00012797117233276367, -0.00011870265007019043, -0.00010943412780761719, -0.00010016560554504395, -9.08970832824707e-05, -8.162856101989746e-05, -7.236003875732422e-05, -6.309151649475098e-05, -5.3822994232177734e-05, -4.455447196960449e-05, -3.528594970703125e-05, -2.6017427444458008e-05, -1.6748905181884766e-05, -7.4803829193115234e-06, 1.7881393432617188e-06, 1.1056661605834961e-05, 2.0325183868408203e-05, 2.9593706130981445e-05, 3.886222839355469e-05, 4.813075065612793e-05, 5.739927291870117e-05, 6.666779518127441e-05, 7.593631744384766e-05, 8.52048397064209e-05, 9.447336196899414e-05, 0.00010374188423156738, 0.00011301040649414062, 0.00012227892875671387, 0.0001315474510192871, 0.00014081597328186035, 0.0001500844955444336, 0.00015935301780700684, 0.00016862154006958008, 0.00017789006233215332, 0.00018715858459472656]}, "gradients/decoder.roberta.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 26.0, 31.0, 54.0, 152.0, 608.0, 19426.0, 1025401.0, 2343.0, 307.0, 92.0, 43.0, 31.0, 14.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.859375, -17.26953125, -16.6796875, -16.08984375, -15.5, -14.91015625, -14.3203125, -13.73046875, -13.140625, -12.55078125, -11.9609375, -11.37109375, -10.78125, -10.19140625, -9.6015625, -9.01171875, -8.421875, -7.83203125, -7.2421875, -6.65234375, -6.0625, -5.47265625, -4.8828125, -4.29296875, -3.703125, -3.11328125, -2.5234375, -1.93359375, -1.34375, -0.75390625, -0.1640625, 0.42578125, 1.015625, 1.60546875, 2.1953125, 2.78515625, 3.375, 3.96484375, 4.5546875, 5.14453125, 5.734375, 6.32421875, 6.9140625, 7.50390625, 8.09375, 8.68359375, 9.2734375, 9.86328125, 10.453125, 11.04296875, 11.6328125, 12.22265625, 12.8125, 13.40234375, 13.9921875, 14.58203125, 15.171875, 15.76171875, 16.3515625, 16.94140625, 17.53125, 18.12109375, 18.7109375, 19.30078125, 19.890625]}, "gradients/decoder.roberta.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 13.0, 28.0, 38.0, 57.0, 103.0, 163.0, 238.0, 137.0, 89.0, 52.0, 37.0, 23.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.09765625, -1.0656967163085938, -1.0337371826171875, -1.0017776489257812, -0.969818115234375, -0.9378585815429688, -0.9058990478515625, -0.8739395141601562, -0.84197998046875, -0.8100204467773438, -0.7780609130859375, -0.7461013793945312, -0.714141845703125, -0.6821823120117188, -0.6502227783203125, -0.6182632446289062, -0.5863037109375, -0.5543441772460938, -0.5223846435546875, -0.49042510986328125, -0.458465576171875, -0.42650604248046875, -0.3945465087890625, -0.36258697509765625, -0.33062744140625, -0.29866790771484375, -0.2667083740234375, -0.23474884033203125, -0.202789306640625, -0.17082977294921875, -0.1388702392578125, -0.10691070556640625, -0.074951171875, -0.04299163818359375, -0.0110321044921875, 0.02092742919921875, 0.052886962890625, 0.08484649658203125, 0.1168060302734375, 0.14876556396484375, 0.18072509765625, 0.21268463134765625, 0.2446441650390625, 0.27660369873046875, 0.308563232421875, 0.34052276611328125, 0.3724822998046875, 0.40444183349609375, 0.4364013671875, 0.46836090087890625, 0.5003204345703125, 0.5322799682617188, 0.564239501953125, 0.5961990356445312, 0.6281585693359375, 0.6601181030273438, 0.69207763671875, 0.7240371704101562, 0.7559967041015625, 0.7879562377929688, 0.819915771484375, 0.8518753051757812, 0.8838348388671875, 0.9157943725585938, 0.94775390625]}, "gradients/decoder.roberta.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 9.0, 36.0, 147.0, 277.0, 293.0, 167.0, 72.0, 14.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.139297485351562, -13.684526443481445, -13.229755401611328, -12.774984359741211, -12.320213317871094, -11.865442276000977, -11.41067123413086, -10.955900192260742, -10.501129150390625, -10.046358108520508, -9.59158706665039, -9.136816024780273, -8.682044982910156, -8.227273941040039, -7.772502899169922, -7.317731857299805, -6.862961292266846, -6.4081902503967285, -5.953419208526611, -5.498648166656494, -5.043877124786377, -4.589106559753418, -4.134335517883301, -3.6795642375946045, -3.2247931957244873, -2.77002215385437, -2.315251111984253, -1.8604801893234253, -1.405709147453308, -0.9509382247924805, -0.4961671829223633, -0.041396141052246094, 0.4133749008178711, 0.8681459426879883, 1.3229169845581055, 1.777687907218933, 2.23245906829834, 2.687229871749878, 3.142000913619995, 3.5967719554901123, 4.051543235778809, 4.506314277648926, 4.961085319519043, 5.41585636138916, 5.870627403259277, 6.3253984451293945, 6.780169486999512, 7.234940528869629, 7.689711093902588, 8.144481658935547, 8.599252700805664, 9.054023742675781, 9.508794784545898, 9.963565826416016, 10.418336868286133, 10.87310791015625, 11.327878952026367, 11.782649993896484, 12.237421035766602, 12.692192077636719, 13.146963119506836, 13.601734161376953, 14.05650520324707, 14.511276245117188, 14.966047286987305]}, "gradients/decoder.roberta.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 4.0, 5.0, 9.0, 13.0, 12.0, 20.0, 20.0, 34.0, 18.0, 32.0, 30.0, 28.0, 26.0, 50.0, 45.0, 37.0, 40.0, 49.0, 52.0, 51.0, 39.0, 38.0, 39.0, 54.0, 30.0, 35.0, 34.0, 25.0, 18.0, 11.0, 19.0, 16.0, 12.0, 10.0, 8.0, 5.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.1062488555908203, -2.9865472316741943, -2.8668456077575684, -2.7471439838409424, -2.6274423599243164, -2.5077409744262695, -2.3880391120910645, -2.2683377265930176, -2.1486361026763916, -2.0289344787597656, -1.9092328548431396, -1.7895312309265137, -1.6698297262191772, -1.5501281023025513, -1.4304264783859253, -1.3107249736785889, -1.1910232305526733, -1.0713216066360474, -0.9516200423240662, -0.8319184184074402, -0.712216854095459, -0.592515230178833, -0.47281360626220703, -0.35311204195022583, -0.23341041803359985, -0.11370881646871567, 0.005992785096168518, 0.1256943941116333, 0.2453959882259369, 0.3650975823402405, 0.48479920625686646, 0.6045007705688477, 0.7242023944854736, 0.8439040184020996, 0.9636055827140808, 1.0833072662353516, 1.203008770942688, 1.322710394859314, 1.44241201877594, 1.5621135234832764, 1.6818151473999023, 1.8015167713165283, 1.9212183952331543, 2.0409200191497803, 2.1606216430664062, 2.280323028564453, 2.400024890899658, 2.519726276397705, 2.63942813873291, 2.759129762649536, 2.878831386566162, 2.998533010482788, 3.118234634399414, 3.237936019897461, 3.357637882232666, 3.477339267730713, 3.597040891647339, 3.716742515563965, 3.836444139480591, 3.956145763397217, 4.075847148895264, 4.195549011230469, 4.315250396728516, 4.434952259063721, 4.554653644561768]}, "gradients/decoder.roberta.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 2.0, 6.0, 9.0, 10.0, 6.0, 13.0, 20.0, 21.0, 20.0, 44.0, 31.0, 54.0, 68.0, 82.0, 130.0, 144.0, 217.0, 243.0, 337.0, 472.0, 747.0, 1263.0, 2665.0, 6712.0, 22602.0, 107542.0, 978163.0, 2768630.0, 242477.0, 41743.0, 11174.0, 3750.0, 1743.0, 896.0, 550.0, 409.0, 305.0, 207.0, 161.0, 141.0, 96.0, 77.0, 65.0, 59.0, 58.0, 28.0, 32.0, 13.0, 16.0, 13.0, 5.0, 4.0, 6.0, 7.0, 0.0, 2.0], "bins": [-5.48046875, -5.3248291015625, -5.169189453125, -5.0135498046875, -4.85791015625, -4.7022705078125, -4.546630859375, -4.3909912109375, -4.2353515625, -4.0797119140625, -3.924072265625, -3.7684326171875, -3.61279296875, -3.4571533203125, -3.301513671875, -3.1458740234375, -2.990234375, -2.8345947265625, -2.678955078125, -2.5233154296875, -2.36767578125, -2.2120361328125, -2.056396484375, -1.9007568359375, -1.7451171875, -1.5894775390625, -1.433837890625, -1.2781982421875, -1.12255859375, -0.9669189453125, -0.811279296875, -0.6556396484375, -0.5, -0.3443603515625, -0.188720703125, -0.0330810546875, 0.12255859375, 0.2781982421875, 0.433837890625, 0.5894775390625, 0.7451171875, 0.9007568359375, 1.056396484375, 1.2120361328125, 1.36767578125, 1.5233154296875, 1.678955078125, 1.8345947265625, 1.990234375, 2.1458740234375, 2.301513671875, 2.4571533203125, 2.61279296875, 2.7684326171875, 2.924072265625, 3.0797119140625, 3.2353515625, 3.3909912109375, 3.546630859375, 3.7022705078125, 3.85791015625, 4.0135498046875, 4.169189453125, 4.3248291015625, 4.48046875]}, "gradients/decoder.roberta.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 7.0, 4.0, 6.0, 7.0, 15.0, 19.0, 18.0, 20.0, 21.0, 22.0, 27.0, 35.0, 37.0, 27.0, 43.0, 48.0, 54.0, 40.0, 35.0, 44.0, 39.0, 50.0, 42.0, 34.0, 45.0, 42.0, 32.0, 34.0, 26.0, 22.0, 20.0, 14.0, 15.0, 17.0, 6.0, 9.0, 5.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.28515625, -2.212158203125, -2.13916015625, -2.066162109375, -1.9931640625, -1.920166015625, -1.84716796875, -1.774169921875, -1.701171875, -1.628173828125, -1.55517578125, -1.482177734375, -1.4091796875, -1.336181640625, -1.26318359375, -1.190185546875, -1.1171875, -1.044189453125, -0.97119140625, -0.898193359375, -0.8251953125, -0.752197265625, -0.67919921875, -0.606201171875, -0.533203125, -0.460205078125, -0.38720703125, -0.314208984375, -0.2412109375, -0.168212890625, -0.09521484375, -0.022216796875, 0.05078125, 0.123779296875, 0.19677734375, 0.269775390625, 0.3427734375, 0.415771484375, 0.48876953125, 0.561767578125, 0.634765625, 0.707763671875, 0.78076171875, 0.853759765625, 0.9267578125, 0.999755859375, 1.07275390625, 1.145751953125, 1.21875, 1.291748046875, 1.36474609375, 1.437744140625, 1.5107421875, 1.583740234375, 1.65673828125, 1.729736328125, 1.802734375, 1.875732421875, 1.94873046875, 2.021728515625, 2.0947265625, 2.167724609375, 2.24072265625, 2.313720703125, 2.38671875]}, "gradients/decoder.roberta.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 6.0, 11.0, 15.0, 14.0, 27.0, 30.0, 35.0, 66.0, 93.0, 175.0, 266.0, 561.0, 3537.0, 222576.0, 3949781.0, 14936.0, 1196.0, 352.0, 183.0, 123.0, 80.0, 52.0, 41.0, 40.0, 17.0, 10.0, 7.0, 8.0, 4.0, 7.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.48193359375, -16.7607421875, -16.03955078125, -15.318359375, -14.59716796875, -13.8759765625, -13.15478515625, -12.43359375, -11.71240234375, -10.9912109375, -10.27001953125, -9.548828125, -8.82763671875, -8.1064453125, -7.38525390625, -6.6640625, -5.94287109375, -5.2216796875, -4.50048828125, -3.779296875, -3.05810546875, -2.3369140625, -1.61572265625, -0.89453125, -0.17333984375, 0.5478515625, 1.26904296875, 1.990234375, 2.71142578125, 3.4326171875, 4.15380859375, 4.875, 5.59619140625, 6.3173828125, 7.03857421875, 7.759765625, 8.48095703125, 9.2021484375, 9.92333984375, 10.64453125, 11.36572265625, 12.0869140625, 12.80810546875, 13.529296875, 14.25048828125, 14.9716796875, 15.69287109375, 16.4140625, 17.13525390625, 17.8564453125, 18.57763671875, 19.298828125, 20.02001953125, 20.7412109375, 21.46240234375, 22.18359375, 22.90478515625, 23.6259765625, 24.34716796875, 25.068359375, 25.78955078125, 26.5107421875, 27.23193359375, 27.953125]}, "gradients/decoder.roberta.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 9.0, 4.0, 8.0, 9.0, 26.0, 43.0, 50.0, 52.0, 80.0, 132.0, 197.0, 268.0, 485.0, 696.0, 639.0, 476.0, 288.0, 194.0, 127.0, 72.0, 59.0, 39.0, 32.0, 17.0, 19.0, 10.0, 8.0, 6.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.55078125, -1.5099334716796875, -1.469085693359375, -1.4282379150390625, -1.38739013671875, -1.3465423583984375, -1.305694580078125, -1.2648468017578125, -1.2239990234375, -1.1831512451171875, -1.142303466796875, -1.1014556884765625, -1.06060791015625, -1.0197601318359375, -0.978912353515625, -0.9380645751953125, -0.897216796875, -0.8563690185546875, -0.815521240234375, -0.7746734619140625, -0.73382568359375, -0.6929779052734375, -0.652130126953125, -0.6112823486328125, -0.5704345703125, -0.5295867919921875, -0.488739013671875, -0.4478912353515625, -0.40704345703125, -0.3661956787109375, -0.325347900390625, -0.2845001220703125, -0.24365234375, -0.2028045654296875, -0.161956787109375, -0.1211090087890625, -0.08026123046875, -0.0394134521484375, 0.001434326171875, 0.0422821044921875, 0.0831298828125, 0.1239776611328125, 0.164825439453125, 0.2056732177734375, 0.24652099609375, 0.2873687744140625, 0.328216552734375, 0.3690643310546875, 0.409912109375, 0.4507598876953125, 0.491607666015625, 0.5324554443359375, 0.57330322265625, 0.6141510009765625, 0.654998779296875, 0.6958465576171875, 0.7366943359375, 0.7775421142578125, 0.818389892578125, 0.8592376708984375, 0.90008544921875, 0.9409332275390625, 0.981781005859375, 1.0226287841796875, 1.0634765625]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 9.0, 16.0, 21.0, 42.0, 65.0, 90.0, 86.0, 102.0, 112.0, 107.0, 111.0, 80.0, 54.0, 52.0, 26.0, 15.0, 10.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.164712905883789, -5.010464668273926, -4.856216907501221, -4.701968669891357, -4.547720909118652, -4.393472671508789, -4.239224433898926, -4.0849761962890625, -3.9307284355163574, -3.7764804363250732, -3.622232437133789, -3.467984199523926, -3.3137362003326416, -3.1594882011413574, -3.005239963531494, -2.85099196434021, -2.696743965148926, -2.5424959659576416, -2.3882479667663574, -2.233999729156494, -2.07975172996521, -1.9255037307739258, -1.771255612373352, -1.6170074939727783, -1.4627594947814941, -1.30851149559021, -1.1542633771896362, -1.0000152587890625, -0.8457672595977783, -0.6915192008018494, -0.5372711420059204, -0.3830230236053467, -0.2287745475769043, -0.07452648878097534, 0.07972157001495361, 0.23396962881088257, 0.3882176876068115, 0.5424657464027405, 0.6967138051986694, 0.8509619235992432, 1.0052099227905273, 1.1594579219818115, 1.3137060403823853, 1.467954158782959, 1.6222021579742432, 1.7764501571655273, 1.930698275566101, 2.084946393966675, 2.239194393157959, 2.393442392349243, 2.5476903915405273, 2.7019386291503906, 2.856186628341675, 3.010434627532959, 3.1646828651428223, 3.3189308643341064, 3.4731788635253906, 3.627426862716675, 3.781674861907959, 3.9359230995178223, 4.090170860290527, 4.244419097900391, 4.398667335510254, 4.552915573120117, 4.707163333892822]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 6.0, 1.0, 5.0, 7.0, 8.0, 13.0, 17.0, 17.0, 17.0, 25.0, 17.0, 33.0, 30.0, 28.0, 32.0, 31.0, 42.0, 44.0, 33.0, 44.0, 61.0, 40.0, 46.0, 45.0, 40.0, 43.0, 22.0, 30.0, 25.0, 33.0, 27.0, 19.0, 23.0, 18.0, 18.0, 13.0, 9.0, 13.0, 7.0, 5.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.2238857746124268, -2.1420106887817383, -2.0601353645324707, -1.9782601594924927, -1.8963849544525146, -1.8145098686218262, -1.7326346635818481, -1.6507594585418701, -1.568884253501892, -1.487009048461914, -1.405133843421936, -1.323258638381958, -1.2413835525512695, -1.159508228302002, -1.0776331424713135, -0.9957579374313354, -0.9138827323913574, -0.8320075273513794, -0.7501323223114014, -0.6682571768760681, -0.5863819718360901, -0.5045067667961121, -0.4226315915584564, -0.3407564163208008, -0.25888121128082275, -0.17700602114200592, -0.09513083100318909, -0.013255640864372253, 0.06861954927444458, 0.1504947543144226, 0.23236992955207825, 0.3142451047897339, 0.3961203098297119, 0.47799551486968994, 0.559870719909668, 0.6417458653450012, 0.7236210703849792, 0.8054962754249573, 0.8873714208602905, 0.9692466259002686, 1.0511218309402466, 1.1329970359802246, 1.2148722410202026, 1.2967474460601807, 1.3786225318908691, 1.4604978561401367, 1.5423729419708252, 1.6242481470108032, 1.7061233520507812, 1.7879985570907593, 1.8698737621307373, 1.9517489671707153, 2.0336241722106934, 2.115499258041382, 2.1973745822906494, 2.279249668121338, 2.3611249923706055, 2.443000078201294, 2.5248754024505615, 2.60675048828125, 2.6886258125305176, 2.770500898361206, 2.8523762226104736, 2.934251308441162, 3.0161263942718506]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 14.0, 14.0, 20.0, 43.0, 48.0, 69.0, 93.0, 177.0, 262.0, 449.0, 707.0, 1059.0, 1822.0, 2836.0, 4660.0, 7855.0, 13418.0, 23474.0, 43569.0, 85441.0, 177060.0, 285405.0, 196280.0, 94647.0, 47594.0, 25439.0, 14424.0, 8386.0, 5102.0, 3158.0, 1882.0, 1159.0, 681.0, 453.0, 314.0, 177.0, 129.0, 70.0, 61.0, 35.0, 21.0, 14.0, 11.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.5859375, -0.5679473876953125, -0.549957275390625, -0.5319671630859375, -0.51397705078125, -0.4959869384765625, -0.477996826171875, -0.4600067138671875, -0.4420166015625, -0.4240264892578125, -0.406036376953125, -0.3880462646484375, -0.37005615234375, -0.3520660400390625, -0.334075927734375, -0.3160858154296875, -0.298095703125, -0.2801055908203125, -0.262115478515625, -0.2441253662109375, -0.22613525390625, -0.2081451416015625, -0.190155029296875, -0.1721649169921875, -0.1541748046875, -0.1361846923828125, -0.118194580078125, -0.1002044677734375, -0.08221435546875, -0.0642242431640625, -0.046234130859375, -0.0282440185546875, -0.01025390625, 0.0077362060546875, 0.025726318359375, 0.0437164306640625, 0.06170654296875, 0.0796966552734375, 0.097686767578125, 0.1156768798828125, 0.1336669921875, 0.1516571044921875, 0.169647216796875, 0.1876373291015625, 0.20562744140625, 0.2236175537109375, 0.241607666015625, 0.2595977783203125, 0.277587890625, 0.2955780029296875, 0.313568115234375, 0.3315582275390625, 0.34954833984375, 0.3675384521484375, 0.385528564453125, 0.4035186767578125, 0.4215087890625, 0.4394989013671875, 0.457489013671875, 0.4754791259765625, 0.49346923828125, 0.5114593505859375, 0.529449462890625, 0.5474395751953125, 0.5654296875]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 6.0, 5.0, 1.0, 5.0, 2.0, 5.0, 7.0, 8.0, 13.0, 14.0, 21.0, 14.0, 23.0, 20.0, 32.0, 31.0, 28.0, 33.0, 30.0, 39.0, 48.0, 32.0, 46.0, 55.0, 43.0, 46.0, 47.0, 38.0, 41.0, 23.0, 34.0, 24.0, 33.0, 26.0, 21.0, 20.0, 20.0, 19.0, 12.0, 9.0, 13.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.142578125, -2.062744140625, -1.98291015625, -1.903076171875, -1.8232421875, -1.743408203125, -1.66357421875, -1.583740234375, -1.50390625, -1.424072265625, -1.34423828125, -1.264404296875, -1.1845703125, -1.104736328125, -1.02490234375, -0.945068359375, -0.865234375, -0.785400390625, -0.70556640625, -0.625732421875, -0.5458984375, -0.466064453125, -0.38623046875, -0.306396484375, -0.2265625, -0.146728515625, -0.06689453125, 0.012939453125, 0.0927734375, 0.172607421875, 0.25244140625, 0.332275390625, 0.412109375, 0.491943359375, 0.57177734375, 0.651611328125, 0.7314453125, 0.811279296875, 0.89111328125, 0.970947265625, 1.05078125, 1.130615234375, 1.21044921875, 1.290283203125, 1.3701171875, 1.449951171875, 1.52978515625, 1.609619140625, 1.689453125, 1.769287109375, 1.84912109375, 1.928955078125, 2.0087890625, 2.088623046875, 2.16845703125, 2.248291015625, 2.328125, 2.407958984375, 2.48779296875, 2.567626953125, 2.6474609375, 2.727294921875, 2.80712890625, 2.886962890625, 2.966796875]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 12.0, 7.0, 9.0, 10.0, 11.0, 17.0, 27.0, 35.0, 53.0, 54.0, 85.0, 100.0, 149.0, 194.0, 285.0, 412.0, 634.0, 957.0, 1688.0, 3295.0, 7891.0, 23583.0, 886435.0, 88412.0, 19836.0, 6878.0, 3062.0, 1526.0, 919.0, 562.0, 415.0, 290.0, 174.0, 128.0, 97.0, 71.0, 65.0, 47.0, 39.0, 23.0, 18.0, 5.0, 12.0, 9.0, 7.0, 4.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5888671875, -1.540618896484375, -1.49237060546875, -1.444122314453125, -1.3958740234375, -1.347625732421875, -1.29937744140625, -1.251129150390625, -1.202880859375, -1.154632568359375, -1.10638427734375, -1.058135986328125, -1.0098876953125, -0.961639404296875, -0.91339111328125, -0.865142822265625, -0.81689453125, -0.768646240234375, -0.72039794921875, -0.672149658203125, -0.6239013671875, -0.575653076171875, -0.52740478515625, -0.479156494140625, -0.430908203125, -0.382659912109375, -0.33441162109375, -0.286163330078125, -0.2379150390625, -0.189666748046875, -0.14141845703125, -0.093170166015625, -0.044921875, 0.003326416015625, 0.05157470703125, 0.099822998046875, 0.1480712890625, 0.196319580078125, 0.24456787109375, 0.292816162109375, 0.341064453125, 0.389312744140625, 0.43756103515625, 0.485809326171875, 0.5340576171875, 0.582305908203125, 0.63055419921875, 0.678802490234375, 0.72705078125, 0.775299072265625, 0.82354736328125, 0.871795654296875, 0.9200439453125, 0.968292236328125, 1.01654052734375, 1.064788818359375, 1.113037109375, 1.161285400390625, 1.20953369140625, 1.257781982421875, 1.3060302734375, 1.354278564453125, 1.40252685546875, 1.450775146484375, 1.4990234375]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 12.0, 7.0, 5.0, 3.0, 10.0, 8.0, 18.0, 21.0, 25.0, 18.0, 31.0, 36.0, 38.0, 35.0, 36.0, 37.0, 48.0, 40.0, 39.0, 43.0, 38.0, 44.0, 40.0, 34.0, 43.0, 37.0, 28.0, 39.0, 26.0, 30.0, 24.0, 15.0, 25.0, 10.0, 12.0, 11.0, 9.0, 9.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.9150390625, -1.8620147705078125, -1.808990478515625, -1.7559661865234375, -1.70294189453125, -1.6499176025390625, -1.596893310546875, -1.5438690185546875, -1.4908447265625, -1.4378204345703125, -1.384796142578125, -1.3317718505859375, -1.27874755859375, -1.2257232666015625, -1.172698974609375, -1.1196746826171875, -1.066650390625, -1.0136260986328125, -0.960601806640625, -0.9075775146484375, -0.85455322265625, -0.8015289306640625, -0.748504638671875, -0.6954803466796875, -0.6424560546875, -0.5894317626953125, -0.536407470703125, -0.4833831787109375, -0.43035888671875, -0.3773345947265625, -0.324310302734375, -0.2712860107421875, -0.21826171875, -0.1652374267578125, -0.112213134765625, -0.0591888427734375, -0.00616455078125, 0.0468597412109375, 0.099884033203125, 0.1529083251953125, 0.2059326171875, 0.2589569091796875, 0.311981201171875, 0.3650054931640625, 0.41802978515625, 0.4710540771484375, 0.524078369140625, 0.5771026611328125, 0.630126953125, 0.6831512451171875, 0.736175537109375, 0.7891998291015625, 0.84222412109375, 0.8952484130859375, 0.948272705078125, 1.0012969970703125, 1.0543212890625, 1.1073455810546875, 1.160369873046875, 1.2133941650390625, 1.26641845703125, 1.3194427490234375, 1.372467041015625, 1.4254913330078125, 1.478515625]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 10.0, 16.0, 21.0, 21.0, 20.0, 27.0, 48.0, 73.0, 105.0, 126.0, 212.0, 361.0, 523.0, 942.0, 1688.0, 3832.0, 11205.0, 60464.0, 938209.0, 19550.0, 5660.0, 2439.0, 1172.0, 618.0, 386.0, 241.0, 166.0, 113.0, 84.0, 61.0, 35.0, 27.0, 26.0, 14.0, 8.0, 12.0, 8.0, 5.0, 8.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0], "bins": [-0.226318359375, -0.21970176696777344, -0.21308517456054688, -0.2064685821533203, -0.19985198974609375, -0.1932353973388672, -0.18661880493164062, -0.18000221252441406, -0.1733856201171875, -0.16676902770996094, -0.16015243530273438, -0.1535358428955078, -0.14691925048828125, -0.1403026580810547, -0.13368606567382812, -0.12706947326660156, -0.120452880859375, -0.11383628845214844, -0.10721969604492188, -0.10060310363769531, -0.09398651123046875, -0.08736991882324219, -0.08075332641601562, -0.07413673400878906, -0.0675201416015625, -0.06090354919433594, -0.054286956787109375, -0.04767036437988281, -0.04105377197265625, -0.03443717956542969, -0.027820587158203125, -0.021203994750976562, -0.01458740234375, -0.007970809936523438, -0.001354217529296875, 0.0052623748779296875, 0.01187896728515625, 0.018495559692382812, 0.025112152099609375, 0.03172874450683594, 0.0383453369140625, 0.04496192932128906, 0.051578521728515625, 0.05819511413574219, 0.06481170654296875, 0.07142829895019531, 0.07804489135742188, 0.08466148376464844, 0.091278076171875, 0.09789466857910156, 0.10451126098632812, 0.11112785339355469, 0.11774444580078125, 0.12436103820800781, 0.13097763061523438, 0.13759422302246094, 0.1442108154296875, 0.15082740783691406, 0.15744400024414062, 0.1640605926513672, 0.17067718505859375, 0.1772937774658203, 0.18391036987304688, 0.19052696228027344, 0.1971435546875]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 5.0, 7.0, 4.0, 6.0, 17.0, 9.0, 16.0, 17.0, 20.0, 26.0, 43.0, 50.0, 33.0, 72.0, 54.0, 61.0, 60.0, 53.0, 57.0, 62.0, 49.0, 37.0, 48.0, 29.0, 31.0, 22.0, 16.0, 18.0, 22.0, 6.0, 6.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.0650367736816406e-05, -3.954209387302399e-05, -3.843382000923157e-05, -3.732554614543915e-05, -3.621727228164673e-05, -3.510899841785431e-05, -3.400072455406189e-05, -3.289245069026947e-05, -3.178417682647705e-05, -3.067590296268463e-05, -2.9567629098892212e-05, -2.8459355235099792e-05, -2.7351081371307373e-05, -2.6242807507514954e-05, -2.5134533643722534e-05, -2.4026259779930115e-05, -2.2917985916137695e-05, -2.1809712052345276e-05, -2.0701438188552856e-05, -1.9593164324760437e-05, -1.8484890460968018e-05, -1.7376616597175598e-05, -1.626834273338318e-05, -1.516006886959076e-05, -1.405179500579834e-05, -1.294352114200592e-05, -1.1835247278213501e-05, -1.0726973414421082e-05, -9.618699550628662e-06, -8.510425686836243e-06, -7.402151823043823e-06, -6.293877959251404e-06, -5.185604095458984e-06, -4.077330231666565e-06, -2.9690563678741455e-06, -1.860782504081726e-06, -7.525086402893066e-07, 3.557652235031128e-07, 1.4640390872955322e-06, 2.5723129510879517e-06, 3.680586814880371e-06, 4.7888606786727905e-06, 5.89713454246521e-06, 7.005408406257629e-06, 8.113682270050049e-06, 9.221956133842468e-06, 1.0330229997634888e-05, 1.1438503861427307e-05, 1.2546777725219727e-05, 1.3655051589012146e-05, 1.4763325452804565e-05, 1.5871599316596985e-05, 1.6979873180389404e-05, 1.8088147044181824e-05, 1.9196420907974243e-05, 2.0304694771766663e-05, 2.1412968635559082e-05, 2.25212424993515e-05, 2.362951636314392e-05, 2.473779022693634e-05, 2.584606409072876e-05, 2.695433795452118e-05, 2.80626118183136e-05, 2.9170885682106018e-05, 3.0279159545898438e-05]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 9.0, 5.0, 4.0, 2.0, 11.0, 11.0, 20.0, 28.0, 46.0, 80.0, 262.0, 2077.0, 102486.0, 929542.0, 13006.0, 631.0, 140.0, 65.0, 30.0, 18.0, 19.0, 17.0, 8.0, 8.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50439453125, -0.4892311096191406, -0.47406768798828125, -0.4589042663574219, -0.4437408447265625, -0.4285774230957031, -0.41341400146484375, -0.3982505798339844, -0.383087158203125, -0.3679237365722656, -0.35276031494140625, -0.3375968933105469, -0.3224334716796875, -0.3072700500488281, -0.29210662841796875, -0.2769432067871094, -0.26177978515625, -0.24661636352539062, -0.23145294189453125, -0.21628952026367188, -0.2011260986328125, -0.18596267700195312, -0.17079925537109375, -0.15563583374023438, -0.140472412109375, -0.12530899047851562, -0.11014556884765625, -0.09498214721679688, -0.0798187255859375, -0.06465530395507812, -0.04949188232421875, -0.034328460693359375, -0.0191650390625, -0.004001617431640625, 0.01116180419921875, 0.026325225830078125, 0.0414886474609375, 0.056652069091796875, 0.07181549072265625, 0.08697891235351562, 0.102142333984375, 0.11730575561523438, 0.13246917724609375, 0.14763259887695312, 0.1627960205078125, 0.17795944213867188, 0.19312286376953125, 0.20828628540039062, 0.22344970703125, 0.23861312866210938, 0.25377655029296875, 0.2689399719238281, 0.2841033935546875, 0.2992668151855469, 0.31443023681640625, 0.3295936584472656, 0.344757080078125, 0.3599205017089844, 0.37508392333984375, 0.3902473449707031, 0.4054107666015625, 0.4205741882324219, 0.43573760986328125, 0.4509010314941406, 0.466064453125]}, "gradients/decoder.roberta.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 1.0, 5.0, 2.0, 8.0, 9.0, 11.0, 10.0, 21.0, 18.0, 46.0, 51.0, 77.0, 111.0, 144.0, 139.0, 108.0, 63.0, 43.0, 30.0, 20.0, 21.0, 15.0, 12.0, 4.0, 4.0, 1.0, 10.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02471923828125, -0.023919343948364258, -0.023119449615478516, -0.022319555282592773, -0.02151966094970703, -0.02071976661682129, -0.019919872283935547, -0.019119977951049805, -0.018320083618164062, -0.01752018928527832, -0.016720294952392578, -0.015920400619506836, -0.015120506286621094, -0.014320611953735352, -0.01352071762084961, -0.012720823287963867, -0.011920928955078125, -0.011121034622192383, -0.01032114028930664, -0.009521245956420898, -0.008721351623535156, -0.007921457290649414, -0.007121562957763672, -0.00632166862487793, -0.0055217742919921875, -0.004721879959106445, -0.003921985626220703, -0.003122091293334961, -0.0023221969604492188, -0.0015223026275634766, -0.0007224082946777344, 7.748603820800781e-05, 0.00087738037109375, 0.0016772747039794922, 0.0024771690368652344, 0.0032770633697509766, 0.004076957702636719, 0.004876852035522461, 0.005676746368408203, 0.006476640701293945, 0.0072765350341796875, 0.00807642936706543, 0.008876323699951172, 0.009676218032836914, 0.010476112365722656, 0.011276006698608398, 0.01207590103149414, 0.012875795364379883, 0.013675689697265625, 0.014475584030151367, 0.01527547836303711, 0.01607537269592285, 0.016875267028808594, 0.017675161361694336, 0.018475055694580078, 0.01927495002746582, 0.020074844360351562, 0.020874738693237305, 0.021674633026123047, 0.02247452735900879, 0.02327442169189453, 0.024074316024780273, 0.024874210357666016, 0.025674104690551758, 0.0264739990234375]}, "gradients/decoder.roberta.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 12.0, 31.0, 62.0, 144.0, 175.0, 208.0, 177.0, 122.0, 62.0, 15.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.652819633483887, -13.37062931060791, -13.088438987731934, -12.80624771118164, -12.524057388305664, -12.241867065429688, -11.959676742553711, -11.677486419677734, -11.395296096801758, -11.113105773925781, -10.830915451049805, -10.548725128173828, -10.266533851623535, -9.984343528747559, -9.702153205871582, -9.419962882995605, -9.137771606445312, -8.855581283569336, -8.57339096069336, -8.291200637817383, -8.00900936126709, -7.726819038391113, -7.444628715515137, -7.16243839263916, -6.880248069763184, -6.598057746887207, -6.315866947174072, -6.033676624298096, -5.751486301422119, -5.469295501708984, -5.187105178833008, -4.904914855957031, -4.622724533081055, -4.340534210205078, -4.058343410491943, -3.776153087615967, -3.4939627647399902, -3.2117722034454346, -2.929581642150879, -2.6473913192749023, -2.3652007579803467, -2.083010196685791, -1.8008198738098145, -1.5186293125152588, -1.2364388704299927, -0.9542484283447266, -0.6720578670501709, -0.3898674249649048, -0.10767698287963867, 0.17451348900794983, 0.45670396089553833, 0.7388944625854492, 1.0210849046707153, 1.3032753467559814, 1.585465908050537, 1.8676563501358032, 2.1498467922210693, 2.432037353515625, 2.7142276763916016, 2.9964182376861572, 3.278608798980713, 3.5607991218566895, 3.842989683151245, 4.125180244445801, 4.407370567321777]}, "gradients/decoder.roberta.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 7.0, 13.0, 13.0, 22.0, 14.0, 21.0, 23.0, 30.0, 32.0, 28.0, 33.0, 31.0, 36.0, 48.0, 34.0, 46.0, 55.0, 45.0, 44.0, 47.0, 37.0, 42.0, 25.0, 32.0, 24.0, 34.0, 26.0, 21.0, 20.0, 20.0, 20.0, 11.0, 9.0, 13.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1478006839752197, -2.067878246307373, -1.9879558086395264, -1.9080333709716797, -1.828110933303833, -1.7481884956359863, -1.6682661771774292, -1.5883437395095825, -1.5084213018417358, -1.4284988641738892, -1.3485764265060425, -1.2686539888381958, -1.1887316703796387, -1.108809232711792, -1.0288867950439453, -0.9489643573760986, -0.869041919708252, -0.7891194820404053, -0.7091970443725586, -0.6292746663093567, -0.54935222864151, -0.46942979097366333, -0.38950738310813904, -0.30958497524261475, -0.22966253757476807, -0.14974011480808258, -0.0698176920413971, 0.010104730725288391, 0.09002715349197388, 0.16994959115982056, 0.24987199902534485, 0.32979440689086914, 0.4097168445587158, 0.4896392822265625, 0.5695617198944092, 0.6494840979576111, 0.7294065356254578, 0.8093289732933044, 0.8892513513565063, 0.969173789024353, 1.0490962266921997, 1.1290186643600464, 1.208941102027893, 1.2888635396957397, 1.3687858581542969, 1.4487082958221436, 1.5286307334899902, 1.608553171157837, 1.6884756088256836, 1.7683980464935303, 1.848320484161377, 1.9282429218292236, 2.0081653594970703, 2.088087797164917, 2.1680102348327637, 2.2479324340820312, 2.327855110168457, 2.4077775478363037, 2.4876999855041504, 2.567622423171997, 2.6475448608398438, 2.7274672985076904, 2.807389736175537, 2.8873119354248047, 2.9672343730926514]}, "gradients/decoder.roberta.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 2.0, 3.0, 10.0, 19.0, 29.0, 42.0, 31.0, 68.0, 107.0, 149.0, 192.0, 382.0, 653.0, 1139.0, 1993.0, 3797.0, 6904.0, 13225.0, 24836.0, 47919.0, 95749.0, 225679.0, 336840.0, 145210.0, 68636.0, 35207.0, 18313.0, 9814.0, 5199.0, 2717.0, 1421.0, 900.0, 516.0, 296.0, 175.0, 122.0, 79.0, 55.0, 34.0, 30.0, 13.0, 9.0, 11.0, 4.0, 7.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0], "bins": [-2.458984375, -2.389251708984375, -2.31951904296875, -2.249786376953125, -2.1800537109375, -2.110321044921875, -2.04058837890625, -1.970855712890625, -1.901123046875, -1.831390380859375, -1.76165771484375, -1.691925048828125, -1.6221923828125, -1.552459716796875, -1.48272705078125, -1.412994384765625, -1.34326171875, -1.273529052734375, -1.20379638671875, -1.134063720703125, -1.0643310546875, -0.994598388671875, -0.92486572265625, -0.855133056640625, -0.785400390625, -0.715667724609375, -0.64593505859375, -0.576202392578125, -0.5064697265625, -0.436737060546875, -0.36700439453125, -0.297271728515625, -0.2275390625, -0.157806396484375, -0.08807373046875, -0.018341064453125, 0.0513916015625, 0.121124267578125, 0.19085693359375, 0.260589599609375, 0.330322265625, 0.400054931640625, 0.46978759765625, 0.539520263671875, 0.6092529296875, 0.678985595703125, 0.74871826171875, 0.818450927734375, 0.88818359375, 0.957916259765625, 1.02764892578125, 1.097381591796875, 1.1671142578125, 1.236846923828125, 1.30657958984375, 1.376312255859375, 1.446044921875, 1.515777587890625, 1.58551025390625, 1.655242919921875, 1.7249755859375, 1.794708251953125, 1.86444091796875, 1.934173583984375, 2.00390625]}, "gradients/decoder.roberta.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 8.0, 11.0, 17.0, 19.0, 17.0, 22.0, 24.0, 27.0, 29.0, 28.0, 32.0, 27.0, 41.0, 48.0, 37.0, 38.0, 56.0, 48.0, 44.0, 53.0, 41.0, 33.0, 33.0, 30.0, 26.0, 29.0, 28.0, 20.0, 23.0, 17.0, 20.0, 13.0, 9.0, 14.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.08203125, -2.001678466796875, -1.92132568359375, -1.840972900390625, -1.7606201171875, -1.680267333984375, -1.59991455078125, -1.519561767578125, -1.439208984375, -1.358856201171875, -1.27850341796875, -1.198150634765625, -1.1177978515625, -1.037445068359375, -0.95709228515625, -0.876739501953125, -0.79638671875, -0.716033935546875, -0.63568115234375, -0.555328369140625, -0.4749755859375, -0.394622802734375, -0.31427001953125, -0.233917236328125, -0.153564453125, -0.073211669921875, 0.00714111328125, 0.087493896484375, 0.1678466796875, 0.248199462890625, 0.32855224609375, 0.408905029296875, 0.4892578125, 0.569610595703125, 0.64996337890625, 0.730316162109375, 0.8106689453125, 0.891021728515625, 0.97137451171875, 1.051727294921875, 1.132080078125, 1.212432861328125, 1.29278564453125, 1.373138427734375, 1.4534912109375, 1.533843994140625, 1.61419677734375, 1.694549560546875, 1.77490234375, 1.855255126953125, 1.93560791015625, 2.015960693359375, 2.0963134765625, 2.176666259765625, 2.25701904296875, 2.337371826171875, 2.417724609375, 2.498077392578125, 2.57843017578125, 2.658782958984375, 2.7391357421875, 2.819488525390625, 2.89984130859375, 2.980194091796875, 3.060546875]}, "gradients/decoder.roberta.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 4.0, 12.0, 15.0, 16.0, 14.0, 26.0, 39.0, 39.0, 41.0, 63.0, 87.0, 131.0, 145.0, 188.0, 264344.0, 782571.0, 226.0, 140.0, 105.0, 82.0, 68.0, 39.0, 37.0, 26.0, 22.0, 10.0, 18.0, 10.0, 14.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-101.875, -99.123046875, -96.37109375, -93.619140625, -90.8671875, -88.115234375, -85.36328125, -82.611328125, -79.859375, -77.107421875, -74.35546875, -71.603515625, -68.8515625, -66.099609375, -63.34765625, -60.595703125, -57.84375, -55.091796875, -52.33984375, -49.587890625, -46.8359375, -44.083984375, -41.33203125, -38.580078125, -35.828125, -33.076171875, -30.32421875, -27.572265625, -24.8203125, -22.068359375, -19.31640625, -16.564453125, -13.8125, -11.060546875, -8.30859375, -5.556640625, -2.8046875, -0.052734375, 2.69921875, 5.451171875, 8.203125, 10.955078125, 13.70703125, 16.458984375, 19.2109375, 21.962890625, 24.71484375, 27.466796875, 30.21875, 32.970703125, 35.72265625, 38.474609375, 41.2265625, 43.978515625, 46.73046875, 49.482421875, 52.234375, 54.986328125, 57.73828125, 60.490234375, 63.2421875, 65.994140625, 68.74609375, 71.498046875, 74.25]}, "gradients/decoder.roberta.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 14.0, 12.0, 13.0, 25.0, 21.0, 33.0, 33.0, 37.0, 53.0, 53.0, 57.0, 61.0, 46.0, 69.0, 65.0, 59.0, 44.0, 46.0, 38.0, 29.0, 45.0, 31.0, 24.0, 16.0, 16.0, 9.0, 13.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.666015625, -2.5628662109375, -2.459716796875, -2.3565673828125, -2.25341796875, -2.1502685546875, -2.047119140625, -1.9439697265625, -1.8408203125, -1.7376708984375, -1.634521484375, -1.5313720703125, -1.42822265625, -1.3250732421875, -1.221923828125, -1.1187744140625, -1.015625, -0.9124755859375, -0.809326171875, -0.7061767578125, -0.60302734375, -0.4998779296875, -0.396728515625, -0.2935791015625, -0.1904296875, -0.0872802734375, 0.015869140625, 0.1190185546875, 0.22216796875, 0.3253173828125, 0.428466796875, 0.5316162109375, 0.634765625, 0.7379150390625, 0.841064453125, 0.9442138671875, 1.04736328125, 1.1505126953125, 1.253662109375, 1.3568115234375, 1.4599609375, 1.5631103515625, 1.666259765625, 1.7694091796875, 1.87255859375, 1.9757080078125, 2.078857421875, 2.1820068359375, 2.28515625, 2.3883056640625, 2.491455078125, 2.5946044921875, 2.69775390625, 2.8009033203125, 2.904052734375, 3.0072021484375, 3.1103515625, 3.2135009765625, 3.316650390625, 3.4197998046875, 3.52294921875, 3.6260986328125, 3.729248046875, 3.8323974609375, 3.935546875]}, "gradients/decoder.roberta.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 17.0, 9.0, 7.0, 9.0, 21.0, 23.0, 25.0, 36.0, 82.0, 119.0, 218.0, 326.0, 666.0, 1624.0, 6305.0, 39548.0, 451973.0, 495777.0, 42072.0, 6425.0, 1715.0, 644.0, 336.0, 214.0, 116.0, 73.0, 44.0, 40.0, 26.0, 15.0, 10.0, 10.0, 10.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.15234375, -3.03564453125, -2.9189453125, -2.80224609375, -2.685546875, -2.56884765625, -2.4521484375, -2.33544921875, -2.21875, -2.10205078125, -1.9853515625, -1.86865234375, -1.751953125, -1.63525390625, -1.5185546875, -1.40185546875, -1.28515625, -1.16845703125, -1.0517578125, -0.93505859375, -0.818359375, -0.70166015625, -0.5849609375, -0.46826171875, -0.3515625, -0.23486328125, -0.1181640625, -0.00146484375, 0.115234375, 0.23193359375, 0.3486328125, 0.46533203125, 0.58203125, 0.69873046875, 0.8154296875, 0.93212890625, 1.048828125, 1.16552734375, 1.2822265625, 1.39892578125, 1.515625, 1.63232421875, 1.7490234375, 1.86572265625, 1.982421875, 2.09912109375, 2.2158203125, 2.33251953125, 2.44921875, 2.56591796875, 2.6826171875, 2.79931640625, 2.916015625, 3.03271484375, 3.1494140625, 3.26611328125, 3.3828125, 3.49951171875, 3.6162109375, 3.73291015625, 3.849609375, 3.96630859375, 4.0830078125, 4.19970703125, 4.31640625]}, "gradients/decoder.roberta.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 29.0, 28.0, 23.0, 37.0, 44.0, 71.0, 87.0, 137.0, 156.0, 111.0, 70.0, 34.0, 34.0, 24.0, 23.0, 21.0, 13.0, 7.0, 10.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018143653869628906, -0.00017393752932548523, -0.0001664385199546814, -0.00015893951058387756, -0.00015144050121307373, -0.0001439414918422699, -0.00013644248247146606, -0.00012894347310066223, -0.0001214444637298584, -0.00011394545435905457, -0.00010644644498825073, -9.89474356174469e-05, -9.144842624664307e-05, -8.394941687583923e-05, -7.64504075050354e-05, -6.895139813423157e-05, -6.145238876342773e-05, -5.39533793926239e-05, -4.645437002182007e-05, -3.8955360651016235e-05, -3.14563512802124e-05, -2.395734190940857e-05, -1.6458332538604736e-05, -8.959323167800903e-06, -1.4603137969970703e-06, 6.038695573806763e-06, 1.3537704944610596e-05, 2.103671431541443e-05, 2.8535723686218262e-05, 3.6034733057022095e-05, 4.353374242782593e-05, 5.103275179862976e-05, 5.8531761169433594e-05, 6.603077054023743e-05, 7.352977991104126e-05, 8.102878928184509e-05, 8.852779865264893e-05, 9.602680802345276e-05, 0.00010352581739425659, 0.00011102482676506042, 0.00011852383613586426, 0.0001260228455066681, 0.00013352185487747192, 0.00014102086424827576, 0.0001485198736190796, 0.00015601888298988342, 0.00016351789236068726, 0.0001710169017314911, 0.00017851591110229492, 0.00018601492047309875, 0.0001935139298439026, 0.00020101293921470642, 0.00020851194858551025, 0.0002160109579563141, 0.00022350996732711792, 0.00023100897669792175, 0.00023850798606872559, 0.0002460069954395294, 0.00025350600481033325, 0.0002610050141811371, 0.0002685040235519409, 0.00027600303292274475, 0.0002835020422935486, 0.0002910010516643524, 0.00029850006103515625]}, "gradients/decoder.roberta.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 8.0, 4.0, 9.0, 17.0, 23.0, 21.0, 34.0, 78.0, 433.0, 4222.0, 999068.0, 43063.0, 1247.0, 166.0, 64.0, 25.0, 16.0, 17.0, 13.0, 8.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8984375, -14.4136962890625, -13.928955078125, -13.4442138671875, -12.95947265625, -12.4747314453125, -11.989990234375, -11.5052490234375, -11.0205078125, -10.5357666015625, -10.051025390625, -9.5662841796875, -9.08154296875, -8.5968017578125, -8.112060546875, -7.6273193359375, -7.142578125, -6.6578369140625, -6.173095703125, -5.6883544921875, -5.20361328125, -4.7188720703125, -4.234130859375, -3.7493896484375, -3.2646484375, -2.7799072265625, -2.295166015625, -1.8104248046875, -1.32568359375, -0.8409423828125, -0.356201171875, 0.1285400390625, 0.61328125, 1.0980224609375, 1.582763671875, 2.0675048828125, 2.55224609375, 3.0369873046875, 3.521728515625, 4.0064697265625, 4.4912109375, 4.9759521484375, 5.460693359375, 5.9454345703125, 6.43017578125, 6.9149169921875, 7.399658203125, 7.8843994140625, 8.369140625, 8.8538818359375, 9.338623046875, 9.8233642578125, 10.30810546875, 10.7928466796875, 11.277587890625, 11.7623291015625, 12.2470703125, 12.7318115234375, 13.216552734375, 13.7012939453125, 14.18603515625, 14.6707763671875, 15.155517578125, 15.6402587890625, 16.125]}, "gradients/decoder.roberta.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 10.0, 10.0, 17.0, 16.0, 31.0, 42.0, 62.0, 98.0, 185.0, 213.0, 99.0, 71.0, 42.0, 19.0, 24.0, 26.0, 13.0, 5.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8740234375, -0.8475875854492188, -0.8211517333984375, -0.7947158813476562, -0.768280029296875, -0.7418441772460938, -0.7154083251953125, -0.6889724731445312, -0.66253662109375, -0.6361007690429688, -0.6096649169921875, -0.5832290649414062, -0.556793212890625, -0.5303573608398438, -0.5039215087890625, -0.47748565673828125, -0.4510498046875, -0.42461395263671875, -0.3981781005859375, -0.37174224853515625, -0.345306396484375, -0.31887054443359375, -0.2924346923828125, -0.26599884033203125, -0.23956298828125, -0.21312713623046875, -0.1866912841796875, -0.16025543212890625, -0.133819580078125, -0.10738372802734375, -0.0809478759765625, -0.05451202392578125, -0.028076171875, -0.00164031982421875, 0.0247955322265625, 0.05123138427734375, 0.077667236328125, 0.10410308837890625, 0.1305389404296875, 0.15697479248046875, 0.18341064453125, 0.20984649658203125, 0.2362823486328125, 0.26271820068359375, 0.289154052734375, 0.31558990478515625, 0.3420257568359375, 0.36846160888671875, 0.3948974609375, 0.42133331298828125, 0.4477691650390625, 0.47420501708984375, 0.500640869140625, 0.5270767211914062, 0.5535125732421875, 0.5799484252929688, 0.60638427734375, 0.6328201293945312, 0.6592559814453125, 0.6856918334960938, 0.712127685546875, 0.7385635375976562, 0.7649993896484375, 0.7914352416992188, 0.81787109375]}, "gradients/decoder.roberta.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 4.0, 13.0, 21.0, 28.0, 44.0, 76.0, 85.0, 109.0, 113.0, 102.0, 113.0, 86.0, 71.0, 48.0, 38.0, 26.0, 12.0, 13.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4576282501220703, -3.2864747047424316, -3.115321159362793, -2.944167375564575, -2.7730138301849365, -2.601860284805298, -2.43070650100708, -2.2595529556274414, -2.0883994102478027, -1.917245864868164, -1.7460922002792358, -1.5749385356903076, -1.403784990310669, -1.2326314449310303, -1.061477780342102, -0.8903241157531738, -0.7191705703735352, -0.5480169653892517, -0.37686336040496826, -0.20570975542068481, -0.03455615043640137, 0.13659745454788208, 0.3077510595321655, 0.47890472412109375, 0.6500582695007324, 0.8212118744850159, 0.9923654794692993, 1.1635191440582275, 1.3346726894378662, 1.5058262348175049, 1.676979899406433, 1.8481335639953613, 2.019286632537842, 2.1904401779174805, 2.361593723297119, 2.532747507095337, 2.7039010524749756, 2.8750545978546143, 3.046208381652832, 3.2173619270324707, 3.3885154724121094, 3.559669017791748, 3.7308225631713867, 3.9019763469696045, 4.073129653930664, 4.244283676147461, 4.4154372215271, 4.586590766906738, 4.757744312286377, 4.928897857666016, 5.100051403045654, 5.271204948425293, 5.44235897064209, 5.6135125160217285, 5.784666061401367, 5.955819606781006, 6.1269731521606445, 6.298126697540283, 6.469280242919922, 6.6404337882995605, 6.811587333679199, 6.982741355895996, 7.153894901275635, 7.325048446655273, 7.496201992034912]}, "gradients/decoder.roberta.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 9.0, 14.0, 8.0, 15.0, 12.0, 9.0, 28.0, 21.0, 24.0, 19.0, 18.0, 23.0, 33.0, 35.0, 31.0, 37.0, 40.0, 36.0, 34.0, 39.0, 34.0, 46.0, 40.0, 41.0, 44.0, 34.0, 28.0, 33.0, 25.0, 20.0, 17.0, 25.0, 17.0, 19.0, 11.0, 18.0, 14.0, 11.0, 9.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.5067646503448486, -3.4046120643615723, -3.302459239959717, -3.2003066539764404, -3.098154067993164, -2.9960012435913086, -2.8938486576080322, -2.791696071624756, -2.6895434856414795, -2.587390899658203, -2.4852380752563477, -2.3830854892730713, -2.280932903289795, -2.1787800788879395, -2.076627492904663, -1.9744749069213867, -1.8723222017288208, -1.7701694965362549, -1.6680169105529785, -1.5658642053604126, -1.4637116193771362, -1.3615589141845703, -1.259406328201294, -1.157253623008728, -1.055100917816162, -0.952948272228241, -0.8507956266403198, -0.7486429214477539, -0.6464903354644775, -0.5443376302719116, -0.4421849846839905, -0.34003233909606934, -0.23787975311279297, -0.13572710752487183, -0.03357444703578949, 0.06857821345329285, 0.170730859041214, 0.2728835344314575, 0.37503618001937866, 0.4771888256072998, 0.579341471195221, 0.6814941167831421, 0.7836467623710632, 0.8857994079589844, 0.9879521131515503, 1.0901048183441162, 1.1922574043273926, 1.294409990310669, 1.3965626955032349, 1.4987154006958008, 1.6008679866790771, 1.703020691871643, 1.8051732778549194, 1.9073259830474854, 2.0094785690307617, 2.111631393432617, 2.2137839794158936, 2.31593656539917, 2.4180893898010254, 2.5202419757843018, 2.622394561767578, 2.7245473861694336, 2.82669997215271, 2.9288525581359863, 3.0310051441192627]}, "gradients/decoder.roberta.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 11.0, 6.0, 5.0, 11.0, 17.0, 11.0, 32.0, 41.0, 35.0, 61.0, 92.0, 94.0, 120.0, 126.0, 147.0, 215.0, 282.0, 397.0, 594.0, 931.0, 1808.0, 3710.0, 9463.0, 32237.0, 164817.0, 2127888.0, 1660458.0, 144218.0, 29293.0, 8907.0, 3330.0, 1683.0, 945.0, 629.0, 370.0, 300.0, 232.0, 170.0, 132.0, 104.0, 84.0, 72.0, 58.0, 30.0, 33.0, 24.0, 20.0, 13.0, 9.0, 7.0, 5.0, 6.0, 6.0, 3.0, 0.0, 2.0, 3.0], "bins": [-5.00390625, -4.85211181640625, -4.7003173828125, -4.54852294921875, -4.396728515625, -4.24493408203125, -4.0931396484375, -3.94134521484375, -3.78955078125, -3.63775634765625, -3.4859619140625, -3.33416748046875, -3.182373046875, -3.03057861328125, -2.8787841796875, -2.72698974609375, -2.5751953125, -2.42340087890625, -2.2716064453125, -2.11981201171875, -1.968017578125, -1.81622314453125, -1.6644287109375, -1.51263427734375, -1.36083984375, -1.20904541015625, -1.0572509765625, -0.90545654296875, -0.753662109375, -0.60186767578125, -0.4500732421875, -0.29827880859375, -0.146484375, 0.00531005859375, 0.1571044921875, 0.30889892578125, 0.460693359375, 0.61248779296875, 0.7642822265625, 0.91607666015625, 1.06787109375, 1.21966552734375, 1.3714599609375, 1.52325439453125, 1.675048828125, 1.82684326171875, 1.9786376953125, 2.13043212890625, 2.2822265625, 2.43402099609375, 2.5858154296875, 2.73760986328125, 2.889404296875, 3.04119873046875, 3.1929931640625, 3.34478759765625, 3.49658203125, 3.64837646484375, 3.8001708984375, 3.95196533203125, 4.103759765625, 4.25555419921875, 4.4073486328125, 4.55914306640625, 4.7109375]}, "gradients/decoder.roberta.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 8.0, 13.0, 13.0, 15.0, 15.0, 12.0, 13.0, 21.0, 25.0, 23.0, 28.0, 31.0, 31.0, 39.0, 51.0, 30.0, 45.0, 35.0, 33.0, 41.0, 41.0, 39.0, 29.0, 33.0, 35.0, 34.0, 30.0, 25.0, 25.0, 21.0, 20.0, 23.0, 21.0, 17.0, 14.0, 13.0, 6.0, 5.0, 8.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.099609375, -2.03582763671875, -1.9720458984375, -1.90826416015625, -1.844482421875, -1.78070068359375, -1.7169189453125, -1.65313720703125, -1.58935546875, -1.52557373046875, -1.4617919921875, -1.39801025390625, -1.334228515625, -1.27044677734375, -1.2066650390625, -1.14288330078125, -1.0791015625, -1.01531982421875, -0.9515380859375, -0.88775634765625, -0.823974609375, -0.76019287109375, -0.6964111328125, -0.63262939453125, -0.56884765625, -0.50506591796875, -0.4412841796875, -0.37750244140625, -0.313720703125, -0.24993896484375, -0.1861572265625, -0.12237548828125, -0.05859375, 0.00518798828125, 0.0689697265625, 0.13275146484375, 0.196533203125, 0.26031494140625, 0.3240966796875, 0.38787841796875, 0.45166015625, 0.51544189453125, 0.5792236328125, 0.64300537109375, 0.706787109375, 0.77056884765625, 0.8343505859375, 0.89813232421875, 0.9619140625, 1.02569580078125, 1.0894775390625, 1.15325927734375, 1.217041015625, 1.28082275390625, 1.3446044921875, 1.40838623046875, 1.47216796875, 1.53594970703125, 1.5997314453125, 1.66351318359375, 1.727294921875, 1.79107666015625, 1.8548583984375, 1.91864013671875, 1.982421875]}, "gradients/decoder.roberta.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 8.0, 3.0, 6.0, 9.0, 12.0, 17.0, 15.0, 41.0, 53.0, 85.0, 150.0, 360.0, 1356.0, 89278.0, 4093682.0, 7919.0, 664.0, 266.0, 138.0, 70.0, 56.0, 29.0, 25.0, 12.0, 13.0, 4.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.0, -36.05810546875, -35.1162109375, -34.17431640625, -33.232421875, -32.29052734375, -31.3486328125, -30.40673828125, -29.46484375, -28.52294921875, -27.5810546875, -26.63916015625, -25.697265625, -24.75537109375, -23.8134765625, -22.87158203125, -21.9296875, -20.98779296875, -20.0458984375, -19.10400390625, -18.162109375, -17.22021484375, -16.2783203125, -15.33642578125, -14.39453125, -13.45263671875, -12.5107421875, -11.56884765625, -10.626953125, -9.68505859375, -8.7431640625, -7.80126953125, -6.859375, -5.91748046875, -4.9755859375, -4.03369140625, -3.091796875, -2.14990234375, -1.2080078125, -0.26611328125, 0.67578125, 1.61767578125, 2.5595703125, 3.50146484375, 4.443359375, 5.38525390625, 6.3271484375, 7.26904296875, 8.2109375, 9.15283203125, 10.0947265625, 11.03662109375, 11.978515625, 12.92041015625, 13.8623046875, 14.80419921875, 15.74609375, 16.68798828125, 17.6298828125, 18.57177734375, 19.513671875, 20.45556640625, 21.3974609375, 22.33935546875, 23.28125]}, "gradients/decoder.roberta.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 8.0, 4.0, 14.0, 21.0, 31.0, 40.0, 55.0, 94.0, 174.0, 271.0, 552.0, 1017.0, 769.0, 443.0, 215.0, 131.0, 66.0, 47.0, 28.0, 27.0, 17.0, 7.0, 11.0, 8.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.267578125, -1.216461181640625, -1.16534423828125, -1.114227294921875, -1.0631103515625, -1.011993408203125, -0.96087646484375, -0.909759521484375, -0.858642578125, -0.807525634765625, -0.75640869140625, -0.705291748046875, -0.6541748046875, -0.603057861328125, -0.55194091796875, -0.500823974609375, -0.44970703125, -0.398590087890625, -0.34747314453125, -0.296356201171875, -0.2452392578125, -0.194122314453125, -0.14300537109375, -0.091888427734375, -0.040771484375, 0.010345458984375, 0.06146240234375, 0.112579345703125, 0.1636962890625, 0.214813232421875, 0.26593017578125, 0.317047119140625, 0.3681640625, 0.419281005859375, 0.47039794921875, 0.521514892578125, 0.5726318359375, 0.623748779296875, 0.67486572265625, 0.725982666015625, 0.777099609375, 0.828216552734375, 0.87933349609375, 0.930450439453125, 0.9815673828125, 1.032684326171875, 1.08380126953125, 1.134918212890625, 1.18603515625, 1.237152099609375, 1.28826904296875, 1.339385986328125, 1.3905029296875, 1.441619873046875, 1.49273681640625, 1.543853759765625, 1.594970703125, 1.646087646484375, 1.69720458984375, 1.748321533203125, 1.7994384765625, 1.850555419921875, 1.90167236328125, 1.952789306640625, 2.00390625]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 10.0, 9.0, 10.0, 13.0, 20.0, 20.0, 25.0, 38.0, 39.0, 58.0, 68.0, 67.0, 50.0, 59.0, 63.0, 79.0, 55.0, 70.0, 40.0, 44.0, 37.0, 38.0, 28.0, 16.0, 10.0, 16.0, 6.0, 5.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.222228527069092, -3.1351068019866943, -3.0479848384857178, -2.9608631134033203, -2.8737411499023438, -2.7866194248199463, -2.699497699737549, -2.6123757362365723, -2.525254011154175, -2.4381322860717773, -2.351010322570801, -2.2638885974884033, -2.176766872406006, -2.0896449089050293, -2.002523183822632, -1.9154013395309448, -1.8282794952392578, -1.7411576509475708, -1.6540358066558838, -1.5669140815734863, -1.4797922372817993, -1.3926703929901123, -1.3055486679077148, -1.2184268236160278, -1.1313049793243408, -1.0441831350326538, -0.9570613503456116, -0.8699395656585693, -0.7828177213668823, -0.6956958770751953, -0.6085740923881531, -0.5214523077011108, -0.43433046340942383, -0.3472086489200592, -0.2600868344306946, -0.17296501994132996, -0.08584320545196533, 0.001278609037399292, 0.08840042352676392, 0.17552220821380615, 0.26264405250549316, 0.3497658669948578, 0.4368876814842224, 0.5240094661712646, 0.6111313104629517, 0.6982531547546387, 0.7853749394416809, 0.8724967241287231, 0.9596185684204102, 1.0467404127120972, 1.1338622570037842, 1.2209839820861816, 1.3081058263778687, 1.3952276706695557, 1.4823493957519531, 1.5694712400436401, 1.6565930843353271, 1.7437149286270142, 1.8308367729187012, 1.9179584980010986, 2.005080223083496, 2.0922021865844727, 2.17932391166687, 2.2664456367492676, 2.353567600250244]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 8.0, 10.0, 12.0, 8.0, 15.0, 13.0, 15.0, 13.0, 22.0, 15.0, 29.0, 27.0, 29.0, 36.0, 35.0, 30.0, 28.0, 27.0, 46.0, 45.0, 41.0, 34.0, 24.0, 43.0, 35.0, 33.0, 35.0, 33.0, 24.0, 34.0, 30.0, 25.0, 18.0, 18.0, 11.0, 15.0, 16.0, 13.0, 14.0, 15.0, 7.0, 4.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0691208839416504, -1.997783899307251, -1.9264469146728516, -1.8551099300384521, -1.7837729454040527, -1.7124359607696533, -1.641098976135254, -1.5697619915008545, -1.498425006866455, -1.4270880222320557, -1.3557510375976562, -1.2844140529632568, -1.2130770683288574, -1.141740083694458, -1.0704030990600586, -0.9990661144256592, -0.9277291297912598, -0.8563921451568604, -0.7850551605224609, -0.7137181758880615, -0.6423811912536621, -0.5710442066192627, -0.4997072219848633, -0.42837023735046387, -0.35703325271606445, -0.28569626808166504, -0.21435928344726562, -0.1430222988128662, -0.0716853141784668, -0.0003483295440673828, 0.07098865509033203, 0.14232563972473145, 0.21366238594055176, 0.28499937057495117, 0.3563363552093506, 0.42767333984375, 0.4990103244781494, 0.5703473091125488, 0.6416842937469482, 0.7130212783813477, 0.7843582630157471, 0.8556952476501465, 0.9270322322845459, 0.9983692169189453, 1.0697062015533447, 1.1410431861877441, 1.2123801708221436, 1.283717155456543, 1.3550541400909424, 1.4263911247253418, 1.4977281093597412, 1.5690650939941406, 1.64040207862854, 1.7117390632629395, 1.7830760478973389, 1.8544130325317383, 1.9257500171661377, 1.997087001800537, 2.0684239864349365, 2.139760971069336, 2.2110979557037354, 2.2824349403381348, 2.353771924972534, 2.4251089096069336, 2.496445894241333]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 6.0, 7.0, 11.0, 17.0, 22.0, 32.0, 48.0, 74.0, 112.0, 184.0, 246.0, 368.0, 567.0, 812.0, 1319.0, 1989.0, 3049.0, 4787.0, 7439.0, 12139.0, 19976.0, 34051.0, 59497.0, 106612.0, 185326.0, 230480.0, 161722.0, 91362.0, 51036.0, 29242.0, 17096.0, 10396.0, 6457.0, 4084.0, 2692.0, 1739.0, 1197.0, 804.0, 511.0, 316.0, 244.0, 170.0, 108.0, 85.0, 29.0, 37.0, 21.0, 14.0, 11.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.448486328125, -0.4346275329589844, -0.42076873779296875, -0.4069099426269531, -0.3930511474609375, -0.3791923522949219, -0.36533355712890625, -0.3514747619628906, -0.337615966796875, -0.3237571716308594, -0.30989837646484375, -0.2960395812988281, -0.2821807861328125, -0.2683219909667969, -0.25446319580078125, -0.24060440063476562, -0.22674560546875, -0.21288681030273438, -0.19902801513671875, -0.18516921997070312, -0.1713104248046875, -0.15745162963867188, -0.14359283447265625, -0.12973403930664062, -0.115875244140625, -0.10201644897460938, -0.08815765380859375, -0.07429885864257812, -0.0604400634765625, -0.046581268310546875, -0.03272247314453125, -0.018863677978515625, -0.0050048828125, 0.008853912353515625, 0.02271270751953125, 0.036571502685546875, 0.0504302978515625, 0.06428909301757812, 0.07814788818359375, 0.09200668334960938, 0.105865478515625, 0.11972427368164062, 0.13358306884765625, 0.14744186401367188, 0.1613006591796875, 0.17515945434570312, 0.18901824951171875, 0.20287704467773438, 0.21673583984375, 0.23059463500976562, 0.24445343017578125, 0.2583122253417969, 0.2721710205078125, 0.2860298156738281, 0.29988861083984375, 0.3137474060058594, 0.327606201171875, 0.3414649963378906, 0.35532379150390625, 0.3691825866699219, 0.3830413818359375, 0.3969001770019531, 0.41075897216796875, 0.4246177673339844, 0.4384765625]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 6.0, 1.0, 6.0, 13.0, 11.0, 8.0, 15.0, 11.0, 17.0, 13.0, 19.0, 17.0, 24.0, 32.0, 28.0, 34.0, 35.0, 31.0, 29.0, 28.0, 43.0, 46.0, 41.0, 34.0, 25.0, 42.0, 39.0, 32.0, 34.0, 29.0, 24.0, 39.0, 29.0, 24.0, 19.0, 18.0, 10.0, 15.0, 16.0, 14.0, 14.0, 15.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.076171875, -2.00701904296875, -1.9378662109375, -1.86871337890625, -1.799560546875, -1.73040771484375, -1.6612548828125, -1.59210205078125, -1.52294921875, -1.45379638671875, -1.3846435546875, -1.31549072265625, -1.246337890625, -1.17718505859375, -1.1080322265625, -1.03887939453125, -0.9697265625, -0.90057373046875, -0.8314208984375, -0.76226806640625, -0.693115234375, -0.62396240234375, -0.5548095703125, -0.48565673828125, -0.41650390625, -0.34735107421875, -0.2781982421875, -0.20904541015625, -0.139892578125, -0.07073974609375, -0.0015869140625, 0.06756591796875, 0.13671875, 0.20587158203125, 0.2750244140625, 0.34417724609375, 0.413330078125, 0.48248291015625, 0.5516357421875, 0.62078857421875, 0.68994140625, 0.75909423828125, 0.8282470703125, 0.89739990234375, 0.966552734375, 1.03570556640625, 1.1048583984375, 1.17401123046875, 1.2431640625, 1.31231689453125, 1.3814697265625, 1.45062255859375, 1.519775390625, 1.58892822265625, 1.6580810546875, 1.72723388671875, 1.79638671875, 1.86553955078125, 1.9346923828125, 2.00384521484375, 2.072998046875, 2.14215087890625, 2.2113037109375, 2.28045654296875, 2.349609375]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 9.0, 18.0, 19.0, 24.0, 25.0, 33.0, 41.0, 61.0, 72.0, 104.0, 118.0, 176.0, 227.0, 322.0, 437.0, 670.0, 976.0, 1721.0, 3380.0, 7617.0, 19401.0, 69940.0, 891518.0, 30236.0, 10600.0, 4612.0, 2282.0, 1229.0, 789.0, 541.0, 329.0, 227.0, 176.0, 131.0, 117.0, 82.0, 68.0, 50.0, 29.0, 17.0, 27.0, 18.0, 18.0, 12.0, 9.0, 8.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 3.0], "bins": [-1.228515625, -1.1903533935546875, -1.152191162109375, -1.1140289306640625, -1.07586669921875, -1.0377044677734375, -0.999542236328125, -0.9613800048828125, -0.9232177734375, -0.8850555419921875, -0.846893310546875, -0.8087310791015625, -0.77056884765625, -0.7324066162109375, -0.694244384765625, -0.6560821533203125, -0.617919921875, -0.5797576904296875, -0.541595458984375, -0.5034332275390625, -0.46527099609375, -0.4271087646484375, -0.388946533203125, -0.3507843017578125, -0.3126220703125, -0.2744598388671875, -0.236297607421875, -0.1981353759765625, -0.15997314453125, -0.1218109130859375, -0.083648681640625, -0.0454864501953125, -0.00732421875, 0.0308380126953125, 0.069000244140625, 0.1071624755859375, 0.14532470703125, 0.1834869384765625, 0.221649169921875, 0.2598114013671875, 0.2979736328125, 0.3361358642578125, 0.374298095703125, 0.4124603271484375, 0.45062255859375, 0.4887847900390625, 0.526947021484375, 0.5651092529296875, 0.603271484375, 0.6414337158203125, 0.679595947265625, 0.7177581787109375, 0.75592041015625, 0.7940826416015625, 0.832244873046875, 0.8704071044921875, 0.9085693359375, 0.9467315673828125, 0.984893798828125, 1.0230560302734375, 1.06121826171875, 1.0993804931640625, 1.137542724609375, 1.1757049560546875, 1.2138671875]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 12.0, 17.0, 17.0, 15.0, 27.0, 18.0, 24.0, 24.0, 33.0, 34.0, 30.0, 26.0, 32.0, 43.0, 39.0, 41.0, 36.0, 37.0, 42.0, 38.0, 45.0, 33.0, 52.0, 30.0, 36.0, 34.0, 29.0, 24.0, 16.0, 13.0, 14.0, 13.0, 14.0, 9.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.431640625, -1.3860626220703125, -1.340484619140625, -1.2949066162109375, -1.24932861328125, -1.2037506103515625, -1.158172607421875, -1.1125946044921875, -1.0670166015625, -1.0214385986328125, -0.975860595703125, -0.9302825927734375, -0.88470458984375, -0.8391265869140625, -0.793548583984375, -0.7479705810546875, -0.702392578125, -0.6568145751953125, -0.611236572265625, -0.5656585693359375, -0.52008056640625, -0.4745025634765625, -0.428924560546875, -0.3833465576171875, -0.3377685546875, -0.2921905517578125, -0.246612548828125, -0.2010345458984375, -0.15545654296875, -0.1098785400390625, -0.064300537109375, -0.0187225341796875, 0.02685546875, 0.0724334716796875, 0.118011474609375, 0.1635894775390625, 0.20916748046875, 0.2547454833984375, 0.300323486328125, 0.3459014892578125, 0.3914794921875, 0.4370574951171875, 0.482635498046875, 0.5282135009765625, 0.57379150390625, 0.6193695068359375, 0.664947509765625, 0.7105255126953125, 0.756103515625, 0.8016815185546875, 0.847259521484375, 0.8928375244140625, 0.93841552734375, 0.9839935302734375, 1.029571533203125, 1.0751495361328125, 1.1207275390625, 1.1663055419921875, 1.211883544921875, 1.2574615478515625, 1.30303955078125, 1.3486175537109375, 1.394195556640625, 1.4397735595703125, 1.4853515625]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 10.0, 8.0, 17.0, 22.0, 22.0, 48.0, 70.0, 115.0, 177.0, 311.0, 549.0, 1116.0, 2403.0, 7294.0, 38908.0, 965836.0, 22442.0, 5164.0, 1932.0, 911.0, 469.0, 263.0, 174.0, 87.0, 65.0, 40.0, 27.0, 17.0, 13.0, 12.0, 8.0, 3.0, 10.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.229248046875, -0.22169876098632812, -0.21414947509765625, -0.20660018920898438, -0.1990509033203125, -0.19150161743164062, -0.18395233154296875, -0.17640304565429688, -0.168853759765625, -0.16130447387695312, -0.15375518798828125, -0.14620590209960938, -0.1386566162109375, -0.13110733032226562, -0.12355804443359375, -0.11600875854492188, -0.10845947265625, -0.10091018676757812, -0.09336090087890625, -0.08581161499023438, -0.0782623291015625, -0.07071304321289062, -0.06316375732421875, -0.055614471435546875, -0.048065185546875, -0.040515899658203125, -0.03296661376953125, -0.025417327880859375, -0.0178680419921875, -0.010318756103515625, -0.00276947021484375, 0.004779815673828125, 0.0123291015625, 0.019878387451171875, 0.02742767333984375, 0.034976959228515625, 0.0425262451171875, 0.050075531005859375, 0.05762481689453125, 0.06517410278320312, 0.072723388671875, 0.08027267456054688, 0.08782196044921875, 0.09537124633789062, 0.1029205322265625, 0.11046981811523438, 0.11801910400390625, 0.12556838989257812, 0.13311767578125, 0.14066696166992188, 0.14821624755859375, 0.15576553344726562, 0.1633148193359375, 0.17086410522460938, 0.17841339111328125, 0.18596267700195312, 0.193511962890625, 0.20106124877929688, 0.20861053466796875, 0.21615982055664062, 0.2237091064453125, 0.23125839233398438, 0.23880767822265625, 0.24635696411132812, 0.25390625]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 6.0, 6.0, 9.0, 4.0, 17.0, 13.0, 25.0, 24.0, 40.0, 40.0, 54.0, 71.0, 54.0, 92.0, 72.0, 69.0, 60.0, 66.0, 61.0, 47.0, 38.0, 31.0, 23.0, 15.0, 13.0, 13.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.127357482910156e-05, -5.971547216176987e-05, -5.815736949443817e-05, -5.6599266827106476e-05, -5.504116415977478e-05, -5.3483061492443085e-05, -5.192495882511139e-05, -5.0366856157779694e-05, -4.8808753490448e-05, -4.72506508231163e-05, -4.569254815578461e-05, -4.413444548845291e-05, -4.2576342821121216e-05, -4.101824015378952e-05, -3.9460137486457825e-05, -3.790203481912613e-05, -3.6343932151794434e-05, -3.478582948446274e-05, -3.322772681713104e-05, -3.166962414979935e-05, -3.011152148246765e-05, -2.8553418815135956e-05, -2.699531614780426e-05, -2.5437213480472565e-05, -2.387911081314087e-05, -2.2321008145809174e-05, -2.0762905478477478e-05, -1.9204802811145782e-05, -1.7646700143814087e-05, -1.608859747648239e-05, -1.4530494809150696e-05, -1.2972392141819e-05, -1.1414289474487305e-05, -9.856186807155609e-06, -8.298084139823914e-06, -6.739981472492218e-06, -5.1818788051605225e-06, -3.623776137828827e-06, -2.0656734704971313e-06, -5.075708031654358e-07, 1.0505318641662598e-06, 2.6086345314979553e-06, 4.166737198829651e-06, 5.7248398661613464e-06, 7.282942533493042e-06, 8.841045200824738e-06, 1.0399147868156433e-05, 1.1957250535488129e-05, 1.3515353202819824e-05, 1.507345587015152e-05, 1.6631558537483215e-05, 1.818966120481491e-05, 1.9747763872146606e-05, 2.1305866539478302e-05, 2.2863969206809998e-05, 2.4422071874141693e-05, 2.598017454147339e-05, 2.7538277208805084e-05, 2.909637987613678e-05, 3.0654482543468475e-05, 3.221258521080017e-05, 3.3770687878131866e-05, 3.532879054546356e-05, 3.688689321279526e-05, 3.844499588012695e-05]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 6.0, 7.0, 5.0, 14.0, 13.0, 23.0, 16.0, 27.0, 31.0, 57.0, 60.0, 111.0, 265.0, 2327.0, 57357.0, 932226.0, 53121.0, 2212.0, 252.0, 99.0, 81.0, 65.0, 29.0, 24.0, 22.0, 22.0, 18.0, 13.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.388427734375, -0.3780670166015625, -0.367706298828125, -0.3573455810546875, -0.34698486328125, -0.3366241455078125, -0.326263427734375, -0.3159027099609375, -0.3055419921875, -0.2951812744140625, -0.284820556640625, -0.2744598388671875, -0.26409912109375, -0.2537384033203125, -0.243377685546875, -0.2330169677734375, -0.22265625, -0.2122955322265625, -0.201934814453125, -0.1915740966796875, -0.18121337890625, -0.1708526611328125, -0.160491943359375, -0.1501312255859375, -0.1397705078125, -0.1294097900390625, -0.119049072265625, -0.1086883544921875, -0.09832763671875, -0.0879669189453125, -0.077606201171875, -0.0672454833984375, -0.056884765625, -0.0465240478515625, -0.036163330078125, -0.0258026123046875, -0.01544189453125, -0.0050811767578125, 0.005279541015625, 0.0156402587890625, 0.0260009765625, 0.0363616943359375, 0.046722412109375, 0.0570831298828125, 0.06744384765625, 0.0778045654296875, 0.088165283203125, 0.0985260009765625, 0.10888671875, 0.1192474365234375, 0.129608154296875, 0.1399688720703125, 0.15032958984375, 0.1606903076171875, 0.171051025390625, 0.1814117431640625, 0.1917724609375, 0.2021331787109375, 0.212493896484375, 0.2228546142578125, 0.23321533203125, 0.2435760498046875, 0.253936767578125, 0.2642974853515625, 0.274658203125]}, "gradients/decoder.roberta.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 8.0, 3.0, 5.0, 8.0, 8.0, 20.0, 19.0, 16.0, 37.0, 51.0, 73.0, 87.0, 102.0, 120.0, 114.0, 81.0, 52.0, 62.0, 32.0, 13.0, 22.0, 15.0, 12.0, 7.0, 1.0, 3.0, 1.0, 4.0, 7.0, 2.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0173187255859375, -0.016665220260620117, -0.016011714935302734, -0.015358209609985352, -0.014704704284667969, -0.014051198959350586, -0.013397693634033203, -0.01274418830871582, -0.012090682983398438, -0.011437177658081055, -0.010783672332763672, -0.010130167007446289, -0.009476661682128906, -0.008823156356811523, -0.00816965103149414, -0.007516145706176758, -0.006862640380859375, -0.006209135055541992, -0.005555629730224609, -0.0049021244049072266, -0.004248619079589844, -0.003595113754272461, -0.002941608428955078, -0.0022881031036376953, -0.0016345977783203125, -0.0009810924530029297, -0.0003275871276855469, 0.00032591819763183594, 0.0009794235229492188, 0.0016329288482666016, 0.0022864341735839844, 0.002939939498901367, 0.00359344482421875, 0.004246950149536133, 0.004900455474853516, 0.0055539608001708984, 0.006207466125488281, 0.006860971450805664, 0.007514476776123047, 0.00816798210144043, 0.008821487426757812, 0.009474992752075195, 0.010128498077392578, 0.010782003402709961, 0.011435508728027344, 0.012089014053344727, 0.01274251937866211, 0.013396024703979492, 0.014049530029296875, 0.014703035354614258, 0.01535654067993164, 0.016010046005249023, 0.016663551330566406, 0.01731705665588379, 0.017970561981201172, 0.018624067306518555, 0.019277572631835938, 0.01993107795715332, 0.020584583282470703, 0.021238088607788086, 0.02189159393310547, 0.02254509925842285, 0.023198604583740234, 0.023852109909057617, 0.024505615234375]}, "gradients/decoder.roberta.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 11.0, 20.0, 28.0, 32.0, 37.0, 62.0, 76.0, 87.0, 84.0, 88.0, 88.0, 88.0, 73.0, 72.0, 53.0, 34.0, 28.0, 21.0, 9.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.471379280090332, -5.351293087005615, -5.231206893920898, -5.111120700836182, -4.991034507751465, -4.870948314666748, -4.750862121582031, -4.6307759284973145, -4.510689735412598, -4.390603542327881, -4.270517349243164, -4.150431156158447, -4.0303449630737305, -3.9102587699890137, -3.790172576904297, -3.670086622238159, -3.5500006675720215, -3.4299144744873047, -3.309828281402588, -3.189742088317871, -3.0696558952331543, -2.9495697021484375, -2.8294835090637207, -2.709397554397583, -2.589311122894287, -2.4692249298095703, -2.3491387367248535, -2.2290525436401367, -2.10896635055542, -1.9888802766799927, -1.8687940835952759, -1.7487080097198486, -1.6286218166351318, -1.508535623550415, -1.3884494304656982, -1.2683632373809814, -1.1482771635055542, -1.0281909704208374, -0.9081047773361206, -0.7880186438560486, -0.6679324507713318, -0.547846257686615, -0.42776012420654297, -0.30767393112182617, -0.18758776783943176, -0.06750160455703735, 0.05258458852767944, 0.17267072200775146, 0.29275691509246826, 0.41284307837486267, 0.5329292416572571, 0.6530154347419739, 0.7731015682220459, 0.8931877613067627, 1.0132739543914795, 1.1333601474761963, 1.253446340560913, 1.3735325336456299, 1.4936187267303467, 1.6137049198150635, 1.7337909936904907, 1.8538771867752075, 1.9739633798599243, 2.0940494537353516, 2.2141356468200684]}, "gradients/decoder.roberta.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 13.0, 11.0, 8.0, 15.0, 12.0, 16.0, 13.0, 21.0, 15.0, 25.0, 33.0, 27.0, 34.0, 40.0, 26.0, 29.0, 28.0, 45.0, 44.0, 40.0, 34.0, 28.0, 41.0, 37.0, 32.0, 35.0, 28.0, 27.0, 37.0, 28.0, 26.0, 17.0, 18.0, 10.0, 16.0, 17.0, 12.0, 14.0, 16.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.074130058288574, -2.004951238632202, -1.93577241897583, -1.866593599319458, -1.797414779663086, -1.7282359600067139, -1.6590571403503418, -1.5898783206939697, -1.5206995010375977, -1.4515206813812256, -1.3823418617248535, -1.3131630420684814, -1.2439842224121094, -1.1748054027557373, -1.1056265830993652, -1.0364477634429932, -0.9672689437866211, -0.898090124130249, -0.828911304473877, -0.7597324848175049, -0.6905536651611328, -0.6213748455047607, -0.5521960258483887, -0.4830172061920166, -0.41383838653564453, -0.34465956687927246, -0.2754807472229004, -0.20630192756652832, -0.13712310791015625, -0.06794428825378418, 0.0012345314025878906, 0.07041335105895996, 0.13959193229675293, 0.208770751953125, 0.27794957160949707, 0.34712839126586914, 0.4163072109222412, 0.4854860305786133, 0.5546648502349854, 0.6238436698913574, 0.6930224895477295, 0.7622013092041016, 0.8313801288604736, 0.9005589485168457, 0.9697377681732178, 1.0389165878295898, 1.108095407485962, 1.177274227142334, 1.246453046798706, 1.3156318664550781, 1.3848106861114502, 1.4539895057678223, 1.5231683254241943, 1.5923471450805664, 1.6615259647369385, 1.7307047843933105, 1.7998836040496826, 1.8690624237060547, 1.9382412433624268, 2.007420063018799, 2.076598882675171, 2.145777702331543, 2.214956521987915, 2.284135341644287, 2.353314161300659]}, "gradients/decoder.roberta.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 6.0, 7.0, 17.0, 14.0, 27.0, 35.0, 60.0, 104.0, 131.0, 197.0, 304.0, 410.0, 717.0, 1167.0, 1811.0, 2857.0, 4534.0, 7246.0, 11619.0, 18618.0, 31986.0, 53583.0, 93974.0, 160916.0, 216377.0, 179431.0, 108893.0, 61153.0, 35995.0, 21548.0, 12907.0, 8079.0, 5016.0, 3197.0, 2048.0, 1252.0, 816.0, 517.0, 317.0, 239.0, 141.0, 104.0, 54.0, 44.0, 27.0, 27.0, 10.0, 4.0, 7.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0], "bins": [-1.810546875, -1.7566986083984375, -1.702850341796875, -1.6490020751953125, -1.59515380859375, -1.5413055419921875, -1.487457275390625, -1.4336090087890625, -1.3797607421875, -1.3259124755859375, -1.272064208984375, -1.2182159423828125, -1.16436767578125, -1.1105194091796875, -1.056671142578125, -1.0028228759765625, -0.948974609375, -0.8951263427734375, -0.841278076171875, -0.7874298095703125, -0.73358154296875, -0.6797332763671875, -0.625885009765625, -0.5720367431640625, -0.5181884765625, -0.4643402099609375, -0.410491943359375, -0.3566436767578125, -0.30279541015625, -0.2489471435546875, -0.195098876953125, -0.1412506103515625, -0.08740234375, -0.0335540771484375, 0.020294189453125, 0.0741424560546875, 0.12799072265625, 0.1818389892578125, 0.235687255859375, 0.2895355224609375, 0.3433837890625, 0.3972320556640625, 0.451080322265625, 0.5049285888671875, 0.55877685546875, 0.6126251220703125, 0.666473388671875, 0.7203216552734375, 0.774169921875, 0.8280181884765625, 0.881866455078125, 0.9357147216796875, 0.98956298828125, 1.0434112548828125, 1.097259521484375, 1.1511077880859375, 1.2049560546875, 1.2588043212890625, 1.312652587890625, 1.3665008544921875, 1.42034912109375, 1.4741973876953125, 1.528045654296875, 1.5818939208984375, 1.6357421875]}, "gradients/decoder.roberta.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 3.0, 3.0, 6.0, 11.0, 7.0, 13.0, 13.0, 13.0, 16.0, 12.0, 19.0, 17.0, 24.0, 27.0, 38.0, 31.0, 29.0, 29.0, 30.0, 33.0, 35.0, 44.0, 41.0, 35.0, 32.0, 37.0, 39.0, 33.0, 33.0, 32.0, 32.0, 30.0, 25.0, 33.0, 19.0, 14.0, 13.0, 21.0, 10.0, 15.0, 11.0, 15.0, 10.0, 6.0, 7.0, 1.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.01953125, -1.952789306640625, -1.88604736328125, -1.819305419921875, -1.7525634765625, -1.685821533203125, -1.61907958984375, -1.552337646484375, -1.485595703125, -1.418853759765625, -1.35211181640625, -1.285369873046875, -1.2186279296875, -1.151885986328125, -1.08514404296875, -1.018402099609375, -0.95166015625, -0.884918212890625, -0.81817626953125, -0.751434326171875, -0.6846923828125, -0.617950439453125, -0.55120849609375, -0.484466552734375, -0.417724609375, -0.350982666015625, -0.28424072265625, -0.217498779296875, -0.1507568359375, -0.084014892578125, -0.01727294921875, 0.049468994140625, 0.1162109375, 0.182952880859375, 0.24969482421875, 0.316436767578125, 0.3831787109375, 0.449920654296875, 0.51666259765625, 0.583404541015625, 0.650146484375, 0.716888427734375, 0.78363037109375, 0.850372314453125, 0.9171142578125, 0.983856201171875, 1.05059814453125, 1.117340087890625, 1.18408203125, 1.250823974609375, 1.31756591796875, 1.384307861328125, 1.4510498046875, 1.517791748046875, 1.58453369140625, 1.651275634765625, 1.718017578125, 1.784759521484375, 1.85150146484375, 1.918243408203125, 1.9849853515625, 2.051727294921875, 2.11846923828125, 2.185211181640625, 2.251953125]}, "gradients/decoder.roberta.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 12.0, 16.0, 24.0, 18.0, 19.0, 19.0, 29.0, 49.0, 53.0, 60.0, 60.0, 90.0, 103.0, 102.0, 189.0, 26873.0, 1019812.0, 257.0, 142.0, 107.0, 103.0, 83.0, 59.0, 56.0, 51.0, 32.0, 27.0, 16.0, 20.0, 12.0, 15.0, 7.0, 10.0, 4.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-74.625, -72.6689453125, -70.712890625, -68.7568359375, -66.80078125, -64.8447265625, -62.888671875, -60.9326171875, -58.9765625, -57.0205078125, -55.064453125, -53.1083984375, -51.15234375, -49.1962890625, -47.240234375, -45.2841796875, -43.328125, -41.3720703125, -39.416015625, -37.4599609375, -35.50390625, -33.5478515625, -31.591796875, -29.6357421875, -27.6796875, -25.7236328125, -23.767578125, -21.8115234375, -19.85546875, -17.8994140625, -15.943359375, -13.9873046875, -12.03125, -10.0751953125, -8.119140625, -6.1630859375, -4.20703125, -2.2509765625, -0.294921875, 1.6611328125, 3.6171875, 5.5732421875, 7.529296875, 9.4853515625, 11.44140625, 13.3974609375, 15.353515625, 17.3095703125, 19.265625, 21.2216796875, 23.177734375, 25.1337890625, 27.08984375, 29.0458984375, 31.001953125, 32.9580078125, 34.9140625, 36.8701171875, 38.826171875, 40.7822265625, 42.73828125, 44.6943359375, 46.650390625, 48.6064453125, 50.5625]}, "gradients/decoder.roberta.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 12.0, 11.0, 19.0, 18.0, 29.0, 15.0, 40.0, 34.0, 28.0, 39.0, 39.0, 38.0, 49.0, 45.0, 50.0, 56.0, 48.0, 38.0, 40.0, 39.0, 31.0, 30.0, 26.0, 30.0, 20.0, 23.0, 16.0, 19.0, 21.0, 15.0, 13.0, 11.0, 6.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9638671875, -1.8881378173828125, -1.812408447265625, -1.7366790771484375, -1.66094970703125, -1.5852203369140625, -1.509490966796875, -1.4337615966796875, -1.3580322265625, -1.2823028564453125, -1.206573486328125, -1.1308441162109375, -1.05511474609375, -0.9793853759765625, -0.903656005859375, -0.8279266357421875, -0.752197265625, -0.6764678955078125, -0.600738525390625, -0.5250091552734375, -0.44927978515625, -0.3735504150390625, -0.297821044921875, -0.2220916748046875, -0.1463623046875, -0.0706329345703125, 0.005096435546875, 0.0808258056640625, 0.15655517578125, 0.2322845458984375, 0.308013916015625, 0.3837432861328125, 0.45947265625, 0.5352020263671875, 0.610931396484375, 0.6866607666015625, 0.76239013671875, 0.8381195068359375, 0.913848876953125, 0.9895782470703125, 1.0653076171875, 1.1410369873046875, 1.216766357421875, 1.2924957275390625, 1.36822509765625, 1.4439544677734375, 1.519683837890625, 1.5954132080078125, 1.671142578125, 1.7468719482421875, 1.822601318359375, 1.8983306884765625, 1.97406005859375, 2.0497894287109375, 2.125518798828125, 2.2012481689453125, 2.2769775390625, 2.3527069091796875, 2.428436279296875, 2.5041656494140625, 2.57989501953125, 2.6556243896484375, 2.731353759765625, 2.8070831298828125, 2.8828125]}, "gradients/decoder.roberta.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 16.0, 23.0, 47.0, 66.0, 96.0, 172.0, 316.0, 734.0, 2312.0, 22060.0, 620940.0, 383774.0, 14850.0, 1946.0, 577.0, 263.0, 176.0, 79.0, 40.0, 18.0, 13.0, 7.0, 3.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.8026123046875, -5.620849609375, -5.4390869140625, -5.25732421875, -5.0755615234375, -4.893798828125, -4.7120361328125, -4.5302734375, -4.3485107421875, -4.166748046875, -3.9849853515625, -3.80322265625, -3.6214599609375, -3.439697265625, -3.2579345703125, -3.076171875, -2.8944091796875, -2.712646484375, -2.5308837890625, -2.34912109375, -2.1673583984375, -1.985595703125, -1.8038330078125, -1.6220703125, -1.4403076171875, -1.258544921875, -1.0767822265625, -0.89501953125, -0.7132568359375, -0.531494140625, -0.3497314453125, -0.16796875, 0.0137939453125, 0.195556640625, 0.3773193359375, 0.55908203125, 0.7408447265625, 0.922607421875, 1.1043701171875, 1.2861328125, 1.4678955078125, 1.649658203125, 1.8314208984375, 2.01318359375, 2.1949462890625, 2.376708984375, 2.5584716796875, 2.740234375, 2.9219970703125, 3.103759765625, 3.2855224609375, 3.46728515625, 3.6490478515625, 3.830810546875, 4.0125732421875, 4.1943359375, 4.3760986328125, 4.557861328125, 4.7396240234375, 4.92138671875, 5.1031494140625, 5.284912109375, 5.4666748046875, 5.6484375]}, "gradients/decoder.roberta.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 1.0, 0.0, 4.0, 4.0, 12.0, 16.0, 24.0, 32.0, 70.0, 128.0, 190.0, 176.0, 136.0, 90.0, 51.0, 28.0, 17.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000240325927734375, -0.00022709369659423828, -0.00021386146545410156, -0.00020062923431396484, -0.00018739700317382812, -0.0001741647720336914, -0.0001609325408935547, -0.00014770030975341797, -0.00013446807861328125, -0.00012123584747314453, -0.00010800361633300781, -9.47713851928711e-05, -8.153915405273438e-05, -6.830692291259766e-05, -5.507469177246094e-05, -4.184246063232422e-05, -2.86102294921875e-05, -1.537799835205078e-05, -2.1457672119140625e-06, 1.1086463928222656e-05, 2.4318695068359375e-05, 3.7550926208496094e-05, 5.078315734863281e-05, 6.401538848876953e-05, 7.724761962890625e-05, 9.047985076904297e-05, 0.00010371208190917969, 0.0001169443130493164, 0.00013017654418945312, 0.00014340877532958984, 0.00015664100646972656, 0.00016987323760986328, 0.00018310546875, 0.00019633769989013672, 0.00020956993103027344, 0.00022280216217041016, 0.00023603439331054688, 0.0002492666244506836, 0.0002624988555908203, 0.00027573108673095703, 0.00028896331787109375, 0.00030219554901123047, 0.0003154277801513672, 0.0003286600112915039, 0.0003418922424316406, 0.00035512447357177734, 0.00036835670471191406, 0.0003815889358520508, 0.0003948211669921875, 0.0004080533981323242, 0.00042128562927246094, 0.00043451786041259766, 0.0004477500915527344, 0.0004609823226928711, 0.0004742145538330078, 0.00048744678497314453, 0.0005006790161132812, 0.000513911247253418, 0.0005271434783935547, 0.0005403757095336914, 0.0005536079406738281, 0.0005668401718139648, 0.0005800724029541016, 0.0005933046340942383, 0.000606536865234375]}, "gradients/decoder.roberta.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 13.0, 23.0, 34.0, 37.0, 56.0, 125.0, 636.0, 7481.0, 1023355.0, 15584.0, 849.0, 165.0, 65.0, 31.0, 24.0, 25.0, 9.0, 11.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.25, -20.7508544921875, -20.251708984375, -19.7525634765625, -19.25341796875, -18.7542724609375, -18.255126953125, -17.7559814453125, -17.2568359375, -16.7576904296875, -16.258544921875, -15.7593994140625, -15.26025390625, -14.7611083984375, -14.261962890625, -13.7628173828125, -13.263671875, -12.7645263671875, -12.265380859375, -11.7662353515625, -11.26708984375, -10.7679443359375, -10.268798828125, -9.7696533203125, -9.2705078125, -8.7713623046875, -8.272216796875, -7.7730712890625, -7.27392578125, -6.7747802734375, -6.275634765625, -5.7764892578125, -5.27734375, -4.7781982421875, -4.279052734375, -3.7799072265625, -3.28076171875, -2.7816162109375, -2.282470703125, -1.7833251953125, -1.2841796875, -0.7850341796875, -0.285888671875, 0.2132568359375, 0.71240234375, 1.2115478515625, 1.710693359375, 2.2098388671875, 2.708984375, 3.2081298828125, 3.707275390625, 4.2064208984375, 4.70556640625, 5.2047119140625, 5.703857421875, 6.2030029296875, 6.7021484375, 7.2012939453125, 7.700439453125, 8.1995849609375, 8.69873046875, 9.1978759765625, 9.697021484375, 10.1961669921875, 10.6953125]}, "gradients/decoder.roberta.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 8.0, 7.0, 11.0, 12.0, 29.0, 43.0, 53.0, 91.0, 154.0, 148.0, 157.0, 77.0, 65.0, 50.0, 35.0, 22.0, 12.0, 15.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81396484375, -0.7821426391601562, -0.7503204345703125, -0.7184982299804688, -0.686676025390625, -0.6548538208007812, -0.6230316162109375, -0.5912094116210938, -0.55938720703125, -0.5275650024414062, -0.4957427978515625, -0.46392059326171875, -0.432098388671875, -0.40027618408203125, -0.3684539794921875, -0.33663177490234375, -0.3048095703125, -0.27298736572265625, -0.2411651611328125, -0.20934295654296875, -0.177520751953125, -0.14569854736328125, -0.1138763427734375, -0.08205413818359375, -0.05023193359375, -0.01840972900390625, 0.0134124755859375, 0.04523468017578125, 0.077056884765625, 0.10887908935546875, 0.1407012939453125, 0.17252349853515625, 0.204345703125, 0.23616790771484375, 0.2679901123046875, 0.29981231689453125, 0.331634521484375, 0.36345672607421875, 0.3952789306640625, 0.42710113525390625, 0.45892333984375, 0.49074554443359375, 0.5225677490234375, 0.5543899536132812, 0.586212158203125, 0.6180343627929688, 0.6498565673828125, 0.6816787719726562, 0.7135009765625, 0.7453231811523438, 0.7771453857421875, 0.8089675903320312, 0.840789794921875, 0.8726119995117188, 0.9044342041015625, 0.9362564086914062, 0.96807861328125, 0.9999008178710938, 1.0317230224609375, 1.0635452270507812, 1.095367431640625, 1.1271896362304688, 1.1590118408203125, 1.1908340454101562, 1.22265625]}, "gradients/decoder.roberta.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 13.0, 32.0, 56.0, 97.0, 157.0, 159.0, 147.0, 139.0, 89.0, 58.0, 31.0, 19.0, 4.0, 5.0], "bins": [-13.059794425964355, -12.825870513916016, -12.59194564819336, -12.35802173614502, -12.12409782409668, -11.89017391204834, -11.656249046325684, -11.422325134277344, -11.188401222229004, -10.954477310180664, -10.720552444458008, -10.486628532409668, -10.252704620361328, -10.018780708312988, -9.784855842590332, -9.550931930541992, -9.317007064819336, -9.083083152770996, -8.84915828704834, -8.615234375, -8.38131046295166, -8.14738655090332, -7.913461685180664, -7.679537773132324, -7.445613861083984, -7.211689472198486, -6.9777655601501465, -6.743841171264648, -6.509917259216309, -6.2759928703308105, -6.0420684814453125, -5.808144569396973, -5.574220180511475, -5.340295791625977, -5.106371879577637, -4.872447490692139, -4.638523578643799, -4.404599189758301, -4.170675277709961, -3.936750888824463, -3.702826976776123, -3.468902826309204, -3.234978675842285, -3.001054286956787, -2.7671303749084473, -2.533205986022949, -2.2992818355560303, -2.0653576850891113, -1.8314334154129028, -1.5975092649459839, -1.3635849952697754, -1.1296608448028564, -0.8957366943359375, -0.6618125438690186, -0.42788827419281006, -0.1939641237258911, 0.03996002674102783, 0.27388420701026917, 0.5078083872795105, 0.7417325973510742, 0.9756567478179932, 1.209580898284912, 1.4435051679611206, 1.6774293184280396, 1.9113534688949585]}, "gradients/decoder.roberta.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 9.0, 4.0, 6.0, 8.0, 7.0, 10.0, 13.0, 17.0, 9.0, 10.0, 11.0, 22.0, 22.0, 23.0, 30.0, 43.0, 35.0, 36.0, 35.0, 26.0, 42.0, 37.0, 43.0, 51.0, 41.0, 34.0, 35.0, 39.0, 37.0, 31.0, 27.0, 36.0, 27.0, 29.0, 27.0, 17.0, 30.0, 6.0, 12.0, 4.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.287794589996338, -3.183778762817383, -3.0797626972198486, -2.9757468700408936, -2.8717310428619385, -2.7677149772644043, -2.663699150085449, -2.559683322906494, -2.45566725730896, -2.351651430130005, -2.2476353645324707, -2.1436195373535156, -2.0396037101745605, -1.9355876445770264, -1.8315718173980713, -1.7275558710098267, -1.6235400438308716, -1.519524097442627, -1.4155082702636719, -1.3114923238754272, -1.2074763774871826, -1.1034605503082275, -0.9994446039199829, -0.8954286575317383, -0.7914127707481384, -0.6873968839645386, -0.583380937576294, -0.4793650507926941, -0.37534913420677185, -0.2713332176208496, -0.16731733083724976, -0.06330138444900513, 0.04071450233459473, 0.14473041892051697, 0.24874632060527802, 0.35276222229003906, 0.4567781388759613, 0.5607940554618835, 0.6648099422454834, 0.768825888633728, 0.8728417754173279, 0.9768576622009277, 1.0808736085891724, 1.184889554977417, 1.288905382156372, 1.3929213285446167, 1.4969372749328613, 1.6009531021118164, 1.704969048500061, 1.8089849948883057, 1.9130008220672607, 2.017016887664795, 2.12103271484375, 2.225048542022705, 2.32906436920166, 2.4330804347991943, 2.5370962619781494, 2.6411120891571045, 2.7451281547546387, 2.8491439819335938, 2.953159809112549, 3.057175874710083, 3.161191701889038, 3.2652077674865723, 3.3692235946655273]}, "gradients/decoder.roberta.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 10.0, 8.0, 7.0, 22.0, 19.0, 34.0, 40.0, 27.0, 57.0, 67.0, 119.0, 135.0, 203.0, 265.0, 470.0, 776.0, 1477.0, 3762.0, 14040.0, 90820.0, 2539123.0, 1454764.0, 69574.0, 11739.0, 3259.0, 1315.0, 703.0, 416.0, 270.0, 206.0, 137.0, 89.0, 75.0, 58.0, 29.0, 34.0, 26.0, 21.0, 18.0, 16.0, 5.0, 13.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-7.33984375, -7.11700439453125, -6.8941650390625, -6.67132568359375, -6.448486328125, -6.22564697265625, -6.0028076171875, -5.77996826171875, -5.55712890625, -5.33428955078125, -5.1114501953125, -4.88861083984375, -4.665771484375, -4.44293212890625, -4.2200927734375, -3.99725341796875, -3.7744140625, -3.55157470703125, -3.3287353515625, -3.10589599609375, -2.883056640625, -2.66021728515625, -2.4373779296875, -2.21453857421875, -1.99169921875, -1.76885986328125, -1.5460205078125, -1.32318115234375, -1.100341796875, -0.87750244140625, -0.6546630859375, -0.43182373046875, -0.208984375, 0.01385498046875, 0.2366943359375, 0.45953369140625, 0.682373046875, 0.90521240234375, 1.1280517578125, 1.35089111328125, 1.57373046875, 1.79656982421875, 2.0194091796875, 2.24224853515625, 2.465087890625, 2.68792724609375, 2.9107666015625, 3.13360595703125, 3.3564453125, 3.57928466796875, 3.8021240234375, 4.02496337890625, 4.247802734375, 4.47064208984375, 4.6934814453125, 4.91632080078125, 5.13916015625, 5.36199951171875, 5.5848388671875, 5.80767822265625, 6.030517578125, 6.25335693359375, 6.4761962890625, 6.69903564453125, 6.921875]}, "gradients/decoder.roberta.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 8.0, 10.0, 9.0, 16.0, 7.0, 16.0, 11.0, 14.0, 16.0, 25.0, 23.0, 27.0, 22.0, 25.0, 48.0, 47.0, 36.0, 42.0, 45.0, 43.0, 45.0, 48.0, 34.0, 55.0, 27.0, 28.0, 29.0, 34.0, 32.0, 30.0, 36.0, 22.0, 20.0, 20.0, 14.0, 7.0, 11.0, 9.0, 7.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.051177978515625, -1.98516845703125, -1.919158935546875, -1.8531494140625, -1.787139892578125, -1.72113037109375, -1.655120849609375, -1.589111328125, -1.523101806640625, -1.45709228515625, -1.391082763671875, -1.3250732421875, -1.259063720703125, -1.19305419921875, -1.127044677734375, -1.06103515625, -0.995025634765625, -0.92901611328125, -0.863006591796875, -0.7969970703125, -0.730987548828125, -0.66497802734375, -0.598968505859375, -0.532958984375, -0.466949462890625, -0.40093994140625, -0.334930419921875, -0.2689208984375, -0.202911376953125, -0.13690185546875, -0.070892333984375, -0.0048828125, 0.061126708984375, 0.12713623046875, 0.193145751953125, 0.2591552734375, 0.325164794921875, 0.39117431640625, 0.457183837890625, 0.523193359375, 0.589202880859375, 0.65521240234375, 0.721221923828125, 0.7872314453125, 0.853240966796875, 0.91925048828125, 0.985260009765625, 1.05126953125, 1.117279052734375, 1.18328857421875, 1.249298095703125, 1.3153076171875, 1.381317138671875, 1.44732666015625, 1.513336181640625, 1.579345703125, 1.645355224609375, 1.71136474609375, 1.777374267578125, 1.8433837890625, 1.909393310546875, 1.97540283203125, 2.041412353515625, 2.107421875]}, "gradients/decoder.roberta.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 2.0, 10.0, 11.0, 20.0, 25.0, 28.0, 40.0, 84.0, 120.0, 267.0, 669.0, 4934.0, 2073137.0, 2108653.0, 5032.0, 633.0, 247.0, 148.0, 64.0, 55.0, 23.0, 24.0, 16.0, 10.0, 6.0, 3.0, 4.0, 4.0, 1.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-32.8125, -31.9921875, -31.171875, -30.3515625, -29.53125, -28.7109375, -27.890625, -27.0703125, -26.25, -25.4296875, -24.609375, -23.7890625, -22.96875, -22.1484375, -21.328125, -20.5078125, -19.6875, -18.8671875, -18.046875, -17.2265625, -16.40625, -15.5859375, -14.765625, -13.9453125, -13.125, -12.3046875, -11.484375, -10.6640625, -9.84375, -9.0234375, -8.203125, -7.3828125, -6.5625, -5.7421875, -4.921875, -4.1015625, -3.28125, -2.4609375, -1.640625, -0.8203125, 0.0, 0.8203125, 1.640625, 2.4609375, 3.28125, 4.1015625, 4.921875, 5.7421875, 6.5625, 7.3828125, 8.203125, 9.0234375, 9.84375, 10.6640625, 11.484375, 12.3046875, 13.125, 13.9453125, 14.765625, 15.5859375, 16.40625, 17.2265625, 18.046875, 18.8671875, 19.6875]}, "gradients/decoder.roberta.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 12.0, 10.0, 15.0, 25.0, 24.0, 46.0, 72.0, 111.0, 193.0, 371.0, 717.0, 1061.0, 607.0, 311.0, 193.0, 106.0, 57.0, 45.0, 30.0, 23.0, 9.0, 10.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0576171875, -1.0080718994140625, -0.958526611328125, -0.9089813232421875, -0.85943603515625, -0.8098907470703125, -0.760345458984375, -0.7108001708984375, -0.6612548828125, -0.6117095947265625, -0.562164306640625, -0.5126190185546875, -0.46307373046875, -0.4135284423828125, -0.363983154296875, -0.3144378662109375, -0.264892578125, -0.2153472900390625, -0.165802001953125, -0.1162567138671875, -0.06671142578125, -0.0171661376953125, 0.032379150390625, 0.0819244384765625, 0.1314697265625, 0.1810150146484375, 0.230560302734375, 0.2801055908203125, 0.32965087890625, 0.3791961669921875, 0.428741455078125, 0.4782867431640625, 0.52783203125, 0.5773773193359375, 0.626922607421875, 0.6764678955078125, 0.72601318359375, 0.7755584716796875, 0.825103759765625, 0.8746490478515625, 0.9241943359375, 0.9737396240234375, 1.023284912109375, 1.0728302001953125, 1.12237548828125, 1.1719207763671875, 1.221466064453125, 1.2710113525390625, 1.320556640625, 1.3701019287109375, 1.419647216796875, 1.4691925048828125, 1.51873779296875, 1.5682830810546875, 1.617828369140625, 1.6673736572265625, 1.7169189453125, 1.7664642333984375, 1.816009521484375, 1.8655548095703125, 1.91510009765625, 1.9646453857421875, 2.014190673828125, 2.0637359619140625, 2.11328125]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 13.0, 32.0, 81.0, 151.0, 217.0, 197.0, 162.0, 92.0, 43.0, 16.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.45020866394043, -14.172697067260742, -13.895184516906738, -13.617671966552734, -13.340160369873047, -13.06264877319336, -12.785136222839355, -12.507623672485352, -12.230112075805664, -11.952600479125977, -11.675087928771973, -11.397575378417969, -11.120063781738281, -10.842552185058594, -10.56503963470459, -10.287527084350586, -10.010015487670898, -9.732503890991211, -9.454991340637207, -9.177478790283203, -8.899967193603516, -8.622455596923828, -8.344943046569824, -8.06743049621582, -7.789918899536133, -7.512406826019287, -7.234894752502441, -6.957382678985596, -6.67987060546875, -6.402358531951904, -6.124846458435059, -5.847334384918213, -5.569821834564209, -5.292309761047363, -5.014797687530518, -4.737285614013672, -4.459773540496826, -4.1822614669799805, -3.9047493934631348, -3.627237319946289, -3.3497252464294434, -3.0722131729125977, -2.794701099395752, -2.5171890258789062, -2.2396769523620605, -1.9621648788452148, -1.6846528053283691, -1.4071407318115234, -1.1296286582946777, -0.852116584777832, -0.5746045112609863, -0.2970924377441406, -0.019580364227294922, 0.2579317092895508, 0.5354437828063965, 0.8129558563232422, 1.090467929840088, 1.3679800033569336, 1.6454920768737793, 1.923004150390625, 2.2005162239074707, 2.4780282974243164, 2.755540370941162, 3.033052444458008, 3.3105645179748535]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 5.0, 7.0, 10.0, 15.0, 18.0, 10.0, 31.0, 23.0, 19.0, 29.0, 33.0, 35.0, 35.0, 34.0, 34.0, 41.0, 36.0, 41.0, 41.0, 52.0, 46.0, 43.0, 31.0, 32.0, 38.0, 35.0, 21.0, 24.0, 15.0, 29.0, 21.0, 23.0, 14.0, 13.0, 9.0, 9.0, 9.0, 2.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.4094197750091553, -2.331782579421997, -2.254145622253418, -2.1765084266662598, -2.0988712310791016, -2.0212340354919434, -1.9435969591140747, -1.865959882736206, -1.7883226871490479, -1.7106854915618896, -1.633048415184021, -1.5554113388061523, -1.4777741432189941, -1.400136947631836, -1.3224998712539673, -1.2448627948760986, -1.1672255992889404, -1.0895884037017822, -1.0119513273239136, -0.9343141913414001, -0.8566770553588867, -0.7790399193763733, -0.7014027833938599, -0.6237656474113464, -0.546128511428833, -0.4684913754463196, -0.39085423946380615, -0.3132171034812927, -0.2355799674987793, -0.15794283151626587, -0.08030569553375244, -0.0026685595512390137, 0.07496857643127441, 0.15260571241378784, 0.23024284839630127, 0.3078799843788147, 0.3855171203613281, 0.46315425634384155, 0.540791392326355, 0.6184285283088684, 0.6960656642913818, 0.7737028002738953, 0.8513399362564087, 0.9289770722389221, 1.0066142082214355, 1.0842514038085938, 1.1618884801864624, 1.239525556564331, 1.3171627521514893, 1.3947999477386475, 1.4724370241165161, 1.5500741004943848, 1.627711296081543, 1.7053484916687012, 1.7829855680465698, 1.8606226444244385, 1.9382598400115967, 2.015897035598755, 2.093533992767334, 2.171171188354492, 2.2488083839416504, 2.3264455795288086, 2.404082775115967, 2.481719732284546, 2.559356927871704]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 16.0, 11.0, 27.0, 43.0, 63.0, 78.0, 114.0, 188.0, 261.0, 349.0, 507.0, 785.0, 1106.0, 1633.0, 2369.0, 3776.0, 5817.0, 8863.0, 14349.0, 23858.0, 40954.0, 75457.0, 140172.0, 225170.0, 211808.0, 126260.0, 67895.0, 37474.0, 21572.0, 13279.0, 8311.0, 5297.0, 3411.0, 2305.0, 1585.0, 1070.0, 707.0, 522.0, 306.0, 248.0, 184.0, 103.0, 73.0, 63.0, 33.0, 21.0, 26.0, 10.0, 7.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.390625, -0.3775672912597656, -0.36450958251953125, -0.3514518737792969, -0.3383941650390625, -0.3253364562988281, -0.31227874755859375, -0.2992210388183594, -0.286163330078125, -0.2731056213378906, -0.26004791259765625, -0.24699020385742188, -0.2339324951171875, -0.22087478637695312, -0.20781707763671875, -0.19475936889648438, -0.18170166015625, -0.16864395141601562, -0.15558624267578125, -0.14252853393554688, -0.1294708251953125, -0.11641311645507812, -0.10335540771484375, -0.09029769897460938, -0.077239990234375, -0.06418228149414062, -0.05112457275390625, -0.038066864013671875, -0.0250091552734375, -0.011951446533203125, 0.00110626220703125, 0.014163970947265625, 0.0272216796875, 0.040279388427734375, 0.05333709716796875, 0.06639480590820312, 0.0794525146484375, 0.09251022338867188, 0.10556793212890625, 0.11862564086914062, 0.131683349609375, 0.14474105834960938, 0.15779876708984375, 0.17085647583007812, 0.1839141845703125, 0.19697189331054688, 0.21002960205078125, 0.22308731079101562, 0.23614501953125, 0.24920272827148438, 0.26226043701171875, 0.2753181457519531, 0.2883758544921875, 0.3014335632324219, 0.31449127197265625, 0.3275489807128906, 0.340606689453125, 0.3536643981933594, 0.36672210693359375, 0.3797798156738281, 0.3928375244140625, 0.4058952331542969, 0.41895294189453125, 0.4320106506347656, 0.445068359375]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 10.0, 7.0, 5.0, 7.0, 8.0, 17.0, 16.0, 12.0, 32.0, 22.0, 16.0, 33.0, 30.0, 37.0, 32.0, 39.0, 34.0, 40.0, 35.0, 39.0, 41.0, 53.0, 45.0, 45.0, 28.0, 33.0, 38.0, 37.0, 21.0, 25.0, 17.0, 28.0, 20.0, 25.0, 10.0, 15.0, 8.0, 9.0, 7.0, 4.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.369140625, -2.29351806640625, -2.2178955078125, -2.14227294921875, -2.066650390625, -1.99102783203125, -1.9154052734375, -1.83978271484375, -1.76416015625, -1.68853759765625, -1.6129150390625, -1.53729248046875, -1.461669921875, -1.38604736328125, -1.3104248046875, -1.23480224609375, -1.1591796875, -1.08355712890625, -1.0079345703125, -0.93231201171875, -0.856689453125, -0.78106689453125, -0.7054443359375, -0.62982177734375, -0.55419921875, -0.47857666015625, -0.4029541015625, -0.32733154296875, -0.251708984375, -0.17608642578125, -0.1004638671875, -0.02484130859375, 0.05078125, 0.12640380859375, 0.2020263671875, 0.27764892578125, 0.353271484375, 0.42889404296875, 0.5045166015625, 0.58013916015625, 0.65576171875, 0.73138427734375, 0.8070068359375, 0.88262939453125, 0.958251953125, 1.03387451171875, 1.1094970703125, 1.18511962890625, 1.2607421875, 1.33636474609375, 1.4119873046875, 1.48760986328125, 1.563232421875, 1.63885498046875, 1.7144775390625, 1.79010009765625, 1.86572265625, 1.94134521484375, 2.0169677734375, 2.09259033203125, 2.168212890625, 2.24383544921875, 2.3194580078125, 2.39508056640625, 2.470703125]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 14.0, 10.0, 16.0, 15.0, 34.0, 39.0, 42.0, 56.0, 90.0, 125.0, 178.0, 212.0, 353.0, 524.0, 834.0, 1382.0, 2716.0, 6353.0, 18025.0, 75149.0, 898257.0, 27331.0, 8642.0, 3626.0, 1635.0, 936.0, 606.0, 383.0, 255.0, 200.0, 127.0, 90.0, 71.0, 51.0, 47.0, 32.0, 25.0, 17.0, 12.0, 10.0, 7.0, 5.0, 4.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.447265625, -1.40362548828125, -1.3599853515625, -1.31634521484375, -1.272705078125, -1.22906494140625, -1.1854248046875, -1.14178466796875, -1.09814453125, -1.05450439453125, -1.0108642578125, -0.96722412109375, -0.923583984375, -0.87994384765625, -0.8363037109375, -0.79266357421875, -0.7490234375, -0.70538330078125, -0.6617431640625, -0.61810302734375, -0.574462890625, -0.53082275390625, -0.4871826171875, -0.44354248046875, -0.39990234375, -0.35626220703125, -0.3126220703125, -0.26898193359375, -0.225341796875, -0.18170166015625, -0.1380615234375, -0.09442138671875, -0.05078125, -0.00714111328125, 0.0364990234375, 0.08013916015625, 0.123779296875, 0.16741943359375, 0.2110595703125, 0.25469970703125, 0.29833984375, 0.34197998046875, 0.3856201171875, 0.42926025390625, 0.472900390625, 0.51654052734375, 0.5601806640625, 0.60382080078125, 0.6474609375, 0.69110107421875, 0.7347412109375, 0.77838134765625, 0.822021484375, 0.86566162109375, 0.9093017578125, 0.95294189453125, 0.99658203125, 1.04022216796875, 1.0838623046875, 1.12750244140625, 1.171142578125, 1.21478271484375, 1.2584228515625, 1.30206298828125, 1.345703125]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 13.0, 5.0, 13.0, 15.0, 16.0, 18.0, 17.0, 19.0, 17.0, 27.0, 29.0, 32.0, 27.0, 50.0, 41.0, 57.0, 38.0, 32.0, 39.0, 46.0, 53.0, 43.0, 39.0, 37.0, 40.0, 29.0, 22.0, 27.0, 18.0, 25.0, 14.0, 16.0, 18.0, 9.0, 6.0, 12.0, 6.0, 4.0, 3.0, 7.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.572265625, -1.5229339599609375, -1.473602294921875, -1.4242706298828125, -1.37493896484375, -1.3256072998046875, -1.276275634765625, -1.2269439697265625, -1.1776123046875, -1.1282806396484375, -1.078948974609375, -1.0296173095703125, -0.98028564453125, -0.9309539794921875, -0.881622314453125, -0.8322906494140625, -0.782958984375, -0.7336273193359375, -0.684295654296875, -0.6349639892578125, -0.58563232421875, -0.5363006591796875, -0.486968994140625, -0.4376373291015625, -0.3883056640625, -0.3389739990234375, -0.289642333984375, -0.2403106689453125, -0.19097900390625, -0.1416473388671875, -0.092315673828125, -0.0429840087890625, 0.00634765625, 0.0556793212890625, 0.105010986328125, 0.1543426513671875, 0.20367431640625, 0.2530059814453125, 0.302337646484375, 0.3516693115234375, 0.4010009765625, 0.4503326416015625, 0.499664306640625, 0.5489959716796875, 0.59832763671875, 0.6476593017578125, 0.696990966796875, 0.7463226318359375, 0.795654296875, 0.8449859619140625, 0.894317626953125, 0.9436492919921875, 0.99298095703125, 1.0423126220703125, 1.091644287109375, 1.1409759521484375, 1.1903076171875, 1.2396392822265625, 1.288970947265625, 1.3383026123046875, 1.38763427734375, 1.4369659423828125, 1.486297607421875, 1.5356292724609375, 1.5849609375]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 9.0, 4.0, 16.0, 12.0, 8.0, 17.0, 23.0, 34.0, 52.0, 55.0, 106.0, 147.0, 198.0, 301.0, 506.0, 848.0, 1541.0, 3171.0, 8042.0, 28283.0, 944259.0, 42468.0, 10181.0, 3870.0, 1846.0, 907.0, 561.0, 340.0, 223.0, 163.0, 109.0, 77.0, 64.0, 28.0, 22.0, 25.0, 14.0, 12.0, 2.0, 3.0, 5.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.1715087890625, -0.16640663146972656, -0.16130447387695312, -0.1562023162841797, -0.15110015869140625, -0.1459980010986328, -0.14089584350585938, -0.13579368591308594, -0.1306915283203125, -0.12558937072753906, -0.12048721313476562, -0.11538505554199219, -0.11028289794921875, -0.10518074035644531, -0.10007858276367188, -0.09497642517089844, -0.089874267578125, -0.08477210998535156, -0.07966995239257812, -0.07456779479980469, -0.06946563720703125, -0.06436347961425781, -0.059261322021484375, -0.05415916442871094, -0.0490570068359375, -0.04395484924316406, -0.038852691650390625, -0.03375053405761719, -0.02864837646484375, -0.023546218872070312, -0.018444061279296875, -0.013341903686523438, -0.00823974609375, -0.0031375885009765625, 0.001964569091796875, 0.0070667266845703125, 0.01216888427734375, 0.017271041870117188, 0.022373199462890625, 0.027475357055664062, 0.0325775146484375, 0.03767967224121094, 0.042781829833984375, 0.04788398742675781, 0.05298614501953125, 0.05808830261230469, 0.06319046020507812, 0.06829261779785156, 0.073394775390625, 0.07849693298339844, 0.08359909057617188, 0.08870124816894531, 0.09380340576171875, 0.09890556335449219, 0.10400772094726562, 0.10910987854003906, 0.1142120361328125, 0.11931419372558594, 0.12441635131835938, 0.1295185089111328, 0.13462066650390625, 0.1397228240966797, 0.14482498168945312, 0.14992713928222656, 0.155029296875]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 10.0, 16.0, 22.0, 24.0, 35.0, 39.0, 43.0, 64.0, 65.0, 78.0, 75.0, 90.0, 79.0, 60.0, 55.0, 48.0, 37.0, 50.0, 19.0, 23.0, 12.0, 9.0, 8.0, 7.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6133995056152344e-05, -4.468485713005066e-05, -4.3235719203948975e-05, -4.178658127784729e-05, -4.0337443351745605e-05, -3.888830542564392e-05, -3.7439167499542236e-05, -3.599002957344055e-05, -3.454089164733887e-05, -3.309175372123718e-05, -3.16426157951355e-05, -3.0193477869033813e-05, -2.874433994293213e-05, -2.7295202016830444e-05, -2.584606409072876e-05, -2.4396926164627075e-05, -2.294778823852539e-05, -2.1498650312423706e-05, -2.004951238632202e-05, -1.8600374460220337e-05, -1.7151236534118652e-05, -1.5702098608016968e-05, -1.4252960681915283e-05, -1.2803822755813599e-05, -1.1354684829711914e-05, -9.90554690361023e-06, -8.456408977508545e-06, -7.00727105140686e-06, -5.558133125305176e-06, -4.108995199203491e-06, -2.6598572731018066e-06, -1.210719347000122e-06, 2.384185791015625e-07, 1.687556505203247e-06, 3.1366944313049316e-06, 4.585832357406616e-06, 6.034970283508301e-06, 7.484108209609985e-06, 8.93324613571167e-06, 1.0382384061813354e-05, 1.1831521987915039e-05, 1.3280659914016724e-05, 1.4729797840118408e-05, 1.6178935766220093e-05, 1.7628073692321777e-05, 1.9077211618423462e-05, 2.0526349544525146e-05, 2.197548747062683e-05, 2.3424625396728516e-05, 2.48737633228302e-05, 2.6322901248931885e-05, 2.777203917503357e-05, 2.9221177101135254e-05, 3.067031502723694e-05, 3.211945295333862e-05, 3.356859087944031e-05, 3.501772880554199e-05, 3.646686673164368e-05, 3.791600465774536e-05, 3.9365142583847046e-05, 4.081428050994873e-05, 4.2263418436050415e-05, 4.37125563621521e-05, 4.5161694288253784e-05, 4.661083221435547e-05]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 9.0, 10.0, 16.0, 26.0, 21.0, 20.0, 55.0, 68.0, 117.0, 257.0, 1289.0, 20283.0, 882624.0, 138372.0, 4371.0, 507.0, 163.0, 98.0, 67.0, 39.0, 33.0, 27.0, 17.0, 17.0, 9.0, 5.0, 9.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.357666015625, -0.34737396240234375, -0.3370819091796875, -0.32678985595703125, -0.316497802734375, -0.30620574951171875, -0.2959136962890625, -0.28562164306640625, -0.27532958984375, -0.26503753662109375, -0.2547454833984375, -0.24445343017578125, -0.234161376953125, -0.22386932373046875, -0.2135772705078125, -0.20328521728515625, -0.1929931640625, -0.18270111083984375, -0.1724090576171875, -0.16211700439453125, -0.151824951171875, -0.14153289794921875, -0.1312408447265625, -0.12094879150390625, -0.11065673828125, -0.10036468505859375, -0.0900726318359375, -0.07978057861328125, -0.069488525390625, -0.05919647216796875, -0.0489044189453125, -0.03861236572265625, -0.0283203125, -0.01802825927734375, -0.0077362060546875, 0.00255584716796875, 0.012847900390625, 0.02313995361328125, 0.0334320068359375, 0.04372406005859375, 0.05401611328125, 0.06430816650390625, 0.0746002197265625, 0.08489227294921875, 0.095184326171875, 0.10547637939453125, 0.1157684326171875, 0.12606048583984375, 0.1363525390625, 0.14664459228515625, 0.1569366455078125, 0.16722869873046875, 0.177520751953125, 0.18781280517578125, 0.1981048583984375, 0.20839691162109375, 0.21868896484375, 0.22898101806640625, 0.2392730712890625, 0.24956512451171875, 0.259857177734375, 0.27014923095703125, 0.2804412841796875, 0.29073333740234375, 0.301025390625]}, "gradients/decoder.roberta.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 10.0, 16.0, 8.0, 17.0, 15.0, 33.0, 44.0, 58.0, 76.0, 82.0, 120.0, 119.0, 99.0, 70.0, 62.0, 53.0, 33.0, 21.0, 16.0, 18.0, 8.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024200439453125, -0.023373842239379883, -0.022547245025634766, -0.02172064781188965, -0.02089405059814453, -0.020067453384399414, -0.019240856170654297, -0.01841425895690918, -0.017587661743164062, -0.016761064529418945, -0.015934467315673828, -0.015107870101928711, -0.014281272888183594, -0.013454675674438477, -0.01262807846069336, -0.011801481246948242, -0.010974884033203125, -0.010148286819458008, -0.00932168960571289, -0.008495092391967773, -0.007668495178222656, -0.006841897964477539, -0.006015300750732422, -0.005188703536987305, -0.0043621063232421875, -0.0035355091094970703, -0.002708911895751953, -0.001882314682006836, -0.0010557174682617188, -0.00022912025451660156, 0.0005974769592285156, 0.0014240741729736328, 0.00225067138671875, 0.003077268600463867, 0.0039038658142089844, 0.0047304630279541016, 0.005557060241699219, 0.006383657455444336, 0.007210254669189453, 0.00803685188293457, 0.008863449096679688, 0.009690046310424805, 0.010516643524169922, 0.011343240737915039, 0.012169837951660156, 0.012996435165405273, 0.01382303237915039, 0.014649629592895508, 0.015476226806640625, 0.016302824020385742, 0.01712942123413086, 0.017956018447875977, 0.018782615661621094, 0.01960921287536621, 0.020435810089111328, 0.021262407302856445, 0.022089004516601562, 0.02291560173034668, 0.023742198944091797, 0.024568796157836914, 0.02539539337158203, 0.02622199058532715, 0.027048587799072266, 0.027875185012817383, 0.0287017822265625]}, "gradients/decoder.roberta.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 11.0, 32.0, 76.0, 142.0, 204.0, 201.0, 161.0, 99.0, 52.0, 24.0, 8.0, 3.0, 1.0], "bins": [-14.691914558410645, -14.430069923400879, -14.16822624206543, -13.906381607055664, -13.644536972045898, -13.38269329071045, -13.120848655700684, -12.859004020690918, -12.597160339355469, -12.335315704345703, -12.073472023010254, -11.811627388000488, -11.549782752990723, -11.287939071655273, -11.026094436645508, -10.764249801635742, -10.502405166625977, -10.240560531616211, -9.978716850280762, -9.716872215270996, -9.45502758026123, -9.193183898925781, -8.931339263916016, -8.66949462890625, -8.4076509475708, -8.145806312561035, -7.883962154388428, -7.62211799621582, -7.360273838043213, -7.0984296798706055, -6.83658504486084, -6.574740886688232, -6.312896728515625, -6.051052570343018, -5.789207935333252, -5.5273637771606445, -5.265519618988037, -5.00367546081543, -4.741830825805664, -4.479986667633057, -4.218142032623291, -3.9562976360321045, -3.694453477859497, -3.4326090812683105, -3.170764923095703, -2.9089205265045166, -2.64707612991333, -2.3852319717407227, -2.123387575149536, -1.8615432977676392, -1.5996990203857422, -1.3378546237945557, -1.0760103464126587, -0.8141660690307617, -0.5523216724395752, -0.2904773950576782, -0.02863311767578125, 0.2332111895084381, 0.49505549669265747, 0.7568998336791992, 1.0187441110610962, 1.2805883884429932, 1.5424327850341797, 1.8042770624160767, 2.0661213397979736]}, "gradients/decoder.roberta.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 8.0, 6.0, 7.0, 8.0, 16.0, 16.0, 13.0, 30.0, 22.0, 17.0, 33.0, 31.0, 35.0, 32.0, 41.0, 32.0, 43.0, 32.0, 39.0, 41.0, 51.0, 48.0, 46.0, 28.0, 32.0, 39.0, 37.0, 21.0, 25.0, 17.0, 26.0, 21.0, 26.0, 10.0, 14.0, 9.0, 9.0, 7.0, 4.0, 6.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.375817060470581, -2.3000807762145996, -2.224344491958618, -2.148608446121216, -2.0728721618652344, -1.997135877609253, -1.9213995933532715, -1.84566330909729, -1.7699271440505981, -1.6941908597946167, -1.6184546947479248, -1.5427184104919434, -1.466982126235962, -1.39124596118927, -1.3155096769332886, -1.2397735118865967, -1.1640372276306152, -1.0883009433746338, -1.012564778327942, -0.9368284940719604, -0.8610922694206238, -0.7853560447692871, -0.7096197605133057, -0.633883535861969, -0.5581473112106323, -0.48241108655929565, -0.4066748321056366, -0.33093857765197754, -0.25520235300064087, -0.1794661283493042, -0.10372987389564514, -0.027993619441986084, 0.047742605209350586, 0.12347884476184845, 0.1992150843143463, 0.27495133876800537, 0.35068756341934204, 0.4264237880706787, 0.5021600723266602, 0.5778962969779968, 0.6536325216293335, 0.7293687462806702, 0.8051049709320068, 0.8808412551879883, 0.956577479839325, 1.0323137044906616, 1.108049988746643, 1.183786153793335, 1.2595224380493164, 1.3352587223052979, 1.4109948873519897, 1.4867311716079712, 1.562467336654663, 1.6382036209106445, 1.713939905166626, 1.7896761894226074, 1.8654123544692993, 1.9411486387252808, 2.0168848037719727, 2.092621088027954, 2.1683573722839355, 2.244093418121338, 2.3198297023773193, 2.395565986633301, 2.4713022708892822]}, "gradients/decoder.roberta.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 14.0, 14.0, 17.0, 25.0, 30.0, 41.0, 46.0, 80.0, 128.0, 189.0, 303.0, 468.0, 630.0, 1127.0, 1746.0, 2824.0, 4567.0, 7463.0, 12538.0, 21021.0, 38136.0, 71305.0, 140054.0, 246901.0, 228568.0, 124255.0, 63457.0, 34075.0, 19180.0, 11217.0, 6885.0, 4234.0, 2583.0, 1557.0, 998.0, 657.0, 415.0, 283.0, 172.0, 112.0, 71.0, 49.0, 37.0, 23.0, 18.0, 10.0, 7.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.8681640625, -1.8077239990234375, -1.747283935546875, -1.6868438720703125, -1.62640380859375, -1.5659637451171875, -1.505523681640625, -1.4450836181640625, -1.3846435546875, -1.3242034912109375, -1.263763427734375, -1.2033233642578125, -1.14288330078125, -1.0824432373046875, -1.022003173828125, -0.9615631103515625, -0.901123046875, -0.8406829833984375, -0.780242919921875, -0.7198028564453125, -0.65936279296875, -0.5989227294921875, -0.538482666015625, -0.4780426025390625, -0.4176025390625, -0.3571624755859375, -0.296722412109375, -0.2362823486328125, -0.17584228515625, -0.1154022216796875, -0.054962158203125, 0.0054779052734375, 0.06591796875, 0.1263580322265625, 0.186798095703125, 0.2472381591796875, 0.30767822265625, 0.3681182861328125, 0.428558349609375, 0.4889984130859375, 0.5494384765625, 0.6098785400390625, 0.670318603515625, 0.7307586669921875, 0.79119873046875, 0.8516387939453125, 0.912078857421875, 0.9725189208984375, 1.032958984375, 1.0933990478515625, 1.153839111328125, 1.2142791748046875, 1.27471923828125, 1.3351593017578125, 1.395599365234375, 1.4560394287109375, 1.5164794921875, 1.5769195556640625, 1.637359619140625, 1.6977996826171875, 1.75823974609375, 1.8186798095703125, 1.879119873046875, 1.9395599365234375, 2.0]}, "gradients/decoder.roberta.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 10.0, 10.0, 12.0, 18.0, 12.0, 25.0, 27.0, 17.0, 23.0, 34.0, 32.0, 26.0, 50.0, 31.0, 40.0, 37.0, 44.0, 37.0, 44.0, 50.0, 46.0, 37.0, 27.0, 33.0, 37.0, 19.0, 30.0, 18.0, 25.0, 20.0, 23.0, 15.0, 17.0, 8.0, 13.0, 5.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.26953125, -2.1951904296875, -2.120849609375, -2.0465087890625, -1.97216796875, -1.8978271484375, -1.823486328125, -1.7491455078125, -1.6748046875, -1.6004638671875, -1.526123046875, -1.4517822265625, -1.37744140625, -1.3031005859375, -1.228759765625, -1.1544189453125, -1.080078125, -1.0057373046875, -0.931396484375, -0.8570556640625, -0.78271484375, -0.7083740234375, -0.634033203125, -0.5596923828125, -0.4853515625, -0.4110107421875, -0.336669921875, -0.2623291015625, -0.18798828125, -0.1136474609375, -0.039306640625, 0.0350341796875, 0.109375, 0.1837158203125, 0.258056640625, 0.3323974609375, 0.40673828125, 0.4810791015625, 0.555419921875, 0.6297607421875, 0.7041015625, 0.7784423828125, 0.852783203125, 0.9271240234375, 1.00146484375, 1.0758056640625, 1.150146484375, 1.2244873046875, 1.298828125, 1.3731689453125, 1.447509765625, 1.5218505859375, 1.59619140625, 1.6705322265625, 1.744873046875, 1.8192138671875, 1.8935546875, 1.9678955078125, 2.042236328125, 2.1165771484375, 2.19091796875, 2.2652587890625, 2.339599609375, 2.4139404296875, 2.48828125]}, "gradients/decoder.roberta.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 12.0, 9.0, 21.0, 12.0, 19.0, 35.0, 36.0, 54.0, 60.0, 88.0, 96.0, 130.0, 144.0, 334.0, 1045267.0, 1387.0, 165.0, 144.0, 110.0, 93.0, 74.0, 59.0, 46.0, 30.0, 28.0, 18.0, 20.0, 15.0, 7.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-78.5, -76.296875, -74.09375, -71.890625, -69.6875, -67.484375, -65.28125, -63.078125, -60.875, -58.671875, -56.46875, -54.265625, -52.0625, -49.859375, -47.65625, -45.453125, -43.25, -41.046875, -38.84375, -36.640625, -34.4375, -32.234375, -30.03125, -27.828125, -25.625, -23.421875, -21.21875, -19.015625, -16.8125, -14.609375, -12.40625, -10.203125, -8.0, -5.796875, -3.59375, -1.390625, 0.8125, 3.015625, 5.21875, 7.421875, 9.625, 11.828125, 14.03125, 16.234375, 18.4375, 20.640625, 22.84375, 25.046875, 27.25, 29.453125, 31.65625, 33.859375, 36.0625, 38.265625, 40.46875, 42.671875, 44.875, 47.078125, 49.28125, 51.484375, 53.6875, 55.890625, 58.09375, 60.296875, 62.5]}, "gradients/decoder.roberta.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 7.0, 9.0, 12.0, 7.0, 23.0, 12.0, 26.0, 29.0, 41.0, 40.0, 45.0, 43.0, 50.0, 59.0, 50.0, 66.0, 56.0, 52.0, 43.0, 50.0, 46.0, 47.0, 34.0, 25.0, 25.0, 17.0, 18.0, 18.0, 8.0, 10.0, 7.0, 7.0, 6.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.750030517578125, -2.65435791015625, -2.558685302734375, -2.4630126953125, -2.367340087890625, -2.27166748046875, -2.175994873046875, -2.080322265625, -1.984649658203125, -1.88897705078125, -1.793304443359375, -1.6976318359375, -1.601959228515625, -1.50628662109375, -1.410614013671875, -1.31494140625, -1.219268798828125, -1.12359619140625, -1.027923583984375, -0.9322509765625, -0.836578369140625, -0.74090576171875, -0.645233154296875, -0.549560546875, -0.453887939453125, -0.35821533203125, -0.262542724609375, -0.1668701171875, -0.071197509765625, 0.02447509765625, 0.120147705078125, 0.2158203125, 0.311492919921875, 0.40716552734375, 0.502838134765625, 0.5985107421875, 0.694183349609375, 0.78985595703125, 0.885528564453125, 0.981201171875, 1.076873779296875, 1.17254638671875, 1.268218994140625, 1.3638916015625, 1.459564208984375, 1.55523681640625, 1.650909423828125, 1.74658203125, 1.842254638671875, 1.93792724609375, 2.033599853515625, 2.1292724609375, 2.224945068359375, 2.32061767578125, 2.416290283203125, 2.511962890625, 2.607635498046875, 2.70330810546875, 2.798980712890625, 2.8946533203125, 2.990325927734375, 3.08599853515625, 3.181671142578125, 3.27734375]}, "gradients/decoder.roberta.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 9.0, 12.0, 21.0, 31.0, 55.0, 105.0, 216.0, 517.0, 1907.0, 19435.0, 805099.0, 212106.0, 7220.0, 1083.0, 348.0, 159.0, 83.0, 39.0, 30.0, 20.0, 9.0, 10.0, 7.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.38671875, -6.18597412109375, -5.9852294921875, -5.78448486328125, -5.583740234375, -5.38299560546875, -5.1822509765625, -4.98150634765625, -4.78076171875, -4.58001708984375, -4.3792724609375, -4.17852783203125, -3.977783203125, -3.77703857421875, -3.5762939453125, -3.37554931640625, -3.1748046875, -2.97406005859375, -2.7733154296875, -2.57257080078125, -2.371826171875, -2.17108154296875, -1.9703369140625, -1.76959228515625, -1.56884765625, -1.36810302734375, -1.1673583984375, -0.96661376953125, -0.765869140625, -0.56512451171875, -0.3643798828125, -0.16363525390625, 0.037109375, 0.23785400390625, 0.4385986328125, 0.63934326171875, 0.840087890625, 1.04083251953125, 1.2415771484375, 1.44232177734375, 1.64306640625, 1.84381103515625, 2.0445556640625, 2.24530029296875, 2.446044921875, 2.64678955078125, 2.8475341796875, 3.04827880859375, 3.2490234375, 3.44976806640625, 3.6505126953125, 3.85125732421875, 4.052001953125, 4.25274658203125, 4.4534912109375, 4.65423583984375, 4.85498046875, 5.05572509765625, 5.2564697265625, 5.45721435546875, 5.657958984375, 5.85870361328125, 6.0594482421875, 6.26019287109375, 6.4609375]}, "gradients/decoder.roberta.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 6.0, 17.0, 24.0, 49.0, 70.0, 93.0, 135.0, 179.0, 137.0, 89.0, 76.0, 36.0, 23.0, 27.0, 11.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003032684326171875, -0.00029421597719192505, -0.0002851635217666626, -0.00027611106634140015, -0.0002670586109161377, -0.00025800615549087524, -0.0002489537000656128, -0.00023990124464035034, -0.0002308487892150879, -0.00022179633378982544, -0.000212743878364563, -0.00020369142293930054, -0.00019463896751403809, -0.00018558651208877563, -0.00017653405666351318, -0.00016748160123825073, -0.00015842914581298828, -0.00014937669038772583, -0.00014032423496246338, -0.00013127177953720093, -0.00012221932411193848, -0.00011316686868667603, -0.00010411441326141357, -9.506195783615112e-05, -8.600950241088867e-05, -7.695704698562622e-05, -6.790459156036377e-05, -5.885213613510132e-05, -4.979968070983887e-05, -4.0747225284576416e-05, -3.1694769859313965e-05, -2.2642314434051514e-05, -1.3589859008789062e-05, -4.537403583526611e-06, 4.51505184173584e-06, 1.3567507266998291e-05, 2.2619962692260742e-05, 3.167241811752319e-05, 4.0724873542785645e-05, 4.9777328968048096e-05, 5.882978439331055e-05, 6.7882239818573e-05, 7.693469524383545e-05, 8.59871506690979e-05, 9.503960609436035e-05, 0.0001040920615196228, 0.00011314451694488525, 0.0001221969723701477, 0.00013124942779541016, 0.0001403018832206726, 0.00014935433864593506, 0.0001584067940711975, 0.00016745924949645996, 0.0001765117049217224, 0.00018556416034698486, 0.00019461661577224731, 0.00020366907119750977, 0.00021272152662277222, 0.00022177398204803467, 0.00023082643747329712, 0.00023987889289855957, 0.000248931348323822, 0.00025798380374908447, 0.0002670362591743469, 0.0002760887145996094]}, "gradients/decoder.roberta.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 12.0, 18.0, 47.0, 122.0, 834.0, 647996.0, 398473.0, 832.0, 123.0, 43.0, 19.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.890625, -16.085693359375, -15.28076171875, -14.475830078125, -13.6708984375, -12.865966796875, -12.06103515625, -11.256103515625, -10.451171875, -9.646240234375, -8.84130859375, -8.036376953125, -7.2314453125, -6.426513671875, -5.62158203125, -4.816650390625, -4.01171875, -3.206787109375, -2.40185546875, -1.596923828125, -0.7919921875, 0.012939453125, 0.81787109375, 1.622802734375, 2.427734375, 3.232666015625, 4.03759765625, 4.842529296875, 5.6474609375, 6.452392578125, 7.25732421875, 8.062255859375, 8.8671875, 9.672119140625, 10.47705078125, 11.281982421875, 12.0869140625, 12.891845703125, 13.69677734375, 14.501708984375, 15.306640625, 16.111572265625, 16.91650390625, 17.721435546875, 18.5263671875, 19.331298828125, 20.13623046875, 20.941162109375, 21.74609375, 22.551025390625, 23.35595703125, 24.160888671875, 24.9658203125, 25.770751953125, 26.57568359375, 27.380615234375, 28.185546875, 28.990478515625, 29.79541015625, 30.600341796875, 31.4052734375, 32.210205078125, 33.01513671875, 33.820068359375, 34.625]}, "gradients/decoder.roberta.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 19.0, 26.0, 55.0, 145.0, 266.0, 253.0, 107.0, 58.0, 25.0, 14.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.31640625, -2.264801025390625, -2.21319580078125, -2.161590576171875, -2.1099853515625, -2.058380126953125, -2.00677490234375, -1.955169677734375, -1.903564453125, -1.851959228515625, -1.80035400390625, -1.748748779296875, -1.6971435546875, -1.645538330078125, -1.59393310546875, -1.542327880859375, -1.49072265625, -1.439117431640625, -1.38751220703125, -1.335906982421875, -1.2843017578125, -1.232696533203125, -1.18109130859375, -1.129486083984375, -1.077880859375, -1.026275634765625, -0.97467041015625, -0.923065185546875, -0.8714599609375, -0.819854736328125, -0.76824951171875, -0.716644287109375, -0.6650390625, -0.613433837890625, -0.56182861328125, -0.510223388671875, -0.4586181640625, -0.407012939453125, -0.35540771484375, -0.303802490234375, -0.252197265625, -0.200592041015625, -0.14898681640625, -0.097381591796875, -0.0457763671875, 0.005828857421875, 0.05743408203125, 0.109039306640625, 0.16064453125, 0.212249755859375, 0.26385498046875, 0.315460205078125, 0.3670654296875, 0.418670654296875, 0.47027587890625, 0.521881103515625, 0.573486328125, 0.625091552734375, 0.67669677734375, 0.728302001953125, 0.7799072265625, 0.831512451171875, 0.88311767578125, 0.934722900390625, 0.986328125]}, "gradients/decoder.roberta.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 18.0, 76.0, 179.0, 239.0, 245.0, 170.0, 62.0, 20.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.978832244873047, -19.600738525390625, -19.22264289855957, -18.84454917907715, -18.466453552246094, -18.088359832763672, -17.71026611328125, -17.332170486450195, -16.954076766967773, -16.57598304748535, -16.197887420654297, -15.819793701171875, -15.441699028015137, -15.063604354858398, -14.68550968170166, -14.307415008544922, -13.929320335388184, -13.551225662231445, -13.173130989074707, -12.795036315917969, -12.416942596435547, -12.038847923278809, -11.66075325012207, -11.282658576965332, -10.904563903808594, -10.526469230651855, -10.148374557495117, -9.770280838012695, -9.392186164855957, -9.014091491699219, -8.63599681854248, -8.257902145385742, -7.879807472229004, -7.501712799072266, -7.1236186027526855, -6.745523929595947, -6.367429733276367, -5.989335060119629, -5.611240386962891, -5.233145713806152, -4.855051517486572, -4.476956844329834, -4.098862648010254, -3.7207679748535156, -3.3426735401153564, -2.9645791053771973, -2.586484432220459, -2.2083899974823, -1.8302955627441406, -1.4522011280059814, -1.0741065740585327, -0.696012020111084, -0.3179175853729248, 0.060176849365234375, 0.43827152252197266, 0.8163659572601318, 1.194460391998291, 1.5725548267364502, 1.950649380683899, 2.3287439346313477, 2.706838369369507, 3.084932804107666, 3.4630274772644043, 3.8411219120025635, 4.219216346740723]}, "gradients/decoder.roberta.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 6.0, 8.0, 9.0, 9.0, 13.0, 18.0, 20.0, 21.0, 21.0, 18.0, 16.0, 28.0, 20.0, 34.0, 37.0, 38.0, 40.0, 39.0, 36.0, 38.0, 30.0, 38.0, 30.0, 44.0, 42.0, 40.0, 28.0, 31.0, 28.0, 24.0, 31.0, 17.0, 20.0, 14.0, 23.0, 14.0, 14.0, 7.0, 9.0, 7.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-2.767303943634033, -2.6738998889923096, -2.580495595932007, -2.487091541290283, -2.3936872482299805, -2.300283193588257, -2.206879138946533, -2.1134748458862305, -2.0200705528259277, -1.9266663789749146, -1.8332622051239014, -1.7398581504821777, -1.646453857421875, -1.5530498027801514, -1.4596456289291382, -1.366241455078125, -1.2728374004364014, -1.1794332265853882, -1.086029052734375, -0.9926249384880066, -0.8992207646369934, -0.8058165907859802, -0.7124124765396118, -0.6190083026885986, -0.5256041288375854, -0.43219995498657227, -0.33879581093788147, -0.24539166688919067, -0.1519874930381775, -0.05858331918716431, 0.0348207950592041, 0.12822496891021729, 0.22162890434265137, 0.31503307819366455, 0.40843722224235535, 0.5018413662910461, 0.5952455401420593, 0.6886497139930725, 0.7820538282394409, 0.8754580020904541, 0.9688621759414673, 1.0622663497924805, 1.1556705236434937, 1.2490746974945068, 1.3424787521362305, 1.4358830451965332, 1.5292870998382568, 1.62269127368927, 1.7160954475402832, 1.8094996213912964, 1.9029037952423096, 1.9963078498840332, 2.089712142944336, 2.1831161975860596, 2.276520252227783, 2.369924545288086, 2.4633288383483887, 2.5567328929901123, 2.650137186050415, 2.7435412406921387, 2.8369455337524414, 2.930349588394165, 3.0237536430358887, 3.1171579360961914, 3.210561990737915]}, "gradients/decoder.roberta.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 3.0, 5.0, 6.0, 11.0, 11.0, 10.0, 18.0, 18.0, 19.0, 33.0, 49.0, 63.0, 95.0, 183.0, 317.0, 618.0, 1255.0, 4105.0, 20274.0, 236690.0, 3657745.0, 244954.0, 20902.0, 4075.0, 1320.0, 642.0, 319.0, 168.0, 119.0, 62.0, 35.0, 44.0, 22.0, 20.0, 13.0, 13.0, 10.0, 8.0, 3.0, 7.0, 4.0, 6.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.89984130859375, -6.6395263671875, -6.37921142578125, -6.118896484375, -5.85858154296875, -5.5982666015625, -5.33795166015625, -5.07763671875, -4.81732177734375, -4.5570068359375, -4.29669189453125, -4.036376953125, -3.77606201171875, -3.5157470703125, -3.25543212890625, -2.9951171875, -2.73480224609375, -2.4744873046875, -2.21417236328125, -1.953857421875, -1.69354248046875, -1.4332275390625, -1.17291259765625, -0.91259765625, -0.65228271484375, -0.3919677734375, -0.13165283203125, 0.128662109375, 0.38897705078125, 0.6492919921875, 0.90960693359375, 1.169921875, 1.43023681640625, 1.6905517578125, 1.95086669921875, 2.211181640625, 2.47149658203125, 2.7318115234375, 2.99212646484375, 3.25244140625, 3.51275634765625, 3.7730712890625, 4.03338623046875, 4.293701171875, 4.55401611328125, 4.8143310546875, 5.07464599609375, 5.3349609375, 5.59527587890625, 5.8555908203125, 6.11590576171875, 6.376220703125, 6.63653564453125, 6.8968505859375, 7.15716552734375, 7.41748046875, 7.67779541015625, 7.9381103515625, 8.19842529296875, 8.458740234375, 8.71905517578125, 8.9793701171875, 9.23968505859375, 9.5]}, "gradients/decoder.roberta.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 2.0, 6.0, 4.0, 2.0, 11.0, 8.0, 9.0, 13.0, 12.0, 16.0, 16.0, 25.0, 24.0, 20.0, 17.0, 23.0, 42.0, 34.0, 34.0, 35.0, 30.0, 32.0, 45.0, 37.0, 42.0, 45.0, 40.0, 27.0, 34.0, 35.0, 31.0, 34.0, 20.0, 25.0, 24.0, 27.0, 25.0, 11.0, 18.0, 12.0, 10.0, 10.0, 7.0, 14.0, 3.0, 5.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0], "bins": [-1.869140625, -1.814056396484375, -1.75897216796875, -1.703887939453125, -1.6488037109375, -1.593719482421875, -1.53863525390625, -1.483551025390625, -1.428466796875, -1.373382568359375, -1.31829833984375, -1.263214111328125, -1.2081298828125, -1.153045654296875, -1.09796142578125, -1.042877197265625, -0.98779296875, -0.932708740234375, -0.87762451171875, -0.822540283203125, -0.7674560546875, -0.712371826171875, -0.65728759765625, -0.602203369140625, -0.547119140625, -0.492034912109375, -0.43695068359375, -0.381866455078125, -0.3267822265625, -0.271697998046875, -0.21661376953125, -0.161529541015625, -0.1064453125, -0.051361083984375, 0.00372314453125, 0.058807373046875, 0.1138916015625, 0.168975830078125, 0.22406005859375, 0.279144287109375, 0.334228515625, 0.389312744140625, 0.44439697265625, 0.499481201171875, 0.5545654296875, 0.609649658203125, 0.66473388671875, 0.719818115234375, 0.77490234375, 0.829986572265625, 0.88507080078125, 0.940155029296875, 0.9952392578125, 1.050323486328125, 1.10540771484375, 1.160491943359375, 1.215576171875, 1.270660400390625, 1.32574462890625, 1.380828857421875, 1.4359130859375, 1.490997314453125, 1.54608154296875, 1.601165771484375, 1.65625]}, "gradients/decoder.roberta.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 3.0, 8.0, 13.0, 13.0, 17.0, 33.0, 40.0, 78.0, 105.0, 193.0, 310.0, 704.0, 3029.0, 61873.0, 4071551.0, 52046.0, 2855.0, 606.0, 301.0, 172.0, 84.0, 63.0, 45.0, 34.0, 20.0, 26.0, 13.0, 9.0, 6.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.71875, -21.0888671875, -20.458984375, -19.8291015625, -19.19921875, -18.5693359375, -17.939453125, -17.3095703125, -16.6796875, -16.0498046875, -15.419921875, -14.7900390625, -14.16015625, -13.5302734375, -12.900390625, -12.2705078125, -11.640625, -11.0107421875, -10.380859375, -9.7509765625, -9.12109375, -8.4912109375, -7.861328125, -7.2314453125, -6.6015625, -5.9716796875, -5.341796875, -4.7119140625, -4.08203125, -3.4521484375, -2.822265625, -2.1923828125, -1.5625, -0.9326171875, -0.302734375, 0.3271484375, 0.95703125, 1.5869140625, 2.216796875, 2.8466796875, 3.4765625, 4.1064453125, 4.736328125, 5.3662109375, 5.99609375, 6.6259765625, 7.255859375, 7.8857421875, 8.515625, 9.1455078125, 9.775390625, 10.4052734375, 11.03515625, 11.6650390625, 12.294921875, 12.9248046875, 13.5546875, 14.1845703125, 14.814453125, 15.4443359375, 16.07421875, 16.7041015625, 17.333984375, 17.9638671875, 18.59375]}, "gradients/decoder.roberta.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 8.0, 3.0, 9.0, 21.0, 20.0, 31.0, 54.0, 74.0, 92.0, 146.0, 237.0, 416.0, 737.0, 946.0, 444.0, 280.0, 172.0, 117.0, 80.0, 57.0, 40.0, 27.0, 17.0, 10.0, 7.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.173828125, -1.1319580078125, -1.090087890625, -1.0482177734375, -1.00634765625, -0.9644775390625, -0.922607421875, -0.8807373046875, -0.8388671875, -0.7969970703125, -0.755126953125, -0.7132568359375, -0.67138671875, -0.6295166015625, -0.587646484375, -0.5457763671875, -0.50390625, -0.4620361328125, -0.420166015625, -0.3782958984375, -0.33642578125, -0.2945556640625, -0.252685546875, -0.2108154296875, -0.1689453125, -0.1270751953125, -0.085205078125, -0.0433349609375, -0.00146484375, 0.0404052734375, 0.082275390625, 0.1241455078125, 0.166015625, 0.2078857421875, 0.249755859375, 0.2916259765625, 0.33349609375, 0.3753662109375, 0.417236328125, 0.4591064453125, 0.5009765625, 0.5428466796875, 0.584716796875, 0.6265869140625, 0.66845703125, 0.7103271484375, 0.752197265625, 0.7940673828125, 0.8359375, 0.8778076171875, 0.919677734375, 0.9615478515625, 1.00341796875, 1.0452880859375, 1.087158203125, 1.1290283203125, 1.1708984375, 1.2127685546875, 1.254638671875, 1.2965087890625, 1.33837890625, 1.3802490234375, 1.422119140625, 1.4639892578125, 1.505859375]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 18.0, 42.0, 68.0, 108.0, 139.0, 173.0, 169.0, 114.0, 67.0, 55.0, 28.0, 14.0, 2.0, 4.0, 4.0], "bins": [-10.729928970336914, -10.533834457397461, -10.337740898132324, -10.141646385192871, -9.945551872253418, -9.749458312988281, -9.553363800048828, -9.357269287109375, -9.161174774169922, -8.965080261230469, -8.768986701965332, -8.572892189025879, -8.376797676086426, -8.180704116821289, -7.984609603881836, -7.788515090942383, -7.592421531677246, -7.396327495574951, -7.200232982635498, -7.004138946533203, -6.80804443359375, -6.611950397491455, -6.41585636138916, -6.219761848449707, -6.023667812347412, -5.827573776245117, -5.631479263305664, -5.435385227203369, -5.239291191101074, -5.043196678161621, -4.847102642059326, -4.651008605957031, -4.454914093017578, -4.258820056915283, -4.06272554397583, -3.866631507873535, -3.670537233352661, -3.474442958831787, -3.278348922729492, -3.082254648208618, -2.886160373687744, -2.69006609916687, -2.493971824645996, -2.297877788543701, -2.101783514022827, -1.9056892395019531, -1.7095950841903687, -1.5135009288787842, -1.3174067735671997, -1.1213126182556152, -0.9252183437347412, -0.729124128818512, -0.5330299139022827, -0.33693569898605347, -0.14084148406982422, 0.055252671241760254, 0.2513469457626343, 0.4474411606788635, 0.6435353755950928, 0.839629590511322, 1.0357238054275513, 1.2318179607391357, 1.4279122352600098, 1.6240063905715942, 1.8201006650924683]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 7.0, 10.0, 8.0, 6.0, 12.0, 12.0, 12.0, 20.0, 21.0, 15.0, 19.0, 29.0, 26.0, 40.0, 24.0, 35.0, 45.0, 32.0, 36.0, 34.0, 41.0, 42.0, 39.0, 26.0, 37.0, 44.0, 33.0, 26.0, 34.0, 28.0, 28.0, 25.0, 19.0, 17.0, 27.0, 18.0, 12.0, 9.0, 9.0, 14.0, 4.0, 7.0, 4.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-2.21537709236145, -2.1458685398101807, -2.076359748840332, -2.0068511962890625, -1.937342643737793, -1.8678340911865234, -1.7983254194259644, -1.7288167476654053, -1.6593081951141357, -1.5897996425628662, -1.5202909708023071, -1.450782299041748, -1.3812737464904785, -1.311765193939209, -1.24225652217865, -1.1727478504180908, -1.1032392978668213, -1.0337307453155518, -0.9642220735549927, -0.8947134613990784, -0.8252048492431641, -0.7556962370872498, -0.6861876249313354, -0.6166790127754211, -0.5471704006195068, -0.47766178846359253, -0.4081531763076782, -0.3386445641517639, -0.2691359519958496, -0.1996273398399353, -0.130118727684021, -0.06061011552810669, 0.008898496627807617, 0.07840710878372192, 0.14791572093963623, 0.21742433309555054, 0.28693294525146484, 0.35644155740737915, 0.42595016956329346, 0.49545878171920776, 0.5649673938751221, 0.6344760060310364, 0.7039846181869507, 0.773493230342865, 0.8430018424987793, 0.9125104546546936, 0.9820190668106079, 1.051527738571167, 1.1210362911224365, 1.190544843673706, 1.2600535154342651, 1.3295621871948242, 1.3990707397460938, 1.4685792922973633, 1.5380879640579224, 1.6075966358184814, 1.677105188369751, 1.7466137409210205, 1.8161224126815796, 1.8856310844421387, 1.9551396369934082, 2.0246481895446777, 2.0941567420959473, 2.163665533065796, 2.2331740856170654]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 6.0, 15.0, 18.0, 15.0, 27.0, 43.0, 47.0, 95.0, 148.0, 185.0, 285.0, 406.0, 581.0, 808.0, 1153.0, 1686.0, 2424.0, 3603.0, 5425.0, 7841.0, 11876.0, 18398.0, 28678.0, 46133.0, 77679.0, 129568.0, 195921.0, 191180.0, 124544.0, 73971.0, 44747.0, 27768.0, 17421.0, 11853.0, 7581.0, 5232.0, 3495.0, 2352.0, 1723.0, 1174.0, 763.0, 512.0, 342.0, 269.0, 179.0, 123.0, 82.0, 55.0, 34.0, 38.0, 23.0, 16.0, 10.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3525390625, -0.3411521911621094, -0.32976531982421875, -0.3183784484863281, -0.3069915771484375, -0.2956047058105469, -0.28421783447265625, -0.2728309631347656, -0.261444091796875, -0.2500572204589844, -0.23867034912109375, -0.22728347778320312, -0.2158966064453125, -0.20450973510742188, -0.19312286376953125, -0.18173599243164062, -0.17034912109375, -0.15896224975585938, -0.14757537841796875, -0.13618850708007812, -0.1248016357421875, -0.11341476440429688, -0.10202789306640625, -0.09064102172851562, -0.079254150390625, -0.06786727905273438, -0.05648040771484375, -0.045093536376953125, -0.0337066650390625, -0.022319793701171875, -0.01093292236328125, 0.000453948974609375, 0.0118408203125, 0.023227691650390625, 0.03461456298828125, 0.046001434326171875, 0.0573883056640625, 0.06877517700195312, 0.08016204833984375, 0.09154891967773438, 0.102935791015625, 0.11432266235351562, 0.12570953369140625, 0.13709640502929688, 0.1484832763671875, 0.15987014770507812, 0.17125701904296875, 0.18264389038085938, 0.19403076171875, 0.20541763305664062, 0.21680450439453125, 0.22819137573242188, 0.2395782470703125, 0.2509651184082031, 0.26235198974609375, 0.2737388610839844, 0.285125732421875, 0.2965126037597656, 0.30789947509765625, 0.3192863464355469, 0.3306732177734375, 0.3420600891113281, 0.35344696044921875, 0.3648338317871094, 0.376220703125]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 13.0, 9.0, 6.0, 10.0, 13.0, 11.0, 22.0, 20.0, 14.0, 23.0, 26.0, 28.0, 36.0, 25.0, 33.0, 47.0, 33.0, 36.0, 39.0, 37.0, 42.0, 35.0, 31.0, 35.0, 46.0, 32.0, 30.0, 33.0, 23.0, 32.0, 26.0, 17.0, 23.0, 24.0, 15.0, 10.0, 13.0, 8.0, 12.0, 4.0, 7.0, 6.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-2.193359375, -2.125823974609375, -2.05828857421875, -1.990753173828125, -1.9232177734375, -1.855682373046875, -1.78814697265625, -1.720611572265625, -1.653076171875, -1.585540771484375, -1.51800537109375, -1.450469970703125, -1.3829345703125, -1.315399169921875, -1.24786376953125, -1.180328369140625, -1.11279296875, -1.045257568359375, -0.97772216796875, -0.910186767578125, -0.8426513671875, -0.775115966796875, -0.70758056640625, -0.640045166015625, -0.572509765625, -0.504974365234375, -0.43743896484375, -0.369903564453125, -0.3023681640625, -0.234832763671875, -0.16729736328125, -0.099761962890625, -0.0322265625, 0.035308837890625, 0.10284423828125, 0.170379638671875, 0.2379150390625, 0.305450439453125, 0.37298583984375, 0.440521240234375, 0.508056640625, 0.575592041015625, 0.64312744140625, 0.710662841796875, 0.7781982421875, 0.845733642578125, 0.91326904296875, 0.980804443359375, 1.04833984375, 1.115875244140625, 1.18341064453125, 1.250946044921875, 1.3184814453125, 1.386016845703125, 1.45355224609375, 1.521087646484375, 1.588623046875, 1.656158447265625, 1.72369384765625, 1.791229248046875, 1.8587646484375, 1.926300048828125, 1.99383544921875, 2.061370849609375, 2.12890625]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 5.0, 9.0, 13.0, 11.0, 13.0, 35.0, 43.0, 73.0, 83.0, 132.0, 155.0, 264.0, 429.0, 692.0, 1313.0, 2789.0, 7540.0, 30253.0, 936324.0, 50340.0, 10679.0, 3499.0, 1594.0, 787.0, 551.0, 286.0, 189.0, 143.0, 92.0, 73.0, 55.0, 31.0, 20.0, 9.0, 11.0, 7.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7900390625, -1.735198974609375, -1.68035888671875, -1.625518798828125, -1.5706787109375, -1.515838623046875, -1.46099853515625, -1.406158447265625, -1.351318359375, -1.296478271484375, -1.24163818359375, -1.186798095703125, -1.1319580078125, -1.077117919921875, -1.02227783203125, -0.967437744140625, -0.91259765625, -0.857757568359375, -0.80291748046875, -0.748077392578125, -0.6932373046875, -0.638397216796875, -0.58355712890625, -0.528717041015625, -0.473876953125, -0.419036865234375, -0.36419677734375, -0.309356689453125, -0.2545166015625, -0.199676513671875, -0.14483642578125, -0.089996337890625, -0.03515625, 0.019683837890625, 0.07452392578125, 0.129364013671875, 0.1842041015625, 0.239044189453125, 0.29388427734375, 0.348724365234375, 0.403564453125, 0.458404541015625, 0.51324462890625, 0.568084716796875, 0.6229248046875, 0.677764892578125, 0.73260498046875, 0.787445068359375, 0.84228515625, 0.897125244140625, 0.95196533203125, 1.006805419921875, 1.0616455078125, 1.116485595703125, 1.17132568359375, 1.226165771484375, 1.281005859375, 1.335845947265625, 1.39068603515625, 1.445526123046875, 1.5003662109375, 1.555206298828125, 1.61004638671875, 1.664886474609375, 1.7197265625]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 3.0, 17.0, 4.0, 13.0, 14.0, 20.0, 12.0, 17.0, 27.0, 20.0, 32.0, 39.0, 36.0, 33.0, 44.0, 38.0, 31.0, 44.0, 38.0, 50.0, 38.0, 45.0, 39.0, 41.0, 33.0, 26.0, 26.0, 20.0, 25.0, 22.0, 29.0, 17.0, 11.0, 13.0, 14.0, 15.0, 9.0, 10.0, 6.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4091796875, -1.3652191162109375, -1.321258544921875, -1.2772979736328125, -1.23333740234375, -1.1893768310546875, -1.145416259765625, -1.1014556884765625, -1.0574951171875, -1.0135345458984375, -0.969573974609375, -0.9256134033203125, -0.88165283203125, -0.8376922607421875, -0.793731689453125, -0.7497711181640625, -0.705810546875, -0.6618499755859375, -0.617889404296875, -0.5739288330078125, -0.52996826171875, -0.4860076904296875, -0.442047119140625, -0.3980865478515625, -0.3541259765625, -0.3101654052734375, -0.266204833984375, -0.2222442626953125, -0.17828369140625, -0.1343231201171875, -0.090362548828125, -0.0464019775390625, -0.00244140625, 0.0415191650390625, 0.085479736328125, 0.1294403076171875, 0.17340087890625, 0.2173614501953125, 0.261322021484375, 0.3052825927734375, 0.3492431640625, 0.3932037353515625, 0.437164306640625, 0.4811248779296875, 0.52508544921875, 0.5690460205078125, 0.613006591796875, 0.6569671630859375, 0.700927734375, 0.7448883056640625, 0.788848876953125, 0.8328094482421875, 0.87677001953125, 0.9207305908203125, 0.964691162109375, 1.0086517333984375, 1.0526123046875, 1.0965728759765625, 1.140533447265625, 1.1844940185546875, 1.22845458984375, 1.2724151611328125, 1.316375732421875, 1.3603363037109375, 1.404296875]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 2.0, 8.0, 8.0, 14.0, 27.0, 37.0, 66.0, 90.0, 114.0, 190.0, 328.0, 568.0, 1032.0, 2589.0, 6920.0, 33401.0, 965267.0, 27078.0, 6115.0, 2263.0, 1016.0, 576.0, 314.0, 171.0, 115.0, 71.0, 58.0, 40.0, 19.0, 15.0, 5.0, 11.0, 6.0, 8.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.212890625, -0.20589828491210938, -0.19890594482421875, -0.19191360473632812, -0.1849212646484375, -0.17792892456054688, -0.17093658447265625, -0.16394424438476562, -0.156951904296875, -0.14995956420898438, -0.14296722412109375, -0.13597488403320312, -0.1289825439453125, -0.12199020385742188, -0.11499786376953125, -0.10800552368164062, -0.10101318359375, -0.09402084350585938, -0.08702850341796875, -0.08003616333007812, -0.0730438232421875, -0.06605148315429688, -0.05905914306640625, -0.052066802978515625, -0.045074462890625, -0.038082122802734375, -0.03108978271484375, -0.024097442626953125, -0.0171051025390625, -0.010112762451171875, -0.00312042236328125, 0.003871917724609375, 0.0108642578125, 0.017856597900390625, 0.02484893798828125, 0.031841278076171875, 0.0388336181640625, 0.045825958251953125, 0.05281829833984375, 0.059810638427734375, 0.066802978515625, 0.07379531860351562, 0.08078765869140625, 0.08777999877929688, 0.0947723388671875, 0.10176467895507812, 0.10875701904296875, 0.11574935913085938, 0.12274169921875, 0.12973403930664062, 0.13672637939453125, 0.14371871948242188, 0.1507110595703125, 0.15770339965820312, 0.16469573974609375, 0.17168807983398438, 0.178680419921875, 0.18567276000976562, 0.19266510009765625, 0.19965744018554688, 0.2066497802734375, 0.21364212036132812, 0.22063446044921875, 0.22762680053710938, 0.234619140625]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 11.0, 20.0, 25.0, 39.0, 32.0, 60.0, 73.0, 78.0, 86.0, 93.0, 81.0, 60.0, 79.0, 53.0, 37.0, 33.0, 30.0, 26.0, 15.0, 12.0, 11.0, 13.0, 1.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8770179748535156e-05, -5.686469376087189e-05, -5.495920777320862e-05, -5.305372178554535e-05, -5.114823579788208e-05, -4.924274981021881e-05, -4.733726382255554e-05, -4.543177783489227e-05, -4.3526291847229004e-05, -4.1620805859565735e-05, -3.9715319871902466e-05, -3.78098338842392e-05, -3.590434789657593e-05, -3.399886190891266e-05, -3.209337592124939e-05, -3.018788993358612e-05, -2.828240394592285e-05, -2.6376917958259583e-05, -2.4471431970596313e-05, -2.2565945982933044e-05, -2.0660459995269775e-05, -1.8754974007606506e-05, -1.6849488019943237e-05, -1.4944002032279968e-05, -1.30385160446167e-05, -1.113303005695343e-05, -9.227544069290161e-06, -7.322058081626892e-06, -5.416572093963623e-06, -3.511086106300354e-06, -1.605600118637085e-06, 2.998858690261841e-07, 2.205371856689453e-06, 4.110857844352722e-06, 6.016343832015991e-06, 7.92182981967926e-06, 9.82731580734253e-06, 1.1732801795005798e-05, 1.3638287782669067e-05, 1.5543773770332336e-05, 1.7449259757995605e-05, 1.9354745745658875e-05, 2.1260231733322144e-05, 2.3165717720985413e-05, 2.507120370864868e-05, 2.697668969631195e-05, 2.888217568397522e-05, 3.078766167163849e-05, 3.269314765930176e-05, 3.459863364696503e-05, 3.6504119634628296e-05, 3.8409605622291565e-05, 4.0315091609954834e-05, 4.22205775976181e-05, 4.412606358528137e-05, 4.603154957294464e-05, 4.793703556060791e-05, 4.984252154827118e-05, 5.174800753593445e-05, 5.365349352359772e-05, 5.5558979511260986e-05, 5.7464465498924255e-05, 5.9369951486587524e-05, 6.12754374742508e-05, 6.318092346191406e-05]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 1.0, 9.0, 7.0, 10.0, 8.0, 10.0, 13.0, 17.0, 24.0, 28.0, 33.0, 59.0, 67.0, 114.0, 200.0, 754.0, 6470.0, 126579.0, 870290.0, 40059.0, 2814.0, 451.0, 147.0, 106.0, 59.0, 39.0, 38.0, 29.0, 22.0, 17.0, 15.0, 15.0, 9.0, 10.0, 6.0, 2.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.26513671875, -0.2563934326171875, -0.247650146484375, -0.2389068603515625, -0.23016357421875, -0.2214202880859375, -0.212677001953125, -0.2039337158203125, -0.1951904296875, -0.1864471435546875, -0.177703857421875, -0.1689605712890625, -0.16021728515625, -0.1514739990234375, -0.142730712890625, -0.1339874267578125, -0.125244140625, -0.1165008544921875, -0.107757568359375, -0.0990142822265625, -0.09027099609375, -0.0815277099609375, -0.072784423828125, -0.0640411376953125, -0.0552978515625, -0.0465545654296875, -0.037811279296875, -0.0290679931640625, -0.02032470703125, -0.0115814208984375, -0.002838134765625, 0.0059051513671875, 0.0146484375, 0.0233917236328125, 0.032135009765625, 0.0408782958984375, 0.04962158203125, 0.0583648681640625, 0.067108154296875, 0.0758514404296875, 0.0845947265625, 0.0933380126953125, 0.102081298828125, 0.1108245849609375, 0.11956787109375, 0.1283111572265625, 0.137054443359375, 0.1457977294921875, 0.154541015625, 0.1632843017578125, 0.172027587890625, 0.1807708740234375, 0.18951416015625, 0.1982574462890625, 0.207000732421875, 0.2157440185546875, 0.2244873046875, 0.2332305908203125, 0.241973876953125, 0.2507171630859375, 0.25946044921875, 0.2682037353515625, 0.276947021484375, 0.2856903076171875, 0.29443359375]}, "gradients/decoder.roberta.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 5.0, 2.0, 3.0, 10.0, 6.0, 15.0, 10.0, 9.0, 27.0, 19.0, 31.0, 50.0, 71.0, 116.0, 137.0, 127.0, 111.0, 64.0, 38.0, 29.0, 23.0, 25.0, 11.0, 9.0, 7.0, 9.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.023773193359375, -0.023093461990356445, -0.02241373062133789, -0.021733999252319336, -0.02105426788330078, -0.020374536514282227, -0.019694805145263672, -0.019015073776245117, -0.018335342407226562, -0.017655611038208008, -0.016975879669189453, -0.0162961483001709, -0.015616416931152344, -0.014936685562133789, -0.014256954193115234, -0.01357722282409668, -0.012897491455078125, -0.01221776008605957, -0.011538028717041016, -0.010858297348022461, -0.010178565979003906, -0.009498834609985352, -0.008819103240966797, -0.008139371871948242, -0.0074596405029296875, -0.006779909133911133, -0.006100177764892578, -0.0054204463958740234, -0.004740715026855469, -0.004060983657836914, -0.0033812522888183594, -0.0027015209197998047, -0.00202178955078125, -0.0013420581817626953, -0.0006623268127441406, 1.7404556274414062e-05, 0.0006971359252929688, 0.0013768672943115234, 0.002056598663330078, 0.002736330032348633, 0.0034160614013671875, 0.004095792770385742, 0.004775524139404297, 0.0054552555084228516, 0.006134986877441406, 0.006814718246459961, 0.007494449615478516, 0.00817418098449707, 0.008853912353515625, 0.00953364372253418, 0.010213375091552734, 0.010893106460571289, 0.011572837829589844, 0.012252569198608398, 0.012932300567626953, 0.013612031936645508, 0.014291763305664062, 0.014971494674682617, 0.015651226043701172, 0.016330957412719727, 0.01701068878173828, 0.017690420150756836, 0.01837015151977539, 0.019049882888793945, 0.0197296142578125]}, "gradients/decoder.roberta.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 25.0, 47.0, 102.0, 137.0, 189.0, 198.0, 142.0, 84.0, 52.0, 17.0, 7.0, 5.0, 5.0], "bins": [-12.525643348693848, -12.301187515258789, -12.076732635498047, -11.852276802062988, -11.62782096862793, -11.403365135192871, -11.178910255432129, -10.95445442199707, -10.729998588562012, -10.505542755126953, -10.281087875366211, -10.056632041931152, -9.832176208496094, -9.607720375061035, -9.383265495300293, -9.158809661865234, -8.934354782104492, -8.709898948669434, -8.485444068908691, -8.260988235473633, -8.036532402038574, -7.812077045440674, -7.587621688842773, -7.363165855407715, -7.138710021972656, -6.914254665374756, -6.689798831939697, -6.465343475341797, -6.240887641906738, -6.016432285308838, -5.7919769287109375, -5.567521095275879, -5.34306526184082, -5.11860990524292, -4.894154071807861, -4.669698715209961, -4.445242881774902, -4.220787525177002, -3.9963319301605225, -3.771876335144043, -3.5474207401275635, -3.322965145111084, -3.0985095500946045, -2.874053955078125, -2.6495985984802246, -2.425142765045166, -2.2006874084472656, -1.9762318134307861, -1.7517762184143066, -1.5273206233978271, -1.3028650283813477, -1.0784095525741577, -0.8539539575576782, -0.6294983625411987, -0.4050428867340088, -0.1805872917175293, 0.043868303298950195, 0.2683238685131073, 0.4927794337272644, 0.7172349691390991, 0.9416905641555786, 1.166146159172058, 1.390601634979248, 1.6150572299957275, 1.839512825012207]}, "gradients/decoder.roberta.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 12.0, 8.0, 6.0, 10.0, 15.0, 10.0, 22.0, 19.0, 15.0, 22.0, 28.0, 28.0, 36.0, 24.0, 33.0, 45.0, 35.0, 34.0, 40.0, 37.0, 43.0, 34.0, 28.0, 39.0, 44.0, 34.0, 29.0, 32.0, 26.0, 28.0, 29.0, 17.0, 21.0, 25.0, 16.0, 10.0, 11.0, 9.0, 13.0, 4.0, 6.0, 7.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0], "bins": [-2.1925666332244873, -2.125096082687378, -2.0576252937316895, -1.9901546239852905, -1.9226839542388916, -1.8552134037017822, -1.7877427339553833, -1.7202720642089844, -1.6528013944625854, -1.5853307247161865, -1.5178600549697876, -1.4503893852233887, -1.3829188346862793, -1.3154480457305908, -1.2479774951934814, -1.1805068254470825, -1.1130361557006836, -1.0455654859542847, -0.9780948162078857, -0.9106242060661316, -0.8431535363197327, -0.7756828665733337, -0.7082122564315796, -0.6407415866851807, -0.5732709169387817, -0.5058002471923828, -0.4383296072483063, -0.37085896730422974, -0.3033882975578308, -0.23591762781143188, -0.16844698786735535, -0.10097634792327881, -0.03350567817687988, 0.03396497666835785, 0.10143563151359558, 0.1689062863588333, 0.23637694120407104, 0.30384761095046997, 0.3713182508945465, 0.43878889083862305, 0.506259560585022, 0.5737302303314209, 0.6412009000778198, 0.708671510219574, 0.7761421799659729, 0.8436128497123718, 0.911083459854126, 0.9785541296005249, 1.0460247993469238, 1.1134954690933228, 1.1809661388397217, 1.2484368085861206, 1.3159074783325195, 1.383378028869629, 1.4508486986160278, 1.5183193683624268, 1.5857900381088257, 1.6532607078552246, 1.7207313776016235, 1.7882020473480225, 1.8556725978851318, 1.9231433868408203, 1.9906139373779297, 2.058084487915039, 2.1255552768707275]}, "gradients/decoder.roberta.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 7.0, 16.0, 21.0, 22.0, 35.0, 53.0, 56.0, 102.0, 109.0, 186.0, 320.0, 482.0, 799.0, 1380.0, 2441.0, 4104.0, 7653.0, 14150.0, 27055.0, 54590.0, 119199.0, 288411.0, 291984.0, 121149.0, 54956.0, 27224.0, 14012.0, 7568.0, 4288.0, 2434.0, 1467.0, 824.0, 498.0, 310.0, 198.0, 127.0, 86.0, 67.0, 44.0, 34.0, 18.0, 16.0, 10.0, 13.0, 10.0, 4.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0], "bins": [-2.75390625, -2.67047119140625, -2.5870361328125, -2.50360107421875, -2.420166015625, -2.33673095703125, -2.2532958984375, -2.16986083984375, -2.08642578125, -2.00299072265625, -1.9195556640625, -1.83612060546875, -1.752685546875, -1.66925048828125, -1.5858154296875, -1.50238037109375, -1.4189453125, -1.33551025390625, -1.2520751953125, -1.16864013671875, -1.085205078125, -1.00177001953125, -0.9183349609375, -0.83489990234375, -0.75146484375, -0.66802978515625, -0.5845947265625, -0.50115966796875, -0.417724609375, -0.33428955078125, -0.2508544921875, -0.16741943359375, -0.083984375, -0.00054931640625, 0.0828857421875, 0.16632080078125, 0.249755859375, 0.33319091796875, 0.4166259765625, 0.50006103515625, 0.58349609375, 0.66693115234375, 0.7503662109375, 0.83380126953125, 0.917236328125, 1.00067138671875, 1.0841064453125, 1.16754150390625, 1.2509765625, 1.33441162109375, 1.4178466796875, 1.50128173828125, 1.584716796875, 1.66815185546875, 1.7515869140625, 1.83502197265625, 1.91845703125, 2.00189208984375, 2.0853271484375, 2.16876220703125, 2.252197265625, 2.33563232421875, 2.4190673828125, 2.50250244140625, 2.5859375]}, "gradients/decoder.roberta.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 8.0, 12.0, 4.0, 7.0, 15.0, 12.0, 19.0, 17.0, 17.0, 21.0, 23.0, 28.0, 34.0, 32.0, 27.0, 35.0, 36.0, 34.0, 48.0, 36.0, 38.0, 37.0, 36.0, 35.0, 34.0, 41.0, 33.0, 25.0, 24.0, 37.0, 30.0, 17.0, 24.0, 18.0, 24.0, 12.0, 11.0, 10.0, 10.0, 10.0, 3.0, 7.0, 7.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0], "bins": [-2.240234375, -2.17218017578125, -2.1041259765625, -2.03607177734375, -1.968017578125, -1.89996337890625, -1.8319091796875, -1.76385498046875, -1.69580078125, -1.62774658203125, -1.5596923828125, -1.49163818359375, -1.423583984375, -1.35552978515625, -1.2874755859375, -1.21942138671875, -1.1513671875, -1.08331298828125, -1.0152587890625, -0.94720458984375, -0.879150390625, -0.81109619140625, -0.7430419921875, -0.67498779296875, -0.60693359375, -0.53887939453125, -0.4708251953125, -0.40277099609375, -0.334716796875, -0.26666259765625, -0.1986083984375, -0.13055419921875, -0.0625, 0.00555419921875, 0.0736083984375, 0.14166259765625, 0.209716796875, 0.27777099609375, 0.3458251953125, 0.41387939453125, 0.48193359375, 0.54998779296875, 0.6180419921875, 0.68609619140625, 0.754150390625, 0.82220458984375, 0.8902587890625, 0.95831298828125, 1.0263671875, 1.09442138671875, 1.1624755859375, 1.23052978515625, 1.298583984375, 1.36663818359375, 1.4346923828125, 1.50274658203125, 1.57080078125, 1.63885498046875, 1.7069091796875, 1.77496337890625, 1.843017578125, 1.91107177734375, 1.9791259765625, 2.04718017578125, 2.115234375]}, "gradients/decoder.roberta.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 8.0, 8.0, 16.0, 32.0, 37.0, 40.0, 63.0, 57.0, 90.0, 118.0, 144.0, 214.0, 489.0, 1045322.0, 1097.0, 166.0, 135.0, 102.0, 108.0, 69.0, 57.0, 49.0, 47.0, 33.0, 10.0, 12.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.4375, -41.3271484375, -39.216796875, -37.1064453125, -34.99609375, -32.8857421875, -30.775390625, -28.6650390625, -26.5546875, -24.4443359375, -22.333984375, -20.2236328125, -18.11328125, -16.0029296875, -13.892578125, -11.7822265625, -9.671875, -7.5615234375, -5.451171875, -3.3408203125, -1.23046875, 0.8798828125, 2.990234375, 5.1005859375, 7.2109375, 9.3212890625, 11.431640625, 13.5419921875, 15.65234375, 17.7626953125, 19.873046875, 21.9833984375, 24.09375, 26.2041015625, 28.314453125, 30.4248046875, 32.53515625, 34.6455078125, 36.755859375, 38.8662109375, 40.9765625, 43.0869140625, 45.197265625, 47.3076171875, 49.41796875, 51.5283203125, 53.638671875, 55.7490234375, 57.859375, 59.9697265625, 62.080078125, 64.1904296875, 66.30078125, 68.4111328125, 70.521484375, 72.6318359375, 74.7421875, 76.8525390625, 78.962890625, 81.0732421875, 83.18359375, 85.2939453125, 87.404296875, 89.5146484375, 91.625]}, "gradients/decoder.roberta.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 14.0, 5.0, 15.0, 27.0, 27.0, 29.0, 23.0, 58.0, 51.0, 57.0, 55.0, 81.0, 82.0, 66.0, 81.0, 68.0, 53.0, 50.0, 41.0, 31.0, 17.0, 21.0, 22.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.65625, -4.549346923828125, -4.44244384765625, -4.335540771484375, -4.2286376953125, -4.121734619140625, -4.01483154296875, -3.907928466796875, -3.801025390625, -3.694122314453125, -3.58721923828125, -3.480316162109375, -3.3734130859375, -3.266510009765625, -3.15960693359375, -3.052703857421875, -2.94580078125, -2.838897705078125, -2.73199462890625, -2.625091552734375, -2.5181884765625, -2.411285400390625, -2.30438232421875, -2.197479248046875, -2.090576171875, -1.983673095703125, -1.87677001953125, -1.769866943359375, -1.6629638671875, -1.556060791015625, -1.44915771484375, -1.342254638671875, -1.2353515625, -1.128448486328125, -1.02154541015625, -0.914642333984375, -0.8077392578125, -0.700836181640625, -0.59393310546875, -0.487030029296875, -0.380126953125, -0.273223876953125, -0.16632080078125, -0.059417724609375, 0.0474853515625, 0.154388427734375, 0.26129150390625, 0.368194580078125, 0.47509765625, 0.582000732421875, 0.68890380859375, 0.795806884765625, 0.9027099609375, 1.009613037109375, 1.11651611328125, 1.223419189453125, 1.330322265625, 1.437225341796875, 1.54412841796875, 1.651031494140625, 1.7579345703125, 1.864837646484375, 1.97174072265625, 2.078643798828125, 2.185546875]}, "gradients/decoder.roberta.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 10.0, 7.0, 5.0, 17.0, 17.0, 61.0, 114.0, 265.0, 1182.0, 32675.0, 1005383.0, 7694.0, 780.0, 182.0, 76.0, 30.0, 17.0, 12.0, 9.0, 2.0, 1.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8828125, -7.559326171875, -7.23583984375, -6.912353515625, -6.5888671875, -6.265380859375, -5.94189453125, -5.618408203125, -5.294921875, -4.971435546875, -4.64794921875, -4.324462890625, -4.0009765625, -3.677490234375, -3.35400390625, -3.030517578125, -2.70703125, -2.383544921875, -2.06005859375, -1.736572265625, -1.4130859375, -1.089599609375, -0.76611328125, -0.442626953125, -0.119140625, 0.204345703125, 0.52783203125, 0.851318359375, 1.1748046875, 1.498291015625, 1.82177734375, 2.145263671875, 2.46875, 2.792236328125, 3.11572265625, 3.439208984375, 3.7626953125, 4.086181640625, 4.40966796875, 4.733154296875, 5.056640625, 5.380126953125, 5.70361328125, 6.027099609375, 6.3505859375, 6.674072265625, 6.99755859375, 7.321044921875, 7.64453125, 7.968017578125, 8.29150390625, 8.614990234375, 8.9384765625, 9.261962890625, 9.58544921875, 9.908935546875, 10.232421875, 10.555908203125, 10.87939453125, 11.202880859375, 11.5263671875, 11.849853515625, 12.17333984375, 12.496826171875, 12.8203125]}, "gradients/decoder.roberta.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 10.0, 12.0, 26.0, 23.0, 36.0, 45.0, 48.0, 100.0, 142.0, 204.0, 93.0, 75.0, 61.0, 41.0, 20.0, 19.0, 16.0, 13.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003151893615722656, -0.0003066994249820709, -0.0002982094883918762, -0.0002897195518016815, -0.0002812296152114868, -0.0002727396786212921, -0.0002642497420310974, -0.0002557598054409027, -0.000247269868850708, -0.0002387799322605133, -0.0002302899956703186, -0.0002218000590801239, -0.0002133101224899292, -0.0002048201858997345, -0.0001963302493095398, -0.0001878403127193451, -0.0001793503761291504, -0.0001708604395389557, -0.00016237050294876099, -0.00015388056635856628, -0.00014539062976837158, -0.00013690069317817688, -0.00012841075658798218, -0.00011992081999778748, -0.00011143088340759277, -0.00010294094681739807, -9.445101022720337e-05, -8.596107363700867e-05, -7.747113704681396e-05, -6.898120045661926e-05, -6.049126386642456e-05, -5.200132727622986e-05, -4.3511390686035156e-05, -3.5021454095840454e-05, -2.6531517505645752e-05, -1.804158091545105e-05, -9.551644325256348e-06, -1.0617077350616455e-06, 7.428228855133057e-06, 1.591816544532776e-05, 2.440810203552246e-05, 3.289803862571716e-05, 4.1387975215911865e-05, 4.987791180610657e-05, 5.836784839630127e-05, 6.685778498649597e-05, 7.534772157669067e-05, 8.383765816688538e-05, 9.232759475708008e-05, 0.00010081753134727478, 0.00010930746793746948, 0.00011779740452766418, 0.0001262873411178589, 0.0001347772777080536, 0.0001432672142982483, 0.000151757150888443, 0.0001602470874786377, 0.0001687370240688324, 0.0001772269606590271, 0.0001857168972492218, 0.0001942068338394165, 0.0002026967704296112, 0.0002111867070198059, 0.0002196766436100006, 0.0002281665802001953]}, "gradients/decoder.roberta.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 2.0, 5.0, 8.0, 9.0, 18.0, 51.0, 112.0, 392.0, 2444.0, 1018169.0, 26035.0, 941.0, 226.0, 69.0, 31.0, 16.0, 10.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.390625, -12.826904296875, -12.26318359375, -11.699462890625, -11.1357421875, -10.572021484375, -10.00830078125, -9.444580078125, -8.880859375, -8.317138671875, -7.75341796875, -7.189697265625, -6.6259765625, -6.062255859375, -5.49853515625, -4.934814453125, -4.37109375, -3.807373046875, -3.24365234375, -2.679931640625, -2.1162109375, -1.552490234375, -0.98876953125, -0.425048828125, 0.138671875, 0.702392578125, 1.26611328125, 1.829833984375, 2.3935546875, 2.957275390625, 3.52099609375, 4.084716796875, 4.6484375, 5.212158203125, 5.77587890625, 6.339599609375, 6.9033203125, 7.467041015625, 8.03076171875, 8.594482421875, 9.158203125, 9.721923828125, 10.28564453125, 10.849365234375, 11.4130859375, 11.976806640625, 12.54052734375, 13.104248046875, 13.66796875, 14.231689453125, 14.79541015625, 15.359130859375, 15.9228515625, 16.486572265625, 17.05029296875, 17.614013671875, 18.177734375, 18.741455078125, 19.30517578125, 19.868896484375, 20.4326171875, 20.996337890625, 21.56005859375, 22.123779296875, 22.6875]}, "gradients/decoder.roberta.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 9.0, 25.0, 38.0, 82.0, 172.0, 301.0, 168.0, 100.0, 47.0, 22.0, 15.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8818359375, -1.8386688232421875, -1.795501708984375, -1.7523345947265625, -1.70916748046875, -1.6660003662109375, -1.622833251953125, -1.5796661376953125, -1.5364990234375, -1.4933319091796875, -1.450164794921875, -1.4069976806640625, -1.36383056640625, -1.3206634521484375, -1.277496337890625, -1.2343292236328125, -1.191162109375, -1.1479949951171875, -1.104827880859375, -1.0616607666015625, -1.01849365234375, -0.9753265380859375, -0.932159423828125, -0.8889923095703125, -0.8458251953125, -0.8026580810546875, -0.759490966796875, -0.7163238525390625, -0.67315673828125, -0.6299896240234375, -0.586822509765625, -0.5436553955078125, -0.50048828125, -0.4573211669921875, -0.414154052734375, -0.3709869384765625, -0.32781982421875, -0.2846527099609375, -0.241485595703125, -0.1983184814453125, -0.1551513671875, -0.1119842529296875, -0.068817138671875, -0.0256500244140625, 0.01751708984375, 0.0606842041015625, 0.103851318359375, 0.1470184326171875, 0.190185546875, 0.2333526611328125, 0.276519775390625, 0.3196868896484375, 0.36285400390625, 0.4060211181640625, 0.449188232421875, 0.4923553466796875, 0.5355224609375, 0.5786895751953125, 0.621856689453125, 0.6650238037109375, 0.70819091796875, 0.7513580322265625, 0.794525146484375, 0.8376922607421875, 0.880859375]}, "gradients/decoder.roberta.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 12.0, 15.0, 29.0, 42.0, 58.0, 75.0, 105.0, 123.0, 111.0, 114.0, 98.0, 73.0, 61.0, 35.0, 22.0, 13.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1819047927856445, -4.028029441833496, -3.874154567718506, -3.7202794551849365, -3.566404342651367, -3.412529230117798, -3.2586541175842285, -3.104779005050659, -2.95090389251709, -2.7970287799835205, -2.643153667449951, -2.489278554916382, -2.3354034423828125, -2.181528329849243, -2.027653217315674, -1.8737781047821045, -1.7199029922485352, -1.5660278797149658, -1.4121527671813965, -1.2582776546478271, -1.1044025421142578, -0.9505274295806885, -0.7966523170471191, -0.6427772045135498, -0.48890209197998047, -0.33502697944641113, -0.1811518669128418, -0.02727675437927246, 0.12659835815429688, 0.2804734706878662, 0.43434858322143555, 0.5882236957550049, 0.742098331451416, 0.8959734439849854, 1.0498485565185547, 1.203723669052124, 1.3575987815856934, 1.5114738941192627, 1.665349006652832, 1.8192241191864014, 1.9730992317199707, 2.12697434425354, 2.2808494567871094, 2.4347245693206787, 2.588599681854248, 2.7424747943878174, 2.8963499069213867, 3.050225019454956, 3.2041001319885254, 3.3579752445220947, 3.511850357055664, 3.6657254695892334, 3.8196005821228027, 3.973475694656372, 4.127350807189941, 4.28122615814209, 4.43510103225708, 4.58897590637207, 4.742851257324219, 4.896726608276367, 5.050601482391357, 5.204476356506348, 5.358351707458496, 5.5122270584106445, 5.666101932525635]}, "gradients/decoder.roberta.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 5.0, 7.0, 18.0, 10.0, 12.0, 16.0, 21.0, 23.0, 28.0, 17.0, 29.0, 39.0, 35.0, 48.0, 46.0, 30.0, 50.0, 39.0, 45.0, 50.0, 30.0, 30.0, 36.0, 39.0, 35.0, 32.0, 25.0, 29.0, 22.0, 26.0, 21.0, 19.0, 16.0, 12.0, 9.0, 8.0, 10.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.10143780708313, -2.0136876106262207, -1.9259374141693115, -1.8381872177124023, -1.7504370212554932, -1.662686824798584, -1.5749365091323853, -1.487186312675476, -1.399436116218567, -1.3116859197616577, -1.2239357233047485, -1.1361854076385498, -1.0484352111816406, -0.9606850743293762, -0.8729348182678223, -0.7851846218109131, -0.6974344253540039, -0.6096842288970947, -0.5219340324401855, -0.4341837763786316, -0.3464335799217224, -0.25868338346481323, -0.17093312740325928, -0.0831829309463501, 0.004567265510559082, 0.09231747686862946, 0.18006768822669983, 0.2678179144859314, 0.3555681109428406, 0.44331830739974976, 0.5310685634613037, 0.6188187599182129, 0.7065691947937012, 0.7943193912506104, 0.8820695877075195, 0.9698198437690735, 1.057569980621338, 1.145320177078247, 1.2330704927444458, 1.320820689201355, 1.4085708856582642, 1.4963210821151733, 1.5840712785720825, 1.6718215942382812, 1.7595717906951904, 1.8473219871520996, 1.9350721836090088, 2.022822380065918, 2.110572576522827, 2.1983227729797363, 2.2860729694366455, 2.3738231658935547, 2.461573362350464, 2.549323558807373, 2.6370739936828613, 2.7248239517211914, 2.8125743865966797, 2.900324583053589, 2.988074779510498, 3.0758249759674072, 3.1635751724243164, 3.2513253688812256, 3.3390755653381348, 3.426826000213623, 3.514575958251953]}, "gradients/decoder.roberta.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 1.0, 4.0, 6.0, 6.0, 13.0, 8.0, 19.0, 17.0, 17.0, 43.0, 43.0, 50.0, 65.0, 94.0, 113.0, 226.0, 447.0, 1152.0, 3745.0, 18436.0, 207679.0, 3817086.0, 126101.0, 13754.0, 3094.0, 997.0, 388.0, 192.0, 114.0, 84.0, 74.0, 58.0, 24.0, 24.0, 20.0, 19.0, 16.0, 12.0, 10.0, 6.0, 5.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-8.9765625, -8.71575927734375, -8.4549560546875, -8.19415283203125, -7.933349609375, -7.67254638671875, -7.4117431640625, -7.15093994140625, -6.89013671875, -6.62933349609375, -6.3685302734375, -6.10772705078125, -5.846923828125, -5.58612060546875, -5.3253173828125, -5.06451416015625, -4.8037109375, -4.54290771484375, -4.2821044921875, -4.02130126953125, -3.760498046875, -3.49969482421875, -3.2388916015625, -2.97808837890625, -2.71728515625, -2.45648193359375, -2.1956787109375, -1.93487548828125, -1.674072265625, -1.41326904296875, -1.1524658203125, -0.89166259765625, -0.630859375, -0.37005615234375, -0.1092529296875, 0.15155029296875, 0.412353515625, 0.67315673828125, 0.9339599609375, 1.19476318359375, 1.45556640625, 1.71636962890625, 1.9771728515625, 2.23797607421875, 2.498779296875, 2.75958251953125, 3.0203857421875, 3.28118896484375, 3.5419921875, 3.80279541015625, 4.0635986328125, 4.32440185546875, 4.585205078125, 4.84600830078125, 5.1068115234375, 5.36761474609375, 5.62841796875, 5.88922119140625, 6.1500244140625, 6.41082763671875, 6.671630859375, 6.93243408203125, 7.1932373046875, 7.45404052734375, 7.71484375]}, "gradients/decoder.roberta.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 10.0, 11.0, 10.0, 12.0, 10.0, 9.0, 17.0, 17.0, 13.0, 26.0, 26.0, 30.0, 23.0, 46.0, 31.0, 45.0, 42.0, 44.0, 41.0, 33.0, 49.0, 35.0, 32.0, 35.0, 34.0, 28.0, 44.0, 29.0, 41.0, 23.0, 22.0, 26.0, 18.0, 17.0, 16.0, 11.0, 13.0, 9.0, 9.0, 7.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7734375, -1.7147216796875, -1.656005859375, -1.5972900390625, -1.53857421875, -1.4798583984375, -1.421142578125, -1.3624267578125, -1.3037109375, -1.2449951171875, -1.186279296875, -1.1275634765625, -1.06884765625, -1.0101318359375, -0.951416015625, -0.8927001953125, -0.833984375, -0.7752685546875, -0.716552734375, -0.6578369140625, -0.59912109375, -0.5404052734375, -0.481689453125, -0.4229736328125, -0.3642578125, -0.3055419921875, -0.246826171875, -0.1881103515625, -0.12939453125, -0.0706787109375, -0.011962890625, 0.0467529296875, 0.10546875, 0.1641845703125, 0.222900390625, 0.2816162109375, 0.34033203125, 0.3990478515625, 0.457763671875, 0.5164794921875, 0.5751953125, 0.6339111328125, 0.692626953125, 0.7513427734375, 0.81005859375, 0.8687744140625, 0.927490234375, 0.9862060546875, 1.044921875, 1.1036376953125, 1.162353515625, 1.2210693359375, 1.27978515625, 1.3385009765625, 1.397216796875, 1.4559326171875, 1.5146484375, 1.5733642578125, 1.632080078125, 1.6907958984375, 1.74951171875, 1.8082275390625, 1.866943359375, 1.9256591796875, 1.984375]}, "gradients/decoder.roberta.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 8.0, 15.0, 28.0, 42.0, 61.0, 108.0, 252.0, 818.0, 7495.0, 4037864.0, 143977.0, 2658.0, 503.0, 186.0, 93.0, 52.0, 29.0, 21.0, 23.0, 12.0, 9.0, 5.0, 7.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.0, -23.220947265625, -22.44189453125, -21.662841796875, -20.8837890625, -20.104736328125, -19.32568359375, -18.546630859375, -17.767578125, -16.988525390625, -16.20947265625, -15.430419921875, -14.6513671875, -13.872314453125, -13.09326171875, -12.314208984375, -11.53515625, -10.756103515625, -9.97705078125, -9.197998046875, -8.4189453125, -7.639892578125, -6.86083984375, -6.081787109375, -5.302734375, -4.523681640625, -3.74462890625, -2.965576171875, -2.1865234375, -1.407470703125, -0.62841796875, 0.150634765625, 0.9296875, 1.708740234375, 2.48779296875, 3.266845703125, 4.0458984375, 4.824951171875, 5.60400390625, 6.383056640625, 7.162109375, 7.941162109375, 8.72021484375, 9.499267578125, 10.2783203125, 11.057373046875, 11.83642578125, 12.615478515625, 13.39453125, 14.173583984375, 14.95263671875, 15.731689453125, 16.5107421875, 17.289794921875, 18.06884765625, 18.847900390625, 19.626953125, 20.406005859375, 21.18505859375, 21.964111328125, 22.7431640625, 23.522216796875, 24.30126953125, 25.080322265625, 25.859375]}, "gradients/decoder.roberta.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 5.0, 4.0, 5.0, 7.0, 14.0, 18.0, 22.0, 24.0, 68.0, 95.0, 165.0, 370.0, 776.0, 1706.0, 340.0, 174.0, 98.0, 65.0, 38.0, 33.0, 13.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.966796875, -1.921173095703125, -1.87554931640625, -1.829925537109375, -1.7843017578125, -1.738677978515625, -1.69305419921875, -1.647430419921875, -1.601806640625, -1.556182861328125, -1.51055908203125, -1.464935302734375, -1.4193115234375, -1.373687744140625, -1.32806396484375, -1.282440185546875, -1.23681640625, -1.191192626953125, -1.14556884765625, -1.099945068359375, -1.0543212890625, -1.008697509765625, -0.96307373046875, -0.917449951171875, -0.871826171875, -0.826202392578125, -0.78057861328125, -0.734954833984375, -0.6893310546875, -0.643707275390625, -0.59808349609375, -0.552459716796875, -0.5068359375, -0.461212158203125, -0.41558837890625, -0.369964599609375, -0.3243408203125, -0.278717041015625, -0.23309326171875, -0.187469482421875, -0.141845703125, -0.096221923828125, -0.05059814453125, -0.004974365234375, 0.0406494140625, 0.086273193359375, 0.13189697265625, 0.177520751953125, 0.22314453125, 0.268768310546875, 0.31439208984375, 0.360015869140625, 0.4056396484375, 0.451263427734375, 0.49688720703125, 0.542510986328125, 0.588134765625, 0.633758544921875, 0.67938232421875, 0.725006103515625, 0.7706298828125, 0.816253662109375, 0.86187744140625, 0.907501220703125, 0.953125]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 3.0, 9.0, 13.0, 8.0, 13.0, 31.0, 19.0, 20.0, 40.0, 45.0, 42.0, 56.0, 67.0, 64.0, 69.0, 60.0, 78.0, 54.0, 45.0, 53.0, 31.0, 41.0, 28.0, 23.0, 22.0, 15.0, 12.0, 8.0, 12.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-2.9589781761169434, -2.8880813121795654, -2.8171842098236084, -2.7462873458862305, -2.6753904819488525, -2.6044936180114746, -2.5335965156555176, -2.4626996517181396, -2.3918027877807617, -2.320905923843384, -2.2500088214874268, -2.179111957550049, -2.108215093612671, -2.037318229675293, -1.966421127319336, -1.895524263381958, -1.824627161026001, -1.7537301778793335, -1.6828333139419556, -1.611936330795288, -1.5410394668579102, -1.4701424837112427, -1.3992455005645752, -1.3283486366271973, -1.2574516534805298, -1.1865546703338623, -1.1156578063964844, -1.044760823249817, -0.9738638997077942, -0.9029669761657715, -0.832069993019104, -0.7611730694770813, -0.690276026725769, -0.6193791031837463, -0.5484821796417236, -0.47758519649505615, -0.40668827295303345, -0.33579134941101074, -0.26489439606666565, -0.19399744272232056, -0.12310051918029785, -0.05220358073711395, 0.018693357706069946, 0.08959029614925385, 0.16048723459243774, 0.23138415813446045, 0.30228111147880554, 0.37317806482315063, 0.44407498836517334, 0.514971911907196, 0.5858688354492188, 0.6567658185958862, 0.7276627421379089, 0.7985596656799316, 0.8694566488265991, 0.9403535723686218, 1.0112504959106445, 1.082147479057312, 1.15304434299469, 1.2239413261413574, 1.2948381900787354, 1.3657351732254028, 1.4366321563720703, 1.5075290203094482, 1.5784260034561157]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 7.0, 7.0, 9.0, 16.0, 19.0, 16.0, 20.0, 18.0, 22.0, 32.0, 35.0, 39.0, 39.0, 42.0, 41.0, 38.0, 43.0, 36.0, 59.0, 42.0, 41.0, 49.0, 31.0, 41.0, 38.0, 25.0, 36.0, 31.0, 18.0, 26.0, 14.0, 12.0, 13.0, 8.0, 12.0, 4.0, 2.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.122023105621338, -2.04569149017334, -1.9693598747253418, -1.8930282592773438, -1.8166966438293457, -1.7403650283813477, -1.6640335321426392, -1.5877019166946411, -1.511370301246643, -1.435038685798645, -1.358707070350647, -1.282375454902649, -1.2060439586639404, -1.1297123432159424, -1.0533807277679443, -0.9770491123199463, -0.9007174968719482, -0.8243858814239502, -0.7480542659759521, -0.6717227101325989, -0.5953910946846008, -0.5190594792366028, -0.4427278935909271, -0.36639630794525146, -0.2900646924972534, -0.21373309195041656, -0.1374014914035797, -0.06106989085674286, 0.015261709690093994, 0.09159332513809204, 0.1679249107837677, 0.24425649642944336, 0.3205881118774414, 0.39691972732543945, 0.4732513129711151, 0.5495828986167908, 0.6259145140647888, 0.7022461295127869, 0.7785776853561401, 0.8549093008041382, 0.9312409162521362, 1.0075725317001343, 1.0839041471481323, 1.1602357625961304, 1.2365672588348389, 1.312898874282837, 1.389230489730835, 1.465562105178833, 1.541893720626831, 1.618225336074829, 1.6945569515228271, 1.7708885669708252, 1.8472201824188232, 1.9235517978668213, 1.9998832941055298, 2.0762147903442383, 2.1525464057922363, 2.2288780212402344, 2.3052096366882324, 2.3815412521362305, 2.4578728675842285, 2.5342044830322266, 2.6105360984802246, 2.6868677139282227, 2.7631993293762207]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 8.0, 4.0, 3.0, 4.0, 13.0, 18.0, 16.0, 21.0, 39.0, 51.0, 86.0, 95.0, 147.0, 192.0, 301.0, 426.0, 525.0, 851.0, 1281.0, 1808.0, 2634.0, 4038.0, 5656.0, 9087.0, 13762.0, 21622.0, 35059.0, 60170.0, 104923.0, 174847.0, 217439.0, 159533.0, 92383.0, 52649.0, 31712.0, 19478.0, 12682.0, 8035.0, 5497.0, 3597.0, 2398.0, 1646.0, 1159.0, 809.0, 596.0, 375.0, 260.0, 184.0, 133.0, 92.0, 65.0, 54.0, 30.0, 22.0, 20.0, 12.0, 8.0, 7.0, 7.0, 2.0, 1.0], "bins": [-0.3662109375, -0.3552436828613281, -0.34427642822265625, -0.3333091735839844, -0.3223419189453125, -0.3113746643066406, -0.30040740966796875, -0.2894401550292969, -0.278472900390625, -0.2675056457519531, -0.25653839111328125, -0.24557113647460938, -0.2346038818359375, -0.22363662719726562, -0.21266937255859375, -0.20170211791992188, -0.19073486328125, -0.17976760864257812, -0.16880035400390625, -0.15783309936523438, -0.1468658447265625, -0.13589859008789062, -0.12493133544921875, -0.11396408081054688, -0.102996826171875, -0.09202957153320312, -0.08106231689453125, -0.07009506225585938, -0.0591278076171875, -0.048160552978515625, -0.03719329833984375, -0.026226043701171875, -0.0152587890625, -0.004291534423828125, 0.00667572021484375, 0.017642974853515625, 0.0286102294921875, 0.039577484130859375, 0.05054473876953125, 0.061511993408203125, 0.072479248046875, 0.08344650268554688, 0.09441375732421875, 0.10538101196289062, 0.1163482666015625, 0.12731552124023438, 0.13828277587890625, 0.14925003051757812, 0.16021728515625, 0.17118453979492188, 0.18215179443359375, 0.19311904907226562, 0.2040863037109375, 0.21505355834960938, 0.22602081298828125, 0.23698806762695312, 0.247955322265625, 0.2589225769042969, 0.26988983154296875, 0.2808570861816406, 0.2918243408203125, 0.3027915954589844, 0.31375885009765625, 0.3247261047363281, 0.335693359375]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 8.0, 6.0, 7.0, 10.0, 13.0, 16.0, 19.0, 19.0, 22.0, 20.0, 27.0, 37.0, 38.0, 40.0, 43.0, 42.0, 31.0, 49.0, 35.0, 59.0, 37.0, 40.0, 45.0, 42.0, 34.0, 40.0, 24.0, 36.0, 37.0, 17.0, 28.0, 15.0, 13.0, 11.0, 10.0, 11.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.98724365234375, -1.9139404296875, -1.84063720703125, -1.767333984375, -1.69403076171875, -1.6207275390625, -1.54742431640625, -1.47412109375, -1.40081787109375, -1.3275146484375, -1.25421142578125, -1.180908203125, -1.10760498046875, -1.0343017578125, -0.96099853515625, -0.8876953125, -0.81439208984375, -0.7410888671875, -0.66778564453125, -0.594482421875, -0.52117919921875, -0.4478759765625, -0.37457275390625, -0.30126953125, -0.22796630859375, -0.1546630859375, -0.08135986328125, -0.008056640625, 0.06524658203125, 0.1385498046875, 0.21185302734375, 0.28515625, 0.35845947265625, 0.4317626953125, 0.50506591796875, 0.578369140625, 0.65167236328125, 0.7249755859375, 0.79827880859375, 0.87158203125, 0.94488525390625, 1.0181884765625, 1.09149169921875, 1.164794921875, 1.23809814453125, 1.3114013671875, 1.38470458984375, 1.4580078125, 1.53131103515625, 1.6046142578125, 1.67791748046875, 1.751220703125, 1.82452392578125, 1.8978271484375, 1.97113037109375, 2.04443359375, 2.11773681640625, 2.1910400390625, 2.26434326171875, 2.337646484375, 2.41094970703125, 2.4842529296875, 2.55755615234375, 2.630859375]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 4.0, 5.0, 10.0, 9.0, 26.0, 14.0, 26.0, 23.0, 44.0, 48.0, 71.0, 101.0, 150.0, 179.0, 247.0, 356.0, 528.0, 844.0, 1363.0, 2675.0, 6006.0, 16829.0, 70540.0, 903596.0, 27613.0, 8814.0, 3549.0, 1798.0, 980.0, 628.0, 410.0, 258.0, 214.0, 139.0, 119.0, 76.0, 58.0, 50.0, 31.0, 25.0, 15.0, 19.0, 20.0, 16.0, 4.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.2705078125, -1.231048583984375, -1.19158935546875, -1.152130126953125, -1.1126708984375, -1.073211669921875, -1.03375244140625, -0.994293212890625, -0.954833984375, -0.915374755859375, -0.87591552734375, -0.836456298828125, -0.7969970703125, -0.757537841796875, -0.71807861328125, -0.678619384765625, -0.63916015625, -0.599700927734375, -0.56024169921875, -0.520782470703125, -0.4813232421875, -0.441864013671875, -0.40240478515625, -0.362945556640625, -0.323486328125, -0.284027099609375, -0.24456787109375, -0.205108642578125, -0.1656494140625, -0.126190185546875, -0.08673095703125, -0.047271728515625, -0.0078125, 0.031646728515625, 0.07110595703125, 0.110565185546875, 0.1500244140625, 0.189483642578125, 0.22894287109375, 0.268402099609375, 0.307861328125, 0.347320556640625, 0.38677978515625, 0.426239013671875, 0.4656982421875, 0.505157470703125, 0.54461669921875, 0.584075927734375, 0.62353515625, 0.662994384765625, 0.70245361328125, 0.741912841796875, 0.7813720703125, 0.820831298828125, 0.86029052734375, 0.899749755859375, 0.939208984375, 0.978668212890625, 1.01812744140625, 1.057586669921875, 1.0970458984375, 1.136505126953125, 1.17596435546875, 1.215423583984375, 1.2548828125]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 7.0, 4.0, 3.0, 6.0, 10.0, 7.0, 10.0, 12.0, 8.0, 17.0, 17.0, 21.0, 18.0, 20.0, 21.0, 24.0, 34.0, 32.0, 33.0, 33.0, 40.0, 42.0, 32.0, 35.0, 40.0, 34.0, 44.0, 30.0, 36.0, 30.0, 33.0, 25.0, 20.0, 31.0, 25.0, 18.0, 22.0, 23.0, 20.0, 9.0, 15.0, 13.0, 8.0, 6.0, 10.0, 6.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.2001953125, -1.16217041015625, -1.1241455078125, -1.08612060546875, -1.048095703125, -1.01007080078125, -0.9720458984375, -0.93402099609375, -0.89599609375, -0.85797119140625, -0.8199462890625, -0.78192138671875, -0.743896484375, -0.70587158203125, -0.6678466796875, -0.62982177734375, -0.591796875, -0.55377197265625, -0.5157470703125, -0.47772216796875, -0.439697265625, -0.40167236328125, -0.3636474609375, -0.32562255859375, -0.28759765625, -0.24957275390625, -0.2115478515625, -0.17352294921875, -0.135498046875, -0.09747314453125, -0.0594482421875, -0.02142333984375, 0.0166015625, 0.05462646484375, 0.0926513671875, 0.13067626953125, 0.168701171875, 0.20672607421875, 0.2447509765625, 0.28277587890625, 0.32080078125, 0.35882568359375, 0.3968505859375, 0.43487548828125, 0.472900390625, 0.51092529296875, 0.5489501953125, 0.58697509765625, 0.625, 0.66302490234375, 0.7010498046875, 0.73907470703125, 0.777099609375, 0.81512451171875, 0.8531494140625, 0.89117431640625, 0.92919921875, 0.96722412109375, 1.0052490234375, 1.04327392578125, 1.081298828125, 1.11932373046875, 1.1573486328125, 1.19537353515625, 1.2333984375]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 4.0, 4.0, 9.0, 12.0, 21.0, 21.0, 26.0, 41.0, 50.0, 61.0, 97.0, 116.0, 156.0, 281.0, 397.0, 592.0, 1030.0, 1702.0, 3355.0, 7838.0, 24083.0, 922330.0, 60781.0, 14082.0, 5294.0, 2500.0, 1274.0, 729.0, 505.0, 318.0, 247.0, 155.0, 122.0, 94.0, 61.0, 41.0, 37.0, 15.0, 15.0, 12.0, 13.0, 7.0, 10.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12164306640625, -0.11755847930908203, -0.11347389221191406, -0.1093893051147461, -0.10530471801757812, -0.10122013092041016, -0.09713554382324219, -0.09305095672607422, -0.08896636962890625, -0.08488178253173828, -0.08079719543457031, -0.07671260833740234, -0.07262802124023438, -0.0685434341430664, -0.06445884704589844, -0.06037425994873047, -0.0562896728515625, -0.05220508575439453, -0.04812049865722656, -0.044035911560058594, -0.039951324462890625, -0.035866737365722656, -0.03178215026855469, -0.02769756317138672, -0.02361297607421875, -0.01952838897705078, -0.015443801879882812, -0.011359214782714844, -0.007274627685546875, -0.0031900405883789062, 0.0008945465087890625, 0.004979133605957031, 0.009063720703125, 0.013148307800292969, 0.017232894897460938, 0.021317481994628906, 0.025402069091796875, 0.029486656188964844, 0.03357124328613281, 0.03765583038330078, 0.04174041748046875, 0.04582500457763672, 0.04990959167480469, 0.053994178771972656, 0.058078765869140625, 0.062163352966308594, 0.06624794006347656, 0.07033252716064453, 0.0744171142578125, 0.07850170135498047, 0.08258628845214844, 0.0866708755493164, 0.09075546264648438, 0.09484004974365234, 0.09892463684082031, 0.10300922393798828, 0.10709381103515625, 0.11117839813232422, 0.11526298522949219, 0.11934757232666016, 0.12343215942382812, 0.1275167465209961, 0.13160133361816406, 0.13568592071533203, 0.1397705078125]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 6.0, 17.0, 13.0, 15.0, 23.0, 30.0, 24.0, 31.0, 31.0, 22.0, 44.0, 47.0, 48.0, 44.0, 47.0, 48.0, 42.0, 46.0, 50.0, 39.0, 33.0, 33.0, 33.0, 31.0, 25.0, 27.0, 23.0, 21.0, 19.0, 7.0, 15.0, 15.0, 4.0, 7.0, 5.0, 3.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.2067298889160156e-05, -3.099162131547928e-05, -2.99159437417984e-05, -2.8840266168117523e-05, -2.7764588594436646e-05, -2.6688911020755768e-05, -2.561323344707489e-05, -2.4537555873394012e-05, -2.3461878299713135e-05, -2.2386200726032257e-05, -2.131052315235138e-05, -2.0234845578670502e-05, -1.9159168004989624e-05, -1.8083490431308746e-05, -1.700781285762787e-05, -1.593213528394699e-05, -1.4856457710266113e-05, -1.3780780136585236e-05, -1.2705102562904358e-05, -1.162942498922348e-05, -1.0553747415542603e-05, -9.478069841861725e-06, -8.402392268180847e-06, -7.3267146944999695e-06, -6.251037120819092e-06, -5.175359547138214e-06, -4.0996819734573364e-06, -3.0240043997764587e-06, -1.948326826095581e-06, -8.726492524147034e-07, 2.0302832126617432e-07, 1.278705894947052e-06, 2.3543834686279297e-06, 3.4300610423088074e-06, 4.505738615989685e-06, 5.581416189670563e-06, 6.6570937633514404e-06, 7.732771337032318e-06, 8.808448910713196e-06, 9.884126484394073e-06, 1.0959804058074951e-05, 1.2035481631755829e-05, 1.3111159205436707e-05, 1.4186836779117584e-05, 1.5262514352798462e-05, 1.633819192647934e-05, 1.7413869500160217e-05, 1.8489547073841095e-05, 1.9565224647521973e-05, 2.064090222120285e-05, 2.1716579794883728e-05, 2.2792257368564606e-05, 2.3867934942245483e-05, 2.494361251592636e-05, 2.601929008960724e-05, 2.7094967663288116e-05, 2.8170645236968994e-05, 2.9246322810649872e-05, 3.032200038433075e-05, 3.139767795801163e-05, 3.2473355531692505e-05, 3.354903310537338e-05, 3.462471067905426e-05, 3.570038825273514e-05, 3.6776065826416016e-05]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 1.0, 7.0, 5.0, 12.0, 17.0, 27.0, 25.0, 39.0, 46.0, 77.0, 102.0, 168.0, 704.0, 14949.0, 907088.0, 121777.0, 2772.0, 290.0, 123.0, 98.0, 67.0, 42.0, 30.0, 21.0, 12.0, 10.0, 6.0, 6.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.343505859375, -0.3333282470703125, -0.323150634765625, -0.3129730224609375, -0.30279541015625, -0.2926177978515625, -0.282440185546875, -0.2722625732421875, -0.2620849609375, -0.2519073486328125, -0.241729736328125, -0.2315521240234375, -0.22137451171875, -0.2111968994140625, -0.201019287109375, -0.1908416748046875, -0.1806640625, -0.1704864501953125, -0.160308837890625, -0.1501312255859375, -0.13995361328125, -0.1297760009765625, -0.119598388671875, -0.1094207763671875, -0.0992431640625, -0.0890655517578125, -0.078887939453125, -0.0687103271484375, -0.05853271484375, -0.0483551025390625, -0.038177490234375, -0.0279998779296875, -0.017822265625, -0.0076446533203125, 0.002532958984375, 0.0127105712890625, 0.02288818359375, 0.0330657958984375, 0.043243408203125, 0.0534210205078125, 0.0635986328125, 0.0737762451171875, 0.083953857421875, 0.0941314697265625, 0.10430908203125, 0.1144866943359375, 0.124664306640625, 0.1348419189453125, 0.14501953125, 0.1551971435546875, 0.165374755859375, 0.1755523681640625, 0.18572998046875, 0.1959075927734375, 0.206085205078125, 0.2162628173828125, 0.2264404296875, 0.2366180419921875, 0.246795654296875, 0.2569732666015625, 0.26715087890625, 0.2773284912109375, 0.287506103515625, 0.2976837158203125, 0.307861328125]}, "gradients/decoder.roberta.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 7.0, 3.0, 6.0, 10.0, 17.0, 20.0, 45.0, 61.0, 120.0, 146.0, 179.0, 126.0, 84.0, 43.0, 31.0, 20.0, 11.0, 5.0, 9.0, 6.0, 7.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.016357421875, -0.015817880630493164, -0.015278339385986328, -0.014738798141479492, -0.014199256896972656, -0.01365971565246582, -0.013120174407958984, -0.012580633163452148, -0.012041091918945312, -0.011501550674438477, -0.01096200942993164, -0.010422468185424805, -0.009882926940917969, -0.009343385696411133, -0.008803844451904297, -0.008264303207397461, -0.007724761962890625, -0.007185220718383789, -0.006645679473876953, -0.006106138229370117, -0.005566596984863281, -0.005027055740356445, -0.004487514495849609, -0.0039479732513427734, -0.0034084320068359375, -0.0028688907623291016, -0.0023293495178222656, -0.0017898082733154297, -0.0012502670288085938, -0.0007107257843017578, -0.00017118453979492188, 0.00036835670471191406, 0.00090789794921875, 0.001447439193725586, 0.001986980438232422, 0.002526521682739258, 0.0030660629272460938, 0.0036056041717529297, 0.004145145416259766, 0.0046846866607666016, 0.0052242279052734375, 0.0057637691497802734, 0.006303310394287109, 0.006842851638793945, 0.007382392883300781, 0.007921934127807617, 0.008461475372314453, 0.009001016616821289, 0.009540557861328125, 0.010080099105834961, 0.010619640350341797, 0.011159181594848633, 0.011698722839355469, 0.012238264083862305, 0.01277780532836914, 0.013317346572875977, 0.013856887817382812, 0.014396429061889648, 0.014935970306396484, 0.01547551155090332, 0.016015052795410156, 0.016554594039916992, 0.017094135284423828, 0.017633676528930664, 0.0181732177734375]}, "gradients/decoder.roberta.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 11.0, 37.0, 80.0, 145.0, 199.0, 217.0, 148.0, 109.0, 41.0, 17.0, 5.0, 4.0], "bins": [-13.263062477111816, -13.030648231506348, -12.798233032226562, -12.565818786621094, -12.333403587341309, -12.10098934173584, -11.868574142456055, -11.636159896850586, -11.4037446975708, -11.171330451965332, -10.938915252685547, -10.706501007080078, -10.474085807800293, -10.241671562194824, -10.009256362915039, -9.77684211730957, -9.544427871704102, -9.312013626098633, -9.079598426818848, -8.847184181213379, -8.614768981933594, -8.382354736328125, -8.14993953704834, -7.917525291442871, -7.685110092163086, -7.452695369720459, -7.220280647277832, -6.987865924835205, -6.755451202392578, -6.523036479949951, -6.290621757507324, -6.0582075119018555, -5.82579231262207, -5.593377590179443, -5.360962867736816, -5.1285481452941895, -4.8961334228515625, -4.6637187004089355, -4.431303977966309, -4.19888973236084, -3.9664745330810547, -3.7340598106384277, -3.501645088195801, -3.269230365753174, -3.036815643310547, -2.80440092086792, -2.571986436843872, -2.339571714401245, -2.1071572303771973, -1.8747425079345703, -1.6423277854919434, -1.409913182258606, -1.177498459815979, -0.945083737373352, -0.7126691341400146, -0.4802544116973877, -0.2478395700454712, -0.015424877405166626, 0.21698981523513794, 0.4494044780731201, 0.6818192005157471, 0.914233922958374, 1.1466485261917114, 1.3790632486343384, 1.6114779710769653]}, "gradients/decoder.roberta.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 6.0, 8.0, 9.0, 13.0, 18.0, 17.0, 20.0, 21.0, 22.0, 28.0, 35.0, 40.0, 38.0, 43.0, 43.0, 32.0, 48.0, 36.0, 56.0, 41.0, 40.0, 47.0, 37.0, 35.0, 40.0, 25.0, 36.0, 35.0, 16.0, 28.0, 15.0, 13.0, 11.0, 10.0, 11.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0557775497436523, -1.9825454950332642, -1.909313440322876, -1.8360812664031982, -1.76284921169281, -1.6896171569824219, -1.6163851022720337, -1.5431530475616455, -1.4699208736419678, -1.3966888189315796, -1.3234567642211914, -1.2502245903015137, -1.1769925355911255, -1.1037604808807373, -1.0305284261703491, -0.9572963118553162, -0.8840643167495728, -0.8108322620391846, -0.7376001477241516, -0.6643680930137634, -0.5911359786987305, -0.5179039239883423, -0.4446718692779541, -0.37143975496292114, -0.29820770025253296, -0.2249756157398224, -0.151743546128273, -0.07851147651672363, -0.0052793920040130615, 0.06795269250869751, 0.1411847472190857, 0.21441686153411865, 0.28764891624450684, 0.3608810007572174, 0.434113085269928, 0.5073451399803162, 0.5805772542953491, 0.6538093090057373, 0.7270413637161255, 0.8002734780311584, 0.8735055327415466, 0.9467375874519348, 1.0199697017669678, 1.093201756477356, 1.1664338111877441, 1.2396659851074219, 1.3128979206085205, 1.3861300945281982, 1.4593621492385864, 1.5325942039489746, 1.6058262586593628, 1.679058313369751, 1.7522904872894287, 1.825522541999817, 1.898754596710205, 1.9719867706298828, 2.0452187061309814, 2.118450880050659, 2.191682815551758, 2.2649149894714355, 2.338146924972534, 2.411379098892212, 2.4846110343933105, 2.5578432083129883, 2.631075382232666]}, "gradients/decoder.roberta.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 15.0, 19.0, 24.0, 20.0, 24.0, 35.0, 51.0, 70.0, 155.0, 216.0, 397.0, 641.0, 1112.0, 1883.0, 3248.0, 5563.0, 9488.0, 18127.0, 47991.0, 275431.0, 559098.0, 74721.0, 22909.0, 11281.0, 6681.0, 3848.0, 2269.0, 1309.0, 744.0, 443.0, 269.0, 154.0, 94.0, 66.0, 44.0, 28.0, 22.0, 19.0, 16.0, 7.0, 3.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8203125, -2.72357177734375, -2.6268310546875, -2.53009033203125, -2.433349609375, -2.33660888671875, -2.2398681640625, -2.14312744140625, -2.04638671875, -1.94964599609375, -1.8529052734375, -1.75616455078125, -1.659423828125, -1.56268310546875, -1.4659423828125, -1.36920166015625, -1.2724609375, -1.17572021484375, -1.0789794921875, -0.98223876953125, -0.885498046875, -0.78875732421875, -0.6920166015625, -0.59527587890625, -0.49853515625, -0.40179443359375, -0.3050537109375, -0.20831298828125, -0.111572265625, -0.01483154296875, 0.0819091796875, 0.17864990234375, 0.275390625, 0.37213134765625, 0.4688720703125, 0.56561279296875, 0.662353515625, 0.75909423828125, 0.8558349609375, 0.95257568359375, 1.04931640625, 1.14605712890625, 1.2427978515625, 1.33953857421875, 1.436279296875, 1.53302001953125, 1.6297607421875, 1.72650146484375, 1.8232421875, 1.91998291015625, 2.0167236328125, 2.11346435546875, 2.210205078125, 2.30694580078125, 2.4036865234375, 2.50042724609375, 2.59716796875, 2.69390869140625, 2.7906494140625, 2.88739013671875, 2.984130859375, 3.08087158203125, 3.1776123046875, 3.27435302734375, 3.37109375]}, "gradients/decoder.roberta.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 8.0, 6.0, 7.0, 11.0, 21.0, 14.0, 19.0, 13.0, 26.0, 22.0, 24.0, 36.0, 33.0, 43.0, 43.0, 40.0, 33.0, 43.0, 32.0, 53.0, 41.0, 47.0, 38.0, 45.0, 31.0, 41.0, 30.0, 22.0, 33.0, 29.0, 21.0, 19.0, 14.0, 8.0, 12.0, 9.0, 12.0, 3.0, 4.0, 4.0, 5.0, 1.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.119140625, -2.046417236328125, -1.97369384765625, -1.900970458984375, -1.8282470703125, -1.755523681640625, -1.68280029296875, -1.610076904296875, -1.537353515625, -1.464630126953125, -1.39190673828125, -1.319183349609375, -1.2464599609375, -1.173736572265625, -1.10101318359375, -1.028289794921875, -0.95556640625, -0.882843017578125, -0.81011962890625, -0.737396240234375, -0.6646728515625, -0.591949462890625, -0.51922607421875, -0.446502685546875, -0.373779296875, -0.301055908203125, -0.22833251953125, -0.155609130859375, -0.0828857421875, -0.010162353515625, 0.06256103515625, 0.135284423828125, 0.2080078125, 0.280731201171875, 0.35345458984375, 0.426177978515625, 0.4989013671875, 0.571624755859375, 0.64434814453125, 0.717071533203125, 0.789794921875, 0.862518310546875, 0.93524169921875, 1.007965087890625, 1.0806884765625, 1.153411865234375, 1.22613525390625, 1.298858642578125, 1.37158203125, 1.444305419921875, 1.51702880859375, 1.589752197265625, 1.6624755859375, 1.735198974609375, 1.80792236328125, 1.880645751953125, 1.953369140625, 2.026092529296875, 2.09881591796875, 2.171539306640625, 2.2442626953125, 2.316986083984375, 2.38970947265625, 2.462432861328125, 2.53515625]}, "gradients/decoder.roberta.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 7.0, 9.0, 11.0, 13.0, 17.0, 19.0, 22.0, 34.0, 29.0, 36.0, 50.0, 54.0, 65.0, 60.0, 87.0, 111.0, 120.0, 268.0, 13494.0, 1028769.0, 4274.0, 218.0, 132.0, 107.0, 88.0, 88.0, 56.0, 57.0, 43.0, 37.0, 20.0, 26.0, 28.0, 14.0, 11.0, 8.0, 13.0, 13.0, 7.0, 10.0, 6.0, 4.0, 0.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.890625, -27.907470703125, -26.92431640625, -25.941162109375, -24.9580078125, -23.974853515625, -22.99169921875, -22.008544921875, -21.025390625, -20.042236328125, -19.05908203125, -18.075927734375, -17.0927734375, -16.109619140625, -15.12646484375, -14.143310546875, -13.16015625, -12.177001953125, -11.19384765625, -10.210693359375, -9.2275390625, -8.244384765625, -7.26123046875, -6.278076171875, -5.294921875, -4.311767578125, -3.32861328125, -2.345458984375, -1.3623046875, -0.379150390625, 0.60400390625, 1.587158203125, 2.5703125, 3.553466796875, 4.53662109375, 5.519775390625, 6.5029296875, 7.486083984375, 8.46923828125, 9.452392578125, 10.435546875, 11.418701171875, 12.40185546875, 13.385009765625, 14.3681640625, 15.351318359375, 16.33447265625, 17.317626953125, 18.30078125, 19.283935546875, 20.26708984375, 21.250244140625, 22.2333984375, 23.216552734375, 24.19970703125, 25.182861328125, 26.166015625, 27.149169921875, 28.13232421875, 29.115478515625, 30.0986328125, 31.081787109375, 32.06494140625, 33.048095703125, 34.03125]}, "gradients/decoder.roberta.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 12.0, 5.0, 6.0, 2.0, 9.0, 6.0, 5.0, 13.0, 13.0, 11.0, 24.0, 20.0, 22.0, 24.0, 38.0, 44.0, 48.0, 40.0, 51.0, 52.0, 55.0, 58.0, 50.0, 42.0, 53.0, 43.0, 33.0, 30.0, 23.0, 21.0, 21.0, 16.0, 16.0, 15.0, 9.0, 13.0, 12.0, 8.0, 2.0, 8.0, 8.0, 1.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.60546875, -1.5582275390625, -1.510986328125, -1.4637451171875, -1.41650390625, -1.3692626953125, -1.322021484375, -1.2747802734375, -1.2275390625, -1.1802978515625, -1.133056640625, -1.0858154296875, -1.03857421875, -0.9913330078125, -0.944091796875, -0.8968505859375, -0.849609375, -0.8023681640625, -0.755126953125, -0.7078857421875, -0.66064453125, -0.6134033203125, -0.566162109375, -0.5189208984375, -0.4716796875, -0.4244384765625, -0.377197265625, -0.3299560546875, -0.28271484375, -0.2354736328125, -0.188232421875, -0.1409912109375, -0.09375, -0.0465087890625, 0.000732421875, 0.0479736328125, 0.09521484375, 0.1424560546875, 0.189697265625, 0.2369384765625, 0.2841796875, 0.3314208984375, 0.378662109375, 0.4259033203125, 0.47314453125, 0.5203857421875, 0.567626953125, 0.6148681640625, 0.662109375, 0.7093505859375, 0.756591796875, 0.8038330078125, 0.85107421875, 0.8983154296875, 0.945556640625, 0.9927978515625, 1.0400390625, 1.0872802734375, 1.134521484375, 1.1817626953125, 1.22900390625, 1.2762451171875, 1.323486328125, 1.3707275390625, 1.41796875]}, "gradients/decoder.roberta.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 2.0, 5.0, 7.0, 10.0, 19.0, 40.0, 85.0, 164.0, 460.0, 2722.0, 110907.0, 928447.0, 4664.0, 574.0, 226.0, 93.0, 53.0, 26.0, 13.0, 9.0, 6.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.4114990234375, -4.248779296875, -4.0860595703125, -3.92333984375, -3.7606201171875, -3.597900390625, -3.4351806640625, -3.2724609375, -3.1097412109375, -2.947021484375, -2.7843017578125, -2.62158203125, -2.4588623046875, -2.296142578125, -2.1334228515625, -1.970703125, -1.8079833984375, -1.645263671875, -1.4825439453125, -1.31982421875, -1.1571044921875, -0.994384765625, -0.8316650390625, -0.6689453125, -0.5062255859375, -0.343505859375, -0.1807861328125, -0.01806640625, 0.1446533203125, 0.307373046875, 0.4700927734375, 0.6328125, 0.7955322265625, 0.958251953125, 1.1209716796875, 1.28369140625, 1.4464111328125, 1.609130859375, 1.7718505859375, 1.9345703125, 2.0972900390625, 2.260009765625, 2.4227294921875, 2.58544921875, 2.7481689453125, 2.910888671875, 3.0736083984375, 3.236328125, 3.3990478515625, 3.561767578125, 3.7244873046875, 3.88720703125, 4.0499267578125, 4.212646484375, 4.3753662109375, 4.5380859375, 4.7008056640625, 4.863525390625, 5.0262451171875, 5.18896484375, 5.3516845703125, 5.514404296875, 5.6771240234375, 5.83984375]}, "gradients/decoder.roberta.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 5.0, 8.0, 15.0, 13.0, 19.0, 45.0, 53.0, 63.0, 489.0, 102.0, 53.0, 48.0, 27.0, 17.0, 18.0, 8.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013816356658935547, -0.00013381056487560272, -0.00012945756316184998, -0.00012510456144809723, -0.00012075155973434448, -0.00011639855802059174, -0.00011204555630683899, -0.00010769255459308624, -0.0001033395528793335, -9.898655116558075e-05, -9.4633549451828e-05, -9.028054773807526e-05, -8.592754602432251e-05, -8.157454431056976e-05, -7.722154259681702e-05, -7.286854088306427e-05, -6.851553916931152e-05, -6.416253745555878e-05, -5.980953574180603e-05, -5.5456534028053284e-05, -5.110353231430054e-05, -4.675053060054779e-05, -4.2397528886795044e-05, -3.80445271730423e-05, -3.369152545928955e-05, -2.9338523745536804e-05, -2.4985522031784058e-05, -2.063252031803131e-05, -1.6279518604278564e-05, -1.1926516890525818e-05, -7.573515176773071e-06, -3.2205134630203247e-06, 1.1324882507324219e-06, 5.4854899644851685e-06, 9.838491678237915e-06, 1.4191493391990662e-05, 1.8544495105743408e-05, 2.2897496819496155e-05, 2.72504985332489e-05, 3.160350024700165e-05, 3.5956501960754395e-05, 4.030950367450714e-05, 4.466250538825989e-05, 4.9015507102012634e-05, 5.336850881576538e-05, 5.772151052951813e-05, 6.207451224327087e-05, 6.642751395702362e-05, 7.078051567077637e-05, 7.513351738452911e-05, 7.948651909828186e-05, 8.383952081203461e-05, 8.819252252578735e-05, 9.25455242395401e-05, 9.689852595329285e-05, 0.0001012515276670456, 0.00010560452938079834, 0.00010995753109455109, 0.00011431053280830383, 0.00011866353452205658, 0.00012301653623580933, 0.00012736953794956207, 0.00013172253966331482, 0.00013607554137706757, 0.0001404285430908203]}, "gradients/decoder.roberta.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 3.0, 6.0, 6.0, 10.0, 18.0, 26.0, 40.0, 80.0, 170.0, 521.0, 2644.0, 270298.0, 770909.0, 2912.0, 515.0, 206.0, 83.0, 40.0, 26.0, 12.0, 13.0, 3.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.29296875, -7.095947265625, -6.89892578125, -6.701904296875, -6.5048828125, -6.307861328125, -6.11083984375, -5.913818359375, -5.716796875, -5.519775390625, -5.32275390625, -5.125732421875, -4.9287109375, -4.731689453125, -4.53466796875, -4.337646484375, -4.140625, -3.943603515625, -3.74658203125, -3.549560546875, -3.3525390625, -3.155517578125, -2.95849609375, -2.761474609375, -2.564453125, -2.367431640625, -2.17041015625, -1.973388671875, -1.7763671875, -1.579345703125, -1.38232421875, -1.185302734375, -0.98828125, -0.791259765625, -0.59423828125, -0.397216796875, -0.2001953125, -0.003173828125, 0.19384765625, 0.390869140625, 0.587890625, 0.784912109375, 0.98193359375, 1.178955078125, 1.3759765625, 1.572998046875, 1.77001953125, 1.967041015625, 2.1640625, 2.361083984375, 2.55810546875, 2.755126953125, 2.9521484375, 3.149169921875, 3.34619140625, 3.543212890625, 3.740234375, 3.937255859375, 4.13427734375, 4.331298828125, 4.5283203125, 4.725341796875, 4.92236328125, 5.119384765625, 5.31640625]}, "gradients/decoder.roberta.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 12.0, 23.0, 65.0, 114.0, 587.0, 108.0, 42.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5224609375, -0.5026397705078125, -0.482818603515625, -0.4629974365234375, -0.44317626953125, -0.4233551025390625, -0.403533935546875, -0.3837127685546875, -0.3638916015625, -0.3440704345703125, -0.324249267578125, -0.3044281005859375, -0.28460693359375, -0.2647857666015625, -0.244964599609375, -0.2251434326171875, -0.205322265625, -0.1855010986328125, -0.165679931640625, -0.1458587646484375, -0.12603759765625, -0.1062164306640625, -0.086395263671875, -0.0665740966796875, -0.0467529296875, -0.0269317626953125, -0.007110595703125, 0.0127105712890625, 0.03253173828125, 0.0523529052734375, 0.072174072265625, 0.0919952392578125, 0.11181640625, 0.1316375732421875, 0.151458740234375, 0.1712799072265625, 0.19110107421875, 0.2109222412109375, 0.230743408203125, 0.2505645751953125, 0.2703857421875, 0.2902069091796875, 0.310028076171875, 0.3298492431640625, 0.34967041015625, 0.3694915771484375, 0.389312744140625, 0.4091339111328125, 0.428955078125, 0.4487762451171875, 0.468597412109375, 0.4884185791015625, 0.50823974609375, 0.5280609130859375, 0.547882080078125, 0.5677032470703125, 0.5875244140625, 0.6073455810546875, 0.627166748046875, 0.6469879150390625, 0.66680908203125, 0.6866302490234375, 0.706451416015625, 0.7262725830078125, 0.74609375]}, "gradients/decoder.roberta.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 4.0, 9.0, 9.0, 11.0, 17.0, 30.0, 42.0, 55.0, 40.0, 66.0, 73.0, 86.0, 90.0, 73.0, 83.0, 63.0, 59.0, 46.0, 44.0, 40.0, 13.0, 18.0, 10.0, 12.0, 1.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0296971797943115, -2.9337103366851807, -2.83772349357605, -2.741736650466919, -2.645749807357788, -2.5497629642486572, -2.4537758827209473, -2.3577890396118164, -2.2618021965026855, -2.1658153533935547, -2.069828510284424, -1.973841667175293, -1.877854824066162, -1.7818679809570312, -1.6858810186386108, -1.58989417552948, -1.4939074516296387, -1.3979206085205078, -1.301933765411377, -1.205946922302246, -1.1099600791931152, -1.0139732360839844, -0.917986273765564, -0.8219994306564331, -0.7260125875473022, -0.6300257444381714, -0.5340389013290405, -0.4380519986152649, -0.34206515550613403, -0.24607831239700317, -0.15009140968322754, -0.05410456657409668, 0.04188203811645508, 0.13786889612674713, 0.23385575413703918, 0.32984262704849243, 0.4258294701576233, 0.5218163132667542, 0.6178032159805298, 0.7137900590896606, 0.8097769021987915, 0.9057637453079224, 1.0017505884170532, 1.0977375507354736, 1.1937243938446045, 1.2897112369537354, 1.3856980800628662, 1.481684923171997, 1.577671766281128, 1.6736586093902588, 1.7696454524993896, 1.8656322956085205, 1.9616191387176514, 2.0576059818267822, 2.153593063354492, 2.249579906463623, 2.345566749572754, 2.4415535926818848, 2.5375404357910156, 2.6335272789001465, 2.7295141220092773, 2.825500965118408, 2.921487808227539, 3.01747465133667, 3.113461494445801]}, "gradients/decoder.roberta.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 3.0, 0.0, 7.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 10.0, 8.0, 9.0, 22.0, 18.0, 24.0, 13.0, 22.0, 28.0, 25.0, 34.0, 23.0, 37.0, 31.0, 38.0, 30.0, 44.0, 40.0, 37.0, 40.0, 44.0, 37.0, 36.0, 35.0, 24.0, 25.0, 25.0, 23.0, 30.0, 21.0, 22.0, 16.0, 14.0, 20.0, 9.0, 16.0, 8.0, 8.0, 9.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.0940780639648438, -2.0248193740844727, -1.9555606842041016, -1.8863019943237305, -1.8170433044433594, -1.7477846145629883, -1.6785259246826172, -1.609267234802246, -1.540008544921875, -1.470749855041504, -1.4014911651611328, -1.3322324752807617, -1.2629737854003906, -1.1937150955200195, -1.1244564056396484, -1.0551977157592773, -0.9859389066696167, -0.9166802167892456, -0.8474215269088745, -0.7781628370285034, -0.7089041471481323, -0.6396454572677612, -0.5703867077827454, -0.5011280179023743, -0.4318693280220032, -0.3626106381416321, -0.293351948261261, -0.2240932285785675, -0.1548345386981964, -0.08557584881782532, -0.016317129135131836, 0.05294156074523926, 0.12220025062561035, 0.19145894050598145, 0.26071763038635254, 0.329976350069046, 0.3992350399494171, 0.4684937298297882, 0.5377524495124817, 0.6070111393928528, 0.6762698292732239, 0.745528519153595, 0.8147872090339661, 0.8840459585189819, 0.953304648399353, 1.0225633382797241, 1.0918220281600952, 1.1610807180404663, 1.2303394079208374, 1.2995980978012085, 1.3688567876815796, 1.4381154775619507, 1.5073741674423218, 1.5766328573226929, 1.6458916664123535, 1.7151503562927246, 1.7844090461730957, 1.8536677360534668, 1.922926425933838, 1.992185115814209, 2.06144380569458, 2.130702495574951, 2.1999611854553223, 2.2692198753356934, 2.3384785652160645]}, "gradients/decoder.roberta.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 14.0, 10.0, 11.0, 15.0, 9.0, 16.0, 27.0, 35.0, 49.0, 65.0, 101.0, 186.0, 406.0, 955.0, 2980.0, 15644.0, 3969383.0, 192226.0, 8546.0, 2037.0, 743.0, 326.0, 134.0, 99.0, 59.0, 48.0, 28.0, 25.0, 21.0, 17.0, 13.0, 10.0, 13.0, 5.0, 8.0, 4.0, 0.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.4765625, -11.156494140625, -10.83642578125, -10.516357421875, -10.1962890625, -9.876220703125, -9.55615234375, -9.236083984375, -8.916015625, -8.595947265625, -8.27587890625, -7.955810546875, -7.6357421875, -7.315673828125, -6.99560546875, -6.675537109375, -6.35546875, -6.035400390625, -5.71533203125, -5.395263671875, -5.0751953125, -4.755126953125, -4.43505859375, -4.114990234375, -3.794921875, -3.474853515625, -3.15478515625, -2.834716796875, -2.5146484375, -2.194580078125, -1.87451171875, -1.554443359375, -1.234375, -0.914306640625, -0.59423828125, -0.274169921875, 0.0458984375, 0.365966796875, 0.68603515625, 1.006103515625, 1.326171875, 1.646240234375, 1.96630859375, 2.286376953125, 2.6064453125, 2.926513671875, 3.24658203125, 3.566650390625, 3.88671875, 4.206787109375, 4.52685546875, 4.846923828125, 5.1669921875, 5.487060546875, 5.80712890625, 6.127197265625, 6.447265625, 6.767333984375, 7.08740234375, 7.407470703125, 7.7275390625, 8.047607421875, 8.36767578125, 8.687744140625, 9.0078125]}, "gradients/decoder.roberta.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 4.0, 5.0, 4.0, 8.0, 4.0, 6.0, 10.0, 7.0, 3.0, 17.0, 14.0, 17.0, 23.0, 12.0, 15.0, 22.0, 20.0, 23.0, 32.0, 41.0, 29.0, 47.0, 33.0, 37.0, 33.0, 34.0, 41.0, 31.0, 33.0, 37.0, 39.0, 24.0, 40.0, 25.0, 31.0, 22.0, 29.0, 17.0, 28.0, 23.0, 20.0, 9.0, 12.0, 8.0, 6.0, 5.0, 13.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5146484375, -1.4644012451171875, -1.414154052734375, -1.3639068603515625, -1.31365966796875, -1.2634124755859375, -1.213165283203125, -1.1629180908203125, -1.1126708984375, -1.0624237060546875, -1.012176513671875, -0.9619293212890625, -0.91168212890625, -0.8614349365234375, -0.811187744140625, -0.7609405517578125, -0.710693359375, -0.6604461669921875, -0.610198974609375, -0.5599517822265625, -0.50970458984375, -0.4594573974609375, -0.409210205078125, -0.3589630126953125, -0.3087158203125, -0.2584686279296875, -0.208221435546875, -0.1579742431640625, -0.10772705078125, -0.0574798583984375, -0.007232666015625, 0.0430145263671875, 0.09326171875, 0.1435089111328125, 0.193756103515625, 0.2440032958984375, 0.29425048828125, 0.3444976806640625, 0.394744873046875, 0.4449920654296875, 0.4952392578125, 0.5454864501953125, 0.595733642578125, 0.6459808349609375, 0.69622802734375, 0.7464752197265625, 0.796722412109375, 0.8469696044921875, 0.897216796875, 0.9474639892578125, 0.997711181640625, 1.0479583740234375, 1.09820556640625, 1.1484527587890625, 1.198699951171875, 1.2489471435546875, 1.2991943359375, 1.3494415283203125, 1.399688720703125, 1.4499359130859375, 1.50018310546875, 1.5504302978515625, 1.600677490234375, 1.6509246826171875, 1.701171875]}, "gradients/decoder.roberta.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 10.0, 12.0, 16.0, 39.0, 63.0, 182.0, 1363.0, 4131449.0, 60250.0, 649.0, 151.0, 41.0, 23.0, 15.0, 9.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.328125, -30.429443359375, -29.53076171875, -28.632080078125, -27.7333984375, -26.834716796875, -25.93603515625, -25.037353515625, -24.138671875, -23.239990234375, -22.34130859375, -21.442626953125, -20.5439453125, -19.645263671875, -18.74658203125, -17.847900390625, -16.94921875, -16.050537109375, -15.15185546875, -14.253173828125, -13.3544921875, -12.455810546875, -11.55712890625, -10.658447265625, -9.759765625, -8.861083984375, -7.96240234375, -7.063720703125, -6.1650390625, -5.266357421875, -4.36767578125, -3.468994140625, -2.5703125, -1.671630859375, -0.77294921875, 0.125732421875, 1.0244140625, 1.923095703125, 2.82177734375, 3.720458984375, 4.619140625, 5.517822265625, 6.41650390625, 7.315185546875, 8.2138671875, 9.112548828125, 10.01123046875, 10.909912109375, 11.80859375, 12.707275390625, 13.60595703125, 14.504638671875, 15.4033203125, 16.302001953125, 17.20068359375, 18.099365234375, 18.998046875, 19.896728515625, 20.79541015625, 21.694091796875, 22.5927734375, 23.491455078125, 24.39013671875, 25.288818359375, 26.1875]}, "gradients/decoder.roberta.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 6.0, 20.0, 12.0, 38.0, 86.0, 294.0, 3089.0, 359.0, 81.0, 35.0, 16.0, 17.0, 5.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1302947998046875, -1.077972412109375, -1.0256500244140625, -0.97332763671875, -0.9210052490234375, -0.868682861328125, -0.8163604736328125, -0.7640380859375, -0.7117156982421875, -0.659393310546875, -0.6070709228515625, -0.55474853515625, -0.5024261474609375, -0.450103759765625, -0.3977813720703125, -0.345458984375, -0.2931365966796875, -0.240814208984375, -0.1884918212890625, -0.13616943359375, -0.0838470458984375, -0.031524658203125, 0.0207977294921875, 0.0731201171875, 0.1254425048828125, 0.177764892578125, 0.2300872802734375, 0.28240966796875, 0.3347320556640625, 0.387054443359375, 0.4393768310546875, 0.49169921875, 0.5440216064453125, 0.596343994140625, 0.6486663818359375, 0.70098876953125, 0.7533111572265625, 0.805633544921875, 0.8579559326171875, 0.9102783203125, 0.9626007080078125, 1.014923095703125, 1.0672454833984375, 1.11956787109375, 1.1718902587890625, 1.224212646484375, 1.2765350341796875, 1.328857421875, 1.3811798095703125, 1.433502197265625, 1.4858245849609375, 1.53814697265625, 1.5904693603515625, 1.642791748046875, 1.6951141357421875, 1.7474365234375, 1.7997589111328125, 1.852081298828125, 1.9044036865234375, 1.95672607421875, 2.0090484619140625, 2.061370849609375, 2.1136932373046875, 2.166015625]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 11.0, 19.0, 23.0, 32.0, 49.0, 35.0, 90.0, 97.0, 100.0, 87.0, 95.0, 85.0, 66.0, 55.0, 43.0, 35.0, 20.0, 30.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.667562484741211, -4.569026470184326, -4.470490455627441, -4.371954441070557, -4.273418426513672, -4.174882888793945, -4.076346397399902, -3.9778106212615967, -3.879274845123291, -3.7807388305664062, -3.6822028160095215, -3.5836668014526367, -3.485131025314331, -3.3865950107574463, -3.2880589962005615, -3.1895229816436768, -3.090986967086792, -2.9924509525299072, -2.8939149379730225, -2.795379161834717, -2.696843147277832, -2.5983071327209473, -2.4997711181640625, -2.4012351036071777, -2.302699089050293, -2.204163074493408, -2.1056270599365234, -2.0070910453796387, -1.908555269241333, -1.8100192546844482, -1.7114832401275635, -1.6129472255706787, -1.514411211013794, -1.4158751964569092, -1.317339301109314, -1.2188032865524292, -1.120267391204834, -1.0217313766479492, -0.9231953620910645, -0.8246594071388245, -0.7261234521865845, -0.6275874972343445, -0.5290515422821045, -0.4305155277252197, -0.33197957277297974, -0.23344361782073975, -0.13490760326385498, -0.03637164831161499, 0.062164306640625, 0.16070027649402618, 0.25923624634742737, 0.35777223110198975, 0.45630818605422974, 0.5548441410064697, 0.6533801555633545, 0.7519161105155945, 0.8504520654678345, 0.9489880204200745, 1.0475239753723145, 1.1460599899291992, 1.244596004486084, 1.3431318998336792, 1.441667914390564, 1.5402038097381592, 1.638739824295044]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 7.0, 12.0, 14.0, 8.0, 16.0, 13.0, 20.0, 15.0, 24.0, 23.0, 28.0, 37.0, 38.0, 43.0, 37.0, 48.0, 39.0, 51.0, 40.0, 46.0, 39.0, 42.0, 45.0, 38.0, 30.0, 33.0, 36.0, 29.0, 18.0, 24.0, 18.0, 13.0, 21.0, 10.0, 14.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.773690938949585, -1.708660364151001, -1.6436299085617065, -1.5785993337631226, -1.5135688781738281, -1.4485383033752441, -1.3835077285766602, -1.3184771537780762, -1.2534466981887817, -1.1884161233901978, -1.1233856678009033, -1.0583550930023193, -0.9933245778083801, -0.9282940626144409, -0.8632634878158569, -0.7982329726219177, -0.7332024574279785, -0.6681719422340393, -0.6031414270401001, -0.5381108522415161, -0.4730803370475769, -0.4080498218536377, -0.3430192768573761, -0.2779887318611145, -0.2129582166671753, -0.1479276865720749, -0.08289715647697449, -0.017866626381874084, 0.04716390371322632, 0.11219441890716553, 0.17722496390342712, 0.24225550889968872, 0.30728626251220703, 0.37231677770614624, 0.43734732270240784, 0.5023778676986694, 0.5674083828926086, 0.6324388980865479, 0.6974694728851318, 0.762499988079071, 0.8275305032730103, 0.8925610184669495, 0.9575915336608887, 1.0226221084594727, 1.0876526832580566, 1.152683138847351, 1.217713713645935, 1.2827441692352295, 1.3477747440338135, 1.4128053188323975, 1.477835774421692, 1.5428663492202759, 1.6078968048095703, 1.6729273796081543, 1.7379579544067383, 1.8029885292053223, 1.8680189847946167, 1.9330495595932007, 1.9980800151824951, 2.063110589981079, 2.128141164779663, 2.193171501159668, 2.258202075958252, 2.323232650756836, 2.38826322555542]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 6.0, 13.0, 20.0, 21.0, 48.0, 67.0, 96.0, 149.0, 269.0, 448.0, 691.0, 1227.0, 2070.0, 3706.0, 6014.0, 10687.0, 19429.0, 37519.0, 76470.0, 162085.0, 280167.0, 224625.0, 110431.0, 52397.0, 26623.0, 14115.0, 7963.0, 4542.0, 2713.0, 1597.0, 903.0, 513.0, 355.0, 196.0, 121.0, 85.0, 63.0, 34.0, 18.0, 17.0, 10.0, 8.0, 11.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.338134765625, -0.3263702392578125, -0.314605712890625, -0.3028411865234375, -0.29107666015625, -0.2793121337890625, -0.267547607421875, -0.2557830810546875, -0.2440185546875, -0.2322540283203125, -0.220489501953125, -0.2087249755859375, -0.19696044921875, -0.1851959228515625, -0.173431396484375, -0.1616668701171875, -0.14990234375, -0.1381378173828125, -0.126373291015625, -0.1146087646484375, -0.10284423828125, -0.0910797119140625, -0.079315185546875, -0.0675506591796875, -0.0557861328125, -0.0440216064453125, -0.032257080078125, -0.0204925537109375, -0.00872802734375, 0.0030364990234375, 0.014801025390625, 0.0265655517578125, 0.038330078125, 0.0500946044921875, 0.061859130859375, 0.0736236572265625, 0.08538818359375, 0.0971527099609375, 0.108917236328125, 0.1206817626953125, 0.1324462890625, 0.1442108154296875, 0.155975341796875, 0.1677398681640625, 0.17950439453125, 0.1912689208984375, 0.203033447265625, 0.2147979736328125, 0.2265625, 0.2383270263671875, 0.250091552734375, 0.2618560791015625, 0.27362060546875, 0.2853851318359375, 0.297149658203125, 0.3089141845703125, 0.3206787109375, 0.3324432373046875, 0.344207763671875, 0.3559722900390625, 0.36773681640625, 0.3795013427734375, 0.391265869140625, 0.4030303955078125, 0.414794921875]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 13.0, 13.0, 9.0, 17.0, 12.0, 19.0, 17.0, 22.0, 22.0, 31.0, 35.0, 40.0, 41.0, 37.0, 44.0, 45.0, 48.0, 44.0, 44.0, 38.0, 41.0, 47.0, 34.0, 33.0, 33.0, 37.0, 28.0, 18.0, 24.0, 19.0, 15.0, 17.0, 12.0, 15.0, 8.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6259765625, -1.5647735595703125, -1.503570556640625, -1.4423675537109375, -1.38116455078125, -1.3199615478515625, -1.258758544921875, -1.1975555419921875, -1.1363525390625, -1.0751495361328125, -1.013946533203125, -0.9527435302734375, -0.89154052734375, -0.8303375244140625, -0.769134521484375, -0.7079315185546875, -0.646728515625, -0.5855255126953125, -0.524322509765625, -0.4631195068359375, -0.40191650390625, -0.3407135009765625, -0.279510498046875, -0.2183074951171875, -0.1571044921875, -0.0959014892578125, -0.034698486328125, 0.0265045166015625, 0.08770751953125, 0.1489105224609375, 0.210113525390625, 0.2713165283203125, 0.33251953125, 0.3937225341796875, 0.454925537109375, 0.5161285400390625, 0.57733154296875, 0.6385345458984375, 0.699737548828125, 0.7609405517578125, 0.8221435546875, 0.8833465576171875, 0.944549560546875, 1.0057525634765625, 1.06695556640625, 1.1281585693359375, 1.189361572265625, 1.2505645751953125, 1.311767578125, 1.3729705810546875, 1.434173583984375, 1.4953765869140625, 1.55657958984375, 1.6177825927734375, 1.678985595703125, 1.7401885986328125, 1.8013916015625, 1.8625946044921875, 1.923797607421875, 1.9850006103515625, 2.04620361328125, 2.1074066162109375, 2.168609619140625, 2.2298126220703125, 2.291015625]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 5.0, 5.0, 19.0, 21.0, 24.0, 36.0, 40.0, 40.0, 58.0, 67.0, 98.0, 138.0, 179.0, 253.0, 370.0, 529.0, 734.0, 1245.0, 2233.0, 4666.0, 10878.0, 31362.0, 889900.0, 69683.0, 20082.0, 7476.0, 3350.0, 1702.0, 1080.0, 653.0, 405.0, 302.0, 226.0, 166.0, 132.0, 82.0, 69.0, 46.0, 48.0, 37.0, 28.0, 22.0, 10.0, 13.0, 10.0, 6.0, 6.0, 1.0, 6.0, 3.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.91259765625, -0.8847732543945312, -0.8569488525390625, -0.8291244506835938, -0.801300048828125, -0.7734756469726562, -0.7456512451171875, -0.7178268432617188, -0.69000244140625, -0.6621780395507812, -0.6343536376953125, -0.6065292358398438, -0.578704833984375, -0.5508804321289062, -0.5230560302734375, -0.49523162841796875, -0.4674072265625, -0.43958282470703125, -0.4117584228515625, -0.38393402099609375, -0.356109619140625, -0.32828521728515625, -0.3004608154296875, -0.27263641357421875, -0.24481201171875, -0.21698760986328125, -0.1891632080078125, -0.16133880615234375, -0.133514404296875, -0.10569000244140625, -0.0778656005859375, -0.05004119873046875, -0.022216796875, 0.00560760498046875, 0.0334320068359375, 0.06125640869140625, 0.089080810546875, 0.11690521240234375, 0.1447296142578125, 0.17255401611328125, 0.20037841796875, 0.22820281982421875, 0.2560272216796875, 0.28385162353515625, 0.311676025390625, 0.33950042724609375, 0.3673248291015625, 0.39514923095703125, 0.4229736328125, 0.45079803466796875, 0.4786224365234375, 0.5064468383789062, 0.534271240234375, 0.5620956420898438, 0.5899200439453125, 0.6177444458007812, 0.64556884765625, 0.6733932495117188, 0.7012176513671875, 0.7290420532226562, 0.756866455078125, 0.7846908569335938, 0.8125152587890625, 0.8403396606445312, 0.8681640625]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 7.0, 10.0, 6.0, 7.0, 16.0, 8.0, 18.0, 20.0, 22.0, 23.0, 16.0, 31.0, 35.0, 26.0, 42.0, 34.0, 32.0, 51.0, 38.0, 45.0, 54.0, 40.0, 40.0, 40.0, 35.0, 43.0, 38.0, 26.0, 26.0, 29.0, 20.0, 22.0, 13.0, 17.0, 14.0, 7.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.08795166015625, -1.0499267578125, -1.01190185546875, -0.973876953125, -0.93585205078125, -0.8978271484375, -0.85980224609375, -0.82177734375, -0.78375244140625, -0.7457275390625, -0.70770263671875, -0.669677734375, -0.63165283203125, -0.5936279296875, -0.55560302734375, -0.517578125, -0.47955322265625, -0.4415283203125, -0.40350341796875, -0.365478515625, -0.32745361328125, -0.2894287109375, -0.25140380859375, -0.21337890625, -0.17535400390625, -0.1373291015625, -0.09930419921875, -0.061279296875, -0.02325439453125, 0.0147705078125, 0.05279541015625, 0.0908203125, 0.12884521484375, 0.1668701171875, 0.20489501953125, 0.242919921875, 0.28094482421875, 0.3189697265625, 0.35699462890625, 0.39501953125, 0.43304443359375, 0.4710693359375, 0.50909423828125, 0.547119140625, 0.58514404296875, 0.6231689453125, 0.66119384765625, 0.69921875, 0.73724365234375, 0.7752685546875, 0.81329345703125, 0.851318359375, 0.88934326171875, 0.9273681640625, 0.96539306640625, 1.00341796875, 1.04144287109375, 1.0794677734375, 1.11749267578125, 1.155517578125, 1.19354248046875, 1.2315673828125, 1.26959228515625, 1.3076171875]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 11.0, 14.0, 21.0, 16.0, 26.0, 33.0, 41.0, 71.0, 64.0, 112.0, 146.0, 237.0, 305.0, 525.0, 747.0, 1273.0, 2395.0, 5030.0, 12859.0, 50807.0, 929998.0, 26708.0, 8421.0, 3657.0, 1919.0, 1075.0, 612.0, 371.0, 286.0, 188.0, 138.0, 103.0, 84.0, 60.0, 40.0, 34.0, 26.0, 14.0, 17.0, 12.0, 9.0, 5.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1162109375, -0.11237525939941406, -0.10853958129882812, -0.10470390319824219, -0.10086822509765625, -0.09703254699707031, -0.09319686889648438, -0.08936119079589844, -0.0855255126953125, -0.08168983459472656, -0.07785415649414062, -0.07401847839355469, -0.07018280029296875, -0.06634712219238281, -0.06251144409179688, -0.05867576599121094, -0.054840087890625, -0.05100440979003906, -0.047168731689453125, -0.04333305358886719, -0.03949737548828125, -0.03566169738769531, -0.031826019287109375, -0.027990341186523438, -0.0241546630859375, -0.020318984985351562, -0.016483306884765625, -0.012647628784179688, -0.00881195068359375, -0.0049762725830078125, -0.001140594482421875, 0.0026950836181640625, 0.00653076171875, 0.010366439819335938, 0.014202117919921875, 0.018037796020507812, 0.02187347412109375, 0.025709152221679688, 0.029544830322265625, 0.03338050842285156, 0.0372161865234375, 0.04105186462402344, 0.044887542724609375, 0.04872322082519531, 0.05255889892578125, 0.05639457702636719, 0.060230255126953125, 0.06406593322753906, 0.067901611328125, 0.07173728942871094, 0.07557296752929688, 0.07940864562988281, 0.08324432373046875, 0.08708000183105469, 0.09091567993164062, 0.09475135803222656, 0.0985870361328125, 0.10242271423339844, 0.10625839233398438, 0.11009407043457031, 0.11392974853515625, 0.11776542663574219, 0.12160110473632812, 0.12543678283691406, 0.1292724609375]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 6.0, 3.0, 7.0, 10.0, 7.0, 10.0, 12.0, 23.0, 42.0, 43.0, 50.0, 58.0, 89.0, 80.0, 80.0, 69.0, 70.0, 72.0, 55.0, 43.0, 32.0, 28.0, 17.0, 18.0, 14.0, 6.0, 9.0, 8.0, 1.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8650970458984375e-05, -5.658622831106186e-05, -5.452148616313934e-05, -5.245674401521683e-05, -5.039200186729431e-05, -4.8327259719371796e-05, -4.626251757144928e-05, -4.4197775423526764e-05, -4.213303327560425e-05, -4.006829112768173e-05, -3.8003548979759216e-05, -3.59388068318367e-05, -3.3874064683914185e-05, -3.180932253599167e-05, -2.9744580388069153e-05, -2.7679838240146637e-05, -2.561509609222412e-05, -2.3550353944301605e-05, -2.148561179637909e-05, -1.9420869648456573e-05, -1.7356127500534058e-05, -1.5291385352611542e-05, -1.3226643204689026e-05, -1.116190105676651e-05, -9.097158908843994e-06, -7.032416760921478e-06, -4.967674612998962e-06, -2.9029324650764465e-06, -8.381903171539307e-07, 1.2265518307685852e-06, 3.291293978691101e-06, 5.356036126613617e-06, 7.420778274536133e-06, 9.485520422458649e-06, 1.1550262570381165e-05, 1.361500471830368e-05, 1.5679746866226196e-05, 1.7744489014148712e-05, 1.9809231162071228e-05, 2.1873973309993744e-05, 2.393871545791626e-05, 2.6003457605838776e-05, 2.806819975376129e-05, 3.0132941901683807e-05, 3.219768404960632e-05, 3.426242619752884e-05, 3.6327168345451355e-05, 3.839191049337387e-05, 4.045665264129639e-05, 4.25213947892189e-05, 4.458613693714142e-05, 4.6650879085063934e-05, 4.871562123298645e-05, 5.0780363380908966e-05, 5.284510552883148e-05, 5.4909847676754e-05, 5.6974589824676514e-05, 5.903933197259903e-05, 6.110407412052155e-05, 6.316881626844406e-05, 6.523355841636658e-05, 6.729830056428909e-05, 6.936304271221161e-05, 7.142778486013412e-05, 7.349252700805664e-05]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 2.0, 5.0, 7.0, 9.0, 9.0, 16.0, 13.0, 15.0, 23.0, 29.0, 46.0, 44.0, 54.0, 80.0, 119.0, 229.0, 639.0, 3160.0, 22366.0, 331985.0, 649793.0, 33834.0, 4530.0, 807.0, 255.0, 123.0, 70.0, 60.0, 51.0, 37.0, 27.0, 28.0, 23.0, 19.0, 7.0, 10.0, 6.0, 2.0, 3.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1669921875, -0.1612529754638672, -0.15551376342773438, -0.14977455139160156, -0.14403533935546875, -0.13829612731933594, -0.13255691528320312, -0.1268177032470703, -0.1210784912109375, -0.11533927917480469, -0.10960006713867188, -0.10386085510253906, -0.09812164306640625, -0.09238243103027344, -0.08664321899414062, -0.08090400695800781, -0.075164794921875, -0.06942558288574219, -0.06368637084960938, -0.05794715881347656, -0.05220794677734375, -0.04646873474121094, -0.040729522705078125, -0.03499031066894531, -0.0292510986328125, -0.023511886596679688, -0.017772674560546875, -0.012033462524414062, -0.00629425048828125, -0.0005550384521484375, 0.005184173583984375, 0.010923385620117188, 0.01666259765625, 0.022401809692382812, 0.028141021728515625, 0.03388023376464844, 0.03961944580078125, 0.04535865783691406, 0.051097869873046875, 0.05683708190917969, 0.0625762939453125, 0.06831550598144531, 0.07405471801757812, 0.07979393005371094, 0.08553314208984375, 0.09127235412597656, 0.09701156616210938, 0.10275077819824219, 0.108489990234375, 0.11422920227050781, 0.11996841430664062, 0.12570762634277344, 0.13144683837890625, 0.13718605041503906, 0.14292526245117188, 0.1486644744873047, 0.1544036865234375, 0.1601428985595703, 0.16588211059570312, 0.17162132263183594, 0.17736053466796875, 0.18309974670410156, 0.18883895874023438, 0.1945781707763672, 0.2003173828125]}, "gradients/decoder.roberta.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 14.0, 17.0, 22.0, 16.0, 23.0, 25.0, 42.0, 48.0, 62.0, 86.0, 80.0, 74.0, 81.0, 80.0, 56.0, 49.0, 32.0, 29.0, 28.0, 18.0, 18.0, 13.0, 12.0, 11.0, 10.0, 8.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0166778564453125, -0.016175508499145508, -0.015673160552978516, -0.015170812606811523, -0.014668464660644531, -0.014166116714477539, -0.013663768768310547, -0.013161420822143555, -0.012659072875976562, -0.01215672492980957, -0.011654376983642578, -0.011152029037475586, -0.010649681091308594, -0.010147333145141602, -0.00964498519897461, -0.009142637252807617, -0.008640289306640625, -0.008137941360473633, -0.007635593414306641, -0.0071332454681396484, -0.006630897521972656, -0.006128549575805664, -0.005626201629638672, -0.00512385368347168, -0.0046215057373046875, -0.004119157791137695, -0.003616809844970703, -0.003114461898803711, -0.0026121139526367188, -0.0021097660064697266, -0.0016074180603027344, -0.0011050701141357422, -0.00060272216796875, -0.00010037422180175781, 0.0004019737243652344, 0.0009043216705322266, 0.0014066696166992188, 0.001909017562866211, 0.002411365509033203, 0.0029137134552001953, 0.0034160614013671875, 0.00391840934753418, 0.004420757293701172, 0.004923105239868164, 0.005425453186035156, 0.0059278011322021484, 0.006430149078369141, 0.006932497024536133, 0.007434844970703125, 0.007937192916870117, 0.00843954086303711, 0.008941888809204102, 0.009444236755371094, 0.009946584701538086, 0.010448932647705078, 0.01095128059387207, 0.011453628540039062, 0.011955976486206055, 0.012458324432373047, 0.012960672378540039, 0.013463020324707031, 0.013965368270874023, 0.014467716217041016, 0.014970064163208008, 0.015472412109375]}, "gradients/decoder.roberta.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 21.0, 38.0, 75.0, 116.0, 194.0, 189.0, 154.0, 99.0, 66.0, 37.0, 11.0, 7.0, 1.0, 2.0], "bins": [-10.158638954162598, -9.974987983703613, -9.791336059570312, -9.607685089111328, -9.424033164978027, -9.240382194519043, -9.056730270385742, -8.873079299926758, -8.689428329467773, -8.505777359008789, -8.322125434875488, -8.138474464416504, -7.954823017120361, -7.771171569824219, -7.587520122528076, -7.403868675231934, -7.220216751098633, -7.03656530380249, -6.852913856506348, -6.669262886047363, -6.485611438751221, -6.301959991455078, -6.1183085441589355, -5.934657096862793, -5.751006126403809, -5.567354679107666, -5.383703231811523, -5.200052261352539, -5.0164008140563965, -4.832749366760254, -4.649097919464111, -4.465446472167969, -4.281795501708984, -4.098144054412842, -3.9144928455352783, -3.7308413982391357, -3.547189950942993, -3.3635387420654297, -3.179887294769287, -2.9962358474731445, -2.812584400177002, -2.6289329528808594, -2.445281744003296, -2.2616302967071533, -2.0779788494110107, -1.8943275213241577, -1.7106761932373047, -1.527024745941162, -1.343373417854309, -1.159722089767456, -0.9760706424713135, -0.7924193143844604, -0.6087679266929626, -0.42511653900146484, -0.24146521091461182, -0.05781376361846924, 0.1258375644683838, 0.3094889521598816, 0.493140310049057, 0.6767916679382324, 0.8604430556297302, 1.044094443321228, 1.227745771408081, 1.4113972187042236, 1.5950485467910767]}, "gradients/decoder.roberta.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 9.0, 7.0, 12.0, 12.0, 10.0, 16.0, 13.0, 20.0, 16.0, 23.0, 21.0, 32.0, 34.0, 37.0, 44.0, 36.0, 49.0, 41.0, 47.0, 44.0, 45.0, 39.0, 41.0, 44.0, 37.0, 32.0, 33.0, 37.0, 28.0, 18.0, 24.0, 18.0, 15.0, 17.0, 13.0, 15.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6254708766937256, -1.5642788410186768, -1.5030866861343384, -1.4418946504592896, -1.3807026147842407, -1.3195104598999023, -1.2583184242248535, -1.1971263885498047, -1.1359343528747559, -1.074742317199707, -1.0135501623153687, -0.9523581266403198, -0.891166090965271, -0.8299739956855774, -0.7687819004058838, -0.707589864730835, -0.6463977098464966, -0.585205614566803, -0.5240135788917542, -0.46282148361206055, -0.40162941813468933, -0.3404373526573181, -0.2792452573776245, -0.2180531919002533, -0.15686112642288208, -0.09566905349493027, -0.034476980566978455, 0.026715099811553955, 0.08790716528892517, 0.1490992307662964, 0.21029132604599, 0.2714833915233612, 0.3326754570007324, 0.39386752247810364, 0.45505958795547485, 0.5162516832351685, 0.5774437189102173, 0.6386358141899109, 0.6998279094696045, 0.7610199451446533, 0.8222120404243469, 0.8834041357040405, 0.9445961713790894, 1.0057883262634277, 1.0669803619384766, 1.1281723976135254, 1.1893644332885742, 1.2505565881729126, 1.3117486238479614, 1.3729406595230103, 1.4341328144073486, 1.4953248500823975, 1.5565168857574463, 1.6177089214324951, 1.6789010763168335, 1.7400931119918823, 1.8012852668762207, 1.8624773025512695, 1.923669457435608, 1.9848614931106567, 2.046053647994995, 2.107245683670044, 2.1684377193450928, 2.2296297550201416, 2.2908217906951904]}, "gradients/decoder.roberta.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 6.0, 10.0, 18.0, 18.0, 24.0, 39.0, 54.0, 66.0, 102.0, 158.0, 184.0, 328.0, 492.0, 764.0, 1318.0, 2462.0, 4536.0, 9350.0, 20599.0, 47792.0, 132068.0, 418063.0, 265626.0, 81898.0, 32882.0, 14666.0, 6804.0, 3491.0, 1775.0, 1022.0, 647.0, 350.0, 274.0, 200.0, 131.0, 82.0, 64.0, 55.0, 36.0, 28.0, 25.0, 8.0, 7.0, 9.0, 5.0, 8.0, 5.0, 0.0, 1.0, 3.0], "bins": [-3.400390625, -3.30535888671875, -3.2103271484375, -3.11529541015625, -3.020263671875, -2.92523193359375, -2.8302001953125, -2.73516845703125, -2.64013671875, -2.54510498046875, -2.4500732421875, -2.35504150390625, -2.260009765625, -2.16497802734375, -2.0699462890625, -1.97491455078125, -1.8798828125, -1.78485107421875, -1.6898193359375, -1.59478759765625, -1.499755859375, -1.40472412109375, -1.3096923828125, -1.21466064453125, -1.11962890625, -1.02459716796875, -0.9295654296875, -0.83453369140625, -0.739501953125, -0.64447021484375, -0.5494384765625, -0.45440673828125, -0.359375, -0.26434326171875, -0.1693115234375, -0.07427978515625, 0.020751953125, 0.11578369140625, 0.2108154296875, 0.30584716796875, 0.40087890625, 0.49591064453125, 0.5909423828125, 0.68597412109375, 0.781005859375, 0.87603759765625, 0.9710693359375, 1.06610107421875, 1.1611328125, 1.25616455078125, 1.3511962890625, 1.44622802734375, 1.541259765625, 1.63629150390625, 1.7313232421875, 1.82635498046875, 1.92138671875, 2.01641845703125, 2.1114501953125, 2.20648193359375, 2.301513671875, 2.39654541015625, 2.4915771484375, 2.58660888671875, 2.681640625]}, "gradients/decoder.roberta.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 7.0, 17.0, 5.0, 16.0, 16.0, 17.0, 15.0, 23.0, 20.0, 25.0, 30.0, 41.0, 46.0, 32.0, 48.0, 42.0, 44.0, 48.0, 42.0, 45.0, 37.0, 52.0, 37.0, 29.0, 31.0, 34.0, 32.0, 26.0, 22.0, 19.0, 19.0, 14.0, 11.0, 19.0, 9.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7470703125, -1.6823577880859375, -1.617645263671875, -1.5529327392578125, -1.48822021484375, -1.4235076904296875, -1.358795166015625, -1.2940826416015625, -1.2293701171875, -1.1646575927734375, -1.099945068359375, -1.0352325439453125, -0.97052001953125, -0.9058074951171875, -0.841094970703125, -0.7763824462890625, -0.711669921875, -0.6469573974609375, -0.582244873046875, -0.5175323486328125, -0.45281982421875, -0.3881072998046875, -0.323394775390625, -0.2586822509765625, -0.1939697265625, -0.1292572021484375, -0.064544677734375, 0.0001678466796875, 0.06488037109375, 0.1295928955078125, 0.194305419921875, 0.2590179443359375, 0.32373046875, 0.3884429931640625, 0.453155517578125, 0.5178680419921875, 0.58258056640625, 0.6472930908203125, 0.712005615234375, 0.7767181396484375, 0.8414306640625, 0.9061431884765625, 0.970855712890625, 1.0355682373046875, 1.10028076171875, 1.1649932861328125, 1.229705810546875, 1.2944183349609375, 1.359130859375, 1.4238433837890625, 1.488555908203125, 1.5532684326171875, 1.61798095703125, 1.6826934814453125, 1.747406005859375, 1.8121185302734375, 1.8768310546875, 1.9415435791015625, 2.006256103515625, 2.0709686279296875, 2.13568115234375, 2.2003936767578125, 2.265106201171875, 2.3298187255859375, 2.39453125]}, "gradients/decoder.roberta.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 4.0, 7.0, 9.0, 14.0, 16.0, 17.0, 28.0, 37.0, 39.0, 63.0, 72.0, 69.0, 75.0, 109.0, 126.0, 154.0, 174.0, 244.0, 1333.0, 952125.0, 91875.0, 791.0, 212.0, 165.0, 144.0, 124.0, 92.0, 87.0, 77.0, 62.0, 53.0, 33.0, 35.0, 24.0, 22.0, 16.0, 11.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-33.125, -31.97802734375, -30.8310546875, -29.68408203125, -28.537109375, -27.39013671875, -26.2431640625, -25.09619140625, -23.94921875, -22.80224609375, -21.6552734375, -20.50830078125, -19.361328125, -18.21435546875, -17.0673828125, -15.92041015625, -14.7734375, -13.62646484375, -12.4794921875, -11.33251953125, -10.185546875, -9.03857421875, -7.8916015625, -6.74462890625, -5.59765625, -4.45068359375, -3.3037109375, -2.15673828125, -1.009765625, 0.13720703125, 1.2841796875, 2.43115234375, 3.578125, 4.72509765625, 5.8720703125, 7.01904296875, 8.166015625, 9.31298828125, 10.4599609375, 11.60693359375, 12.75390625, 13.90087890625, 15.0478515625, 16.19482421875, 17.341796875, 18.48876953125, 19.6357421875, 20.78271484375, 21.9296875, 23.07666015625, 24.2236328125, 25.37060546875, 26.517578125, 27.66455078125, 28.8115234375, 29.95849609375, 31.10546875, 32.25244140625, 33.3994140625, 34.54638671875, 35.693359375, 36.84033203125, 37.9873046875, 39.13427734375, 40.28125]}, "gradients/decoder.roberta.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 3.0, 9.0, 5.0, 14.0, 11.0, 16.0, 17.0, 21.0, 21.0, 26.0, 35.0, 28.0, 54.0, 43.0, 40.0, 60.0, 56.0, 43.0, 56.0, 58.0, 50.0, 55.0, 40.0, 38.0, 35.0, 20.0, 31.0, 27.0, 19.0, 14.0, 11.0, 14.0, 4.0, 11.0, 7.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.6953125, -2.621673583984375, -2.54803466796875, -2.474395751953125, -2.4007568359375, -2.327117919921875, -2.25347900390625, -2.179840087890625, -2.106201171875, -2.032562255859375, -1.95892333984375, -1.885284423828125, -1.8116455078125, -1.738006591796875, -1.66436767578125, -1.590728759765625, -1.51708984375, -1.443450927734375, -1.36981201171875, -1.296173095703125, -1.2225341796875, -1.148895263671875, -1.07525634765625, -1.001617431640625, -0.927978515625, -0.854339599609375, -0.78070068359375, -0.707061767578125, -0.6334228515625, -0.559783935546875, -0.48614501953125, -0.412506103515625, -0.3388671875, -0.265228271484375, -0.19158935546875, -0.117950439453125, -0.0443115234375, 0.029327392578125, 0.10296630859375, 0.176605224609375, 0.250244140625, 0.323883056640625, 0.39752197265625, 0.471160888671875, 0.5447998046875, 0.618438720703125, 0.69207763671875, 0.765716552734375, 0.83935546875, 0.912994384765625, 0.98663330078125, 1.060272216796875, 1.1339111328125, 1.207550048828125, 1.28118896484375, 1.354827880859375, 1.428466796875, 1.502105712890625, 1.57574462890625, 1.649383544921875, 1.7230224609375, 1.796661376953125, 1.87030029296875, 1.943939208984375, 2.017578125]}, "gradients/decoder.roberta.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 8.0, 4.0, 10.0, 18.0, 30.0, 38.0, 77.0, 149.0, 317.0, 1026.0, 8340.0, 266916.0, 756764.0, 12721.0, 1430.0, 332.0, 168.0, 83.0, 55.0, 30.0, 10.0, 9.0, 3.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.640625, -5.47515869140625, -5.3096923828125, -5.14422607421875, -4.978759765625, -4.81329345703125, -4.6478271484375, -4.48236083984375, -4.31689453125, -4.15142822265625, -3.9859619140625, -3.82049560546875, -3.655029296875, -3.48956298828125, -3.3240966796875, -3.15863037109375, -2.9931640625, -2.82769775390625, -2.6622314453125, -2.49676513671875, -2.331298828125, -2.16583251953125, -2.0003662109375, -1.83489990234375, -1.66943359375, -1.50396728515625, -1.3385009765625, -1.17303466796875, -1.007568359375, -0.84210205078125, -0.6766357421875, -0.51116943359375, -0.345703125, -0.18023681640625, -0.0147705078125, 0.15069580078125, 0.316162109375, 0.48162841796875, 0.6470947265625, 0.81256103515625, 0.97802734375, 1.14349365234375, 1.3089599609375, 1.47442626953125, 1.639892578125, 1.80535888671875, 1.9708251953125, 2.13629150390625, 2.3017578125, 2.46722412109375, 2.6326904296875, 2.79815673828125, 2.963623046875, 3.12908935546875, 3.2945556640625, 3.46002197265625, 3.62548828125, 3.79095458984375, 3.9564208984375, 4.12188720703125, 4.287353515625, 4.45281982421875, 4.6182861328125, 4.78375244140625, 4.94921875]}, "gradients/decoder.roberta.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 1.0, 4.0, 9.0, 15.0, 12.0, 25.0, 33.0, 65.0, 83.0, 151.0, 188.0, 147.0, 90.0, 52.0, 42.0, 23.0, 10.0, 12.0, 4.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00020813941955566406, -0.00020190328359603882, -0.00019566714763641357, -0.00018943101167678833, -0.00018319487571716309, -0.00017695873975753784, -0.0001707226037979126, -0.00016448646783828735, -0.0001582503318786621, -0.00015201419591903687, -0.00014577805995941162, -0.00013954192399978638, -0.00013330578804016113, -0.0001270696520805359, -0.00012083351612091064, -0.0001145973801612854, -0.00010836124420166016, -0.00010212510824203491, -9.588897228240967e-05, -8.965283632278442e-05, -8.341670036315918e-05, -7.718056440353394e-05, -7.094442844390869e-05, -6.470829248428345e-05, -5.84721565246582e-05, -5.223602056503296e-05, -4.5999884605407715e-05, -3.976374864578247e-05, -3.3527612686157227e-05, -2.7291476726531982e-05, -2.1055340766906738e-05, -1.4819204807281494e-05, -8.58306884765625e-06, -2.346932888031006e-06, 3.889203071594238e-06, 1.0125339031219482e-05, 1.6361474990844727e-05, 2.259761095046997e-05, 2.8833746910095215e-05, 3.506988286972046e-05, 4.13060188293457e-05, 4.754215478897095e-05, 5.377829074859619e-05, 6.0014426708221436e-05, 6.625056266784668e-05, 7.248669862747192e-05, 7.872283458709717e-05, 8.495897054672241e-05, 9.119510650634766e-05, 9.74312424659729e-05, 0.00010366737842559814, 0.00010990351438522339, 0.00011613965034484863, 0.00012237578630447388, 0.00012861192226409912, 0.00013484805822372437, 0.0001410841941833496, 0.00014732033014297485, 0.0001535564661026001, 0.00015979260206222534, 0.00016602873802185059, 0.00017226487398147583, 0.00017850100994110107, 0.00018473714590072632, 0.00019097328186035156]}, "gradients/decoder.roberta.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 6.0, 11.0, 17.0, 32.0, 40.0, 73.0, 149.0, 412.0, 1743.0, 63258.0, 973142.0, 8381.0, 734.0, 246.0, 108.0, 76.0, 30.0, 23.0, 7.0, 12.0, 9.0, 2.0, 1.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.4700927734375, -8.190185546875, -7.9102783203125, -7.63037109375, -7.3504638671875, -7.070556640625, -6.7906494140625, -6.5107421875, -6.2308349609375, -5.950927734375, -5.6710205078125, -5.39111328125, -5.1112060546875, -4.831298828125, -4.5513916015625, -4.271484375, -3.9915771484375, -3.711669921875, -3.4317626953125, -3.15185546875, -2.8719482421875, -2.592041015625, -2.3121337890625, -2.0322265625, -1.7523193359375, -1.472412109375, -1.1925048828125, -0.91259765625, -0.6326904296875, -0.352783203125, -0.0728759765625, 0.20703125, 0.4869384765625, 0.766845703125, 1.0467529296875, 1.32666015625, 1.6065673828125, 1.886474609375, 2.1663818359375, 2.4462890625, 2.7261962890625, 3.006103515625, 3.2860107421875, 3.56591796875, 3.8458251953125, 4.125732421875, 4.4056396484375, 4.685546875, 4.9654541015625, 5.245361328125, 5.5252685546875, 5.80517578125, 6.0850830078125, 6.364990234375, 6.6448974609375, 6.9248046875, 7.2047119140625, 7.484619140625, 7.7645263671875, 8.04443359375, 8.3243408203125, 8.604248046875, 8.8841552734375, 9.1640625]}, "gradients/decoder.roberta.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 22.0, 21.0, 32.0, 57.0, 95.0, 144.0, 196.0, 154.0, 88.0, 46.0, 33.0, 19.0, 19.0, 12.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5380859375, -0.5177688598632812, -0.4974517822265625, -0.47713470458984375, -0.456817626953125, -0.43650054931640625, -0.4161834716796875, -0.39586639404296875, -0.37554931640625, -0.35523223876953125, -0.3349151611328125, -0.31459808349609375, -0.294281005859375, -0.27396392822265625, -0.2536468505859375, -0.23332977294921875, -0.2130126953125, -0.19269561767578125, -0.1723785400390625, -0.15206146240234375, -0.131744384765625, -0.11142730712890625, -0.0911102294921875, -0.07079315185546875, -0.05047607421875, -0.03015899658203125, -0.0098419189453125, 0.01047515869140625, 0.030792236328125, 0.05110931396484375, 0.0714263916015625, 0.09174346923828125, 0.112060546875, 0.13237762451171875, 0.1526947021484375, 0.17301177978515625, 0.193328857421875, 0.21364593505859375, 0.2339630126953125, 0.25428009033203125, 0.27459716796875, 0.29491424560546875, 0.3152313232421875, 0.33554840087890625, 0.355865478515625, 0.37618255615234375, 0.3964996337890625, 0.41681671142578125, 0.4371337890625, 0.45745086669921875, 0.4777679443359375, 0.49808502197265625, 0.518402099609375, 0.5387191772460938, 0.5590362548828125, 0.5793533325195312, 0.59967041015625, 0.6199874877929688, 0.6403045654296875, 0.6606216430664062, 0.680938720703125, 0.7012557983398438, 0.7215728759765625, 0.7418899536132812, 0.76220703125]}, "gradients/decoder.roberta.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 12.0, 16.0, 10.0, 18.0, 22.0, 19.0, 35.0, 31.0, 35.0, 39.0, 51.0, 52.0, 57.0, 55.0, 64.0, 44.0, 52.0, 57.0, 54.0, 37.0, 35.0, 32.0, 29.0, 29.0, 17.0, 25.0, 23.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.2436695098876953, -2.1817893981933594, -2.1199092864990234, -2.0580294132232666, -1.9961493015289307, -1.9342691898345947, -1.8723890781402588, -1.8105089664459229, -1.7486289739608765, -1.6867488622665405, -1.6248688697814941, -1.5629887580871582, -1.5011086463928223, -1.4392286539077759, -1.37734854221344, -1.3154685497283936, -1.2535884380340576, -1.1917083263397217, -1.1298283338546753, -1.0679482221603394, -1.006068229675293, -0.944188117980957, -0.8823080062866211, -0.8204279541969299, -0.7585479021072388, -0.6966678500175476, -0.6347877979278564, -0.5729076862335205, -0.5110276341438293, -0.4491475820541382, -0.38726750016212463, -0.3253874182701111, -0.26350724697113037, -0.20162717998027802, -0.13974711298942566, -0.0778670459985733, -0.015986979007720947, 0.045893073081970215, 0.10777315497398376, 0.16965323686599731, 0.23153328895568848, 0.29341334104537964, 0.3552934229373932, 0.41717350482940674, 0.4790535569190979, 0.5409336090087891, 0.602813720703125, 0.6646937727928162, 0.7265738248825073, 0.7884538769721985, 0.8503339290618896, 0.9122140407562256, 0.9740940928459167, 1.035974144935608, 1.0978542566299438, 1.1597342491149902, 1.2216143608093262, 1.283494472503662, 1.3453744649887085, 1.4072545766830444, 1.4691345691680908, 1.5310146808624268, 1.5928947925567627, 1.6547749042510986, 1.716654896736145]}, "gradients/decoder.roberta.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 7.0, 5.0, 7.0, 15.0, 15.0, 12.0, 23.0, 29.0, 16.0, 39.0, 36.0, 35.0, 39.0, 36.0, 23.0, 49.0, 56.0, 40.0, 51.0, 45.0, 36.0, 48.0, 45.0, 29.0, 37.0, 27.0, 21.0, 29.0, 29.0, 18.0, 22.0, 8.0, 14.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.945497512817383, -2.857539176940918, -2.769580841064453, -2.6816225051879883, -2.5936641693115234, -2.5057058334350586, -2.4177474975585938, -2.329789161682129, -2.241830825805664, -2.153872489929199, -2.0659141540527344, -1.9779558181762695, -1.8899974822998047, -1.8020391464233398, -1.714080810546875, -1.6261224746704102, -1.5381641387939453, -1.4502058029174805, -1.3622474670410156, -1.2742891311645508, -1.186330795288086, -1.098372459411621, -1.0104141235351562, -0.9224557876586914, -0.8344974517822266, -0.7465391159057617, -0.6585807800292969, -0.570622444152832, -0.4826641082763672, -0.39470577239990234, -0.3067474365234375, -0.21878910064697266, -0.13083100318908691, -0.04287266731262207, 0.04508566856384277, 0.13304400444030762, 0.22100234031677246, 0.3089606761932373, 0.39691901206970215, 0.484877347946167, 0.5728356838226318, 0.6607940196990967, 0.7487523555755615, 0.8367106914520264, 0.9246690273284912, 1.012627363204956, 1.100585699081421, 1.1885440349578857, 1.2765023708343506, 1.3644607067108154, 1.4524190425872803, 1.5403773784637451, 1.62833571434021, 1.7162940502166748, 1.8042523860931396, 1.8922107219696045, 1.9801690578460693, 2.068127393722534, 2.156085729598999, 2.244044065475464, 2.3320024013519287, 2.4199607372283936, 2.5079190731048584, 2.5958774089813232, 2.683835744857788]}, "gradients/decoder.roberta.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 6.0, 4.0, 11.0, 11.0, 11.0, 15.0, 21.0, 27.0, 30.0, 44.0, 64.0, 114.0, 186.0, 399.0, 741.0, 1937.0, 6060.0, 25716.0, 4067579.0, 75059.0, 10698.0, 3204.0, 1150.0, 508.0, 242.0, 128.0, 81.0, 51.0, 41.0, 36.0, 17.0, 20.0, 11.0, 11.0, 14.0, 9.0, 8.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0], "bins": [-10.1328125, -9.86419677734375, -9.5955810546875, -9.32696533203125, -9.058349609375, -8.78973388671875, -8.5211181640625, -8.25250244140625, -7.98388671875, -7.71527099609375, -7.4466552734375, -7.17803955078125, -6.909423828125, -6.64080810546875, -6.3721923828125, -6.10357666015625, -5.8349609375, -5.56634521484375, -5.2977294921875, -5.02911376953125, -4.760498046875, -4.49188232421875, -4.2232666015625, -3.95465087890625, -3.68603515625, -3.41741943359375, -3.1488037109375, -2.88018798828125, -2.611572265625, -2.34295654296875, -2.0743408203125, -1.80572509765625, -1.537109375, -1.26849365234375, -0.9998779296875, -0.73126220703125, -0.462646484375, -0.19403076171875, 0.0745849609375, 0.34320068359375, 0.61181640625, 0.88043212890625, 1.1490478515625, 1.41766357421875, 1.686279296875, 1.95489501953125, 2.2235107421875, 2.49212646484375, 2.7607421875, 3.02935791015625, 3.2979736328125, 3.56658935546875, 3.835205078125, 4.10382080078125, 4.3724365234375, 4.64105224609375, 4.90966796875, 5.17828369140625, 5.4468994140625, 5.71551513671875, 5.984130859375, 6.25274658203125, 6.5213623046875, 6.78997802734375, 7.05859375]}, "gradients/decoder.roberta.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 2.0, 11.0, 11.0, 7.0, 12.0, 10.0, 13.0, 22.0, 10.0, 24.0, 31.0, 27.0, 34.0, 25.0, 30.0, 29.0, 32.0, 28.0, 40.0, 37.0, 41.0, 40.0, 33.0, 44.0, 49.0, 40.0, 35.0, 42.0, 32.0, 33.0, 27.0, 24.0, 20.0, 12.0, 25.0, 8.0, 13.0, 4.0, 9.0, 8.0, 5.0, 3.0, 5.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.6640625, -1.6122283935546875, -1.560394287109375, -1.5085601806640625, -1.45672607421875, -1.4048919677734375, -1.353057861328125, -1.3012237548828125, -1.2493896484375, -1.1975555419921875, -1.145721435546875, -1.0938873291015625, -1.04205322265625, -0.9902191162109375, -0.938385009765625, -0.8865509033203125, -0.834716796875, -0.7828826904296875, -0.731048583984375, -0.6792144775390625, -0.62738037109375, -0.5755462646484375, -0.523712158203125, -0.4718780517578125, -0.4200439453125, -0.3682098388671875, -0.316375732421875, -0.2645416259765625, -0.21270751953125, -0.1608734130859375, -0.109039306640625, -0.0572052001953125, -0.00537109375, 0.0464630126953125, 0.098297119140625, 0.1501312255859375, 0.20196533203125, 0.2537994384765625, 0.305633544921875, 0.3574676513671875, 0.4093017578125, 0.4611358642578125, 0.512969970703125, 0.5648040771484375, 0.61663818359375, 0.6684722900390625, 0.720306396484375, 0.7721405029296875, 0.823974609375, 0.8758087158203125, 0.927642822265625, 0.9794769287109375, 1.03131103515625, 1.0831451416015625, 1.134979248046875, 1.1868133544921875, 1.2386474609375, 1.2904815673828125, 1.342315673828125, 1.3941497802734375, 1.44598388671875, 1.4978179931640625, 1.549652099609375, 1.6014862060546875, 1.6533203125]}, "gradients/decoder.roberta.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 7.0, 5.0, 10.0, 39.0, 156.0, 1820.0, 4060706.0, 129996.0, 1336.0, 124.0, 36.0, 15.0, 3.0, 4.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.03125, -26.210693359375, -25.39013671875, -24.569580078125, -23.7490234375, -22.928466796875, -22.10791015625, -21.287353515625, -20.466796875, -19.646240234375, -18.82568359375, -18.005126953125, -17.1845703125, -16.364013671875, -15.54345703125, -14.722900390625, -13.90234375, -13.081787109375, -12.26123046875, -11.440673828125, -10.6201171875, -9.799560546875, -8.97900390625, -8.158447265625, -7.337890625, -6.517333984375, -5.69677734375, -4.876220703125, -4.0556640625, -3.235107421875, -2.41455078125, -1.593994140625, -0.7734375, 0.047119140625, 0.86767578125, 1.688232421875, 2.5087890625, 3.329345703125, 4.14990234375, 4.970458984375, 5.791015625, 6.611572265625, 7.43212890625, 8.252685546875, 9.0732421875, 9.893798828125, 10.71435546875, 11.534912109375, 12.35546875, 13.176025390625, 13.99658203125, 14.817138671875, 15.6376953125, 16.458251953125, 17.27880859375, 18.099365234375, 18.919921875, 19.740478515625, 20.56103515625, 21.381591796875, 22.2021484375, 23.022705078125, 23.84326171875, 24.663818359375, 25.484375]}, "gradients/decoder.roberta.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 13.0, 12.0, 55.0, 160.0, 3380.0, 345.0, 51.0, 22.0, 13.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.268768310546875, -1.21722412109375, -1.165679931640625, -1.1141357421875, -1.062591552734375, -1.01104736328125, -0.959503173828125, -0.907958984375, -0.856414794921875, -0.80487060546875, -0.753326416015625, -0.7017822265625, -0.650238037109375, -0.59869384765625, -0.547149658203125, -0.49560546875, -0.444061279296875, -0.39251708984375, -0.340972900390625, -0.2894287109375, -0.237884521484375, -0.18634033203125, -0.134796142578125, -0.083251953125, -0.031707763671875, 0.01983642578125, 0.071380615234375, 0.1229248046875, 0.174468994140625, 0.22601318359375, 0.277557373046875, 0.3291015625, 0.380645751953125, 0.43218994140625, 0.483734130859375, 0.5352783203125, 0.586822509765625, 0.63836669921875, 0.689910888671875, 0.741455078125, 0.792999267578125, 0.84454345703125, 0.896087646484375, 0.9476318359375, 0.999176025390625, 1.05072021484375, 1.102264404296875, 1.15380859375, 1.205352783203125, 1.25689697265625, 1.308441162109375, 1.3599853515625, 1.411529541015625, 1.46307373046875, 1.514617919921875, 1.566162109375, 1.617706298828125, 1.66925048828125, 1.720794677734375, 1.7723388671875, 1.823883056640625, 1.87542724609375, 1.926971435546875, 1.978515625]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 7.0, 8.0, 21.0, 31.0, 27.0, 31.0, 48.0, 53.0, 76.0, 74.0, 93.0, 80.0, 99.0, 72.0, 56.0, 61.0, 53.0, 23.0, 21.0, 25.0, 15.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7670148611068726, -1.690822720527649, -1.6146304607391357, -1.538438320159912, -1.462246060371399, -1.3860539197921753, -1.309861660003662, -1.2336695194244385, -1.1574773788452148, -1.0812852382659912, -1.005092978477478, -0.9289008378982544, -0.8527085781097412, -0.7765164375305176, -0.7003242373466492, -0.6241320371627808, -0.5479397773742676, -0.47174757719039917, -0.39555537700653076, -0.31936320662498474, -0.24317100644111633, -0.16697880625724792, -0.0907866358757019, -0.014594435691833496, 0.06159776449203491, 0.13778996467590332, 0.21398214995861053, 0.29017433524131775, 0.36636653542518616, 0.44255873560905457, 0.5187509059906006, 0.594943106174469, 0.6711351871490479, 0.7473273873329163, 0.8235195875167847, 0.8997117280960083, 0.9759039878845215, 1.0520961284637451, 1.1282882690429688, 1.204480528831482, 1.2806727886199951, 1.3568649291992188, 1.433057188987732, 1.5092493295669556, 1.5854415893554688, 1.6616337299346924, 1.737825870513916, 1.8140181303024292, 1.8902102708816528, 1.9664024114608765, 2.0425946712493896, 2.1187868118286133, 2.194978952407837, 2.2711713314056396, 2.3473634719848633, 2.423555612564087, 2.4997477531433105, 2.575939893722534, 2.652132034301758, 2.7283244132995605, 2.804516553878784, 2.880708694458008, 2.9569008350372314, 3.033092975616455, 3.109285354614258]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 7.0, 2.0, 6.0, 4.0, 3.0, 14.0, 14.0, 7.0, 14.0, 20.0, 18.0, 24.0, 17.0, 25.0, 32.0, 30.0, 25.0, 23.0, 32.0, 27.0, 37.0, 31.0, 34.0, 34.0, 37.0, 45.0, 41.0, 46.0, 38.0, 30.0, 38.0, 26.0, 30.0, 30.0, 33.0, 20.0, 25.0, 7.0, 14.0, 10.0, 8.0, 9.0, 13.0, 7.0, 4.0, 2.0, 4.0, 2.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5279091596603394, -1.47730553150177, -1.4267017841339111, -1.3760981559753418, -1.3254945278167725, -1.2748908996582031, -1.2242872714996338, -1.173683524131775, -1.1230798959732056, -1.0724762678146362, -1.0218725204467773, -0.971268892288208, -0.9206652641296387, -0.8700616359710693, -0.8194579482078552, -0.7688542604446411, -0.7182506322860718, -0.6676470041275024, -0.6170433163642883, -0.5664396286010742, -0.5158360004425049, -0.46523234248161316, -0.41462868452072144, -0.3640250265598297, -0.313421368598938, -0.26281771063804626, -0.21221405267715454, -0.16161039471626282, -0.1110067367553711, -0.06040307879447937, -0.009799420833587646, 0.04080423712730408, 0.0914078950881958, 0.14201155304908752, 0.19261521100997925, 0.24321886897087097, 0.2938225269317627, 0.3444261848926544, 0.39502984285354614, 0.44563350081443787, 0.4962371587753296, 0.5468407869338989, 0.597444474697113, 0.6480481624603271, 0.6986517906188965, 0.7492554187774658, 0.7998591065406799, 0.850462794303894, 0.9010664224624634, 0.9516700506210327, 1.0022737979888916, 1.052877426147461, 1.1034810543060303, 1.1540846824645996, 1.204688310623169, 1.2552920579910278, 1.3058956861495972, 1.3564993143081665, 1.4071030616760254, 1.4577066898345947, 1.508310317993164, 1.5589139461517334, 1.6095175743103027, 1.6601213216781616, 1.710724949836731]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 3.0, 12.0, 13.0, 10.0, 29.0, 40.0, 53.0, 84.0, 116.0, 137.0, 255.0, 324.0, 482.0, 702.0, 1047.0, 1517.0, 2222.0, 3330.0, 5256.0, 8038.0, 13064.0, 21352.0, 36770.0, 67464.0, 128173.0, 227680.0, 231489.0, 131781.0, 69539.0, 38078.0, 22066.0, 13392.0, 8287.0, 5272.0, 3366.0, 2265.0, 1509.0, 997.0, 691.0, 495.0, 345.0, 247.0, 162.0, 121.0, 85.0, 59.0, 38.0, 36.0, 25.0, 9.0, 12.0, 5.0, 4.0, 1.0, 6.0, 4.0, 1.0, 2.0], "bins": [-0.331298828125, -0.320953369140625, -0.31060791015625, -0.300262451171875, -0.2899169921875, -0.279571533203125, -0.26922607421875, -0.258880615234375, -0.24853515625, -0.238189697265625, -0.22784423828125, -0.217498779296875, -0.2071533203125, -0.196807861328125, -0.18646240234375, -0.176116943359375, -0.165771484375, -0.155426025390625, -0.14508056640625, -0.134735107421875, -0.1243896484375, -0.114044189453125, -0.10369873046875, -0.093353271484375, -0.0830078125, -0.072662353515625, -0.06231689453125, -0.051971435546875, -0.0416259765625, -0.031280517578125, -0.02093505859375, -0.010589599609375, -0.000244140625, 0.010101318359375, 0.02044677734375, 0.030792236328125, 0.0411376953125, 0.051483154296875, 0.06182861328125, 0.072174072265625, 0.08251953125, 0.092864990234375, 0.10321044921875, 0.113555908203125, 0.1239013671875, 0.134246826171875, 0.14459228515625, 0.154937744140625, 0.165283203125, 0.175628662109375, 0.18597412109375, 0.196319580078125, 0.2066650390625, 0.217010498046875, 0.22735595703125, 0.237701416015625, 0.248046875, 0.258392333984375, 0.26873779296875, 0.279083251953125, 0.2894287109375, 0.299774169921875, 0.31011962890625, 0.320465087890625, 0.330810546875]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 7.0, 3.0, 5.0, 11.0, 16.0, 8.0, 13.0, 19.0, 19.0, 20.0, 23.0, 24.0, 30.0, 26.0, 31.0, 22.0, 30.0, 29.0, 32.0, 36.0, 34.0, 34.0, 33.0, 52.0, 39.0, 42.0, 39.0, 32.0, 38.0, 28.0, 32.0, 30.0, 26.0, 24.0, 25.0, 7.0, 14.0, 11.0, 8.0, 8.0, 12.0, 6.0, 5.0, 1.0, 5.0, 2.0, 7.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.455078125, -1.407012939453125, -1.35894775390625, -1.310882568359375, -1.2628173828125, -1.214752197265625, -1.16668701171875, -1.118621826171875, -1.070556640625, -1.022491455078125, -0.97442626953125, -0.926361083984375, -0.8782958984375, -0.830230712890625, -0.78216552734375, -0.734100341796875, -0.68603515625, -0.637969970703125, -0.58990478515625, -0.541839599609375, -0.4937744140625, -0.445709228515625, -0.39764404296875, -0.349578857421875, -0.301513671875, -0.253448486328125, -0.20538330078125, -0.157318115234375, -0.1092529296875, -0.061187744140625, -0.01312255859375, 0.034942626953125, 0.0830078125, 0.131072998046875, 0.17913818359375, 0.227203369140625, 0.2752685546875, 0.323333740234375, 0.37139892578125, 0.419464111328125, 0.467529296875, 0.515594482421875, 0.56365966796875, 0.611724853515625, 0.6597900390625, 0.707855224609375, 0.75592041015625, 0.803985595703125, 0.85205078125, 0.900115966796875, 0.94818115234375, 0.996246337890625, 1.0443115234375, 1.092376708984375, 1.14044189453125, 1.188507080078125, 1.236572265625, 1.284637451171875, 1.33270263671875, 1.380767822265625, 1.4288330078125, 1.476898193359375, 1.52496337890625, 1.573028564453125, 1.62109375]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 2.0, 8.0, 6.0, 10.0, 11.0, 25.0, 26.0, 41.0, 41.0, 48.0, 86.0, 69.0, 110.0, 157.0, 214.0, 299.0, 365.0, 571.0, 923.0, 1452.0, 2717.0, 5746.0, 14579.0, 52099.0, 909297.0, 37063.0, 11525.0, 4667.0, 2325.0, 1361.0, 787.0, 508.0, 351.0, 259.0, 196.0, 136.0, 126.0, 61.0, 67.0, 55.0, 44.0, 30.0, 29.0, 12.0, 13.0, 10.0, 7.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.89501953125, -0.8665008544921875, -0.837982177734375, -0.8094635009765625, -0.78094482421875, -0.7524261474609375, -0.723907470703125, -0.6953887939453125, -0.6668701171875, -0.6383514404296875, -0.609832763671875, -0.5813140869140625, -0.55279541015625, -0.5242767333984375, -0.495758056640625, -0.4672393798828125, -0.438720703125, -0.4102020263671875, -0.381683349609375, -0.3531646728515625, -0.32464599609375, -0.2961273193359375, -0.267608642578125, -0.2390899658203125, -0.2105712890625, -0.1820526123046875, -0.153533935546875, -0.1250152587890625, -0.09649658203125, -0.0679779052734375, -0.039459228515625, -0.0109405517578125, 0.017578125, 0.0460968017578125, 0.074615478515625, 0.1031341552734375, 0.13165283203125, 0.1601715087890625, 0.188690185546875, 0.2172088623046875, 0.2457275390625, 0.2742462158203125, 0.302764892578125, 0.3312835693359375, 0.35980224609375, 0.3883209228515625, 0.416839599609375, 0.4453582763671875, 0.473876953125, 0.5023956298828125, 0.530914306640625, 0.5594329833984375, 0.58795166015625, 0.6164703369140625, 0.644989013671875, 0.6735076904296875, 0.7020263671875, 0.7305450439453125, 0.759063720703125, 0.7875823974609375, 0.81610107421875, 0.8446197509765625, 0.873138427734375, 0.9016571044921875, 0.93017578125]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 11.0, 2.0, 7.0, 4.0, 5.0, 8.0, 13.0, 8.0, 17.0, 21.0, 18.0, 14.0, 29.0, 30.0, 24.0, 23.0, 29.0, 34.0, 42.0, 42.0, 45.0, 42.0, 29.0, 39.0, 37.0, 34.0, 41.0, 31.0, 39.0, 32.0, 29.0, 36.0, 24.0, 17.0, 20.0, 26.0, 21.0, 18.0, 11.0, 11.0, 7.0, 11.0, 3.0, 6.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9267578125, -0.8952178955078125, -0.863677978515625, -0.8321380615234375, -0.80059814453125, -0.7690582275390625, -0.737518310546875, -0.7059783935546875, -0.6744384765625, -0.6428985595703125, -0.611358642578125, -0.5798187255859375, -0.54827880859375, -0.5167388916015625, -0.485198974609375, -0.4536590576171875, -0.422119140625, -0.3905792236328125, -0.359039306640625, -0.3274993896484375, -0.29595947265625, -0.2644195556640625, -0.232879638671875, -0.2013397216796875, -0.1697998046875, -0.1382598876953125, -0.106719970703125, -0.0751800537109375, -0.04364013671875, -0.0121002197265625, 0.019439697265625, 0.0509796142578125, 0.08251953125, 0.1140594482421875, 0.145599365234375, 0.1771392822265625, 0.20867919921875, 0.2402191162109375, 0.271759033203125, 0.3032989501953125, 0.3348388671875, 0.3663787841796875, 0.397918701171875, 0.4294586181640625, 0.46099853515625, 0.4925384521484375, 0.524078369140625, 0.5556182861328125, 0.587158203125, 0.6186981201171875, 0.650238037109375, 0.6817779541015625, 0.71331787109375, 0.7448577880859375, 0.776397705078125, 0.8079376220703125, 0.8394775390625, 0.8710174560546875, 0.902557373046875, 0.9340972900390625, 0.96563720703125, 0.9971771240234375, 1.028717041015625, 1.0602569580078125, 1.091796875]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 6.0, 16.0, 17.0, 21.0, 34.0, 45.0, 53.0, 78.0, 111.0, 233.0, 271.0, 437.0, 797.0, 1433.0, 2808.0, 6878.0, 23582.0, 942065.0, 50176.0, 10979.0, 4035.0, 1879.0, 942.0, 536.0, 343.0, 253.0, 150.0, 101.0, 81.0, 47.0, 33.0, 34.0, 21.0, 11.0, 13.0, 8.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1265869140625, -0.12246513366699219, -0.11834335327148438, -0.11422157287597656, -0.11009979248046875, -0.10597801208496094, -0.10185623168945312, -0.09773445129394531, -0.0936126708984375, -0.08949089050292969, -0.08536911010742188, -0.08124732971191406, -0.07712554931640625, -0.07300376892089844, -0.06888198852539062, -0.06476020812988281, -0.060638427734375, -0.05651664733886719, -0.052394866943359375, -0.04827308654785156, -0.04415130615234375, -0.04002952575683594, -0.035907745361328125, -0.03178596496582031, -0.0276641845703125, -0.023542404174804688, -0.019420623779296875, -0.015298843383789062, -0.01117706298828125, -0.0070552825927734375, -0.002933502197265625, 0.0011882781982421875, 0.00531005859375, 0.009431838989257812, 0.013553619384765625, 0.017675399780273438, 0.02179718017578125, 0.025918960571289062, 0.030040740966796875, 0.03416252136230469, 0.0382843017578125, 0.04240608215332031, 0.046527862548828125, 0.05064964294433594, 0.05477142333984375, 0.05889320373535156, 0.06301498413085938, 0.06713676452636719, 0.071258544921875, 0.07538032531738281, 0.07950210571289062, 0.08362388610839844, 0.08774566650390625, 0.09186744689941406, 0.09598922729492188, 0.10011100769042969, 0.1042327880859375, 0.10835456848144531, 0.11247634887695312, 0.11659812927246094, 0.12071990966796875, 0.12484169006347656, 0.12896347045898438, 0.1330852508544922, 0.13720703125]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 2.0, 2.0, 5.0, 7.0, 10.0, 16.0, 15.0, 21.0, 37.0, 35.0, 46.0, 59.0, 63.0, 71.0, 74.0, 74.0, 81.0, 65.0, 65.0, 61.0, 41.0, 33.0, 25.0, 27.0, 23.0, 11.0, 8.0, 9.0, 5.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7816505432128906e-05, -5.5934302508831024e-05, -5.405209958553314e-05, -5.216989666223526e-05, -5.028769373893738e-05, -4.8405490815639496e-05, -4.6523287892341614e-05, -4.464108496904373e-05, -4.275888204574585e-05, -4.087667912244797e-05, -3.8994476199150085e-05, -3.71122732758522e-05, -3.523007035255432e-05, -3.334786742925644e-05, -3.146566450595856e-05, -2.9583461582660675e-05, -2.7701258659362793e-05, -2.581905573606491e-05, -2.393685281276703e-05, -2.2054649889469147e-05, -2.0172446966171265e-05, -1.8290244042873383e-05, -1.64080411195755e-05, -1.4525838196277618e-05, -1.2643635272979736e-05, -1.0761432349681854e-05, -8.879229426383972e-06, -6.99702650308609e-06, -5.114823579788208e-06, -3.232620656490326e-06, -1.3504177331924438e-06, 5.317851901054382e-07, 2.4139881134033203e-06, 4.296191036701202e-06, 6.1783939599990845e-06, 8.060596883296967e-06, 9.942799806594849e-06, 1.182500272989273e-05, 1.3707205653190613e-05, 1.5589408576488495e-05, 1.7471611499786377e-05, 1.935381442308426e-05, 2.123601734638214e-05, 2.3118220269680023e-05, 2.5000423192977905e-05, 2.6882626116275787e-05, 2.876482903957367e-05, 3.064703196287155e-05, 3.2529234886169434e-05, 3.4411437809467316e-05, 3.62936407327652e-05, 3.817584365606308e-05, 4.005804657936096e-05, 4.1940249502658844e-05, 4.3822452425956726e-05, 4.570465534925461e-05, 4.758685827255249e-05, 4.946906119585037e-05, 5.1351264119148254e-05, 5.3233467042446136e-05, 5.511566996574402e-05, 5.69978728890419e-05, 5.888007581233978e-05, 6.0762278735637665e-05, 6.264448165893555e-05]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 1.0, 3.0, 7.0, 9.0, 10.0, 9.0, 11.0, 16.0, 15.0, 20.0, 33.0, 28.0, 46.0, 72.0, 107.0, 259.0, 2373.0, 92060.0, 931297.0, 20798.0, 848.0, 164.0, 96.0, 57.0, 44.0, 32.0, 25.0, 27.0, 13.0, 16.0, 6.0, 4.0, 15.0, 4.0, 5.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.262451171875, -0.2540702819824219, -0.24568939208984375, -0.23730850219726562, -0.2289276123046875, -0.22054672241210938, -0.21216583251953125, -0.20378494262695312, -0.195404052734375, -0.18702316284179688, -0.17864227294921875, -0.17026138305664062, -0.1618804931640625, -0.15349960327148438, -0.14511871337890625, -0.13673782348632812, -0.12835693359375, -0.11997604370117188, -0.11159515380859375, -0.10321426391601562, -0.0948333740234375, -0.08645248413085938, -0.07807159423828125, -0.06969070434570312, -0.061309814453125, -0.052928924560546875, -0.04454803466796875, -0.036167144775390625, -0.0277862548828125, -0.019405364990234375, -0.01102447509765625, -0.002643585205078125, 0.0057373046875, 0.014118194580078125, 0.02249908447265625, 0.030879974365234375, 0.0392608642578125, 0.047641754150390625, 0.05602264404296875, 0.06440353393554688, 0.072784423828125, 0.08116531372070312, 0.08954620361328125, 0.09792709350585938, 0.1063079833984375, 0.11468887329101562, 0.12306976318359375, 0.13145065307617188, 0.13983154296875, 0.14821243286132812, 0.15659332275390625, 0.16497421264648438, 0.1733551025390625, 0.18173599243164062, 0.19011688232421875, 0.19849777221679688, 0.206878662109375, 0.21525955200195312, 0.22364044189453125, 0.23202133178710938, 0.2404022216796875, 0.24878311157226562, 0.25716400146484375, 0.2655448913574219, 0.27392578125]}, "gradients/decoder.roberta.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 8.0, 3.0, 9.0, 8.0, 4.0, 9.0, 16.0, 9.0, 19.0, 13.0, 18.0, 28.0, 29.0, 44.0, 43.0, 60.0, 110.0, 135.0, 127.0, 68.0, 48.0, 37.0, 25.0, 20.0, 18.0, 17.0, 12.0, 8.0, 11.0, 5.0, 7.0, 3.0, 10.0, 4.0, 1.0, 6.0, 3.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0134735107421875, -0.013061165809631348, -0.012648820877075195, -0.012236475944519043, -0.01182413101196289, -0.011411786079406738, -0.010999441146850586, -0.010587096214294434, -0.010174751281738281, -0.009762406349182129, -0.009350061416625977, -0.008937716484069824, -0.008525371551513672, -0.00811302661895752, -0.007700681686401367, -0.007288336753845215, -0.0068759918212890625, -0.00646364688873291, -0.006051301956176758, -0.0056389570236206055, -0.005226612091064453, -0.004814267158508301, -0.0044019222259521484, -0.003989577293395996, -0.0035772323608398438, -0.0031648874282836914, -0.002752542495727539, -0.0023401975631713867, -0.0019278526306152344, -0.001515507698059082, -0.0011031627655029297, -0.0006908178329467773, -0.000278472900390625, 0.00013387203216552734, 0.0005462169647216797, 0.000958561897277832, 0.0013709068298339844, 0.0017832517623901367, 0.002195596694946289, 0.0026079416275024414, 0.0030202865600585938, 0.003432631492614746, 0.0038449764251708984, 0.004257321357727051, 0.004669666290283203, 0.0050820112228393555, 0.005494356155395508, 0.00590670108795166, 0.0063190460205078125, 0.006731390953063965, 0.007143735885620117, 0.0075560808181762695, 0.007968425750732422, 0.008380770683288574, 0.008793115615844727, 0.009205460548400879, 0.009617805480957031, 0.010030150413513184, 0.010442495346069336, 0.010854840278625488, 0.01126718521118164, 0.011679530143737793, 0.012091875076293945, 0.012504220008850098, 0.01291656494140625]}, "gradients/decoder.roberta.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 9.0, 21.0, 35.0, 32.0, 47.0, 48.0, 78.0, 81.0, 93.0, 92.0, 98.0, 92.0, 72.0, 64.0, 40.0, 24.0, 33.0, 17.0, 11.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6715704202651978, -1.5893990993499756, -1.5072277784347534, -1.4250564575195312, -1.3428850173950195, -1.2607136964797974, -1.1785423755645752, -1.0963709354400635, -1.0141997337341309, -0.9320284128189087, -0.8498570322990417, -0.7676857113838196, -0.6855143308639526, -0.6033430099487305, -0.5211716890335083, -0.43900030851364136, -0.3568289279937744, -0.27465757727622986, -0.1924862414598465, -0.11031490564346313, -0.02814355492591858, 0.05402779579162598, 0.13619911670684814, 0.2183704972267151, 0.30054181814193726, 0.3827131688594818, 0.46488451957702637, 0.5470558404922485, 0.6292271614074707, 0.7113985419273376, 0.7935698628425598, 0.8757412433624268, 0.9579124450683594, 1.0400837659835815, 1.1222550868988037, 1.2044265270233154, 1.2865978479385376, 1.3687691688537598, 1.450940489768982, 1.533111810684204, 1.6152832508087158, 1.697454571723938, 1.7796258926391602, 1.8617973327636719, 1.943968653678894, 2.026139974594116, 2.108311176300049, 2.1904826164245605, 2.2726540565490723, 2.354825496673584, 2.4369966983795166, 2.5191681385040283, 2.601339340209961, 2.6835107803344727, 2.7656822204589844, 2.847853422164917, 2.9300246238708496, 3.0121960639953613, 3.094367265701294, 3.1765387058258057, 3.2587099075317383, 3.34088134765625, 3.4230527877807617, 3.5052239894866943, 3.587395429611206]}, "gradients/decoder.roberta.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 7.0, 3.0, 4.0, 11.0, 13.0, 12.0, 13.0, 19.0, 18.0, 21.0, 20.0, 25.0, 32.0, 26.0, 29.0, 23.0, 29.0, 28.0, 32.0, 37.0, 33.0, 36.0, 31.0, 52.0, 41.0, 41.0, 36.0, 36.0, 36.0, 28.0, 29.0, 37.0, 24.0, 23.0, 26.0, 7.0, 14.0, 10.0, 8.0, 10.0, 11.0, 7.0, 5.0, 1.0, 5.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.4577996730804443, -1.409749984741211, -1.3617002964019775, -1.3136504888534546, -1.2656008005142212, -1.2175511121749878, -1.1695013046264648, -1.1214516162872314, -1.073401927947998, -1.0253522396087646, -0.9773024916648865, -0.9292527437210083, -0.8812030553817749, -0.8331533670425415, -0.7851036190986633, -0.7370538711547852, -0.6890041828155518, -0.6409544944763184, -0.5929047465324402, -0.544854998588562, -0.4968053102493286, -0.4487555921077728, -0.40070587396621704, -0.35265615582466125, -0.30460643768310547, -0.2565567195415497, -0.2085070013999939, -0.1604572832584381, -0.11240756511688232, -0.06435784697532654, -0.016308128833770752, 0.031741589307785034, 0.07979130744934082, 0.1278410255908966, 0.1758907437324524, 0.22394046187400818, 0.27199018001556396, 0.32003989815711975, 0.36808961629867554, 0.4161393344402313, 0.4641890525817871, 0.5122387409210205, 0.5602884888648987, 0.6083382368087769, 0.6563879251480103, 0.7044376134872437, 0.7524873614311218, 0.800537109375, 0.8485867977142334, 0.8966364860534668, 0.944686233997345, 0.9927359819412231, 1.0407856702804565, 1.08883535861969, 1.136885166168213, 1.1849348545074463, 1.2329845428466797, 1.281034231185913, 1.3290839195251465, 1.3771337270736694, 1.4251834154129028, 1.4732331037521362, 1.5212829113006592, 1.5693325996398926, 1.617382287979126]}, "gradients/decoder.roberta.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 7.0, 14.0, 12.0, 13.0, 16.0, 18.0, 35.0, 63.0, 66.0, 114.0, 178.0, 302.0, 481.0, 855.0, 1567.0, 2956.0, 5858.0, 11942.0, 24499.0, 52173.0, 105405.0, 181280.0, 229904.0, 194959.0, 118683.0, 60500.0, 28812.0, 13676.0, 6609.0, 3352.0, 1780.0, 914.0, 527.0, 339.0, 204.0, 134.0, 95.0, 63.0, 46.0, 25.0, 18.0, 13.0, 13.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.484375, -2.412567138671875, -2.34075927734375, -2.268951416015625, -2.1971435546875, -2.125335693359375, -2.05352783203125, -1.981719970703125, -1.909912109375, -1.838104248046875, -1.76629638671875, -1.694488525390625, -1.6226806640625, -1.550872802734375, -1.47906494140625, -1.407257080078125, -1.33544921875, -1.263641357421875, -1.19183349609375, -1.120025634765625, -1.0482177734375, -0.976409912109375, -0.90460205078125, -0.832794189453125, -0.760986328125, -0.689178466796875, -0.61737060546875, -0.545562744140625, -0.4737548828125, -0.401947021484375, -0.33013916015625, -0.258331298828125, -0.1865234375, -0.114715576171875, -0.04290771484375, 0.028900146484375, 0.1007080078125, 0.172515869140625, 0.24432373046875, 0.316131591796875, 0.387939453125, 0.459747314453125, 0.53155517578125, 0.603363037109375, 0.6751708984375, 0.746978759765625, 0.81878662109375, 0.890594482421875, 0.96240234375, 1.034210205078125, 1.10601806640625, 1.177825927734375, 1.2496337890625, 1.321441650390625, 1.39324951171875, 1.465057373046875, 1.536865234375, 1.608673095703125, 1.68048095703125, 1.752288818359375, 1.8240966796875, 1.895904541015625, 1.96771240234375, 2.039520263671875, 2.111328125]}, "gradients/decoder.roberta.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 11.0, 8.0, 18.0, 13.0, 12.0, 24.0, 26.0, 25.0, 23.0, 27.0, 27.0, 29.0, 29.0, 32.0, 34.0, 33.0, 32.0, 37.0, 35.0, 42.0, 38.0, 42.0, 47.0, 36.0, 26.0, 43.0, 36.0, 27.0, 27.0, 26.0, 23.0, 15.0, 8.0, 7.0, 17.0, 7.0, 8.0, 7.0, 3.0, 3.0, 7.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.173828125, -1.1354522705078125, -1.097076416015625, -1.0587005615234375, -1.02032470703125, -0.9819488525390625, -0.943572998046875, -0.9051971435546875, -0.8668212890625, -0.8284454345703125, -0.790069580078125, -0.7516937255859375, -0.71331787109375, -0.6749420166015625, -0.636566162109375, -0.5981903076171875, -0.559814453125, -0.5214385986328125, -0.483062744140625, -0.4446868896484375, -0.40631103515625, -0.3679351806640625, -0.329559326171875, -0.2911834716796875, -0.2528076171875, -0.2144317626953125, -0.176055908203125, -0.1376800537109375, -0.09930419921875, -0.0609283447265625, -0.022552490234375, 0.0158233642578125, 0.05419921875, 0.0925750732421875, 0.130950927734375, 0.1693267822265625, 0.20770263671875, 0.2460784912109375, 0.284454345703125, 0.3228302001953125, 0.3612060546875, 0.3995819091796875, 0.437957763671875, 0.4763336181640625, 0.51470947265625, 0.5530853271484375, 0.591461181640625, 0.6298370361328125, 0.668212890625, 0.7065887451171875, 0.744964599609375, 0.7833404541015625, 0.82171630859375, 0.8600921630859375, 0.898468017578125, 0.9368438720703125, 0.9752197265625, 1.0135955810546875, 1.051971435546875, 1.0903472900390625, 1.12872314453125, 1.1670989990234375, 1.205474853515625, 1.2438507080078125, 1.2822265625]}, "gradients/decoder.roberta.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 9.0, 17.0, 33.0, 26.0, 43.0, 55.0, 78.0, 114.0, 169.0, 259.0, 461.0, 804.0, 1736.0, 6735.0, 65592.0, 580487.0, 356092.0, 28870.0, 3830.0, 1275.0, 670.0, 444.0, 238.0, 157.0, 110.0, 48.0, 55.0, 48.0, 27.0, 23.0, 18.0, 9.0, 5.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.1396484375, -6.900390625, -6.6611328125, -6.421875, -6.1826171875, -5.943359375, -5.7041015625, -5.46484375, -5.2255859375, -4.986328125, -4.7470703125, -4.5078125, -4.2685546875, -4.029296875, -3.7900390625, -3.55078125, -3.3115234375, -3.072265625, -2.8330078125, -2.59375, -2.3544921875, -2.115234375, -1.8759765625, -1.63671875, -1.3974609375, -1.158203125, -0.9189453125, -0.6796875, -0.4404296875, -0.201171875, 0.0380859375, 0.27734375, 0.5166015625, 0.755859375, 0.9951171875, 1.234375, 1.4736328125, 1.712890625, 1.9521484375, 2.19140625, 2.4306640625, 2.669921875, 2.9091796875, 3.1484375, 3.3876953125, 3.626953125, 3.8662109375, 4.10546875, 4.3447265625, 4.583984375, 4.8232421875, 5.0625, 5.3017578125, 5.541015625, 5.7802734375, 6.01953125, 6.2587890625, 6.498046875, 6.7373046875, 6.9765625, 7.2158203125, 7.455078125, 7.6943359375, 7.93359375]}, "gradients/decoder.roberta.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 6.0, 9.0, 12.0, 15.0, 6.0, 16.0, 20.0, 29.0, 29.0, 40.0, 35.0, 42.0, 43.0, 50.0, 48.0, 42.0, 45.0, 42.0, 54.0, 42.0, 38.0, 54.0, 50.0, 48.0, 20.0, 25.0, 23.0, 22.0, 18.0, 22.0, 11.0, 8.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.080078125, -1.036529541015625, -0.99298095703125, -0.949432373046875, -0.9058837890625, -0.862335205078125, -0.81878662109375, -0.775238037109375, -0.731689453125, -0.688140869140625, -0.64459228515625, -0.601043701171875, -0.5574951171875, -0.513946533203125, -0.47039794921875, -0.426849365234375, -0.38330078125, -0.339752197265625, -0.29620361328125, -0.252655029296875, -0.2091064453125, -0.165557861328125, -0.12200927734375, -0.078460693359375, -0.034912109375, 0.008636474609375, 0.05218505859375, 0.095733642578125, 0.1392822265625, 0.182830810546875, 0.22637939453125, 0.269927978515625, 0.3134765625, 0.357025146484375, 0.40057373046875, 0.444122314453125, 0.4876708984375, 0.531219482421875, 0.57476806640625, 0.618316650390625, 0.661865234375, 0.705413818359375, 0.74896240234375, 0.792510986328125, 0.8360595703125, 0.879608154296875, 0.92315673828125, 0.966705322265625, 1.01025390625, 1.053802490234375, 1.09735107421875, 1.140899658203125, 1.1844482421875, 1.227996826171875, 1.27154541015625, 1.315093994140625, 1.358642578125, 1.402191162109375, 1.44573974609375, 1.489288330078125, 1.5328369140625, 1.576385498046875, 1.61993408203125, 1.663482666015625, 1.70703125]}, "gradients/decoder.roberta.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 9.0, 6.0, 12.0, 14.0, 16.0, 30.0, 52.0, 66.0, 97.0, 156.0, 267.0, 470.0, 891.0, 2195.0, 7147.0, 35919.0, 192777.0, 469044.0, 268373.0, 55371.0, 10316.0, 2825.0, 1101.0, 567.0, 294.0, 181.0, 110.0, 72.0, 57.0, 36.0, 26.0, 12.0, 10.0, 10.0, 6.0, 6.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76171875, -2.67706298828125, -2.5924072265625, -2.50775146484375, -2.423095703125, -2.33843994140625, -2.2537841796875, -2.16912841796875, -2.08447265625, -1.99981689453125, -1.9151611328125, -1.83050537109375, -1.745849609375, -1.66119384765625, -1.5765380859375, -1.49188232421875, -1.4072265625, -1.32257080078125, -1.2379150390625, -1.15325927734375, -1.068603515625, -0.98394775390625, -0.8992919921875, -0.81463623046875, -0.72998046875, -0.64532470703125, -0.5606689453125, -0.47601318359375, -0.391357421875, -0.30670166015625, -0.2220458984375, -0.13739013671875, -0.052734375, 0.03192138671875, 0.1165771484375, 0.20123291015625, 0.285888671875, 0.37054443359375, 0.4552001953125, 0.53985595703125, 0.62451171875, 0.70916748046875, 0.7938232421875, 0.87847900390625, 0.963134765625, 1.04779052734375, 1.1324462890625, 1.21710205078125, 1.3017578125, 1.38641357421875, 1.4710693359375, 1.55572509765625, 1.640380859375, 1.72503662109375, 1.8096923828125, 1.89434814453125, 1.97900390625, 2.06365966796875, 2.1483154296875, 2.23297119140625, 2.317626953125, 2.40228271484375, 2.4869384765625, 2.57159423828125, 2.65625]}, "gradients/decoder.roberta.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 9.0, 4.0, 11.0, 11.0, 29.0, 35.0, 47.0, 56.0, 68.0, 112.0, 106.0, 115.0, 96.0, 77.0, 74.0, 56.0, 40.0, 26.0, 20.0, 10.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013196468353271484, -0.000124247744679451, -0.00011653080582618713, -0.00010881386697292328, -0.00010109692811965942, -9.337998926639557e-05, -8.566305041313171e-05, -7.794611155986786e-05, -7.0229172706604e-05, -6.251223385334015e-05, -5.4795295000076294e-05, -4.707835614681244e-05, -3.9361417293548584e-05, -3.164447844028473e-05, -2.3927539587020874e-05, -1.621060073375702e-05, -8.493661880493164e-06, -7.767230272293091e-07, 6.940215826034546e-06, 1.4657154679298401e-05, 2.2374093532562256e-05, 3.009103238582611e-05, 3.7807971239089966e-05, 4.552491009235382e-05, 5.3241848945617676e-05, 6.095878779888153e-05, 6.867572665214539e-05, 7.639266550540924e-05, 8.41096043586731e-05, 9.182654321193695e-05, 9.95434820652008e-05, 0.00010726042091846466, 0.00011497735977172852, 0.00012269429862499237, 0.00013041123747825623, 0.00013812817633152008, 0.00014584511518478394, 0.0001535620540380478, 0.00016127899289131165, 0.0001689959317445755, 0.00017671287059783936, 0.0001844298094511032, 0.00019214674830436707, 0.00019986368715763092, 0.00020758062601089478, 0.00021529756486415863, 0.00022301450371742249, 0.00023073144257068634, 0.0002384483814239502, 0.00024616532027721405, 0.0002538822591304779, 0.00026159919798374176, 0.0002693161368370056, 0.00027703307569026947, 0.0002847500145435333, 0.0002924669533967972, 0.00030018389225006104, 0.0003079008311033249, 0.00031561776995658875, 0.0003233347088098526, 0.00033105164766311646, 0.0003387685865163803, 0.00034648552536964417, 0.000354202464222908, 0.0003619194030761719]}, "gradients/decoder.roberta.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 14.0, 16.0, 27.0, 41.0, 63.0, 134.0, 240.0, 520.0, 1864.0, 9544.0, 72119.0, 416316.0, 448998.0, 84421.0, 11029.0, 2045.0, 590.0, 242.0, 122.0, 85.0, 48.0, 32.0, 16.0, 12.0, 7.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.2545166015625, -3.149658203125, -3.0447998046875, -2.93994140625, -2.8350830078125, -2.730224609375, -2.6253662109375, -2.5205078125, -2.4156494140625, -2.310791015625, -2.2059326171875, -2.10107421875, -1.9962158203125, -1.891357421875, -1.7864990234375, -1.681640625, -1.5767822265625, -1.471923828125, -1.3670654296875, -1.26220703125, -1.1573486328125, -1.052490234375, -0.9476318359375, -0.8427734375, -0.7379150390625, -0.633056640625, -0.5281982421875, -0.42333984375, -0.3184814453125, -0.213623046875, -0.1087646484375, -0.00390625, 0.1009521484375, 0.205810546875, 0.3106689453125, 0.41552734375, 0.5203857421875, 0.625244140625, 0.7301025390625, 0.8349609375, 0.9398193359375, 1.044677734375, 1.1495361328125, 1.25439453125, 1.3592529296875, 1.464111328125, 1.5689697265625, 1.673828125, 1.7786865234375, 1.883544921875, 1.9884033203125, 2.09326171875, 2.1981201171875, 2.302978515625, 2.4078369140625, 2.5126953125, 2.6175537109375, 2.722412109375, 2.8272705078125, 2.93212890625, 3.0369873046875, 3.141845703125, 3.2467041015625, 3.3515625]}, "gradients/decoder.roberta.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 5.0, 11.0, 8.0, 16.0, 20.0, 20.0, 38.0, 41.0, 83.0, 76.0, 90.0, 101.0, 97.0, 102.0, 76.0, 69.0, 39.0, 31.0, 29.0, 13.0, 13.0, 6.0, 6.0, 7.0, 2.0, 4.0, 3.0, 3.0, 3.0], "bins": [-1.0234375, -1.0017013549804688, -0.9799652099609375, -0.9582290649414062, -0.936492919921875, -0.9147567749023438, -0.8930206298828125, -0.8712844848632812, -0.84954833984375, -0.8278121948242188, -0.8060760498046875, -0.7843399047851562, -0.762603759765625, -0.7408676147460938, -0.7191314697265625, -0.6973953247070312, -0.6756591796875, -0.6539230346679688, -0.6321868896484375, -0.6104507446289062, -0.588714599609375, -0.5669784545898438, -0.5452423095703125, -0.5235061645507812, -0.50177001953125, -0.48003387451171875, -0.4582977294921875, -0.43656158447265625, -0.414825439453125, -0.39308929443359375, -0.3713531494140625, -0.34961700439453125, -0.327880859375, -0.30614471435546875, -0.2844085693359375, -0.26267242431640625, -0.240936279296875, -0.21920013427734375, -0.1974639892578125, -0.17572784423828125, -0.15399169921875, -0.13225555419921875, -0.1105194091796875, -0.08878326416015625, -0.067047119140625, -0.04531097412109375, -0.0235748291015625, -0.00183868408203125, 0.0198974609375, 0.04163360595703125, 0.0633697509765625, 0.08510589599609375, 0.106842041015625, 0.12857818603515625, 0.1503143310546875, 0.17205047607421875, 0.19378662109375, 0.21552276611328125, 0.2372589111328125, 0.25899505615234375, 0.280731201171875, 0.30246734619140625, 0.3242034912109375, 0.34593963623046875, 0.36767578125]}, "gradients/decoder.roberta.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 3.0, 6.0, 7.0, 13.0, 9.0, 15.0, 11.0, 26.0, 39.0, 33.0, 45.0, 33.0, 39.0, 49.0, 56.0, 66.0, 59.0, 46.0, 80.0, 66.0, 50.0, 53.0, 45.0, 45.0, 24.0, 15.0, 18.0, 10.0, 10.0, 7.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6365050077438354, -1.567031741142273, -1.4975584745407104, -1.428085207939148, -1.358612060546875, -1.2891387939453125, -1.21966552734375, -1.1501922607421875, -1.080718994140625, -1.0112457275390625, -0.9417724609375, -0.8722992539405823, -0.8028259873390198, -0.7333527207374573, -0.6638795137405396, -0.594406247138977, -0.5249329805374146, -0.45545971393585205, -0.38598647713661194, -0.3165132403373718, -0.24703997373580933, -0.17756670713424683, -0.10809347033500671, -0.0386202335357666, 0.0308530330657959, 0.1003262847661972, 0.1697995364665985, 0.23927278816699982, 0.3087460398674011, 0.3782193064689636, 0.44769254326820374, 0.5171657800674438, 0.5866389274597168, 0.6561121940612793, 0.7255854606628418, 0.7950586676597595, 0.864531934261322, 0.9340052008628845, 1.0034784078598022, 1.0729516744613647, 1.1424249410629272, 1.2118982076644897, 1.2813714742660522, 1.3508447408676147, 1.4203178882598877, 1.4897911548614502, 1.5592644214630127, 1.6287376880645752, 1.6982109546661377, 1.7676842212677002, 1.8371574878692627, 1.9066307544708252, 1.9761040210723877, 2.04557728767395, 2.1150505542755127, 2.184523582458496, 2.2539968490600586, 2.323470115661621, 2.3929433822631836, 2.462416648864746, 2.5318899154663086, 2.601363182067871, 2.6708364486694336, 2.740309715270996, 2.8097829818725586]}, "gradients/decoder.roberta.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 11.0, 10.0, 8.0, 11.0, 12.0, 17.0, 17.0, 9.0, 25.0, 30.0, 25.0, 34.0, 44.0, 39.0, 49.0, 46.0, 39.0, 41.0, 43.0, 43.0, 51.0, 42.0, 41.0, 40.0, 32.0, 29.0, 37.0, 27.0, 26.0, 24.0, 20.0, 13.0, 12.0, 7.0, 8.0, 5.0, 9.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.2844350337982178, -2.2140026092529297, -2.1435701847076416, -2.0731377601623535, -2.0027053356170654, -1.9322729110717773, -1.8618406057357788, -1.7914081811904907, -1.7209757566452026, -1.6505433320999146, -1.5801109075546265, -1.5096784830093384, -1.4392461776733398, -1.3688137531280518, -1.2983813285827637, -1.2279489040374756, -1.1575164794921875, -1.0870840549468994, -1.0166516304016113, -0.946219265460968, -0.8757868409156799, -0.8053544163703918, -0.7349220514297485, -0.6644896268844604, -0.5940572023391724, -0.5236247777938843, -0.4531923830509186, -0.3827599883079529, -0.3123275637626648, -0.2418951392173767, -0.171462744474411, -0.10103034973144531, -0.030598163604736328, 0.039834246039390564, 0.11026665568351746, 0.18069906532764435, 0.25113147497177124, 0.3215638995170593, 0.391996294260025, 0.4624286890029907, 0.5328611135482788, 0.6032935380935669, 0.673725962638855, 0.7441583275794983, 0.8145907521247864, 0.8850231766700745, 0.9554555416107178, 1.0258879661560059, 1.096320390701294, 1.166752815246582, 1.2371852397918701, 1.3076176643371582, 1.3780500888824463, 1.4484825134277344, 1.518914818763733, 1.589347243309021, 1.659779667854309, 1.7302120923995972, 1.8006445169448853, 1.8710769414901733, 1.9415092468261719, 2.01194167137146, 2.082374095916748, 2.152806520462036, 2.223238945007324]}, "gradients/decoder.roberta.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 3.0, 5.0, 0.0, 3.0, 7.0, 4.0, 7.0, 8.0, 12.0, 18.0, 27.0, 41.0, 45.0, 46.0, 52.0, 93.0, 113.0, 176.0, 221.0, 317.0, 390.0, 595.0, 787.0, 1102.0, 1601.0, 2191.0, 2977.0, 3954.0, 5387.0, 482164.0, 6633.0, 4641.0, 3503.0, 2546.0, 1839.0, 1280.0, 957.0, 672.0, 497.0, 350.0, 256.0, 212.0, 144.0, 113.0, 75.0, 65.0, 45.0, 38.0, 24.0, 20.0, 12.0, 20.0, 10.0, 9.0, 8.0, 7.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-3.625924825668335, -3.5152242183685303, -3.4045233726501465, -3.293822765350342, -3.183122158050537, -3.0724213123321533, -2.9617207050323486, -2.851019859313965, -2.74031925201416, -2.6296186447143555, -2.5189177989959717, -2.408217191696167, -2.297516345977783, -2.1868157386779785, -2.076115131378174, -1.9654144048690796, -1.8547136783599854, -1.7440129518508911, -1.6333122253417969, -1.5226116180419922, -1.411910891532898, -1.3012101650238037, -1.190509557723999, -1.0798088312149048, -0.9691081047058105, -0.8584073781967163, -0.7477067112922668, -0.6370060443878174, -0.5263053178787231, -0.4156045913696289, -0.30490392446517944, -0.19420325756072998, -0.08350276947021484, 0.027197927236557007, 0.13789862394332886, 0.2485993206501007, 0.35930001735687256, 0.4700007438659668, 0.5807014107704163, 0.6914020776748657, 0.80210280418396, 0.9128035306930542, 1.0235042572021484, 1.1342048645019531, 1.2449055910110474, 1.3556063175201416, 1.4663069248199463, 1.5770076513290405, 1.6877083778381348, 1.798409104347229, 1.9091098308563232, 2.019810438156128, 2.1305112838745117, 2.2412118911743164, 2.351912498474121, 2.462613105773926, 2.5733139514923096, 2.6840145587921143, 2.794715404510498, 2.9054160118103027, 3.0161166191101074, 3.126817464828491, 3.237518072128296, 3.3482189178466797, 3.4589195251464844]}, "gradients/decoder.roberta.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 10.0, 13.0, 8.0, 11.0, 14.0, 20.0, 12.0, 22.0, 17.0, 33.0, 29.0, 31.0, 37.0, 37.0, 46.0, 52.0, 41.0, 41.0, 41.0, 39.0, 44.0, 42.0, 47.0, 41.0, 28.0, 38.0, 25.0, 35.0, 24.0, 14.0, 24.0, 16.0, 15.0, 8.0, 4.0, 11.0, 5.0, 8.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.182397842407227, -17.63738250732422, -17.09236717224121, -16.547351837158203, -16.002334594726562, -15.457320213317871, -14.912303924560547, -14.367288589477539, -13.822273254394531, -13.277257919311523, -12.732242584228516, -12.187226295471191, -11.642210960388184, -11.097195625305176, -10.552179336547852, -10.007164001464844, -9.462148666381836, -8.917133331298828, -8.37211799621582, -7.827101707458496, -7.282086372375488, -6.7370710372924805, -6.1920552253723145, -5.647039413452148, -5.102024078369141, -4.557008743286133, -4.011992931365967, -3.46697735786438, -2.921961784362793, -2.376946210861206, -1.8319306373596191, -1.2869150638580322, -0.7418994903564453, -0.1968839168548584, 0.3481316566467285, 0.8931472301483154, 1.4381628036499023, 1.9831783771514893, 2.528193950653076, 3.073209524154663, 3.61822509765625, 4.163240432739258, 4.708256244659424, 5.25327205657959, 5.798287391662598, 6.3433027267456055, 6.8883185386657715, 7.4333343505859375, 7.978349685668945, 8.523365020751953, 9.068380355834961, 9.613396644592285, 10.158411979675293, 10.7034273147583, 11.248443603515625, 11.793458938598633, 12.33847427368164, 12.883489608764648, 13.428504943847656, 13.97352123260498, 14.518536567687988, 15.063551902770996, 15.60856819152832, 16.153583526611328, 16.698598861694336]}, "gradients/decoder.roberta.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 12.0, 9.0, 30.0, 55.0, 123.0, 169.0, 546.0, 2071.0, 31566.0, 51430688.0, 5330.0, 505.0, 115.0, 36.0, 28.0, 13.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.90084075927734, -104.08610534667969, -100.27136993408203, -96.45663452148438, -92.64190673828125, -88.8271713256836, -85.01243591308594, -81.19770050048828, -77.38296508789062, -73.56822967529297, -69.75349426269531, -65.93876647949219, -62.12403106689453, -58.309295654296875, -54.49456024169922, -50.67982482910156, -46.86509704589844, -43.05036163330078, -39.23563003540039, -35.420894622802734, -31.60616111755371, -27.791427612304688, -23.97669219970703, -20.161958694458008, -16.347225189208984, -12.532491683959961, -8.717757225036621, -4.903022766113281, -1.0882892608642578, 2.7264442443847656, 6.541179656982422, 10.355913162231445, 14.170639038085938, 17.98537254333496, 21.800106048583984, 25.61484146118164, 29.429574966430664, 33.24430847167969, 37.059043884277344, 40.873779296875, 44.68851089477539, 48.50324630737305, 52.31797790527344, 56.132713317871094, 59.94744873046875, 63.76218032836914, 67.57691955566406, 71.39164733886719, 75.20638275146484, 79.0211181640625, 82.83585357666016, 86.65058898925781, 90.46531677246094, 94.2800521850586, 98.09478759765625, 101.9095230102539, 105.72425842285156, 109.53899383544922, 113.35372924804688, 117.16845703125, 120.98319244384766, 124.79792785644531, 128.6126708984375, 132.42739868164062, 136.24212646484375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 17.0, 41.0, 122.0, 277.0, 306.0, 160.0, 51.0, 15.0, 9.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.520975112915039, -14.05616283416748, -13.591350555419922, -13.126538276672363, -12.661725997924805, -12.196913719177246, -11.732101440429688, -11.267290115356445, -10.80247688293457, -10.337664604187012, -9.872852325439453, -9.408040046691895, -8.943227767944336, -8.478415489196777, -8.013603210449219, -7.548791408538818, -7.083979606628418, -6.619167327880859, -6.154355049133301, -5.689542770385742, -5.224730491638184, -4.759918212890625, -4.295106410980225, -3.830294132232666, -3.3654818534851074, -2.900669574737549, -2.4358572959899902, -1.9710452556610107, -1.5062329769134521, -1.0414206981658936, -0.5766086578369141, -0.11179637908935547, 0.3530158996582031, 0.8178281188011169, 1.2826403379440308, 1.7474524974822998, 2.2122647762298584, 2.677077054977417, 3.1418890953063965, 3.606701374053955, 4.071513652801514, 4.536325931549072, 5.001138210296631, 5.465950012207031, 5.93076229095459, 6.395574569702148, 6.860386848449707, 7.325199127197266, 7.790011405944824, 8.254823684692383, 8.719635963439941, 9.1844482421875, 9.649260520935059, 10.114072799682617, 10.57888412475586, 11.043697357177734, 11.508508682250977, 11.973320960998535, 12.438133239746094, 12.902945518493652, 13.367757797241211, 13.83257007598877, 14.297382354736328, 14.76219367980957, 15.227006912231445]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 8.0, 7.0, 5.0, 11.0, 9.0, 11.0, 14.0, 12.0, 17.0, 29.0, 25.0, 28.0, 26.0, 26.0, 30.0, 44.0, 40.0, 26.0, 43.0, 48.0, 46.0, 51.0, 45.0, 45.0, 40.0, 36.0, 20.0, 45.0, 30.0, 27.0, 32.0, 28.0, 20.0, 13.0, 14.0, 8.0, 11.0, 7.0, 7.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.698626518249512, -6.501410484313965, -6.304194450378418, -6.106978416442871, -5.909761905670166, -5.712545871734619, -5.515329837799072, -5.318113803863525, -5.12089729309082, -4.923681259155273, -4.726465225219727, -4.52924919128418, -4.332032680511475, -4.134816646575928, -3.937600612640381, -3.740384578704834, -3.543168544769287, -3.3459525108337402, -3.1487362384796143, -2.9515202045440674, -2.7543039321899414, -2.5570878982543945, -2.3598718643188477, -2.162655830383301, -1.9654395580291748, -1.7682234048843384, -1.571007251739502, -1.373791217803955, -1.1765750646591187, -0.9793589115142822, -0.7821428775787354, -0.5849267244338989, -0.3877105712890625, -0.19049444794654846, 0.006721675395965576, 0.20393776893615723, 0.40115392208099365, 0.5983700752258301, 0.795586109161377, 0.9928022623062134, 1.1900184154510498, 1.3872345685958862, 1.5844507217407227, 1.7816667556762695, 1.978882908821106, 2.1760990619659424, 2.3733150959014893, 2.5705313682556152, 2.767747402191162, 2.964963436126709, 3.162179708480835, 3.359395742416382, 3.556612014770508, 3.7538280487060547, 3.9510440826416016, 4.148260116577148, 4.345476150512695, 4.542692184448242, 4.739908218383789, 4.937124252319336, 5.134340763092041, 5.331556797027588, 5.528772830963135, 5.725988864898682, 5.923205375671387]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 3.0, 6.0, 14.0, 16.0, 24.0, 25.0, 47.0, 34.0, 46.0, 61.0, 100.0, 138.0, 217.0, 277.0, 437.0, 612.0, 1004.0, 1593.0, 2752.0, 4620.0, 9325.0, 20692.0, 59749.0, 3485512.0, 512780.0, 54207.0, 19440.0, 9031.0, 4704.0, 2604.0, 1542.0, 956.0, 603.0, 334.0, 260.0, 150.0, 110.0, 75.0, 53.0, 36.0, 33.0, 15.0, 13.0, 15.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1737060546875, -0.16873741149902344, -0.16376876831054688, -0.1588001251220703, -0.15383148193359375, -0.1488628387451172, -0.14389419555664062, -0.13892555236816406, -0.1339569091796875, -0.12898826599121094, -0.12401962280273438, -0.11905097961425781, -0.11408233642578125, -0.10911369323730469, -0.10414505004882812, -0.09917640686035156, -0.094207763671875, -0.08923912048339844, -0.08427047729492188, -0.07930183410644531, -0.07433319091796875, -0.06936454772949219, -0.06439590454101562, -0.05942726135253906, -0.0544586181640625, -0.04948997497558594, -0.044521331787109375, -0.03955268859863281, -0.03458404541015625, -0.029615402221679688, -0.024646759033203125, -0.019678115844726562, -0.01470947265625, -0.009740829467773438, -0.004772186279296875, 0.0001964569091796875, 0.00516510009765625, 0.010133743286132812, 0.015102386474609375, 0.020071029663085938, 0.0250396728515625, 0.030008316040039062, 0.034976959228515625, 0.03994560241699219, 0.04491424560546875, 0.04988288879394531, 0.054851531982421875, 0.05982017517089844, 0.064788818359375, 0.06975746154785156, 0.07472610473632812, 0.07969474792480469, 0.08466339111328125, 0.08963203430175781, 0.09460067749023438, 0.09956932067871094, 0.1045379638671875, 0.10950660705566406, 0.11447525024414062, 0.11944389343261719, 0.12441253662109375, 0.1293811798095703, 0.13434982299804688, 0.13931846618652344, 0.144287109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 1.0, 5.0, 6.0, 5.0, 7.0, 10.0, 11.0, 20.0, 21.0, 182.0, 615.0, 27.0, 13.0, 16.0, 8.0, 6.0, 11.0, 3.0, 4.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.056549072265625, -0.055063724517822266, -0.05357837677001953, -0.0520930290222168, -0.05060768127441406, -0.04912233352661133, -0.047636985778808594, -0.04615163803100586, -0.044666290283203125, -0.04318094253540039, -0.041695594787597656, -0.04021024703979492, -0.03872489929199219, -0.03723955154418945, -0.03575420379638672, -0.034268856048583984, -0.03278350830078125, -0.031298160552978516, -0.02981281280517578, -0.028327465057373047, -0.026842117309570312, -0.025356769561767578, -0.023871421813964844, -0.02238607406616211, -0.020900726318359375, -0.01941537857055664, -0.017930030822753906, -0.016444683074951172, -0.014959335327148438, -0.013473987579345703, -0.011988639831542969, -0.010503292083740234, -0.0090179443359375, -0.007532596588134766, -0.006047248840332031, -0.004561901092529297, -0.0030765533447265625, -0.0015912055969238281, -0.00010585784912109375, 0.0013794898986816406, 0.002864837646484375, 0.004350185394287109, 0.005835533142089844, 0.007320880889892578, 0.008806228637695312, 0.010291576385498047, 0.011776924133300781, 0.013262271881103516, 0.01474761962890625, 0.016232967376708984, 0.01771831512451172, 0.019203662872314453, 0.020689010620117188, 0.022174358367919922, 0.023659706115722656, 0.02514505386352539, 0.026630401611328125, 0.02811574935913086, 0.029601097106933594, 0.031086444854736328, 0.03257179260253906, 0.0340571403503418, 0.03554248809814453, 0.037027835845947266, 0.03851318359375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 10.0, 15.0, 12.0, 16.0, 37.0, 45.0, 82.0, 124.0, 200.0, 352.0, 650.0, 1310.0, 2920.0, 6971.0, 18141.0, 55085.0, 216334.0, 1927792.0, 1681957.0, 200663.0, 52217.0, 17181.0, 6462.0, 2767.0, 1311.0, 693.0, 363.0, 207.0, 125.0, 69.0, 55.0, 24.0, 28.0, 18.0, 10.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1085205078125, -0.10477638244628906, -0.10103225708007812, -0.09728813171386719, -0.09354400634765625, -0.08979988098144531, -0.08605575561523438, -0.08231163024902344, -0.0785675048828125, -0.07482337951660156, -0.07107925415039062, -0.06733512878417969, -0.06359100341796875, -0.05984687805175781, -0.056102752685546875, -0.05235862731933594, -0.048614501953125, -0.04487037658691406, -0.041126251220703125, -0.03738212585449219, -0.03363800048828125, -0.029893875122070312, -0.026149749755859375, -0.022405624389648438, -0.0186614990234375, -0.014917373657226562, -0.011173248291015625, -0.0074291229248046875, -0.00368499755859375, 5.91278076171875e-05, 0.003803253173828125, 0.0075473785400390625, 0.01129150390625, 0.015035629272460938, 0.018779754638671875, 0.022523880004882812, 0.02626800537109375, 0.030012130737304688, 0.033756256103515625, 0.03750038146972656, 0.0412445068359375, 0.04498863220214844, 0.048732757568359375, 0.05247688293457031, 0.05622100830078125, 0.05996513366699219, 0.06370925903320312, 0.06745338439941406, 0.071197509765625, 0.07494163513183594, 0.07868576049804688, 0.08242988586425781, 0.08617401123046875, 0.08991813659667969, 0.09366226196289062, 0.09740638732910156, 0.1011505126953125, 0.10489463806152344, 0.10863876342773438, 0.11238288879394531, 0.11612701416015625, 0.11987113952636719, 0.12361526489257812, 0.12735939025878906, 0.131103515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 9.0, 7.0, 8.0, 19.0, 13.0, 27.0, 25.0, 37.0, 46.0, 56.0, 80.0, 103.0, 128.0, 146.0, 220.0, 334.0, 573.0, 809.0, 394.0, 272.0, 181.0, 140.0, 106.0, 80.0, 49.0, 49.0, 34.0, 30.0, 23.0, 14.0, 16.0, 11.0, 12.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043731689453125, -0.042237281799316406, -0.04074287414550781, -0.03924846649169922, -0.037754058837890625, -0.03625965118408203, -0.03476524353027344, -0.033270835876464844, -0.03177642822265625, -0.030282020568847656, -0.028787612915039062, -0.02729320526123047, -0.025798797607421875, -0.02430438995361328, -0.022809982299804688, -0.021315574645996094, -0.0198211669921875, -0.018326759338378906, -0.016832351684570312, -0.015337944030761719, -0.013843536376953125, -0.012349128723144531, -0.010854721069335938, -0.009360313415527344, -0.00786590576171875, -0.006371498107910156, -0.0048770904541015625, -0.0033826828002929688, -0.001888275146484375, -0.00039386749267578125, 0.0011005401611328125, 0.0025949478149414062, 0.00408935546875, 0.005583763122558594, 0.0070781707763671875, 0.008572578430175781, 0.010066986083984375, 0.011561393737792969, 0.013055801391601562, 0.014550209045410156, 0.01604461669921875, 0.017539024353027344, 0.019033432006835938, 0.02052783966064453, 0.022022247314453125, 0.02351665496826172, 0.025011062622070312, 0.026505470275878906, 0.0279998779296875, 0.029494285583496094, 0.030988693237304688, 0.03248310089111328, 0.033977508544921875, 0.03547191619873047, 0.03696632385253906, 0.038460731506347656, 0.03995513916015625, 0.041449546813964844, 0.04294395446777344, 0.04443836212158203, 0.045932769775390625, 0.04742717742919922, 0.04892158508300781, 0.050415992736816406, 0.051910400390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 18.0, 33.0, 96.0, 204.0, 302.0, 218.0, 72.0, 30.0, 20.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5812878608703613, -0.5616493225097656, -0.5420107841491699, -0.5223721861839294, -0.5027336478233337, -0.48309510946273804, -0.46345657110214233, -0.44381800293922424, -0.42417943477630615, -0.40454089641571045, -0.38490232825279236, -0.36526378989219666, -0.34562522172927856, -0.32598668336868286, -0.30634814500808716, -0.28670957684516907, -0.26707103848457336, -0.24743248522281647, -0.22779393196105957, -0.20815539360046387, -0.18851682543754578, -0.16887828707695007, -0.14923973381519318, -0.12960118055343628, -0.10996262729167938, -0.09032407402992249, -0.07068552076816559, -0.05104697495698929, -0.03140842169523239, -0.011769868433475494, 0.007868677377700806, 0.027507230639457703, 0.0471457839012146, 0.0667843371629715, 0.0864228904247284, 0.1060614362359047, 0.1256999969482422, 0.1453385353088379, 0.1649770885705948, 0.18461564183235168, 0.20425419509410858, 0.22389274835586548, 0.24353130161762238, 0.2631698548793793, 0.282808393239975, 0.30244696140289307, 0.32208549976348877, 0.3417240381240845, 0.36136260628700256, 0.38100114464759827, 0.40063971281051636, 0.42027825117111206, 0.43991681933403015, 0.45955535769462585, 0.47919392585754395, 0.49883246421813965, 0.5184710025787354, 0.538109540939331, 0.5577480792999268, 0.5773866772651672, 0.5970252156257629, 0.6166637539863586, 0.6363022923469543, 0.6559408903121948, 0.6755794286727905]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 9.0, 8.0, 7.0, 13.0, 17.0, 25.0, 22.0, 34.0, 27.0, 43.0, 45.0, 37.0, 56.0, 46.0, 52.0, 55.0, 46.0, 48.0, 49.0, 45.0, 43.0, 39.0, 44.0, 39.0, 31.0, 20.0, 13.0, 18.0, 13.0, 9.0, 5.0, 11.0, 7.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21925705671310425, -0.2119484543800354, -0.20463986694812775, -0.1973312795162201, -0.19002267718315125, -0.1827140748500824, -0.17540548741817474, -0.1680968999862671, -0.16078829765319824, -0.1534796953201294, -0.14617110788822174, -0.1388625204563141, -0.13155391812324524, -0.12424532324075699, -0.11693672835826874, -0.10962813347578049, -0.10231953859329224, -0.09501094371080399, -0.08770234882831573, -0.08039375394582748, -0.07308515906333923, -0.06577656418085098, -0.05846796929836273, -0.05115937441587448, -0.04385077953338623, -0.03654218465089798, -0.02923358976840973, -0.02192499488592148, -0.014616400003433228, -0.007307805120944977, 7.897615432739258e-07, 0.007309384644031525, 0.014617979526519775, 0.021926574409008026, 0.029235169291496277, 0.03654376417398453, 0.04385235905647278, 0.05116095393896103, 0.05846954882144928, 0.06577814370393753, 0.07308673858642578, 0.08039533346891403, 0.08770392835140228, 0.09501252323389053, 0.10232111811637878, 0.10962971299886703, 0.11693830788135529, 0.12424690276384354, 0.1315554976463318, 0.13886409997940063, 0.1461726874113083, 0.15348127484321594, 0.1607898771762848, 0.16809847950935364, 0.1754070669412613, 0.18271565437316895, 0.1900242567062378, 0.19733285903930664, 0.2046414464712143, 0.21195003390312195, 0.2192586362361908, 0.22656723856925964, 0.2338758260011673, 0.24118441343307495, 0.2484930157661438]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 10.0, 9.0, 5.0, 5.0, 14.0, 31.0, 28.0, 44.0, 72.0, 81.0, 148.0, 212.0, 315.0, 422.0, 735.0, 1109.0, 1824.0, 2985.0, 5521.0, 10014.0, 19849.0, 69440.0, 796833.0, 91537.0, 22130.0, 10694.0, 5733.0, 3356.0, 1989.0, 1177.0, 798.0, 476.0, 291.0, 241.0, 130.0, 95.0, 68.0, 40.0, 27.0, 10.0, 18.0, 15.0, 9.0, 5.0, 4.0, 5.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.1292724609375, -0.12504196166992188, -0.12081146240234375, -0.11658096313476562, -0.1123504638671875, -0.10811996459960938, -0.10388946533203125, -0.09965896606445312, -0.095428466796875, -0.09119796752929688, -0.08696746826171875, -0.08273696899414062, -0.0785064697265625, -0.07427597045898438, -0.07004547119140625, -0.06581497192382812, -0.06158447265625, -0.057353973388671875, -0.05312347412109375, -0.048892974853515625, -0.0446624755859375, -0.040431976318359375, -0.03620147705078125, -0.031970977783203125, -0.027740478515625, -0.023509979248046875, -0.01927947998046875, -0.015048980712890625, -0.0108184814453125, -0.006587982177734375, -0.00235748291015625, 0.001873016357421875, 0.006103515625, 0.010334014892578125, 0.01456451416015625, 0.018795013427734375, 0.0230255126953125, 0.027256011962890625, 0.03148651123046875, 0.035717010498046875, 0.039947509765625, 0.044178009033203125, 0.04840850830078125, 0.052639007568359375, 0.0568695068359375, 0.061100006103515625, 0.06533050537109375, 0.06956100463867188, 0.07379150390625, 0.07802200317382812, 0.08225250244140625, 0.08648300170898438, 0.0907135009765625, 0.09494400024414062, 0.09917449951171875, 0.10340499877929688, 0.107635498046875, 0.11186599731445312, 0.11609649658203125, 0.12032699584960938, 0.1245574951171875, 0.12878799438476562, 0.13301849365234375, 0.13724899291992188, 0.1414794921875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 2.0, 5.0, 7.0, 3.0, 14.0, 15.0, 18.0, 59.0, 229.0, 321.0, 180.0, 50.0, 18.0, 7.0, 7.0, 8.0, 10.0, 10.0, 5.0, 2.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.047637939453125, -0.04636430740356445, -0.045090675354003906, -0.04381704330444336, -0.04254341125488281, -0.041269779205322266, -0.03999614715576172, -0.03872251510620117, -0.037448883056640625, -0.03617525100708008, -0.03490161895751953, -0.033627986907958984, -0.03235435485839844, -0.03108072280883789, -0.029807090759277344, -0.028533458709716797, -0.02725982666015625, -0.025986194610595703, -0.024712562561035156, -0.02343893051147461, -0.022165298461914062, -0.020891666412353516, -0.01961803436279297, -0.018344402313232422, -0.017070770263671875, -0.015797138214111328, -0.014523506164550781, -0.013249874114990234, -0.011976242065429688, -0.01070261001586914, -0.009428977966308594, -0.008155345916748047, -0.0068817138671875, -0.005608081817626953, -0.004334449768066406, -0.0030608177185058594, -0.0017871856689453125, -0.0005135536193847656, 0.0007600784301757812, 0.002033710479736328, 0.003307342529296875, 0.004580974578857422, 0.005854606628417969, 0.007128238677978516, 0.008401870727539062, 0.00967550277709961, 0.010949134826660156, 0.012222766876220703, 0.01349639892578125, 0.014770030975341797, 0.016043663024902344, 0.01731729507446289, 0.018590927124023438, 0.019864559173583984, 0.02113819122314453, 0.022411823272705078, 0.023685455322265625, 0.024959087371826172, 0.02623271942138672, 0.027506351470947266, 0.028779983520507812, 0.03005361557006836, 0.031327247619628906, 0.03260087966918945, 0.03387451171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 8.0, 5.0, 6.0, 11.0, 8.0, 15.0, 25.0, 27.0, 50.0, 62.0, 86.0, 147.0, 238.0, 459.0, 1011.0, 2720.0, 8955.0, 41529.0, 261408.0, 586665.0, 115581.0, 20842.0, 5284.0, 1716.0, 743.0, 366.0, 206.0, 120.0, 76.0, 53.0, 36.0, 20.0, 22.0, 21.0, 11.0, 8.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1956787109375, -0.1894245147705078, -0.18317031860351562, -0.17691612243652344, -0.17066192626953125, -0.16440773010253906, -0.15815353393554688, -0.1518993377685547, -0.1456451416015625, -0.1393909454345703, -0.13313674926757812, -0.12688255310058594, -0.12062835693359375, -0.11437416076660156, -0.10811996459960938, -0.10186576843261719, -0.095611572265625, -0.08935737609863281, -0.08310317993164062, -0.07684898376464844, -0.07059478759765625, -0.06434059143066406, -0.058086395263671875, -0.05183219909667969, -0.0455780029296875, -0.03932380676269531, -0.033069610595703125, -0.026815414428710938, -0.02056121826171875, -0.014307022094726562, -0.008052825927734375, -0.0017986297607421875, 0.00445556640625, 0.010709762573242188, 0.016963958740234375, 0.023218154907226562, 0.02947235107421875, 0.03572654724121094, 0.041980743408203125, 0.04823493957519531, 0.0544891357421875, 0.06074333190917969, 0.06699752807617188, 0.07325172424316406, 0.07950592041015625, 0.08576011657714844, 0.09201431274414062, 0.09826850891113281, 0.104522705078125, 0.11077690124511719, 0.11703109741210938, 0.12328529357910156, 0.12953948974609375, 0.13579368591308594, 0.14204788208007812, 0.1483020782470703, 0.1545562744140625, 0.1608104705810547, 0.16706466674804688, 0.17331886291503906, 0.17957305908203125, 0.18582725524902344, 0.19208145141601562, 0.1983356475830078, 0.20458984375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 9.0, 9.0, 9.0, 16.0, 15.0, 20.0, 35.0, 33.0, 36.0, 32.0, 44.0, 40.0, 53.0, 52.0, 65.0, 43.0, 54.0, 54.0, 41.0, 44.0, 38.0, 34.0, 37.0, 33.0, 24.0, 23.0, 22.0, 14.0, 13.0, 17.0, 5.0, 9.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.15952682495117188, -0.15401458740234375, -0.14850234985351562, -0.1429901123046875, -0.13747787475585938, -0.13196563720703125, -0.12645339965820312, -0.120941162109375, -0.11542892456054688, -0.10991668701171875, -0.10440444946289062, -0.0988922119140625, -0.09337997436523438, -0.08786773681640625, -0.08235549926757812, -0.07684326171875, -0.07133102416992188, -0.06581878662109375, -0.060306549072265625, -0.0547943115234375, -0.049282073974609375, -0.04376983642578125, -0.038257598876953125, -0.032745361328125, -0.027233123779296875, -0.02172088623046875, -0.016208648681640625, -0.0106964111328125, -0.005184173583984375, 0.00032806396484375, 0.005840301513671875, 0.0113525390625, 0.016864776611328125, 0.02237701416015625, 0.027889251708984375, 0.0334014892578125, 0.038913726806640625, 0.04442596435546875, 0.049938201904296875, 0.055450439453125, 0.060962677001953125, 0.06647491455078125, 0.07198715209960938, 0.0774993896484375, 0.08301162719726562, 0.08852386474609375, 0.09403610229492188, 0.09954833984375, 0.10506057739257812, 0.11057281494140625, 0.11608505249023438, 0.1215972900390625, 0.12710952758789062, 0.13262176513671875, 0.13813400268554688, 0.143646240234375, 0.14915847778320312, 0.15467071533203125, 0.16018295288085938, 0.1656951904296875, 0.17120742797851562, 0.17671966552734375, 0.18223190307617188, 0.187744140625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 8.0, 10.0, 12.0, 30.0, 38.0, 45.0, 91.0, 157.0, 297.0, 562.0, 1283.0, 3487.0, 16003.0, 826677.0, 185745.0, 9469.0, 2555.0, 1013.0, 472.0, 226.0, 146.0, 77.0, 46.0, 41.0, 18.0, 12.0, 5.0, 6.0, 5.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.271728515625, -0.2623138427734375, -0.252899169921875, -0.2434844970703125, -0.23406982421875, -0.2246551513671875, -0.215240478515625, -0.2058258056640625, -0.1964111328125, -0.1869964599609375, -0.177581787109375, -0.1681671142578125, -0.15875244140625, -0.1493377685546875, -0.139923095703125, -0.1305084228515625, -0.12109375, -0.1116790771484375, -0.102264404296875, -0.0928497314453125, -0.08343505859375, -0.0740203857421875, -0.064605712890625, -0.0551910400390625, -0.0457763671875, -0.0363616943359375, -0.026947021484375, -0.0175323486328125, -0.00811767578125, 0.0012969970703125, 0.010711669921875, 0.0201263427734375, 0.029541015625, 0.0389556884765625, 0.048370361328125, 0.0577850341796875, 0.06719970703125, 0.0766143798828125, 0.086029052734375, 0.0954437255859375, 0.1048583984375, 0.1142730712890625, 0.123687744140625, 0.1331024169921875, 0.14251708984375, 0.1519317626953125, 0.161346435546875, 0.1707611083984375, 0.18017578125, 0.1895904541015625, 0.199005126953125, 0.2084197998046875, 0.21783447265625, 0.2272491455078125, 0.236663818359375, 0.2460784912109375, 0.2554931640625, 0.2649078369140625, 0.274322509765625, 0.2837371826171875, 0.29315185546875, 0.3025665283203125, 0.311981201171875, 0.3213958740234375, 0.330810546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 8.0, 3.0, 4.0, 6.0, 16.0, 20.0, 30.0, 33.0, 28.0, 70.0, 58.0, 102.0, 136.0, 116.0, 102.0, 55.0, 50.0, 41.0, 25.0, 23.0, 17.0, 9.0, 7.0, 9.0, 6.0, 0.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010004043579101562, -0.0009631514549255371, -0.000925898551940918, -0.0008886456489562988, -0.0008513927459716797, -0.0008141398429870605, -0.0007768869400024414, -0.0007396340370178223, -0.0007023811340332031, -0.000665128231048584, -0.0006278753280639648, -0.0005906224250793457, -0.0005533695220947266, -0.0005161166191101074, -0.0004788637161254883, -0.00044161081314086914, -0.00040435791015625, -0.00036710500717163086, -0.0003298521041870117, -0.0002925992012023926, -0.00025534629821777344, -0.0002180933952331543, -0.00018084049224853516, -0.00014358758926391602, -0.00010633468627929688, -6.908178329467773e-05, -3.1828880310058594e-05, 5.424022674560547e-06, 4.267692565917969e-05, 7.992982864379883e-05, 0.00011718273162841797, 0.0001544356346130371, 0.00019168853759765625, 0.0002289414405822754, 0.00026619434356689453, 0.00030344724655151367, 0.0003407001495361328, 0.00037795305252075195, 0.0004152059555053711, 0.00045245885848999023, 0.0004897117614746094, 0.0005269646644592285, 0.0005642175674438477, 0.0006014704704284668, 0.0006387233734130859, 0.0006759762763977051, 0.0007132291793823242, 0.0007504820823669434, 0.0007877349853515625, 0.0008249878883361816, 0.0008622407913208008, 0.0008994936943054199, 0.0009367465972900391, 0.0009739995002746582, 0.0010112524032592773, 0.0010485053062438965, 0.0010857582092285156, 0.0011230111122131348, 0.001160264015197754, 0.001197516918182373, 0.0012347698211669922, 0.0012720227241516113, 0.0013092756271362305, 0.0013465285301208496, 0.0013837814331054688]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 5.0, 3.0, 10.0, 11.0, 12.0, 18.0, 27.0, 37.0, 47.0, 75.0, 103.0, 172.0, 260.0, 443.0, 796.0, 1523.0, 3229.0, 7576.0, 21107.0, 85163.0, 548501.0, 303306.0, 50365.0, 14680.0, 5570.0, 2511.0, 1290.0, 686.0, 405.0, 217.0, 135.0, 78.0, 64.0, 45.0, 24.0, 18.0, 12.0, 9.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.1339111328125, -0.130462646484375, -0.12701416015625, -0.123565673828125, -0.1201171875, -0.116668701171875, -0.11322021484375, -0.109771728515625, -0.1063232421875, -0.102874755859375, -0.09942626953125, -0.095977783203125, -0.092529296875, -0.089080810546875, -0.08563232421875, -0.082183837890625, -0.0787353515625, -0.075286865234375, -0.07183837890625, -0.068389892578125, -0.06494140625, -0.061492919921875, -0.05804443359375, -0.054595947265625, -0.0511474609375, -0.047698974609375, -0.04425048828125, -0.040802001953125, -0.037353515625, -0.033905029296875, -0.03045654296875, -0.027008056640625, -0.0235595703125, -0.020111083984375, -0.01666259765625, -0.013214111328125, -0.009765625, -0.006317138671875, -0.00286865234375, 0.000579833984375, 0.0040283203125, 0.007476806640625, 0.01092529296875, 0.014373779296875, 0.017822265625, 0.021270751953125, 0.02471923828125, 0.028167724609375, 0.0316162109375, 0.035064697265625, 0.03851318359375, 0.041961669921875, 0.04541015625, 0.048858642578125, 0.05230712890625, 0.055755615234375, 0.0592041015625, 0.062652587890625, 0.06610107421875, 0.069549560546875, 0.072998046875, 0.076446533203125, 0.07989501953125, 0.083343505859375, 0.0867919921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 12.0, 17.0, 13.0, 39.0, 25.0, 38.0, 61.0, 56.0, 82.0, 76.0, 81.0, 94.0, 86.0, 74.0, 47.0, 45.0, 40.0, 21.0, 17.0, 14.0, 11.0, 8.0, 7.0, 5.0, 6.0, 0.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08349609375, -0.07942390441894531, -0.07535171508789062, -0.07127952575683594, -0.06720733642578125, -0.06313514709472656, -0.059062957763671875, -0.05499076843261719, -0.0509185791015625, -0.04684638977050781, -0.042774200439453125, -0.03870201110839844, -0.03462982177734375, -0.030557632446289062, -0.026485443115234375, -0.022413253784179688, -0.018341064453125, -0.014268875122070312, -0.010196685791015625, -0.0061244964599609375, -0.00205230712890625, 0.0020198822021484375, 0.006092071533203125, 0.010164260864257812, 0.0142364501953125, 0.018308639526367188, 0.022380828857421875, 0.026453018188476562, 0.03052520751953125, 0.03459739685058594, 0.038669586181640625, 0.04274177551269531, 0.04681396484375, 0.05088615417480469, 0.054958343505859375, 0.05903053283691406, 0.06310272216796875, 0.06717491149902344, 0.07124710083007812, 0.07531929016113281, 0.0793914794921875, 0.08346366882324219, 0.08753585815429688, 0.09160804748535156, 0.09568023681640625, 0.09975242614746094, 0.10382461547851562, 0.10789680480957031, 0.111968994140625, 0.11604118347167969, 0.12011337280273438, 0.12418556213378906, 0.12825775146484375, 0.13232994079589844, 0.13640213012695312, 0.1404743194580078, 0.1445465087890625, 0.1486186981201172, 0.15269088745117188, 0.15676307678222656, 0.16083526611328125, 0.16490745544433594, 0.16897964477539062, 0.1730518341064453, 0.1771240234375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 1.0, 14.0, 24.0, 46.0, 89.0, 198.0, 306.0, 157.0, 71.0, 37.0, 23.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.162454605102539, -1.1080557107925415, -1.053656816482544, -0.9992578625679016, -0.9448589086532593, -0.8904600143432617, -0.8360611200332642, -0.7816622257232666, -0.7272632718086243, -0.6728643774986267, -0.6184654235839844, -0.5640665292739868, -0.5096676349639893, -0.4552686810493469, -0.40086978673934937, -0.3464708626270294, -0.2920719385147095, -0.23767301440238953, -0.18327410519123077, -0.12887519598007202, -0.07447627186775208, -0.02007734775543213, 0.03432154655456543, 0.08872047066688538, 0.14311939477920532, 0.19751831889152527, 0.2519172430038452, 0.3063161373138428, 0.3607150614261627, 0.41511398553848267, 0.4695128798484802, 0.5239118337631226, 0.5783107280731201, 0.6327096223831177, 0.68710857629776, 0.7415074706077576, 0.7959064245223999, 0.8503053188323975, 0.904704213142395, 0.9591031074523926, 1.0135021209716797, 1.0679010152816772, 1.1222999095916748, 1.176698923110962, 1.2310978174209595, 1.285496711730957, 1.3398956060409546, 1.3942945003509521, 1.4486933946609497, 1.5030922889709473, 1.5574911832809448, 1.6118900775909424, 1.6662890911102295, 1.720687985420227, 1.7750868797302246, 1.8294857740402222, 1.8838846683502197, 1.9382835626602173, 1.9926824569702148, 2.047081470489502, 2.10148024559021, 2.155879259109497, 2.210278034210205, 2.264677047729492, 2.3190760612487793]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 9.0, 6.0, 13.0, 14.0, 18.0, 32.0, 93.0, 166.0, 261.0, 195.0, 89.0, 37.0, 22.0, 10.0, 3.0, 8.0, 5.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62007474899292, -3.4931938648223877, -3.3663127422332764, -3.239431858062744, -3.112550973892212, -2.9856700897216797, -2.8587889671325684, -2.731908082962036, -2.605027198791504, -2.4781463146209717, -2.3512651920318604, -2.224384307861328, -2.097503423690796, -1.9706224203109741, -1.8437414169311523, -1.7168605327606201, -1.5899794101715088, -1.463098406791687, -1.3362175226211548, -1.209336519241333, -1.0824556350708008, -0.955574631690979, -0.8286936283111572, -0.7018126845359802, -0.5749317407608032, -0.4480507969856262, -0.32116982340812683, -0.19428884983062744, -0.06740790605545044, 0.05947303771972656, 0.18635404109954834, 0.31323498487472534, 0.44011592864990234, 0.5669968724250793, 0.6938778162002563, 0.8207588195800781, 0.9476397633552551, 1.0745207071304321, 1.201401710510254, 1.3282825946807861, 1.455163598060608, 1.5820446014404297, 1.708925485610962, 1.8358064889907837, 1.9626874923706055, 2.0895683765411377, 2.21644926071167, 2.3433303833007812, 2.4702112674713135, 2.5970921516418457, 2.723973274230957, 2.8508541584014893, 2.9777350425720215, 3.104616165161133, 3.231497049331665, 3.3583779335021973, 3.4852590560913086, 3.612139940261841, 3.739021062850952, 3.8659019470214844, 3.9927828311920166, 4.119663715362549, 4.24654483795166, 4.3734259605407715, 4.500306606292725]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 14.0, 12.0, 21.0, 50.0, 59.0, 93.0, 129.0, 206.0, 393.0, 709.0, 1544.0, 3811.0, 13371.0, 149807.0, 3981678.0, 32643.0, 5884.0, 1991.0, 854.0, 398.0, 213.0, 127.0, 78.0, 51.0, 32.0, 31.0, 11.0, 21.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.72412109375, -0.7035903930664062, -0.6830596923828125, -0.6625289916992188, -0.641998291015625, -0.6214675903320312, -0.6009368896484375, -0.5804061889648438, -0.55987548828125, -0.5393447875976562, -0.5188140869140625, -0.49828338623046875, -0.477752685546875, -0.45722198486328125, -0.4366912841796875, -0.41616058349609375, -0.3956298828125, -0.37509918212890625, -0.3545684814453125, -0.33403778076171875, -0.313507080078125, -0.29297637939453125, -0.2724456787109375, -0.25191497802734375, -0.23138427734375, -0.21085357666015625, -0.1903228759765625, -0.16979217529296875, -0.149261474609375, -0.12873077392578125, -0.1082000732421875, -0.08766937255859375, -0.067138671875, -0.04660797119140625, -0.0260772705078125, -0.00554656982421875, 0.014984130859375, 0.03551483154296875, 0.0560455322265625, 0.07657623291015625, 0.09710693359375, 0.11763763427734375, 0.1381683349609375, 0.15869903564453125, 0.179229736328125, 0.19976043701171875, 0.2202911376953125, 0.24082183837890625, 0.2613525390625, 0.28188323974609375, 0.3024139404296875, 0.32294464111328125, 0.343475341796875, 0.36400604248046875, 0.3845367431640625, 0.40506744384765625, 0.42559814453125, 0.44612884521484375, 0.4666595458984375, 0.48719024658203125, 0.507720947265625, 0.5282516479492188, 0.5487823486328125, 0.5693130493164062, 0.58984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 6.0, 4.0, 4.0, 11.0, 8.0, 18.0, 31.0, 48.0, 93.0, 222.0, 253.0, 154.0, 60.0, 17.0, 18.0, 13.0, 6.0, 8.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04058837890625, -0.03923654556274414, -0.03788471221923828, -0.03653287887573242, -0.03518104553222656, -0.0338292121887207, -0.032477378845214844, -0.031125545501708984, -0.029773712158203125, -0.028421878814697266, -0.027070045471191406, -0.025718212127685547, -0.024366378784179688, -0.023014545440673828, -0.02166271209716797, -0.02031087875366211, -0.01895904541015625, -0.01760721206665039, -0.01625537872314453, -0.014903545379638672, -0.013551712036132812, -0.012199878692626953, -0.010848045349121094, -0.009496212005615234, -0.008144378662109375, -0.006792545318603516, -0.005440711975097656, -0.004088878631591797, -0.0027370452880859375, -0.0013852119445800781, -3.337860107421875e-05, 0.0013184547424316406, 0.0026702880859375, 0.004022121429443359, 0.005373954772949219, 0.006725788116455078, 0.008077621459960938, 0.009429454803466797, 0.010781288146972656, 0.012133121490478516, 0.013484954833984375, 0.014836788177490234, 0.016188621520996094, 0.017540454864501953, 0.018892288208007812, 0.020244121551513672, 0.02159595489501953, 0.02294778823852539, 0.02429962158203125, 0.02565145492553711, 0.02700328826904297, 0.028355121612548828, 0.029706954956054688, 0.031058788299560547, 0.032410621643066406, 0.033762454986572266, 0.035114288330078125, 0.036466121673583984, 0.037817955017089844, 0.0391697883605957, 0.04052162170410156, 0.04187345504760742, 0.04322528839111328, 0.04457712173461914, 0.045928955078125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 2.0, 4.0, 5.0, 1.0, 12.0, 17.0, 16.0, 20.0, 38.0, 53.0, 79.0, 113.0, 181.0, 319.0, 459.0, 760.0, 1349.0, 2349.0, 4074.0, 8010.0, 18795.0, 62406.0, 721244.0, 3232612.0, 95715.0, 24238.0, 9841.0, 4949.0, 2673.0, 1485.0, 891.0, 531.0, 342.0, 236.0, 153.0, 108.0, 67.0, 56.0, 14.0, 15.0, 16.0, 5.0, 6.0, 6.0, 4.0, 3.0, 10.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.236572265625, -0.22872161865234375, -0.2208709716796875, -0.21302032470703125, -0.205169677734375, -0.19731903076171875, -0.1894683837890625, -0.18161773681640625, -0.17376708984375, -0.16591644287109375, -0.1580657958984375, -0.15021514892578125, -0.142364501953125, -0.13451385498046875, -0.1266632080078125, -0.11881256103515625, -0.1109619140625, -0.10311126708984375, -0.0952606201171875, -0.08740997314453125, -0.079559326171875, -0.07170867919921875, -0.0638580322265625, -0.05600738525390625, -0.04815673828125, -0.04030609130859375, -0.0324554443359375, -0.02460479736328125, -0.016754150390625, -0.00890350341796875, -0.0010528564453125, 0.00679779052734375, 0.0146484375, 0.02249908447265625, 0.0303497314453125, 0.03820037841796875, 0.046051025390625, 0.05390167236328125, 0.0617523193359375, 0.06960296630859375, 0.07745361328125, 0.08530426025390625, 0.0931549072265625, 0.10100555419921875, 0.108856201171875, 0.11670684814453125, 0.1245574951171875, 0.13240814208984375, 0.1402587890625, 0.14810943603515625, 0.1559600830078125, 0.16381072998046875, 0.171661376953125, 0.17951202392578125, 0.1873626708984375, 0.19521331787109375, 0.20306396484375, 0.21091461181640625, 0.2187652587890625, 0.22661590576171875, 0.234466552734375, 0.24231719970703125, 0.2501678466796875, 0.25801849365234375, 0.265869140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0, 4.0, 10.0, 13.0, 13.0, 25.0, 36.0, 60.0, 90.0, 221.0, 821.0, 2088.0, 368.0, 106.0, 71.0, 39.0, 27.0, 14.0, 6.0, 5.0, 10.0, 6.0, 10.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053741455078125, -0.051767826080322266, -0.04979419708251953, -0.0478205680847168, -0.04584693908691406, -0.04387331008911133, -0.041899681091308594, -0.03992605209350586, -0.037952423095703125, -0.03597879409790039, -0.034005165100097656, -0.03203153610229492, -0.030057907104492188, -0.028084278106689453, -0.02611064910888672, -0.024137020111083984, -0.02216339111328125, -0.020189762115478516, -0.01821613311767578, -0.016242504119873047, -0.014268875122070312, -0.012295246124267578, -0.010321617126464844, -0.00834798812866211, -0.006374359130859375, -0.004400730133056641, -0.0024271011352539062, -0.0004534721374511719, 0.0015201568603515625, 0.003493785858154297, 0.005467414855957031, 0.007441043853759766, 0.0094146728515625, 0.011388301849365234, 0.013361930847167969, 0.015335559844970703, 0.017309188842773438, 0.019282817840576172, 0.021256446838378906, 0.02323007583618164, 0.025203704833984375, 0.02717733383178711, 0.029150962829589844, 0.031124591827392578, 0.03309822082519531, 0.03507184982299805, 0.03704547882080078, 0.039019107818603516, 0.04099273681640625, 0.042966365814208984, 0.04493999481201172, 0.04691362380981445, 0.04888725280761719, 0.05086088180541992, 0.052834510803222656, 0.05480813980102539, 0.056781768798828125, 0.05875539779663086, 0.060729026794433594, 0.06270265579223633, 0.06467628479003906, 0.0666499137878418, 0.06862354278564453, 0.07059717178344727, 0.07257080078125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 35.0, 154.0, 519.0, 225.0, 37.0, 17.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4299262762069702, -0.40801453590393066, -0.3861027956008911, -0.36419105529785156, -0.342279314994812, -0.32036757469177246, -0.2984558343887329, -0.27654409408569336, -0.2546323537826538, -0.23272061347961426, -0.2108088731765747, -0.18889713287353516, -0.1669853925704956, -0.14507365226745605, -0.1231619119644165, -0.10125017166137695, -0.0793384313583374, -0.05742669105529785, -0.0355149507522583, -0.01360321044921875, 0.0083085298538208, 0.03022027015686035, 0.0521320104598999, 0.07404375076293945, 0.095955491065979, 0.11786723136901855, 0.1397789716720581, 0.16169071197509766, 0.1836024522781372, 0.20551419258117676, 0.2274259328842163, 0.24933767318725586, 0.2712494134902954, 0.29316115379333496, 0.3150728940963745, 0.33698463439941406, 0.3588963747024536, 0.38080811500549316, 0.4027198553085327, 0.42463159561157227, 0.4465433359146118, 0.46845507621765137, 0.4903668165206909, 0.5122785568237305, 0.53419029712677, 0.5561020374298096, 0.5780137777328491, 0.5999255180358887, 0.6218372583389282, 0.6437489986419678, 0.6656607389450073, 0.6875724792480469, 0.7094842195510864, 0.731395959854126, 0.7533077001571655, 0.7752194404602051, 0.7971311807632446, 0.8190429210662842, 0.8409546613693237, 0.8628664016723633, 0.8847781419754028, 0.9066898822784424, 0.9286016225814819, 0.9505133628845215, 0.972425103187561]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 7.0, 16.0, 40.0, 70.0, 120.0, 168.0, 193.0, 142.0, 86.0, 57.0, 32.0, 17.0, 7.0, 8.0, 5.0, 4.0, 1.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4757676124572754, -0.4626414477825165, -0.4495152533054352, -0.43638908863067627, -0.42326292395591736, -0.41013675928115845, -0.39701056480407715, -0.38388440012931824, -0.3707582354545593, -0.3576320707798004, -0.3445058763027191, -0.3313797116279602, -0.3182535469532013, -0.3051273822784424, -0.2920011878013611, -0.2788750231266022, -0.26574885845184326, -0.25262269377708435, -0.23949651420116425, -0.22637033462524414, -0.21324416995048523, -0.20011799037456512, -0.18699181079864502, -0.1738656461238861, -0.1607394516468048, -0.1476132720708847, -0.1344871073961258, -0.12136092782020569, -0.10823476314544678, -0.09510858356952667, -0.08198241144418716, -0.06885623931884766, -0.055730074644088745, -0.04260390251874924, -0.02947772853076458, -0.016351554542779922, -0.0032253824174404144, 0.009900793433189392, 0.0230269655585289, 0.03615313768386841, 0.049279309809207916, 0.062405481934547424, 0.07553165405988693, 0.08865782618522644, 0.10178400576114655, 0.11491017788648605, 0.12803635001182556, 0.14116251468658447, 0.15428869426250458, 0.16741487383842468, 0.1805410385131836, 0.1936672180891037, 0.2067933827638626, 0.21991956233978271, 0.23304572701454163, 0.24617190659046173, 0.25929808616638184, 0.27242425084114075, 0.28555044531822205, 0.29867660999298096, 0.31180277466773987, 0.3249289393424988, 0.3380551338195801, 0.351181298494339, 0.3643074631690979]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 11.0, 16.0, 23.0, 36.0, 57.0, 76.0, 106.0, 197.0, 344.0, 512.0, 863.0, 1558.0, 2556.0, 4813.0, 9057.0, 19609.0, 55056.0, 304173.0, 512029.0, 86683.0, 25900.0, 11339.0, 5910.0, 3256.0, 1721.0, 990.0, 623.0, 364.0, 243.0, 151.0, 97.0, 68.0, 44.0, 17.0, 17.0, 11.0, 6.0, 7.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12152099609375, -0.1174917221069336, -0.11346244812011719, -0.10943317413330078, -0.10540390014648438, -0.10137462615966797, -0.09734535217285156, -0.09331607818603516, -0.08928680419921875, -0.08525753021240234, -0.08122825622558594, -0.07719898223876953, -0.07316970825195312, -0.06914043426513672, -0.06511116027832031, -0.061081886291503906, -0.0570526123046875, -0.053023338317871094, -0.04899406433105469, -0.04496479034423828, -0.040935516357421875, -0.03690624237060547, -0.03287696838378906, -0.028847694396972656, -0.02481842041015625, -0.020789146423339844, -0.016759872436523438, -0.012730598449707031, -0.008701324462890625, -0.004672050476074219, -0.0006427764892578125, 0.0033864974975585938, 0.007415771484375, 0.011445045471191406, 0.015474319458007812, 0.01950359344482422, 0.023532867431640625, 0.02756214141845703, 0.03159141540527344, 0.035620689392089844, 0.03964996337890625, 0.043679237365722656, 0.04770851135253906, 0.05173778533935547, 0.055767059326171875, 0.05979633331298828, 0.06382560729980469, 0.0678548812866211, 0.0718841552734375, 0.0759134292602539, 0.07994270324707031, 0.08397197723388672, 0.08800125122070312, 0.09203052520751953, 0.09605979919433594, 0.10008907318115234, 0.10411834716796875, 0.10814762115478516, 0.11217689514160156, 0.11620616912841797, 0.12023544311523438, 0.12426471710205078, 0.1282939910888672, 0.1323232650756836, 0.1363525390625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 5.0, 3.0, 5.0, 5.0, 4.0, 5.0, 9.0, 8.0, 17.0, 13.0, 17.0, 34.0, 71.0, 81.0, 100.0, 119.0, 127.0, 95.0, 79.0, 55.0, 37.0, 18.0, 21.0, 8.0, 6.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016265869140625, -0.015682220458984375, -0.01509857177734375, -0.014514923095703125, -0.0139312744140625, -0.013347625732421875, -0.01276397705078125, -0.012180328369140625, -0.0115966796875, -0.011013031005859375, -0.01042938232421875, -0.009845733642578125, -0.0092620849609375, -0.008678436279296875, -0.00809478759765625, -0.007511138916015625, -0.006927490234375, -0.006343841552734375, -0.00576019287109375, -0.005176544189453125, -0.0045928955078125, -0.004009246826171875, -0.00342559814453125, -0.002841949462890625, -0.00225830078125, -0.001674652099609375, -0.00109100341796875, -0.000507354736328125, 7.62939453125e-05, 0.000659942626953125, 0.00124359130859375, 0.001827239990234375, 0.002410888671875, 0.002994537353515625, 0.00357818603515625, 0.004161834716796875, 0.0047454833984375, 0.005329132080078125, 0.00591278076171875, 0.006496429443359375, 0.007080078125, 0.007663726806640625, 0.00824737548828125, 0.008831024169921875, 0.0094146728515625, 0.009998321533203125, 0.01058197021484375, 0.011165618896484375, 0.011749267578125, 0.012332916259765625, 0.01291656494140625, 0.013500213623046875, 0.0140838623046875, 0.014667510986328125, 0.01525115966796875, 0.015834808349609375, 0.01641845703125, 0.017002105712890625, 0.01758575439453125, 0.018169403076171875, 0.0187530517578125, 0.019336700439453125, 0.01992034912109375, 0.020503997802734375, 0.021087646484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 15.0, 8.0, 12.0, 27.0, 53.0, 255.0, 1734.0, 23135.0, 563907.0, 439023.0, 18548.0, 1481.0, 224.0, 52.0, 25.0, 10.0, 5.0, 8.0, 4.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3125, -0.3020668029785156, -0.29163360595703125, -0.2812004089355469, -0.2707672119140625, -0.2603340148925781, -0.24990081787109375, -0.23946762084960938, -0.229034423828125, -0.21860122680664062, -0.20816802978515625, -0.19773483276367188, -0.1873016357421875, -0.17686843872070312, -0.16643524169921875, -0.15600204467773438, -0.14556884765625, -0.13513565063476562, -0.12470245361328125, -0.11426925659179688, -0.1038360595703125, -0.09340286254882812, -0.08296966552734375, -0.07253646850585938, -0.062103271484375, -0.051670074462890625, -0.04123687744140625, -0.030803680419921875, -0.0203704833984375, -0.009937286376953125, 0.00049591064453125, 0.010929107666015625, 0.0213623046875, 0.031795501708984375, 0.04222869873046875, 0.052661895751953125, 0.0630950927734375, 0.07352828979492188, 0.08396148681640625, 0.09439468383789062, 0.104827880859375, 0.11526107788085938, 0.12569427490234375, 0.13612747192382812, 0.1465606689453125, 0.15699386596679688, 0.16742706298828125, 0.17786026000976562, 0.18829345703125, 0.19872665405273438, 0.20915985107421875, 0.21959304809570312, 0.2300262451171875, 0.24045944213867188, 0.25089263916015625, 0.2613258361816406, 0.271759033203125, 0.2821922302246094, 0.29262542724609375, 0.3030586242675781, 0.3134918212890625, 0.3239250183105469, 0.33435821533203125, 0.3447914123535156, 0.355224609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 0.0, 8.0, 6.0, 7.0, 13.0, 14.0, 13.0, 7.0, 15.0, 17.0, 20.0, 23.0, 36.0, 27.0, 30.0, 34.0, 34.0, 39.0, 34.0, 34.0, 33.0, 37.0, 33.0, 41.0, 30.0, 27.0, 36.0, 31.0, 32.0, 45.0, 40.0, 23.0, 26.0, 15.0, 21.0, 22.0, 13.0, 22.0, 13.0, 10.0, 9.0, 4.0, 5.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.07220458984375, -0.06996917724609375, -0.0677337646484375, -0.06549835205078125, -0.063262939453125, -0.06102752685546875, -0.0587921142578125, -0.05655670166015625, -0.0543212890625, -0.05208587646484375, -0.0498504638671875, -0.04761505126953125, -0.045379638671875, -0.04314422607421875, -0.0409088134765625, -0.03867340087890625, -0.03643798828125, -0.03420257568359375, -0.0319671630859375, -0.02973175048828125, -0.027496337890625, -0.02526092529296875, -0.0230255126953125, -0.02079010009765625, -0.0185546875, -0.01631927490234375, -0.0140838623046875, -0.01184844970703125, -0.009613037109375, -0.00737762451171875, -0.0051422119140625, -0.00290679931640625, -0.00067138671875, 0.00156402587890625, 0.0037994384765625, 0.00603485107421875, 0.008270263671875, 0.01050567626953125, 0.0127410888671875, 0.01497650146484375, 0.0172119140625, 0.01944732666015625, 0.0216827392578125, 0.02391815185546875, 0.026153564453125, 0.02838897705078125, 0.0306243896484375, 0.03285980224609375, 0.03509521484375, 0.03733062744140625, 0.0395660400390625, 0.04180145263671875, 0.044036865234375, 0.04627227783203125, 0.0485076904296875, 0.05074310302734375, 0.052978515625, 0.05521392822265625, 0.0574493408203125, 0.05968475341796875, 0.061920166015625, 0.06415557861328125, 0.0663909912109375, 0.06862640380859375, 0.07086181640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 2.0, 7.0, 7.0, 5.0, 15.0, 21.0, 59.0, 247.0, 1721.0, 903991.0, 140908.0, 1230.0, 201.0, 63.0, 20.0, 7.0, 14.0, 3.0, 5.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.0478515625, -1.0169601440429688, -0.9860687255859375, -0.9551773071289062, -0.924285888671875, -0.8933944702148438, -0.8625030517578125, -0.8316116333007812, -0.80072021484375, -0.7698287963867188, -0.7389373779296875, -0.7080459594726562, -0.677154541015625, -0.6462631225585938, -0.6153717041015625, -0.5844802856445312, -0.5535888671875, -0.5226974487304688, -0.4918060302734375, -0.46091461181640625, -0.430023193359375, -0.39913177490234375, -0.3682403564453125, -0.33734893798828125, -0.30645751953125, -0.27556610107421875, -0.2446746826171875, -0.21378326416015625, -0.182891845703125, -0.15200042724609375, -0.1211090087890625, -0.09021759033203125, -0.059326171875, -0.02843475341796875, 0.0024566650390625, 0.03334808349609375, 0.064239501953125, 0.09513092041015625, 0.1260223388671875, 0.15691375732421875, 0.18780517578125, 0.21869659423828125, 0.2495880126953125, 0.28047943115234375, 0.311370849609375, 0.34226226806640625, 0.3731536865234375, 0.40404510498046875, 0.4349365234375, 0.46582794189453125, 0.4967193603515625, 0.5276107788085938, 0.558502197265625, 0.5893936157226562, 0.6202850341796875, 0.6511764526367188, 0.68206787109375, 0.7129592895507812, 0.7438507080078125, 0.7747421264648438, 0.805633544921875, 0.8365249633789062, 0.8674163818359375, 0.8983078002929688, 0.92919921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 8.0, 6.0, 4.0, 10.0, 19.0, 22.0, 19.0, 29.0, 32.0, 63.0, 83.0, 296.0, 190.0, 75.0, 49.0, 24.0, 20.0, 8.0, 8.0, 9.0, 3.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001560211181640625, -0.0015061497688293457, -0.0014520883560180664, -0.0013980269432067871, -0.0013439655303955078, -0.0012899041175842285, -0.0012358427047729492, -0.00118178129196167, -0.0011277198791503906, -0.0010736584663391113, -0.001019597053527832, -0.0009655356407165527, -0.0009114742279052734, -0.0008574128150939941, -0.0008033514022827148, -0.0007492899894714355, -0.0006952285766601562, -0.000641167163848877, -0.0005871057510375977, -0.0005330443382263184, -0.00047898292541503906, -0.00042492151260375977, -0.00037086009979248047, -0.00031679868698120117, -0.0002627372741699219, -0.00020867586135864258, -0.00015461444854736328, -0.00010055303573608398, -4.649162292480469e-05, 7.569789886474609e-06, 6.16312026977539e-05, 0.0001156926155090332, 0.0001697540283203125, 0.0002238154411315918, 0.0002778768539428711, 0.0003319382667541504, 0.0003859996795654297, 0.000440061092376709, 0.0004941225051879883, 0.0005481839179992676, 0.0006022453308105469, 0.0006563067436218262, 0.0007103681564331055, 0.0007644295692443848, 0.0008184909820556641, 0.0008725523948669434, 0.0009266138076782227, 0.000980675220489502, 0.0010347366333007812, 0.0010887980461120605, 0.0011428594589233398, 0.0011969208717346191, 0.0012509822845458984, 0.0013050436973571777, 0.001359105110168457, 0.0014131665229797363, 0.0014672279357910156, 0.001521289348602295, 0.0015753507614135742, 0.0016294121742248535, 0.0016834735870361328, 0.0017375349998474121, 0.0017915964126586914, 0.0018456578254699707, 0.00189971923828125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 9.0, 10.0, 20.0, 33.0, 31.0, 61.0, 94.0, 146.0, 221.0, 383.0, 671.0, 1341.0, 3113.0, 8828.0, 587799.0, 431780.0, 8268.0, 2910.0, 1247.0, 643.0, 354.0, 210.0, 131.0, 83.0, 61.0, 36.0, 25.0, 17.0, 15.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385009765625, -0.371246337890625, -0.35748291015625, -0.343719482421875, -0.3299560546875, -0.316192626953125, -0.30242919921875, -0.288665771484375, -0.27490234375, -0.261138916015625, -0.24737548828125, -0.233612060546875, -0.2198486328125, -0.206085205078125, -0.19232177734375, -0.178558349609375, -0.164794921875, -0.151031494140625, -0.13726806640625, -0.123504638671875, -0.1097412109375, -0.095977783203125, -0.08221435546875, -0.068450927734375, -0.0546875, -0.040924072265625, -0.02716064453125, -0.013397216796875, 0.0003662109375, 0.014129638671875, 0.02789306640625, 0.041656494140625, 0.055419921875, 0.069183349609375, 0.08294677734375, 0.096710205078125, 0.1104736328125, 0.124237060546875, 0.13800048828125, 0.151763916015625, 0.16552734375, 0.179290771484375, 0.19305419921875, 0.206817626953125, 0.2205810546875, 0.234344482421875, 0.24810791015625, 0.261871337890625, 0.275634765625, 0.289398193359375, 0.30316162109375, 0.316925048828125, 0.3306884765625, 0.344451904296875, 0.35821533203125, 0.371978759765625, 0.3857421875, 0.399505615234375, 0.41326904296875, 0.427032470703125, 0.4407958984375, 0.454559326171875, 0.46832275390625, 0.482086181640625, 0.495849609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 7.0, 44.0, 139.0, 291.0, 303.0, 136.0, 36.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.2763328552246094, -0.26677703857421875, -0.2572212219238281, -0.2476654052734375, -0.23810958862304688, -0.22855377197265625, -0.21899795532226562, -0.209442138671875, -0.19988632202148438, -0.19033050537109375, -0.18077468872070312, -0.1712188720703125, -0.16166305541992188, -0.15210723876953125, -0.14255142211914062, -0.13299560546875, -0.12343978881835938, -0.11388397216796875, -0.10432815551757812, -0.0947723388671875, -0.08521652221679688, -0.07566070556640625, -0.06610488891601562, -0.056549072265625, -0.046993255615234375, -0.03743743896484375, -0.027881622314453125, -0.0183258056640625, -0.008769989013671875, 0.00078582763671875, 0.010341644287109375, 0.0198974609375, 0.029453277587890625, 0.03900909423828125, 0.048564910888671875, 0.0581207275390625, 0.06767654418945312, 0.07723236083984375, 0.08678817749023438, 0.096343994140625, 0.10589981079101562, 0.11545562744140625, 0.12501144409179688, 0.1345672607421875, 0.14412307739257812, 0.15367889404296875, 0.16323471069335938, 0.17279052734375, 0.18234634399414062, 0.19190216064453125, 0.20145797729492188, 0.2110137939453125, 0.22056961059570312, 0.23012542724609375, 0.23968124389648438, 0.249237060546875, 0.2587928771972656, 0.26834869384765625, 0.2779045104980469, 0.2874603271484375, 0.2970161437988281, 0.30657196044921875, 0.3161277770996094, 0.32568359375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 13.0, 29.0, 47.0, 109.0, 216.0, 292.0, 172.0, 69.0, 28.0, 14.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029388666152954, -0.9887472987174988, -0.9481059908866882, -0.9074646234512329, -0.8668233156204224, -0.826181948184967, -0.7855405807495117, -0.7448992729187012, -0.7042579054832458, -0.6636165380477905, -0.62297523021698, -0.5823338627815247, -0.5416924953460693, -0.5010511875152588, -0.46040982007980347, -0.41976848244667053, -0.3791271448135376, -0.33848580718040466, -0.29784446954727173, -0.2572031021118164, -0.21656176447868347, -0.17592042684555054, -0.1352790743112564, -0.09463772177696228, -0.053996384143829346, -0.013355039060115814, 0.027286306023597717, 0.06792765110731125, 0.10856899619102478, 0.14921033382415771, 0.18985168635845184, 0.23049303889274597, 0.27113425731658936, 0.3117755949497223, 0.3524169325828552, 0.39305830001831055, 0.4336996376514435, 0.4743409752845764, 0.5149823427200317, 0.5556236505508423, 0.5962650179862976, 0.6369063854217529, 0.6775476932525635, 0.7181890606880188, 0.7588304281234741, 0.7994717359542847, 0.84011310338974, 0.8807544708251953, 0.9213957786560059, 0.9620371460914612, 1.0026785135269165, 1.043319821357727, 1.0839611291885376, 1.1246025562286377, 1.1652438640594482, 1.2058851718902588, 1.2465264797210693, 1.2871677875518799, 1.32780921459198, 1.3684505224227905, 1.409091830253601, 1.4497332572937012, 1.4903745651245117, 1.5310158729553223, 1.5716572999954224]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 11.0, 10.0, 14.0, 19.0, 28.0, 25.0, 37.0, 68.0, 72.0, 69.0, 96.0, 68.0, 69.0, 79.0, 72.0, 54.0, 36.0, 36.0, 31.0, 29.0, 8.0, 12.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7312377691268921, -0.7045794725418091, -0.6779211759567261, -0.6512628793716431, -0.6246045231819153, -0.5979462265968323, -0.5712879300117493, -0.5446296334266663, -0.5179712772369385, -0.49131298065185547, -0.4646546542644501, -0.43799635767936707, -0.41133803129196167, -0.38467973470687866, -0.35802143812179565, -0.33136314153671265, -0.30470484495162964, -0.27804654836654663, -0.25138822197914124, -0.22472992539405823, -0.19807161390781403, -0.17141330242156982, -0.14475500583648682, -0.11809669435024261, -0.09143838286399841, -0.06478007137775421, -0.03812176734209061, -0.011463463306427002, 0.0151948481798172, 0.0418531596660614, 0.06851145625114441, 0.09516976773738861, 0.12182801961898804, 0.14848633110523224, 0.17514464259147644, 0.20180293917655945, 0.22846125066280365, 0.25511956214904785, 0.28177785873413086, 0.30843615531921387, 0.33509448170661926, 0.36175277829170227, 0.38841110467910767, 0.4150694012641907, 0.4417276978492737, 0.4683860242366791, 0.4950443208217621, 0.5217026472091675, 0.5483609437942505, 0.5750192403793335, 0.6016775369644165, 0.6283358335494995, 0.6549941897392273, 0.6816524863243103, 0.7083107829093933, 0.7349690794944763, 0.7616274356842041, 0.7882857322692871, 0.8149440288543701, 0.8416023254394531, 0.8682606816291809, 0.8949189782142639, 0.9215772747993469, 0.9482355713844299, 0.9748938679695129]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 6.0, 6.0, 11.0, 14.0, 22.0, 31.0, 56.0, 103.0, 172.0, 342.0, 647.0, 1134.0, 2199.0, 5843.0, 21866.0, 459850.0, 3658130.0, 31666.0, 7142.0, 2407.0, 1080.0, 616.0, 344.0, 181.0, 133.0, 94.0, 44.0, 43.0, 17.0, 19.0, 18.0, 14.0, 5.0, 5.0, 12.0, 4.0, 3.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.488525390625, -0.4728202819824219, -0.45711517333984375, -0.4414100646972656, -0.4257049560546875, -0.4099998474121094, -0.39429473876953125, -0.3785896301269531, -0.362884521484375, -0.3471794128417969, -0.33147430419921875, -0.3157691955566406, -0.3000640869140625, -0.2843589782714844, -0.26865386962890625, -0.2529487609863281, -0.23724365234375, -0.22153854370117188, -0.20583343505859375, -0.19012832641601562, -0.1744232177734375, -0.15871810913085938, -0.14301300048828125, -0.12730789184570312, -0.111602783203125, -0.09589767456054688, -0.08019256591796875, -0.06448745727539062, -0.0487823486328125, -0.033077239990234375, -0.01737213134765625, -0.001667022705078125, 0.0140380859375, 0.029743194580078125, 0.04544830322265625, 0.061153411865234375, 0.0768585205078125, 0.09256362915039062, 0.10826873779296875, 0.12397384643554688, 0.139678955078125, 0.15538406372070312, 0.17108917236328125, 0.18679428100585938, 0.2024993896484375, 0.21820449829101562, 0.23390960693359375, 0.24961471557617188, 0.26531982421875, 0.2810249328613281, 0.29673004150390625, 0.3124351501464844, 0.3281402587890625, 0.3438453674316406, 0.35955047607421875, 0.3752555847167969, 0.390960693359375, 0.4066658020019531, 0.42237091064453125, 0.4380760192871094, 0.4537811279296875, 0.4694862365722656, 0.48519134521484375, 0.5008964538574219, 0.5166015625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 2.0, 5.0, 5.0, 15.0, 9.0, 11.0, 10.0, 17.0, 29.0, 37.0, 56.0, 82.0, 102.0, 113.0, 118.0, 98.0, 66.0, 75.0, 49.0, 27.0, 23.0, 14.0, 7.0, 5.0, 3.0, 8.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018524169921875, -0.01788640022277832, -0.01724863052368164, -0.01661086082458496, -0.01597309112548828, -0.015335321426391602, -0.014697551727294922, -0.014059782028198242, -0.013422012329101562, -0.012784242630004883, -0.012146472930908203, -0.011508703231811523, -0.010870933532714844, -0.010233163833618164, -0.009595394134521484, -0.008957624435424805, -0.008319854736328125, -0.007682085037231445, -0.007044315338134766, -0.006406545639038086, -0.005768775939941406, -0.0051310062408447266, -0.004493236541748047, -0.003855466842651367, -0.0032176971435546875, -0.002579927444458008, -0.0019421577453613281, -0.0013043880462646484, -0.0006666183471679688, -2.8848648071289062e-05, 0.0006089210510253906, 0.0012466907501220703, 0.00188446044921875, 0.0025222301483154297, 0.0031599998474121094, 0.003797769546508789, 0.004435539245605469, 0.0050733089447021484, 0.005711078643798828, 0.006348848342895508, 0.0069866180419921875, 0.007624387741088867, 0.008262157440185547, 0.008899927139282227, 0.009537696838378906, 0.010175466537475586, 0.010813236236572266, 0.011451005935668945, 0.012088775634765625, 0.012726545333862305, 0.013364315032958984, 0.014002084732055664, 0.014639854431152344, 0.015277624130249023, 0.015915393829345703, 0.016553163528442383, 0.017190933227539062, 0.017828702926635742, 0.018466472625732422, 0.0191042423248291, 0.01974201202392578, 0.02037978172302246, 0.02101755142211914, 0.02165532112121582, 0.0222930908203125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 2.0, 8.0, 6.0, 9.0, 14.0, 12.0, 18.0, 38.0, 38.0, 60.0, 140.0, 554.0, 7457.0, 4069391.0, 113971.0, 1943.0, 310.0, 114.0, 54.0, 42.0, 29.0, 16.0, 10.0, 12.0, 5.0, 2.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1328125, -1.1020126342773438, -1.0712127685546875, -1.0404129028320312, -1.009613037109375, -0.9788131713867188, -0.9480133056640625, -0.9172134399414062, -0.88641357421875, -0.8556137084960938, -0.8248138427734375, -0.7940139770507812, -0.763214111328125, -0.7324142456054688, -0.7016143798828125, -0.6708145141601562, -0.6400146484375, -0.6092147827148438, -0.5784149169921875, -0.5476150512695312, -0.516815185546875, -0.48601531982421875, -0.4552154541015625, -0.42441558837890625, -0.39361572265625, -0.36281585693359375, -0.3320159912109375, -0.30121612548828125, -0.270416259765625, -0.23961639404296875, -0.2088165283203125, -0.17801666259765625, -0.147216796875, -0.11641693115234375, -0.0856170654296875, -0.05481719970703125, -0.024017333984375, 0.00678253173828125, 0.0375823974609375, 0.06838226318359375, 0.09918212890625, 0.12998199462890625, 0.1607818603515625, 0.19158172607421875, 0.222381591796875, 0.25318145751953125, 0.2839813232421875, 0.31478118896484375, 0.3455810546875, 0.37638092041015625, 0.4071807861328125, 0.43798065185546875, 0.468780517578125, 0.49958038330078125, 0.5303802490234375, 0.5611801147460938, 0.59197998046875, 0.6227798461914062, 0.6535797119140625, 0.6843795776367188, 0.715179443359375, 0.7459793090820312, 0.7767791748046875, 0.8075790405273438, 0.83837890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 7.0, 4.0, 10.0, 15.0, 14.0, 36.0, 41.0, 56.0, 75.0, 154.0, 360.0, 1087.0, 1406.0, 342.0, 169.0, 87.0, 57.0, 43.0, 17.0, 19.0, 17.0, 14.0, 5.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032958984375, -0.03174257278442383, -0.030526161193847656, -0.029309749603271484, -0.028093338012695312, -0.02687692642211914, -0.02566051483154297, -0.024444103240966797, -0.023227691650390625, -0.022011280059814453, -0.02079486846923828, -0.01957845687866211, -0.018362045288085938, -0.017145633697509766, -0.015929222106933594, -0.014712810516357422, -0.01349639892578125, -0.012279987335205078, -0.011063575744628906, -0.009847164154052734, -0.008630752563476562, -0.007414340972900391, -0.006197929382324219, -0.004981517791748047, -0.003765106201171875, -0.002548694610595703, -0.0013322830200195312, -0.00011587142944335938, 0.0011005401611328125, 0.0023169517517089844, 0.0035333633422851562, 0.004749774932861328, 0.0059661865234375, 0.007182598114013672, 0.008399009704589844, 0.009615421295166016, 0.010831832885742188, 0.01204824447631836, 0.013264656066894531, 0.014481067657470703, 0.015697479248046875, 0.016913890838623047, 0.01813030242919922, 0.01934671401977539, 0.020563125610351562, 0.021779537200927734, 0.022995948791503906, 0.024212360382080078, 0.02542877197265625, 0.026645183563232422, 0.027861595153808594, 0.029078006744384766, 0.030294418334960938, 0.03151082992553711, 0.03272724151611328, 0.03394365310668945, 0.035160064697265625, 0.0363764762878418, 0.03759288787841797, 0.03880929946899414, 0.04002571105957031, 0.041242122650146484, 0.042458534240722656, 0.04367494583129883, 0.044891357421875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 65.0, 344.0, 446.0, 104.0, 30.0, 8.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0158137083053589, -0.9942454099655151, -0.9726771116256714, -0.9511088132858276, -0.9295405149459839, -0.9079722166061401, -0.8864039182662964, -0.8648356199264526, -0.8432673215866089, -0.8216990232467651, -0.8001307249069214, -0.7785624265670776, -0.7569941282272339, -0.7354258298873901, -0.7138575315475464, -0.6922892332077026, -0.6707209944725037, -0.6491526961326599, -0.6275843977928162, -0.6060160994529724, -0.5844478011131287, -0.5628795027732849, -0.5413112640380859, -0.5197429656982422, -0.49817463755607605, -0.4766063392162323, -0.45503804087638855, -0.4334697723388672, -0.41190147399902344, -0.3903331756591797, -0.36876487731933594, -0.3471965789794922, -0.32562822103500366, -0.3040599226951599, -0.28249162435531616, -0.2609233260154724, -0.23935504257678986, -0.2177867442369461, -0.19621846079826355, -0.1746501624584198, -0.15308186411857605, -0.1315135657787323, -0.10994527488946915, -0.088376984000206, -0.06680868566036224, -0.045240387320518494, -0.023672103881835938, -0.0021038055419921875, 0.019464492797851562, 0.041032787412405014, 0.06260108202695847, 0.08416937291622162, 0.10573767125606537, 0.12730596959590912, 0.14887425303459167, 0.17044255137443542, 0.19201084971427917, 0.21357914805412292, 0.23514744639396667, 0.25671571493148804, 0.2782840132713318, 0.29985231161117554, 0.3214206099510193, 0.34298890829086304, 0.3645572066307068]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 6.0, 9.0, 9.0, 13.0, 18.0, 19.0, 25.0, 36.0, 29.0, 48.0, 38.0, 61.0, 53.0, 73.0, 70.0, 66.0, 66.0, 55.0, 48.0, 40.0, 50.0, 33.0, 28.0, 17.0, 16.0, 9.0, 16.0, 6.0, 6.0, 7.0, 5.0, 5.0, 3.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1656232476234436, -0.16074219346046448, -0.15586115419864655, -0.15098010003566742, -0.1460990458726883, -0.14121800661087036, -0.13633695244789124, -0.1314558982849121, -0.12657484412193298, -0.12169379740953445, -0.11681274324655533, -0.1119316965341568, -0.10705064237117767, -0.10216959565877914, -0.09728854894638062, -0.09240749478340149, -0.08752645552158356, -0.08264540880918503, -0.0777643546462059, -0.07288330793380737, -0.06800225377082825, -0.06312120705842972, -0.05824016034603119, -0.05335910990834236, -0.048478059470653534, -0.043597009032964706, -0.03871595859527588, -0.03383491188287735, -0.028953861445188522, -0.024072811007499695, -0.019191762432456017, -0.014310713857412338, -0.00942966341972351, -0.004548613913357258, 0.00033243559300899506, 0.005213485099375248, 0.0100945346057415, 0.014975585043430328, 0.019856633618474007, 0.024737682193517685, 0.029618732631206512, 0.03449978306889534, 0.03938083350658417, 0.0442618802189827, 0.049142930656671524, 0.05402398109436035, 0.05890502780675888, 0.06378607451915741, 0.06866712868213654, 0.07354817539453506, 0.07842922955751419, 0.08331027626991272, 0.08819133043289185, 0.09307237714529037, 0.0979534238576889, 0.10283447802066803, 0.10771552473306656, 0.11259657144546509, 0.11747762560844421, 0.12235867232084274, 0.12723971903324127, 0.1321207731962204, 0.13700182735919952, 0.14188286662101746, 0.14676392078399658]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 5.0, 7.0, 2.0, 7.0, 11.0, 12.0, 4.0, 16.0, 25.0, 38.0, 46.0, 70.0, 87.0, 189.0, 438.0, 1467.0, 9039.0, 204971.0, 793321.0, 34053.0, 3255.0, 778.0, 291.0, 133.0, 100.0, 51.0, 31.0, 22.0, 20.0, 21.0, 7.0, 12.0, 8.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.309814453125, -0.3004951477050781, -0.29117584228515625, -0.2818565368652344, -0.2725372314453125, -0.2632179260253906, -0.25389862060546875, -0.24457931518554688, -0.235260009765625, -0.22594070434570312, -0.21662139892578125, -0.20730209350585938, -0.1979827880859375, -0.18866348266601562, -0.17934417724609375, -0.17002487182617188, -0.16070556640625, -0.15138626098632812, -0.14206695556640625, -0.13274765014648438, -0.1234283447265625, -0.11410903930664062, -0.10478973388671875, -0.09547042846679688, -0.086151123046875, -0.07683181762695312, -0.06751251220703125, -0.058193206787109375, -0.0488739013671875, -0.039554595947265625, -0.03023529052734375, -0.020915985107421875, -0.0115966796875, -0.002277374267578125, 0.00704193115234375, 0.016361236572265625, 0.0256805419921875, 0.034999847412109375, 0.04431915283203125, 0.053638458251953125, 0.062957763671875, 0.07227706909179688, 0.08159637451171875, 0.09091567993164062, 0.1002349853515625, 0.10955429077148438, 0.11887359619140625, 0.12819290161132812, 0.13751220703125, 0.14683151245117188, 0.15615081787109375, 0.16547012329101562, 0.1747894287109375, 0.18410873413085938, 0.19342803955078125, 0.20274734497070312, 0.212066650390625, 0.22138595581054688, 0.23070526123046875, 0.24002456665039062, 0.2493438720703125, 0.2586631774902344, 0.26798248291015625, 0.2773017883300781, 0.28662109375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 9.0, 5.0, 13.0, 25.0, 31.0, 53.0, 84.0, 131.0, 148.0, 151.0, 139.0, 93.0, 56.0, 34.0, 10.0, 14.0, 11.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03619384765625, -0.035288095474243164, -0.03438234329223633, -0.03347659111022949, -0.032570838928222656, -0.03166508674621582, -0.030759334564208984, -0.02985358238220215, -0.028947830200195312, -0.028042078018188477, -0.02713632583618164, -0.026230573654174805, -0.02532482147216797, -0.024419069290161133, -0.023513317108154297, -0.02260756492614746, -0.021701812744140625, -0.02079606056213379, -0.019890308380126953, -0.018984556198120117, -0.01807880401611328, -0.017173051834106445, -0.01626729965209961, -0.015361547470092773, -0.014455795288085938, -0.013550043106079102, -0.012644290924072266, -0.01173853874206543, -0.010832786560058594, -0.009927034378051758, -0.009021282196044922, -0.008115530014038086, -0.00720977783203125, -0.006304025650024414, -0.005398273468017578, -0.004492521286010742, -0.0035867691040039062, -0.0026810169219970703, -0.0017752647399902344, -0.0008695125579833984, 3.62396240234375e-05, 0.0009419918060302734, 0.0018477439880371094, 0.0027534961700439453, 0.0036592483520507812, 0.004565000534057617, 0.005470752716064453, 0.006376504898071289, 0.007282257080078125, 0.008188009262084961, 0.009093761444091797, 0.009999513626098633, 0.010905265808105469, 0.011811017990112305, 0.01271677017211914, 0.013622522354125977, 0.014528274536132812, 0.015434026718139648, 0.016339778900146484, 0.01724553108215332, 0.018151283264160156, 0.019057035446166992, 0.019962787628173828, 0.020868539810180664, 0.0217742919921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 11.0, 18.0, 19.0, 31.0, 43.0, 74.0, 114.0, 187.0, 292.0, 435.0, 940.0, 2139.0, 6743.0, 27274.0, 131512.0, 463825.0, 321910.0, 70286.0, 15363.0, 4185.0, 1497.0, 686.0, 339.0, 244.0, 129.0, 88.0, 60.0, 37.0, 38.0, 13.0, 14.0, 6.0, 3.0, 0.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.138671875, -0.1346874237060547, -0.13070297241210938, -0.12671852111816406, -0.12273406982421875, -0.11874961853027344, -0.11476516723632812, -0.11078071594238281, -0.1067962646484375, -0.10281181335449219, -0.09882736206054688, -0.09484291076660156, -0.09085845947265625, -0.08687400817871094, -0.08288955688476562, -0.07890510559082031, -0.074920654296875, -0.07093620300292969, -0.06695175170898438, -0.06296730041503906, -0.05898284912109375, -0.05499839782714844, -0.051013946533203125, -0.04702949523925781, -0.0430450439453125, -0.03906059265136719, -0.035076141357421875, -0.031091690063476562, -0.02710723876953125, -0.023122787475585938, -0.019138336181640625, -0.015153884887695312, -0.01116943359375, -0.0071849822998046875, -0.003200531005859375, 0.0007839202880859375, 0.00476837158203125, 0.008752822875976562, 0.012737274169921875, 0.016721725463867188, 0.0207061767578125, 0.024690628051757812, 0.028675079345703125, 0.03265953063964844, 0.03664398193359375, 0.04062843322753906, 0.044612884521484375, 0.04859733581542969, 0.052581787109375, 0.05656623840332031, 0.060550689697265625, 0.06453514099121094, 0.06851959228515625, 0.07250404357910156, 0.07648849487304688, 0.08047294616699219, 0.0844573974609375, 0.08844184875488281, 0.09242630004882812, 0.09641075134277344, 0.10039520263671875, 0.10437965393066406, 0.10836410522460938, 0.11234855651855469, 0.1163330078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 6.0, 3.0, 5.0, 7.0, 14.0, 10.0, 16.0, 22.0, 13.0, 27.0, 37.0, 26.0, 28.0, 37.0, 38.0, 30.0, 33.0, 49.0, 52.0, 43.0, 51.0, 41.0, 54.0, 43.0, 30.0, 31.0, 27.0, 34.0, 27.0, 24.0, 21.0, 20.0, 13.0, 20.0, 13.0, 8.0, 11.0, 2.0, 5.0, 4.0, 8.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05810546875, -0.05614280700683594, -0.054180145263671875, -0.05221748352050781, -0.05025482177734375, -0.04829216003417969, -0.046329498291015625, -0.04436683654785156, -0.0424041748046875, -0.04044151306152344, -0.038478851318359375, -0.03651618957519531, -0.03455352783203125, -0.03259086608886719, -0.030628204345703125, -0.028665542602539062, -0.026702880859375, -0.024740219116210938, -0.022777557373046875, -0.020814895629882812, -0.01885223388671875, -0.016889572143554688, -0.014926910400390625, -0.012964248657226562, -0.0110015869140625, -0.009038925170898438, -0.007076263427734375, -0.0051136016845703125, -0.00315093994140625, -0.0011882781982421875, 0.000774383544921875, 0.0027370452880859375, 0.00469970703125, 0.0066623687744140625, 0.008625030517578125, 0.010587692260742188, 0.01255035400390625, 0.014513015747070312, 0.016475677490234375, 0.018438339233398438, 0.0204010009765625, 0.022363662719726562, 0.024326324462890625, 0.026288986206054688, 0.02825164794921875, 0.030214309692382812, 0.032176971435546875, 0.03413963317871094, 0.036102294921875, 0.03806495666503906, 0.040027618408203125, 0.04199028015136719, 0.04395294189453125, 0.04591560363769531, 0.047878265380859375, 0.04984092712402344, 0.0518035888671875, 0.05376625061035156, 0.055728912353515625, 0.05769157409667969, 0.05965423583984375, 0.06161689758300781, 0.06357955932617188, 0.06554222106933594, 0.0675048828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 1.0, 5.0, 6.0, 10.0, 5.0, 14.0, 20.0, 30.0, 27.0, 49.0, 89.0, 138.0, 198.0, 440.0, 888.0, 2454.0, 8250.0, 43500.0, 390659.0, 523864.0, 61985.0, 10695.0, 2927.0, 1093.0, 493.0, 268.0, 145.0, 86.0, 59.0, 41.0, 25.0, 22.0, 18.0, 9.0, 6.0, 17.0, 6.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132080078125, -0.12796401977539062, -0.12384796142578125, -0.11973190307617188, -0.1156158447265625, -0.11149978637695312, -0.10738372802734375, -0.10326766967773438, -0.099151611328125, -0.09503555297851562, -0.09091949462890625, -0.08680343627929688, -0.0826873779296875, -0.07857131958007812, -0.07445526123046875, -0.07033920288085938, -0.06622314453125, -0.062107086181640625, -0.05799102783203125, -0.053874969482421875, -0.0497589111328125, -0.045642852783203125, -0.04152679443359375, -0.037410736083984375, -0.033294677734375, -0.029178619384765625, -0.02506256103515625, -0.020946502685546875, -0.0168304443359375, -0.012714385986328125, -0.00859832763671875, -0.004482269287109375, -0.0003662109375, 0.003749847412109375, 0.00786590576171875, 0.011981964111328125, 0.0160980224609375, 0.020214080810546875, 0.02433013916015625, 0.028446197509765625, 0.032562255859375, 0.036678314208984375, 0.04079437255859375, 0.044910430908203125, 0.0490264892578125, 0.053142547607421875, 0.05725860595703125, 0.061374664306640625, 0.06549072265625, 0.06960678100585938, 0.07372283935546875, 0.07783889770507812, 0.0819549560546875, 0.08607101440429688, 0.09018707275390625, 0.09430313110351562, 0.098419189453125, 0.10253524780273438, 0.10665130615234375, 0.11076736450195312, 0.1148834228515625, 0.11899948120117188, 0.12311553955078125, 0.12723159790039062, 0.13134765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 6.0, 3.0, 5.0, 8.0, 14.0, 10.0, 22.0, 16.0, 23.0, 36.0, 65.0, 94.0, 117.0, 132.0, 109.0, 105.0, 61.0, 38.0, 35.0, 28.0, 20.0, 12.0, 8.0, 14.0, 4.0, 7.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003173351287841797, -0.0003069452941417694, -0.00029655545949935913, -0.00028616562485694885, -0.0002757757902145386, -0.0002653859555721283, -0.000254996120929718, -0.00024460628628730774, -0.00023421645164489746, -0.00022382661700248718, -0.0002134367823600769, -0.00020304694771766663, -0.00019265711307525635, -0.00018226727843284607, -0.0001718774437904358, -0.0001614876091480255, -0.00015109777450561523, -0.00014070793986320496, -0.00013031810522079468, -0.0001199282705783844, -0.00010953843593597412, -9.914860129356384e-05, -8.875876665115356e-05, -7.836893200874329e-05, -6.797909736633301e-05, -5.758926272392273e-05, -4.719942808151245e-05, -3.680959343910217e-05, -2.6419758796691895e-05, -1.6029924154281616e-05, -5.640089511871338e-06, 4.7497451305389404e-06, 1.5139579772949219e-05, 2.5529414415359497e-05, 3.5919249057769775e-05, 4.6309083700180054e-05, 5.669891834259033e-05, 6.708875298500061e-05, 7.747858762741089e-05, 8.786842226982117e-05, 9.825825691223145e-05, 0.00010864809155464172, 0.000119037926197052, 0.00012942776083946228, 0.00013981759548187256, 0.00015020743012428284, 0.00016059726476669312, 0.0001709870994091034, 0.00018137693405151367, 0.00019176676869392395, 0.00020215660333633423, 0.0002125464379787445, 0.00022293627262115479, 0.00023332610726356506, 0.00024371594190597534, 0.0002541057765483856, 0.0002644956111907959, 0.0002748854458332062, 0.00028527528047561646, 0.00029566511511802673, 0.000306054949760437, 0.0003164447844028473, 0.00032683461904525757, 0.00033722445368766785, 0.0003476142883300781]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 6.0, 0.0, 6.0, 5.0, 8.0, 25.0, 16.0, 29.0, 49.0, 55.0, 86.0, 116.0, 180.0, 315.0, 505.0, 1013.0, 2108.0, 4575.0, 12216.0, 37860.0, 156260.0, 516307.0, 237165.0, 52708.0, 15536.0, 5931.0, 2535.0, 1280.0, 661.0, 347.0, 197.0, 126.0, 107.0, 62.0, 35.0, 46.0, 25.0, 14.0, 14.0, 3.0, 7.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1064453125, -0.10297012329101562, -0.09949493408203125, -0.09601974487304688, -0.0925445556640625, -0.08906936645507812, -0.08559417724609375, -0.08211898803710938, -0.078643798828125, -0.07516860961914062, -0.07169342041015625, -0.06821823120117188, -0.0647430419921875, -0.061267852783203125, -0.05779266357421875, -0.054317474365234375, -0.05084228515625, -0.047367095947265625, -0.04389190673828125, -0.040416717529296875, -0.0369415283203125, -0.033466339111328125, -0.02999114990234375, -0.026515960693359375, -0.023040771484375, -0.019565582275390625, -0.01609039306640625, -0.012615203857421875, -0.0091400146484375, -0.005664825439453125, -0.00218963623046875, 0.001285552978515625, 0.0047607421875, 0.008235931396484375, 0.01171112060546875, 0.015186309814453125, 0.0186614990234375, 0.022136688232421875, 0.02561187744140625, 0.029087066650390625, 0.032562255859375, 0.036037445068359375, 0.03951263427734375, 0.042987823486328125, 0.0464630126953125, 0.049938201904296875, 0.05341339111328125, 0.056888580322265625, 0.06036376953125, 0.06383895874023438, 0.06731414794921875, 0.07078933715820312, 0.0742645263671875, 0.07773971557617188, 0.08121490478515625, 0.08469009399414062, 0.088165283203125, 0.09164047241210938, 0.09511566162109375, 0.09859085083007812, 0.1020660400390625, 0.10554122924804688, 0.10901641845703125, 0.11249160766601562, 0.115966796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 9.0, 7.0, 6.0, 10.0, 14.0, 16.0, 34.0, 32.0, 47.0, 55.0, 67.0, 83.0, 80.0, 97.0, 81.0, 82.0, 61.0, 51.0, 38.0, 31.0, 23.0, 16.0, 10.0, 9.0, 7.0, 6.0, 5.0, 8.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0660400390625, -0.06378650665283203, -0.06153297424316406, -0.059279441833496094, -0.057025909423828125, -0.054772377014160156, -0.05251884460449219, -0.05026531219482422, -0.04801177978515625, -0.04575824737548828, -0.04350471496582031, -0.041251182556152344, -0.038997650146484375, -0.036744117736816406, -0.03449058532714844, -0.03223705291748047, -0.0299835205078125, -0.02772998809814453, -0.025476455688476562, -0.023222923278808594, -0.020969390869140625, -0.018715858459472656, -0.016462326049804688, -0.014208793640136719, -0.01195526123046875, -0.009701728820800781, -0.0074481964111328125, -0.005194664001464844, -0.002941131591796875, -0.0006875991821289062, 0.0015659332275390625, 0.0038194656372070312, 0.006072998046875, 0.008326530456542969, 0.010580062866210938, 0.012833595275878906, 0.015087127685546875, 0.017340660095214844, 0.019594192504882812, 0.02184772491455078, 0.02410125732421875, 0.02635478973388672, 0.028608322143554688, 0.030861854553222656, 0.033115386962890625, 0.035368919372558594, 0.03762245178222656, 0.03987598419189453, 0.0421295166015625, 0.04438304901123047, 0.04663658142089844, 0.048890113830566406, 0.051143646240234375, 0.053397178649902344, 0.05565071105957031, 0.05790424346923828, 0.06015777587890625, 0.06241130828857422, 0.06466484069824219, 0.06691837310791016, 0.06917190551757812, 0.0714254379272461, 0.07367897033691406, 0.07593250274658203, 0.07818603515625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 70.0, 619.0, 268.0, 33.0, 12.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.495405673980713, -5.377796649932861, -5.26018762588501, -5.142578601837158, -5.024969100952148, -4.907360076904297, -4.789751052856445, -4.672142028808594, -4.554533004760742, -4.436923980712891, -4.319314956665039, -4.2017059326171875, -4.084096431732178, -3.966487407684326, -3.8488783836364746, -3.731269359588623, -3.6136603355407715, -3.49605131149292, -3.3784420490264893, -3.2608330249786377, -3.143224000930786, -3.0256147384643555, -2.908005714416504, -2.7903966903686523, -2.6727874279022217, -2.55517840385437, -2.4375691413879395, -2.319960117340088, -2.2023510932922363, -2.0847420692443848, -1.967132806777954, -1.8495237827301025, -1.731914758682251, -1.6143056154251099, -1.4966965913772583, -1.3790874481201172, -1.2614784240722656, -1.1438692808151245, -1.0262601375579834, -0.9086511135101318, -0.7910420298576355, -0.6734329462051392, -0.5558238625526428, -0.4382147490978241, -0.32060566544532776, -0.20299655199050903, -0.0853874683380127, 0.03222161531448364, 0.14983069896697998, 0.2674397826194763, 0.38504886627197266, 0.5026580095291138, 0.6202670335769653, 0.7378761768341064, 0.8554852604866028, 0.9730943441390991, 1.0907034873962402, 1.2083126306533813, 1.325921654701233, 1.443530797958374, 1.5611398220062256, 1.6787489652633667, 1.7963581085205078, 1.9139671325683594, 2.031576156616211]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 11.0, 9.0, 6.0, 13.0, 21.0, 23.0, 24.0, 29.0, 32.0, 48.0, 54.0, 68.0, 48.0, 56.0, 67.0, 69.0, 44.0, 59.0, 60.0, 40.0, 39.0, 33.0, 29.0, 25.0, 19.0, 20.0, 18.0, 9.0, 8.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.7037016153335571, -0.684956431388855, -0.6662112474441528, -0.6474660634994507, -0.6287208795547485, -0.6099756956100464, -0.5912305116653442, -0.5724853277206421, -0.5537401437759399, -0.5349949598312378, -0.5162497758865356, -0.4975045919418335, -0.47875940799713135, -0.4600142240524292, -0.44126904010772705, -0.4225238561630249, -0.40377870202064514, -0.385033518075943, -0.36628833413124084, -0.3475431501865387, -0.32879796624183655, -0.3100527822971344, -0.29130762815475464, -0.2725624442100525, -0.25381726026535034, -0.2350720763206482, -0.21632689237594604, -0.1975817084312439, -0.17883652448654175, -0.1600913405418396, -0.14134617149829865, -0.1226009875535965, -0.10385578870773315, -0.085110604763031, -0.06636542081832886, -0.047620244324207306, -0.028875060379505157, -0.010129876434803009, 0.008615300059318542, 0.02736048400402069, 0.04610566794872284, 0.06485085189342499, 0.08359603583812714, 0.10234121233224869, 0.12108639627695084, 0.1398315727710724, 0.15857675671577454, 0.17732194066047668, 0.19606712460517883, 0.21481230854988098, 0.23355749249458313, 0.2523026764392853, 0.2710478603839874, 0.2897930443286896, 0.30853819847106934, 0.3272833824157715, 0.34602856636047363, 0.3647737503051758, 0.38351893424987793, 0.4022641181945801, 0.4210093021392822, 0.4397544860839844, 0.4584996700286865, 0.47724485397338867, 0.4959900379180908]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 15.0, 18.0, 32.0, 58.0, 106.0, 187.0, 507.0, 7241.0, 4167000.0, 18191.0, 628.0, 145.0, 83.0, 31.0, 14.0, 12.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.771484375, -1.72674560546875, -1.6820068359375, -1.63726806640625, -1.592529296875, -1.54779052734375, -1.5030517578125, -1.45831298828125, -1.41357421875, -1.36883544921875, -1.3240966796875, -1.27935791015625, -1.234619140625, -1.18988037109375, -1.1451416015625, -1.10040283203125, -1.0556640625, -1.01092529296875, -0.9661865234375, -0.92144775390625, -0.876708984375, -0.83197021484375, -0.7872314453125, -0.74249267578125, -0.69775390625, -0.65301513671875, -0.6082763671875, -0.56353759765625, -0.518798828125, -0.47406005859375, -0.4293212890625, -0.38458251953125, -0.33984375, -0.29510498046875, -0.2503662109375, -0.20562744140625, -0.160888671875, -0.11614990234375, -0.0714111328125, -0.02667236328125, 0.01806640625, 0.06280517578125, 0.1075439453125, 0.15228271484375, 0.197021484375, 0.24176025390625, 0.2864990234375, 0.33123779296875, 0.3759765625, 0.42071533203125, 0.4654541015625, 0.51019287109375, 0.554931640625, 0.59967041015625, 0.6444091796875, 0.68914794921875, 0.73388671875, 0.77862548828125, 0.8233642578125, 0.86810302734375, 0.912841796875, 0.95758056640625, 1.0023193359375, 1.04705810546875, 1.091796875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 18.0, 18.0, 40.0, 65.0, 83.0, 122.0, 146.0, 142.0, 109.0, 97.0, 55.0, 47.0, 25.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04339599609375, -0.04228472709655762, -0.041173458099365234, -0.04006218910217285, -0.03895092010498047, -0.037839651107788086, -0.0367283821105957, -0.03561711311340332, -0.03450584411621094, -0.033394575119018555, -0.03228330612182617, -0.03117203712463379, -0.030060768127441406, -0.028949499130249023, -0.02783823013305664, -0.026726961135864258, -0.025615692138671875, -0.024504423141479492, -0.02339315414428711, -0.022281885147094727, -0.021170616149902344, -0.02005934715270996, -0.018948078155517578, -0.017836809158325195, -0.016725540161132812, -0.01561427116394043, -0.014503002166748047, -0.013391733169555664, -0.012280464172363281, -0.011169195175170898, -0.010057926177978516, -0.008946657180786133, -0.00783538818359375, -0.006724119186401367, -0.005612850189208984, -0.0045015811920166016, -0.0033903121948242188, -0.002279043197631836, -0.0011677742004394531, -5.650520324707031e-05, 0.0010547637939453125, 0.0021660327911376953, 0.003277301788330078, 0.004388570785522461, 0.005499839782714844, 0.0066111087799072266, 0.007722377777099609, 0.008833646774291992, 0.009944915771484375, 0.011056184768676758, 0.01216745376586914, 0.013278722763061523, 0.014389991760253906, 0.015501260757446289, 0.016612529754638672, 0.017723798751831055, 0.018835067749023438, 0.01994633674621582, 0.021057605743408203, 0.022168874740600586, 0.02328014373779297, 0.02439141273498535, 0.025502681732177734, 0.026613950729370117, 0.0277252197265625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 13.0, 19.0, 28.0, 48.0, 81.0, 134.0, 228.0, 445.0, 1240.0, 7232.0, 237978.0, 3914607.0, 27827.0, 2813.0, 780.0, 335.0, 179.0, 117.0, 72.0, 34.0, 23.0, 22.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.765625, -0.7486953735351562, -0.7317657470703125, -0.7148361206054688, -0.697906494140625, -0.6809768676757812, -0.6640472412109375, -0.6471176147460938, -0.63018798828125, -0.6132583618164062, -0.5963287353515625, -0.5793991088867188, -0.562469482421875, -0.5455398559570312, -0.5286102294921875, -0.5116806030273438, -0.4947509765625, -0.47782135009765625, -0.4608917236328125, -0.44396209716796875, -0.427032470703125, -0.41010284423828125, -0.3931732177734375, -0.37624359130859375, -0.35931396484375, -0.34238433837890625, -0.3254547119140625, -0.30852508544921875, -0.291595458984375, -0.27466583251953125, -0.2577362060546875, -0.24080657958984375, -0.223876953125, -0.20694732666015625, -0.1900177001953125, -0.17308807373046875, -0.156158447265625, -0.13922882080078125, -0.1222991943359375, -0.10536956787109375, -0.08843994140625, -0.07151031494140625, -0.0545806884765625, -0.03765106201171875, -0.020721435546875, -0.00379180908203125, 0.0131378173828125, 0.03006744384765625, 0.0469970703125, 0.06392669677734375, 0.0808563232421875, 0.09778594970703125, 0.114715576171875, 0.13164520263671875, 0.1485748291015625, 0.16550445556640625, 0.18243408203125, 0.19936370849609375, 0.2162933349609375, 0.23322296142578125, 0.250152587890625, 0.26708221435546875, 0.2840118408203125, 0.30094146728515625, 0.31787109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 9.0, 10.0, 22.0, 51.0, 115.0, 395.0, 2282.0, 787.0, 195.0, 87.0, 49.0, 36.0, 16.0, 10.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06048583984375, -0.057824134826660156, -0.05516242980957031, -0.05250072479248047, -0.049839019775390625, -0.04717731475830078, -0.04451560974121094, -0.041853904724121094, -0.03919219970703125, -0.036530494689941406, -0.03386878967285156, -0.03120708465576172, -0.028545379638671875, -0.02588367462158203, -0.023221969604492188, -0.020560264587402344, -0.0178985595703125, -0.015236854553222656, -0.012575149536132812, -0.009913444519042969, -0.007251739501953125, -0.004590034484863281, -0.0019283294677734375, 0.0007333755493164062, 0.00339508056640625, 0.006056785583496094, 0.008718490600585938, 0.011380195617675781, 0.014041900634765625, 0.01670360565185547, 0.019365310668945312, 0.022027015686035156, 0.024688720703125, 0.027350425720214844, 0.030012130737304688, 0.03267383575439453, 0.035335540771484375, 0.03799724578857422, 0.04065895080566406, 0.043320655822753906, 0.04598236083984375, 0.048644065856933594, 0.05130577087402344, 0.05396747589111328, 0.056629180908203125, 0.05929088592529297, 0.06195259094238281, 0.06461429595947266, 0.0672760009765625, 0.06993770599365234, 0.07259941101074219, 0.07526111602783203, 0.07792282104492188, 0.08058452606201172, 0.08324623107910156, 0.0859079360961914, 0.08856964111328125, 0.0912313461303711, 0.09389305114746094, 0.09655475616455078, 0.09921646118164062, 0.10187816619873047, 0.10453987121582031, 0.10720157623291016, 0.10986328125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 21.0, 81.0, 333.0, 386.0, 138.0, 23.0, 14.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8619567155838013, -0.834230363368988, -0.8065040111541748, -0.7787776589393616, -0.7510513067245483, -0.7233248949050903, -0.6955985426902771, -0.6678721904754639, -0.6401458382606506, -0.6124194860458374, -0.5846931338310242, -0.5569667816162109, -0.5292403697967529, -0.5015140771865845, -0.47378766536712646, -0.44606131315231323, -0.4183349609375, -0.39060860872268677, -0.36288225650787354, -0.3351558744907379, -0.3074295222759247, -0.27970317006111145, -0.25197678804397583, -0.2242504358291626, -0.19652408361434937, -0.16879773139953613, -0.1410713642835617, -0.11334500461816788, -0.08561864495277405, -0.057892292737960815, -0.03016592562198639, -0.002439558506011963, 0.02528679370880127, 0.0530131533741951, 0.08073951303958893, 0.10846587270498276, 0.1361922323703766, 0.16391858458518982, 0.19164495170116425, 0.21937131881713867, 0.2470976710319519, 0.27482402324676514, 0.30255037546157837, 0.330276757478714, 0.3580031096935272, 0.38572946190834045, 0.4134558439254761, 0.4411821961402893, 0.46890854835510254, 0.49663490056991577, 0.524361252784729, 0.5520876049995422, 0.5798139572143555, 0.6075403690338135, 0.6352667212486267, 0.6629930734634399, 0.6907194256782532, 0.7184457778930664, 0.7461721301078796, 0.7738984823226929, 0.8016248941421509, 0.8293511867523193, 0.8570775985717773, 0.8848039507865906, 0.9125303030014038]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 11.0, 20.0, 19.0, 28.0, 35.0, 46.0, 65.0, 77.0, 79.0, 100.0, 87.0, 91.0, 76.0, 64.0, 49.0, 57.0, 19.0, 26.0, 14.0, 14.0, 9.0, 8.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.29967689514160156, -0.2895333766937256, -0.2793898582458496, -0.26924633979797363, -0.25910285115242004, -0.24895933270454407, -0.2388158142566681, -0.22867229580879211, -0.21852877736091614, -0.20838525891304016, -0.19824175536632538, -0.1880982369184494, -0.17795471847057343, -0.16781121492385864, -0.15766769647598267, -0.1475241780281067, -0.1373806744813919, -0.12723715603351593, -0.11709364503622055, -0.10695013403892517, -0.0968066155910492, -0.08666310459375381, -0.07651959359645844, -0.06637607514858246, -0.05623256415128708, -0.0460890494287014, -0.03594553470611572, -0.025802023708820343, -0.015658508986234665, -0.005514994263648987, 0.004628516733646393, 0.01477203518152237, 0.02491554617881775, 0.03505906090140343, 0.045202575623989105, 0.055346086621284485, 0.06548960506916046, 0.07563311606645584, 0.08577662706375122, 0.0959201455116272, 0.10606365650892258, 0.11620716750621796, 0.12635068595409393, 0.13649418950080872, 0.1466377079486847, 0.15678122639656067, 0.16692474484443665, 0.17706826329231262, 0.1872117668390274, 0.19735528528690338, 0.20749878883361816, 0.21764230728149414, 0.22778582572937012, 0.2379293441772461, 0.24807284772396088, 0.25821638107299805, 0.26835986971855164, 0.2785033881664276, 0.2886469066143036, 0.2987903952598572, 0.30893391370773315, 0.31907743215560913, 0.3292209506034851, 0.3393644690513611, 0.34950798749923706]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 4.0, 7.0, 7.0, 15.0, 15.0, 25.0, 33.0, 39.0, 56.0, 117.0, 238.0, 818.0, 4224.0, 68136.0, 873645.0, 94632.0, 5013.0, 929.0, 268.0, 120.0, 66.0, 40.0, 24.0, 24.0, 20.0, 9.0, 11.0, 3.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39453125, -0.38311004638671875, -0.3716888427734375, -0.36026763916015625, -0.348846435546875, -0.33742523193359375, -0.3260040283203125, -0.31458282470703125, -0.30316162109375, -0.29174041748046875, -0.2803192138671875, -0.26889801025390625, -0.257476806640625, -0.24605560302734375, -0.2346343994140625, -0.22321319580078125, -0.2117919921875, -0.20037078857421875, -0.1889495849609375, -0.17752838134765625, -0.166107177734375, -0.15468597412109375, -0.1432647705078125, -0.13184356689453125, -0.12042236328125, -0.10900115966796875, -0.0975799560546875, -0.08615875244140625, -0.074737548828125, -0.06331634521484375, -0.0518951416015625, -0.04047393798828125, -0.029052734375, -0.01763153076171875, -0.0062103271484375, 0.00521087646484375, 0.016632080078125, 0.02805328369140625, 0.0394744873046875, 0.05089569091796875, 0.06231689453125, 0.07373809814453125, 0.0851593017578125, 0.09658050537109375, 0.108001708984375, 0.11942291259765625, 0.1308441162109375, 0.14226531982421875, 0.1536865234375, 0.16510772705078125, 0.1765289306640625, 0.18795013427734375, 0.199371337890625, 0.21079254150390625, 0.2222137451171875, 0.23363494873046875, 0.24505615234375, 0.25647735595703125, 0.2678985595703125, 0.27931976318359375, 0.290740966796875, 0.30216217041015625, 0.3135833740234375, 0.32500457763671875, 0.33642578125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 8.0, 19.0, 44.0, 51.0, 68.0, 124.0, 150.0, 155.0, 121.0, 95.0, 65.0, 50.0, 24.0, 11.0, 4.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049530029296875, -0.048384666442871094, -0.04723930358886719, -0.04609394073486328, -0.044948577880859375, -0.04380321502685547, -0.04265785217285156, -0.041512489318847656, -0.04036712646484375, -0.039221763610839844, -0.03807640075683594, -0.03693103790283203, -0.035785675048828125, -0.03464031219482422, -0.03349494934082031, -0.032349586486816406, -0.0312042236328125, -0.030058860778808594, -0.028913497924804688, -0.02776813507080078, -0.026622772216796875, -0.02547740936279297, -0.024332046508789062, -0.023186683654785156, -0.02204132080078125, -0.020895957946777344, -0.019750595092773438, -0.01860523223876953, -0.017459869384765625, -0.01631450653076172, -0.015169143676757812, -0.014023780822753906, -0.01287841796875, -0.011733055114746094, -0.010587692260742188, -0.009442329406738281, -0.008296966552734375, -0.007151603698730469, -0.0060062408447265625, -0.004860877990722656, -0.00371551513671875, -0.0025701522827148438, -0.0014247894287109375, -0.00027942657470703125, 0.000865936279296875, 0.0020112991333007812, 0.0031566619873046875, 0.004302024841308594, 0.0054473876953125, 0.006592750549316406, 0.0077381134033203125, 0.008883476257324219, 0.010028839111328125, 0.011174201965332031, 0.012319564819335938, 0.013464927673339844, 0.01461029052734375, 0.015755653381347656, 0.016901016235351562, 0.01804637908935547, 0.019191741943359375, 0.02033710479736328, 0.021482467651367188, 0.022627830505371094, 0.023773193359375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 1.0, 10.0, 3.0, 8.0, 10.0, 20.0, 16.0, 29.0, 51.0, 73.0, 112.0, 200.0, 379.0, 657.0, 1253.0, 3343.0, 11778.0, 67022.0, 408718.0, 455586.0, 79230.0, 13348.0, 3638.0, 1402.0, 688.0, 389.0, 228.0, 132.0, 75.0, 48.0, 29.0, 22.0, 18.0, 13.0, 10.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.136474609375, -0.1320781707763672, -0.12768173217773438, -0.12328529357910156, -0.11888885498046875, -0.11449241638183594, -0.11009597778320312, -0.10569953918457031, -0.1013031005859375, -0.09690666198730469, -0.09251022338867188, -0.08811378479003906, -0.08371734619140625, -0.07932090759277344, -0.07492446899414062, -0.07052803039550781, -0.066131591796875, -0.06173515319824219, -0.057338714599609375, -0.05294227600097656, -0.04854583740234375, -0.04414939880371094, -0.039752960205078125, -0.03535652160644531, -0.0309600830078125, -0.026563644409179688, -0.022167205810546875, -0.017770767211914062, -0.01337432861328125, -0.008977890014648438, -0.004581451416015625, -0.0001850128173828125, 0.00421142578125, 0.008607864379882812, 0.013004302978515625, 0.017400741577148438, 0.02179718017578125, 0.026193618774414062, 0.030590057373046875, 0.03498649597167969, 0.0393829345703125, 0.04377937316894531, 0.048175811767578125, 0.05257225036621094, 0.05696868896484375, 0.06136512756347656, 0.06576156616210938, 0.07015800476074219, 0.074554443359375, 0.07895088195800781, 0.08334732055664062, 0.08774375915527344, 0.09214019775390625, 0.09653663635253906, 0.10093307495117188, 0.10532951354980469, 0.1097259521484375, 0.11412239074707031, 0.11851882934570312, 0.12291526794433594, 0.12731170654296875, 0.13170814514160156, 0.13610458374023438, 0.1405010223388672, 0.1448974609375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 11.0, 17.0, 11.0, 15.0, 27.0, 24.0, 36.0, 32.0, 44.0, 42.0, 32.0, 49.0, 41.0, 39.0, 50.0, 46.0, 47.0, 39.0, 42.0, 43.0, 37.0, 43.0, 35.0, 33.0, 26.0, 21.0, 17.0, 13.0, 10.0, 13.0, 11.0, 7.0, 3.0, 4.0, 0.0, 6.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06493663787841797, -0.06267356872558594, -0.060410499572753906, -0.058147430419921875, -0.055884361267089844, -0.05362129211425781, -0.05135822296142578, -0.04909515380859375, -0.04683208465576172, -0.04456901550292969, -0.042305946350097656, -0.040042877197265625, -0.037779808044433594, -0.03551673889160156, -0.03325366973876953, -0.0309906005859375, -0.02872753143310547, -0.026464462280273438, -0.024201393127441406, -0.021938323974609375, -0.019675254821777344, -0.017412185668945312, -0.015149116516113281, -0.01288604736328125, -0.010622978210449219, -0.008359909057617188, -0.006096839904785156, -0.003833770751953125, -0.0015707015991210938, 0.0006923675537109375, 0.0029554367065429688, 0.005218505859375, 0.007481575012207031, 0.009744644165039062, 0.012007713317871094, 0.014270782470703125, 0.016533851623535156, 0.018796920776367188, 0.02105998992919922, 0.02332305908203125, 0.02558612823486328, 0.027849197387695312, 0.030112266540527344, 0.032375335693359375, 0.034638404846191406, 0.03690147399902344, 0.03916454315185547, 0.0414276123046875, 0.04369068145751953, 0.04595375061035156, 0.048216819763183594, 0.050479888916015625, 0.052742958068847656, 0.05500602722167969, 0.05726909637451172, 0.05953216552734375, 0.06179523468017578, 0.06405830383300781, 0.06632137298583984, 0.06858444213867188, 0.0708475112915039, 0.07311058044433594, 0.07537364959716797, 0.07763671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 14.0, 15.0, 14.0, 36.0, 63.0, 85.0, 151.0, 251.0, 556.0, 1268.0, 4193.0, 22894.0, 577490.0, 417404.0, 18158.0, 3665.0, 1155.0, 510.0, 216.0, 135.0, 89.0, 45.0, 43.0, 23.0, 20.0, 10.0, 10.0, 6.0, 3.0, 8.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1973876953125, -0.1920452117919922, -0.18670272827148438, -0.18136024475097656, -0.17601776123046875, -0.17067527770996094, -0.16533279418945312, -0.1599903106689453, -0.1546478271484375, -0.1493053436279297, -0.14396286010742188, -0.13862037658691406, -0.13327789306640625, -0.12793540954589844, -0.12259292602539062, -0.11725044250488281, -0.111907958984375, -0.10656547546386719, -0.10122299194335938, -0.09588050842285156, -0.09053802490234375, -0.08519554138183594, -0.07985305786132812, -0.07451057434082031, -0.0691680908203125, -0.06382560729980469, -0.058483123779296875, -0.05314064025878906, -0.04779815673828125, -0.04245567321777344, -0.037113189697265625, -0.03177070617675781, -0.02642822265625, -0.021085739135742188, -0.015743255615234375, -0.010400772094726562, -0.00505828857421875, 0.0002841949462890625, 0.005626678466796875, 0.010969161987304688, 0.0163116455078125, 0.021654129028320312, 0.026996612548828125, 0.03233909606933594, 0.03768157958984375, 0.04302406311035156, 0.048366546630859375, 0.05370903015136719, 0.059051513671875, 0.06439399719238281, 0.06973648071289062, 0.07507896423339844, 0.08042144775390625, 0.08576393127441406, 0.09110641479492188, 0.09644889831542969, 0.1017913818359375, 0.10713386535644531, 0.11247634887695312, 0.11781883239746094, 0.12316131591796875, 0.12850379943847656, 0.13384628295898438, 0.1391887664794922, 0.14453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 13.0, 10.0, 22.0, 24.0, 27.0, 57.0, 65.0, 101.0, 112.0, 83.0, 123.0, 93.0, 68.0, 60.0, 45.0, 25.0, 22.0, 14.0, 10.0, 9.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001442432403564453, -0.00013936683535575867, -0.00013449043035507202, -0.00012961402535438538, -0.00012473762035369873, -0.00011986121535301208, -0.00011498481035232544, -0.0001101084053516388, -0.00010523200035095215, -0.0001003555953502655, -9.547919034957886e-05, -9.060278534889221e-05, -8.572638034820557e-05, -8.084997534751892e-05, -7.597357034683228e-05, -7.109716534614563e-05, -6.622076034545898e-05, -6.134435534477234e-05, -5.646795034408569e-05, -5.159154534339905e-05, -4.67151403427124e-05, -4.183873534202576e-05, -3.696233034133911e-05, -3.2085925340652466e-05, -2.720952033996582e-05, -2.2333115339279175e-05, -1.745671033859253e-05, -1.2580305337905884e-05, -7.703900337219238e-06, -2.8274953365325928e-06, 2.0489096641540527e-06, 6.925314664840698e-06, 1.1801719665527344e-05, 1.667812466621399e-05, 2.1554529666900635e-05, 2.643093466758728e-05, 3.1307339668273926e-05, 3.618374466896057e-05, 4.106014966964722e-05, 4.593655467033386e-05, 5.081295967102051e-05, 5.568936467170715e-05, 6.05657696723938e-05, 6.544217467308044e-05, 7.031857967376709e-05, 7.519498467445374e-05, 8.007138967514038e-05, 8.494779467582703e-05, 8.982419967651367e-05, 9.470060467720032e-05, 9.957700967788696e-05, 0.00010445341467857361, 0.00010932981967926025, 0.0001142062246799469, 0.00011908262968063354, 0.0001239590346813202, 0.00012883543968200684, 0.00013371184468269348, 0.00013858824968338013, 0.00014346465468406677, 0.00014834105968475342, 0.00015321746468544006, 0.0001580938696861267, 0.00016297027468681335, 0.0001678466796875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 10.0, 3.0, 10.0, 6.0, 12.0, 17.0, 29.0, 52.0, 83.0, 121.0, 246.0, 467.0, 1158.0, 3107.0, 12260.0, 116104.0, 811467.0, 87448.0, 10816.0, 3015.0, 1040.0, 486.0, 252.0, 123.0, 78.0, 40.0, 33.0, 25.0, 21.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1767578125, -0.17190933227539062, -0.16706085205078125, -0.16221237182617188, -0.1573638916015625, -0.15251541137695312, -0.14766693115234375, -0.14281845092773438, -0.137969970703125, -0.13312149047851562, -0.12827301025390625, -0.12342453002929688, -0.1185760498046875, -0.11372756958007812, -0.10887908935546875, -0.10403060913085938, -0.09918212890625, -0.09433364868164062, -0.08948516845703125, -0.08463668823242188, -0.0797882080078125, -0.07493972778320312, -0.07009124755859375, -0.06524276733398438, -0.060394287109375, -0.055545806884765625, -0.05069732666015625, -0.045848846435546875, -0.0410003662109375, -0.036151885986328125, -0.03130340576171875, -0.026454925537109375, -0.0216064453125, -0.016757965087890625, -0.01190948486328125, -0.007061004638671875, -0.0022125244140625, 0.002635955810546875, 0.00748443603515625, 0.012332916259765625, 0.017181396484375, 0.022029876708984375, 0.02687835693359375, 0.031726837158203125, 0.0365753173828125, 0.041423797607421875, 0.04627227783203125, 0.051120758056640625, 0.05596923828125, 0.060817718505859375, 0.06566619873046875, 0.07051467895507812, 0.0753631591796875, 0.08021163940429688, 0.08506011962890625, 0.08990859985351562, 0.094757080078125, 0.09960556030273438, 0.10445404052734375, 0.10930252075195312, 0.1141510009765625, 0.11899948120117188, 0.12384796142578125, 0.12869644165039062, 0.133544921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 9.0, 12.0, 16.0, 28.0, 40.0, 53.0, 86.0, 113.0, 107.0, 128.0, 126.0, 90.0, 60.0, 40.0, 30.0, 14.0, 13.0, 4.0, 5.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052093505859375, -0.0496220588684082, -0.047150611877441406, -0.04467916488647461, -0.04220771789550781, -0.039736270904541016, -0.03726482391357422, -0.03479337692260742, -0.032321929931640625, -0.029850482940673828, -0.02737903594970703, -0.024907588958740234, -0.022436141967773438, -0.01996469497680664, -0.017493247985839844, -0.015021800994873047, -0.01255035400390625, -0.010078907012939453, -0.007607460021972656, -0.005136013031005859, -0.0026645660400390625, -0.00019311904907226562, 0.0022783279418945312, 0.004749774932861328, 0.007221221923828125, 0.009692668914794922, 0.012164115905761719, 0.014635562896728516, 0.017107009887695312, 0.01957845687866211, 0.022049903869628906, 0.024521350860595703, 0.0269927978515625, 0.029464244842529297, 0.031935691833496094, 0.03440713882446289, 0.03687858581542969, 0.039350032806396484, 0.04182147979736328, 0.04429292678833008, 0.046764373779296875, 0.04923582077026367, 0.05170726776123047, 0.054178714752197266, 0.05665016174316406, 0.05912160873413086, 0.061593055725097656, 0.06406450271606445, 0.06653594970703125, 0.06900739669799805, 0.07147884368896484, 0.07395029067993164, 0.07642173767089844, 0.07889318466186523, 0.08136463165283203, 0.08383607864379883, 0.08630752563476562, 0.08877897262573242, 0.09125041961669922, 0.09372186660766602, 0.09619331359863281, 0.09866476058959961, 0.1011362075805664, 0.1036076545715332, 0.1060791015625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 33.0, 85.0, 236.0, 329.0, 182.0, 80.0, 28.0, 7.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8287944793701172, -1.783369541168213, -1.737944483757019, -1.6925195455551147, -1.647094488143921, -1.6016695499420166, -1.5562446117401123, -1.510819673538208, -1.4653946161270142, -1.4199696779251099, -1.374544620513916, -1.3291196823120117, -1.2836947441101074, -1.2382696866989136, -1.1928447484970093, -1.1474196910858154, -1.1019947528839111, -1.0565698146820068, -1.011144757270813, -0.9657198190689087, -0.9202948212623596, -0.8748698234558105, -0.8294448852539062, -0.7840198874473572, -0.7385948896408081, -0.693169891834259, -0.64774489402771, -0.6023199558258057, -0.5568949580192566, -0.5114699602127075, -0.46604499220848083, -0.42062002420425415, -0.3751950263977051, -0.329770028591156, -0.2843450605869293, -0.23892007768154144, -0.19349509477615356, -0.14807011187076569, -0.10264512896537781, -0.05722016096115112, -0.01179516315460205, 0.03362981975078583, 0.0790548026561737, 0.12447978556156158, 0.16990476846694946, 0.21532975137233734, 0.2607547342777252, 0.3061797022819519, 0.351604700088501, 0.39702969789505005, 0.44245466589927673, 0.4878796339035034, 0.5333046317100525, 0.5787296295166016, 0.6241545677185059, 0.6695795655250549, 0.715004563331604, 0.7604295611381531, 0.8058545589447021, 0.8512794971466064, 0.8967044949531555, 0.9421294927597046, 0.9875544309616089, 1.0329794883728027, 1.078404426574707]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 8.0, 15.0, 5.0, 10.0, 12.0, 17.0, 21.0, 38.0, 25.0, 36.0, 33.0, 38.0, 50.0, 43.0, 55.0, 62.0, 37.0, 61.0, 52.0, 58.0, 46.0, 43.0, 43.0, 24.0, 36.0, 24.0, 16.0, 11.0, 21.0, 10.0, 15.0, 3.0, 6.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.6281569600105286, -0.611257791519165, -0.5943586230278015, -0.577459454536438, -0.5605602860450745, -0.5436611175537109, -0.5267619490623474, -0.5098627805709839, -0.49296361207962036, -0.47606444358825684, -0.4591652750968933, -0.4422661066055298, -0.42536693811416626, -0.40846776962280273, -0.3915686011314392, -0.3746694326400757, -0.35777026414871216, -0.34087109565734863, -0.3239719271659851, -0.3070727586746216, -0.29017359018325806, -0.27327442169189453, -0.256375253200531, -0.23947608470916748, -0.22257691621780396, -0.20567774772644043, -0.1887785792350769, -0.17187941074371338, -0.15498024225234985, -0.13808107376098633, -0.1211819052696228, -0.10428273677825928, -0.08738356828689575, -0.07048439979553223, -0.0535852313041687, -0.036686062812805176, -0.01978689432144165, -0.002887725830078125, 0.0140114426612854, 0.030910611152648926, 0.04780977964401245, 0.06470894813537598, 0.0816081166267395, 0.09850728511810303, 0.11540645360946655, 0.13230562210083008, 0.1492047905921936, 0.16610395908355713, 0.18300312757492065, 0.19990229606628418, 0.2168014645576477, 0.23370063304901123, 0.25059980154037476, 0.2674989700317383, 0.2843981385231018, 0.30129730701446533, 0.31819647550582886, 0.3350956439971924, 0.3519948124885559, 0.36889398097991943, 0.38579314947128296, 0.4026923179626465, 0.41959148645401, 0.43649065494537354, 0.45338982343673706]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 7.0, 4.0, 3.0, 5.0, 5.0, 9.0, 4.0, 9.0, 4.0, 5.0, 17.0, 16.0, 17.0, 17.0, 27.0, 25.0, 21.0, 29.0, 38.0, 47.0, 44.0, 101.0, 174.0, 299.0, 649.0, 1953.0, 7695.0, 65321.0, 3832716.0, 262361.0, 17879.0, 3294.0, 888.0, 344.0, 140.0, 60.0, 26.0, 17.0, 14.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.521484375, -0.5109939575195312, -0.5005035400390625, -0.49001312255859375, -0.479522705078125, -0.46903228759765625, -0.4585418701171875, -0.44805145263671875, -0.43756103515625, -0.42707061767578125, -0.4165802001953125, -0.40608978271484375, -0.395599365234375, -0.38510894775390625, -0.3746185302734375, -0.36412811279296875, -0.3536376953125, -0.34314727783203125, -0.3326568603515625, -0.32216644287109375, -0.311676025390625, -0.30118560791015625, -0.2906951904296875, -0.28020477294921875, -0.26971435546875, -0.25922393798828125, -0.2487335205078125, -0.23824310302734375, -0.227752685546875, -0.21726226806640625, -0.2067718505859375, -0.19628143310546875, -0.185791015625, -0.17530059814453125, -0.1648101806640625, -0.15431976318359375, -0.143829345703125, -0.13333892822265625, -0.1228485107421875, -0.11235809326171875, -0.10186767578125, -0.09137725830078125, -0.0808868408203125, -0.07039642333984375, -0.059906005859375, -0.04941558837890625, -0.0389251708984375, -0.02843475341796875, -0.0179443359375, -0.00745391845703125, 0.0030364990234375, 0.01352691650390625, 0.024017333984375, 0.03450775146484375, 0.0449981689453125, 0.05548858642578125, 0.06597900390625, 0.07646942138671875, 0.0869598388671875, 0.09745025634765625, 0.107940673828125, 0.11843109130859375, 0.1289215087890625, 0.13941192626953125, 0.14990234375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 13.0, 21.0, 41.0, 50.0, 68.0, 108.0, 135.0, 140.0, 131.0, 82.0, 72.0, 61.0, 36.0, 16.0, 13.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05419921875, -0.05300545692443848, -0.05181169509887695, -0.05061793327331543, -0.049424171447753906, -0.04823040962219238, -0.04703664779663086, -0.045842885971069336, -0.04464912414550781, -0.04345536231994629, -0.042261600494384766, -0.04106783866882324, -0.03987407684326172, -0.038680315017700195, -0.03748655319213867, -0.03629279136657715, -0.035099029541015625, -0.0339052677154541, -0.03271150588989258, -0.031517744064331055, -0.03032398223876953, -0.029130220413208008, -0.027936458587646484, -0.02674269676208496, -0.025548934936523438, -0.024355173110961914, -0.02316141128540039, -0.021967649459838867, -0.020773887634277344, -0.01958012580871582, -0.018386363983154297, -0.017192602157592773, -0.01599884033203125, -0.014805078506469727, -0.013611316680908203, -0.01241755485534668, -0.011223793029785156, -0.010030031204223633, -0.00883626937866211, -0.007642507553100586, -0.0064487457275390625, -0.005254983901977539, -0.004061222076416016, -0.002867460250854492, -0.0016736984252929688, -0.0004799365997314453, 0.0007138252258300781, 0.0019075870513916016, 0.003101348876953125, 0.0042951107025146484, 0.005488872528076172, 0.006682634353637695, 0.007876396179199219, 0.009070158004760742, 0.010263919830322266, 0.011457681655883789, 0.012651443481445312, 0.013845205307006836, 0.01503896713256836, 0.016232728958129883, 0.017426490783691406, 0.01862025260925293, 0.019814014434814453, 0.021007776260375977, 0.0222015380859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 4.0, 9.0, 15.0, 14.0, 40.0, 74.0, 141.0, 213.0, 382.0, 672.0, 1178.0, 3123.0, 55900.0, 4100392.0, 27920.0, 2399.0, 865.0, 413.0, 238.0, 126.0, 68.0, 37.0, 20.0, 13.0, 8.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76416015625, -0.7465591430664062, -0.7289581298828125, -0.7113571166992188, -0.693756103515625, -0.6761550903320312, -0.6585540771484375, -0.6409530639648438, -0.62335205078125, -0.6057510375976562, -0.5881500244140625, -0.5705490112304688, -0.552947998046875, -0.5353469848632812, -0.5177459716796875, -0.5001449584960938, -0.4825439453125, -0.46494293212890625, -0.4473419189453125, -0.42974090576171875, -0.412139892578125, -0.39453887939453125, -0.3769378662109375, -0.35933685302734375, -0.34173583984375, -0.32413482666015625, -0.3065338134765625, -0.28893280029296875, -0.271331787109375, -0.25373077392578125, -0.2361297607421875, -0.21852874755859375, -0.200927734375, -0.18332672119140625, -0.1657257080078125, -0.14812469482421875, -0.130523681640625, -0.11292266845703125, -0.0953216552734375, -0.07772064208984375, -0.06011962890625, -0.04251861572265625, -0.0249176025390625, -0.00731658935546875, 0.010284423828125, 0.02788543701171875, 0.0454864501953125, 0.06308746337890625, 0.0806884765625, 0.09828948974609375, 0.1158905029296875, 0.13349151611328125, 0.151092529296875, 0.16869354248046875, 0.1862945556640625, 0.20389556884765625, 0.22149658203125, 0.23909759521484375, 0.2566986083984375, 0.27429962158203125, 0.291900634765625, 0.30950164794921875, 0.3271026611328125, 0.34470367431640625, 0.3623046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 9.0, 13.0, 11.0, 24.0, 58.0, 130.0, 335.0, 1738.0, 1297.0, 229.0, 108.0, 43.0, 24.0, 10.0, 16.0, 12.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09568119049072266, -0.09340095520019531, -0.09112071990966797, -0.08884048461914062, -0.08656024932861328, -0.08428001403808594, -0.0819997787475586, -0.07971954345703125, -0.0774393081665039, -0.07515907287597656, -0.07287883758544922, -0.07059860229492188, -0.06831836700439453, -0.06603813171386719, -0.06375789642333984, -0.0614776611328125, -0.059197425842285156, -0.05691719055175781, -0.05463695526123047, -0.052356719970703125, -0.05007648468017578, -0.04779624938964844, -0.045516014099121094, -0.04323577880859375, -0.040955543518066406, -0.03867530822753906, -0.03639507293701172, -0.034114837646484375, -0.03183460235595703, -0.029554367065429688, -0.027274131774902344, -0.024993896484375, -0.022713661193847656, -0.020433425903320312, -0.01815319061279297, -0.015872955322265625, -0.013592720031738281, -0.011312484741210938, -0.009032249450683594, -0.00675201416015625, -0.004471778869628906, -0.0021915435791015625, 8.869171142578125e-05, 0.002368927001953125, 0.004649162292480469, 0.0069293975830078125, 0.009209632873535156, 0.0114898681640625, 0.013770103454589844, 0.016050338745117188, 0.01833057403564453, 0.020610809326171875, 0.02289104461669922, 0.025171279907226562, 0.027451515197753906, 0.02973175048828125, 0.032011985778808594, 0.03429222106933594, 0.03657245635986328, 0.038852691650390625, 0.04113292694091797, 0.04341316223144531, 0.045693397521972656, 0.0479736328125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 12.0, 17.0, 33.0, 55.0, 163.0, 282.0, 233.0, 109.0, 43.0, 28.0, 9.0, 2.0, 2.0, 6.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7660737037658691, -0.7482742667198181, -0.7304747700691223, -0.7126753330230713, -0.6948758363723755, -0.6770763993263245, -0.6592769622802734, -0.6414774656295776, -0.6236780285835266, -0.6058785915374756, -0.5880790948867798, -0.5702796578407288, -0.5524802207946777, -0.5346807241439819, -0.5168812870979309, -0.4990818202495575, -0.4812823534011841, -0.46348288655281067, -0.44568341970443726, -0.42788398265838623, -0.4100845158100128, -0.3922850489616394, -0.3744856119155884, -0.35668614506721497, -0.33888667821884155, -0.32108721137046814, -0.3032877445220947, -0.2854883074760437, -0.2676888406276703, -0.24988937377929688, -0.23208992183208466, -0.21429046988487244, -0.19649100303649902, -0.1786915361881256, -0.1608920842409134, -0.14309263229370117, -0.12529316544532776, -0.10749370604753494, -0.08969424664974213, -0.07189478725194931, -0.054095327854156494, -0.03629586845636368, -0.018496409058570862, -0.0006969496607780457, 0.01710250973701477, 0.03490196913480759, 0.0527014285326004, 0.07050088793039322, 0.08830034732818604, 0.10609980672597885, 0.12389926612377167, 0.1416987180709839, 0.1594981849193573, 0.1772976517677307, 0.19509710371494293, 0.21289655566215515, 0.23069602251052856, 0.24849548935890198, 0.2662949562072754, 0.2840943932533264, 0.30189386010169983, 0.31969332695007324, 0.33749276399612427, 0.3552922308444977, 0.3730916976928711]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 11.0, 12.0, 20.0, 37.0, 44.0, 64.0, 95.0, 111.0, 103.0, 103.0, 97.0, 94.0, 76.0, 58.0, 24.0, 26.0, 10.0, 13.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5520994067192078, -0.5359964966773987, -0.5198935866355896, -0.5037906765937805, -0.48768776655197144, -0.47158485651016235, -0.4554819166660309, -0.4393790066242218, -0.4232760965824127, -0.40717318654060364, -0.39107027649879456, -0.3749673664569855, -0.358864426612854, -0.3427615165710449, -0.32665860652923584, -0.31055569648742676, -0.2944527864456177, -0.2783498764038086, -0.2622469663619995, -0.24614404141902924, -0.23004113137722015, -0.21393822133541107, -0.1978352963924408, -0.1817323863506317, -0.16562947630882263, -0.14952656626701355, -0.13342365622520447, -0.11732073128223419, -0.10121782124042511, -0.08511491119861603, -0.06901199370622635, -0.05290907621383667, -0.03680616617202759, -0.020703252404928207, -0.004600338637828827, 0.011502575129270554, 0.027605488896369934, 0.043708398938179016, 0.059811316430568695, 0.07591423392295837, 0.09201714396476746, 0.10812005400657654, 0.12422297149896622, 0.1403258889913559, 0.15642879903316498, 0.17253170907497406, 0.18863463401794434, 0.20473754405975342, 0.2208404541015625, 0.23694336414337158, 0.25304627418518066, 0.26914918422698975, 0.28525209426879883, 0.3013550043106079, 0.3174579441547394, 0.33356085419654846, 0.34966376423835754, 0.3657666742801666, 0.3818695843219757, 0.3979724943637848, 0.41407543420791626, 0.43017834424972534, 0.4462812542915344, 0.4623841643333435, 0.4784870743751526]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 2.0, 10.0, 12.0, 8.0, 22.0, 24.0, 38.0, 39.0, 51.0, 81.0, 121.0, 183.0, 329.0, 712.0, 1849.0, 6541.0, 37308.0, 360901.0, 560977.0, 65004.0, 9841.0, 2511.0, 926.0, 385.0, 213.0, 144.0, 85.0, 61.0, 42.0, 38.0, 23.0, 22.0, 10.0, 9.0, 7.0, 6.0, 6.0, 2.0, 3.0, 7.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.184814453125, -0.17774200439453125, -0.1706695556640625, -0.16359710693359375, -0.156524658203125, -0.14945220947265625, -0.1423797607421875, -0.13530731201171875, -0.12823486328125, -0.12116241455078125, -0.1140899658203125, -0.10701751708984375, -0.099945068359375, -0.09287261962890625, -0.0858001708984375, -0.07872772216796875, -0.0716552734375, -0.06458282470703125, -0.0575103759765625, -0.05043792724609375, -0.043365478515625, -0.03629302978515625, -0.0292205810546875, -0.02214813232421875, -0.01507568359375, -0.00800323486328125, -0.0009307861328125, 0.00614166259765625, 0.013214111328125, 0.02028656005859375, 0.0273590087890625, 0.03443145751953125, 0.04150390625, 0.04857635498046875, 0.0556488037109375, 0.06272125244140625, 0.069793701171875, 0.07686614990234375, 0.0839385986328125, 0.09101104736328125, 0.09808349609375, 0.10515594482421875, 0.1122283935546875, 0.11930084228515625, 0.126373291015625, 0.13344573974609375, 0.1405181884765625, 0.14759063720703125, 0.1546630859375, 0.16173553466796875, 0.1688079833984375, 0.17588043212890625, 0.182952880859375, 0.19002532958984375, 0.1970977783203125, 0.20417022705078125, 0.21124267578125, 0.21831512451171875, 0.2253875732421875, 0.23246002197265625, 0.239532470703125, 0.24660491943359375, 0.2536773681640625, 0.26074981689453125, 0.267822265625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 17.0, 25.0, 32.0, 64.0, 75.0, 99.0, 103.0, 116.0, 114.0, 109.0, 64.0, 54.0, 44.0, 27.0, 18.0, 8.0, 12.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04736328125, -0.04613614082336426, -0.044909000396728516, -0.04368185997009277, -0.04245471954345703, -0.04122757911682129, -0.04000043869018555, -0.038773298263549805, -0.03754615783691406, -0.03631901741027832, -0.03509187698364258, -0.033864736557006836, -0.032637596130371094, -0.03141045570373535, -0.03018331527709961, -0.028956174850463867, -0.027729034423828125, -0.026501893997192383, -0.02527475357055664, -0.0240476131439209, -0.022820472717285156, -0.021593332290649414, -0.020366191864013672, -0.01913905143737793, -0.017911911010742188, -0.016684770584106445, -0.015457630157470703, -0.014230489730834961, -0.013003349304199219, -0.011776208877563477, -0.010549068450927734, -0.009321928024291992, -0.00809478759765625, -0.006867647171020508, -0.005640506744384766, -0.0044133663177490234, -0.0031862258911132812, -0.001959085464477539, -0.0007319450378417969, 0.0004951953887939453, 0.0017223358154296875, 0.0029494762420654297, 0.004176616668701172, 0.005403757095336914, 0.006630897521972656, 0.007858037948608398, 0.00908517837524414, 0.010312318801879883, 0.011539459228515625, 0.012766599655151367, 0.01399374008178711, 0.015220880508422852, 0.016448020935058594, 0.017675161361694336, 0.018902301788330078, 0.02012944221496582, 0.021356582641601562, 0.022583723068237305, 0.023810863494873047, 0.02503800392150879, 0.02626514434814453, 0.027492284774780273, 0.028719425201416016, 0.029946565628051758, 0.0311737060546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 4.0, 18.0, 14.0, 22.0, 27.0, 34.0, 63.0, 89.0, 113.0, 187.0, 284.0, 500.0, 947.0, 1813.0, 3993.0, 10893.0, 37914.0, 162878.0, 475125.0, 264601.0, 61944.0, 16250.0, 5624.0, 2346.0, 1176.0, 671.0, 348.0, 220.0, 144.0, 101.0, 61.0, 38.0, 29.0, 15.0, 17.0, 9.0, 7.0, 9.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.09967041015625, -0.09619426727294922, -0.09271812438964844, -0.08924198150634766, -0.08576583862304688, -0.0822896957397461, -0.07881355285644531, -0.07533740997314453, -0.07186126708984375, -0.06838512420654297, -0.06490898132324219, -0.061432838439941406, -0.057956695556640625, -0.054480552673339844, -0.05100440979003906, -0.04752826690673828, -0.0440521240234375, -0.04057598114013672, -0.03709983825683594, -0.033623695373535156, -0.030147552490234375, -0.026671409606933594, -0.023195266723632812, -0.01971912384033203, -0.01624298095703125, -0.012766838073730469, -0.009290695190429688, -0.005814552307128906, -0.002338409423828125, 0.0011377334594726562, 0.0046138763427734375, 0.008090019226074219, 0.011566162109375, 0.015042304992675781, 0.018518447875976562, 0.021994590759277344, 0.025470733642578125, 0.028946876525878906, 0.03242301940917969, 0.03589916229248047, 0.03937530517578125, 0.04285144805908203, 0.04632759094238281, 0.049803733825683594, 0.053279876708984375, 0.056756019592285156, 0.06023216247558594, 0.06370830535888672, 0.0671844482421875, 0.07066059112548828, 0.07413673400878906, 0.07761287689208984, 0.08108901977539062, 0.0845651626586914, 0.08804130554199219, 0.09151744842529297, 0.09499359130859375, 0.09846973419189453, 0.10194587707519531, 0.1054220199584961, 0.10889816284179688, 0.11237430572509766, 0.11585044860839844, 0.11932659149169922, 0.122802734375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 9.0, 7.0, 10.0, 12.0, 23.0, 19.0, 30.0, 24.0, 34.0, 32.0, 28.0, 35.0, 38.0, 44.0, 33.0, 46.0, 45.0, 41.0, 44.0, 44.0, 43.0, 38.0, 36.0, 40.0, 36.0, 30.0, 30.0, 20.0, 22.0, 20.0, 14.0, 7.0, 13.0, 14.0, 3.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0736083984375, -0.07106494903564453, -0.06852149963378906, -0.0659780502319336, -0.06343460083007812, -0.060891151428222656, -0.05834770202636719, -0.05580425262451172, -0.05326080322265625, -0.05071735382080078, -0.04817390441894531, -0.045630455017089844, -0.043087005615234375, -0.040543556213378906, -0.03800010681152344, -0.03545665740966797, -0.0329132080078125, -0.03036975860595703, -0.027826309204101562, -0.025282859802246094, -0.022739410400390625, -0.020195960998535156, -0.017652511596679688, -0.015109062194824219, -0.01256561279296875, -0.010022163391113281, -0.0074787139892578125, -0.004935264587402344, -0.002391815185546875, 0.00015163421630859375, 0.0026950836181640625, 0.005238533020019531, 0.007781982421875, 0.010325431823730469, 0.012868881225585938, 0.015412330627441406, 0.017955780029296875, 0.020499229431152344, 0.023042678833007812, 0.02558612823486328, 0.02812957763671875, 0.03067302703857422, 0.03321647644042969, 0.035759925842285156, 0.038303375244140625, 0.040846824645996094, 0.04339027404785156, 0.04593372344970703, 0.0484771728515625, 0.05102062225341797, 0.05356407165527344, 0.056107521057128906, 0.058650970458984375, 0.061194419860839844, 0.06373786926269531, 0.06628131866455078, 0.06882476806640625, 0.07136821746826172, 0.07391166687011719, 0.07645511627197266, 0.07899856567382812, 0.0815420150756836, 0.08408546447753906, 0.08662891387939453, 0.08917236328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 9.0, 12.0, 17.0, 33.0, 36.0, 54.0, 70.0, 127.0, 221.0, 414.0, 931.0, 2162.0, 6325.0, 23778.0, 195879.0, 706152.0, 89592.0, 14956.0, 4563.0, 1649.0, 692.0, 360.0, 195.0, 108.0, 51.0, 44.0, 31.0, 18.0, 11.0, 13.0, 8.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08856201171875, -0.08582401275634766, -0.08308601379394531, -0.08034801483154297, -0.07761001586914062, -0.07487201690673828, -0.07213401794433594, -0.0693960189819336, -0.06665802001953125, -0.0639200210571289, -0.06118202209472656, -0.05844402313232422, -0.055706024169921875, -0.05296802520751953, -0.05023002624511719, -0.047492027282714844, -0.0447540283203125, -0.042016029357910156, -0.03927803039550781, -0.03654003143310547, -0.033802032470703125, -0.03106403350830078, -0.028326034545898438, -0.025588035583496094, -0.02285003662109375, -0.020112037658691406, -0.017374038696289062, -0.014636039733886719, -0.011898040771484375, -0.009160041809082031, -0.0064220428466796875, -0.0036840438842773438, -0.000946044921875, 0.0017919540405273438, 0.0045299530029296875, 0.007267951965332031, 0.010005950927734375, 0.012743949890136719, 0.015481948852539062, 0.018219947814941406, 0.02095794677734375, 0.023695945739746094, 0.026433944702148438, 0.02917194366455078, 0.031909942626953125, 0.03464794158935547, 0.03738594055175781, 0.040123939514160156, 0.0428619384765625, 0.045599937438964844, 0.04833793640136719, 0.05107593536376953, 0.053813934326171875, 0.05655193328857422, 0.05928993225097656, 0.062027931213378906, 0.06476593017578125, 0.0675039291381836, 0.07024192810058594, 0.07297992706298828, 0.07571792602539062, 0.07845592498779297, 0.08119392395019531, 0.08393192291259766, 0.086669921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 10.0, 10.0, 10.0, 23.0, 17.0, 20.0, 38.0, 33.0, 65.0, 66.0, 71.0, 78.0, 75.0, 89.0, 77.0, 62.0, 55.0, 39.0, 35.0, 36.0, 21.0, 25.0, 6.0, 8.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00013899803161621094, -0.00013528671115636826, -0.00013157539069652557, -0.0001278640702366829, -0.0001241527497768402, -0.00012044142931699753, -0.00011673010885715485, -0.00011301878839731216, -0.00010930746793746948, -0.0001055961474776268, -0.00010188482701778412, -9.817350655794144e-05, -9.446218609809875e-05, -9.075086563825607e-05, -8.703954517841339e-05, -8.332822471857071e-05, -7.961690425872803e-05, -7.590558379888535e-05, -7.219426333904266e-05, -6.848294287919998e-05, -6.47716224193573e-05, -6.106030195951462e-05, -5.7348981499671936e-05, -5.3637661039829254e-05, -4.992634057998657e-05, -4.621502012014389e-05, -4.250369966030121e-05, -3.8792379200458527e-05, -3.5081058740615845e-05, -3.136973828077316e-05, -2.765841782093048e-05, -2.39470973610878e-05, -2.0235776901245117e-05, -1.6524456441402435e-05, -1.2813135981559753e-05, -9.101815521717072e-06, -5.39049506187439e-06, -1.6791746020317078e-06, 2.032145857810974e-06, 5.743466317653656e-06, 9.454786777496338e-06, 1.316610723733902e-05, 1.68774276971817e-05, 2.0588748157024384e-05, 2.4300068616867065e-05, 2.8011389076709747e-05, 3.172270953655243e-05, 3.543402999639511e-05, 3.914535045623779e-05, 4.2856670916080475e-05, 4.656799137592316e-05, 5.027931183576584e-05, 5.399063229560852e-05, 5.77019527554512e-05, 6.141327321529388e-05, 6.512459367513657e-05, 6.883591413497925e-05, 7.254723459482193e-05, 7.625855505466461e-05, 7.99698755145073e-05, 8.368119597434998e-05, 8.739251643419266e-05, 9.110383689403534e-05, 9.481515735387802e-05, 9.85264778137207e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 5.0, 7.0, 8.0, 18.0, 12.0, 25.0, 27.0, 36.0, 53.0, 100.0, 128.0, 234.0, 400.0, 716.0, 1407.0, 2982.0, 7408.0, 23393.0, 125415.0, 636288.0, 201395.0, 31893.0, 9365.0, 3613.0, 1639.0, 829.0, 448.0, 246.0, 147.0, 100.0, 66.0, 40.0, 32.0, 17.0, 23.0, 14.0, 7.0, 5.0, 7.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.0838623046875, -0.08157157897949219, -0.07928085327148438, -0.07699012756347656, -0.07469940185546875, -0.07240867614746094, -0.07011795043945312, -0.06782722473144531, -0.0655364990234375, -0.06324577331542969, -0.060955047607421875, -0.05866432189941406, -0.05637359619140625, -0.05408287048339844, -0.051792144775390625, -0.04950141906738281, -0.047210693359375, -0.04491996765136719, -0.042629241943359375, -0.04033851623535156, -0.03804779052734375, -0.03575706481933594, -0.033466339111328125, -0.031175613403320312, -0.0288848876953125, -0.026594161987304688, -0.024303436279296875, -0.022012710571289062, -0.01972198486328125, -0.017431259155273438, -0.015140533447265625, -0.012849807739257812, -0.01055908203125, -0.008268356323242188, -0.005977630615234375, -0.0036869049072265625, -0.00139617919921875, 0.0008945465087890625, 0.003185272216796875, 0.0054759979248046875, 0.0077667236328125, 0.010057449340820312, 0.012348175048828125, 0.014638900756835938, 0.01692962646484375, 0.019220352172851562, 0.021511077880859375, 0.023801803588867188, 0.026092529296875, 0.028383255004882812, 0.030673980712890625, 0.03296470642089844, 0.03525543212890625, 0.03754615783691406, 0.039836883544921875, 0.04212760925292969, 0.0444183349609375, 0.04670906066894531, 0.048999786376953125, 0.05129051208496094, 0.05358123779296875, 0.05587196350097656, 0.058162689208984375, 0.06045341491699219, 0.062744140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 12.0, 7.0, 17.0, 20.0, 18.0, 36.0, 54.0, 63.0, 109.0, 117.0, 118.0, 121.0, 93.0, 54.0, 48.0, 27.0, 22.0, 13.0, 13.0, 9.0, 8.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0562744140625, -0.05447673797607422, -0.05267906188964844, -0.050881385803222656, -0.049083709716796875, -0.047286033630371094, -0.04548835754394531, -0.04369068145751953, -0.04189300537109375, -0.04009532928466797, -0.03829765319824219, -0.036499977111816406, -0.034702301025390625, -0.032904624938964844, -0.031106948852539062, -0.02930927276611328, -0.0275115966796875, -0.02571392059326172, -0.023916244506835938, -0.022118568420410156, -0.020320892333984375, -0.018523216247558594, -0.016725540161132812, -0.014927864074707031, -0.01313018798828125, -0.011332511901855469, -0.009534835815429688, -0.007737159729003906, -0.005939483642578125, -0.004141807556152344, -0.0023441314697265625, -0.0005464553833007812, 0.001251220703125, 0.0030488967895507812, 0.0048465728759765625, 0.006644248962402344, 0.008441925048828125, 0.010239601135253906, 0.012037277221679688, 0.013834953308105469, 0.01563262939453125, 0.01743030548095703, 0.019227981567382812, 0.021025657653808594, 0.022823333740234375, 0.024621009826660156, 0.026418685913085938, 0.02821636199951172, 0.0300140380859375, 0.03181171417236328, 0.03360939025878906, 0.035407066345214844, 0.037204742431640625, 0.039002418518066406, 0.04080009460449219, 0.04259777069091797, 0.04439544677734375, 0.04619312286376953, 0.04799079895019531, 0.049788475036621094, 0.051586151123046875, 0.053383827209472656, 0.05518150329589844, 0.05697917938232422, 0.05877685546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 16.0, 39.0, 76.0, 159.0, 216.0, 228.0, 134.0, 57.0, 29.0, 19.0, 8.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.5560122728347778, -1.5227512121200562, -1.4894901514053345, -1.4562289714813232, -1.4229679107666016, -1.3897068500518799, -1.3564457893371582, -1.3231847286224365, -1.2899236679077148, -1.2566626071929932, -1.2234015464782715, -1.1901403665542603, -1.1568793058395386, -1.123618245124817, -1.0903571844100952, -1.0570961236953735, -1.0238349437713623, -0.9905738830566406, -0.9573127627372742, -0.9240517020225525, -0.890790581703186, -0.8575295209884644, -0.8242684602737427, -0.791007399559021, -0.7577462792396545, -0.7244852185249329, -0.6912240982055664, -0.6579630374908447, -0.624701976776123, -0.5914408564567566, -0.5581797957420349, -0.5249186754226685, -0.4916574954986572, -0.45839640498161316, -0.4251353144645691, -0.3918742537498474, -0.35861316323280334, -0.3253520727157593, -0.2920910120010376, -0.25882992148399353, -0.22556883096694946, -0.1923077404499054, -0.15904666483402252, -0.12578558921813965, -0.09252449870109558, -0.059263408184051514, -0.02600233256816864, 0.007258743047714233, 0.0405198335647583, 0.07378091663122177, 0.10704199969768524, 0.14030307531356812, 0.17356416583061218, 0.20682525634765625, 0.24008633196353912, 0.273347407579422, 0.30660849809646606, 0.33986958861351013, 0.3731306791305542, 0.4063917398452759, 0.43965283036231995, 0.472913920879364, 0.5061749815940857, 0.5394361019134521, 0.5726971626281738]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 9.0, 19.0, 18.0, 29.0, 31.0, 47.0, 52.0, 56.0, 63.0, 79.0, 81.0, 68.0, 77.0, 69.0, 50.0, 53.0, 30.0, 33.0, 32.0, 18.0, 23.0, 10.0, 14.0, 12.0, 2.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5380100607872009, -0.5138401985168457, -0.4896702766418457, -0.4655003845691681, -0.4413304924964905, -0.41716060042381287, -0.39299070835113525, -0.36882081627845764, -0.34465092420578003, -0.3204810321331024, -0.2963111400604248, -0.2721412479877472, -0.24797135591506958, -0.22380146384239197, -0.19963157176971436, -0.17546167969703674, -0.15129178762435913, -0.12712189555168152, -0.1029520034790039, -0.0787821114063263, -0.05461221933364868, -0.03044232726097107, -0.006272435188293457, 0.017897456884384155, 0.04206734895706177, 0.06623724102973938, 0.09040713310241699, 0.1145770251750946, 0.13874691724777222, 0.16291680932044983, 0.18708670139312744, 0.21125659346580505, 0.2354264259338379, 0.2595963180065155, 0.2837662100791931, 0.3079361021518707, 0.33210599422454834, 0.35627588629722595, 0.38044577836990356, 0.4046156704425812, 0.4287855625152588, 0.4529554545879364, 0.477125346660614, 0.5012952089309692, 0.5254651308059692, 0.5496350526809692, 0.5738049149513245, 0.5979747772216797, 0.6221446990966797, 0.6463146209716797, 0.6704844832420349, 0.6946543455123901, 0.7188242673873901, 0.7429941892623901, 0.7671640515327454, 0.7913339138031006, 0.8155038356781006, 0.8396737575531006, 0.8638436198234558, 0.888013482093811, 0.912183403968811, 0.936353325843811, 0.9605231881141663, 0.9846930503845215, 1.0088629722595215]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 4.0, 8.0, 5.0, 2.0, 16.0, 12.0, 24.0, 34.0, 23.0, 60.0, 71.0, 107.0, 186.0, 381.0, 690.0, 2094.0, 9330.0, 104176.0, 3989858.0, 75492.0, 8429.0, 2034.0, 621.0, 275.0, 139.0, 71.0, 46.0, 22.0, 17.0, 18.0, 7.0, 4.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.394775390625, -0.3847675323486328, -0.3747596740722656, -0.36475181579589844, -0.35474395751953125, -0.34473609924316406, -0.3347282409667969, -0.3247203826904297, -0.3147125244140625, -0.3047046661376953, -0.2946968078613281, -0.28468894958496094, -0.27468109130859375, -0.26467323303222656, -0.2546653747558594, -0.2446575164794922, -0.234649658203125, -0.2246417999267578, -0.21463394165039062, -0.20462608337402344, -0.19461822509765625, -0.18461036682128906, -0.17460250854492188, -0.1645946502685547, -0.1545867919921875, -0.1445789337158203, -0.13457107543945312, -0.12456321716308594, -0.11455535888671875, -0.10454750061035156, -0.09453964233398438, -0.08453178405761719, -0.07452392578125, -0.06451606750488281, -0.054508209228515625, -0.04450035095214844, -0.03449249267578125, -0.024484634399414062, -0.014476776123046875, -0.0044689178466796875, 0.0055389404296875, 0.015546798706054688, 0.025554656982421875, 0.03556251525878906, 0.04557037353515625, 0.05557823181152344, 0.06558609008789062, 0.07559394836425781, 0.085601806640625, 0.09560966491699219, 0.10561752319335938, 0.11562538146972656, 0.12563323974609375, 0.13564109802246094, 0.14564895629882812, 0.1556568145751953, 0.1656646728515625, 0.1756725311279297, 0.18568038940429688, 0.19568824768066406, 0.20569610595703125, 0.21570396423339844, 0.22571182250976562, 0.2357196807861328, 0.2457275390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 9.0, 30.0, 48.0, 55.0, 89.0, 115.0, 131.0, 103.0, 106.0, 87.0, 76.0, 49.0, 35.0, 21.0, 12.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04705810546875, -0.045641422271728516, -0.04422473907470703, -0.04280805587768555, -0.04139137268066406, -0.03997468948364258, -0.038558006286621094, -0.03714132308959961, -0.035724639892578125, -0.03430795669555664, -0.032891273498535156, -0.03147459030151367, -0.030057907104492188, -0.028641223907470703, -0.02722454071044922, -0.025807857513427734, -0.02439117431640625, -0.022974491119384766, -0.02155780792236328, -0.020141124725341797, -0.018724441528320312, -0.017307758331298828, -0.015891075134277344, -0.01447439193725586, -0.013057708740234375, -0.01164102554321289, -0.010224342346191406, -0.008807659149169922, -0.0073909759521484375, -0.005974292755126953, -0.004557609558105469, -0.0031409263610839844, -0.0017242431640625, -0.0003075599670410156, 0.0011091232299804688, 0.002525806427001953, 0.0039424896240234375, 0.005359172821044922, 0.006775856018066406, 0.00819253921508789, 0.009609222412109375, 0.01102590560913086, 0.012442588806152344, 0.013859272003173828, 0.015275955200195312, 0.016692638397216797, 0.01810932159423828, 0.019526004791259766, 0.02094268798828125, 0.022359371185302734, 0.02377605438232422, 0.025192737579345703, 0.026609420776367188, 0.028026103973388672, 0.029442787170410156, 0.03085947036743164, 0.032276153564453125, 0.03369283676147461, 0.035109519958496094, 0.03652620315551758, 0.03794288635253906, 0.03935956954956055, 0.04077625274658203, 0.042192935943603516, 0.043609619140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 3.0, 1.0, 3.0, 5.0, 12.0, 5.0, 14.0, 17.0, 29.0, 25.0, 50.0, 63.0, 103.0, 174.0, 270.0, 585.0, 1433.0, 6557.0, 93925.0, 4018439.0, 64385.0, 5647.0, 1403.0, 514.0, 224.0, 149.0, 75.0, 55.0, 40.0, 28.0, 13.0, 14.0, 6.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.396728515625, -0.3869209289550781, -0.37711334228515625, -0.3673057556152344, -0.3574981689453125, -0.3476905822753906, -0.33788299560546875, -0.3280754089355469, -0.318267822265625, -0.3084602355957031, -0.29865264892578125, -0.2888450622558594, -0.2790374755859375, -0.2692298889160156, -0.25942230224609375, -0.24961471557617188, -0.23980712890625, -0.22999954223632812, -0.22019195556640625, -0.21038436889648438, -0.2005767822265625, -0.19076919555664062, -0.18096160888671875, -0.17115402221679688, -0.161346435546875, -0.15153884887695312, -0.14173126220703125, -0.13192367553710938, -0.1221160888671875, -0.11230850219726562, -0.10250091552734375, -0.09269332885742188, -0.0828857421875, -0.07307815551757812, -0.06327056884765625, -0.053462982177734375, -0.0436553955078125, -0.033847808837890625, -0.02404022216796875, -0.014232635498046875, -0.004425048828125, 0.005382537841796875, 0.01519012451171875, 0.024997711181640625, 0.0348052978515625, 0.044612884521484375, 0.05442047119140625, 0.06422805786132812, 0.07403564453125, 0.08384323120117188, 0.09365081787109375, 0.10345840454101562, 0.1132659912109375, 0.12307357788085938, 0.13288116455078125, 0.14268875122070312, 0.152496337890625, 0.16230392456054688, 0.17211151123046875, 0.18191909790039062, 0.1917266845703125, 0.20153427124023438, 0.21134185791015625, 0.22114944458007812, 0.23095703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 10.0, 20.0, 27.0, 66.0, 156.0, 652.0, 2470.0, 454.0, 115.0, 55.0, 23.0, 6.0, 7.0, 7.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0963134765625, -0.09373855590820312, -0.09116363525390625, -0.08858871459960938, -0.0860137939453125, -0.08343887329101562, -0.08086395263671875, -0.07828903198242188, -0.075714111328125, -0.07313919067382812, -0.07056427001953125, -0.06798934936523438, -0.0654144287109375, -0.06283950805664062, -0.06026458740234375, -0.057689666748046875, -0.05511474609375, -0.052539825439453125, -0.04996490478515625, -0.047389984130859375, -0.0448150634765625, -0.042240142822265625, -0.03966522216796875, -0.037090301513671875, -0.034515380859375, -0.031940460205078125, -0.02936553955078125, -0.026790618896484375, -0.0242156982421875, -0.021640777587890625, -0.01906585693359375, -0.016490936279296875, -0.013916015625, -0.011341094970703125, -0.00876617431640625, -0.006191253662109375, -0.0036163330078125, -0.001041412353515625, 0.00153350830078125, 0.004108428955078125, 0.006683349609375, 0.009258270263671875, 0.01183319091796875, 0.014408111572265625, 0.0169830322265625, 0.019557952880859375, 0.02213287353515625, 0.024707794189453125, 0.02728271484375, 0.029857635498046875, 0.03243255615234375, 0.035007476806640625, 0.0375823974609375, 0.040157318115234375, 0.04273223876953125, 0.045307159423828125, 0.047882080078125, 0.050457000732421875, 0.05303192138671875, 0.055606842041015625, 0.0581817626953125, 0.060756683349609375, 0.06333160400390625, 0.06590652465820312, 0.0684814453125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 16.0, 13.0, 24.0, 90.0, 153.0, 249.0, 211.0, 148.0, 48.0, 23.0, 6.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4391190707683563, -0.42579716444015503, -0.41247525811195374, -0.39915335178375244, -0.38583147525787354, -0.37250956892967224, -0.35918766260147095, -0.34586575627326965, -0.33254384994506836, -0.31922194361686707, -0.30590003728866577, -0.29257816076278687, -0.27925625443458557, -0.2659343481063843, -0.252612441778183, -0.2392905354499817, -0.22596865892410278, -0.2126467525959015, -0.1993248611688614, -0.1860029548406601, -0.17268106341362, -0.1593591570854187, -0.1460372507572174, -0.1327153444290161, -0.11939345300197601, -0.10607155412435532, -0.09274965524673462, -0.07942774891853333, -0.06610585004091263, -0.05278395116329193, -0.03946204483509064, -0.02614014595746994, -0.012818217277526855, 0.0005036834627389908, 0.013825584203004837, 0.027147486805915833, 0.04046938568353653, 0.05379128456115723, 0.06711319088935852, 0.08043508976697922, 0.09375698864459991, 0.10707888752222061, 0.12040078639984131, 0.1337226927280426, 0.1470445990562439, 0.160366490483284, 0.1736883968114853, 0.1870102882385254, 0.20033219456672668, 0.21365410089492798, 0.22697599232196808, 0.24029789865016937, 0.2536197900772095, 0.26694169640541077, 0.28026360273361206, 0.29358550906181335, 0.30690741539001465, 0.32022932171821594, 0.33355122804641724, 0.34687310457229614, 0.36019501090049744, 0.37351691722869873, 0.3868388235569, 0.4001607298851013, 0.4134826064109802]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 6.0, 7.0, 8.0, 18.0, 31.0, 22.0, 33.0, 40.0, 40.0, 44.0, 50.0, 57.0, 59.0, 56.0, 62.0, 70.0, 48.0, 50.0, 50.0, 57.0, 35.0, 41.0, 16.0, 26.0, 21.0, 13.0, 8.0, 9.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17601275444030762, -0.17073889076709747, -0.16546502709388733, -0.16019116342067719, -0.15491729974746704, -0.1496434360742569, -0.14436957240104675, -0.1390957087278366, -0.13382184505462646, -0.12854798138141632, -0.12327411770820618, -0.11800025403499603, -0.11272639036178589, -0.10745252668857574, -0.1021786630153656, -0.09690479934215546, -0.09163093566894531, -0.08635707199573517, -0.08108320832252502, -0.07580934464931488, -0.07053548097610474, -0.06526161730289459, -0.05998775362968445, -0.054713889956474304, -0.04944002628326416, -0.044166162610054016, -0.03889229893684387, -0.03361843526363373, -0.028344571590423584, -0.02307070791721344, -0.017796844244003296, -0.012522980570793152, -0.007249116897583008, -0.0019752532243728638, 0.0032986104488372803, 0.008572474122047424, 0.013846337795257568, 0.019120201468467712, 0.024394065141677856, 0.029667928814888, 0.034941792488098145, 0.04021565616130829, 0.04548951983451843, 0.05076338350772858, 0.05603724718093872, 0.061311110854148865, 0.06658497452735901, 0.07185883820056915, 0.0771327018737793, 0.08240656554698944, 0.08768042922019958, 0.09295429289340973, 0.09822815656661987, 0.10350202023983002, 0.10877588391304016, 0.1140497475862503, 0.11932361125946045, 0.1245974749326706, 0.12987133860588074, 0.13514520227909088, 0.14041906595230103, 0.14569292962551117, 0.1509667932987213, 0.15624065697193146, 0.1615145206451416]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 1.0, 9.0, 6.0, 20.0, 22.0, 31.0, 49.0, 74.0, 144.0, 212.0, 470.0, 1097.0, 3462.0, 18608.0, 257476.0, 692248.0, 63695.0, 7413.0, 2004.0, 699.0, 352.0, 186.0, 93.0, 51.0, 38.0, 32.0, 17.0, 10.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.2540130615234375, -0.245330810546875, -0.2366485595703125, -0.22796630859375, -0.2192840576171875, -0.210601806640625, -0.2019195556640625, -0.1932373046875, -0.1845550537109375, -0.175872802734375, -0.1671905517578125, -0.15850830078125, -0.1498260498046875, -0.141143798828125, -0.1324615478515625, -0.123779296875, -0.1150970458984375, -0.106414794921875, -0.0977325439453125, -0.08905029296875, -0.0803680419921875, -0.071685791015625, -0.0630035400390625, -0.0543212890625, -0.0456390380859375, -0.036956787109375, -0.0282745361328125, -0.01959228515625, -0.0109100341796875, -0.002227783203125, 0.0064544677734375, 0.01513671875, 0.0238189697265625, 0.032501220703125, 0.0411834716796875, 0.04986572265625, 0.0585479736328125, 0.067230224609375, 0.0759124755859375, 0.0845947265625, 0.0932769775390625, 0.101959228515625, 0.1106414794921875, 0.11932373046875, 0.1280059814453125, 0.136688232421875, 0.1453704833984375, 0.154052734375, 0.1627349853515625, 0.171417236328125, 0.1800994873046875, 0.18878173828125, 0.1974639892578125, 0.206146240234375, 0.2148284912109375, 0.2235107421875, 0.2321929931640625, 0.240875244140625, 0.2495574951171875, 0.25823974609375, 0.2669219970703125, 0.275604248046875, 0.2842864990234375, 0.29296875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 2.0, 6.0, 8.0, 16.0, 24.0, 27.0, 35.0, 51.0, 65.0, 61.0, 93.0, 94.0, 84.0, 91.0, 70.0, 74.0, 41.0, 38.0, 41.0, 26.0, 16.0, 9.0, 13.0, 4.0, 3.0, 1.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0435791015625, -0.04249310493469238, -0.041407108306884766, -0.04032111167907715, -0.03923511505126953, -0.038149118423461914, -0.0370631217956543, -0.03597712516784668, -0.03489112854003906, -0.033805131912231445, -0.03271913528442383, -0.03163313865661621, -0.030547142028808594, -0.029461145401000977, -0.02837514877319336, -0.027289152145385742, -0.026203155517578125, -0.025117158889770508, -0.02403116226196289, -0.022945165634155273, -0.021859169006347656, -0.02077317237854004, -0.019687175750732422, -0.018601179122924805, -0.017515182495117188, -0.01642918586730957, -0.015343189239501953, -0.014257192611694336, -0.013171195983886719, -0.012085199356079102, -0.010999202728271484, -0.009913206100463867, -0.00882720947265625, -0.007741212844848633, -0.006655216217041016, -0.0055692195892333984, -0.004483222961425781, -0.003397226333618164, -0.002311229705810547, -0.0012252330780029297, -0.0001392364501953125, 0.0009467601776123047, 0.002032756805419922, 0.003118753433227539, 0.004204750061035156, 0.0052907466888427734, 0.006376743316650391, 0.007462739944458008, 0.008548736572265625, 0.009634733200073242, 0.01072072982788086, 0.011806726455688477, 0.012892723083496094, 0.013978719711303711, 0.015064716339111328, 0.016150712966918945, 0.017236709594726562, 0.01832270622253418, 0.019408702850341797, 0.020494699478149414, 0.02158069610595703, 0.02266669273376465, 0.023752689361572266, 0.024838685989379883, 0.0259246826171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 13.0, 19.0, 29.0, 31.0, 35.0, 70.0, 108.0, 193.0, 267.0, 488.0, 912.0, 1928.0, 4362.0, 12805.0, 53658.0, 302913.0, 514831.0, 119573.0, 23710.0, 6923.0, 2761.0, 1259.0, 632.0, 376.0, 245.0, 134.0, 76.0, 58.0, 31.0, 24.0, 19.0, 8.0, 5.0, 11.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.1700439453125, -0.16547679901123047, -0.16090965270996094, -0.1563425064086914, -0.15177536010742188, -0.14720821380615234, -0.1426410675048828, -0.13807392120361328, -0.13350677490234375, -0.12893962860107422, -0.12437248229980469, -0.11980533599853516, -0.11523818969726562, -0.1106710433959961, -0.10610389709472656, -0.10153675079345703, -0.0969696044921875, -0.09240245819091797, -0.08783531188964844, -0.0832681655883789, -0.07870101928710938, -0.07413387298583984, -0.06956672668457031, -0.06499958038330078, -0.06043243408203125, -0.05586528778076172, -0.05129814147949219, -0.046730995178222656, -0.042163848876953125, -0.037596702575683594, -0.03302955627441406, -0.02846240997314453, -0.023895263671875, -0.01932811737060547, -0.014760971069335938, -0.010193824768066406, -0.005626678466796875, -0.0010595321655273438, 0.0035076141357421875, 0.008074760437011719, 0.01264190673828125, 0.01720905303955078, 0.021776199340820312, 0.026343345642089844, 0.030910491943359375, 0.035477638244628906, 0.04004478454589844, 0.04461193084716797, 0.0491790771484375, 0.05374622344970703, 0.05831336975097656, 0.0628805160522461, 0.06744766235351562, 0.07201480865478516, 0.07658195495605469, 0.08114910125732422, 0.08571624755859375, 0.09028339385986328, 0.09485054016113281, 0.09941768646240234, 0.10398483276367188, 0.1085519790649414, 0.11311912536621094, 0.11768627166748047, 0.12225341796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 6.0, 7.0, 14.0, 25.0, 16.0, 29.0, 25.0, 37.0, 50.0, 42.0, 54.0, 54.0, 47.0, 73.0, 60.0, 68.0, 53.0, 68.0, 39.0, 45.0, 33.0, 37.0, 26.0, 22.0, 16.0, 11.0, 8.0, 6.0, 9.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.1619873046875, -0.1578378677368164, -0.1536884307861328, -0.14953899383544922, -0.14538955688476562, -0.14124011993408203, -0.13709068298339844, -0.13294124603271484, -0.12879180908203125, -0.12464237213134766, -0.12049293518066406, -0.11634349822998047, -0.11219406127929688, -0.10804462432861328, -0.10389518737792969, -0.0997457504272461, -0.0955963134765625, -0.0914468765258789, -0.08729743957519531, -0.08314800262451172, -0.07899856567382812, -0.07484912872314453, -0.07069969177246094, -0.06655025482177734, -0.06240081787109375, -0.058251380920410156, -0.05410194396972656, -0.04995250701904297, -0.045803070068359375, -0.04165363311767578, -0.03750419616699219, -0.033354759216308594, -0.029205322265625, -0.025055885314941406, -0.020906448364257812, -0.01675701141357422, -0.012607574462890625, -0.008458137512207031, -0.0043087005615234375, -0.00015926361083984375, 0.00399017333984375, 0.008139610290527344, 0.012289047241210938, 0.01643848419189453, 0.020587921142578125, 0.02473735809326172, 0.028886795043945312, 0.033036231994628906, 0.0371856689453125, 0.041335105895996094, 0.04548454284667969, 0.04963397979736328, 0.053783416748046875, 0.05793285369873047, 0.06208229064941406, 0.06623172760009766, 0.07038116455078125, 0.07453060150146484, 0.07868003845214844, 0.08282947540283203, 0.08697891235351562, 0.09112834930419922, 0.09527778625488281, 0.0994272232055664, 0.10357666015625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 12.0, 13.0, 13.0, 21.0, 29.0, 44.0, 88.0, 146.0, 255.0, 460.0, 968.0, 2172.0, 6890.0, 29931.0, 202671.0, 602768.0, 166743.0, 25421.0, 5929.0, 2061.0, 920.0, 410.0, 231.0, 135.0, 68.0, 47.0, 32.0, 21.0, 13.0, 12.0, 5.0, 7.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06690788269042969, -0.06484603881835938, -0.06278419494628906, -0.06072235107421875, -0.05866050720214844, -0.056598663330078125, -0.05453681945800781, -0.0524749755859375, -0.05041313171386719, -0.048351287841796875, -0.04628944396972656, -0.04422760009765625, -0.04216575622558594, -0.040103912353515625, -0.03804206848144531, -0.035980224609375, -0.03391838073730469, -0.031856536865234375, -0.029794692993164062, -0.02773284912109375, -0.025671005249023438, -0.023609161376953125, -0.021547317504882812, -0.0194854736328125, -0.017423629760742188, -0.015361785888671875, -0.013299942016601562, -0.01123809814453125, -0.009176254272460938, -0.007114410400390625, -0.0050525665283203125, -0.00299072265625, -0.0009288787841796875, 0.001132965087890625, 0.0031948089599609375, 0.00525665283203125, 0.0073184967041015625, 0.009380340576171875, 0.011442184448242188, 0.0135040283203125, 0.015565872192382812, 0.017627716064453125, 0.019689559936523438, 0.02175140380859375, 0.023813247680664062, 0.025875091552734375, 0.027936935424804688, 0.029998779296875, 0.03206062316894531, 0.034122467041015625, 0.03618431091308594, 0.03824615478515625, 0.04030799865722656, 0.042369842529296875, 0.04443168640136719, 0.0464935302734375, 0.04855537414550781, 0.050617218017578125, 0.05267906188964844, 0.05474090576171875, 0.05680274963378906, 0.058864593505859375, 0.06092643737792969, 0.06298828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 5.0, 7.0, 4.0, 5.0, 3.0, 11.0, 21.0, 20.0, 21.0, 27.0, 32.0, 36.0, 62.0, 56.0, 64.0, 79.0, 80.0, 74.0, 90.0, 53.0, 55.0, 44.0, 43.0, 35.0, 16.0, 20.0, 16.0, 5.0, 2.0, 7.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.963180541992188e-05, -7.576867938041687e-05, -7.190555334091187e-05, -6.804242730140686e-05, -6.417930126190186e-05, -6.031617522239685e-05, -5.6453049182891846e-05, -5.258992314338684e-05, -4.8726797103881836e-05, -4.486367106437683e-05, -4.1000545024871826e-05, -3.713741898536682e-05, -3.3274292945861816e-05, -2.941116690635681e-05, -2.5548040866851807e-05, -2.1684914827346802e-05, -1.7821788787841797e-05, -1.3958662748336792e-05, -1.0095536708831787e-05, -6.232410669326782e-06, -2.3692846298217773e-06, 1.4938414096832275e-06, 5.356967449188232e-06, 9.220093488693237e-06, 1.3083219528198242e-05, 1.6946345567703247e-05, 2.0809471607208252e-05, 2.4672597646713257e-05, 2.8535723686218262e-05, 3.2398849725723267e-05, 3.626197576522827e-05, 4.0125101804733276e-05, 4.398822784423828e-05, 4.7851353883743286e-05, 5.171447992324829e-05, 5.5577605962753296e-05, 5.94407320022583e-05, 6.33038580417633e-05, 6.716698408126831e-05, 7.103011012077332e-05, 7.489323616027832e-05, 7.875636219978333e-05, 8.261948823928833e-05, 8.648261427879333e-05, 9.034574031829834e-05, 9.420886635780334e-05, 9.807199239730835e-05, 0.00010193511843681335, 0.00010579824447631836, 0.00010966137051582336, 0.00011352449655532837, 0.00011738762259483337, 0.00012125074863433838, 0.00012511387467384338, 0.0001289770007133484, 0.0001328401267528534, 0.0001367032527923584, 0.0001405663788318634, 0.0001444295048713684, 0.0001482926309108734, 0.00015215575695037842, 0.00015601888298988342, 0.00015988200902938843, 0.00016374513506889343, 0.00016760826110839844]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 9.0, 13.0, 15.0, 21.0, 36.0, 68.0, 90.0, 127.0, 210.0, 338.0, 541.0, 952.0, 1785.0, 3607.0, 8325.0, 23931.0, 85189.0, 302285.0, 412680.0, 146681.0, 38773.0, 12585.0, 4958.0, 2273.0, 1159.0, 739.0, 401.0, 238.0, 141.0, 122.0, 67.0, 62.0, 30.0, 16.0, 22.0, 11.0, 6.0, 6.0, 8.0, 3.0, 5.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03863525390625, -0.03726530075073242, -0.035895347595214844, -0.034525394439697266, -0.03315544128417969, -0.03178548812866211, -0.03041553497314453, -0.029045581817626953, -0.027675628662109375, -0.026305675506591797, -0.02493572235107422, -0.02356576919555664, -0.022195816040039062, -0.020825862884521484, -0.019455909729003906, -0.018085956573486328, -0.01671600341796875, -0.015346050262451172, -0.013976097106933594, -0.012606143951416016, -0.011236190795898438, -0.00986623764038086, -0.008496284484863281, -0.007126331329345703, -0.005756378173828125, -0.004386425018310547, -0.0030164718627929688, -0.0016465187072753906, -0.0002765655517578125, 0.0010933876037597656, 0.0024633407592773438, 0.003833293914794922, 0.0052032470703125, 0.006573200225830078, 0.007943153381347656, 0.009313106536865234, 0.010683059692382812, 0.01205301284790039, 0.013422966003417969, 0.014792919158935547, 0.016162872314453125, 0.017532825469970703, 0.01890277862548828, 0.02027273178100586, 0.021642684936523438, 0.023012638092041016, 0.024382591247558594, 0.025752544403076172, 0.02712249755859375, 0.028492450714111328, 0.029862403869628906, 0.031232357025146484, 0.03260231018066406, 0.03397226333618164, 0.03534221649169922, 0.0367121696472168, 0.038082122802734375, 0.03945207595825195, 0.04082202911376953, 0.04219198226928711, 0.04356193542480469, 0.044931888580322266, 0.046301841735839844, 0.04767179489135742, 0.049041748046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 7.0, 8.0, 9.0, 17.0, 12.0, 23.0, 33.0, 33.0, 37.0, 40.0, 54.0, 55.0, 77.0, 77.0, 74.0, 71.0, 65.0, 53.0, 44.0, 42.0, 36.0, 27.0, 23.0, 16.0, 18.0, 12.0, 9.0, 6.0, 8.0, 7.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033966064453125, -0.032848358154296875, -0.03173065185546875, -0.030612945556640625, -0.0294952392578125, -0.028377532958984375, -0.02725982666015625, -0.026142120361328125, -0.0250244140625, -0.023906707763671875, -0.02278900146484375, -0.021671295166015625, -0.0205535888671875, -0.019435882568359375, -0.01831817626953125, -0.017200469970703125, -0.016082763671875, -0.014965057373046875, -0.01384735107421875, -0.012729644775390625, -0.0116119384765625, -0.010494232177734375, -0.00937652587890625, -0.008258819580078125, -0.00714111328125, -0.006023406982421875, -0.00490570068359375, -0.003787994384765625, -0.0026702880859375, -0.001552581787109375, -0.00043487548828125, 0.000682830810546875, 0.001800537109375, 0.002918243408203125, 0.00403594970703125, 0.005153656005859375, 0.0062713623046875, 0.007389068603515625, 0.00850677490234375, 0.009624481201171875, 0.0107421875, 0.011859893798828125, 0.01297760009765625, 0.014095306396484375, 0.0152130126953125, 0.016330718994140625, 0.01744842529296875, 0.018566131591796875, 0.019683837890625, 0.020801544189453125, 0.02191925048828125, 0.023036956787109375, 0.0241546630859375, 0.025272369384765625, 0.02639007568359375, 0.027507781982421875, 0.02862548828125, 0.029743194580078125, 0.03086090087890625, 0.031978607177734375, 0.0330963134765625, 0.034214019775390625, 0.03533172607421875, 0.036449432373046875, 0.037567138671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 9.0, 18.0, 35.0, 56.0, 152.0, 227.0, 211.0, 143.0, 73.0, 36.0, 20.0, 7.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.399295687675476, -1.3593984842300415, -1.3195011615753174, -1.2796039581298828, -1.2397066354751587, -1.1998094320297241, -1.159912109375, -1.1200149059295654, -1.0801177024841309, -1.0402204990386963, -1.0003231763839722, -0.9604259133338928, -0.9205286502838135, -0.8806314468383789, -0.8407341837882996, -0.8008369207382202, -0.7609395980834961, -0.7210423350334167, -0.6811450719833374, -0.6412478089332581, -0.6013505458831787, -0.5614533424377441, -0.5215560793876648, -0.48165881633758545, -0.4417615532875061, -0.40186429023742676, -0.3619670271873474, -0.32206979393959045, -0.2821725308895111, -0.24227526783943176, -0.2023780196905136, -0.16248077154159546, -0.12258362770080566, -0.08268637210130692, -0.042789116501808167, -0.0028918609023094177, 0.03700539469718933, 0.07690265774726868, 0.11679990589618683, 0.15669715404510498, 0.19659441709518433, 0.23649168014526367, 0.276388943195343, 0.3162861764431, 0.3561834394931793, 0.39608070254325867, 0.4359779357910156, 0.47587519884109497, 0.5157724618911743, 0.5556697249412537, 0.595566987991333, 0.6354642510414124, 0.6753615140914917, 0.7152587175369263, 0.7551559805870056, 0.795053243637085, 0.8349505066871643, 0.8748477697372437, 0.914745032787323, 0.9546422958374023, 0.9945394992828369, 1.034436821937561, 1.0743340253829956, 1.1142313480377197, 1.1541285514831543]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 7.0, 6.0, 12.0, 6.0, 5.0, 15.0, 22.0, 33.0, 22.0, 43.0, 33.0, 41.0, 36.0, 40.0, 49.0, 57.0, 45.0, 64.0, 58.0, 46.0, 48.0, 50.0, 32.0, 37.0, 31.0, 36.0, 23.0, 21.0, 16.0, 12.0, 12.0, 13.0, 7.0, 3.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8413145542144775, -0.8191577196121216, -0.7970008850097656, -0.7748440504074097, -0.7526872158050537, -0.7305303812026978, -0.7083735466003418, -0.6862167119979858, -0.6640598773956299, -0.6419030427932739, -0.619746208190918, -0.597589373588562, -0.575432538986206, -0.5532757043838501, -0.5311188697814941, -0.5089620351791382, -0.48680517077445984, -0.4646483361721039, -0.4424915015697479, -0.42033466696739197, -0.398177832365036, -0.37602099776268005, -0.3538641333580017, -0.33170729875564575, -0.3095504641532898, -0.28739362955093384, -0.2652367949485779, -0.24307996034622192, -0.22092312574386597, -0.19876629114151, -0.17660944163799286, -0.1544526070356369, -0.13229578733444214, -0.11013895273208618, -0.08798211812973022, -0.06582527607679367, -0.043668441474437714, -0.021511606872081757, 0.0006452351808547974, 0.022802069783210754, 0.04495890438556671, 0.06711573898792267, 0.08927257359027863, 0.11142941564321518, 0.13358625769615173, 0.1557430922985077, 0.17789992690086365, 0.2000567615032196, 0.22221359610557556, 0.24437043070793152, 0.2665272653102875, 0.28868409991264343, 0.3108409345149994, 0.33299776911735535, 0.3551546335220337, 0.37731146812438965, 0.3994683027267456, 0.42162513732910156, 0.4437819719314575, 0.4659388065338135, 0.48809564113616943, 0.5102524757385254, 0.5324093103408813, 0.5545661449432373, 0.5767229795455933]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 4.0, 7.0, 8.0, 7.0, 7.0, 13.0, 16.0, 20.0, 28.0, 27.0, 45.0, 67.0, 68.0, 110.0, 167.0, 248.0, 471.0, 837.0, 1899.0, 5891.0, 30183.0, 482329.0, 3587051.0, 69612.0, 10601.0, 2716.0, 956.0, 442.0, 181.0, 118.0, 66.0, 41.0, 16.0, 7.0, 8.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4013671875, -0.3922843933105469, -0.38320159912109375, -0.3741188049316406, -0.3650360107421875, -0.3559532165527344, -0.34687042236328125, -0.3377876281738281, -0.328704833984375, -0.3196220397949219, -0.31053924560546875, -0.3014564514160156, -0.2923736572265625, -0.2832908630371094, -0.27420806884765625, -0.2651252746582031, -0.25604248046875, -0.24695968627929688, -0.23787689208984375, -0.22879409790039062, -0.2197113037109375, -0.21062850952148438, -0.20154571533203125, -0.19246292114257812, -0.183380126953125, -0.17429733276367188, -0.16521453857421875, -0.15613174438476562, -0.1470489501953125, -0.13796615600585938, -0.12888336181640625, -0.11980056762695312, -0.1107177734375, -0.10163497924804688, -0.09255218505859375, -0.08346939086914062, -0.0743865966796875, -0.06530380249023438, -0.05622100830078125, -0.047138214111328125, -0.038055419921875, -0.028972625732421875, -0.01988983154296875, -0.010807037353515625, -0.0017242431640625, 0.007358551025390625, 0.01644134521484375, 0.025524139404296875, 0.03460693359375, 0.043689727783203125, 0.05277252197265625, 0.061855316162109375, 0.0709381103515625, 0.08002090454101562, 0.08910369873046875, 0.09818649291992188, 0.107269287109375, 0.11635208129882812, 0.12543487548828125, 0.13451766967773438, 0.1436004638671875, 0.15268325805664062, 0.16176605224609375, 0.17084884643554688, 0.179931640625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 10.0, 2.0, 10.0, 17.0, 15.0, 29.0, 37.0, 47.0, 56.0, 87.0, 93.0, 79.0, 95.0, 92.0, 81.0, 59.0, 56.0, 41.0, 25.0, 21.0, 17.0, 9.0, 12.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.045074462890625, -0.0439457893371582, -0.042817115783691406, -0.04168844223022461, -0.04055976867675781, -0.039431095123291016, -0.03830242156982422, -0.03717374801635742, -0.036045074462890625, -0.03491640090942383, -0.03378772735595703, -0.032659053802490234, -0.03153038024902344, -0.03040170669555664, -0.029273033142089844, -0.028144359588623047, -0.02701568603515625, -0.025887012481689453, -0.024758338928222656, -0.02362966537475586, -0.022500991821289062, -0.021372318267822266, -0.02024364471435547, -0.019114971160888672, -0.017986297607421875, -0.016857624053955078, -0.01572895050048828, -0.014600276947021484, -0.013471603393554688, -0.01234292984008789, -0.011214256286621094, -0.010085582733154297, -0.0089569091796875, -0.007828235626220703, -0.006699562072753906, -0.005570888519287109, -0.0044422149658203125, -0.0033135414123535156, -0.0021848678588867188, -0.0010561943054199219, 7.2479248046875e-05, 0.0012011528015136719, 0.0023298263549804688, 0.0034584999084472656, 0.0045871734619140625, 0.005715847015380859, 0.006844520568847656, 0.007973194122314453, 0.00910186767578125, 0.010230541229248047, 0.011359214782714844, 0.01248788833618164, 0.013616561889648438, 0.014745235443115234, 0.01587390899658203, 0.017002582550048828, 0.018131256103515625, 0.019259929656982422, 0.02038860321044922, 0.021517276763916016, 0.022645950317382812, 0.02377462387084961, 0.024903297424316406, 0.026031970977783203, 0.02716064453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 8.0, 9.0, 13.0, 18.0, 28.0, 47.0, 54.0, 86.0, 133.0, 262.0, 651.0, 1680.0, 6490.0, 96922.0, 4057812.0, 24743.0, 3555.0, 1003.0, 382.0, 148.0, 92.0, 46.0, 40.0, 19.0, 11.0, 13.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.650390625, -0.632965087890625, -0.61553955078125, -0.598114013671875, -0.5806884765625, -0.563262939453125, -0.54583740234375, -0.528411865234375, -0.510986328125, -0.493560791015625, -0.47613525390625, -0.458709716796875, -0.4412841796875, -0.423858642578125, -0.40643310546875, -0.389007568359375, -0.37158203125, -0.354156494140625, -0.33673095703125, -0.319305419921875, -0.3018798828125, -0.284454345703125, -0.26702880859375, -0.249603271484375, -0.232177734375, -0.214752197265625, -0.19732666015625, -0.179901123046875, -0.1624755859375, -0.145050048828125, -0.12762451171875, -0.110198974609375, -0.0927734375, -0.075347900390625, -0.05792236328125, -0.040496826171875, -0.0230712890625, -0.005645751953125, 0.01177978515625, 0.029205322265625, 0.046630859375, 0.064056396484375, 0.08148193359375, 0.098907470703125, 0.1163330078125, 0.133758544921875, 0.15118408203125, 0.168609619140625, 0.18603515625, 0.203460693359375, 0.22088623046875, 0.238311767578125, 0.2557373046875, 0.273162841796875, 0.29058837890625, 0.308013916015625, 0.325439453125, 0.342864990234375, 0.36029052734375, 0.377716064453125, 0.3951416015625, 0.412567138671875, 0.42999267578125, 0.447418212890625, 0.46484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 23.0, 52.0, 126.0, 512.0, 2509.0, 575.0, 159.0, 39.0, 36.0, 9.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.232666015625, -0.22777175903320312, -0.22287750244140625, -0.21798324584960938, -0.2130889892578125, -0.20819473266601562, -0.20330047607421875, -0.19840621948242188, -0.193511962890625, -0.18861770629882812, -0.18372344970703125, -0.17882919311523438, -0.1739349365234375, -0.16904067993164062, -0.16414642333984375, -0.15925216674804688, -0.15435791015625, -0.14946365356445312, -0.14456939697265625, -0.13967514038085938, -0.1347808837890625, -0.12988662719726562, -0.12499237060546875, -0.12009811401367188, -0.115203857421875, -0.11030960083007812, -0.10541534423828125, -0.10052108764648438, -0.0956268310546875, -0.09073257446289062, -0.08583831787109375, -0.08094406127929688, -0.0760498046875, -0.07115554809570312, -0.06626129150390625, -0.061367034912109375, -0.0564727783203125, -0.051578521728515625, -0.04668426513671875, -0.041790008544921875, -0.036895751953125, -0.032001495361328125, -0.02710723876953125, -0.022212982177734375, -0.0173187255859375, -0.012424468994140625, -0.00753021240234375, -0.002635955810546875, 0.00225830078125, 0.007152557373046875, 0.01204681396484375, 0.016941070556640625, 0.0218353271484375, 0.026729583740234375, 0.03162384033203125, 0.036518096923828125, 0.041412353515625, 0.046306610107421875, 0.05120086669921875, 0.056095123291015625, 0.0609893798828125, 0.06588363647460938, 0.07077789306640625, 0.07567214965820312, 0.08056640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 16.0, 26.0, 70.0, 166.0, 318.0, 232.0, 103.0, 35.0, 13.0, 4.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.5474777221679688, -1.5157463550567627, -1.484014868736267, -1.452283501625061, -1.4205520153045654, -1.3888206481933594, -1.3570892810821533, -1.3253577947616577, -1.2936264276504517, -1.2618950605392456, -1.23016357421875, -1.198432207107544, -1.166700839996338, -1.1349693536758423, -1.1032379865646362, -1.0715065002441406, -1.0397751331329346, -1.0080437660217285, -0.9763122797012329, -0.9445809125900269, -0.912849485874176, -0.8811180591583252, -0.8493866920471191, -0.8176552653312683, -0.7859238386154175, -0.7541924118995667, -0.7224609851837158, -0.6907296180725098, -0.6589981913566589, -0.6272667646408081, -0.595535397529602, -0.5638039708137512, -0.5320725440979004, -0.5003411173820496, -0.4686097204685211, -0.4368783235549927, -0.40514689683914185, -0.373415470123291, -0.3416840732097626, -0.30995267629623413, -0.2782212495803833, -0.24648983776569366, -0.21475842595100403, -0.1830270141363144, -0.15129560232162476, -0.11956419050693512, -0.08783277869224548, -0.05610136687755585, -0.02436995506286621, 0.007361456751823425, 0.03909286856651306, 0.0708242803812027, 0.10255569219589233, 0.13428710401058197, 0.1660185158252716, 0.19774992763996124, 0.22948133945465088, 0.2612127661705017, 0.29294416308403015, 0.3246755599975586, 0.3564069867134094, 0.38813841342926025, 0.4198698103427887, 0.45160120725631714, 0.48333263397216797]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 13.0, 21.0, 41.0, 53.0, 68.0, 91.0, 103.0, 113.0, 124.0, 111.0, 88.0, 64.0, 55.0, 16.0, 17.0, 12.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7077667713165283, -0.6876403093338013, -0.6675138473510742, -0.6473873853683472, -0.6272609233856201, -0.6071344614028931, -0.587007999420166, -0.566881537437439, -0.5467550754547119, -0.5266286134719849, -0.5065021514892578, -0.48637568950653076, -0.4662492275238037, -0.44612276554107666, -0.4259962737560272, -0.40586981177330017, -0.38574331998825073, -0.3656168580055237, -0.34549039602279663, -0.3253639340400696, -0.30523747205734253, -0.2851110100746155, -0.26498451828956604, -0.244858056306839, -0.22473159432411194, -0.2046051323413849, -0.18447867035865784, -0.1643521934747696, -0.14422573149204254, -0.12409926950931549, -0.10397280007600784, -0.0838463306427002, -0.06371986865997314, -0.043593402951955795, -0.023466937243938446, -0.003340471535921097, 0.016785994172096252, 0.0369124561548233, 0.05703892558813095, 0.0771653950214386, 0.09729185700416565, 0.1174183189868927, 0.13754478096961975, 0.157671257853508, 0.17779771983623505, 0.1979241818189621, 0.21805065870285034, 0.2381771206855774, 0.25830358266830444, 0.2784300446510315, 0.29855650663375854, 0.3186829686164856, 0.33880943059921265, 0.3589358925819397, 0.37906238436698914, 0.3991888463497162, 0.41931530833244324, 0.4394417703151703, 0.45956823229789734, 0.4796946942806244, 0.49982118606567383, 0.5199476480484009, 0.5400741100311279, 0.560200572013855, 0.580327033996582]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 6.0, 7.0, 9.0, 7.0, 7.0, 24.0, 16.0, 25.0, 23.0, 46.0, 59.0, 84.0, 110.0, 185.0, 313.0, 545.0, 1224.0, 3235.0, 14115.0, 112018.0, 665429.0, 219502.0, 23538.0, 4777.0, 1519.0, 672.0, 392.0, 216.0, 132.0, 69.0, 67.0, 40.0, 38.0, 28.0, 17.0, 14.0, 8.0, 8.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2330322265625, -0.2258930206298828, -0.21875381469726562, -0.21161460876464844, -0.20447540283203125, -0.19733619689941406, -0.19019699096679688, -0.1830577850341797, -0.1759185791015625, -0.1687793731689453, -0.16164016723632812, -0.15450096130371094, -0.14736175537109375, -0.14022254943847656, -0.13308334350585938, -0.1259441375732422, -0.118804931640625, -0.11166572570800781, -0.10452651977539062, -0.09738731384277344, -0.09024810791015625, -0.08310890197753906, -0.07596969604492188, -0.06883049011230469, -0.0616912841796875, -0.05455207824707031, -0.047412872314453125, -0.04027366638183594, -0.03313446044921875, -0.025995254516601562, -0.018856048583984375, -0.011716842651367188, -0.00457763671875, 0.0025615692138671875, 0.009700775146484375, 0.016839981079101562, 0.02397918701171875, 0.031118392944335938, 0.038257598876953125, 0.04539680480957031, 0.0525360107421875, 0.05967521667480469, 0.06681442260742188, 0.07395362854003906, 0.08109283447265625, 0.08823204040527344, 0.09537124633789062, 0.10251045227050781, 0.109649658203125, 0.11678886413574219, 0.12392807006835938, 0.13106727600097656, 0.13820648193359375, 0.14534568786621094, 0.15248489379882812, 0.1596240997314453, 0.1667633056640625, 0.1739025115966797, 0.18104171752929688, 0.18818092346191406, 0.19532012939453125, 0.20245933532714844, 0.20959854125976562, 0.2167377471923828, 0.223876953125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 12.0, 10.0, 29.0, 52.0, 78.0, 86.0, 124.0, 132.0, 115.0, 112.0, 89.0, 60.0, 44.0, 27.0, 15.0, 8.0, 4.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07745361328125, -0.07576227188110352, -0.07407093048095703, -0.07237958908081055, -0.07068824768066406, -0.06899690628051758, -0.0673055648803711, -0.06561422348022461, -0.06392288208007812, -0.06223154067993164, -0.060540199279785156, -0.05884885787963867, -0.05715751647949219, -0.0554661750793457, -0.05377483367919922, -0.052083492279052734, -0.05039215087890625, -0.048700809478759766, -0.04700946807861328, -0.0453181266784668, -0.04362678527832031, -0.04193544387817383, -0.040244102478027344, -0.03855276107788086, -0.036861419677734375, -0.03517007827758789, -0.033478736877441406, -0.03178739547729492, -0.030096054077148438, -0.028404712677001953, -0.02671337127685547, -0.025022029876708984, -0.0233306884765625, -0.021639347076416016, -0.01994800567626953, -0.018256664276123047, -0.016565322875976562, -0.014873981475830078, -0.013182640075683594, -0.01149129867553711, -0.009799957275390625, -0.00810861587524414, -0.006417274475097656, -0.004725933074951172, -0.0030345916748046875, -0.0013432502746582031, 0.00034809112548828125, 0.0020394325256347656, 0.00373077392578125, 0.005422115325927734, 0.007113456726074219, 0.008804798126220703, 0.010496139526367188, 0.012187480926513672, 0.013878822326660156, 0.01557016372680664, 0.017261505126953125, 0.01895284652709961, 0.020644187927246094, 0.022335529327392578, 0.024026870727539062, 0.025718212127685547, 0.02740955352783203, 0.029100894927978516, 0.030792236328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 13.0, 7.0, 16.0, 19.0, 29.0, 36.0, 49.0, 90.0, 147.0, 208.0, 437.0, 805.0, 1836.0, 4695.0, 14036.0, 51577.0, 206981.0, 463690.0, 223837.0, 56003.0, 15259.0, 4922.0, 1902.0, 870.0, 460.0, 207.0, 138.0, 79.0, 49.0, 43.0, 22.0, 21.0, 22.0, 10.0, 7.0, 5.0, 6.0, 8.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0794677734375, -0.07635498046875, -0.0732421875, -0.07012939453125, -0.0670166015625, -0.06390380859375, -0.060791015625, -0.05767822265625, -0.0545654296875, -0.05145263671875, -0.04833984375, -0.04522705078125, -0.0421142578125, -0.03900146484375, -0.035888671875, -0.03277587890625, -0.0296630859375, -0.02655029296875, -0.0234375, -0.02032470703125, -0.0172119140625, -0.01409912109375, -0.010986328125, -0.00787353515625, -0.0047607421875, -0.00164794921875, 0.00146484375, 0.00457763671875, 0.0076904296875, 0.01080322265625, 0.013916015625, 0.01702880859375, 0.0201416015625, 0.02325439453125, 0.0263671875, 0.02947998046875, 0.0325927734375, 0.03570556640625, 0.038818359375, 0.04193115234375, 0.0450439453125, 0.04815673828125, 0.05126953125, 0.05438232421875, 0.0574951171875, 0.06060791015625, 0.063720703125, 0.06683349609375, 0.0699462890625, 0.07305908203125, 0.076171875, 0.07928466796875, 0.0823974609375, 0.08551025390625, 0.088623046875, 0.09173583984375, 0.0948486328125, 0.09796142578125, 0.10107421875, 0.10418701171875, 0.1072998046875, 0.11041259765625, 0.113525390625, 0.11663818359375, 0.1197509765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 7.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 12.0, 16.0, 19.0, 20.0, 39.0, 26.0, 23.0, 39.0, 34.0, 36.0, 39.0, 42.0, 47.0, 57.0, 57.0, 50.0, 42.0, 53.0, 49.0, 38.0, 35.0, 33.0, 22.0, 29.0, 20.0, 23.0, 13.0, 14.0, 6.0, 7.0, 10.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07421875, -0.07126235961914062, -0.06830596923828125, -0.06534957885742188, -0.0623931884765625, -0.059436798095703125, -0.05648040771484375, -0.053524017333984375, -0.050567626953125, -0.047611236572265625, -0.04465484619140625, -0.041698455810546875, -0.0387420654296875, -0.035785675048828125, -0.03282928466796875, -0.029872894287109375, -0.02691650390625, -0.023960113525390625, -0.02100372314453125, -0.018047332763671875, -0.0150909423828125, -0.012134552001953125, -0.00917816162109375, -0.006221771240234375, -0.003265380859375, -0.000308990478515625, 0.00264739990234375, 0.005603790283203125, 0.0085601806640625, 0.011516571044921875, 0.01447296142578125, 0.017429351806640625, 0.0203857421875, 0.023342132568359375, 0.02629852294921875, 0.029254913330078125, 0.0322113037109375, 0.035167694091796875, 0.03812408447265625, 0.041080474853515625, 0.044036865234375, 0.046993255615234375, 0.04994964599609375, 0.052906036376953125, 0.0558624267578125, 0.058818817138671875, 0.06177520751953125, 0.06473159790039062, 0.06768798828125, 0.07064437866210938, 0.07360076904296875, 0.07655715942382812, 0.0795135498046875, 0.08246994018554688, 0.08542633056640625, 0.08838272094726562, 0.091339111328125, 0.09429550170898438, 0.09725189208984375, 0.10020828247070312, 0.1031646728515625, 0.10612106323242188, 0.10907745361328125, 0.11203384399414062, 0.114990234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 10.0, 18.0, 28.0, 34.0, 44.0, 90.0, 133.0, 236.0, 413.0, 985.0, 2463.0, 7643.0, 35786.0, 251110.0, 590482.0, 130144.0, 20485.0, 4990.0, 1736.0, 783.0, 362.0, 213.0, 117.0, 68.0, 52.0, 33.0, 26.0, 7.0, 16.0, 9.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.060272216796875, -0.058408260345458984, -0.05654430389404297, -0.05468034744262695, -0.05281639099121094, -0.05095243453979492, -0.049088478088378906, -0.04722452163696289, -0.045360565185546875, -0.04349660873413086, -0.041632652282714844, -0.03976869583129883, -0.03790473937988281, -0.0360407829284668, -0.03417682647705078, -0.032312870025634766, -0.03044891357421875, -0.028584957122802734, -0.02672100067138672, -0.024857044219970703, -0.022993087768554688, -0.021129131317138672, -0.019265174865722656, -0.01740121841430664, -0.015537261962890625, -0.01367330551147461, -0.011809349060058594, -0.009945392608642578, -0.008081436157226562, -0.006217479705810547, -0.004353523254394531, -0.0024895668029785156, -0.0006256103515625, 0.0012383460998535156, 0.0031023025512695312, 0.004966259002685547, 0.0068302154541015625, 0.008694171905517578, 0.010558128356933594, 0.01242208480834961, 0.014286041259765625, 0.01614999771118164, 0.018013954162597656, 0.019877910614013672, 0.021741867065429688, 0.023605823516845703, 0.02546977996826172, 0.027333736419677734, 0.02919769287109375, 0.031061649322509766, 0.03292560577392578, 0.0347895622253418, 0.03665351867675781, 0.03851747512817383, 0.040381431579589844, 0.04224538803100586, 0.044109344482421875, 0.04597330093383789, 0.047837257385253906, 0.04970121383666992, 0.05156517028808594, 0.05342912673950195, 0.05529308319091797, 0.057157039642333984, 0.05902099609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 13.0, 10.0, 16.0, 24.0, 42.0, 46.0, 91.0, 152.0, 151.0, 167.0, 105.0, 70.0, 41.0, 28.0, 21.0, 11.0, 10.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.208917617797852e-05, -8.626189082860947e-05, -8.043460547924042e-05, -7.460732012987137e-05, -6.878003478050232e-05, -6.295274943113327e-05, -5.712546408176422e-05, -5.129817873239517e-05, -4.547089338302612e-05, -3.9643608033657074e-05, -3.3816322684288025e-05, -2.7989037334918976e-05, -2.2161751985549927e-05, -1.6334466636180878e-05, -1.0507181286811829e-05, -4.6798959374427795e-06, 1.1473894119262695e-06, 6.974674761295319e-06, 1.2801960110664368e-05, 1.8629245460033417e-05, 2.4456530809402466e-05, 3.0283816158771515e-05, 3.6111101508140564e-05, 4.193838685750961e-05, 4.776567220687866e-05, 5.359295755624771e-05, 5.942024290561676e-05, 6.524752825498581e-05, 7.107481360435486e-05, 7.690209895372391e-05, 8.272938430309296e-05, 8.8556669652462e-05, 9.438395500183105e-05, 0.0001002112403512001, 0.00010603852570056915, 0.0001118658110499382, 0.00011769309639930725, 0.0001235203817486763, 0.00012934766709804535, 0.0001351749524474144, 0.00014100223779678345, 0.0001468295231461525, 0.00015265680849552155, 0.0001584840938448906, 0.00016431137919425964, 0.0001701386645436287, 0.00017596594989299774, 0.0001817932352423668, 0.00018762052059173584, 0.0001934478059411049, 0.00019927509129047394, 0.000205102376639843, 0.00021092966198921204, 0.00021675694733858109, 0.00022258423268795013, 0.00022841151803731918, 0.00023423880338668823, 0.00024006608873605728, 0.00024589337408542633, 0.0002517206594347954, 0.00025754794478416443, 0.0002633752301335335, 0.0002692025154829025, 0.0002750298008322716, 0.0002808570861816406]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 8.0, 9.0, 10.0, 20.0, 27.0, 40.0, 72.0, 119.0, 217.0, 389.0, 874.0, 1995.0, 5847.0, 22546.0, 117321.0, 495816.0, 323577.0, 60167.0, 12882.0, 3869.0, 1356.0, 645.0, 287.0, 179.0, 95.0, 81.0, 32.0, 17.0, 18.0, 12.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.05926513671875, -0.05765485763549805, -0.056044578552246094, -0.05443429946899414, -0.05282402038574219, -0.051213741302490234, -0.04960346221923828, -0.04799318313598633, -0.046382904052734375, -0.04477262496948242, -0.04316234588623047, -0.041552066802978516, -0.03994178771972656, -0.03833150863647461, -0.036721229553222656, -0.0351109504699707, -0.03350067138671875, -0.0318903923034668, -0.030280113220214844, -0.02866983413696289, -0.027059555053710938, -0.025449275970458984, -0.02383899688720703, -0.022228717803955078, -0.020618438720703125, -0.019008159637451172, -0.01739788055419922, -0.015787601470947266, -0.014177322387695312, -0.01256704330444336, -0.010956764221191406, -0.009346485137939453, -0.0077362060546875, -0.006125926971435547, -0.004515647888183594, -0.0029053688049316406, -0.0012950897216796875, 0.0003151893615722656, 0.0019254684448242188, 0.003535747528076172, 0.005146026611328125, 0.006756305694580078, 0.008366584777832031, 0.009976863861083984, 0.011587142944335938, 0.01319742202758789, 0.014807701110839844, 0.016417980194091797, 0.01802825927734375, 0.019638538360595703, 0.021248817443847656, 0.02285909652709961, 0.024469375610351562, 0.026079654693603516, 0.02768993377685547, 0.029300212860107422, 0.030910491943359375, 0.03252077102661133, 0.03413105010986328, 0.035741329193115234, 0.03735160827636719, 0.03896188735961914, 0.040572166442871094, 0.04218244552612305, 0.043792724609375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 5.0, 5.0, 9.0, 5.0, 17.0, 22.0, 27.0, 25.0, 38.0, 54.0, 60.0, 57.0, 80.0, 80.0, 105.0, 65.0, 83.0, 64.0, 48.0, 31.0, 37.0, 26.0, 18.0, 7.0, 7.0, 6.0, 7.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038543701171875, -0.03738546371459961, -0.03622722625732422, -0.03506898880004883, -0.03391075134277344, -0.03275251388549805, -0.031594276428222656, -0.030436038970947266, -0.029277801513671875, -0.028119564056396484, -0.026961326599121094, -0.025803089141845703, -0.024644851684570312, -0.023486614227294922, -0.02232837677001953, -0.02117013931274414, -0.02001190185546875, -0.01885366439819336, -0.01769542694091797, -0.016537189483642578, -0.015378952026367188, -0.014220714569091797, -0.013062477111816406, -0.011904239654541016, -0.010746002197265625, -0.009587764739990234, -0.008429527282714844, -0.007271289825439453, -0.0061130523681640625, -0.004954814910888672, -0.0037965774536132812, -0.0026383399963378906, -0.0014801025390625, -0.0003218650817871094, 0.0008363723754882812, 0.001994609832763672, 0.0031528472900390625, 0.004311084747314453, 0.005469322204589844, 0.006627559661865234, 0.007785797119140625, 0.008944034576416016, 0.010102272033691406, 0.011260509490966797, 0.012418746948242188, 0.013576984405517578, 0.014735221862792969, 0.01589345932006836, 0.01705169677734375, 0.01820993423461914, 0.01936817169189453, 0.020526409149169922, 0.021684646606445312, 0.022842884063720703, 0.024001121520996094, 0.025159358978271484, 0.026317596435546875, 0.027475833892822266, 0.028634071350097656, 0.029792308807373047, 0.030950546264648438, 0.03210878372192383, 0.03326702117919922, 0.03442525863647461, 0.03558349609375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 2.0, 7.0, 11.0, 23.0, 58.0, 146.0, 241.0, 236.0, 148.0, 72.0, 33.0, 17.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4437568187713623, -1.4069010019302368, -1.3700450658798218, -1.3331892490386963, -1.2963333129882812, -1.2594774961471558, -1.2226215600967407, -1.1857657432556152, -1.1489098072052002, -1.1120539903640747, -1.0751980543136597, -1.0383422374725342, -1.0014863014221191, -0.9646304249763489, -0.9277745485305786, -0.8909187316894531, -0.8540628552436829, -0.8172069787979126, -0.7803511023521423, -0.7434952259063721, -0.7066393494606018, -0.6697834730148315, -0.632927656173706, -0.596071720123291, -0.5592159032821655, -0.5223600268363953, -0.485504150390625, -0.44864827394485474, -0.4117923974990845, -0.3749365210533142, -0.33808067440986633, -0.30122479796409607, -0.2643688917160034, -0.22751301527023315, -0.1906571388244629, -0.15380127727985382, -0.11694540083408356, -0.0800895243883133, -0.043233662843704224, -0.00637778639793396, 0.030478090047836304, 0.06733396649360657, 0.10418983548879623, 0.1410457044839859, 0.17790158092975616, 0.21475745737552643, 0.2516133189201355, 0.28846919536590576, 0.325325071811676, 0.3621809482574463, 0.39903682470321655, 0.4358927011489868, 0.4727485775947571, 0.5096044540405273, 0.5464602708816528, 0.5833162069320679, 0.6201720237731934, 0.6570279002189636, 0.6938837766647339, 0.7307396531105042, 0.7675955295562744, 0.8044514060020447, 0.8413072824478149, 0.8781630992889404, 0.9150190353393555]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 6.0, 4.0, 6.0, 11.0, 12.0, 14.0, 14.0, 18.0, 17.0, 23.0, 33.0, 26.0, 21.0, 39.0, 37.0, 30.0, 40.0, 45.0, 46.0, 37.0, 46.0, 49.0, 36.0, 23.0, 39.0, 43.0, 38.0, 33.0, 26.0, 25.0, 28.0, 20.0, 21.0, 14.0, 16.0, 8.0, 11.0, 6.0, 12.0, 8.0, 8.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.5194609761238098, -0.5045477747917175, -0.48963460326194763, -0.47472140192985535, -0.45980820059776306, -0.44489502906799316, -0.4299818277359009, -0.4150686264038086, -0.4001554250717163, -0.385242223739624, -0.3703290522098541, -0.35541585087776184, -0.34050264954566956, -0.32558947801589966, -0.3106762766838074, -0.2957630753517151, -0.2808499038219452, -0.2659367024898529, -0.251023530960083, -0.23611032962799072, -0.22119712829589844, -0.20628394186496735, -0.19137075543403625, -0.17645755410194397, -0.16154436767101288, -0.1466311812400818, -0.1317179799079895, -0.11680479347705841, -0.10189159959554672, -0.08697840571403503, -0.07206521928310394, -0.057152025401592255, -0.042238831520080566, -0.027325639501214027, -0.012412447482347488, 0.0025007426738739014, 0.01741393655538559, 0.03232713043689728, 0.04724031686782837, 0.06215351074934006, 0.07706670463085175, 0.09197989851236343, 0.10689309239387512, 0.12180627882480621, 0.1367194652557373, 0.1516326665878296, 0.16654585301876068, 0.18145903944969177, 0.19637224078178406, 0.21128542721271515, 0.22619862854480743, 0.24111181497573853, 0.2560250163078308, 0.2709382176399231, 0.285851389169693, 0.3007645905017853, 0.3156777620315552, 0.33059096336364746, 0.34550413489341736, 0.36041733622550964, 0.37533053755760193, 0.3902437090873718, 0.4051569104194641, 0.4200701117515564, 0.4349833130836487]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 9.0, 10.0, 18.0, 22.0, 24.0, 60.0, 81.0, 102.0, 182.0, 352.0, 723.0, 1703.0, 7252.0, 100069.0, 4017243.0, 58228.0, 5476.0, 1392.0, 585.0, 296.0, 142.0, 104.0, 62.0, 47.0, 18.0, 20.0, 12.0, 14.0, 7.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.404052734375, -0.3945274353027344, -0.38500213623046875, -0.3754768371582031, -0.3659515380859375, -0.3564262390136719, -0.34690093994140625, -0.3373756408691406, -0.327850341796875, -0.3183250427246094, -0.30879974365234375, -0.2992744445800781, -0.2897491455078125, -0.2802238464355469, -0.27069854736328125, -0.2611732482910156, -0.25164794921875, -0.24212265014648438, -0.23259735107421875, -0.22307205200195312, -0.2135467529296875, -0.20402145385742188, -0.19449615478515625, -0.18497085571289062, -0.175445556640625, -0.16592025756835938, -0.15639495849609375, -0.14686965942382812, -0.1373443603515625, -0.12781906127929688, -0.11829376220703125, -0.10876846313476562, -0.0992431640625, -0.08971786499023438, -0.08019256591796875, -0.07066726684570312, -0.0611419677734375, -0.051616668701171875, -0.04209136962890625, -0.032566070556640625, -0.023040771484375, -0.013515472412109375, -0.00399017333984375, 0.005535125732421875, 0.0150604248046875, 0.024585723876953125, 0.03411102294921875, 0.043636322021484375, 0.05316162109375, 0.06268692016601562, 0.07221221923828125, 0.08173751831054688, 0.0912628173828125, 0.10078811645507812, 0.11031341552734375, 0.11983871459960938, 0.129364013671875, 0.13888931274414062, 0.14841461181640625, 0.15793991088867188, 0.1674652099609375, 0.17699050903320312, 0.18651580810546875, 0.19604110717773438, 0.20556640625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 9.0, 18.0, 28.0, 39.0, 59.0, 66.0, 114.0, 110.0, 131.0, 125.0, 90.0, 69.0, 54.0, 39.0, 16.0, 14.0, 9.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.07550048828125, -0.07383441925048828, -0.07216835021972656, -0.07050228118896484, -0.06883621215820312, -0.0671701431274414, -0.06550407409667969, -0.06383800506591797, -0.06217193603515625, -0.06050586700439453, -0.05883979797363281, -0.057173728942871094, -0.055507659912109375, -0.053841590881347656, -0.05217552185058594, -0.05050945281982422, -0.0488433837890625, -0.04717731475830078, -0.04551124572753906, -0.043845176696777344, -0.042179107666015625, -0.040513038635253906, -0.03884696960449219, -0.03718090057373047, -0.03551483154296875, -0.03384876251220703, -0.03218269348144531, -0.030516624450683594, -0.028850555419921875, -0.027184486389160156, -0.025518417358398438, -0.02385234832763672, -0.022186279296875, -0.02052021026611328, -0.018854141235351562, -0.017188072204589844, -0.015522003173828125, -0.013855934143066406, -0.012189865112304688, -0.010523796081542969, -0.00885772705078125, -0.007191658020019531, -0.0055255889892578125, -0.0038595199584960938, -0.002193450927734375, -0.0005273818969726562, 0.0011386871337890625, 0.0028047561645507812, 0.0044708251953125, 0.006136894226074219, 0.0078029632568359375, 0.009469032287597656, 0.011135101318359375, 0.012801170349121094, 0.014467239379882812, 0.01613330841064453, 0.01779937744140625, 0.01946544647216797, 0.021131515502929688, 0.022797584533691406, 0.024463653564453125, 0.026129722595214844, 0.027795791625976562, 0.02946186065673828, 0.0311279296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 6.0, 9.0, 11.0, 10.0, 17.0, 20.0, 32.0, 44.0, 59.0, 69.0, 125.0, 192.0, 335.0, 785.0, 1891.0, 5633.0, 21404.0, 105134.0, 3053220.0, 910805.0, 70954.0, 15738.0, 4505.0, 1665.0, 703.0, 333.0, 171.0, 124.0, 76.0, 53.0, 46.0, 28.0, 15.0, 13.0, 12.0, 9.0, 9.0, 6.0, 6.0, 2.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11083984375, -0.10686492919921875, -0.1028900146484375, -0.09891510009765625, -0.094940185546875, -0.09096527099609375, -0.0869903564453125, -0.08301544189453125, -0.07904052734375, -0.07506561279296875, -0.0710906982421875, -0.06711578369140625, -0.063140869140625, -0.05916595458984375, -0.0551910400390625, -0.05121612548828125, -0.0472412109375, -0.04326629638671875, -0.0392913818359375, -0.03531646728515625, -0.031341552734375, -0.02736663818359375, -0.0233917236328125, -0.01941680908203125, -0.01544189453125, -0.01146697998046875, -0.0074920654296875, -0.00351715087890625, 0.000457763671875, 0.00443267822265625, 0.0084075927734375, 0.01238250732421875, 0.016357421875, 0.02033233642578125, 0.0243072509765625, 0.02828216552734375, 0.032257080078125, 0.03623199462890625, 0.0402069091796875, 0.04418182373046875, 0.04815673828125, 0.05213165283203125, 0.0561065673828125, 0.06008148193359375, 0.064056396484375, 0.06803131103515625, 0.0720062255859375, 0.07598114013671875, 0.0799560546875, 0.08393096923828125, 0.0879058837890625, 0.09188079833984375, 0.095855712890625, 0.09983062744140625, 0.1038055419921875, 0.10778045654296875, 0.11175537109375, 0.11573028564453125, 0.1197052001953125, 0.12368011474609375, 0.127655029296875, 0.13162994384765625, 0.1356048583984375, 0.13957977294921875, 0.1435546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 14.0, 18.0, 34.0, 37.0, 78.0, 142.0, 344.0, 1748.0, 1006.0, 298.0, 146.0, 85.0, 43.0, 21.0, 17.0, 10.0, 13.0, 5.0, 4.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05029296875, -0.04848670959472656, -0.046680450439453125, -0.04487419128417969, -0.04306793212890625, -0.04126167297363281, -0.039455413818359375, -0.03764915466308594, -0.0358428955078125, -0.03403663635253906, -0.032230377197265625, -0.030424118041992188, -0.02861785888671875, -0.026811599731445312, -0.025005340576171875, -0.023199081420898438, -0.021392822265625, -0.019586563110351562, -0.017780303955078125, -0.015974044799804688, -0.01416778564453125, -0.012361526489257812, -0.010555267333984375, -0.008749008178710938, -0.0069427490234375, -0.0051364898681640625, -0.003330230712890625, -0.0015239715576171875, 0.00028228759765625, 0.0020885467529296875, 0.003894805908203125, 0.0057010650634765625, 0.00750732421875, 0.009313583374023438, 0.011119842529296875, 0.012926101684570312, 0.01473236083984375, 0.016538619995117188, 0.018344879150390625, 0.020151138305664062, 0.0219573974609375, 0.023763656616210938, 0.025569915771484375, 0.027376174926757812, 0.02918243408203125, 0.030988693237304688, 0.032794952392578125, 0.03460121154785156, 0.036407470703125, 0.03821372985839844, 0.040019989013671875, 0.04182624816894531, 0.04363250732421875, 0.04543876647949219, 0.047245025634765625, 0.04905128479003906, 0.0508575439453125, 0.05266380310058594, 0.054470062255859375, 0.05627632141113281, 0.05808258056640625, 0.05988883972167969, 0.061695098876953125, 0.06350135803222656, 0.0653076171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 12.0, 17.0, 43.0, 91.0, 172.0, 234.0, 190.0, 128.0, 59.0, 22.0, 12.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3411470055580139, -0.3287104666233063, -0.31627392768859863, -0.3038373589515686, -0.29140082001686096, -0.2789642810821533, -0.2665277123451233, -0.25409117341041565, -0.241654634475708, -0.22921809554100037, -0.21678154170513153, -0.2043449878692627, -0.19190844893455505, -0.1794719099998474, -0.16703535616397858, -0.15459880232810974, -0.1421622633934021, -0.12972572445869446, -0.11728917062282562, -0.10485262423753738, -0.09241607785224915, -0.07997953146696091, -0.06754298508167267, -0.05510643869638443, -0.04266989231109619, -0.030233345925807953, -0.017796799540519714, -0.005360253155231476, 0.007076293230056763, 0.019512839615345, 0.03194938600063324, 0.04438593238592148, 0.05682247877120972, 0.06925902515649796, 0.0816955715417862, 0.09413211792707443, 0.10656866431236267, 0.11900521069765091, 0.13144175708293915, 0.14387831091880798, 0.15631484985351562, 0.16875138878822327, 0.1811879426240921, 0.19362449645996094, 0.20606103539466858, 0.21849757432937622, 0.23093412816524506, 0.2433706820011139, 0.25580722093582153, 0.2682437598705292, 0.2806802988052368, 0.29311686754226685, 0.3055534064769745, 0.31798994541168213, 0.33042651414871216, 0.3428630530834198, 0.35529959201812744, 0.3677361309528351, 0.3801726698875427, 0.39260923862457275, 0.4050457775592804, 0.41748231649398804, 0.42991888523101807, 0.4423554241657257, 0.45479196310043335]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 6.0, 7.0, 13.0, 13.0, 17.0, 17.0, 18.0, 29.0, 39.0, 39.0, 38.0, 47.0, 47.0, 53.0, 54.0, 57.0, 61.0, 44.0, 47.0, 45.0, 36.0, 48.0, 37.0, 31.0, 30.0, 19.0, 28.0, 19.0, 10.0, 7.0, 8.0, 7.0, 3.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15105199813842773, -0.14620257914066315, -0.14135314524173737, -0.13650372624397278, -0.131654292345047, -0.1268048733472824, -0.12195544689893723, -0.11710602045059204, -0.11225659400224686, -0.10740716755390167, -0.10255774110555649, -0.0977083146572113, -0.09285889565944672, -0.08800946176052094, -0.08316004276275635, -0.07831061631441116, -0.07346118986606598, -0.0686117634177208, -0.06376233696937561, -0.058912914246320724, -0.05406348779797554, -0.049214061349630356, -0.04436463862657547, -0.039515212178230286, -0.0346657857298851, -0.029816359281539917, -0.024966934695839882, -0.020117510110139847, -0.015268083661794662, -0.010418657213449478, -0.005569232627749443, -0.000719808042049408, 0.004129618406295776, 0.008979043923318386, 0.013828469440340996, 0.01867789402604103, 0.023527320474386215, 0.0283767469227314, 0.033226169645786285, 0.03807559609413147, 0.042925022542476654, 0.04777444899082184, 0.05262387543916702, 0.05747329816222191, 0.06232272461056709, 0.06717215478420258, 0.07202157378196716, 0.07687100023031235, 0.08172042667865753, 0.08656985312700272, 0.0914192795753479, 0.09626870602369308, 0.10111813247203827, 0.10596755146980286, 0.11081697791814804, 0.11566640436649323, 0.12051583081483841, 0.1253652572631836, 0.13021467626094818, 0.13506411015987396, 0.13991352915763855, 0.14476296305656433, 0.14961238205432892, 0.1544618010520935, 0.1593112349510193]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 14.0, 8.0, 19.0, 22.0, 30.0, 40.0, 74.0, 94.0, 168.0, 284.0, 595.0, 1490.0, 5206.0, 35302.0, 430689.0, 519960.0, 45307.0, 6019.0, 1726.0, 719.0, 320.0, 153.0, 84.0, 61.0, 37.0, 35.0, 25.0, 15.0, 11.0, 14.0, 10.0, 4.0, 4.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.202880859375, -0.19538116455078125, -0.1878814697265625, -0.18038177490234375, -0.172882080078125, -0.16538238525390625, -0.1578826904296875, -0.15038299560546875, -0.14288330078125, -0.13538360595703125, -0.1278839111328125, -0.12038421630859375, -0.112884521484375, -0.10538482666015625, -0.0978851318359375, -0.09038543701171875, -0.0828857421875, -0.07538604736328125, -0.0678863525390625, -0.06038665771484375, -0.052886962890625, -0.04538726806640625, -0.0378875732421875, -0.03038787841796875, -0.02288818359375, -0.01538848876953125, -0.0078887939453125, -0.00038909912109375, 0.007110595703125, 0.01461029052734375, 0.0221099853515625, 0.02960968017578125, 0.037109375, 0.04460906982421875, 0.0521087646484375, 0.05960845947265625, 0.067108154296875, 0.07460784912109375, 0.0821075439453125, 0.08960723876953125, 0.09710693359375, 0.10460662841796875, 0.1121063232421875, 0.11960601806640625, 0.127105712890625, 0.13460540771484375, 0.1421051025390625, 0.14960479736328125, 0.1571044921875, 0.16460418701171875, 0.1721038818359375, 0.17960357666015625, 0.187103271484375, 0.19460296630859375, 0.2021026611328125, 0.20960235595703125, 0.21710205078125, 0.22460174560546875, 0.2321014404296875, 0.23960113525390625, 0.247100830078125, 0.25460052490234375, 0.2621002197265625, 0.26959991455078125, 0.277099609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 16.0, 22.0, 33.0, 51.0, 65.0, 80.0, 117.0, 122.0, 128.0, 94.0, 88.0, 57.0, 47.0, 31.0, 15.0, 13.0, 9.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.07086181640625, -0.06928086280822754, -0.06769990921020508, -0.06611895561218262, -0.06453800201416016, -0.0629570484161377, -0.061376094818115234, -0.05979514122009277, -0.05821418762207031, -0.05663323402404785, -0.05505228042602539, -0.05347132682800293, -0.05189037322998047, -0.05030941963195801, -0.04872846603393555, -0.047147512435913086, -0.045566558837890625, -0.043985605239868164, -0.0424046516418457, -0.04082369804382324, -0.03924274444580078, -0.03766179084777832, -0.03608083724975586, -0.0344998836517334, -0.03291893005371094, -0.03133797645568848, -0.029757022857666016, -0.028176069259643555, -0.026595115661621094, -0.025014162063598633, -0.023433208465576172, -0.02185225486755371, -0.02027130126953125, -0.01869034767150879, -0.017109394073486328, -0.015528440475463867, -0.013947486877441406, -0.012366533279418945, -0.010785579681396484, -0.009204626083374023, -0.0076236724853515625, -0.0060427188873291016, -0.004461765289306641, -0.0028808116912841797, -0.0012998580932617188, 0.0002810955047607422, 0.0018620491027832031, 0.003443002700805664, 0.005023956298828125, 0.006604909896850586, 0.008185863494873047, 0.009766817092895508, 0.011347770690917969, 0.01292872428894043, 0.01450967788696289, 0.01609063148498535, 0.017671585083007812, 0.019252538681030273, 0.020833492279052734, 0.022414445877075195, 0.023995399475097656, 0.025576353073120117, 0.027157306671142578, 0.02873826026916504, 0.0303192138671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 9.0, 8.0, 7.0, 14.0, 20.0, 29.0, 40.0, 49.0, 106.0, 136.0, 189.0, 332.0, 487.0, 870.0, 1564.0, 3150.0, 7014.0, 17061.0, 46842.0, 131265.0, 307822.0, 313588.0, 136845.0, 48739.0, 18054.0, 7124.0, 3278.0, 1560.0, 914.0, 490.0, 331.0, 207.0, 142.0, 68.0, 55.0, 48.0, 29.0, 25.0, 10.0, 10.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07147216796875, -0.0691680908203125, -0.066864013671875, -0.0645599365234375, -0.062255859375, -0.0599517822265625, -0.057647705078125, -0.0553436279296875, -0.05303955078125, -0.0507354736328125, -0.048431396484375, -0.0461273193359375, -0.0438232421875, -0.0415191650390625, -0.039215087890625, -0.0369110107421875, -0.03460693359375, -0.0323028564453125, -0.029998779296875, -0.0276947021484375, -0.025390625, -0.0230865478515625, -0.020782470703125, -0.0184783935546875, -0.01617431640625, -0.0138702392578125, -0.011566162109375, -0.0092620849609375, -0.0069580078125, -0.0046539306640625, -0.002349853515625, -4.57763671875e-05, 0.00225830078125, 0.0045623779296875, 0.006866455078125, 0.0091705322265625, 0.011474609375, 0.0137786865234375, 0.016082763671875, 0.0183868408203125, 0.02069091796875, 0.0229949951171875, 0.025299072265625, 0.0276031494140625, 0.0299072265625, 0.0322113037109375, 0.034515380859375, 0.0368194580078125, 0.03912353515625, 0.0414276123046875, 0.043731689453125, 0.0460357666015625, 0.04833984375, 0.0506439208984375, 0.052947998046875, 0.0552520751953125, 0.05755615234375, 0.0598602294921875, 0.062164306640625, 0.0644683837890625, 0.0667724609375, 0.0690765380859375, 0.071380615234375, 0.0736846923828125, 0.07598876953125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 9.0, 5.0, 11.0, 16.0, 13.0, 17.0, 16.0, 19.0, 23.0, 27.0, 35.0, 42.0, 35.0, 39.0, 45.0, 38.0, 40.0, 42.0, 45.0, 35.0, 35.0, 43.0, 37.0, 31.0, 44.0, 40.0, 37.0, 33.0, 21.0, 25.0, 18.0, 17.0, 15.0, 10.0, 12.0, 9.0, 4.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0909423828125, -0.08823776245117188, -0.08553314208984375, -0.08282852172851562, -0.0801239013671875, -0.07741928100585938, -0.07471466064453125, -0.07201004028320312, -0.069305419921875, -0.06660079956054688, -0.06389617919921875, -0.061191558837890625, -0.0584869384765625, -0.055782318115234375, -0.05307769775390625, -0.050373077392578125, -0.04766845703125, -0.044963836669921875, -0.04225921630859375, -0.039554595947265625, -0.0368499755859375, -0.034145355224609375, -0.03144073486328125, -0.028736114501953125, -0.026031494140625, -0.023326873779296875, -0.02062225341796875, -0.017917633056640625, -0.0152130126953125, -0.012508392333984375, -0.00980377197265625, -0.007099151611328125, -0.00439453125, -0.001689910888671875, 0.00101470947265625, 0.003719329833984375, 0.0064239501953125, 0.009128570556640625, 0.01183319091796875, 0.014537811279296875, 0.017242431640625, 0.019947052001953125, 0.02265167236328125, 0.025356292724609375, 0.0280609130859375, 0.030765533447265625, 0.03347015380859375, 0.036174774169921875, 0.03887939453125, 0.041584014892578125, 0.04428863525390625, 0.046993255615234375, 0.0496978759765625, 0.052402496337890625, 0.05510711669921875, 0.057811737060546875, 0.060516357421875, 0.06322097778320312, 0.06592559814453125, 0.06863021850585938, 0.0713348388671875, 0.07403945922851562, 0.07674407958984375, 0.07944869995117188, 0.0821533203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 10.0, 15.0, 37.0, 74.0, 183.0, 598.0, 2808.0, 28780.0, 671160.0, 329322.0, 13211.0, 1715.0, 403.0, 117.0, 75.0, 17.0, 16.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10162353515625, -0.0982198715209961, -0.09481620788574219, -0.09141254425048828, -0.08800888061523438, -0.08460521697998047, -0.08120155334472656, -0.07779788970947266, -0.07439422607421875, -0.07099056243896484, -0.06758689880371094, -0.06418323516845703, -0.060779571533203125, -0.05737590789794922, -0.05397224426269531, -0.050568580627441406, -0.0471649169921875, -0.043761253356933594, -0.04035758972167969, -0.03695392608642578, -0.033550262451171875, -0.03014659881591797, -0.026742935180664062, -0.023339271545410156, -0.01993560791015625, -0.016531944274902344, -0.013128280639648438, -0.009724617004394531, -0.006320953369140625, -0.0029172897338867188, 0.0004863739013671875, 0.0038900375366210938, 0.007293701171875, 0.010697364807128906, 0.014101028442382812, 0.01750469207763672, 0.020908355712890625, 0.02431201934814453, 0.027715682983398438, 0.031119346618652344, 0.03452301025390625, 0.037926673889160156, 0.04133033752441406, 0.04473400115966797, 0.048137664794921875, 0.05154132843017578, 0.05494499206542969, 0.058348655700683594, 0.0617523193359375, 0.0651559829711914, 0.06855964660644531, 0.07196331024169922, 0.07536697387695312, 0.07877063751220703, 0.08217430114746094, 0.08557796478271484, 0.08898162841796875, 0.09238529205322266, 0.09578895568847656, 0.09919261932373047, 0.10259628295898438, 0.10599994659423828, 0.10940361022949219, 0.1128072738647461, 0.1162109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 9.0, 18.0, 25.0, 21.0, 54.0, 77.0, 118.0, 151.0, 126.0, 124.0, 100.0, 67.0, 30.0, 31.0, 14.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002701282501220703, -0.00026387162506580353, -0.00025761500000953674, -0.00025135837495326996, -0.0002451017498970032, -0.0002388451248407364, -0.0002325884997844696, -0.00022633187472820282, -0.00022007524967193604, -0.00021381862461566925, -0.00020756199955940247, -0.00020130537450313568, -0.0001950487494468689, -0.0001887921243906021, -0.00018253549933433533, -0.00017627887427806854, -0.00017002224922180176, -0.00016376562416553497, -0.0001575089991092682, -0.0001512523740530014, -0.00014499574899673462, -0.00013873912394046783, -0.00013248249888420105, -0.00012622587382793427, -0.00011996924877166748, -0.0001137126237154007, -0.00010745599865913391, -0.00010119937360286713, -9.494274854660034e-05, -8.868612349033356e-05, -8.242949843406677e-05, -7.617287337779999e-05, -6.99162483215332e-05, -6.365962326526642e-05, -5.7402998208999634e-05, -5.114637315273285e-05, -4.4889748096466064e-05, -3.863312304019928e-05, -3.2376497983932495e-05, -2.611987292766571e-05, -1.9863247871398926e-05, -1.3606622815132141e-05, -7.3499977588653564e-06, -1.0933727025985718e-06, 5.163252353668213e-06, 1.1419877409934998e-05, 1.7676502466201782e-05, 2.3933127522468567e-05, 3.018975257873535e-05, 3.6446377635002136e-05, 4.270300269126892e-05, 4.8959627747535706e-05, 5.521625280380249e-05, 6.147287786006927e-05, 6.772950291633606e-05, 7.398612797260284e-05, 8.024275302886963e-05, 8.649937808513641e-05, 9.27560031414032e-05, 9.901262819766998e-05, 0.00010526925325393677, 0.00011152587831020355, 0.00011778250336647034, 0.00012403912842273712, 0.0001302957534790039]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 5.0, 2.0, 7.0, 13.0, 18.0, 27.0, 53.0, 84.0, 138.0, 325.0, 672.0, 1674.0, 4890.0, 21675.0, 159620.0, 654757.0, 173023.0, 23141.0, 5264.0, 1725.0, 711.0, 337.0, 162.0, 90.0, 53.0, 33.0, 18.0, 14.0, 9.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07977294921875, -0.07764673233032227, -0.07552051544189453, -0.0733942985534668, -0.07126808166503906, -0.06914186477661133, -0.0670156478881836, -0.06488943099975586, -0.06276321411132812, -0.06063699722290039, -0.058510780334472656, -0.05638456344604492, -0.05425834655761719, -0.05213212966918945, -0.05000591278076172, -0.047879695892333984, -0.04575347900390625, -0.043627262115478516, -0.04150104522705078, -0.03937482833862305, -0.03724861145019531, -0.03512239456176758, -0.032996177673339844, -0.03086996078491211, -0.028743743896484375, -0.02661752700805664, -0.024491310119628906, -0.022365093231201172, -0.020238876342773438, -0.018112659454345703, -0.01598644256591797, -0.013860225677490234, -0.0117340087890625, -0.009607791900634766, -0.007481575012207031, -0.005355358123779297, -0.0032291412353515625, -0.0011029243469238281, 0.0010232925415039062, 0.0031495094299316406, 0.005275726318359375, 0.007401943206787109, 0.009528160095214844, 0.011654376983642578, 0.013780593872070312, 0.015906810760498047, 0.01803302764892578, 0.020159244537353516, 0.02228546142578125, 0.024411678314208984, 0.02653789520263672, 0.028664112091064453, 0.030790328979492188, 0.03291654586791992, 0.035042762756347656, 0.03716897964477539, 0.039295196533203125, 0.04142141342163086, 0.043547630310058594, 0.04567384719848633, 0.04780006408691406, 0.0499262809753418, 0.05205249786376953, 0.054178714752197266, 0.056304931640625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 13.0, 12.0, 24.0, 49.0, 63.0, 100.0, 119.0, 129.0, 137.0, 99.0, 83.0, 59.0, 34.0, 30.0, 13.0, 10.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.08984375, -0.08784246444702148, -0.08584117889404297, -0.08383989334106445, -0.08183860778808594, -0.07983732223510742, -0.0778360366821289, -0.07583475112915039, -0.07383346557617188, -0.07183218002319336, -0.06983089447021484, -0.06782960891723633, -0.06582832336425781, -0.0638270378112793, -0.06182575225830078, -0.059824466705322266, -0.05782318115234375, -0.055821895599365234, -0.05382061004638672, -0.0518193244934082, -0.04981803894042969, -0.04781675338745117, -0.045815467834472656, -0.04381418228149414, -0.041812896728515625, -0.03981161117553711, -0.037810325622558594, -0.03580904006958008, -0.03380775451660156, -0.03180646896362305, -0.02980518341064453, -0.027803897857666016, -0.0258026123046875, -0.023801326751708984, -0.02180004119873047, -0.019798755645751953, -0.017797470092773438, -0.015796184539794922, -0.013794898986816406, -0.01179361343383789, -0.009792327880859375, -0.007791042327880859, -0.005789756774902344, -0.003788471221923828, -0.0017871856689453125, 0.00021409988403320312, 0.0022153854370117188, 0.004216670989990234, 0.00621795654296875, 0.008219242095947266, 0.010220527648925781, 0.012221813201904297, 0.014223098754882812, 0.016224384307861328, 0.018225669860839844, 0.02022695541381836, 0.022228240966796875, 0.02422952651977539, 0.026230812072753906, 0.028232097625732422, 0.030233383178710938, 0.03223466873168945, 0.03423595428466797, 0.036237239837646484, 0.038238525390625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 10.0, 20.0, 43.0, 67.0, 111.0, 189.0, 168.0, 159.0, 102.0, 57.0, 29.0, 18.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1697193384170532, -1.1420021057128906, -1.1142849922180176, -1.086567759513855, -1.058850646018982, -1.0311334133148193, -1.0034162998199463, -0.9756990671157837, -0.9479818344116211, -0.9202646613121033, -0.8925474882125854, -0.8648302555084229, -0.837113082408905, -0.8093959093093872, -0.7816787362098694, -0.7539615631103516, -0.7262443900108337, -0.6985272169113159, -0.6708100438117981, -0.6430928707122803, -0.6153756380081177, -0.5876584649085999, -0.559941291809082, -0.5322241187095642, -0.5045069456100464, -0.47678977251052856, -0.44907256960868835, -0.42135539650917053, -0.3936381936073303, -0.3659210205078125, -0.3382038474082947, -0.31048667430877686, -0.28276944160461426, -0.25505226850509644, -0.22733506560325623, -0.1996178925037384, -0.1719007045030594, -0.14418351650238037, -0.11646634340286255, -0.08874915540218353, -0.06103196740150452, -0.0333147831261158, -0.005597598850727081, 0.022119581699371338, 0.049836769700050354, 0.07755395770072937, 0.10527113080024719, 0.1329883188009262, 0.16070550680160522, 0.18842269480228424, 0.21613988280296326, 0.24385705590248108, 0.2715742588043213, 0.2992914319038391, 0.32700860500335693, 0.35472577810287476, 0.38244298100471497, 0.4101601541042328, 0.437877357006073, 0.4655945301055908, 0.49331170320510864, 0.5210288763046265, 0.5487461090087891, 0.5764632821083069, 0.6041804552078247]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 7.0, 3.0, 12.0, 13.0, 14.0, 14.0, 23.0, 31.0, 30.0, 27.0, 40.0, 44.0, 43.0, 34.0, 50.0, 53.0, 44.0, 61.0, 50.0, 51.0, 43.0, 34.0, 39.0, 34.0, 43.0, 22.0, 25.0, 25.0, 11.0, 12.0, 11.0, 19.0, 11.0, 3.0, 7.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5290791988372803, -0.5125712752342224, -0.4960632920265198, -0.4795553684234619, -0.46304741501808167, -0.4465394616127014, -0.43003150820732117, -0.4135235548019409, -0.39701563119888306, -0.3805076777935028, -0.36399972438812256, -0.3474918007850647, -0.33098384737968445, -0.3144758939743042, -0.29796794056892395, -0.2814599871635437, -0.26495203375816345, -0.2484440803527832, -0.23193614184856415, -0.2154281884431839, -0.19892024993896484, -0.1824122965335846, -0.16590434312820435, -0.1493963897228241, -0.13288845121860504, -0.11638050526380539, -0.09987255930900574, -0.08336460590362549, -0.06685665994882584, -0.050348713994026184, -0.033840760588645935, -0.017332814633846283, -0.0008248686790466309, 0.01568307913839817, 0.03219102695584297, 0.04869897663593292, 0.06520692259073257, 0.08171486854553223, 0.09822282195091248, 0.11473076790571213, 0.13123871386051178, 0.14774666726589203, 0.16425460577011108, 0.18076255917549133, 0.19727051258087158, 0.21377845108509064, 0.2302864044904709, 0.24679434299468994, 0.2633022964000702, 0.27981024980545044, 0.2963182032108307, 0.31282615661621094, 0.3293340802192688, 0.34584203362464905, 0.3623499870300293, 0.37885794043540955, 0.3953658938407898, 0.41187384724617004, 0.4283818006515503, 0.44488972425460815, 0.4613976776599884, 0.47790563106536865, 0.4944135844707489, 0.5109215378761292, 0.527429461479187]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 7.0, 6.0, 9.0, 23.0, 34.0, 54.0, 72.0, 139.0, 275.0, 576.0, 1704.0, 11366.0, 3802910.0, 367854.0, 7044.0, 1310.0, 466.0, 173.0, 105.0, 66.0, 39.0, 23.0, 14.0, 6.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56396484375, -0.5486793518066406, -0.5333938598632812, -0.5181083679199219, -0.5028228759765625, -0.4875373840332031, -0.47225189208984375, -0.4569664001464844, -0.441680908203125, -0.4263954162597656, -0.41110992431640625, -0.3958244323730469, -0.3805389404296875, -0.3652534484863281, -0.34996795654296875, -0.3346824645996094, -0.31939697265625, -0.3041114807128906, -0.28882598876953125, -0.2735404968261719, -0.2582550048828125, -0.24296951293945312, -0.22768402099609375, -0.21239852905273438, -0.197113037109375, -0.18182754516601562, -0.16654205322265625, -0.15125656127929688, -0.1359710693359375, -0.12068557739257812, -0.10540008544921875, -0.09011459350585938, -0.0748291015625, -0.059543609619140625, -0.04425811767578125, -0.028972625732421875, -0.0136871337890625, 0.001598358154296875, 0.01688385009765625, 0.032169342041015625, 0.047454833984375, 0.06274032592773438, 0.07802581787109375, 0.09331130981445312, 0.1085968017578125, 0.12388229370117188, 0.13916778564453125, 0.15445327758789062, 0.16973876953125, 0.18502426147460938, 0.20030975341796875, 0.21559524536132812, 0.2308807373046875, 0.24616622924804688, 0.26145172119140625, 0.2767372131347656, 0.292022705078125, 0.3073081970214844, 0.32259368896484375, 0.3378791809082031, 0.3531646728515625, 0.3684501647949219, 0.38373565673828125, 0.3990211486816406, 0.414306640625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 15.0, 10.0, 21.0, 34.0, 47.0, 49.0, 85.0, 94.0, 101.0, 104.0, 121.0, 89.0, 68.0, 47.0, 40.0, 25.0, 18.0, 11.0, 10.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0692138671875, -0.06768536567687988, -0.06615686416625977, -0.06462836265563965, -0.06309986114501953, -0.061571359634399414, -0.0600428581237793, -0.05851435661315918, -0.05698585510253906, -0.055457353591918945, -0.05392885208129883, -0.05240035057067871, -0.050871849060058594, -0.04934334754943848, -0.04781484603881836, -0.04628634452819824, -0.044757843017578125, -0.04322934150695801, -0.04170083999633789, -0.04017233848571777, -0.038643836975097656, -0.03711533546447754, -0.03558683395385742, -0.034058332443237305, -0.03252983093261719, -0.03100132942199707, -0.029472827911376953, -0.027944326400756836, -0.02641582489013672, -0.0248873233795166, -0.023358821868896484, -0.021830320358276367, -0.02030181884765625, -0.018773317337036133, -0.017244815826416016, -0.0157163143157959, -0.014187812805175781, -0.012659311294555664, -0.011130809783935547, -0.00960230827331543, -0.008073806762695312, -0.006545305252075195, -0.005016803741455078, -0.003488302230834961, -0.0019598007202148438, -0.00043129920959472656, 0.0010972023010253906, 0.002625703811645508, 0.004154205322265625, 0.005682706832885742, 0.007211208343505859, 0.008739709854125977, 0.010268211364746094, 0.011796712875366211, 0.013325214385986328, 0.014853715896606445, 0.016382217407226562, 0.01791071891784668, 0.019439220428466797, 0.020967721939086914, 0.02249622344970703, 0.02402472496032715, 0.025553226470947266, 0.027081727981567383, 0.0286102294921875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 15.0, 14.0, 18.0, 20.0, 26.0, 38.0, 64.0, 69.0, 91.0, 143.0, 198.0, 268.0, 452.0, 701.0, 1230.0, 2517.0, 5906.0, 18162.0, 83952.0, 1737308.0, 2221153.0, 90675.0, 19081.0, 6211.0, 2513.0, 1343.0, 744.0, 450.0, 276.0, 214.0, 120.0, 92.0, 52.0, 43.0, 34.0, 18.0, 15.0, 7.0, 14.0, 9.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1363525390625, -0.13234424591064453, -0.12833595275878906, -0.1243276596069336, -0.12031936645507812, -0.11631107330322266, -0.11230278015136719, -0.10829448699951172, -0.10428619384765625, -0.10027790069580078, -0.09626960754394531, -0.09226131439208984, -0.08825302124023438, -0.0842447280883789, -0.08023643493652344, -0.07622814178466797, -0.0722198486328125, -0.06821155548095703, -0.06420326232910156, -0.060194969177246094, -0.056186676025390625, -0.052178382873535156, -0.04817008972167969, -0.04416179656982422, -0.04015350341796875, -0.03614521026611328, -0.03213691711425781, -0.028128623962402344, -0.024120330810546875, -0.020112037658691406, -0.016103744506835938, -0.012095451354980469, -0.008087158203125, -0.004078865051269531, -7.05718994140625e-05, 0.003937721252441406, 0.007946014404296875, 0.011954307556152344, 0.015962600708007812, 0.01997089385986328, 0.02397918701171875, 0.02798748016357422, 0.03199577331542969, 0.036004066467285156, 0.040012359619140625, 0.044020652770996094, 0.04802894592285156, 0.05203723907470703, 0.0560455322265625, 0.06005382537841797, 0.06406211853027344, 0.0680704116821289, 0.07207870483398438, 0.07608699798583984, 0.08009529113769531, 0.08410358428955078, 0.08811187744140625, 0.09212017059326172, 0.09612846374511719, 0.10013675689697266, 0.10414505004882812, 0.1081533432006836, 0.11216163635253906, 0.11616992950439453, 0.12017822265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 6.0, 18.0, 16.0, 39.0, 50.0, 88.0, 160.0, 395.0, 1297.0, 1240.0, 340.0, 157.0, 83.0, 55.0, 40.0, 20.0, 12.0, 11.0, 8.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08172607421875, -0.07977867126464844, -0.07783126831054688, -0.07588386535644531, -0.07393646240234375, -0.07198905944824219, -0.07004165649414062, -0.06809425354003906, -0.0661468505859375, -0.06419944763183594, -0.062252044677734375, -0.06030464172363281, -0.05835723876953125, -0.05640983581542969, -0.054462432861328125, -0.05251502990722656, -0.050567626953125, -0.04862022399902344, -0.046672821044921875, -0.04472541809082031, -0.04277801513671875, -0.04083061218261719, -0.038883209228515625, -0.03693580627441406, -0.0349884033203125, -0.03304100036621094, -0.031093597412109375, -0.029146194458007812, -0.02719879150390625, -0.025251388549804688, -0.023303985595703125, -0.021356582641601562, -0.0194091796875, -0.017461776733398438, -0.015514373779296875, -0.013566970825195312, -0.01161956787109375, -0.009672164916992188, -0.007724761962890625, -0.0057773590087890625, -0.0038299560546875, -0.0018825531005859375, 6.4849853515625e-05, 0.0020122528076171875, 0.00395965576171875, 0.0059070587158203125, 0.007854461669921875, 0.009801864624023438, 0.011749267578125, 0.013696670532226562, 0.015644073486328125, 0.017591476440429688, 0.01953887939453125, 0.021486282348632812, 0.023433685302734375, 0.025381088256835938, 0.0273284912109375, 0.029275894165039062, 0.031223297119140625, 0.03317070007324219, 0.03511810302734375, 0.03706550598144531, 0.039012908935546875, 0.04096031188964844, 0.04290771484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 23.0, 29.0, 60.0, 156.0, 233.0, 234.0, 125.0, 72.0, 33.0, 12.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5840854644775391, -0.5673457980155945, -0.5506061315536499, -0.5338664650917053, -0.5171267986297607, -0.5003871321678162, -0.48364749550819397, -0.4669078290462494, -0.4501681625843048, -0.43342849612236023, -0.41668882966041565, -0.39994916319847107, -0.3832095265388489, -0.3664698600769043, -0.3497301936149597, -0.33299052715301514, -0.31625086069107056, -0.299511194229126, -0.2827715277671814, -0.2660318613052368, -0.24929220974445343, -0.23255254328250885, -0.21581289172172546, -0.19907322525978088, -0.1823335587978363, -0.16559389233589172, -0.14885422587394714, -0.13211457431316376, -0.11537490785121918, -0.0986352413892746, -0.08189558237791061, -0.06515592336654663, -0.04841625690460205, -0.03167659416794777, -0.014936931431293488, 0.001802731305360794, 0.018542394042015076, 0.035282060503959656, 0.05202171951532364, 0.06876137852668762, 0.0855010449886322, 0.10224071145057678, 0.11898037046194077, 0.13572002947330475, 0.15245969593524933, 0.1691993623971939, 0.1859390139579773, 0.20267868041992188, 0.21941834688186646, 0.23615801334381104, 0.2528976798057556, 0.2696373462677002, 0.2863770127296448, 0.30311667919158936, 0.31985631585121155, 0.33659598231315613, 0.3533356487751007, 0.3700753152370453, 0.38681498169898987, 0.40355464816093445, 0.42029428482055664, 0.4370339512825012, 0.4537736177444458, 0.4705132842063904, 0.48725295066833496]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 16.0, 10.0, 16.0, 22.0, 22.0, 34.0, 36.0, 39.0, 56.0, 58.0, 66.0, 73.0, 49.0, 66.0, 64.0, 56.0, 62.0, 42.0, 41.0, 33.0, 36.0, 27.0, 20.0, 17.0, 13.0, 11.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17734479904174805, -0.17016486823558807, -0.1629849374294281, -0.15580500662326813, -0.14862507581710815, -0.14144514501094818, -0.1342652142047882, -0.12708529829978943, -0.11990536004304886, -0.11272542923688889, -0.10554549843072891, -0.09836557507514954, -0.09118564426898956, -0.08400571346282959, -0.07682578265666962, -0.06964585185050964, -0.06246592104434967, -0.0552859902381897, -0.048106059432029724, -0.04092613235116005, -0.033746201545000076, -0.026566270738840103, -0.01938634365797043, -0.012206412851810455, -0.005026482045650482, 0.0021534478291869164, 0.009333377704024315, 0.01651330664753914, 0.023693237453699112, 0.030873168259859085, 0.03805309534072876, 0.04523302614688873, 0.052412956953048706, 0.05959288775920868, 0.06677281856536865, 0.07395274937152863, 0.0811326801776886, 0.08831261098384857, 0.09549253433942795, 0.10267246514558792, 0.1098523959517479, 0.11703232675790787, 0.12421225756406784, 0.13139218091964722, 0.1385721117258072, 0.14575204253196716, 0.15293197333812714, 0.1601119041442871, 0.16729183495044708, 0.17447176575660706, 0.18165169656276703, 0.188831627368927, 0.19601155817508698, 0.20319148898124695, 0.21037140488624573, 0.2175513505935669, 0.22473126649856567, 0.23191119730472565, 0.23909112811088562, 0.2462710589170456, 0.25345098972320557, 0.26063090562820435, 0.2678108513355255, 0.2749907672405243, 0.28217071294784546]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 8.0, 7.0, 8.0, 19.0, 20.0, 20.0, 41.0, 68.0, 94.0, 210.0, 517.0, 1436.0, 6770.0, 84572.0, 860826.0, 84613.0, 6949.0, 1414.0, 507.0, 182.0, 109.0, 55.0, 35.0, 26.0, 13.0, 15.0, 8.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285400390625, -0.2760429382324219, -0.26668548583984375, -0.2573280334472656, -0.2479705810546875, -0.23861312866210938, -0.22925567626953125, -0.21989822387695312, -0.210540771484375, -0.20118331909179688, -0.19182586669921875, -0.18246841430664062, -0.1731109619140625, -0.16375350952148438, -0.15439605712890625, -0.14503860473632812, -0.13568115234375, -0.12632369995117188, -0.11696624755859375, -0.10760879516601562, -0.0982513427734375, -0.08889389038085938, -0.07953643798828125, -0.07017898559570312, -0.060821533203125, -0.051464080810546875, -0.04210662841796875, -0.032749176025390625, -0.0233917236328125, -0.014034271240234375, -0.00467681884765625, 0.004680633544921875, 0.0140380859375, 0.023395538330078125, 0.03275299072265625, 0.042110443115234375, 0.0514678955078125, 0.060825347900390625, 0.07018280029296875, 0.07954025268554688, 0.088897705078125, 0.09825515747070312, 0.10761260986328125, 0.11697006225585938, 0.1263275146484375, 0.13568496704101562, 0.14504241943359375, 0.15439987182617188, 0.16375732421875, 0.17311477661132812, 0.18247222900390625, 0.19182968139648438, 0.2011871337890625, 0.21054458618164062, 0.21990203857421875, 0.22925949096679688, 0.238616943359375, 0.24797439575195312, 0.25733184814453125, 0.2666893005371094, 0.2760467529296875, 0.2854042053222656, 0.29476165771484375, 0.3041191101074219, 0.3134765625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 18.0, 14.0, 30.0, 48.0, 55.0, 71.0, 94.0, 126.0, 117.0, 109.0, 92.0, 78.0, 51.0, 33.0, 17.0, 18.0, 6.0, 10.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07080078125, -0.06916284561157227, -0.06752490997314453, -0.0658869743347168, -0.06424903869628906, -0.06261110305786133, -0.060973167419433594, -0.05933523178100586, -0.057697296142578125, -0.05605936050415039, -0.054421424865722656, -0.05278348922729492, -0.05114555358886719, -0.04950761795043945, -0.04786968231201172, -0.046231746673583984, -0.04459381103515625, -0.042955875396728516, -0.04131793975830078, -0.03968000411987305, -0.03804206848144531, -0.03640413284301758, -0.034766197204589844, -0.03312826156616211, -0.031490325927734375, -0.02985239028930664, -0.028214454650878906, -0.026576519012451172, -0.024938583374023438, -0.023300647735595703, -0.02166271209716797, -0.020024776458740234, -0.0183868408203125, -0.016748905181884766, -0.015110969543457031, -0.013473033905029297, -0.011835098266601562, -0.010197162628173828, -0.008559226989746094, -0.006921291351318359, -0.005283355712890625, -0.0036454200744628906, -0.0020074844360351562, -0.0003695487976074219, 0.0012683868408203125, 0.002906322479248047, 0.004544258117675781, 0.006182193756103516, 0.00782012939453125, 0.009458065032958984, 0.011096000671386719, 0.012733936309814453, 0.014371871948242188, 0.016009807586669922, 0.017647743225097656, 0.01928567886352539, 0.020923614501953125, 0.02256155014038086, 0.024199485778808594, 0.025837421417236328, 0.027475357055664062, 0.029113292694091797, 0.03075122833251953, 0.032389163970947266, 0.034027099609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 1.0, 6.0, 3.0, 10.0, 9.0, 13.0, 14.0, 38.0, 45.0, 75.0, 84.0, 144.0, 249.0, 436.0, 759.0, 1474.0, 3275.0, 8733.0, 27872.0, 119935.0, 511740.0, 289106.0, 58596.0, 15732.0, 5415.0, 2213.0, 1064.0, 569.0, 335.0, 188.0, 132.0, 88.0, 52.0, 38.0, 34.0, 28.0, 14.0, 12.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.10394287109375, -0.10077095031738281, -0.09759902954101562, -0.09442710876464844, -0.09125518798828125, -0.08808326721191406, -0.08491134643554688, -0.08173942565917969, -0.0785675048828125, -0.07539558410644531, -0.07222366333007812, -0.06905174255371094, -0.06587982177734375, -0.06270790100097656, -0.059535980224609375, -0.05636405944824219, -0.053192138671875, -0.05002021789550781, -0.046848297119140625, -0.04367637634277344, -0.04050445556640625, -0.03733253479003906, -0.034160614013671875, -0.030988693237304688, -0.0278167724609375, -0.024644851684570312, -0.021472930908203125, -0.018301010131835938, -0.01512908935546875, -0.011957168579101562, -0.008785247802734375, -0.0056133270263671875, -0.00244140625, 0.0007305145263671875, 0.003902435302734375, 0.0070743560791015625, 0.01024627685546875, 0.013418197631835938, 0.016590118408203125, 0.019762039184570312, 0.0229339599609375, 0.026105880737304688, 0.029277801513671875, 0.03244972229003906, 0.03562164306640625, 0.03879356384277344, 0.041965484619140625, 0.04513740539550781, 0.048309326171875, 0.05148124694824219, 0.054653167724609375, 0.05782508850097656, 0.06099700927734375, 0.06416893005371094, 0.06734085083007812, 0.07051277160644531, 0.0736846923828125, 0.07685661315917969, 0.08002853393554688, 0.08320045471191406, 0.08637237548828125, 0.08954429626464844, 0.09271621704101562, 0.09588813781738281, 0.09906005859375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 5.0, 10.0, 11.0, 14.0, 16.0, 16.0, 21.0, 30.0, 21.0, 27.0, 45.0, 46.0, 49.0, 39.0, 50.0, 41.0, 50.0, 52.0, 51.0, 45.0, 44.0, 46.0, 48.0, 31.0, 28.0, 23.0, 17.0, 19.0, 16.0, 16.0, 11.0, 15.0, 6.0, 6.0, 5.0, 5.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09698486328125, -0.09399127960205078, -0.09099769592285156, -0.08800411224365234, -0.08501052856445312, -0.0820169448852539, -0.07902336120605469, -0.07602977752685547, -0.07303619384765625, -0.07004261016845703, -0.06704902648925781, -0.0640554428100586, -0.061061859130859375, -0.058068275451660156, -0.05507469177246094, -0.05208110809326172, -0.0490875244140625, -0.04609394073486328, -0.04310035705566406, -0.040106773376464844, -0.037113189697265625, -0.034119606018066406, -0.031126022338867188, -0.02813243865966797, -0.02513885498046875, -0.02214527130126953, -0.019151687622070312, -0.016158103942871094, -0.013164520263671875, -0.010170936584472656, -0.0071773529052734375, -0.004183769226074219, -0.001190185546875, 0.0018033981323242188, 0.0047969818115234375, 0.007790565490722656, 0.010784149169921875, 0.013777732849121094, 0.016771316528320312, 0.01976490020751953, 0.02275848388671875, 0.02575206756591797, 0.028745651245117188, 0.031739234924316406, 0.034732818603515625, 0.037726402282714844, 0.04071998596191406, 0.04371356964111328, 0.0467071533203125, 0.04970073699951172, 0.05269432067871094, 0.055687904357910156, 0.058681488037109375, 0.061675071716308594, 0.06466865539550781, 0.06766223907470703, 0.07065582275390625, 0.07364940643310547, 0.07664299011230469, 0.0796365737915039, 0.08263015747070312, 0.08562374114990234, 0.08861732482910156, 0.09161090850830078, 0.0946044921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 14.0, 24.0, 48.0, 144.0, 349.0, 1428.0, 26958.0, 998073.0, 19719.0, 1215.0, 327.0, 116.0, 59.0, 31.0, 13.0, 11.0, 4.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1968994140625, -0.1906414031982422, -0.18438339233398438, -0.17812538146972656, -0.17186737060546875, -0.16560935974121094, -0.15935134887695312, -0.1530933380126953, -0.1468353271484375, -0.1405773162841797, -0.13431930541992188, -0.12806129455566406, -0.12180328369140625, -0.11554527282714844, -0.10928726196289062, -0.10302925109863281, -0.096771240234375, -0.09051322937011719, -0.08425521850585938, -0.07799720764160156, -0.07173919677734375, -0.06548118591308594, -0.059223175048828125, -0.05296516418457031, -0.0467071533203125, -0.04044914245605469, -0.034191131591796875, -0.027933120727539062, -0.02167510986328125, -0.015417098999023438, -0.009159088134765625, -0.0029010772705078125, 0.00335693359375, 0.009614944458007812, 0.015872955322265625, 0.022130966186523438, 0.02838897705078125, 0.03464698791503906, 0.040904998779296875, 0.04716300964355469, 0.0534210205078125, 0.05967903137207031, 0.06593704223632812, 0.07219505310058594, 0.07845306396484375, 0.08471107482910156, 0.09096908569335938, 0.09722709655761719, 0.103485107421875, 0.10974311828613281, 0.11600112915039062, 0.12225914001464844, 0.12851715087890625, 0.13477516174316406, 0.14103317260742188, 0.1472911834716797, 0.1535491943359375, 0.1598072052001953, 0.16606521606445312, 0.17232322692871094, 0.17858123779296875, 0.18483924865722656, 0.19109725952148438, 0.1973552703857422, 0.20361328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 13.0, 21.0, 32.0, 51.0, 83.0, 134.0, 160.0, 152.0, 130.0, 74.0, 50.0, 31.0, 23.0, 20.0, 6.0, 4.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012230873107910156, -0.00011587515473365784, -0.00010944157838821411, -0.00010300800204277039, -9.657442569732666e-05, -9.014084935188293e-05, -8.370727300643921e-05, -7.727369666099548e-05, -7.084012031555176e-05, -6.440654397010803e-05, -5.797296762466431e-05, -5.153939127922058e-05, -4.5105814933776855e-05, -3.867223858833313e-05, -3.2238662242889404e-05, -2.580508589744568e-05, -1.9371509552001953e-05, -1.2937933206558228e-05, -6.504356861114502e-06, -7.078051567077637e-08, 6.362795829772949e-06, 1.2796372175216675e-05, 1.92299485206604e-05, 2.5663524866104126e-05, 3.209710121154785e-05, 3.853067755699158e-05, 4.49642539024353e-05, 5.139783024787903e-05, 5.7831406593322754e-05, 6.426498293876648e-05, 7.06985592842102e-05, 7.713213562965393e-05, 8.356571197509766e-05, 8.999928832054138e-05, 9.643286466598511e-05, 0.00010286644101142883, 0.00010930001735687256, 0.00011573359370231628, 0.00012216717004776, 0.00012860074639320374, 0.00013503432273864746, 0.0001414678990840912, 0.0001479014754295349, 0.00015433505177497864, 0.00016076862812042236, 0.0001672022044658661, 0.00017363578081130981, 0.00018006935715675354, 0.00018650293350219727, 0.000192936509847641, 0.00019937008619308472, 0.00020580366253852844, 0.00021223723888397217, 0.0002186708152294159, 0.00022510439157485962, 0.00023153796792030334, 0.00023797154426574707, 0.0002444051206111908, 0.0002508386969566345, 0.00025727227330207825, 0.00026370584964752197, 0.0002701394259929657, 0.0002765730023384094, 0.00028300657868385315, 0.0002894401550292969]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 10.0, 17.0, 19.0, 46.0, 61.0, 95.0, 173.0, 356.0, 1371.0, 15161.0, 963336.0, 64138.0, 2698.0, 552.0, 222.0, 114.0, 74.0, 49.0, 23.0, 13.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2354736328125, -0.22905349731445312, -0.22263336181640625, -0.21621322631835938, -0.2097930908203125, -0.20337295532226562, -0.19695281982421875, -0.19053268432617188, -0.184112548828125, -0.17769241333007812, -0.17127227783203125, -0.16485214233398438, -0.1584320068359375, -0.15201187133789062, -0.14559173583984375, -0.13917160034179688, -0.13275146484375, -0.12633132934570312, -0.11991119384765625, -0.11349105834960938, -0.1070709228515625, -0.10065078735351562, -0.09423065185546875, -0.08781051635742188, -0.081390380859375, -0.07497024536132812, -0.06855010986328125, -0.062129974365234375, -0.0557098388671875, -0.049289703369140625, -0.04286956787109375, -0.036449432373046875, -0.030029296875, -0.023609161376953125, -0.01718902587890625, -0.010768890380859375, -0.0043487548828125, 0.002071380615234375, 0.00849151611328125, 0.014911651611328125, 0.021331787109375, 0.027751922607421875, 0.03417205810546875, 0.040592193603515625, 0.0470123291015625, 0.053432464599609375, 0.05985260009765625, 0.06627273559570312, 0.07269287109375, 0.07911300659179688, 0.08553314208984375, 0.09195327758789062, 0.0983734130859375, 0.10479354858398438, 0.11121368408203125, 0.11763381958007812, 0.124053955078125, 0.13047409057617188, 0.13689422607421875, 0.14331436157226562, 0.1497344970703125, 0.15615463256835938, 0.16257476806640625, 0.16899490356445312, 0.1754150390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 10.0, 24.0, 41.0, 162.0, 467.0, 201.0, 56.0, 22.0, 13.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21337890625, -0.20720863342285156, -0.20103836059570312, -0.1948680877685547, -0.18869781494140625, -0.1825275421142578, -0.17635726928710938, -0.17018699645996094, -0.1640167236328125, -0.15784645080566406, -0.15167617797851562, -0.1455059051513672, -0.13933563232421875, -0.1331653594970703, -0.12699508666992188, -0.12082481384277344, -0.114654541015625, -0.10848426818847656, -0.10231399536132812, -0.09614372253417969, -0.08997344970703125, -0.08380317687988281, -0.07763290405273438, -0.07146263122558594, -0.0652923583984375, -0.05912208557128906, -0.052951812744140625, -0.04678153991699219, -0.04061126708984375, -0.03444099426269531, -0.028270721435546875, -0.022100448608398438, -0.01593017578125, -0.009759902954101562, -0.003589630126953125, 0.0025806427001953125, 0.00875091552734375, 0.014921188354492188, 0.021091461181640625, 0.027261734008789062, 0.0334320068359375, 0.03960227966308594, 0.045772552490234375, 0.05194282531738281, 0.05811309814453125, 0.06428337097167969, 0.07045364379882812, 0.07662391662597656, 0.082794189453125, 0.08896446228027344, 0.09513473510742188, 0.10130500793457031, 0.10747528076171875, 0.11364555358886719, 0.11981582641601562, 0.12598609924316406, 0.1321563720703125, 0.13832664489746094, 0.14449691772460938, 0.1506671905517578, 0.15683746337890625, 0.1630077362060547, 0.16917800903320312, 0.17534828186035156, 0.1815185546875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 136.0, 641.0, 186.0, 28.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0024824142456055, -1.8937771320343018, -1.785071849822998, -1.6763665676116943, -1.567661166191101, -1.4589558839797974, -1.3502506017684937, -1.2415452003479004, -1.1328399181365967, -1.024134635925293, -0.9154292941093445, -0.8067240118980408, -0.6980186700820923, -0.5893133878707886, -0.48060810565948486, -0.3719027638435364, -0.26319754123687744, -0.15449222922325134, -0.04578693211078644, 0.06291836500167847, 0.17162367701530457, 0.28032898902893066, 0.3890342712402344, 0.49773961305618286, 0.6064448952674866, 0.7151501774787903, 0.8238555192947388, 0.9325608015060425, 1.0412660837173462, 1.1499714851379395, 1.2586767673492432, 1.3673820495605469, 1.4760873317718506, 1.5847926139831543, 1.693497896194458, 1.8022031784057617, 1.910908579826355, 2.019613742828369, 2.128319263458252, 2.2370245456695557, 2.3457298278808594, 2.454435110092163, 2.563140392303467, 2.6718456745147705, 2.780550956726074, 2.889256477355957, 2.9979615211486816, 3.1066670417785645, 3.215372085571289, 3.3240773677825928, 3.4327826499938965, 3.5414879322052, 3.650193214416504, 3.7588987350463867, 3.8676037788391113, 3.976309299468994, 4.085014820098877, 4.19372034072876, 4.302425384521484, 4.411130905151367, 4.519835948944092, 4.628541469573975, 4.737246513366699, 4.845952033996582, 4.954657077789307]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 9.0, 11.0, 15.0, 14.0, 14.0, 20.0, 34.0, 35.0, 25.0, 33.0, 48.0, 33.0, 40.0, 49.0, 41.0, 49.0, 44.0, 49.0, 50.0, 43.0, 32.0, 30.0, 43.0, 41.0, 26.0, 30.0, 24.0, 19.0, 20.0, 16.0, 12.0, 14.0, 12.0, 3.0, 6.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44944095611572266, -0.43393415212631226, -0.41842737793922424, -0.40292057394981384, -0.38741376996040344, -0.37190699577331543, -0.35640019178390503, -0.34089338779449463, -0.32538658380508423, -0.30987977981567383, -0.2943730056285858, -0.2788662016391754, -0.263359397649765, -0.2478526085615158, -0.2323458194732666, -0.2168390154838562, -0.2013322412967682, -0.18582545220851898, -0.17031864821910858, -0.15481185913085938, -0.13930505514144897, -0.12379826605319977, -0.10829147696495056, -0.09278468042612076, -0.07727788388729095, -0.06177108734846115, -0.046264294534921646, -0.03075750172138214, -0.015250705182552338, 0.0002560913562774658, 0.015762880444526672, 0.031269676983356476, 0.04677647352218628, 0.06228327006101608, 0.07779006659984589, 0.09329685568809509, 0.1088036522269249, 0.1243104487657547, 0.1398172378540039, 0.1553240418434143, 0.1708308309316635, 0.18633762001991272, 0.20184442400932312, 0.21735121309757233, 0.23285800218582153, 0.24836480617523193, 0.26387161016464233, 0.27937838435173035, 0.29488518834114075, 0.31039199233055115, 0.32589876651763916, 0.34140557050704956, 0.35691237449645996, 0.37241917848587036, 0.3879259526729584, 0.4034327566623688, 0.4189395308494568, 0.4344463348388672, 0.4499531090259552, 0.4654599130153656, 0.480966717004776, 0.496473491191864, 0.5119802951812744, 0.5274870991706848, 0.5429939031600952]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 13.0, 5.0, 12.0, 26.0, 49.0, 75.0, 134.0, 210.0, 555.0, 2159.0, 30606.0, 4117331.0, 39198.0, 2710.0, 639.0, 260.0, 117.0, 63.0, 37.0, 29.0, 15.0, 9.0, 4.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.61669921875, -0.6021995544433594, -0.5876998901367188, -0.5732002258300781, -0.5587005615234375, -0.5442008972167969, -0.5297012329101562, -0.5152015686035156, -0.500701904296875, -0.4862022399902344, -0.47170257568359375, -0.4572029113769531, -0.4427032470703125, -0.4282035827636719, -0.41370391845703125, -0.3992042541503906, -0.38470458984375, -0.3702049255371094, -0.35570526123046875, -0.3412055969238281, -0.3267059326171875, -0.3122062683105469, -0.29770660400390625, -0.2832069396972656, -0.268707275390625, -0.2542076110839844, -0.23970794677734375, -0.22520828247070312, -0.2107086181640625, -0.19620895385742188, -0.18170928955078125, -0.16720962524414062, -0.1527099609375, -0.13821029663085938, -0.12371063232421875, -0.10921096801757812, -0.0947113037109375, -0.08021163940429688, -0.06571197509765625, -0.051212310791015625, -0.036712646484375, -0.022212982177734375, -0.00771331787109375, 0.006786346435546875, 0.0212860107421875, 0.035785675048828125, 0.05028533935546875, 0.06478500366210938, 0.07928466796875, 0.09378433227539062, 0.10828399658203125, 0.12278366088867188, 0.1372833251953125, 0.15178298950195312, 0.16628265380859375, 0.18078231811523438, 0.195281982421875, 0.20978164672851562, 0.22428131103515625, 0.23878097534179688, 0.2532806396484375, 0.2677803039550781, 0.28227996826171875, 0.2967796325683594, 0.311279296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 22.0, 21.0, 39.0, 65.0, 74.0, 79.0, 101.0, 112.0, 105.0, 96.0, 85.0, 65.0, 47.0, 30.0, 16.0, 15.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07623291015625, -0.07448959350585938, -0.07274627685546875, -0.07100296020507812, -0.0692596435546875, -0.06751632690429688, -0.06577301025390625, -0.06402969360351562, -0.062286376953125, -0.060543060302734375, -0.05879974365234375, -0.057056427001953125, -0.0553131103515625, -0.053569793701171875, -0.05182647705078125, -0.050083160400390625, -0.04833984375, -0.046596527099609375, -0.04485321044921875, -0.043109893798828125, -0.0413665771484375, -0.039623260498046875, -0.03787994384765625, -0.036136627197265625, -0.034393310546875, -0.032649993896484375, -0.03090667724609375, -0.029163360595703125, -0.0274200439453125, -0.025676727294921875, -0.02393341064453125, -0.022190093994140625, -0.02044677734375, -0.018703460693359375, -0.01696014404296875, -0.015216827392578125, -0.0134735107421875, -0.011730194091796875, -0.00998687744140625, -0.008243560791015625, -0.006500244140625, -0.004756927490234375, -0.00301361083984375, -0.001270294189453125, 0.0004730224609375, 0.002216339111328125, 0.00395965576171875, 0.005702972412109375, 0.0074462890625, 0.009189605712890625, 0.01093292236328125, 0.012676239013671875, 0.0144195556640625, 0.016162872314453125, 0.01790618896484375, 0.019649505615234375, 0.021392822265625, 0.023136138916015625, 0.02487945556640625, 0.026622772216796875, 0.0283660888671875, 0.030109405517578125, 0.03185272216796875, 0.033596038818359375, 0.03533935546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 5.0, 13.0, 22.0, 42.0, 30.0, 38.0, 59.0, 94.0, 117.0, 152.0, 224.0, 281.0, 407.0, 581.0, 1016.0, 1729.0, 4240.0, 13320.0, 64368.0, 2674074.0, 1357185.0, 56030.0, 11867.0, 3827.0, 1622.0, 919.0, 521.0, 381.0, 313.0, 212.0, 152.0, 126.0, 83.0, 68.0, 46.0, 28.0, 23.0, 15.0, 12.0, 10.0, 4.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1640625, -0.15937042236328125, -0.1546783447265625, -0.14998626708984375, -0.145294189453125, -0.14060211181640625, -0.1359100341796875, -0.13121795654296875, -0.12652587890625, -0.12183380126953125, -0.1171417236328125, -0.11244964599609375, -0.107757568359375, -0.10306549072265625, -0.0983734130859375, -0.09368133544921875, -0.0889892578125, -0.08429718017578125, -0.0796051025390625, -0.07491302490234375, -0.070220947265625, -0.06552886962890625, -0.0608367919921875, -0.05614471435546875, -0.05145263671875, -0.04676055908203125, -0.0420684814453125, -0.03737640380859375, -0.032684326171875, -0.02799224853515625, -0.0233001708984375, -0.01860809326171875, -0.013916015625, -0.00922393798828125, -0.0045318603515625, 0.00016021728515625, 0.004852294921875, 0.00954437255859375, 0.0142364501953125, 0.01892852783203125, 0.02362060546875, 0.02831268310546875, 0.0330047607421875, 0.03769683837890625, 0.042388916015625, 0.04708099365234375, 0.0517730712890625, 0.05646514892578125, 0.0611572265625, 0.06584930419921875, 0.0705413818359375, 0.07523345947265625, 0.079925537109375, 0.08461761474609375, 0.0893096923828125, 0.09400177001953125, 0.09869384765625, 0.10338592529296875, 0.1080780029296875, 0.11277008056640625, 0.117462158203125, 0.12215423583984375, 0.1268463134765625, 0.13153839111328125, 0.13623046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 10.0, 17.0, 26.0, 38.0, 54.0, 113.0, 326.0, 1909.0, 1116.0, 257.0, 97.0, 46.0, 22.0, 19.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.085205078125, -0.08289623260498047, -0.08058738708496094, -0.0782785415649414, -0.07596969604492188, -0.07366085052490234, -0.07135200500488281, -0.06904315948486328, -0.06673431396484375, -0.06442546844482422, -0.06211662292480469, -0.059807777404785156, -0.057498931884765625, -0.055190086364746094, -0.05288124084472656, -0.05057239532470703, -0.0482635498046875, -0.04595470428466797, -0.04364585876464844, -0.041337013244628906, -0.039028167724609375, -0.036719322204589844, -0.03441047668457031, -0.03210163116455078, -0.02979278564453125, -0.02748394012451172, -0.025175094604492188, -0.022866249084472656, -0.020557403564453125, -0.018248558044433594, -0.015939712524414062, -0.013630867004394531, -0.011322021484375, -0.009013175964355469, -0.0067043304443359375, -0.004395484924316406, -0.002086639404296875, 0.00022220611572265625, 0.0025310516357421875, 0.004839897155761719, 0.00714874267578125, 0.009457588195800781, 0.011766433715820312, 0.014075279235839844, 0.016384124755859375, 0.018692970275878906, 0.021001815795898438, 0.02331066131591797, 0.0256195068359375, 0.02792835235595703, 0.030237197875976562, 0.032546043395996094, 0.034854888916015625, 0.037163734436035156, 0.03947257995605469, 0.04178142547607422, 0.04409027099609375, 0.04639911651611328, 0.04870796203613281, 0.051016807556152344, 0.053325653076171875, 0.055634498596191406, 0.05794334411621094, 0.06025218963623047, 0.06256103515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 6.0, 2.0, 5.0, 15.0, 23.0, 29.0, 58.0, 120.0, 155.0, 183.0, 157.0, 104.0, 67.0, 30.0, 16.0, 17.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4670237600803375, -0.45588675141334534, -0.44474974274635315, -0.43361273407936096, -0.4224757254123688, -0.4113387167453766, -0.400201678276062, -0.3890646696090698, -0.37792766094207764, -0.36679065227508545, -0.35565364360809326, -0.3445166349411011, -0.3333796262741089, -0.3222426176071167, -0.3111056089401245, -0.2999686002731323, -0.28883159160614014, -0.27769458293914795, -0.26655757427215576, -0.2554205656051636, -0.2442835569381714, -0.2331465482711792, -0.22200952470302582, -0.21087251603603363, -0.19973550736904144, -0.18859849870204926, -0.17746149003505707, -0.1663244664669037, -0.1551874577999115, -0.1440504491329193, -0.13291344046592712, -0.12177643179893494, -0.11063945293426514, -0.09950244426727295, -0.08836543560028076, -0.07722841948270798, -0.06609141081571579, -0.0549544021487236, -0.04381738603115082, -0.03268037736415863, -0.021543368697166443, -0.010406358167529106, 0.0007306523621082306, 0.011867664754390717, 0.023004673421382904, 0.03414168208837509, 0.045278698205947876, 0.056415706872940063, 0.06755271553993225, 0.07868972420692444, 0.08982673287391663, 0.10096374899148941, 0.1121007576584816, 0.12323776632547379, 0.13437478244304657, 0.14551179111003876, 0.15664879977703094, 0.16778580844402313, 0.17892281711101532, 0.1900598406791687, 0.2011968493461609, 0.21233385801315308, 0.22347086668014526, 0.23460787534713745, 0.24574488401412964]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 9.0, 9.0, 19.0, 18.0, 35.0, 31.0, 37.0, 48.0, 67.0, 68.0, 63.0, 75.0, 73.0, 58.0, 63.0, 61.0, 58.0, 47.0, 43.0, 32.0, 26.0, 22.0, 15.0, 9.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.24328351020812988, -0.2361203283071518, -0.2289571464061737, -0.22179394960403442, -0.21463076770305634, -0.20746758580207825, -0.20030438899993896, -0.19314120709896088, -0.1859780251979828, -0.1788148432970047, -0.1716516613960266, -0.16448846459388733, -0.15732528269290924, -0.15016210079193115, -0.14299890398979187, -0.13583572208881378, -0.1286725401878357, -0.1215093582868576, -0.11434616893529892, -0.10718297958374023, -0.10001979768276215, -0.09285661578178406, -0.08569342643022537, -0.07853023707866669, -0.0713670551776886, -0.06420387327671051, -0.057040683925151825, -0.04987749829888344, -0.04271431267261505, -0.035551127046346664, -0.028387941420078278, -0.02122475579380989, -0.014061570167541504, -0.006898384541273117, 0.0002648010849952698, 0.007427986711263657, 0.014591172337532043, 0.02175435796380043, 0.028917543590068817, 0.036080729216337204, 0.04324391484260559, 0.05040710046887398, 0.057570286095142365, 0.06473347544670105, 0.07189665734767914, 0.07905983924865723, 0.08622302860021591, 0.0933862179517746, 0.10054939985275269, 0.10771258175373077, 0.11487577110528946, 0.12203896045684814, 0.12920214235782623, 0.13636532425880432, 0.1435285210609436, 0.1506917029619217, 0.15785488486289978, 0.16501806676387787, 0.17218124866485596, 0.17934444546699524, 0.18650762736797333, 0.19367080926895142, 0.2008340060710907, 0.2079971879720688, 0.21516036987304688]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 17.0, 23.0, 31.0, 27.0, 51.0, 92.0, 139.0, 279.0, 720.0, 2293.0, 14140.0, 201586.0, 762140.0, 58718.0, 5982.0, 1301.0, 482.0, 175.0, 118.0, 69.0, 49.0, 27.0, 25.0, 10.0, 10.0, 13.0, 4.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.254638671875, -0.2462310791015625, -0.237823486328125, -0.2294158935546875, -0.22100830078125, -0.2126007080078125, -0.204193115234375, -0.1957855224609375, -0.1873779296875, -0.1789703369140625, -0.170562744140625, -0.1621551513671875, -0.15374755859375, -0.1453399658203125, -0.136932373046875, -0.1285247802734375, -0.1201171875, -0.1117095947265625, -0.103302001953125, -0.0948944091796875, -0.08648681640625, -0.0780792236328125, -0.069671630859375, -0.0612640380859375, -0.0528564453125, -0.0444488525390625, -0.036041259765625, -0.0276336669921875, -0.01922607421875, -0.0108184814453125, -0.002410888671875, 0.0059967041015625, 0.014404296875, 0.0228118896484375, 0.031219482421875, 0.0396270751953125, 0.04803466796875, 0.0564422607421875, 0.064849853515625, 0.0732574462890625, 0.0816650390625, 0.0900726318359375, 0.098480224609375, 0.1068878173828125, 0.11529541015625, 0.1237030029296875, 0.132110595703125, 0.1405181884765625, 0.14892578125, 0.1573333740234375, 0.165740966796875, 0.1741485595703125, 0.18255615234375, 0.1909637451171875, 0.199371337890625, 0.2077789306640625, 0.2161865234375, 0.2245941162109375, 0.233001708984375, 0.2414093017578125, 0.24981689453125, 0.2582244873046875, 0.266632080078125, 0.2750396728515625, 0.283447265625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 12.0, 23.0, 37.0, 51.0, 61.0, 86.0, 102.0, 101.0, 93.0, 107.0, 89.0, 70.0, 65.0, 34.0, 25.0, 16.0, 10.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08001708984375, -0.07820653915405273, -0.07639598846435547, -0.0745854377746582, -0.07277488708496094, -0.07096433639526367, -0.0691537857055664, -0.06734323501586914, -0.06553268432617188, -0.06372213363647461, -0.061911582946777344, -0.06010103225708008, -0.05829048156738281, -0.05647993087768555, -0.05466938018798828, -0.052858829498291016, -0.05104827880859375, -0.049237728118896484, -0.04742717742919922, -0.04561662673950195, -0.04380607604980469, -0.04199552536010742, -0.040184974670410156, -0.03837442398071289, -0.036563873291015625, -0.03475332260131836, -0.032942771911621094, -0.031132221221923828, -0.029321670532226562, -0.027511119842529297, -0.02570056915283203, -0.023890018463134766, -0.0220794677734375, -0.020268917083740234, -0.01845836639404297, -0.016647815704345703, -0.014837265014648438, -0.013026714324951172, -0.011216163635253906, -0.00940561294555664, -0.007595062255859375, -0.005784511566162109, -0.003973960876464844, -0.002163410186767578, -0.0003528594970703125, 0.0014576911926269531, 0.0032682418823242188, 0.005078792572021484, 0.00688934326171875, 0.008699893951416016, 0.010510444641113281, 0.012320995330810547, 0.014131546020507812, 0.015942096710205078, 0.017752647399902344, 0.01956319808959961, 0.021373748779296875, 0.02318429946899414, 0.024994850158691406, 0.026805400848388672, 0.028615951538085938, 0.030426502227783203, 0.03223705291748047, 0.034047603607177734, 0.035858154296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 5.0, 6.0, 4.0, 12.0, 11.0, 20.0, 27.0, 35.0, 45.0, 93.0, 129.0, 213.0, 378.0, 752.0, 1672.0, 4857.0, 17039.0, 71477.0, 344731.0, 469070.0, 103232.0, 23838.0, 6675.0, 2190.0, 924.0, 406.0, 247.0, 146.0, 89.0, 72.0, 62.0, 20.0, 26.0, 17.0, 11.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08984375, -0.08675861358642578, -0.08367347717285156, -0.08058834075927734, -0.07750320434570312, -0.0744180679321289, -0.07133293151855469, -0.06824779510498047, -0.06516265869140625, -0.06207752227783203, -0.05899238586425781, -0.055907249450683594, -0.052822113037109375, -0.049736976623535156, -0.04665184020996094, -0.04356670379638672, -0.0404815673828125, -0.03739643096923828, -0.03431129455566406, -0.031226158142089844, -0.028141021728515625, -0.025055885314941406, -0.021970748901367188, -0.01888561248779297, -0.01580047607421875, -0.012715339660644531, -0.009630203247070312, -0.006545066833496094, -0.003459930419921875, -0.00037479400634765625, 0.0027103424072265625, 0.005795478820800781, 0.008880615234375, 0.011965751647949219, 0.015050888061523438, 0.018136024475097656, 0.021221160888671875, 0.024306297302246094, 0.027391433715820312, 0.03047657012939453, 0.03356170654296875, 0.03664684295654297, 0.03973197937011719, 0.042817115783691406, 0.045902252197265625, 0.048987388610839844, 0.05207252502441406, 0.05515766143798828, 0.0582427978515625, 0.06132793426513672, 0.06441307067871094, 0.06749820709228516, 0.07058334350585938, 0.0736684799194336, 0.07675361633300781, 0.07983875274658203, 0.08292388916015625, 0.08600902557373047, 0.08909416198730469, 0.0921792984008789, 0.09526443481445312, 0.09834957122802734, 0.10143470764160156, 0.10451984405517578, 0.10760498046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 4.0, 10.0, 12.0, 14.0, 25.0, 25.0, 20.0, 28.0, 31.0, 42.0, 45.0, 50.0, 39.0, 42.0, 59.0, 45.0, 41.0, 40.0, 47.0, 62.0, 42.0, 38.0, 29.0, 32.0, 22.0, 21.0, 30.0, 14.0, 12.0, 16.0, 8.0, 7.0, 7.0, 12.0, 7.0, 2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.105224609375, -0.10218143463134766, -0.09913825988769531, -0.09609508514404297, -0.09305191040039062, -0.09000873565673828, -0.08696556091308594, -0.0839223861694336, -0.08087921142578125, -0.0778360366821289, -0.07479286193847656, -0.07174968719482422, -0.06870651245117188, -0.06566333770751953, -0.06262016296386719, -0.059576988220214844, -0.0565338134765625, -0.053490638732910156, -0.05044746398925781, -0.04740428924560547, -0.044361114501953125, -0.04131793975830078, -0.03827476501464844, -0.035231590270996094, -0.03218841552734375, -0.029145240783691406, -0.026102066040039062, -0.02305889129638672, -0.020015716552734375, -0.01697254180908203, -0.013929367065429688, -0.010886192321777344, -0.007843017578125, -0.004799842834472656, -0.0017566680908203125, 0.0012865066528320312, 0.004329681396484375, 0.007372856140136719, 0.010416030883789062, 0.013459205627441406, 0.01650238037109375, 0.019545555114746094, 0.022588729858398438, 0.02563190460205078, 0.028675079345703125, 0.03171825408935547, 0.03476142883300781, 0.037804603576660156, 0.0408477783203125, 0.043890953063964844, 0.04693412780761719, 0.04997730255126953, 0.053020477294921875, 0.05606365203857422, 0.05910682678222656, 0.062150001525878906, 0.06519317626953125, 0.0682363510131836, 0.07127952575683594, 0.07432270050048828, 0.07736587524414062, 0.08040904998779297, 0.08345222473144531, 0.08649539947509766, 0.08953857421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 9.0, 12.0, 20.0, 46.0, 63.0, 99.0, 211.0, 444.0, 1025.0, 3381.0, 15533.0, 104711.0, 608490.0, 269137.0, 35954.0, 6406.0, 1739.0, 598.0, 284.0, 161.0, 92.0, 52.0, 31.0, 20.0, 11.0, 9.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046630859375, -0.04520606994628906, -0.043781280517578125, -0.04235649108886719, -0.04093170166015625, -0.03950691223144531, -0.038082122802734375, -0.03665733337402344, -0.0352325439453125, -0.03380775451660156, -0.032382965087890625, -0.030958175659179688, -0.02953338623046875, -0.028108596801757812, -0.026683807373046875, -0.025259017944335938, -0.023834228515625, -0.022409439086914062, -0.020984649658203125, -0.019559860229492188, -0.01813507080078125, -0.016710281372070312, -0.015285491943359375, -0.013860702514648438, -0.0124359130859375, -0.011011123657226562, -0.009586334228515625, -0.008161544799804688, -0.00673675537109375, -0.0053119659423828125, -0.003887176513671875, -0.0024623870849609375, -0.00103759765625, 0.0003871917724609375, 0.001811981201171875, 0.0032367706298828125, 0.00466156005859375, 0.0060863494873046875, 0.007511138916015625, 0.008935928344726562, 0.0103607177734375, 0.011785507202148438, 0.013210296630859375, 0.014635086059570312, 0.01605987548828125, 0.017484664916992188, 0.018909454345703125, 0.020334243774414062, 0.021759033203125, 0.023183822631835938, 0.024608612060546875, 0.026033401489257812, 0.02745819091796875, 0.028882980346679688, 0.030307769775390625, 0.03173255920410156, 0.0331573486328125, 0.03458213806152344, 0.036006927490234375, 0.03743171691894531, 0.03885650634765625, 0.04028129577636719, 0.041706085205078125, 0.04313087463378906, 0.0445556640625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 11.0, 11.0, 14.0, 30.0, 44.0, 58.0, 76.0, 107.0, 127.0, 123.0, 98.0, 93.0, 67.0, 38.0, 35.0, 22.0, 15.0, 11.0, 10.0, 11.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002300739288330078, -0.00022510718554258347, -0.00022014044225215912, -0.00021517369896173477, -0.00021020695567131042, -0.00020524021238088608, -0.00020027346909046173, -0.00019530672580003738, -0.00019033998250961304, -0.0001853732392191887, -0.00018040649592876434, -0.00017543975263834, -0.00017047300934791565, -0.0001655062660574913, -0.00016053952276706696, -0.0001555727794766426, -0.00015060603618621826, -0.00014563929289579391, -0.00014067254960536957, -0.00013570580631494522, -0.00013073906302452087, -0.00012577231973409653, -0.00012080557644367218, -0.00011583883315324783, -0.00011087208986282349, -0.00010590534657239914, -0.00010093860328197479, -9.597185999155045e-05, -9.10051167011261e-05, -8.603837341070175e-05, -8.10716301202774e-05, -7.610488682985306e-05, -7.113814353942871e-05, -6.617140024900436e-05, -6.120465695858002e-05, -5.623791366815567e-05, -5.127117037773132e-05, -4.6304427087306976e-05, -4.133768379688263e-05, -3.637094050645828e-05, -3.1404197216033936e-05, -2.643745392560959e-05, -2.1470710635185242e-05, -1.6503967344760895e-05, -1.1537224054336548e-05, -6.570480763912201e-06, -1.603737473487854e-06, 3.363005816936493e-06, 8.32974910736084e-06, 1.3296492397785187e-05, 1.8263235688209534e-05, 2.322997897863388e-05, 2.8196722269058228e-05, 3.3163465559482574e-05, 3.813020884990692e-05, 4.309695214033127e-05, 4.8063695430755615e-05, 5.303043872117996e-05, 5.799718201160431e-05, 6.296392530202866e-05, 6.7930668592453e-05, 7.289741188287735e-05, 7.78641551733017e-05, 8.283089846372604e-05, 8.779764175415039e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 1.0, 8.0, 10.0, 13.0, 13.0, 25.0, 29.0, 49.0, 72.0, 158.0, 217.0, 460.0, 1212.0, 4239.0, 22864.0, 199395.0, 699413.0, 102155.0, 13565.0, 2848.0, 893.0, 407.0, 201.0, 121.0, 54.0, 40.0, 27.0, 16.0, 23.0, 4.0, 6.0, 3.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05560302734375, -0.053984642028808594, -0.05236625671386719, -0.05074787139892578, -0.049129486083984375, -0.04751110076904297, -0.04589271545410156, -0.044274330139160156, -0.04265594482421875, -0.041037559509277344, -0.03941917419433594, -0.03780078887939453, -0.036182403564453125, -0.03456401824951172, -0.03294563293457031, -0.031327247619628906, -0.0297088623046875, -0.028090476989746094, -0.026472091674804688, -0.02485370635986328, -0.023235321044921875, -0.02161693572998047, -0.019998550415039062, -0.018380165100097656, -0.01676177978515625, -0.015143394470214844, -0.013525009155273438, -0.011906623840332031, -0.010288238525390625, -0.008669853210449219, -0.0070514678955078125, -0.005433082580566406, -0.003814697265625, -0.0021963119506835938, -0.0005779266357421875, 0.0010404586791992188, 0.002658843994140625, 0.004277229309082031, 0.0058956146240234375, 0.007513999938964844, 0.00913238525390625, 0.010750770568847656, 0.012369155883789062, 0.013987541198730469, 0.015605926513671875, 0.01722431182861328, 0.018842697143554688, 0.020461082458496094, 0.0220794677734375, 0.023697853088378906, 0.025316238403320312, 0.02693462371826172, 0.028553009033203125, 0.03017139434814453, 0.03178977966308594, 0.033408164978027344, 0.03502655029296875, 0.036644935607910156, 0.03826332092285156, 0.03988170623779297, 0.041500091552734375, 0.04311847686767578, 0.04473686218261719, 0.046355247497558594, 0.0479736328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 8.0, 20.0, 24.0, 28.0, 53.0, 66.0, 99.0, 108.0, 150.0, 133.0, 82.0, 70.0, 48.0, 33.0, 28.0, 10.0, 8.0, 7.0, 13.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06072998046875, -0.059336185455322266, -0.05794239044189453, -0.0565485954284668, -0.05515480041503906, -0.05376100540161133, -0.052367210388183594, -0.05097341537475586, -0.049579620361328125, -0.04818582534790039, -0.046792030334472656, -0.04539823532104492, -0.04400444030761719, -0.04261064529418945, -0.04121685028076172, -0.039823055267333984, -0.03842926025390625, -0.037035465240478516, -0.03564167022705078, -0.03424787521362305, -0.03285408020019531, -0.03146028518676758, -0.030066490173339844, -0.02867269515991211, -0.027278900146484375, -0.02588510513305664, -0.024491310119628906, -0.023097515106201172, -0.021703720092773438, -0.020309925079345703, -0.01891613006591797, -0.017522335052490234, -0.0161285400390625, -0.014734745025634766, -0.013340950012207031, -0.011947154998779297, -0.010553359985351562, -0.009159564971923828, -0.007765769958496094, -0.006371974945068359, -0.004978179931640625, -0.0035843849182128906, -0.0021905899047851562, -0.0007967948913574219, 0.0005970001220703125, 0.001990795135498047, 0.0033845901489257812, 0.004778385162353516, 0.00617218017578125, 0.007565975189208984, 0.008959770202636719, 0.010353565216064453, 0.011747360229492188, 0.013141155242919922, 0.014534950256347656, 0.01592874526977539, 0.017322540283203125, 0.01871633529663086, 0.020110130310058594, 0.021503925323486328, 0.022897720336914062, 0.024291515350341797, 0.02568531036376953, 0.027079105377197266, 0.028472900390625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 12.0, 18.0, 30.0, 73.0, 141.0, 194.0, 203.0, 139.0, 91.0, 53.0, 25.0, 8.0, 12.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6264997720718384, -0.5996057987213135, -0.5727118849754333, -0.5458179116249084, -0.5189239978790283, -0.4920300245285034, -0.4651360809803009, -0.4382421374320984, -0.4113481640815735, -0.38445422053337097, -0.35756027698516846, -0.33066630363464355, -0.30377236008644104, -0.2768784165382385, -0.249984472990036, -0.2230905145406723, -0.19619658589363098, -0.16930264234542847, -0.14240868389606476, -0.11551474034786224, -0.08862078934907913, -0.06172683835029602, -0.034832894802093506, -0.007938936352729797, 0.018955007195472717, 0.04584895819425583, 0.07274290919303894, 0.09963685274124146, 0.12653079628944397, 0.15342475473880768, 0.1803186982870102, 0.2072126567363739, 0.23410660028457642, 0.26100054383277893, 0.28789448738098145, 0.31478846073150635, 0.34168240427970886, 0.3685763478279114, 0.3954702913761139, 0.4223642349243164, 0.4492582082748413, 0.4761521518230438, 0.5030460953712463, 0.5299400687217712, 0.5568339824676514, 0.5837279558181763, 0.6106219291687012, 0.6375158429145813, 0.6644097566604614, 0.6913037300109863, 0.7181976437568665, 0.7450916171073914, 0.7719855308532715, 0.7988795042037964, 0.8257734775543213, 0.8526673913002014, 0.8795613646507263, 0.9064553380012512, 0.9333492517471313, 0.9602432250976562, 0.9871371388435364, 1.014031171798706, 1.0409250259399414, 1.0678189992904663, 1.0947129726409912]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 6.0, 7.0, 3.0, 10.0, 4.0, 9.0, 11.0, 12.0, 14.0, 20.0, 24.0, 30.0, 26.0, 26.0, 25.0, 33.0, 48.0, 46.0, 43.0, 46.0, 54.0, 33.0, 54.0, 43.0, 39.0, 37.0, 40.0, 36.0, 34.0, 16.0, 35.0, 25.0, 21.0, 14.0, 18.0, 10.0, 15.0, 11.0, 11.0, 6.0, 0.0, 6.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.39657557010650635, -0.38302141427993774, -0.36946725845336914, -0.35591310262680054, -0.34235891699790955, -0.32880476117134094, -0.31525060534477234, -0.30169644951820374, -0.28814226388931274, -0.27458810806274414, -0.26103395223617554, -0.24747978150844574, -0.23392561078071594, -0.22037145495414734, -0.20681729912757874, -0.19326314330101013, -0.17970898747444153, -0.16615483164787292, -0.15260066092014313, -0.13904650509357452, -0.12549233436584473, -0.11193817853927612, -0.09838402271270752, -0.08482985943555832, -0.07127569615840912, -0.05772153288125992, -0.044167373329401016, -0.030613213777542114, -0.017059050500392914, -0.0035048872232437134, 0.01004926860332489, 0.02360343188047409, 0.03715759515762329, 0.05071175843477249, 0.06426592171192169, 0.0778200775384903, 0.0913742408156395, 0.1049284040927887, 0.1184825599193573, 0.1320367157459259, 0.1455908864736557, 0.1591450423002243, 0.1726992130279541, 0.1862533688545227, 0.1998075246810913, 0.2133616954088211, 0.2269158512353897, 0.2404700219631195, 0.2540241777896881, 0.2675783336162567, 0.2811324894428253, 0.2946866750717163, 0.3082408308982849, 0.3217949867248535, 0.3353491425514221, 0.3489032983779907, 0.3624574542045593, 0.37601161003112793, 0.38956576585769653, 0.40311992168426514, 0.41667410731315613, 0.43022826313972473, 0.44378241896629333, 0.45733657479286194, 0.47089076042175293]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 5.0, 4.0, 8.0, 7.0, 12.0, 10.0, 18.0, 21.0, 32.0, 38.0, 52.0, 87.0, 131.0, 226.0, 500.0, 1209.0, 3702.0, 16707.0, 223635.0, 3902691.0, 35267.0, 6461.0, 1915.0, 739.0, 324.0, 169.0, 94.0, 62.0, 38.0, 27.0, 21.0, 22.0, 11.0, 10.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.376953125, -0.3668174743652344, -0.35668182373046875, -0.3465461730957031, -0.3364105224609375, -0.3262748718261719, -0.31613922119140625, -0.3060035705566406, -0.295867919921875, -0.2857322692871094, -0.27559661865234375, -0.2654609680175781, -0.2553253173828125, -0.24518966674804688, -0.23505401611328125, -0.22491836547851562, -0.21478271484375, -0.20464706420898438, -0.19451141357421875, -0.18437576293945312, -0.1742401123046875, -0.16410446166992188, -0.15396881103515625, -0.14383316040039062, -0.133697509765625, -0.12356185913085938, -0.11342620849609375, -0.10329055786132812, -0.0931549072265625, -0.08301925659179688, -0.07288360595703125, -0.06274795532226562, -0.0526123046875, -0.042476654052734375, -0.03234100341796875, -0.022205352783203125, -0.0120697021484375, -0.001934051513671875, 0.00820159912109375, 0.018337249755859375, 0.028472900390625, 0.038608551025390625, 0.04874420166015625, 0.058879852294921875, 0.0690155029296875, 0.07915115356445312, 0.08928680419921875, 0.09942245483398438, 0.10955810546875, 0.11969375610351562, 0.12982940673828125, 0.13996505737304688, 0.1501007080078125, 0.16023635864257812, 0.17037200927734375, 0.18050765991210938, 0.190643310546875, 0.20077896118164062, 0.21091461181640625, 0.22105026245117188, 0.2311859130859375, 0.24132156372070312, 0.25145721435546875, 0.2615928649902344, 0.271728515625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 10.0, 19.0, 32.0, 35.0, 72.0, 60.0, 83.0, 90.0, 91.0, 118.0, 92.0, 83.0, 64.0, 47.0, 37.0, 21.0, 15.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07421875, -0.07248353958129883, -0.07074832916259766, -0.06901311874389648, -0.06727790832519531, -0.06554269790649414, -0.06380748748779297, -0.0620722770690918, -0.060337066650390625, -0.05860185623168945, -0.05686664581298828, -0.05513143539428711, -0.05339622497558594, -0.051661014556884766, -0.049925804138183594, -0.04819059371948242, -0.04645538330078125, -0.04472017288208008, -0.042984962463378906, -0.041249752044677734, -0.03951454162597656, -0.03777933120727539, -0.03604412078857422, -0.03430891036987305, -0.032573699951171875, -0.030838489532470703, -0.02910327911376953, -0.02736806869506836, -0.025632858276367188, -0.023897647857666016, -0.022162437438964844, -0.020427227020263672, -0.0186920166015625, -0.016956806182861328, -0.015221595764160156, -0.013486385345458984, -0.011751174926757812, -0.01001596450805664, -0.008280754089355469, -0.006545543670654297, -0.004810333251953125, -0.003075122833251953, -0.0013399124145507812, 0.0003952980041503906, 0.0021305084228515625, 0.0038657188415527344, 0.005600929260253906, 0.007336139678955078, 0.00907135009765625, 0.010806560516357422, 0.012541770935058594, 0.014276981353759766, 0.016012191772460938, 0.01774740219116211, 0.01948261260986328, 0.021217823028564453, 0.022953033447265625, 0.024688243865966797, 0.02642345428466797, 0.02815866470336914, 0.029893875122070312, 0.031629085540771484, 0.033364295959472656, 0.03509950637817383, 0.036834716796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 11.0, 13.0, 14.0, 16.0, 13.0, 16.0, 35.0, 39.0, 68.0, 89.0, 113.0, 171.0, 273.0, 458.0, 762.0, 1730.0, 5048.0, 22078.0, 250422.0, 3839568.0, 57593.0, 9992.0, 2931.0, 1132.0, 623.0, 322.0, 233.0, 146.0, 99.0, 71.0, 59.0, 39.0, 18.0, 24.0, 15.0, 10.0, 8.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2454833984375, -0.23831558227539062, -0.23114776611328125, -0.22397994995117188, -0.2168121337890625, -0.20964431762695312, -0.20247650146484375, -0.19530868530273438, -0.188140869140625, -0.18097305297851562, -0.17380523681640625, -0.16663742065429688, -0.1594696044921875, -0.15230178833007812, -0.14513397216796875, -0.13796615600585938, -0.13079833984375, -0.12363052368164062, -0.11646270751953125, -0.10929489135742188, -0.1021270751953125, -0.09495925903320312, -0.08779144287109375, -0.08062362670898438, -0.073455810546875, -0.06628799438476562, -0.05912017822265625, -0.051952362060546875, -0.0447845458984375, -0.037616729736328125, -0.03044891357421875, -0.023281097412109375, -0.01611328125, -0.008945465087890625, -0.00177764892578125, 0.005390167236328125, 0.0125579833984375, 0.019725799560546875, 0.02689361572265625, 0.034061431884765625, 0.041229248046875, 0.048397064208984375, 0.05556488037109375, 0.06273269653320312, 0.0699005126953125, 0.07706832885742188, 0.08423614501953125, 0.09140396118164062, 0.09857177734375, 0.10573959350585938, 0.11290740966796875, 0.12007522583007812, 0.1272430419921875, 0.13441085815429688, 0.14157867431640625, 0.14874649047851562, 0.155914306640625, 0.16308212280273438, 0.17024993896484375, 0.17741775512695312, 0.1845855712890625, 0.19175338745117188, 0.19892120361328125, 0.20608901977539062, 0.2132568359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 3.0, 17.0, 31.0, 55.0, 210.0, 2832.0, 691.0, 128.0, 46.0, 21.0, 15.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.16748046875, -0.16365814208984375, -0.1598358154296875, -0.15601348876953125, -0.152191162109375, -0.14836883544921875, -0.1445465087890625, -0.14072418212890625, -0.13690185546875, -0.13307952880859375, -0.1292572021484375, -0.12543487548828125, -0.121612548828125, -0.11779022216796875, -0.1139678955078125, -0.11014556884765625, -0.1063232421875, -0.10250091552734375, -0.0986785888671875, -0.09485626220703125, -0.091033935546875, -0.08721160888671875, -0.0833892822265625, -0.07956695556640625, -0.07574462890625, -0.07192230224609375, -0.0680999755859375, -0.06427764892578125, -0.060455322265625, -0.05663299560546875, -0.0528106689453125, -0.04898834228515625, -0.045166015625, -0.04134368896484375, -0.0375213623046875, -0.03369903564453125, -0.029876708984375, -0.02605438232421875, -0.0222320556640625, -0.01840972900390625, -0.01458740234375, -0.01076507568359375, -0.0069427490234375, -0.00312042236328125, 0.000701904296875, 0.00452423095703125, 0.0083465576171875, 0.01216888427734375, 0.0159912109375, 0.01981353759765625, 0.0236358642578125, 0.02745819091796875, 0.031280517578125, 0.03510284423828125, 0.0389251708984375, 0.04274749755859375, 0.04656982421875, 0.05039215087890625, 0.0542144775390625, 0.05803680419921875, 0.061859130859375, 0.06568145751953125, 0.0695037841796875, 0.07332611083984375, 0.0771484375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 6.0, 13.0, 73.0, 216.0, 349.0, 207.0, 77.0, 33.0, 13.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5794578194618225, -0.5591939687728882, -0.5389301180839539, -0.5186662673950195, -0.4984024167060852, -0.4781385660171509, -0.45787468552589417, -0.43761083483695984, -0.4173469841480255, -0.3970831334590912, -0.37681928277015686, -0.35655543208122253, -0.3362915515899658, -0.3160277009010315, -0.29576385021209717, -0.27549999952316284, -0.2552361488342285, -0.2349722981452942, -0.21470844745635986, -0.19444458186626434, -0.17418073117733002, -0.1539168804883957, -0.13365301489830017, -0.11338916420936584, -0.09312531352043152, -0.07286146283149719, -0.05259760469198227, -0.032333750277757645, -0.01206989586353302, 0.008193954825401306, 0.02845781296491623, 0.04872167110443115, 0.0689854621887207, 0.08924931287765503, 0.10951317101716995, 0.12977702915668488, 0.1500408798456192, 0.17030473053455353, 0.19056859612464905, 0.21083244681358337, 0.2310962975025177, 0.251360148191452, 0.27162399888038635, 0.2918878495693207, 0.3121517300605774, 0.3324155807495117, 0.35267943143844604, 0.37294328212738037, 0.3932071328163147, 0.413470983505249, 0.43373483419418335, 0.4539986848831177, 0.474262535572052, 0.49452638626098633, 0.5147902369499207, 0.535054087638855, 0.5553179979324341, 0.5755818486213684, 0.5958456993103027, 0.6161095499992371, 0.6363734006881714, 0.6566372513771057, 0.67690110206604, 0.6971650123596191, 0.7174288034439087]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 8.0, 27.0, 42.0, 56.0, 82.0, 92.0, 124.0, 150.0, 128.0, 92.0, 61.0, 60.0, 34.0, 13.0, 13.0, 9.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41549354791641235, -0.40273118019104004, -0.38996878266334534, -0.377206414937973, -0.3644440472126007, -0.351681649684906, -0.3389192819595337, -0.3261569142341614, -0.31339454650878906, -0.30063217878341675, -0.28786978125572205, -0.27510741353034973, -0.2623450458049774, -0.2495826631784439, -0.2368202805519104, -0.22405791282653809, -0.21129551529884338, -0.19853313267230988, -0.18577076494693756, -0.17300838232040405, -0.16024601459503174, -0.14748363196849823, -0.13472124934196472, -0.12195887416601181, -0.1091964989900589, -0.09643412381410599, -0.08367174863815308, -0.07090936601161957, -0.058146990835666656, -0.045384615659713745, -0.03262223303318024, -0.019859857857227325, -0.007097482681274414, 0.0056648943573236465, 0.018427271395921707, 0.031189650297164917, 0.04395202547311783, 0.05671440064907074, 0.06947678327560425, 0.08223915845155716, 0.09500153362751007, 0.10776390880346298, 0.1205262839794159, 0.1332886666059494, 0.1460510492324829, 0.15881341695785522, 0.17157579958438873, 0.18433818221092224, 0.19710054993629456, 0.20986293256282806, 0.22262530028820038, 0.2353876829147339, 0.2481500506401062, 0.2609124183654785, 0.2736748158931732, 0.28643718361854553, 0.29919958114624023, 0.31196194887161255, 0.32472434639930725, 0.33748671412467957, 0.3502490818500519, 0.3630114793777466, 0.3757738471031189, 0.3885362148284912, 0.4012985825538635]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 3.0, 7.0, 9.0, 8.0, 22.0, 28.0, 39.0, 75.0, 129.0, 253.0, 608.0, 1912.0, 10874.0, 195499.0, 786221.0, 46269.0, 4662.0, 1115.0, 391.0, 177.0, 91.0, 57.0, 39.0, 22.0, 16.0, 9.0, 4.0, 2.0, 5.0, 7.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.278076171875, -0.26788330078125, -0.2576904296875, -0.24749755859375, -0.2373046875, -0.22711181640625, -0.2169189453125, -0.20672607421875, -0.196533203125, -0.18634033203125, -0.1761474609375, -0.16595458984375, -0.15576171875, -0.14556884765625, -0.1353759765625, -0.12518310546875, -0.114990234375, -0.10479736328125, -0.0946044921875, -0.08441162109375, -0.07421875, -0.06402587890625, -0.0538330078125, -0.04364013671875, -0.033447265625, -0.02325439453125, -0.0130615234375, -0.00286865234375, 0.00732421875, 0.01751708984375, 0.0277099609375, 0.03790283203125, 0.048095703125, 0.05828857421875, 0.0684814453125, 0.07867431640625, 0.0888671875, 0.09906005859375, 0.1092529296875, 0.11944580078125, 0.129638671875, 0.13983154296875, 0.1500244140625, 0.16021728515625, 0.17041015625, 0.18060302734375, 0.1907958984375, 0.20098876953125, 0.211181640625, 0.22137451171875, 0.2315673828125, 0.24176025390625, 0.251953125, 0.26214599609375, 0.2723388671875, 0.28253173828125, 0.292724609375, 0.30291748046875, 0.3131103515625, 0.32330322265625, 0.33349609375, 0.34368896484375, 0.3538818359375, 0.36407470703125, 0.374267578125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 7.0, 22.0, 22.0, 30.0, 47.0, 50.0, 77.0, 91.0, 99.0, 107.0, 90.0, 95.0, 81.0, 50.0, 43.0, 31.0, 15.0, 10.0, 9.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07666015625, -0.07485246658325195, -0.0730447769165039, -0.07123708724975586, -0.06942939758300781, -0.06762170791625977, -0.06581401824951172, -0.06400632858276367, -0.062198638916015625, -0.06039094924926758, -0.05858325958251953, -0.056775569915771484, -0.05496788024902344, -0.05316019058227539, -0.051352500915527344, -0.0495448112487793, -0.04773712158203125, -0.0459294319152832, -0.044121742248535156, -0.04231405258178711, -0.04050636291503906, -0.038698673248291016, -0.03689098358154297, -0.03508329391479492, -0.033275604248046875, -0.03146791458129883, -0.02966022491455078, -0.027852535247802734, -0.026044845581054688, -0.02423715591430664, -0.022429466247558594, -0.020621776580810547, -0.0188140869140625, -0.017006397247314453, -0.015198707580566406, -0.01339101791381836, -0.011583328247070312, -0.009775638580322266, -0.007967948913574219, -0.006160259246826172, -0.004352569580078125, -0.002544879913330078, -0.0007371902465820312, 0.0010704994201660156, 0.0028781890869140625, 0.004685878753662109, 0.006493568420410156, 0.008301258087158203, 0.01010894775390625, 0.011916637420654297, 0.013724327087402344, 0.01553201675415039, 0.017339706420898438, 0.019147396087646484, 0.02095508575439453, 0.022762775421142578, 0.024570465087890625, 0.026378154754638672, 0.02818584442138672, 0.029993534088134766, 0.03180122375488281, 0.03360891342163086, 0.035416603088378906, 0.03722429275512695, 0.039031982421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 10.0, 13.0, 11.0, 12.0, 18.0, 45.0, 72.0, 100.0, 149.0, 233.0, 401.0, 692.0, 1269.0, 2487.0, 6500.0, 20806.0, 80945.0, 314351.0, 434009.0, 135832.0, 33377.0, 9703.0, 3644.0, 1577.0, 881.0, 495.0, 328.0, 203.0, 119.0, 91.0, 47.0, 43.0, 25.0, 11.0, 14.0, 11.0, 9.0, 6.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09027099609375, -0.0872802734375, -0.08428955078125, -0.081298828125, -0.07830810546875, -0.0753173828125, -0.07232666015625, -0.0693359375, -0.06634521484375, -0.0633544921875, -0.06036376953125, -0.057373046875, -0.05438232421875, -0.0513916015625, -0.04840087890625, -0.04541015625, -0.04241943359375, -0.0394287109375, -0.03643798828125, -0.033447265625, -0.03045654296875, -0.0274658203125, -0.02447509765625, -0.021484375, -0.01849365234375, -0.0155029296875, -0.01251220703125, -0.009521484375, -0.00653076171875, -0.0035400390625, -0.00054931640625, 0.00244140625, 0.00543212890625, 0.0084228515625, 0.01141357421875, 0.014404296875, 0.01739501953125, 0.0203857421875, 0.02337646484375, 0.0263671875, 0.02935791015625, 0.0323486328125, 0.03533935546875, 0.038330078125, 0.04132080078125, 0.0443115234375, 0.04730224609375, 0.05029296875, 0.05328369140625, 0.0562744140625, 0.05926513671875, 0.062255859375, 0.06524658203125, 0.0682373046875, 0.07122802734375, 0.07421875, 0.07720947265625, 0.0802001953125, 0.08319091796875, 0.086181640625, 0.08917236328125, 0.0921630859375, 0.09515380859375, 0.09814453125, 0.10113525390625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 5.0, 12.0, 21.0, 23.0, 30.0, 45.0, 41.0, 52.0, 49.0, 67.0, 70.0, 56.0, 50.0, 65.0, 56.0, 63.0, 56.0, 43.0, 45.0, 36.0, 26.0, 22.0, 16.0, 12.0, 15.0, 12.0, 2.0, 6.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1767578125, -0.1713695526123047, -0.16598129272460938, -0.16059303283691406, -0.15520477294921875, -0.14981651306152344, -0.14442825317382812, -0.1390399932861328, -0.1336517333984375, -0.1282634735107422, -0.12287521362304688, -0.11748695373535156, -0.11209869384765625, -0.10671043395996094, -0.10132217407226562, -0.09593391418457031, -0.090545654296875, -0.08515739440917969, -0.07976913452148438, -0.07438087463378906, -0.06899261474609375, -0.06360435485839844, -0.058216094970703125, -0.05282783508300781, -0.0474395751953125, -0.04205131530761719, -0.036663055419921875, -0.03127479553222656, -0.02588653564453125, -0.020498275756835938, -0.015110015869140625, -0.009721755981445312, -0.00433349609375, 0.0010547637939453125, 0.006443023681640625, 0.011831283569335938, 0.01721954345703125, 0.022607803344726562, 0.027996063232421875, 0.03338432312011719, 0.0387725830078125, 0.04416084289550781, 0.049549102783203125, 0.05493736267089844, 0.06032562255859375, 0.06571388244628906, 0.07110214233398438, 0.07649040222167969, 0.081878662109375, 0.08726692199707031, 0.09265518188476562, 0.09804344177246094, 0.10343170166015625, 0.10881996154785156, 0.11420822143554688, 0.11959648132324219, 0.1249847412109375, 0.1303730010986328, 0.13576126098632812, 0.14114952087402344, 0.14653778076171875, 0.15192604064941406, 0.15731430053710938, 0.1627025604248047, 0.1680908203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 7.0, 11.0, 24.0, 34.0, 81.0, 294.0, 1082.0, 19967.0, 991237.0, 34063.0, 1308.0, 253.0, 96.0, 35.0, 19.0, 12.0, 7.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1519775390625, -0.14646148681640625, -0.1409454345703125, -0.13542938232421875, -0.129913330078125, -0.12439727783203125, -0.1188812255859375, -0.11336517333984375, -0.10784912109375, -0.10233306884765625, -0.0968170166015625, -0.09130096435546875, -0.085784912109375, -0.08026885986328125, -0.0747528076171875, -0.06923675537109375, -0.063720703125, -0.05820465087890625, -0.0526885986328125, -0.04717254638671875, -0.041656494140625, -0.03614044189453125, -0.0306243896484375, -0.02510833740234375, -0.01959228515625, -0.01407623291015625, -0.0085601806640625, -0.00304412841796875, 0.002471923828125, 0.00798797607421875, 0.0135040283203125, 0.01902008056640625, 0.0245361328125, 0.03005218505859375, 0.0355682373046875, 0.04108428955078125, 0.046600341796875, 0.05211639404296875, 0.0576324462890625, 0.06314849853515625, 0.06866455078125, 0.07418060302734375, 0.0796966552734375, 0.08521270751953125, 0.090728759765625, 0.09624481201171875, 0.1017608642578125, 0.10727691650390625, 0.11279296875, 0.11830902099609375, 0.1238250732421875, 0.12934112548828125, 0.134857177734375, 0.14037322998046875, 0.1458892822265625, 0.15140533447265625, 0.15692138671875, 0.16243743896484375, 0.1679534912109375, 0.17346954345703125, 0.178985595703125, 0.18450164794921875, 0.1900177001953125, 0.19553375244140625, 0.2010498046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 12.0, 17.0, 22.0, 24.0, 28.0, 29.0, 38.0, 73.0, 67.0, 93.0, 95.0, 90.0, 91.0, 73.0, 51.0, 36.0, 33.0, 23.0, 29.0, 14.0, 12.0, 16.0, 5.0, 7.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.487701416015625e-05, -8.182041347026825e-05, -7.876381278038025e-05, -7.570721209049225e-05, -7.265061140060425e-05, -6.959401071071625e-05, -6.653741002082825e-05, -6.348080933094025e-05, -6.0424208641052246e-05, -5.7367607951164246e-05, -5.4311007261276245e-05, -5.1254406571388245e-05, -4.8197805881500244e-05, -4.5141205191612244e-05, -4.208460450172424e-05, -3.902800381183624e-05, -3.597140312194824e-05, -3.291480243206024e-05, -2.985820174217224e-05, -2.680160105228424e-05, -2.374500036239624e-05, -2.068839967250824e-05, -1.763179898262024e-05, -1.4575198292732239e-05, -1.1518597602844238e-05, -8.461996912956238e-06, -5.405396223068237e-06, -2.348795533180237e-06, 7.078051567077637e-07, 3.764405846595764e-06, 6.821006536483765e-06, 9.877607226371765e-06, 1.2934207916259766e-05, 1.5990808606147766e-05, 1.9047409296035767e-05, 2.2104009985923767e-05, 2.5160610675811768e-05, 2.8217211365699768e-05, 3.127381205558777e-05, 3.433041274547577e-05, 3.738701343536377e-05, 4.044361412525177e-05, 4.350021481513977e-05, 4.655681550502777e-05, 4.961341619491577e-05, 5.267001688480377e-05, 5.572661757469177e-05, 5.878321826457977e-05, 6.183981895446777e-05, 6.489641964435577e-05, 6.795302033424377e-05, 7.100962102413177e-05, 7.406622171401978e-05, 7.712282240390778e-05, 8.017942309379578e-05, 8.323602378368378e-05, 8.629262447357178e-05, 8.934922516345978e-05, 9.240582585334778e-05, 9.546242654323578e-05, 9.851902723312378e-05, 0.00010157562792301178, 0.00010463222861289978, 0.00010768882930278778, 0.00011074542999267578]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 9.0, 6.0, 8.0, 17.0, 17.0, 40.0, 58.0, 105.0, 219.0, 679.0, 4414.0, 248727.0, 783095.0, 9590.0, 1008.0, 246.0, 105.0, 65.0, 49.0, 33.0, 22.0, 21.0, 7.0, 9.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1864013671875, -0.18109703063964844, -0.17579269409179688, -0.1704883575439453, -0.16518402099609375, -0.1598796844482422, -0.15457534790039062, -0.14927101135253906, -0.1439666748046875, -0.13866233825683594, -0.13335800170898438, -0.1280536651611328, -0.12274932861328125, -0.11744499206542969, -0.11214065551757812, -0.10683631896972656, -0.101531982421875, -0.09622764587402344, -0.09092330932617188, -0.08561897277832031, -0.08031463623046875, -0.07501029968261719, -0.06970596313476562, -0.06440162658691406, -0.0590972900390625, -0.05379295349121094, -0.048488616943359375, -0.04318428039550781, -0.03787994384765625, -0.03257560729980469, -0.027271270751953125, -0.021966934204101562, -0.01666259765625, -0.011358261108398438, -0.006053924560546875, -0.0007495880126953125, 0.00455474853515625, 0.009859085083007812, 0.015163421630859375, 0.020467758178710938, 0.0257720947265625, 0.031076431274414062, 0.036380767822265625, 0.04168510437011719, 0.04698944091796875, 0.05229377746582031, 0.057598114013671875, 0.06290245056152344, 0.068206787109375, 0.07351112365722656, 0.07881546020507812, 0.08411979675292969, 0.08942413330078125, 0.09472846984863281, 0.10003280639648438, 0.10533714294433594, 0.1106414794921875, 0.11594581604003906, 0.12125015258789062, 0.1265544891357422, 0.13185882568359375, 0.1371631622314453, 0.14246749877929688, 0.14777183532714844, 0.153076171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 12.0, 22.0, 38.0, 52.0, 154.0, 211.0, 207.0, 151.0, 70.0, 37.0, 26.0, 10.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05572509765625, -0.051733970642089844, -0.04774284362792969, -0.04375171661376953, -0.039760589599609375, -0.03576946258544922, -0.03177833557128906, -0.027787208557128906, -0.02379608154296875, -0.019804954528808594, -0.015813827514648438, -0.011822700500488281, -0.007831573486328125, -0.0038404464721679688, 0.0001506805419921875, 0.004141807556152344, 0.0081329345703125, 0.012124061584472656, 0.016115188598632812, 0.02010631561279297, 0.024097442626953125, 0.02808856964111328, 0.03207969665527344, 0.036070823669433594, 0.04006195068359375, 0.044053077697753906, 0.04804420471191406, 0.05203533172607422, 0.056026458740234375, 0.06001758575439453, 0.06400871276855469, 0.06799983978271484, 0.071990966796875, 0.07598209381103516, 0.07997322082519531, 0.08396434783935547, 0.08795547485351562, 0.09194660186767578, 0.09593772888183594, 0.0999288558959961, 0.10391998291015625, 0.1079111099243164, 0.11190223693847656, 0.11589336395263672, 0.11988449096679688, 0.12387561798095703, 0.1278667449951172, 0.13185787200927734, 0.1358489990234375, 0.13984012603759766, 0.1438312530517578, 0.14782238006591797, 0.15181350708007812, 0.15580463409423828, 0.15979576110839844, 0.1637868881225586, 0.16777801513671875, 0.1717691421508789, 0.17576026916503906, 0.17975139617919922, 0.18374252319335938, 0.18773365020751953, 0.1917247772216797, 0.19571590423583984, 0.19970703125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 18.0, 66.0, 342.0, 470.0, 102.0, 9.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8843941688537598, -1.7805275917053223, -1.6766610145568848, -1.5727945566177368, -1.4689279794692993, -1.3650614023208618, -1.2611949443817139, -1.1573283672332764, -1.0534617900848389, -0.9495952129364014, -0.8457286953926086, -0.7418621778488159, -0.6379956007003784, -0.5341290235519409, -0.4302625060081482, -0.32639598846435547, -0.22252941131591797, -0.11866286396980286, -0.014796316623687744, 0.08907023072242737, 0.19293677806854248, 0.29680335521698, 0.4006698727607727, 0.5045363903045654, 0.6084029674530029, 0.7122695446014404, 0.8161360621452332, 0.9200025796890259, 1.0238691568374634, 1.1277357339859009, 1.2316021919250488, 1.3354687690734863, 1.4393353462219238, 1.5432019233703613, 1.6470685005187988, 1.7509349584579468, 1.8548015356063843, 1.9586681127548218, 2.0625345706939697, 2.1664011478424072, 2.2702677249908447, 2.3741343021392822, 2.4780008792877197, 2.5818674564361572, 2.6857337951660156, 2.789600372314453, 2.8934669494628906, 2.997333526611328, 3.1012001037597656, 3.205066680908203, 3.3089332580566406, 3.412799835205078, 3.5166664123535156, 3.620532989501953, 3.7243993282318115, 3.828265905380249, 3.9321324825286865, 4.035998821258545, 4.139865398406982, 4.24373197555542, 4.347598552703857, 4.451465129852295, 4.555331707000732, 4.65919828414917, 4.763064861297607]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 8.0, 6.0, 6.0, 5.0, 13.0, 11.0, 9.0, 16.0, 23.0, 25.0, 16.0, 28.0, 35.0, 33.0, 21.0, 29.0, 47.0, 41.0, 48.0, 54.0, 52.0, 43.0, 48.0, 51.0, 41.0, 44.0, 34.0, 27.0, 37.0, 23.0, 21.0, 23.0, 21.0, 8.0, 18.0, 9.0, 8.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6521785259246826, -0.6306167244911194, -0.6090549230575562, -0.5874930620193481, -0.5659312605857849, -0.5443694591522217, -0.5228076577186584, -0.5012458562850952, -0.4796840250492096, -0.45812222361564636, -0.43656039237976074, -0.4149985909461975, -0.3934367895126343, -0.37187495827674866, -0.3503131568431854, -0.3287513256072998, -0.3071895241737366, -0.28562772274017334, -0.2640658915042877, -0.2425040900707245, -0.22094227373600006, -0.19938045740127563, -0.1778186559677124, -0.15625683963298798, -0.13469502329826355, -0.11313320696353912, -0.0915713980793953, -0.07000958919525146, -0.04844777286052704, -0.026885956525802612, -0.00532415509223938, 0.016237661242485046, 0.0377994179725647, 0.059361230581998825, 0.08092304319143295, 0.10248485207557678, 0.12404666841030121, 0.14560848474502563, 0.16717028617858887, 0.1887321025133133, 0.21029391884803772, 0.23185573518276215, 0.2534175515174866, 0.2749793529510498, 0.29654115438461304, 0.31810298562049866, 0.3396647870540619, 0.3612266182899475, 0.38278841972351074, 0.404350221157074, 0.4259120523929596, 0.4474738538265228, 0.46903568506240845, 0.4905974864959717, 0.5121592879295349, 0.5337210893630981, 0.5552829504013062, 0.5768447518348694, 0.5984065532684326, 0.6199684143066406, 0.6415302157402039, 0.6630920171737671, 0.6846538186073303, 0.7062156200408936, 0.7277774214744568]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 6.0, 4.0, 12.0, 15.0, 16.0, 19.0, 41.0, 38.0, 72.0, 135.0, 242.0, 544.0, 1629.0, 7588.0, 115379.0, 4022124.0, 39823.0, 4593.0, 1166.0, 421.0, 166.0, 98.0, 45.0, 37.0, 23.0, 19.0, 13.0, 3.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.52197265625, -0.5096435546875, -0.497314453125, -0.4849853515625, -0.47265625, -0.4603271484375, -0.447998046875, -0.4356689453125, -0.42333984375, -0.4110107421875, -0.398681640625, -0.3863525390625, -0.3740234375, -0.3616943359375, -0.349365234375, -0.3370361328125, -0.32470703125, -0.3123779296875, -0.300048828125, -0.2877197265625, -0.275390625, -0.2630615234375, -0.250732421875, -0.2384033203125, -0.22607421875, -0.2137451171875, -0.201416015625, -0.1890869140625, -0.1767578125, -0.1644287109375, -0.152099609375, -0.1397705078125, -0.12744140625, -0.1151123046875, -0.102783203125, -0.0904541015625, -0.078125, -0.0657958984375, -0.053466796875, -0.0411376953125, -0.02880859375, -0.0164794921875, -0.004150390625, 0.0081787109375, 0.0205078125, 0.0328369140625, 0.045166015625, 0.0574951171875, 0.06982421875, 0.0821533203125, 0.094482421875, 0.1068115234375, 0.119140625, 0.1314697265625, 0.143798828125, 0.1561279296875, 0.16845703125, 0.1807861328125, 0.193115234375, 0.2054443359375, 0.2177734375, 0.2301025390625, 0.242431640625, 0.2547607421875, 0.26708984375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 16.0, 20.0, 21.0, 31.0, 37.0, 49.0, 63.0, 79.0, 84.0, 88.0, 68.0, 80.0, 88.0, 57.0, 58.0, 38.0, 28.0, 31.0, 17.0, 13.0, 12.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07220458984375, -0.0704503059387207, -0.0686960220336914, -0.06694173812866211, -0.06518745422363281, -0.06343317031860352, -0.06167888641357422, -0.05992460250854492, -0.058170318603515625, -0.05641603469848633, -0.05466175079345703, -0.052907466888427734, -0.05115318298339844, -0.04939889907836914, -0.047644615173339844, -0.04589033126831055, -0.04413604736328125, -0.04238176345825195, -0.040627479553222656, -0.03887319564819336, -0.03711891174316406, -0.035364627838134766, -0.03361034393310547, -0.03185606002807617, -0.030101776123046875, -0.028347492218017578, -0.02659320831298828, -0.024838924407958984, -0.023084640502929688, -0.02133035659790039, -0.019576072692871094, -0.017821788787841797, -0.0160675048828125, -0.014313220977783203, -0.012558937072753906, -0.01080465316772461, -0.009050369262695312, -0.007296085357666016, -0.005541801452636719, -0.003787517547607422, -0.002033233642578125, -0.0002789497375488281, 0.0014753341674804688, 0.0032296180725097656, 0.0049839019775390625, 0.006738185882568359, 0.008492469787597656, 0.010246753692626953, 0.01200103759765625, 0.013755321502685547, 0.015509605407714844, 0.01726388931274414, 0.019018173217773438, 0.020772457122802734, 0.02252674102783203, 0.024281024932861328, 0.026035308837890625, 0.027789592742919922, 0.02954387664794922, 0.031298160552978516, 0.03305244445800781, 0.03480672836303711, 0.036561012268066406, 0.0383152961730957, 0.040069580078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 12.0, 12.0, 16.0, 23.0, 39.0, 42.0, 102.0, 116.0, 186.0, 362.0, 571.0, 1092.0, 2245.0, 6568.0, 25152.0, 229583.0, 3796117.0, 106941.0, 16448.0, 4673.0, 1854.0, 886.0, 432.0, 306.0, 155.0, 122.0, 65.0, 39.0, 49.0, 22.0, 18.0, 9.0, 9.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.1354236602783203, -0.12936782836914062, -0.12331199645996094, -0.11725616455078125, -0.11120033264160156, -0.10514450073242188, -0.09908866882324219, -0.0930328369140625, -0.08697700500488281, -0.08092117309570312, -0.07486534118652344, -0.06880950927734375, -0.06275367736816406, -0.056697845458984375, -0.05064201354980469, -0.044586181640625, -0.03853034973144531, -0.032474517822265625, -0.026418685913085938, -0.02036285400390625, -0.014307022094726562, -0.008251190185546875, -0.0021953582763671875, 0.0038604736328125, 0.009916305541992188, 0.015972137451171875, 0.022027969360351562, 0.02808380126953125, 0.03413963317871094, 0.040195465087890625, 0.04625129699707031, 0.05230712890625, 0.05836296081542969, 0.06441879272460938, 0.07047462463378906, 0.07653045654296875, 0.08258628845214844, 0.08864212036132812, 0.09469795227050781, 0.1007537841796875, 0.10680961608886719, 0.11286544799804688, 0.11892127990722656, 0.12497711181640625, 0.13103294372558594, 0.13708877563476562, 0.1431446075439453, 0.149200439453125, 0.1552562713623047, 0.16131210327148438, 0.16736793518066406, 0.17342376708984375, 0.17947959899902344, 0.18553543090820312, 0.1915912628173828, 0.1976470947265625, 0.2037029266357422, 0.20975875854492188, 0.21581459045410156, 0.22187042236328125, 0.22792625427246094, 0.23398208618164062, 0.2400379180908203, 0.24609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 11.0, 10.0, 30.0, 48.0, 136.0, 563.0, 2794.0, 298.0, 90.0, 40.0, 21.0, 16.0, 10.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.141845703125, -0.1370067596435547, -0.13216781616210938, -0.12732887268066406, -0.12248992919921875, -0.11765098571777344, -0.11281204223632812, -0.10797309875488281, -0.1031341552734375, -0.09829521179199219, -0.09345626831054688, -0.08861732482910156, -0.08377838134765625, -0.07893943786621094, -0.07410049438476562, -0.06926155090332031, -0.064422607421875, -0.05958366394042969, -0.054744720458984375, -0.04990577697753906, -0.04506683349609375, -0.04022789001464844, -0.035388946533203125, -0.030550003051757812, -0.0257110595703125, -0.020872116088867188, -0.016033172607421875, -0.011194229125976562, -0.00635528564453125, -0.0015163421630859375, 0.003322601318359375, 0.008161544799804688, 0.01300048828125, 0.017839431762695312, 0.022678375244140625, 0.027517318725585938, 0.03235626220703125, 0.03719520568847656, 0.042034149169921875, 0.04687309265136719, 0.0517120361328125, 0.05655097961425781, 0.061389923095703125, 0.06622886657714844, 0.07106781005859375, 0.07590675354003906, 0.08074569702148438, 0.08558464050292969, 0.090423583984375, 0.09526252746582031, 0.10010147094726562, 0.10494041442871094, 0.10977935791015625, 0.11461830139160156, 0.11945724487304688, 0.12429618835449219, 0.1291351318359375, 0.1339740753173828, 0.13881301879882812, 0.14365196228027344, 0.14849090576171875, 0.15332984924316406, 0.15816879272460938, 0.1630077362060547, 0.1678466796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 12.0, 40.0, 104.0, 239.0, 280.0, 186.0, 77.0, 28.0, 15.0, 4.0, 7.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6228259205818176, -0.5980949401855469, -0.5733639001846313, -0.5486329197883606, -0.5239018797874451, -0.49917086958885193, -0.4744398593902588, -0.44970887899398804, -0.4249778389930725, -0.40024682879447937, -0.37551581859588623, -0.3507848083972931, -0.32605379819869995, -0.3013227880001068, -0.27659177780151367, -0.2518607974052429, -0.22712978720664978, -0.20239877700805664, -0.1776677668094635, -0.15293675661087036, -0.12820574641227722, -0.10347474366426468, -0.07874374091625214, -0.054012730717659, -0.029281720519065857, -0.0045507121831178665, 0.020180296152830124, 0.044911302626132965, 0.0696423128247261, 0.09437332302331924, 0.11910432577133179, 0.14383533596992493, 0.16856634616851807, 0.1932973563671112, 0.21802836656570435, 0.24275937676429749, 0.2674903869628906, 0.29222139716148376, 0.3169524073600769, 0.34168338775634766, 0.3664144277572632, 0.3911454379558563, 0.41587644815444946, 0.4406074583530426, 0.46533846855163574, 0.4900694787502289, 0.514800488948822, 0.5395314693450928, 0.5642625093460083, 0.588993489742279, 0.6137245297431946, 0.6384555101394653, 0.6631865501403809, 0.6879175305366516, 0.7126485705375671, 0.7373795509338379, 0.7621105313301086, 0.7868415117263794, 0.8115725517272949, 0.8363035321235657, 0.8610345721244812, 0.885765552520752, 0.9104965925216675, 0.9352275729179382, 0.9599586129188538]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 6.0, 15.0, 16.0, 20.0, 23.0, 32.0, 26.0, 46.0, 29.0, 40.0, 50.0, 55.0, 48.0, 59.0, 46.0, 58.0, 62.0, 48.0, 56.0, 48.0, 34.0, 31.0, 18.0, 31.0, 18.0, 14.0, 14.0, 9.0, 12.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3234723210334778, -0.3147957921028137, -0.30611926317214966, -0.2974427342414856, -0.28876620531082153, -0.28008967638015747, -0.2714131474494934, -0.26273661851882935, -0.2540600895881653, -0.24538356065750122, -0.23670703172683716, -0.2280305027961731, -0.21935397386550903, -0.21067744493484497, -0.2020009160041809, -0.19332438707351685, -0.18464787304401398, -0.17597134411334991, -0.16729481518268585, -0.1586182862520218, -0.14994175732135773, -0.14126522839069366, -0.1325887143611908, -0.12391217797994614, -0.11523564904928207, -0.10655912011861801, -0.09788259118795395, -0.08920606970787048, -0.08052954077720642, -0.07185301184654236, -0.0631764829158783, -0.05449995398521423, -0.04582342505455017, -0.03714689612388611, -0.028470369055867195, -0.019793841987848282, -0.01111731305718422, -0.002440784126520157, 0.006235741078853607, 0.01491227000951767, 0.023588798940181732, 0.032265327870845795, 0.04094185680150986, 0.04961838200688362, 0.058294910937547684, 0.06697143614292145, 0.07564796507358551, 0.08432449400424957, 0.09300102293491364, 0.1016775518655777, 0.11035408079624176, 0.11903060972690582, 0.12770713865756989, 0.13638366758823395, 0.14506018161773682, 0.15373671054840088, 0.16241323947906494, 0.171089768409729, 0.17976629734039307, 0.18844282627105713, 0.1971193552017212, 0.20579588413238525, 0.21447241306304932, 0.22314894199371338, 0.23182547092437744]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 6.0, 6.0, 15.0, 11.0, 19.0, 47.0, 54.0, 90.0, 117.0, 236.0, 480.0, 1452.0, 6006.0, 40816.0, 439428.0, 501621.0, 48431.0, 6893.0, 1621.0, 589.0, 236.0, 132.0, 82.0, 47.0, 27.0, 27.0, 12.0, 12.0, 9.0, 9.0, 5.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2734375, -0.2658500671386719, -0.25826263427734375, -0.2506752014160156, -0.2430877685546875, -0.23550033569335938, -0.22791290283203125, -0.22032546997070312, -0.212738037109375, -0.20515060424804688, -0.19756317138671875, -0.18997573852539062, -0.1823883056640625, -0.17480087280273438, -0.16721343994140625, -0.15962600708007812, -0.15203857421875, -0.14445114135742188, -0.13686370849609375, -0.12927627563476562, -0.1216888427734375, -0.11410140991210938, -0.10651397705078125, -0.09892654418945312, -0.091339111328125, -0.08375167846679688, -0.07616424560546875, -0.06857681274414062, -0.0609893798828125, -0.053401947021484375, -0.04581451416015625, -0.038227081298828125, -0.0306396484375, -0.023052215576171875, -0.01546478271484375, -0.007877349853515625, -0.0002899169921875, 0.007297515869140625, 0.01488494873046875, 0.022472381591796875, 0.030059814453125, 0.037647247314453125, 0.04523468017578125, 0.052822113037109375, 0.0604095458984375, 0.06799697875976562, 0.07558441162109375, 0.08317184448242188, 0.09075927734375, 0.09834671020507812, 0.10593414306640625, 0.11352157592773438, 0.1211090087890625, 0.12869644165039062, 0.13628387451171875, 0.14387130737304688, 0.151458740234375, 0.15904617309570312, 0.16663360595703125, 0.17422103881835938, 0.1818084716796875, 0.18939590454101562, 0.19698333740234375, 0.20457077026367188, 0.212158203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 6.0, 23.0, 14.0, 35.0, 34.0, 41.0, 48.0, 65.0, 97.0, 91.0, 74.0, 87.0, 80.0, 77.0, 41.0, 50.0, 40.0, 23.0, 17.0, 14.0, 12.0, 6.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07720947265625, -0.07529830932617188, -0.07338714599609375, -0.07147598266601562, -0.0695648193359375, -0.06765365600585938, -0.06574249267578125, -0.06383132934570312, -0.061920166015625, -0.060009002685546875, -0.05809783935546875, -0.056186676025390625, -0.0542755126953125, -0.052364349365234375, -0.05045318603515625, -0.048542022705078125, -0.046630859375, -0.044719696044921875, -0.04280853271484375, -0.040897369384765625, -0.0389862060546875, -0.037075042724609375, -0.03516387939453125, -0.033252716064453125, -0.031341552734375, -0.029430389404296875, -0.02751922607421875, -0.025608062744140625, -0.0236968994140625, -0.021785736083984375, -0.01987457275390625, -0.017963409423828125, -0.01605224609375, -0.014141082763671875, -0.01222991943359375, -0.010318756103515625, -0.0084075927734375, -0.006496429443359375, -0.00458526611328125, -0.002674102783203125, -0.000762939453125, 0.001148223876953125, 0.00305938720703125, 0.004970550537109375, 0.0068817138671875, 0.008792877197265625, 0.01070404052734375, 0.012615203857421875, 0.0145263671875, 0.016437530517578125, 0.01834869384765625, 0.020259857177734375, 0.0221710205078125, 0.024082183837890625, 0.02599334716796875, 0.027904510498046875, 0.029815673828125, 0.031726837158203125, 0.03363800048828125, 0.035549163818359375, 0.0374603271484375, 0.039371490478515625, 0.04128265380859375, 0.043193817138671875, 0.04510498046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 11.0, 8.0, 20.0, 28.0, 19.0, 34.0, 47.0, 80.0, 90.0, 137.0, 209.0, 329.0, 519.0, 825.0, 1327.0, 2502.0, 4776.0, 10077.0, 24008.0, 62932.0, 181052.0, 375399.0, 242295.0, 84924.0, 31194.0, 12743.0, 5899.0, 2873.0, 1568.0, 895.0, 542.0, 370.0, 235.0, 156.0, 118.0, 84.0, 58.0, 44.0, 29.0, 20.0, 16.0, 9.0, 9.0, 10.0, 5.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.08197021484375, -0.07938003540039062, -0.07678985595703125, -0.07419967651367188, -0.0716094970703125, -0.06901931762695312, -0.06642913818359375, -0.06383895874023438, -0.061248779296875, -0.058658599853515625, -0.05606842041015625, -0.053478240966796875, -0.0508880615234375, -0.048297882080078125, -0.04570770263671875, -0.043117523193359375, -0.04052734375, -0.037937164306640625, -0.03534698486328125, -0.032756805419921875, -0.0301666259765625, -0.027576446533203125, -0.02498626708984375, -0.022396087646484375, -0.019805908203125, -0.017215728759765625, -0.01462554931640625, -0.012035369873046875, -0.0094451904296875, -0.006855010986328125, -0.00426483154296875, -0.001674652099609375, 0.00091552734375, 0.003505706787109375, 0.00609588623046875, 0.008686065673828125, 0.0112762451171875, 0.013866424560546875, 0.01645660400390625, 0.019046783447265625, 0.021636962890625, 0.024227142333984375, 0.02681732177734375, 0.029407501220703125, 0.0319976806640625, 0.034587860107421875, 0.03717803955078125, 0.039768218994140625, 0.0423583984375, 0.044948577880859375, 0.04753875732421875, 0.050128936767578125, 0.0527191162109375, 0.055309295654296875, 0.05789947509765625, 0.060489654541015625, 0.063079833984375, 0.06567001342773438, 0.06826019287109375, 0.07085037231445312, 0.0734405517578125, 0.07603073120117188, 0.07862091064453125, 0.08121109008789062, 0.08380126953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 11.0, 8.0, 10.0, 22.0, 13.0, 28.0, 17.0, 28.0, 30.0, 37.0, 50.0, 40.0, 34.0, 47.0, 46.0, 47.0, 40.0, 54.0, 63.0, 44.0, 55.0, 41.0, 43.0, 30.0, 30.0, 17.0, 22.0, 20.0, 10.0, 12.0, 10.0, 11.0, 6.0, 10.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.191650390625, -0.18595504760742188, -0.18025970458984375, -0.17456436157226562, -0.1688690185546875, -0.16317367553710938, -0.15747833251953125, -0.15178298950195312, -0.146087646484375, -0.14039230346679688, -0.13469696044921875, -0.12900161743164062, -0.1233062744140625, -0.11761093139648438, -0.11191558837890625, -0.10622024536132812, -0.10052490234375, -0.09482955932617188, -0.08913421630859375, -0.08343887329101562, -0.0777435302734375, -0.07204818725585938, -0.06635284423828125, -0.060657501220703125, -0.054962158203125, -0.049266815185546875, -0.04357147216796875, -0.037876129150390625, -0.0321807861328125, -0.026485443115234375, -0.02079010009765625, -0.015094757080078125, -0.0093994140625, -0.003704071044921875, 0.00199127197265625, 0.007686614990234375, 0.0133819580078125, 0.019077301025390625, 0.02477264404296875, 0.030467987060546875, 0.036163330078125, 0.041858673095703125, 0.04755401611328125, 0.053249359130859375, 0.0589447021484375, 0.06464004516601562, 0.07033538818359375, 0.07603073120117188, 0.08172607421875, 0.08742141723632812, 0.09311676025390625, 0.09881210327148438, 0.1045074462890625, 0.11020278930664062, 0.11589813232421875, 0.12159347534179688, 0.127288818359375, 0.13298416137695312, 0.13867950439453125, 0.14437484741210938, 0.1500701904296875, 0.15576553344726562, 0.16146087646484375, 0.16715621948242188, 0.1728515625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 1.0, 8.0, 21.0, 30.0, 32.0, 54.0, 97.0, 189.0, 416.0, 1088.0, 4448.0, 37676.0, 643532.0, 337461.0, 18964.0, 2918.0, 877.0, 336.0, 175.0, 90.0, 45.0, 29.0, 25.0, 14.0, 7.0, 6.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12188720703125, -0.11839103698730469, -0.11489486694335938, -0.11139869689941406, -0.10790252685546875, -0.10440635681152344, -0.10091018676757812, -0.09741401672363281, -0.0939178466796875, -0.09042167663574219, -0.08692550659179688, -0.08342933654785156, -0.07993316650390625, -0.07643699645996094, -0.07294082641601562, -0.06944465637207031, -0.065948486328125, -0.06245231628417969, -0.058956146240234375, -0.05545997619628906, -0.05196380615234375, -0.04846763610839844, -0.044971466064453125, -0.04147529602050781, -0.0379791259765625, -0.03448295593261719, -0.030986785888671875, -0.027490615844726562, -0.02399444580078125, -0.020498275756835938, -0.017002105712890625, -0.013505935668945312, -0.010009765625, -0.0065135955810546875, -0.003017425537109375, 0.0004787445068359375, 0.00397491455078125, 0.0074710845947265625, 0.010967254638671875, 0.014463424682617188, 0.0179595947265625, 0.021455764770507812, 0.024951934814453125, 0.028448104858398438, 0.03194427490234375, 0.03544044494628906, 0.038936614990234375, 0.04243278503417969, 0.045928955078125, 0.04942512512207031, 0.052921295166015625, 0.05641746520996094, 0.05991363525390625, 0.06340980529785156, 0.06690597534179688, 0.07040214538574219, 0.0738983154296875, 0.07739448547363281, 0.08089065551757812, 0.08438682556152344, 0.08788299560546875, 0.09137916564941406, 0.09487533569335938, 0.09837150573730469, 0.10186767578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 8.0, 6.0, 13.0, 18.0, 13.0, 30.0, 46.0, 39.0, 62.0, 79.0, 103.0, 109.0, 101.0, 92.0, 69.0, 43.0, 45.0, 31.0, 19.0, 14.0, 13.0, 9.0, 9.0, 8.0, 9.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.322166442871094e-05, -8.89357179403305e-05, -8.464977145195007e-05, -8.036382496356964e-05, -7.607787847518921e-05, -7.179193198680878e-05, -6.750598549842834e-05, -6.322003901004791e-05, -5.893409252166748e-05, -5.464814603328705e-05, -5.0362199544906616e-05, -4.6076253056526184e-05, -4.179030656814575e-05, -3.750436007976532e-05, -3.321841359138489e-05, -2.8932467103004456e-05, -2.4646520614624023e-05, -2.036057412624359e-05, -1.607462763786316e-05, -1.1788681149482727e-05, -7.502734661102295e-06, -3.216788172721863e-06, 1.0691583156585693e-06, 5.3551048040390015e-06, 9.641051292419434e-06, 1.3926997780799866e-05, 1.8212944269180298e-05, 2.249889075756073e-05, 2.6784837245941162e-05, 3.1070783734321594e-05, 3.5356730222702026e-05, 3.964267671108246e-05, 4.392862319946289e-05, 4.821456968784332e-05, 5.2500516176223755e-05, 5.678646266460419e-05, 6.107240915298462e-05, 6.535835564136505e-05, 6.964430212974548e-05, 7.393024861812592e-05, 7.821619510650635e-05, 8.250214159488678e-05, 8.678808808326721e-05, 9.107403457164764e-05, 9.535998106002808e-05, 9.964592754840851e-05, 0.00010393187403678894, 0.00010821782052516937, 0.0001125037670135498, 0.00011678971350193024, 0.00012107565999031067, 0.0001253616064786911, 0.00012964755296707153, 0.00013393349945545197, 0.0001382194459438324, 0.00014250539243221283, 0.00014679133892059326, 0.0001510772854089737, 0.00015536323189735413, 0.00015964917838573456, 0.000163935124874115, 0.00016822107136249542, 0.00017250701785087585, 0.0001767929643392563, 0.00018107891082763672]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 12.0, 23.0, 28.0, 50.0, 69.0, 106.0, 176.0, 331.0, 520.0, 1137.0, 2853.0, 11007.0, 72106.0, 533509.0, 371051.0, 43537.0, 7632.0, 2246.0, 955.0, 483.0, 245.0, 149.0, 109.0, 69.0, 42.0, 31.0, 12.0, 16.0, 4.0, 6.0, 8.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.06531906127929688, -0.06288909912109375, -0.060459136962890625, -0.0580291748046875, -0.055599212646484375, -0.05316925048828125, -0.050739288330078125, -0.048309326171875, -0.045879364013671875, -0.04344940185546875, -0.041019439697265625, -0.0385894775390625, -0.036159515380859375, -0.03372955322265625, -0.031299591064453125, -0.02886962890625, -0.026439666748046875, -0.02400970458984375, -0.021579742431640625, -0.0191497802734375, -0.016719818115234375, -0.01428985595703125, -0.011859893798828125, -0.009429931640625, -0.006999969482421875, -0.00457000732421875, -0.002140045166015625, 0.0002899169921875, 0.002719879150390625, 0.00514984130859375, 0.007579803466796875, 0.010009765625, 0.012439727783203125, 0.01486968994140625, 0.017299652099609375, 0.0197296142578125, 0.022159576416015625, 0.02458953857421875, 0.027019500732421875, 0.029449462890625, 0.031879425048828125, 0.03430938720703125, 0.036739349365234375, 0.0391693115234375, 0.041599273681640625, 0.04402923583984375, 0.046459197998046875, 0.04888916015625, 0.051319122314453125, 0.05374908447265625, 0.056179046630859375, 0.0586090087890625, 0.061038970947265625, 0.06346893310546875, 0.06589889526367188, 0.068328857421875, 0.07075881958007812, 0.07318878173828125, 0.07561874389648438, 0.0780487060546875, 0.08047866821289062, 0.08290863037109375, 0.08533859252929688, 0.0877685546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 10.0, 14.0, 42.0, 74.0, 137.0, 202.0, 189.0, 149.0, 75.0, 41.0, 19.0, 16.0, 15.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14697265625, -0.14226150512695312, -0.13755035400390625, -0.13283920288085938, -0.1281280517578125, -0.12341690063476562, -0.11870574951171875, -0.11399459838867188, -0.109283447265625, -0.10457229614257812, -0.09986114501953125, -0.09514999389648438, -0.0904388427734375, -0.08572769165039062, -0.08101654052734375, -0.07630538940429688, -0.07159423828125, -0.06688308715820312, -0.06217193603515625, -0.057460784912109375, -0.0527496337890625, -0.048038482666015625, -0.04332733154296875, -0.038616180419921875, -0.033905029296875, -0.029193878173828125, -0.02448272705078125, -0.019771575927734375, -0.0150604248046875, -0.010349273681640625, -0.00563812255859375, -0.000926971435546875, 0.0037841796875, 0.008495330810546875, 0.01320648193359375, 0.017917633056640625, 0.0226287841796875, 0.027339935302734375, 0.03205108642578125, 0.036762237548828125, 0.041473388671875, 0.046184539794921875, 0.05089569091796875, 0.055606842041015625, 0.0603179931640625, 0.06502914428710938, 0.06974029541015625, 0.07445144653320312, 0.07916259765625, 0.08387374877929688, 0.08858489990234375, 0.09329605102539062, 0.0980072021484375, 0.10271835327148438, 0.10742950439453125, 0.11214065551757812, 0.116851806640625, 0.12156295776367188, 0.12627410888671875, 0.13098526000976562, 0.1356964111328125, 0.14040756225585938, 0.14511871337890625, 0.14982986450195312, 0.154541015625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 10.0, 16.0, 41.0, 130.0, 265.0, 290.0, 168.0, 56.0, 18.0, 12.0, 4.0, 1.0], "bins": [-4.122613430023193, -4.050593852996826, -3.978574514389038, -3.90655517578125, -3.834535837173462, -3.762516498565674, -3.6904969215393066, -3.6184775829315186, -3.5464582443237305, -3.4744389057159424, -3.402419328689575, -3.330399990081787, -3.258380651473999, -3.186361312866211, -3.1143417358398438, -3.0423223972320557, -2.9703030586242676, -2.8982837200164795, -2.8262641429901123, -2.754244804382324, -2.682225465774536, -2.610206127166748, -2.538186550140381, -2.4661672115325928, -2.3941476345062256, -2.3221282958984375, -2.2501087188720703, -2.1780893802642822, -2.106070041656494, -2.034050703048706, -1.9620311260223389, -1.8900117874145508, -1.8179926872253418, -1.7459732294082642, -1.673953890800476, -1.6019344329833984, -1.5299150943756104, -1.4578956365585327, -1.385876178741455, -1.313856840133667, -1.2418373823165894, -1.1698179244995117, -1.0977985858917236, -1.025779128074646, -0.9537597894668579, -0.8817403316497803, -0.8097209334373474, -0.7377015352249146, -0.6656821370124817, -0.5936627388000488, -0.521643340587616, -0.4496239125728607, -0.37760451436042786, -0.305585116147995, -0.23356568813323975, -0.16154628992080688, -0.08952689170837402, -0.017507486045360565, 0.05451191961765289, 0.12653133273124695, 0.1985507309436798, 0.27057012915611267, 0.3425895571708679, 0.4146089553833008, 0.48662835359573364]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 12.0, 19.0, 11.0, 21.0, 18.0, 33.0, 28.0, 49.0, 56.0, 49.0, 48.0, 49.0, 63.0, 48.0, 62.0, 58.0, 44.0, 43.0, 54.0, 50.0, 30.0, 26.0, 25.0, 23.0, 15.0, 16.0, 9.0, 7.0, 6.0, 3.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1614229679107666, -1.1241322755813599, -1.0868414640426636, -1.0495507717132568, -1.0122599601745605, -0.974969208240509, -0.9376784563064575, -0.9003877639770508, -0.8630969524383545, -0.825806200504303, -0.7885154485702515, -0.7512246966362, -0.7139339447021484, -0.6766431927680969, -0.6393524408340454, -0.6020617485046387, -0.5647709965705872, -0.5274802446365356, -0.49018949270248413, -0.4528987407684326, -0.4156079888343811, -0.3783172369003296, -0.34102651476860046, -0.30373576283454895, -0.26644501090049744, -0.22915425896644592, -0.1918635070323944, -0.1545727699995041, -0.11728201806545258, -0.07999126613140106, -0.04270052909851074, -0.0054097771644592285, 0.031880974769592285, 0.0691717267036438, 0.10646247118711472, 0.14375321567058563, 0.18104396760463715, 0.21833471953868866, 0.255625456571579, 0.2929162085056305, 0.330206960439682, 0.3674977123737335, 0.40478846430778503, 0.44207918643951416, 0.4793699383735657, 0.5166606903076172, 0.5539514422416687, 0.5912421941757202, 0.6285329461097717, 0.6658236980438232, 0.7031144499778748, 0.7404052019119263, 0.7776959538459778, 0.8149867057800293, 0.852277398109436, 0.8895682096481323, 0.9268589019775391, 0.9641496539115906, 1.001440405845642, 1.0387310981750488, 1.0760219097137451, 1.1133126020431519, 1.1506034135818481, 1.1878941059112549, 1.2251849174499512]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 5.0, 13.0, 30.0, 52.0, 198.0, 861.0, 48513.0, 4142456.0, 1701.0, 284.0, 101.0, 29.0, 6.0, 9.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.427734375, -1.398681640625, -1.36962890625, -1.340576171875, -1.3115234375, -1.282470703125, -1.25341796875, -1.224365234375, -1.1953125, -1.166259765625, -1.13720703125, -1.108154296875, -1.0791015625, -1.050048828125, -1.02099609375, -0.991943359375, -0.962890625, -0.933837890625, -0.90478515625, -0.875732421875, -0.8466796875, -0.817626953125, -0.78857421875, -0.759521484375, -0.73046875, -0.701416015625, -0.67236328125, -0.643310546875, -0.6142578125, -0.585205078125, -0.55615234375, -0.527099609375, -0.498046875, -0.468994140625, -0.43994140625, -0.410888671875, -0.3818359375, -0.352783203125, -0.32373046875, -0.294677734375, -0.265625, -0.236572265625, -0.20751953125, -0.178466796875, -0.1494140625, -0.120361328125, -0.09130859375, -0.062255859375, -0.033203125, -0.004150390625, 0.02490234375, 0.053955078125, 0.0830078125, 0.112060546875, 0.14111328125, 0.170166015625, 0.19921875, 0.228271484375, 0.25732421875, 0.286376953125, 0.3154296875, 0.344482421875, 0.37353515625, 0.402587890625, 0.431640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 13.0, 12.0, 17.0, 12.0, 16.0, 21.0, 43.0, 33.0, 56.0, 46.0, 65.0, 50.0, 62.0, 74.0, 65.0, 69.0, 57.0, 47.0, 51.0, 32.0, 33.0, 34.0, 18.0, 15.0, 16.0, 11.0, 11.0, 8.0, 1.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.069091796875, -0.06724786758422852, -0.06540393829345703, -0.06356000900268555, -0.06171607971191406, -0.05987215042114258, -0.058028221130371094, -0.05618429183959961, -0.054340362548828125, -0.05249643325805664, -0.050652503967285156, -0.04880857467651367, -0.04696464538574219, -0.0451207160949707, -0.04327678680419922, -0.041432857513427734, -0.03958892822265625, -0.037744998931884766, -0.03590106964111328, -0.0340571403503418, -0.03221321105957031, -0.030369281768798828, -0.028525352478027344, -0.02668142318725586, -0.024837493896484375, -0.02299356460571289, -0.021149635314941406, -0.019305706024169922, -0.017461776733398438, -0.015617847442626953, -0.013773918151855469, -0.011929988861083984, -0.0100860595703125, -0.008242130279541016, -0.006398200988769531, -0.004554271697998047, -0.0027103424072265625, -0.0008664131164550781, 0.0009775161743164062, 0.0028214454650878906, 0.004665374755859375, 0.006509304046630859, 0.008353233337402344, 0.010197162628173828, 0.012041091918945312, 0.013885021209716797, 0.01572895050048828, 0.017572879791259766, 0.01941680908203125, 0.021260738372802734, 0.02310466766357422, 0.024948596954345703, 0.026792526245117188, 0.028636455535888672, 0.030480384826660156, 0.03232431411743164, 0.034168243408203125, 0.03601217269897461, 0.037856101989746094, 0.03970003128051758, 0.04154396057128906, 0.04338788986206055, 0.04523181915283203, 0.047075748443603516, 0.048919677734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 6.0, 4.0, 9.0, 10.0, 18.0, 23.0, 24.0, 42.0, 44.0, 66.0, 93.0, 145.0, 172.0, 274.0, 403.0, 628.0, 930.0, 1579.0, 2572.0, 4915.0, 10012.0, 25863.0, 119055.0, 3811338.0, 161734.0, 30481.0, 11181.0, 5280.0, 2753.0, 1684.0, 969.0, 643.0, 397.0, 281.0, 196.0, 133.0, 108.0, 63.0, 33.0, 40.0, 26.0, 14.0, 8.0, 14.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0860595703125, -0.08341693878173828, -0.08077430725097656, -0.07813167572021484, -0.07548904418945312, -0.0728464126586914, -0.07020378112792969, -0.06756114959716797, -0.06491851806640625, -0.06227588653564453, -0.05963325500488281, -0.056990623474121094, -0.054347991943359375, -0.051705360412597656, -0.04906272888183594, -0.04642009735107422, -0.0437774658203125, -0.04113483428955078, -0.03849220275878906, -0.035849571228027344, -0.033206939697265625, -0.030564308166503906, -0.027921676635742188, -0.02527904510498047, -0.02263641357421875, -0.01999378204345703, -0.017351150512695312, -0.014708518981933594, -0.012065887451171875, -0.009423255920410156, -0.0067806243896484375, -0.004137992858886719, -0.001495361328125, 0.0011472702026367188, 0.0037899017333984375, 0.006432533264160156, 0.009075164794921875, 0.011717796325683594, 0.014360427856445312, 0.01700305938720703, 0.01964569091796875, 0.02228832244873047, 0.024930953979492188, 0.027573585510253906, 0.030216217041015625, 0.032858848571777344, 0.03550148010253906, 0.03814411163330078, 0.0407867431640625, 0.04342937469482422, 0.04607200622558594, 0.048714637756347656, 0.051357269287109375, 0.053999900817871094, 0.05664253234863281, 0.05928516387939453, 0.06192779541015625, 0.06457042694091797, 0.06721305847167969, 0.0698556900024414, 0.07249832153320312, 0.07514095306396484, 0.07778358459472656, 0.08042621612548828, 0.08306884765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 5.0, 10.0, 14.0, 14.0, 29.0, 32.0, 80.0, 261.0, 3062.0, 330.0, 75.0, 54.0, 34.0, 16.0, 15.0, 9.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0284576416015625, -0.027699947357177734, -0.02694225311279297, -0.026184558868408203, -0.025426864624023438, -0.024669170379638672, -0.023911476135253906, -0.02315378189086914, -0.022396087646484375, -0.02163839340209961, -0.020880699157714844, -0.020123004913330078, -0.019365310668945312, -0.018607616424560547, -0.01784992218017578, -0.017092227935791016, -0.01633453369140625, -0.015576839447021484, -0.014819145202636719, -0.014061450958251953, -0.013303756713867188, -0.012546062469482422, -0.011788368225097656, -0.01103067398071289, -0.010272979736328125, -0.00951528549194336, -0.008757591247558594, -0.007999897003173828, -0.0072422027587890625, -0.006484508514404297, -0.005726814270019531, -0.004969120025634766, -0.00421142578125, -0.0034537315368652344, -0.0026960372924804688, -0.0019383430480957031, -0.0011806488037109375, -0.0004229545593261719, 0.00033473968505859375, 0.0010924339294433594, 0.001850128173828125, 0.0026078224182128906, 0.0033655166625976562, 0.004123210906982422, 0.0048809051513671875, 0.005638599395751953, 0.006396293640136719, 0.007153987884521484, 0.00791168212890625, 0.008669376373291016, 0.009427070617675781, 0.010184764862060547, 0.010942459106445312, 0.011700153350830078, 0.012457847595214844, 0.01321554183959961, 0.013973236083984375, 0.01473093032836914, 0.015488624572753906, 0.016246318817138672, 0.017004013061523438, 0.017761707305908203, 0.01851940155029297, 0.019277095794677734, 0.0200347900390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 4.0, 21.0, 27.0, 53.0, 94.0, 160.0, 189.0, 149.0, 124.0, 69.0, 47.0, 24.0, 16.0, 8.0, 4.0, 1.0, 3.0, 1.0], "bins": [-0.23447898030281067, -0.23003557324409485, -0.22559216618537903, -0.2211487591266632, -0.2167053520679474, -0.21226194500923157, -0.20781853795051575, -0.20337513089179993, -0.1989317238330841, -0.1944883167743683, -0.19004490971565247, -0.18560150265693665, -0.18115809559822083, -0.176714688539505, -0.17227128148078918, -0.16782787442207336, -0.16338448226451874, -0.15894107520580292, -0.1544976681470871, -0.15005426108837128, -0.14561085402965546, -0.14116744697093964, -0.13672403991222382, -0.1322806477546692, -0.12783724069595337, -0.12339383363723755, -0.11895042657852173, -0.11450701951980591, -0.11006361246109009, -0.10562020540237427, -0.10117680579423904, -0.09673339873552322, -0.0922899842262268, -0.08784657716751099, -0.08340317010879517, -0.07895976305007935, -0.07451635599136353, -0.0700729489326477, -0.06562954932451248, -0.06118614226579666, -0.05674273148179054, -0.05229932442307472, -0.0478559210896492, -0.04341251403093338, -0.03896910697221756, -0.03452569991350174, -0.03008229471743107, -0.025638889521360397, -0.021195482462644577, -0.016752075403928757, -0.012308670207858086, -0.00786526408046484, -0.0034218579530715942, 0.001021549105644226, 0.005464954301714897, 0.009908359497785568, 0.014351766556501389, 0.01879517361521721, 0.02323857881128788, 0.02768198400735855, 0.03212539106607437, 0.03656879812479019, 0.04101220518350601, 0.045455608516931534, 0.049899015575647354]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 10.0, 11.0, 13.0, 19.0, 19.0, 20.0, 21.0, 25.0, 29.0, 32.0, 28.0, 39.0, 46.0, 49.0, 54.0, 44.0, 41.0, 43.0, 43.0, 38.0, 48.0, 43.0, 37.0, 35.0, 33.0, 27.0, 18.0, 21.0, 18.0, 17.0, 16.0, 9.0, 12.0, 12.0, 5.0, 6.0, 5.0, 1.0, 1.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05004245042800903, -0.04840123653411865, -0.04676002636551857, -0.04511881619691849, -0.04347760230302811, -0.041836388409137726, -0.04019517824053764, -0.03855396807193756, -0.03691275417804718, -0.0352715402841568, -0.03363033011555672, -0.031989119946956635, -0.030347906053066254, -0.028706694021821022, -0.02706548199057579, -0.02542426995933056, -0.023783057928085327, -0.022141845896840096, -0.020500633865594864, -0.018859421834349632, -0.0172182098031044, -0.015576997771859169, -0.013935785740613937, -0.012294573709368706, -0.010653361678123474, -0.009012149646878242, -0.007370937615633011, -0.005729725584387779, -0.004088513553142548, -0.002447301521897316, -0.0008060894906520844, 0.0008351225405931473, 0.002476334571838379, 0.0041175466030836105, 0.005758758634328842, 0.007399970665574074, 0.009041182696819305, 0.010682394728064537, 0.012323606759309769, 0.013964818790555, 0.015606030821800232, 0.017247242853045464, 0.018888454884290695, 0.020529666915535927, 0.02217087894678116, 0.02381209097802639, 0.02545330300927162, 0.027094515040516853, 0.028735727071762085, 0.030376939103007317, 0.03201815113425255, 0.03365936130285263, 0.03530057519674301, 0.03694178909063339, 0.038582999259233475, 0.04022420942783356, 0.04186542332172394, 0.04350663721561432, 0.0451478473842144, 0.046789057552814484, 0.048430271446704865, 0.050071485340595245, 0.05171269550919533, 0.05335390567779541, 0.05499511957168579]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 4.0, 11.0, 16.0, 16.0, 20.0, 27.0, 41.0, 64.0, 116.0, 196.0, 395.0, 984.0, 3976.0, 23159.0, 198647.0, 646528.0, 151181.0, 18202.0, 3200.0, 893.0, 376.0, 179.0, 98.0, 72.0, 48.0, 23.0, 17.0, 14.0, 14.0, 6.0, 7.0, 4.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2041015625, -0.19666290283203125, -0.1892242431640625, -0.18178558349609375, -0.174346923828125, -0.16690826416015625, -0.1594696044921875, -0.15203094482421875, -0.14459228515625, -0.13715362548828125, -0.1297149658203125, -0.12227630615234375, -0.114837646484375, -0.10739898681640625, -0.0999603271484375, -0.09252166748046875, -0.0850830078125, -0.07764434814453125, -0.0702056884765625, -0.06276702880859375, -0.055328369140625, -0.04788970947265625, -0.0404510498046875, -0.03301239013671875, -0.02557373046875, -0.01813507080078125, -0.0106964111328125, -0.00325775146484375, 0.004180908203125, 0.01161956787109375, 0.0190582275390625, 0.02649688720703125, 0.033935546875, 0.04137420654296875, 0.0488128662109375, 0.05625152587890625, 0.063690185546875, 0.07112884521484375, 0.0785675048828125, 0.08600616455078125, 0.09344482421875, 0.10088348388671875, 0.1083221435546875, 0.11576080322265625, 0.123199462890625, 0.13063812255859375, 0.1380767822265625, 0.14551544189453125, 0.1529541015625, 0.16039276123046875, 0.1678314208984375, 0.17527008056640625, 0.182708740234375, 0.19014739990234375, 0.1975860595703125, 0.20502471923828125, 0.21246337890625, 0.21990203857421875, 0.2273406982421875, 0.23477935791015625, 0.242218017578125, 0.24965667724609375, 0.2570953369140625, 0.26453399658203125, 0.27197265625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 11.0, 12.0, 12.0, 11.0, 19.0, 21.0, 30.0, 30.0, 47.0, 59.0, 58.0, 58.0, 60.0, 60.0, 68.0, 65.0, 50.0, 55.0, 51.0, 41.0, 42.0, 29.0, 26.0, 24.0, 12.0, 16.0, 11.0, 7.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07147216796875, -0.06959009170532227, -0.06770801544189453, -0.0658259391784668, -0.06394386291503906, -0.06206178665161133, -0.060179710388183594, -0.05829763412475586, -0.056415557861328125, -0.05453348159790039, -0.052651405334472656, -0.05076932907104492, -0.04888725280761719, -0.04700517654418945, -0.04512310028076172, -0.043241024017333984, -0.04135894775390625, -0.039476871490478516, -0.03759479522705078, -0.03571271896362305, -0.03383064270019531, -0.03194856643676758, -0.030066490173339844, -0.02818441390991211, -0.026302337646484375, -0.02442026138305664, -0.022538185119628906, -0.020656108856201172, -0.018774032592773438, -0.016891956329345703, -0.015009880065917969, -0.013127803802490234, -0.0112457275390625, -0.009363651275634766, -0.007481575012207031, -0.005599498748779297, -0.0037174224853515625, -0.0018353462219238281, 4.673004150390625e-05, 0.0019288063049316406, 0.003810882568359375, 0.005692958831787109, 0.007575035095214844, 0.009457111358642578, 0.011339187622070312, 0.013221263885498047, 0.015103340148925781, 0.016985416412353516, 0.01886749267578125, 0.020749568939208984, 0.02263164520263672, 0.024513721466064453, 0.026395797729492188, 0.028277873992919922, 0.030159950256347656, 0.03204202651977539, 0.033924102783203125, 0.03580617904663086, 0.037688255310058594, 0.03957033157348633, 0.04145240783691406, 0.0433344841003418, 0.04521656036376953, 0.047098636627197266, 0.048980712890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 14.0, 20.0, 15.0, 33.0, 48.0, 73.0, 150.0, 197.0, 351.0, 740.0, 1609.0, 3912.0, 12595.0, 54715.0, 299482.0, 526061.0, 114731.0, 22908.0, 6338.0, 2289.0, 1040.0, 507.0, 265.0, 165.0, 105.0, 54.0, 46.0, 29.0, 18.0, 11.0, 9.0, 8.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1650390625, -0.16048240661621094, -0.15592575073242188, -0.1513690948486328, -0.14681243896484375, -0.1422557830810547, -0.13769912719726562, -0.13314247131347656, -0.1285858154296875, -0.12402915954589844, -0.11947250366210938, -0.11491584777832031, -0.11035919189453125, -0.10580253601074219, -0.10124588012695312, -0.09668922424316406, -0.092132568359375, -0.08757591247558594, -0.08301925659179688, -0.07846260070800781, -0.07390594482421875, -0.06934928894042969, -0.06479263305664062, -0.06023597717285156, -0.0556793212890625, -0.05112266540527344, -0.046566009521484375, -0.04200935363769531, -0.03745269775390625, -0.03289604187011719, -0.028339385986328125, -0.023782730102539062, -0.01922607421875, -0.014669418334960938, -0.010112762451171875, -0.0055561065673828125, -0.00099945068359375, 0.0035572052001953125, 0.008113861083984375, 0.012670516967773438, 0.0172271728515625, 0.021783828735351562, 0.026340484619140625, 0.030897140502929688, 0.03545379638671875, 0.04001045227050781, 0.044567108154296875, 0.04912376403808594, 0.053680419921875, 0.05823707580566406, 0.06279373168945312, 0.06735038757324219, 0.07190704345703125, 0.07646369934082031, 0.08102035522460938, 0.08557701110839844, 0.0901336669921875, 0.09469032287597656, 0.09924697875976562, 0.10380363464355469, 0.10836029052734375, 0.11291694641113281, 0.11747360229492188, 0.12203025817871094, 0.1265869140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 7.0, 8.0, 11.0, 11.0, 14.0, 20.0, 26.0, 36.0, 31.0, 37.0, 31.0, 32.0, 57.0, 52.0, 60.0, 60.0, 54.0, 63.0, 45.0, 49.0, 52.0, 40.0, 37.0, 32.0, 38.0, 23.0, 12.0, 16.0, 7.0, 6.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1959228515625, -0.1878337860107422, -0.17974472045898438, -0.17165565490722656, -0.16356658935546875, -0.15547752380371094, -0.14738845825195312, -0.1392993927001953, -0.1312103271484375, -0.12312126159667969, -0.11503219604492188, -0.10694313049316406, -0.09885406494140625, -0.09076499938964844, -0.08267593383789062, -0.07458686828613281, -0.066497802734375, -0.05840873718261719, -0.050319671630859375, -0.04223060607910156, -0.03414154052734375, -0.026052474975585938, -0.017963409423828125, -0.009874343872070312, -0.0017852783203125, 0.0063037872314453125, 0.014392852783203125, 0.022481918334960938, 0.03057098388671875, 0.03866004943847656, 0.046749114990234375, 0.05483818054199219, 0.06292724609375, 0.07101631164550781, 0.07910537719726562, 0.08719444274902344, 0.09528350830078125, 0.10337257385253906, 0.11146163940429688, 0.11955070495605469, 0.1276397705078125, 0.1357288360595703, 0.14381790161132812, 0.15190696716308594, 0.15999603271484375, 0.16808509826660156, 0.17617416381835938, 0.1842632293701172, 0.192352294921875, 0.2004413604736328, 0.20853042602539062, 0.21661949157714844, 0.22470855712890625, 0.23279762268066406, 0.24088668823242188, 0.2489757537841797, 0.2570648193359375, 0.2651538848876953, 0.2732429504394531, 0.28133201599121094, 0.28942108154296875, 0.29751014709472656, 0.3055992126464844, 0.3136882781982422, 0.32177734375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 5.0, 2.0, 6.0, 10.0, 18.0, 26.0, 53.0, 121.0, 294.0, 866.0, 3725.0, 53924.0, 906207.0, 77433.0, 4396.0, 889.0, 301.0, 113.0, 70.0, 35.0, 26.0, 12.0, 8.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1600341796875, -0.15511703491210938, -0.15019989013671875, -0.14528274536132812, -0.1403656005859375, -0.13544845581054688, -0.13053131103515625, -0.12561416625976562, -0.120697021484375, -0.11577987670898438, -0.11086273193359375, -0.10594558715820312, -0.1010284423828125, -0.09611129760742188, -0.09119415283203125, -0.08627700805664062, -0.08135986328125, -0.07644271850585938, -0.07152557373046875, -0.06660842895507812, -0.0616912841796875, -0.056774139404296875, -0.05185699462890625, -0.046939849853515625, -0.042022705078125, -0.037105560302734375, -0.03218841552734375, -0.027271270751953125, -0.0223541259765625, -0.017436981201171875, -0.01251983642578125, -0.007602691650390625, -0.002685546875, 0.002231597900390625, 0.00714874267578125, 0.012065887451171875, 0.0169830322265625, 0.021900177001953125, 0.02681732177734375, 0.031734466552734375, 0.036651611328125, 0.041568756103515625, 0.04648590087890625, 0.051403045654296875, 0.0563201904296875, 0.061237335205078125, 0.06615447998046875, 0.07107162475585938, 0.07598876953125, 0.08090591430664062, 0.08582305908203125, 0.09074020385742188, 0.0956573486328125, 0.10057449340820312, 0.10549163818359375, 0.11040878295898438, 0.115325927734375, 0.12024307250976562, 0.12516021728515625, 0.13007736206054688, 0.1349945068359375, 0.13991165161132812, 0.14482879638671875, 0.14974594116210938, 0.1546630859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 12.0, 12.0, 23.0, 37.0, 61.0, 57.0, 63.0, 71.0, 77.0, 82.0, 68.0, 69.0, 81.0, 52.0, 51.0, 49.0, 22.0, 23.0, 22.0, 9.0, 8.0, 8.0, 4.0, 8.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0], "bins": [-0.0001341104507446289, -0.0001310473307967186, -0.0001279842108488083, -0.00012492109090089798, -0.00012185797095298767, -0.00011879485100507736, -0.00011573173105716705, -0.00011266861110925674, -0.00010960549116134644, -0.00010654237121343613, -0.00010347925126552582, -0.00010041613131761551, -9.73530113697052e-05, -9.428989142179489e-05, -9.122677147388458e-05, -8.816365152597427e-05, -8.510053157806396e-05, -8.203741163015366e-05, -7.897429168224335e-05, -7.591117173433304e-05, -7.284805178642273e-05, -6.978493183851242e-05, -6.672181189060211e-05, -6.36586919426918e-05, -6.0595571994781494e-05, -5.7532452046871185e-05, -5.4469332098960876e-05, -5.140621215105057e-05, -4.834309220314026e-05, -4.527997225522995e-05, -4.221685230731964e-05, -3.915373235940933e-05, -3.6090612411499023e-05, -3.3027492463588715e-05, -2.9964372515678406e-05, -2.6901252567768097e-05, -2.3838132619857788e-05, -2.077501267194748e-05, -1.771189272403717e-05, -1.4648772776126862e-05, -1.1585652828216553e-05, -8.522532880306244e-06, -5.459412932395935e-06, -2.3962929844856262e-06, 6.668269634246826e-07, 3.7299469113349915e-06, 6.7930668592453e-06, 9.856186807155609e-06, 1.2919306755065918e-05, 1.5982426702976227e-05, 1.9045546650886536e-05, 2.2108666598796844e-05, 2.5171786546707153e-05, 2.8234906494617462e-05, 3.129802644252777e-05, 3.436114639043808e-05, 3.742426633834839e-05, 4.04873862862587e-05, 4.3550506234169006e-05, 4.6613626182079315e-05, 4.9676746129989624e-05, 5.273986607789993e-05, 5.580298602581024e-05, 5.886610597372055e-05, 6.192922592163086e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 1.0, 3.0, 10.0, 10.0, 35.0, 50.0, 121.0, 284.0, 740.0, 2972.0, 25769.0, 653637.0, 348174.0, 13664.0, 2074.0, 591.0, 212.0, 113.0, 49.0, 15.0, 13.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155029296875, -0.15093708038330078, -0.14684486389160156, -0.14275264739990234, -0.13866043090820312, -0.1345682144165039, -0.1304759979248047, -0.12638378143310547, -0.12229156494140625, -0.11819934844970703, -0.11410713195800781, -0.1100149154663086, -0.10592269897460938, -0.10183048248291016, -0.09773826599121094, -0.09364604949951172, -0.0895538330078125, -0.08546161651611328, -0.08136940002441406, -0.07727718353271484, -0.07318496704101562, -0.0690927505493164, -0.06500053405761719, -0.06090831756591797, -0.05681610107421875, -0.05272388458251953, -0.04863166809082031, -0.044539451599121094, -0.040447235107421875, -0.036355018615722656, -0.03226280212402344, -0.02817058563232422, -0.024078369140625, -0.01998615264892578, -0.015893936157226562, -0.011801719665527344, -0.007709503173828125, -0.0036172866821289062, 0.0004749298095703125, 0.004567146301269531, 0.00865936279296875, 0.012751579284667969, 0.016843795776367188, 0.020936012268066406, 0.025028228759765625, 0.029120445251464844, 0.03321266174316406, 0.03730487823486328, 0.0413970947265625, 0.04548931121826172, 0.04958152770996094, 0.053673744201660156, 0.057765960693359375, 0.061858177185058594, 0.06595039367675781, 0.07004261016845703, 0.07413482666015625, 0.07822704315185547, 0.08231925964355469, 0.0864114761352539, 0.09050369262695312, 0.09459590911865234, 0.09868812561035156, 0.10278034210205078, 0.10687255859375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 20.0, 27.0, 72.0, 95.0, 116.0, 184.0, 168.0, 117.0, 74.0, 46.0, 26.0, 10.0, 4.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08477783203125, -0.0800008773803711, -0.07522392272949219, -0.07044696807861328, -0.06567001342773438, -0.06089305877685547, -0.05611610412597656, -0.051339149475097656, -0.04656219482421875, -0.041785240173339844, -0.03700828552246094, -0.03223133087158203, -0.027454376220703125, -0.02267742156982422, -0.017900466918945312, -0.013123512268066406, -0.0083465576171875, -0.0035696029663085938, 0.0012073516845703125, 0.005984306335449219, 0.010761260986328125, 0.015538215637207031, 0.020315170288085938, 0.025092124938964844, 0.02986907958984375, 0.034646034240722656, 0.03942298889160156, 0.04419994354248047, 0.048976898193359375, 0.05375385284423828, 0.05853080749511719, 0.0633077621459961, 0.068084716796875, 0.0728616714477539, 0.07763862609863281, 0.08241558074951172, 0.08719253540039062, 0.09196949005126953, 0.09674644470214844, 0.10152339935302734, 0.10630035400390625, 0.11107730865478516, 0.11585426330566406, 0.12063121795654297, 0.12540817260742188, 0.13018512725830078, 0.1349620819091797, 0.1397390365600586, 0.1445159912109375, 0.1492929458618164, 0.1540699005126953, 0.15884685516357422, 0.16362380981445312, 0.16840076446533203, 0.17317771911621094, 0.17795467376708984, 0.18273162841796875, 0.18750858306884766, 0.19228553771972656, 0.19706249237060547, 0.20183944702148438, 0.20661640167236328, 0.2113933563232422, 0.2161703109741211, 0.220947265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 13.0, 37.0, 65.0, 171.0, 292.0, 250.0, 114.0, 38.0, 18.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9730415344238281, -0.8972538709640503, -0.8214661478996277, -0.7456784844398499, -0.6698907613754272, -0.5941030979156494, -0.5183154344558716, -0.442527711391449, -0.36674004793167114, -0.2909523546695709, -0.2151646763086319, -0.13937699794769287, -0.06358930468559265, 0.012198388576507568, 0.0879860520362854, 0.163773775100708, 0.23956143856048584, 0.31534913182258606, 0.3911368250846863, 0.4669244885444641, 0.5427122116088867, 0.6184998750686646, 0.6942875385284424, 0.770075261592865, 0.8458629250526428, 0.9216505885124207, 0.9974383115768433, 1.073225975036621, 1.149013638496399, 1.2248013019561768, 1.3005890846252441, 1.376376748085022, 1.4521644115447998, 1.5279520750045776, 1.6037397384643555, 1.6795275211334229, 1.7553151845932007, 1.8311028480529785, 1.9068905115127563, 1.9826781749725342, 2.0584659576416016, 2.134253740310669, 2.2100412845611572, 2.2858290672302246, 2.361616611480713, 2.4374043941497803, 2.5131921768188477, 2.588979721069336, 2.664767265319824, 2.7405550479888916, 2.81634259223938, 2.8921303749084473, 2.9679179191589355, 3.043705701828003, 3.1194934844970703, 3.1952810287475586, 3.271068811416626, 3.3468565940856934, 3.4226441383361816, 3.498431921005249, 3.5742194652557373, 3.6500072479248047, 3.725794792175293, 3.8015825748443604, 3.8773703575134277]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 3.0, 8.0, 11.0, 9.0, 14.0, 7.0, 12.0, 21.0, 16.0, 23.0, 19.0, 27.0, 42.0, 43.0, 37.0, 37.0, 52.0, 58.0, 41.0, 49.0, 50.0, 37.0, 33.0, 50.0, 39.0, 36.0, 30.0, 30.0, 37.0, 18.0, 18.0, 18.0, 16.0, 10.0, 6.0, 9.0, 9.0, 2.0, 4.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.25397527217865, -1.2202231884002686, -1.1864711046218872, -1.1527189016342163, -1.118966817855835, -1.0852147340774536, -1.0514626502990723, -1.017710566520691, -0.9839584231376648, -0.9502063393592834, -0.9164541959762573, -0.882702112197876, -0.8489500284194946, -0.8151978850364685, -0.7814458012580872, -0.747693657875061, -0.7139415740966797, -0.6801894903182983, -0.6464373469352722, -0.6126852631568909, -0.5789331197738647, -0.5451810359954834, -0.511428952217102, -0.4776768386363983, -0.4439247250556946, -0.41017261147499084, -0.3764204978942871, -0.34266841411590576, -0.308916300535202, -0.2751641869544983, -0.24141208827495575, -0.2076599895954132, -0.17390799522399902, -0.1401558816432953, -0.10640378296375275, -0.07265167683362961, -0.03889957070350647, -0.005147457122802734, 0.028604641556739807, 0.06235674023628235, 0.09610885381698608, 0.12986096739768982, 0.16361306607723236, 0.1973651647567749, 0.23111727833747864, 0.2648693919181824, 0.2986214756965637, 0.33237358927726746, 0.3661257028579712, 0.3998778164386749, 0.43362993001937866, 0.46738201379776, 0.5011341571807861, 0.5348862409591675, 0.5686383247375488, 0.6023904085159302, 0.6361425518989563, 0.6698946356773376, 0.7036467790603638, 0.7373988628387451, 0.7711509466171265, 0.8049030900001526, 0.8386551737785339, 0.8724073171615601, 0.9061594009399414]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 6.0, 4.0, 12.0, 8.0, 22.0, 33.0, 92.0, 250.0, 1099.0, 10442.0, 4109385.0, 69342.0, 2871.0, 492.0, 105.0, 50.0, 26.0, 17.0, 10.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64013671875, -0.6255035400390625, -0.610870361328125, -0.5962371826171875, -0.58160400390625, -0.5669708251953125, -0.552337646484375, -0.5377044677734375, -0.5230712890625, -0.5084381103515625, -0.493804931640625, -0.4791717529296875, -0.46453857421875, -0.4499053955078125, -0.435272216796875, -0.4206390380859375, -0.406005859375, -0.3913726806640625, -0.376739501953125, -0.3621063232421875, -0.34747314453125, -0.3328399658203125, -0.318206787109375, -0.3035736083984375, -0.2889404296875, -0.2743072509765625, -0.259674072265625, -0.2450408935546875, -0.23040771484375, -0.2157745361328125, -0.201141357421875, -0.1865081787109375, -0.171875, -0.1572418212890625, -0.142608642578125, -0.1279754638671875, -0.11334228515625, -0.0987091064453125, -0.084075927734375, -0.0694427490234375, -0.0548095703125, -0.0401763916015625, -0.025543212890625, -0.0109100341796875, 0.00372314453125, 0.0183563232421875, 0.032989501953125, 0.0476226806640625, 0.062255859375, 0.0768890380859375, 0.091522216796875, 0.1061553955078125, 0.12078857421875, 0.1354217529296875, 0.150054931640625, 0.1646881103515625, 0.1793212890625, 0.1939544677734375, 0.208587646484375, 0.2232208251953125, 0.23785400390625, 0.2524871826171875, 0.267120361328125, 0.2817535400390625, 0.29638671875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 16.0, 12.0, 17.0, 24.0, 31.0, 34.0, 40.0, 49.0, 42.0, 55.0, 52.0, 61.0, 71.0, 62.0, 80.0, 54.0, 57.0, 43.0, 38.0, 33.0, 25.0, 22.0, 20.0, 11.0, 11.0, 8.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.064453125, -0.062399864196777344, -0.06034660339355469, -0.05829334259033203, -0.056240081787109375, -0.05418682098388672, -0.05213356018066406, -0.050080299377441406, -0.04802703857421875, -0.045973777770996094, -0.04392051696777344, -0.04186725616455078, -0.039813995361328125, -0.03776073455810547, -0.03570747375488281, -0.033654212951660156, -0.0316009521484375, -0.029547691345214844, -0.027494430541992188, -0.02544116973876953, -0.023387908935546875, -0.02133464813232422, -0.019281387329101562, -0.017228126525878906, -0.01517486572265625, -0.013121604919433594, -0.011068344116210938, -0.009015083312988281, -0.006961822509765625, -0.004908561706542969, -0.0028553009033203125, -0.0008020401000976562, 0.001251220703125, 0.0033044815063476562, 0.0053577423095703125, 0.007411003112792969, 0.009464263916015625, 0.011517524719238281, 0.013570785522460938, 0.015624046325683594, 0.01767730712890625, 0.019730567932128906, 0.021783828735351562, 0.02383708953857422, 0.025890350341796875, 0.02794361114501953, 0.029996871948242188, 0.032050132751464844, 0.0341033935546875, 0.036156654357910156, 0.03820991516113281, 0.04026317596435547, 0.042316436767578125, 0.04436969757080078, 0.04642295837402344, 0.048476219177246094, 0.05052947998046875, 0.052582740783691406, 0.05463600158691406, 0.05668926239013672, 0.058742523193359375, 0.06079578399658203, 0.06284904479980469, 0.06490230560302734, 0.06695556640625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 5.0, 11.0, 3.0, 24.0, 16.0, 20.0, 44.0, 64.0, 89.0, 150.0, 240.0, 383.0, 607.0, 1095.0, 1784.0, 3335.0, 6565.0, 14657.0, 37947.0, 144022.0, 3466123.0, 406357.0, 68133.0, 22736.0, 9571.0, 4582.0, 2334.0, 1259.0, 788.0, 462.0, 265.0, 189.0, 135.0, 101.0, 50.0, 34.0, 32.0, 19.0, 18.0, 10.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.087158203125, -0.08449649810791016, -0.08183479309082031, -0.07917308807373047, -0.07651138305664062, -0.07384967803955078, -0.07118797302246094, -0.0685262680053711, -0.06586456298828125, -0.0632028579711914, -0.06054115295410156, -0.05787944793701172, -0.055217742919921875, -0.05255603790283203, -0.04989433288574219, -0.047232627868652344, -0.0445709228515625, -0.041909217834472656, -0.03924751281738281, -0.03658580780029297, -0.033924102783203125, -0.03126239776611328, -0.028600692749023438, -0.025938987731933594, -0.02327728271484375, -0.020615577697753906, -0.017953872680664062, -0.015292167663574219, -0.012630462646484375, -0.009968757629394531, -0.0073070526123046875, -0.004645347595214844, -0.001983642578125, 0.0006780624389648438, 0.0033397674560546875, 0.006001472473144531, 0.008663177490234375, 0.011324882507324219, 0.013986587524414062, 0.016648292541503906, 0.01930999755859375, 0.021971702575683594, 0.024633407592773438, 0.02729511260986328, 0.029956817626953125, 0.03261852264404297, 0.03528022766113281, 0.037941932678222656, 0.0406036376953125, 0.043265342712402344, 0.04592704772949219, 0.04858875274658203, 0.051250457763671875, 0.05391216278076172, 0.05657386779785156, 0.059235572814941406, 0.06189727783203125, 0.0645589828491211, 0.06722068786621094, 0.06988239288330078, 0.07254409790039062, 0.07520580291748047, 0.07786750793457031, 0.08052921295166016, 0.08319091796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 5.0, 6.0, 11.0, 12.0, 13.0, 20.0, 30.0, 45.0, 74.0, 109.0, 309.0, 2553.0, 441.0, 169.0, 98.0, 58.0, 25.0, 23.0, 16.0, 11.0, 9.0, 6.0, 8.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0311126708984375, -0.030187368392944336, -0.029262065887451172, -0.028336763381958008, -0.027411460876464844, -0.02648615837097168, -0.025560855865478516, -0.02463555335998535, -0.023710250854492188, -0.022784948348999023, -0.02185964584350586, -0.020934343338012695, -0.02000904083251953, -0.019083738327026367, -0.018158435821533203, -0.01723313331604004, -0.016307830810546875, -0.015382528305053711, -0.014457225799560547, -0.013531923294067383, -0.012606620788574219, -0.011681318283081055, -0.01075601577758789, -0.009830713272094727, -0.008905410766601562, -0.007980108261108398, -0.007054805755615234, -0.00612950325012207, -0.005204200744628906, -0.004278898239135742, -0.003353595733642578, -0.002428293228149414, -0.00150299072265625, -0.0005776882171630859, 0.0003476142883300781, 0.0012729167938232422, 0.0021982192993164062, 0.0031235218048095703, 0.004048824310302734, 0.0049741268157958984, 0.0058994293212890625, 0.0068247318267822266, 0.007750034332275391, 0.008675336837768555, 0.009600639343261719, 0.010525941848754883, 0.011451244354248047, 0.012376546859741211, 0.013301849365234375, 0.014227151870727539, 0.015152454376220703, 0.016077756881713867, 0.01700305938720703, 0.017928361892700195, 0.01885366439819336, 0.019778966903686523, 0.020704269409179688, 0.02162957191467285, 0.022554874420166016, 0.02348017692565918, 0.024405479431152344, 0.025330781936645508, 0.026256084442138672, 0.027181386947631836, 0.028106689453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 6.0, 13.0, 22.0, 39.0, 91.0, 128.0, 190.0, 192.0, 145.0, 99.0, 48.0, 18.0, 10.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07341936975717545, -0.06599925458431244, -0.058579135686159134, -0.05115901678800583, -0.04373890161514282, -0.03631878271698952, -0.028898663818836212, -0.021478548645973206, -0.0140584297478199, -0.006638312246650457, 0.0007818052545189857, 0.008201923221349716, 0.015622040256857872, 0.023042157292366028, 0.030462276190519333, 0.03788239136338234, 0.045302510261535645, 0.05272262915968895, 0.060142744332551956, 0.06756286323070526, 0.07498297840356827, 0.08240309357643127, 0.08982321619987488, 0.09724333137273788, 0.10466344654560089, 0.1120835617184639, 0.1195036843419075, 0.1269237995147705, 0.1343439221382141, 0.14176402986049652, 0.14918415248394012, 0.15660426020622253, 0.16402439773082733, 0.17144452035427094, 0.17886462807655334, 0.18628475069999695, 0.19370487332344055, 0.20112498104572296, 0.20854510366916656, 0.21596521139144897, 0.22338533401489258, 0.23080545663833618, 0.2382255643606186, 0.2456456869840622, 0.2530657947063446, 0.2604859173297882, 0.2679060399532318, 0.2753261625766754, 0.282746285200119, 0.2901664078235626, 0.2975865304470062, 0.30500662326812744, 0.31242674589157104, 0.31984686851501465, 0.32726699113845825, 0.33468711376190186, 0.34210720658302307, 0.3495273292064667, 0.3569474518299103, 0.3643675446510315, 0.3717876672744751, 0.3792077898979187, 0.3866279125213623, 0.3940480351448059, 0.4014681577682495]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 7.0, 4.0, 15.0, 7.0, 11.0, 10.0, 12.0, 20.0, 17.0, 25.0, 31.0, 32.0, 32.0, 35.0, 39.0, 45.0, 54.0, 48.0, 58.0, 51.0, 38.0, 39.0, 41.0, 44.0, 42.0, 24.0, 32.0, 38.0, 19.0, 23.0, 31.0, 12.0, 9.0, 8.0, 12.0, 11.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07597875595092773, -0.0735168382525444, -0.07105492055416107, -0.06859300285577774, -0.06613108515739441, -0.06366916745901108, -0.06120724976062775, -0.058745332062244415, -0.056283414363861084, -0.05382149666547775, -0.05135957896709442, -0.04889766126871109, -0.04643574357032776, -0.04397382587194443, -0.041511908173561096, -0.039049990475177765, -0.036588072776794434, -0.0341261550784111, -0.03166423738002777, -0.02920231968164444, -0.02674040198326111, -0.024278484284877777, -0.021816566586494446, -0.019354648888111115, -0.016892731189727783, -0.014430813491344452, -0.01196889579296112, -0.00950697809457779, -0.007045060396194458, -0.004583142697811127, -0.0021212249994277954, 0.0003406926989555359, 0.002802610397338867, 0.0052645280957221985, 0.00772644579410553, 0.010188363492488861, 0.012650281190872192, 0.015112198889255524, 0.017574116587638855, 0.020036034286022186, 0.022497951984405518, 0.02495986968278885, 0.02742178738117218, 0.02988370507955551, 0.03234562277793884, 0.034807540476322174, 0.037269458174705505, 0.03973137587308884, 0.04219329357147217, 0.0446552112698555, 0.04711712896823883, 0.04957904666662216, 0.05204096436500549, 0.054502882063388824, 0.056964799761772156, 0.05942671746015549, 0.06188863515853882, 0.06435055285692215, 0.06681247055530548, 0.06927438825368881, 0.07173630595207214, 0.07419822365045547, 0.0766601413488388, 0.07912205904722214, 0.08158397674560547]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 3.0, 5.0, 9.0, 14.0, 15.0, 15.0, 22.0, 49.0, 73.0, 108.0, 188.0, 329.0, 597.0, 1364.0, 3469.0, 10535.0, 39431.0, 171766.0, 464840.0, 268185.0, 63215.0, 15975.0, 4778.0, 1790.0, 797.0, 370.0, 214.0, 118.0, 82.0, 54.0, 41.0, 30.0, 20.0, 16.0, 7.0, 9.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1231689453125, -0.11901664733886719, -0.11486434936523438, -0.11071205139160156, -0.10655975341796875, -0.10240745544433594, -0.09825515747070312, -0.09410285949707031, -0.0899505615234375, -0.08579826354980469, -0.08164596557617188, -0.07749366760253906, -0.07334136962890625, -0.06918907165527344, -0.06503677368164062, -0.06088447570800781, -0.056732177734375, -0.05257987976074219, -0.048427581787109375, -0.04427528381347656, -0.04012298583984375, -0.03597068786621094, -0.031818389892578125, -0.027666091918945312, -0.0235137939453125, -0.019361495971679688, -0.015209197998046875, -0.011056900024414062, -0.00690460205078125, -0.0027523040771484375, 0.001399993896484375, 0.0055522918701171875, 0.00970458984375, 0.013856887817382812, 0.018009185791015625, 0.022161483764648438, 0.02631378173828125, 0.030466079711914062, 0.034618377685546875, 0.03877067565917969, 0.0429229736328125, 0.04707527160644531, 0.051227569580078125, 0.05537986755371094, 0.05953216552734375, 0.06368446350097656, 0.06783676147460938, 0.07198905944824219, 0.076141357421875, 0.08029365539550781, 0.08444595336914062, 0.08859825134277344, 0.09275054931640625, 0.09690284729003906, 0.10105514526367188, 0.10520744323730469, 0.1093597412109375, 0.11351203918457031, 0.11766433715820312, 0.12181663513183594, 0.12596893310546875, 0.13012123107910156, 0.13427352905273438, 0.1384258270263672, 0.142578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 5.0, 12.0, 11.0, 23.0, 22.0, 24.0, 33.0, 34.0, 30.0, 48.0, 49.0, 48.0, 59.0, 70.0, 68.0, 71.0, 56.0, 48.0, 59.0, 36.0, 42.0, 29.0, 27.0, 22.0, 15.0, 11.0, 12.0, 4.0, 6.0, 9.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06353759765625, -0.061553001403808594, -0.05956840515136719, -0.05758380889892578, -0.055599212646484375, -0.05361461639404297, -0.05163002014160156, -0.049645423889160156, -0.04766082763671875, -0.045676231384277344, -0.04369163513183594, -0.04170703887939453, -0.039722442626953125, -0.03773784637451172, -0.03575325012207031, -0.033768653869628906, -0.0317840576171875, -0.029799461364746094, -0.027814865112304688, -0.02583026885986328, -0.023845672607421875, -0.02186107635498047, -0.019876480102539062, -0.017891883850097656, -0.01590728759765625, -0.013922691345214844, -0.011938095092773438, -0.009953498840332031, -0.007968902587890625, -0.005984306335449219, -0.0039997100830078125, -0.0020151138305664062, -3.0517578125e-05, 0.0019540786743164062, 0.0039386749267578125, 0.005923271179199219, 0.007907867431640625, 0.009892463684082031, 0.011877059936523438, 0.013861656188964844, 0.01584625244140625, 0.017830848693847656, 0.019815444946289062, 0.02180004119873047, 0.023784637451171875, 0.02576923370361328, 0.027753829956054688, 0.029738426208496094, 0.0317230224609375, 0.033707618713378906, 0.03569221496582031, 0.03767681121826172, 0.039661407470703125, 0.04164600372314453, 0.04363059997558594, 0.045615196228027344, 0.04759979248046875, 0.049584388732910156, 0.05156898498535156, 0.05355358123779297, 0.055538177490234375, 0.05752277374267578, 0.05950736999511719, 0.061491966247558594, 0.0634765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 12.0, 14.0, 12.0, 15.0, 20.0, 46.0, 64.0, 108.0, 169.0, 288.0, 524.0, 1165.0, 2982.0, 11243.0, 75232.0, 610027.0, 303918.0, 32444.0, 6299.0, 1977.0, 887.0, 441.0, 237.0, 117.0, 98.0, 56.0, 39.0, 29.0, 14.0, 22.0, 12.0, 7.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2003173828125, -0.19456100463867188, -0.18880462646484375, -0.18304824829101562, -0.1772918701171875, -0.17153549194335938, -0.16577911376953125, -0.16002273559570312, -0.154266357421875, -0.14850997924804688, -0.14275360107421875, -0.13699722290039062, -0.1312408447265625, -0.12548446655273438, -0.11972808837890625, -0.11397171020507812, -0.10821533203125, -0.10245895385742188, -0.09670257568359375, -0.09094619750976562, -0.0851898193359375, -0.07943344116210938, -0.07367706298828125, -0.06792068481445312, -0.062164306640625, -0.056407928466796875, -0.05065155029296875, -0.044895172119140625, -0.0391387939453125, -0.033382415771484375, -0.02762603759765625, -0.021869659423828125, -0.01611328125, -0.010356903076171875, -0.00460052490234375, 0.001155853271484375, 0.0069122314453125, 0.012668609619140625, 0.01842498779296875, 0.024181365966796875, 0.029937744140625, 0.035694122314453125, 0.04145050048828125, 0.047206878662109375, 0.0529632568359375, 0.058719635009765625, 0.06447601318359375, 0.07023239135742188, 0.07598876953125, 0.08174514770507812, 0.08750152587890625, 0.09325790405273438, 0.0990142822265625, 0.10477066040039062, 0.11052703857421875, 0.11628341674804688, 0.122039794921875, 0.12779617309570312, 0.13355255126953125, 0.13930892944335938, 0.1450653076171875, 0.15082168579101562, 0.15657806396484375, 0.16233444213867188, 0.1680908203125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 11.0, 6.0, 14.0, 8.0, 20.0, 22.0, 25.0, 33.0, 49.0, 44.0, 58.0, 70.0, 65.0, 63.0, 79.0, 67.0, 56.0, 65.0, 34.0, 36.0, 45.0, 34.0, 32.0, 15.0, 15.0, 10.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.35791015625, -0.34793853759765625, -0.3379669189453125, -0.32799530029296875, -0.318023681640625, -0.30805206298828125, -0.2980804443359375, -0.28810882568359375, -0.27813720703125, -0.26816558837890625, -0.2581939697265625, -0.24822235107421875, -0.238250732421875, -0.22827911376953125, -0.2183074951171875, -0.20833587646484375, -0.1983642578125, -0.18839263916015625, -0.1784210205078125, -0.16844940185546875, -0.158477783203125, -0.14850616455078125, -0.1385345458984375, -0.12856292724609375, -0.11859130859375, -0.10861968994140625, -0.0986480712890625, -0.08867645263671875, -0.078704833984375, -0.06873321533203125, -0.0587615966796875, -0.04878997802734375, -0.038818359375, -0.02884674072265625, -0.0188751220703125, -0.00890350341796875, 0.001068115234375, 0.01103973388671875, 0.0210113525390625, 0.03098297119140625, 0.04095458984375, 0.05092620849609375, 0.0608978271484375, 0.07086944580078125, 0.080841064453125, 0.09081268310546875, 0.1007843017578125, 0.11075592041015625, 0.1207275390625, 0.13069915771484375, 0.1406707763671875, 0.15064239501953125, 0.160614013671875, 0.17058563232421875, 0.1805572509765625, 0.19052886962890625, 0.20050048828125, 0.21047210693359375, 0.2204437255859375, 0.23041534423828125, 0.240386962890625, 0.25035858154296875, 0.2603302001953125, 0.27030181884765625, 0.2802734375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 15.0, 22.0, 24.0, 43.0, 105.0, 336.0, 1780.0, 80175.0, 959545.0, 5541.0, 627.0, 183.0, 81.0, 38.0, 19.0, 6.0, 10.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3603515625, -0.35012054443359375, -0.3398895263671875, -0.32965850830078125, -0.319427490234375, -0.30919647216796875, -0.2989654541015625, -0.28873443603515625, -0.27850341796875, -0.26827239990234375, -0.2580413818359375, -0.24781036376953125, -0.237579345703125, -0.22734832763671875, -0.2171173095703125, -0.20688629150390625, -0.1966552734375, -0.18642425537109375, -0.1761932373046875, -0.16596221923828125, -0.155731201171875, -0.14550018310546875, -0.1352691650390625, -0.12503814697265625, -0.11480712890625, -0.10457611083984375, -0.0943450927734375, -0.08411407470703125, -0.073883056640625, -0.06365203857421875, -0.0534210205078125, -0.04319000244140625, -0.032958984375, -0.02272796630859375, -0.0124969482421875, -0.00226593017578125, 0.007965087890625, 0.01819610595703125, 0.0284271240234375, 0.03865814208984375, 0.04888916015625, 0.05912017822265625, 0.0693511962890625, 0.07958221435546875, 0.089813232421875, 0.10004425048828125, 0.1102752685546875, 0.12050628662109375, 0.1307373046875, 0.14096832275390625, 0.1511993408203125, 0.16143035888671875, 0.171661376953125, 0.18189239501953125, 0.1921234130859375, 0.20235443115234375, 0.21258544921875, 0.22281646728515625, 0.2330474853515625, 0.24327850341796875, 0.253509521484375, 0.26374053955078125, 0.2739715576171875, 0.28420257568359375, 0.29443359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 10.0, 7.0, 9.0, 17.0, 11.0, 11.0, 22.0, 25.0, 30.0, 34.0, 50.0, 58.0, 67.0, 101.0, 83.0, 88.0, 72.0, 68.0, 51.0, 42.0, 27.0, 26.0, 17.0, 13.0, 13.0, 12.0, 10.0, 7.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0], "bins": [-7.748603820800781e-05, -7.541850209236145e-05, -7.335096597671509e-05, -7.128342986106873e-05, -6.921589374542236e-05, -6.7148357629776e-05, -6.508082151412964e-05, -6.301328539848328e-05, -6.0945749282836914e-05, -5.887821316719055e-05, -5.681067705154419e-05, -5.474314093589783e-05, -5.2675604820251465e-05, -5.06080687046051e-05, -4.854053258895874e-05, -4.647299647331238e-05, -4.4405460357666016e-05, -4.233792424201965e-05, -4.027038812637329e-05, -3.820285201072693e-05, -3.6135315895080566e-05, -3.4067779779434204e-05, -3.200024366378784e-05, -2.993270754814148e-05, -2.7865171432495117e-05, -2.5797635316848755e-05, -2.3730099201202393e-05, -2.166256308555603e-05, -1.9595026969909668e-05, -1.7527490854263306e-05, -1.5459954738616943e-05, -1.3392418622970581e-05, -1.1324882507324219e-05, -9.257346391677856e-06, -7.189810276031494e-06, -5.122274160385132e-06, -3.0547380447387695e-06, -9.872019290924072e-07, 1.080334186553955e-06, 3.1478703022003174e-06, 5.21540641784668e-06, 7.282942533493042e-06, 9.350478649139404e-06, 1.1418014764785767e-05, 1.3485550880432129e-05, 1.555308699607849e-05, 1.7620623111724854e-05, 1.9688159227371216e-05, 2.1755695343017578e-05, 2.382323145866394e-05, 2.5890767574310303e-05, 2.7958303689956665e-05, 3.0025839805603027e-05, 3.209337592124939e-05, 3.416091203689575e-05, 3.6228448152542114e-05, 3.8295984268188477e-05, 4.036352038383484e-05, 4.24310564994812e-05, 4.4498592615127563e-05, 4.6566128730773926e-05, 4.863366484642029e-05, 5.070120096206665e-05, 5.276873707771301e-05, 5.4836273193359375e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 12.0, 14.0, 45.0, 43.0, 122.0, 264.0, 774.0, 4546.0, 350263.0, 684746.0, 6217.0, 942.0, 274.0, 147.0, 58.0, 35.0, 26.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2861328125, -0.2781982421875, -0.270263671875, -0.2623291015625, -0.25439453125, -0.2464599609375, -0.238525390625, -0.2305908203125, -0.22265625, -0.2147216796875, -0.206787109375, -0.1988525390625, -0.19091796875, -0.1829833984375, -0.175048828125, -0.1671142578125, -0.1591796875, -0.1512451171875, -0.143310546875, -0.1353759765625, -0.12744140625, -0.1195068359375, -0.111572265625, -0.1036376953125, -0.095703125, -0.0877685546875, -0.079833984375, -0.0718994140625, -0.06396484375, -0.0560302734375, -0.048095703125, -0.0401611328125, -0.0322265625, -0.0242919921875, -0.016357421875, -0.0084228515625, -0.00048828125, 0.0074462890625, 0.015380859375, 0.0233154296875, 0.03125, 0.0391845703125, 0.047119140625, 0.0550537109375, 0.06298828125, 0.0709228515625, 0.078857421875, 0.0867919921875, 0.0947265625, 0.1026611328125, 0.110595703125, 0.1185302734375, 0.12646484375, 0.1343994140625, 0.142333984375, 0.1502685546875, 0.158203125, 0.1661376953125, 0.174072265625, 0.1820068359375, 0.18994140625, 0.1978759765625, 0.205810546875, 0.2137451171875, 0.2216796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 11.0, 22.0, 31.0, 78.0, 147.0, 241.0, 212.0, 148.0, 50.0, 31.0, 19.0, 7.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10137939453125, -0.09403133392333984, -0.08668327331542969, -0.07933521270751953, -0.07198715209960938, -0.06463909149169922, -0.05729103088378906, -0.049942970275878906, -0.04259490966796875, -0.035246849060058594, -0.027898788452148438, -0.02055072784423828, -0.013202667236328125, -0.005854606628417969, 0.0014934539794921875, 0.008841514587402344, 0.0161895751953125, 0.023537635803222656, 0.030885696411132812, 0.03823375701904297, 0.045581817626953125, 0.05292987823486328, 0.06027793884277344, 0.0676259994506836, 0.07497406005859375, 0.0823221206665039, 0.08967018127441406, 0.09701824188232422, 0.10436630249023438, 0.11171436309814453, 0.11906242370605469, 0.12641048431396484, 0.133758544921875, 0.14110660552978516, 0.1484546661376953, 0.15580272674560547, 0.16315078735351562, 0.17049884796142578, 0.17784690856933594, 0.1851949691772461, 0.19254302978515625, 0.1998910903930664, 0.20723915100097656, 0.21458721160888672, 0.22193527221679688, 0.22928333282470703, 0.2366313934326172, 0.24397945404052734, 0.2513275146484375, 0.25867557525634766, 0.2660236358642578, 0.27337169647216797, 0.2807197570800781, 0.2880678176879883, 0.29541587829589844, 0.3027639389038086, 0.31011199951171875, 0.3174600601196289, 0.32480812072753906, 0.3321561813354492, 0.3395042419433594, 0.34685230255126953, 0.3542003631591797, 0.36154842376708984, 0.368896484375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 13.0, 55.0, 270.0, 441.0, 158.0, 49.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.848891735076904, -6.709672451019287, -6.570453643798828, -6.431234359741211, -6.292015075683594, -6.152795791625977, -6.013576984405518, -5.8743577003479, -5.735138893127441, -5.595919609069824, -5.456700801849365, -5.317481517791748, -5.178262233734131, -5.039043426513672, -4.899824142456055, -4.7606048583984375, -4.62138557434082, -4.482166290283203, -4.342947483062744, -4.203728199005127, -4.06450891494751, -3.9252898693084717, -3.7860708236694336, -3.6468515396118164, -3.5076324939727783, -3.3684134483337402, -3.229194164276123, -3.089975118637085, -2.950756072998047, -2.8115367889404297, -2.6723177433013916, -2.5330986976623535, -2.3938791751861572, -2.254660129547119, -2.115440845489502, -1.9762217998504639, -1.8370026350021362, -1.6977834701538086, -1.5585644245147705, -1.4193452596664429, -1.2801260948181152, -1.1409069299697876, -1.00168776512146, -0.8624687194824219, -0.7232495546340942, -0.5840303897857666, -0.44481128454208374, -0.3055921792984009, -0.16637301445007324, -0.027153879404067993, 0.11206525564193726, 0.2512843906879425, 0.39050352573394775, 0.5297226905822754, 0.6689417958259583, 0.8081609010696411, 0.9473800659179688, 1.0865992307662964, 1.225818395614624, 1.365037441253662, 1.5042566061019897, 1.6434757709503174, 1.7826948165893555, 1.921913981437683, 2.0611331462860107]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 5.0, 0.0, 2.0, 12.0, 9.0, 5.0, 5.0, 6.0, 18.0, 17.0, 20.0, 18.0, 24.0, 17.0, 21.0, 31.0, 33.0, 28.0, 40.0, 55.0, 36.0, 36.0, 43.0, 41.0, 55.0, 48.0, 37.0, 39.0, 36.0, 35.0, 39.0, 22.0, 30.0, 20.0, 20.0, 19.0, 17.0, 19.0, 11.0, 12.0, 7.0, 3.0, 4.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9243149161338806, -0.8916608095169067, -0.8590066432952881, -0.8263525366783142, -0.7936983704566956, -0.7610442638397217, -0.728390097618103, -0.6957359910011292, -0.6630818843841553, -0.6304277777671814, -0.5977736115455627, -0.5651195049285889, -0.5324653387069702, -0.49981123208999634, -0.4671570956707001, -0.4345029592514038, -0.40184879302978516, -0.3691946566104889, -0.3365405201911926, -0.30388641357421875, -0.2712322473526001, -0.23857812583446503, -0.20592400431632996, -0.1732698678970337, -0.14061573147773743, -0.10796159505844116, -0.0753074660897255, -0.04265333712100983, -0.009999200701713562, 0.022654935717582703, 0.05530905723571777, 0.08796319365501404, 0.12061727046966553, 0.1532714068889618, 0.18592554330825806, 0.21857966482639313, 0.2512338161468506, 0.28388792276382446, 0.3165420591831207, 0.349196195602417, 0.38185033202171326, 0.4145044684410095, 0.4471586048603058, 0.47981274127960205, 0.5124668478965759, 0.5451210141181946, 0.5777751207351685, 0.6104292869567871, 0.643083393573761, 0.6757375001907349, 0.7083916664123535, 0.7410457730293274, 0.773699939250946, 0.8063540458679199, 0.8390082120895386, 0.8716623187065125, 0.9043164253234863, 0.9369705319404602, 0.9696246981620789, 1.0022788047790527, 1.0349329710006714, 1.06758713722229, 1.1002411842346191, 1.1328953504562378, 1.1655495166778564]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 12.0, 11.0, 12.0, 22.0, 27.0, 57.0, 99.0, 239.0, 772.0, 2655.0, 27192.0, 4144061.0, 15942.0, 2146.0, 571.0, 208.0, 114.0, 46.0, 23.0, 18.0, 12.0, 7.0, 5.0, 4.0, 1.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.471923828125, -0.4585990905761719, -0.44527435302734375, -0.4319496154785156, -0.4186248779296875, -0.4053001403808594, -0.39197540283203125, -0.3786506652832031, -0.365325927734375, -0.3520011901855469, -0.33867645263671875, -0.3253517150878906, -0.3120269775390625, -0.2987022399902344, -0.28537750244140625, -0.2720527648925781, -0.25872802734375, -0.24540328979492188, -0.23207855224609375, -0.21875381469726562, -0.2054290771484375, -0.19210433959960938, -0.17877960205078125, -0.16545486450195312, -0.152130126953125, -0.13880538940429688, -0.12548065185546875, -0.11215591430664062, -0.0988311767578125, -0.08550643920898438, -0.07218170166015625, -0.058856964111328125, -0.0455322265625, -0.032207489013671875, -0.01888275146484375, -0.005558013916015625, 0.0077667236328125, 0.021091461181640625, 0.03441619873046875, 0.047740936279296875, 0.061065673828125, 0.07439041137695312, 0.08771514892578125, 0.10103988647460938, 0.1143646240234375, 0.12768936157226562, 0.14101409912109375, 0.15433883666992188, 0.16766357421875, 0.18098831176757812, 0.19431304931640625, 0.20763778686523438, 0.2209625244140625, 0.23428726196289062, 0.24761199951171875, 0.2609367370605469, 0.274261474609375, 0.2875862121582031, 0.30091094970703125, 0.3142356872558594, 0.3275604248046875, 0.3408851623535156, 0.35420989990234375, 0.3675346374511719, 0.380859375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 9.0, 8.0, 14.0, 17.0, 24.0, 36.0, 44.0, 35.0, 66.0, 70.0, 72.0, 77.0, 83.0, 63.0, 64.0, 65.0, 61.0, 45.0, 35.0, 23.0, 24.0, 16.0, 13.0, 4.0, 12.0, 5.0, 5.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06536865234375, -0.06267547607421875, -0.0599822998046875, -0.05728912353515625, -0.054595947265625, -0.05190277099609375, -0.0492095947265625, -0.04651641845703125, -0.0438232421875, -0.04113006591796875, -0.0384368896484375, -0.03574371337890625, -0.033050537109375, -0.03035736083984375, -0.0276641845703125, -0.02497100830078125, -0.02227783203125, -0.01958465576171875, -0.0168914794921875, -0.01419830322265625, -0.011505126953125, -0.00881195068359375, -0.0061187744140625, -0.00342559814453125, -0.000732421875, 0.00196075439453125, 0.0046539306640625, 0.00734710693359375, 0.010040283203125, 0.01273345947265625, 0.0154266357421875, 0.01811981201171875, 0.02081298828125, 0.02350616455078125, 0.0261993408203125, 0.02889251708984375, 0.031585693359375, 0.03427886962890625, 0.0369720458984375, 0.03966522216796875, 0.0423583984375, 0.04505157470703125, 0.0477447509765625, 0.05043792724609375, 0.053131103515625, 0.05582427978515625, 0.0585174560546875, 0.06121063232421875, 0.06390380859375, 0.06659698486328125, 0.0692901611328125, 0.07198333740234375, 0.074676513671875, 0.07736968994140625, 0.0800628662109375, 0.08275604248046875, 0.08544921875, 0.08814239501953125, 0.0908355712890625, 0.09352874755859375, 0.096221923828125, 0.09891510009765625, 0.1016082763671875, 0.10430145263671875, 0.10699462890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 14.0, 19.0, 22.0, 37.0, 49.0, 72.0, 93.0, 146.0, 212.0, 409.0, 712.0, 1296.0, 3363.0, 14402.0, 248990.0, 3894341.0, 22158.0, 4301.0, 1621.0, 804.0, 423.0, 247.0, 179.0, 115.0, 90.0, 58.0, 42.0, 20.0, 11.0, 10.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193603515625, -0.18671607971191406, -0.17982864379882812, -0.1729412078857422, -0.16605377197265625, -0.1591663360595703, -0.15227890014648438, -0.14539146423339844, -0.1385040283203125, -0.13161659240722656, -0.12472915649414062, -0.11784172058105469, -0.11095428466796875, -0.10406684875488281, -0.09717941284179688, -0.09029197692871094, -0.083404541015625, -0.07651710510253906, -0.06962966918945312, -0.06274223327636719, -0.05585479736328125, -0.04896736145019531, -0.042079925537109375, -0.03519248962402344, -0.0283050537109375, -0.021417617797851562, -0.014530181884765625, -0.0076427459716796875, -0.00075531005859375, 0.0061321258544921875, 0.013019561767578125, 0.019906997680664062, 0.02679443359375, 0.03368186950683594, 0.040569305419921875, 0.04745674133300781, 0.05434417724609375, 0.06123161315917969, 0.06811904907226562, 0.07500648498535156, 0.0818939208984375, 0.08878135681152344, 0.09566879272460938, 0.10255622863769531, 0.10944366455078125, 0.11633110046386719, 0.12321853637695312, 0.13010597229003906, 0.136993408203125, 0.14388084411621094, 0.15076828002929688, 0.1576557159423828, 0.16454315185546875, 0.1714305877685547, 0.17831802368164062, 0.18520545959472656, 0.1920928955078125, 0.19898033142089844, 0.20586776733398438, 0.2127552032470703, 0.21964263916015625, 0.2265300750732422, 0.23341751098632812, 0.24030494689941406, 0.2471923828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 12.0, 21.0, 43.0, 145.0, 3601.0, 163.0, 50.0, 17.0, 12.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0771484375, -0.07469940185546875, -0.0722503662109375, -0.06980133056640625, -0.067352294921875, -0.06490325927734375, -0.0624542236328125, -0.06000518798828125, -0.05755615234375, -0.05510711669921875, -0.0526580810546875, -0.05020904541015625, -0.047760009765625, -0.04531097412109375, -0.0428619384765625, -0.04041290283203125, -0.0379638671875, -0.03551483154296875, -0.0330657958984375, -0.03061676025390625, -0.028167724609375, -0.02571868896484375, -0.0232696533203125, -0.02082061767578125, -0.01837158203125, -0.01592254638671875, -0.0134735107421875, -0.01102447509765625, -0.008575439453125, -0.00612640380859375, -0.0036773681640625, -0.00122833251953125, 0.001220703125, 0.00366973876953125, 0.0061187744140625, 0.00856781005859375, 0.011016845703125, 0.01346588134765625, 0.0159149169921875, 0.01836395263671875, 0.02081298828125, 0.02326202392578125, 0.0257110595703125, 0.02816009521484375, 0.030609130859375, 0.03305816650390625, 0.0355072021484375, 0.03795623779296875, 0.0404052734375, 0.04285430908203125, 0.0453033447265625, 0.04775238037109375, 0.050201416015625, 0.05265045166015625, 0.0550994873046875, 0.05754852294921875, 0.05999755859375, 0.06244659423828125, 0.0648956298828125, 0.06734466552734375, 0.069793701171875, 0.07224273681640625, 0.0746917724609375, 0.07714080810546875, 0.07958984375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 15.0, 33.0, 59.0, 133.0, 228.0, 205.0, 154.0, 99.0, 45.0, 18.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24924665689468384, -0.24236628413200378, -0.23548591136932373, -0.22860553860664368, -0.22172515094280243, -0.21484477818012238, -0.20796440541744232, -0.20108403265476227, -0.19420364499092102, -0.18732327222824097, -0.1804428994655609, -0.17356252670288086, -0.1666821390390396, -0.15980176627635956, -0.1529213935136795, -0.14604102075099945, -0.1391606479883194, -0.13228027522563934, -0.1253999024629593, -0.11851952224969864, -0.11163914203643799, -0.10475876927375793, -0.09787839651107788, -0.09099802374839783, -0.08411764353513718, -0.07723727077245712, -0.07035689055919647, -0.06347651779651642, -0.056596141308546066, -0.049715764820575714, -0.04283539205789566, -0.03595501556992531, -0.029074639081954956, -0.022194262593984604, -0.015313887968659401, -0.008433513343334198, -0.0015531368553638458, 0.005327239632606506, 0.01220761239528656, 0.019087988883256912, 0.025968365371227264, 0.03284874185919762, 0.03972911834716797, 0.04660949110984802, 0.053489867597818375, 0.06037024408578873, 0.06725061684846878, 0.07413099706172943, 0.08101136982440948, 0.08789174258708954, 0.09477212280035019, 0.10165249556303024, 0.1085328757762909, 0.11541324853897095, 0.122293621301651, 0.12917399406433105, 0.1360543668270111, 0.14293473958969116, 0.14981511235237122, 0.15669548511505127, 0.16357587277889252, 0.17045624554157257, 0.17733661830425262, 0.18421699106693268, 0.19109737873077393]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 8.0, 16.0, 17.0, 12.0, 16.0, 28.0, 26.0, 37.0, 38.0, 53.0, 60.0, 58.0, 66.0, 47.0, 53.0, 51.0, 57.0, 63.0, 62.0, 38.0, 42.0, 28.0, 21.0, 27.0, 17.0, 13.0, 11.0, 6.0, 5.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0998525619506836, -0.09673759341239929, -0.09362262487411499, -0.09050765633583069, -0.08739268779754639, -0.08427772670984268, -0.08116275817155838, -0.07804778963327408, -0.07493282109498978, -0.07181785255670547, -0.06870288401842117, -0.06558791548013687, -0.06247295066714287, -0.059357982128858566, -0.05624301731586456, -0.05312804877758026, -0.05001308023929596, -0.04689811170101166, -0.043783143162727356, -0.04066817834973335, -0.03755320981144905, -0.03443824127316475, -0.031323276460170746, -0.028208307921886444, -0.025093339383602142, -0.02197837084531784, -0.018863404169678688, -0.015748437494039536, -0.012633468955755234, -0.009518501348793507, -0.0064035337418317795, -0.003288567066192627, -0.0001735985279083252, 0.002941369079053402, 0.006056336686015129, 0.009171304292976856, 0.012286271899938583, 0.01540123950690031, 0.018516207113862038, 0.02163117378950119, 0.024746142327785492, 0.027861110866069794, 0.030976077541708946, 0.0340910442173481, 0.0372060127556324, 0.0403209812939167, 0.043435946106910706, 0.04655091464519501, 0.04966588318347931, 0.05278085172176361, 0.05589582026004791, 0.059010785073041916, 0.06212575361132622, 0.06524071842432022, 0.06835568696260452, 0.07147065550088882, 0.07458562403917313, 0.07770059257745743, 0.08081556111574173, 0.08393052965402603, 0.08704549074172974, 0.09016045928001404, 0.09327542781829834, 0.09639039635658264, 0.09950536489486694]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 15.0, 31.0, 36.0, 62.0, 118.0, 235.0, 481.0, 1259.0, 4053.0, 17703.0, 130452.0, 644773.0, 214306.0, 26835.0, 5408.0, 1537.0, 653.0, 285.0, 124.0, 74.0, 39.0, 27.0, 17.0, 14.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18994140625, -0.18373680114746094, -0.17753219604492188, -0.1713275909423828, -0.16512298583984375, -0.1589183807373047, -0.15271377563476562, -0.14650917053222656, -0.1403045654296875, -0.13409996032714844, -0.12789535522460938, -0.12169075012207031, -0.11548614501953125, -0.10928153991699219, -0.10307693481445312, -0.09687232971191406, -0.090667724609375, -0.08446311950683594, -0.07825851440429688, -0.07205390930175781, -0.06584930419921875, -0.05964469909667969, -0.053440093994140625, -0.04723548889160156, -0.0410308837890625, -0.03482627868652344, -0.028621673583984375, -0.022417068481445312, -0.01621246337890625, -0.010007858276367188, -0.003803253173828125, 0.0024013519287109375, 0.00860595703125, 0.014810562133789062, 0.021015167236328125, 0.027219772338867188, 0.03342437744140625, 0.03962898254394531, 0.045833587646484375, 0.05203819274902344, 0.0582427978515625, 0.06444740295410156, 0.07065200805664062, 0.07685661315917969, 0.08306121826171875, 0.08926582336425781, 0.09547042846679688, 0.10167503356933594, 0.107879638671875, 0.11408424377441406, 0.12028884887695312, 0.1264934539794922, 0.13269805908203125, 0.1389026641845703, 0.14510726928710938, 0.15131187438964844, 0.1575164794921875, 0.16372108459472656, 0.16992568969726562, 0.1761302947998047, 0.18233489990234375, 0.1885395050048828, 0.19474411010742188, 0.20094871520996094, 0.2071533203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 10.0, 12.0, 9.0, 9.0, 19.0, 27.0, 39.0, 31.0, 38.0, 54.0, 56.0, 69.0, 76.0, 69.0, 61.0, 50.0, 71.0, 60.0, 38.0, 54.0, 26.0, 27.0, 25.0, 17.0, 18.0, 9.0, 9.0, 4.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0672607421875, -0.0647573471069336, -0.06225395202636719, -0.05975055694580078, -0.057247161865234375, -0.05474376678466797, -0.05224037170410156, -0.049736976623535156, -0.04723358154296875, -0.044730186462402344, -0.04222679138183594, -0.03972339630126953, -0.037220001220703125, -0.03471660614013672, -0.03221321105957031, -0.029709815979003906, -0.0272064208984375, -0.024703025817871094, -0.022199630737304688, -0.01969623565673828, -0.017192840576171875, -0.014689445495605469, -0.012186050415039062, -0.009682655334472656, -0.00717926025390625, -0.004675865173339844, -0.0021724700927734375, 0.00033092498779296875, 0.002834320068359375, 0.005337715148925781, 0.007841110229492188, 0.010344505310058594, 0.012847900390625, 0.015351295471191406, 0.017854690551757812, 0.02035808563232422, 0.022861480712890625, 0.02536487579345703, 0.027868270874023438, 0.030371665954589844, 0.03287506103515625, 0.035378456115722656, 0.03788185119628906, 0.04038524627685547, 0.042888641357421875, 0.04539203643798828, 0.04789543151855469, 0.050398826599121094, 0.0529022216796875, 0.055405616760253906, 0.05790901184082031, 0.06041240692138672, 0.06291580200195312, 0.06541919708251953, 0.06792259216308594, 0.07042598724365234, 0.07292938232421875, 0.07543277740478516, 0.07793617248535156, 0.08043956756591797, 0.08294296264648438, 0.08544635772705078, 0.08794975280761719, 0.0904531478881836, 0.09295654296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 5.0, 6.0, 4.0, 12.0, 9.0, 18.0, 25.0, 31.0, 44.0, 69.0, 121.0, 181.0, 266.0, 509.0, 1034.0, 2595.0, 9676.0, 66538.0, 656466.0, 277335.0, 25472.0, 4852.0, 1589.0, 733.0, 368.0, 218.0, 137.0, 66.0, 60.0, 25.0, 19.0, 25.0, 16.0, 8.0, 8.0, 7.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2086181640625, -0.2026195526123047, -0.19662094116210938, -0.19062232971191406, -0.18462371826171875, -0.17862510681152344, -0.17262649536132812, -0.1666278839111328, -0.1606292724609375, -0.1546306610107422, -0.14863204956054688, -0.14263343811035156, -0.13663482666015625, -0.13063621520996094, -0.12463760375976562, -0.11863899230957031, -0.112640380859375, -0.10664176940917969, -0.10064315795898438, -0.09464454650878906, -0.08864593505859375, -0.08264732360839844, -0.07664871215820312, -0.07065010070800781, -0.0646514892578125, -0.05865287780761719, -0.052654266357421875, -0.04665565490722656, -0.04065704345703125, -0.03465843200683594, -0.028659820556640625, -0.022661209106445312, -0.01666259765625, -0.010663986206054688, -0.004665374755859375, 0.0013332366943359375, 0.00733184814453125, 0.013330459594726562, 0.019329071044921875, 0.025327682495117188, 0.0313262939453125, 0.03732490539550781, 0.043323516845703125, 0.04932212829589844, 0.05532073974609375, 0.06131935119628906, 0.06731796264648438, 0.07331657409667969, 0.079315185546875, 0.08531379699707031, 0.09131240844726562, 0.09731101989746094, 0.10330963134765625, 0.10930824279785156, 0.11530685424804688, 0.12130546569824219, 0.1273040771484375, 0.1333026885986328, 0.13930130004882812, 0.14529991149902344, 0.15129852294921875, 0.15729713439941406, 0.16329574584960938, 0.1692943572998047, 0.17529296875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 10.0, 10.0, 9.0, 18.0, 25.0, 24.0, 31.0, 29.0, 41.0, 40.0, 33.0, 50.0, 41.0, 38.0, 37.0, 48.0, 43.0, 43.0, 34.0, 56.0, 52.0, 27.0, 36.0, 37.0, 30.0, 23.0, 18.0, 16.0, 13.0, 17.0, 12.0, 8.0, 6.0, 3.0, 3.0, 2.0, 6.0, 7.0, 0.0, 1.0, 4.0, 3.0], "bins": [-0.302490234375, -0.2945117950439453, -0.2865333557128906, -0.27855491638183594, -0.27057647705078125, -0.26259803771972656, -0.2546195983886719, -0.2466411590576172, -0.2386627197265625, -0.2306842803955078, -0.22270584106445312, -0.21472740173339844, -0.20674896240234375, -0.19877052307128906, -0.19079208374023438, -0.1828136444091797, -0.174835205078125, -0.1668567657470703, -0.15887832641601562, -0.15089988708496094, -0.14292144775390625, -0.13494300842285156, -0.12696456909179688, -0.11898612976074219, -0.1110076904296875, -0.10302925109863281, -0.09505081176757812, -0.08707237243652344, -0.07909393310546875, -0.07111549377441406, -0.06313705444335938, -0.05515861511230469, -0.04718017578125, -0.03920173645019531, -0.031223297119140625, -0.023244857788085938, -0.01526641845703125, -0.0072879791259765625, 0.000690460205078125, 0.008668899536132812, 0.0166473388671875, 0.024625778198242188, 0.032604217529296875, 0.04058265686035156, 0.04856109619140625, 0.05653953552246094, 0.06451797485351562, 0.07249641418457031, 0.080474853515625, 0.08845329284667969, 0.09643173217773438, 0.10441017150878906, 0.11238861083984375, 0.12036705017089844, 0.12834548950195312, 0.1363239288330078, 0.1443023681640625, 0.1522808074951172, 0.16025924682617188, 0.16823768615722656, 0.17621612548828125, 0.18419456481933594, 0.19217300415039062, 0.2001514434814453, 0.2081298828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 10.0, 14.0, 21.0, 39.0, 40.0, 92.0, 216.0, 377.0, 1043.0, 5595.0, 253245.0, 774761.0, 10724.0, 1419.0, 456.0, 192.0, 118.0, 62.0, 36.0, 28.0, 15.0, 8.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.223876953125, -0.21750259399414062, -0.21112823486328125, -0.20475387573242188, -0.1983795166015625, -0.19200515747070312, -0.18563079833984375, -0.17925643920898438, -0.172882080078125, -0.16650772094726562, -0.16013336181640625, -0.15375900268554688, -0.1473846435546875, -0.14101028442382812, -0.13463592529296875, -0.12826156616210938, -0.12188720703125, -0.11551284790039062, -0.10913848876953125, -0.10276412963867188, -0.0963897705078125, -0.09001541137695312, -0.08364105224609375, -0.07726669311523438, -0.070892333984375, -0.06451797485351562, -0.05814361572265625, -0.051769256591796875, -0.0453948974609375, -0.039020538330078125, -0.03264617919921875, -0.026271820068359375, -0.0198974609375, -0.013523101806640625, -0.00714874267578125, -0.000774383544921875, 0.0055999755859375, 0.011974334716796875, 0.01834869384765625, 0.024723052978515625, 0.031097412109375, 0.037471771240234375, 0.04384613037109375, 0.050220489501953125, 0.0565948486328125, 0.06296920776367188, 0.06934356689453125, 0.07571792602539062, 0.08209228515625, 0.08846664428710938, 0.09484100341796875, 0.10121536254882812, 0.1075897216796875, 0.11396408081054688, 0.12033843994140625, 0.12671279907226562, 0.133087158203125, 0.13946151733398438, 0.14583587646484375, 0.15221023559570312, 0.1585845947265625, 0.16495895385742188, 0.17133331298828125, 0.17770767211914062, 0.18408203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 12.0, 7.0, 7.0, 19.0, 17.0, 19.0, 38.0, 55.0, 67.0, 98.0, 144.0, 165.0, 127.0, 51.0, 46.0, 39.0, 26.0, 18.0, 16.0, 11.0, 7.0, 3.0, 4.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.420778274536133e-05, -7.16550275683403e-05, -6.910227239131927e-05, -6.654951721429825e-05, -6.399676203727722e-05, -6.14440068602562e-05, -5.889125168323517e-05, -5.633849650621414e-05, -5.3785741329193115e-05, -5.123298615217209e-05, -4.868023097515106e-05, -4.6127475798130035e-05, -4.357472062110901e-05, -4.102196544408798e-05, -3.8469210267066956e-05, -3.591645509004593e-05, -3.33636999130249e-05, -3.0810944736003876e-05, -2.825818955898285e-05, -2.5705434381961823e-05, -2.3152679204940796e-05, -2.059992402791977e-05, -1.8047168850898743e-05, -1.5494413673877716e-05, -1.294165849685669e-05, -1.0388903319835663e-05, -7.836148142814636e-06, -5.28339296579361e-06, -2.730637788772583e-06, -1.778826117515564e-07, 2.3748725652694702e-06, 4.927627742290497e-06, 7.4803829193115234e-06, 1.003313809633255e-05, 1.2585893273353577e-05, 1.5138648450374603e-05, 1.769140362739563e-05, 2.0244158804416656e-05, 2.2796913981437683e-05, 2.534966915845871e-05, 2.7902424335479736e-05, 3.0455179512500763e-05, 3.300793468952179e-05, 3.5560689866542816e-05, 3.811344504356384e-05, 4.066620022058487e-05, 4.3218955397605896e-05, 4.577171057462692e-05, 4.832446575164795e-05, 5.0877220928668976e-05, 5.342997610569e-05, 5.598273128271103e-05, 5.8535486459732056e-05, 6.108824163675308e-05, 6.364099681377411e-05, 6.619375199079514e-05, 6.874650716781616e-05, 7.129926234483719e-05, 7.385201752185822e-05, 7.640477269887924e-05, 7.895752787590027e-05, 8.15102830529213e-05, 8.406303822994232e-05, 8.661579340696335e-05, 8.916854858398438e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 5.0, 6.0, 8.0, 15.0, 16.0, 37.0, 61.0, 88.0, 187.0, 491.0, 1290.0, 5118.0, 57080.0, 903970.0, 72130.0, 5645.0, 1413.0, 508.0, 242.0, 88.0, 59.0, 37.0, 17.0, 11.0, 11.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1446533203125, -0.13991546630859375, -0.1351776123046875, -0.13043975830078125, -0.125701904296875, -0.12096405029296875, -0.1162261962890625, -0.11148834228515625, -0.10675048828125, -0.10201263427734375, -0.0972747802734375, -0.09253692626953125, -0.087799072265625, -0.08306121826171875, -0.0783233642578125, -0.07358551025390625, -0.06884765625, -0.06410980224609375, -0.0593719482421875, -0.05463409423828125, -0.049896240234375, -0.04515838623046875, -0.0404205322265625, -0.03568267822265625, -0.03094482421875, -0.02620697021484375, -0.0214691162109375, -0.01673126220703125, -0.011993408203125, -0.00725555419921875, -0.0025177001953125, 0.00222015380859375, 0.0069580078125, 0.01169586181640625, 0.0164337158203125, 0.02117156982421875, 0.025909423828125, 0.03064727783203125, 0.0353851318359375, 0.04012298583984375, 0.04486083984375, 0.04959869384765625, 0.0543365478515625, 0.05907440185546875, 0.063812255859375, 0.06855010986328125, 0.0732879638671875, 0.07802581787109375, 0.082763671875, 0.08750152587890625, 0.0922393798828125, 0.09697723388671875, 0.101715087890625, 0.10645294189453125, 0.1111907958984375, 0.11592864990234375, 0.12066650390625, 0.12540435791015625, 0.1301422119140625, 0.13488006591796875, 0.139617919921875, 0.14435577392578125, 0.1490936279296875, 0.15383148193359375, 0.1585693359375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 18.0, 23.0, 28.0, 33.0, 50.0, 69.0, 105.0, 104.0, 127.0, 100.0, 92.0, 73.0, 50.0, 37.0, 17.0, 22.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.18359375, -0.17936420440673828, -0.17513465881347656, -0.17090511322021484, -0.16667556762695312, -0.1624460220336914, -0.1582164764404297, -0.15398693084716797, -0.14975738525390625, -0.14552783966064453, -0.1412982940673828, -0.1370687484741211, -0.13283920288085938, -0.12860965728759766, -0.12438011169433594, -0.12015056610107422, -0.1159210205078125, -0.11169147491455078, -0.10746192932128906, -0.10323238372802734, -0.09900283813476562, -0.0947732925415039, -0.09054374694824219, -0.08631420135498047, -0.08208465576171875, -0.07785511016845703, -0.07362556457519531, -0.0693960189819336, -0.06516647338867188, -0.060936927795410156, -0.05670738220214844, -0.05247783660888672, -0.048248291015625, -0.04401874542236328, -0.03978919982910156, -0.035559654235839844, -0.031330108642578125, -0.027100563049316406, -0.022871017456054688, -0.01864147186279297, -0.01441192626953125, -0.010182380676269531, -0.0059528350830078125, -0.0017232894897460938, 0.002506256103515625, 0.006735801696777344, 0.010965347290039062, 0.015194892883300781, 0.0194244384765625, 0.02365398406982422, 0.027883529663085938, 0.032113075256347656, 0.036342620849609375, 0.040572166442871094, 0.04480171203613281, 0.04903125762939453, 0.05326080322265625, 0.05749034881591797, 0.06171989440917969, 0.0659494400024414, 0.07017898559570312, 0.07440853118896484, 0.07863807678222656, 0.08286762237548828, 0.08709716796875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 25.0, 596.0, 373.0, 14.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.894050598144531, -10.598784446716309, -10.30351734161377, -10.008251190185547, -9.712985038757324, -9.417718887329102, -9.122451782226562, -8.82718563079834, -8.531919479370117, -8.236653327941895, -7.941386699676514, -7.646120071411133, -7.35085391998291, -7.055587291717529, -6.760320663452148, -6.465054512023926, -6.169787883758545, -5.874521255493164, -5.579255104064941, -5.2839884757995605, -4.988722324371338, -4.693455696105957, -4.398189544677734, -4.1029229164123535, -3.8076565265655518, -3.51239013671875, -3.2171237468719482, -2.9218573570251465, -2.6265907287597656, -2.331324577331543, -2.036057949066162, -1.7407915592193604, -1.4455251693725586, -1.1502587795257568, -0.8549923300743103, -0.5597258806228638, -0.264459490776062, 0.030806899070739746, 0.32607340812683105, 0.6213397979736328, 0.9166061878204346, 1.2118725776672363, 1.507138967514038, 1.8024054765701294, 2.0976719856262207, 2.3929381370544434, 2.688204765319824, 2.983471155166626, 3.2787375450134277, 3.5740039348602295, 3.8692703247070312, 4.164536952972412, 4.459803104400635, 4.755069732666016, 5.050335884094238, 5.345602512359619, 5.640869140625, 5.936135768890381, 6.2314019203186035, 6.526668548583984, 6.821934700012207, 7.117201328277588, 7.412467956542969, 7.707734107971191, 8.003000259399414]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 6.0, 10.0, 10.0, 15.0, 20.0, 28.0, 24.0, 35.0, 42.0, 55.0, 47.0, 56.0, 58.0, 68.0, 73.0, 76.0, 58.0, 40.0, 55.0, 45.0, 35.0, 30.0, 22.0, 25.0, 17.0, 12.0, 6.0, 10.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6806137561798096, -1.630094289779663, -1.5795749425888062, -1.5290554761886597, -1.4785361289978027, -1.4280166625976562, -1.3774971961975098, -1.3269778490066528, -1.276458501815796, -1.2259390354156494, -1.1754196882247925, -1.124900221824646, -1.074380874633789, -1.0238614082336426, -0.9733420014381409, -0.9228225946426392, -0.8723031282424927, -0.821783721446991, -0.7712643146514893, -0.7207448482513428, -0.6702255010604858, -0.6197060346603394, -0.5691866278648376, -0.5186672210693359, -0.46814781427383423, -0.4176284074783325, -0.3671090006828308, -0.3165895640850067, -0.266070157289505, -0.2155507504940033, -0.1650313138961792, -0.11451190710067749, -0.06399250030517578, -0.013473086059093475, 0.03704632818698883, 0.08756574988365173, 0.13808515667915344, 0.18860456347465515, 0.23912400007247925, 0.28964340686798096, 0.34016281366348267, 0.3906822204589844, 0.4412016272544861, 0.4917210638523102, 0.5422405004501343, 0.5927598476409912, 0.6432793140411377, 0.6937987208366394, 0.7443181276321411, 0.7948375344276428, 0.8453569412231445, 0.895876407623291, 0.946395754814148, 0.9969152212142944, 1.0474345684051514, 1.0979540348052979, 1.1484735012054443, 1.1989929676055908, 1.2495123147964478, 1.3000317811965942, 1.3505511283874512, 1.4010705947875977, 1.4515900611877441, 1.502109408378601, 1.552628755569458]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 7.0, 7.0, 9.0, 27.0, 44.0, 123.0, 388.0, 1312.0, 9689.0, 3962658.0, 213324.0, 5368.0, 898.0, 230.0, 93.0, 39.0, 23.0, 12.0, 11.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4765625, -0.46490478515625, -0.4532470703125, -0.44158935546875, -0.429931640625, -0.41827392578125, -0.4066162109375, -0.39495849609375, -0.38330078125, -0.37164306640625, -0.3599853515625, -0.34832763671875, -0.336669921875, -0.32501220703125, -0.3133544921875, -0.30169677734375, -0.2900390625, -0.27838134765625, -0.2667236328125, -0.25506591796875, -0.243408203125, -0.23175048828125, -0.2200927734375, -0.20843505859375, -0.19677734375, -0.18511962890625, -0.1734619140625, -0.16180419921875, -0.150146484375, -0.13848876953125, -0.1268310546875, -0.11517333984375, -0.103515625, -0.09185791015625, -0.0802001953125, -0.06854248046875, -0.056884765625, -0.04522705078125, -0.0335693359375, -0.02191162109375, -0.01025390625, 0.00140380859375, 0.0130615234375, 0.02471923828125, 0.036376953125, 0.04803466796875, 0.0596923828125, 0.07135009765625, 0.0830078125, 0.09466552734375, 0.1063232421875, 0.11798095703125, 0.129638671875, 0.14129638671875, 0.1529541015625, 0.16461181640625, 0.17626953125, 0.18792724609375, 0.1995849609375, 0.21124267578125, 0.222900390625, 0.23455810546875, 0.2462158203125, 0.25787353515625, 0.26953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 7.0, 6.0, 10.0, 10.0, 12.0, 19.0, 32.0, 27.0, 30.0, 55.0, 56.0, 47.0, 73.0, 85.0, 75.0, 81.0, 68.0, 47.0, 54.0, 54.0, 29.0, 28.0, 24.0, 18.0, 13.0, 13.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0828857421875, -0.08031654357910156, -0.07774734497070312, -0.07517814636230469, -0.07260894775390625, -0.07003974914550781, -0.06747055053710938, -0.06490135192871094, -0.0623321533203125, -0.05976295471191406, -0.057193756103515625, -0.05462455749511719, -0.05205535888671875, -0.04948616027832031, -0.046916961669921875, -0.04434776306152344, -0.041778564453125, -0.03920936584472656, -0.036640167236328125, -0.03407096862792969, -0.03150177001953125, -0.028932571411132812, -0.026363372802734375, -0.023794174194335938, -0.0212249755859375, -0.018655776977539062, -0.016086578369140625, -0.013517379760742188, -0.01094818115234375, -0.008378982543945312, -0.005809783935546875, -0.0032405853271484375, -0.00067138671875, 0.0018978118896484375, 0.004467010498046875, 0.0070362091064453125, 0.00960540771484375, 0.012174606323242188, 0.014743804931640625, 0.017313003540039062, 0.0198822021484375, 0.022451400756835938, 0.025020599365234375, 0.027589797973632812, 0.03015899658203125, 0.03272819519042969, 0.035297393798828125, 0.03786659240722656, 0.040435791015625, 0.04300498962402344, 0.045574188232421875, 0.04814338684082031, 0.05071258544921875, 0.05328178405761719, 0.055850982666015625, 0.05842018127441406, 0.0609893798828125, 0.06355857849121094, 0.06612777709960938, 0.06869697570800781, 0.07126617431640625, 0.07383537292480469, 0.07640457153320312, 0.07897377014160156, 0.08154296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 7.0, 8.0, 16.0, 17.0, 31.0, 41.0, 46.0, 66.0, 89.0, 129.0, 173.0, 314.0, 475.0, 854.0, 1684.0, 3380.0, 7595.0, 20322.0, 67235.0, 545056.0, 3390144.0, 109275.0, 28398.0, 9986.0, 4247.0, 2017.0, 1091.0, 598.0, 320.0, 211.0, 143.0, 88.0, 63.0, 45.0, 28.0, 23.0, 21.0, 11.0, 14.0, 9.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.087890625, -0.08515739440917969, -0.08242416381835938, -0.07969093322753906, -0.07695770263671875, -0.07422447204589844, -0.07149124145507812, -0.06875801086425781, -0.0660247802734375, -0.06329154968261719, -0.060558319091796875, -0.05782508850097656, -0.05509185791015625, -0.05235862731933594, -0.049625396728515625, -0.04689216613769531, -0.044158935546875, -0.04142570495605469, -0.038692474365234375, -0.03595924377441406, -0.03322601318359375, -0.030492782592773438, -0.027759552001953125, -0.025026321411132812, -0.0222930908203125, -0.019559860229492188, -0.016826629638671875, -0.014093399047851562, -0.01136016845703125, -0.008626937866210938, -0.005893707275390625, -0.0031604766845703125, -0.00042724609375, 0.0023059844970703125, 0.005039215087890625, 0.0077724456787109375, 0.01050567626953125, 0.013238906860351562, 0.015972137451171875, 0.018705368041992188, 0.0214385986328125, 0.024171829223632812, 0.026905059814453125, 0.029638290405273438, 0.03237152099609375, 0.03510475158691406, 0.037837982177734375, 0.04057121276855469, 0.043304443359375, 0.04603767395019531, 0.048770904541015625, 0.05150413513183594, 0.05423736572265625, 0.05697059631347656, 0.059703826904296875, 0.06243705749511719, 0.0651702880859375, 0.06790351867675781, 0.07063674926757812, 0.07336997985839844, 0.07610321044921875, 0.07883644104003906, 0.08156967163085938, 0.08430290222167969, 0.0870361328125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 9.0, 15.0, 12.0, 30.0, 41.0, 68.0, 162.0, 719.0, 2530.0, 260.0, 103.0, 49.0, 38.0, 14.0, 10.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08721923828125, -0.08480644226074219, -0.08239364624023438, -0.07998085021972656, -0.07756805419921875, -0.07515525817871094, -0.07274246215820312, -0.07032966613769531, -0.0679168701171875, -0.06550407409667969, -0.06309127807617188, -0.06067848205566406, -0.05826568603515625, -0.05585289001464844, -0.053440093994140625, -0.05102729797363281, -0.048614501953125, -0.04620170593261719, -0.043788909912109375, -0.04137611389160156, -0.03896331787109375, -0.03655052185058594, -0.034137725830078125, -0.03172492980957031, -0.0293121337890625, -0.026899337768554688, -0.024486541748046875, -0.022073745727539062, -0.01966094970703125, -0.017248153686523438, -0.014835357666015625, -0.012422561645507812, -0.010009765625, -0.0075969696044921875, -0.005184173583984375, -0.0027713775634765625, -0.00035858154296875, 0.0020542144775390625, 0.004467010498046875, 0.0068798065185546875, 0.0092926025390625, 0.011705398559570312, 0.014118194580078125, 0.016530990600585938, 0.01894378662109375, 0.021356582641601562, 0.023769378662109375, 0.026182174682617188, 0.028594970703125, 0.031007766723632812, 0.033420562744140625, 0.03583335876464844, 0.03824615478515625, 0.04065895080566406, 0.043071746826171875, 0.04548454284667969, 0.0478973388671875, 0.05031013488769531, 0.052722930908203125, 0.05513572692871094, 0.05754852294921875, 0.05996131896972656, 0.062374114990234375, 0.06478691101074219, 0.06719970703125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 7.0, 13.0, 35.0, 90.0, 191.0, 256.0, 188.0, 112.0, 52.0, 30.0, 15.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34411361813545227, -0.3300383388996124, -0.3159630298614502, -0.30188775062561035, -0.2878124713897705, -0.2737371623516083, -0.25966188311576843, -0.2455865889787674, -0.23151129484176636, -0.21743600070476532, -0.20336070656776428, -0.18928542733192444, -0.1752101331949234, -0.16113483905792236, -0.14705955982208252, -0.13298426568508148, -0.11890897154808044, -0.1048336774110794, -0.09075839072465897, -0.07668310403823853, -0.06260780990123749, -0.04853251576423645, -0.03445722907781601, -0.02038194239139557, -0.006306648254394531, 0.007768642157316208, 0.021843932569026947, 0.035919222980737686, 0.049994513392448425, 0.06406980752944946, 0.0781450942158699, 0.09222038090229034, 0.10629570484161377, 0.12037099897861481, 0.13444629311561584, 0.1485215723514557, 0.16259686648845673, 0.17667216062545776, 0.1907474398612976, 0.20482273399829865, 0.21889802813529968, 0.23297332227230072, 0.24704861640930176, 0.2611238956451416, 0.27519917488098145, 0.2892744839191437, 0.3033497631549835, 0.31742507219314575, 0.3315003514289856, 0.34557563066482544, 0.35965093970298767, 0.3737262189388275, 0.38780152797698975, 0.4018768072128296, 0.41595208644866943, 0.4300273656845093, 0.4441026747226715, 0.45817795395851135, 0.4722532629966736, 0.4863285422325134, 0.5004038214683533, 0.5144791603088379, 0.5285544395446777, 0.5426297187805176, 0.5567049980163574]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 7.0, 13.0, 5.0, 13.0, 14.0, 24.0, 24.0, 30.0, 39.0, 34.0, 40.0, 36.0, 58.0, 49.0, 46.0, 61.0, 66.0, 50.0, 57.0, 50.0, 42.0, 34.0, 44.0, 35.0, 24.0, 30.0, 25.0, 14.0, 12.0, 8.0, 5.0, 7.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18039089441299438, -0.17462590336799622, -0.16886091232299805, -0.16309592127799988, -0.1573309302330017, -0.15156595408916473, -0.14580096304416656, -0.1400359719991684, -0.13427098095417023, -0.12850598990917206, -0.12274099886417389, -0.11697601526975632, -0.11121102422475815, -0.10544603317975998, -0.09968104958534241, -0.09391605854034424, -0.08815106749534607, -0.0823860764503479, -0.07662108540534973, -0.07085610181093216, -0.06509111076593399, -0.05932611972093582, -0.05356113240122795, -0.04779614508152008, -0.04203115403652191, -0.03626616299152374, -0.030501175671815872, -0.024736186489462852, -0.018971197307109833, -0.013206208124756813, -0.007441218942403793, -0.0016762316226959229, 0.004088759422302246, 0.009853748604655266, 0.015618737787008286, 0.021383726969361305, 0.027148716151714325, 0.032913707196712494, 0.038678694516420364, 0.044443681836128235, 0.050208672881126404, 0.05597366392612457, 0.06173865124583244, 0.06750363856554031, 0.07326862961053848, 0.07903362065553665, 0.08479860424995422, 0.09056359529495239, 0.09632858633995056, 0.10209357738494873, 0.1078585684299469, 0.11362355202436447, 0.11938854306936264, 0.1251535266637802, 0.13091851770877838, 0.13668350875377655, 0.14244849979877472, 0.1482134908437729, 0.15397848188877106, 0.15974347293376923, 0.1655084490776062, 0.17127344012260437, 0.17703843116760254, 0.1828034222126007, 0.18856841325759888]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 9.0, 9.0, 16.0, 17.0, 31.0, 62.0, 99.0, 152.0, 241.0, 461.0, 829.0, 1749.0, 4229.0, 12136.0, 46880.0, 237484.0, 530906.0, 163718.0, 33704.0, 9332.0, 3296.0, 1457.0, 758.0, 389.0, 208.0, 147.0, 75.0, 54.0, 24.0, 24.0, 13.0, 16.0, 4.0, 6.0, 0.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13330078125, -0.12891387939453125, -0.1245269775390625, -0.12014007568359375, -0.115753173828125, -0.11136627197265625, -0.1069793701171875, -0.10259246826171875, -0.09820556640625, -0.09381866455078125, -0.0894317626953125, -0.08504486083984375, -0.080657958984375, -0.07627105712890625, -0.0718841552734375, -0.06749725341796875, -0.0631103515625, -0.05872344970703125, -0.0543365478515625, -0.04994964599609375, -0.045562744140625, -0.04117584228515625, -0.0367889404296875, -0.03240203857421875, -0.02801513671875, -0.02362823486328125, -0.0192413330078125, -0.01485443115234375, -0.010467529296875, -0.00608062744140625, -0.0016937255859375, 0.00269317626953125, 0.007080078125, 0.01146697998046875, 0.0158538818359375, 0.02024078369140625, 0.024627685546875, 0.02901458740234375, 0.0334014892578125, 0.03778839111328125, 0.04217529296875, 0.04656219482421875, 0.0509490966796875, 0.05533599853515625, 0.059722900390625, 0.06410980224609375, 0.0684967041015625, 0.07288360595703125, 0.0772705078125, 0.08165740966796875, 0.0860443115234375, 0.09043121337890625, 0.094818115234375, 0.09920501708984375, 0.1035919189453125, 0.10797882080078125, 0.11236572265625, 0.11675262451171875, 0.1211395263671875, 0.12552642822265625, 0.129913330078125, 0.13430023193359375, 0.1386871337890625, 0.14307403564453125, 0.1474609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 6.0, 9.0, 7.0, 12.0, 21.0, 11.0, 20.0, 30.0, 45.0, 32.0, 52.0, 50.0, 64.0, 71.0, 67.0, 67.0, 68.0, 50.0, 64.0, 53.0, 31.0, 36.0, 19.0, 25.0, 28.0, 11.0, 9.0, 10.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07354736328125, -0.07115840911865234, -0.06876945495605469, -0.06638050079345703, -0.06399154663085938, -0.06160259246826172, -0.05921363830566406, -0.056824684143066406, -0.05443572998046875, -0.052046775817871094, -0.04965782165527344, -0.04726886749267578, -0.044879913330078125, -0.04249095916748047, -0.04010200500488281, -0.037713050842285156, -0.0353240966796875, -0.032935142517089844, -0.030546188354492188, -0.02815723419189453, -0.025768280029296875, -0.02337932586669922, -0.020990371704101562, -0.018601417541503906, -0.01621246337890625, -0.013823509216308594, -0.011434555053710938, -0.009045600891113281, -0.006656646728515625, -0.004267692565917969, -0.0018787384033203125, 0.0005102157592773438, 0.002899169921875, 0.005288124084472656, 0.0076770782470703125, 0.010066032409667969, 0.012454986572265625, 0.014843940734863281, 0.017232894897460938, 0.019621849060058594, 0.02201080322265625, 0.024399757385253906, 0.026788711547851562, 0.02917766571044922, 0.031566619873046875, 0.03395557403564453, 0.03634452819824219, 0.038733482360839844, 0.0411224365234375, 0.043511390686035156, 0.04590034484863281, 0.04828929901123047, 0.050678253173828125, 0.05306720733642578, 0.05545616149902344, 0.057845115661621094, 0.06023406982421875, 0.0626230239868164, 0.06501197814941406, 0.06740093231201172, 0.06978988647460938, 0.07217884063720703, 0.07456779479980469, 0.07695674896240234, 0.079345703125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 6.0, 10.0, 12.0, 15.0, 26.0, 40.0, 60.0, 75.0, 102.0, 183.0, 327.0, 688.0, 1597.0, 4720.0, 24878.0, 355864.0, 608451.0, 41326.0, 6374.0, 2022.0, 852.0, 387.0, 209.0, 117.0, 79.0, 51.0, 27.0, 21.0, 7.0, 14.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24872779846191406, -0.24184036254882812, -0.2349529266357422, -0.22806549072265625, -0.2211780548095703, -0.21429061889648438, -0.20740318298339844, -0.2005157470703125, -0.19362831115722656, -0.18674087524414062, -0.1798534393310547, -0.17296600341796875, -0.1660785675048828, -0.15919113159179688, -0.15230369567871094, -0.145416259765625, -0.13852882385253906, -0.13164138793945312, -0.12475395202636719, -0.11786651611328125, -0.11097908020019531, -0.10409164428710938, -0.09720420837402344, -0.0903167724609375, -0.08342933654785156, -0.07654190063476562, -0.06965446472167969, -0.06276702880859375, -0.05587959289550781, -0.048992156982421875, -0.04210472106933594, -0.03521728515625, -0.028329849243164062, -0.021442413330078125, -0.014554977416992188, -0.00766754150390625, -0.0007801055908203125, 0.006107330322265625, 0.012994766235351562, 0.0198822021484375, 0.026769638061523438, 0.033657073974609375, 0.04054450988769531, 0.04743194580078125, 0.05431938171386719, 0.061206817626953125, 0.06809425354003906, 0.074981689453125, 0.08186912536621094, 0.08875656127929688, 0.09564399719238281, 0.10253143310546875, 0.10941886901855469, 0.11630630493164062, 0.12319374084472656, 0.1300811767578125, 0.13696861267089844, 0.14385604858398438, 0.1507434844970703, 0.15763092041015625, 0.1645183563232422, 0.17140579223632812, 0.17829322814941406, 0.1851806640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 17.0, 17.0, 19.0, 25.0, 33.0, 51.0, 50.0, 58.0, 78.0, 61.0, 64.0, 52.0, 61.0, 68.0, 58.0, 44.0, 43.0, 43.0, 28.0, 21.0, 34.0, 11.0, 12.0, 8.0, 7.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3682441711425781, -0.35782623291015625, -0.3474082946777344, -0.3369903564453125, -0.3265724182128906, -0.31615447998046875, -0.3057365417480469, -0.295318603515625, -0.2849006652832031, -0.27448272705078125, -0.2640647888183594, -0.2536468505859375, -0.24322891235351562, -0.23281097412109375, -0.22239303588867188, -0.21197509765625, -0.20155715942382812, -0.19113922119140625, -0.18072128295898438, -0.1703033447265625, -0.15988540649414062, -0.14946746826171875, -0.13904953002929688, -0.128631591796875, -0.11821365356445312, -0.10779571533203125, -0.09737777709960938, -0.0869598388671875, -0.07654190063476562, -0.06612396240234375, -0.055706024169921875, -0.0452880859375, -0.034870147705078125, -0.02445220947265625, -0.014034271240234375, -0.0036163330078125, 0.006801605224609375, 0.01721954345703125, 0.027637481689453125, 0.038055419921875, 0.048473358154296875, 0.05889129638671875, 0.06930923461914062, 0.0797271728515625, 0.09014511108398438, 0.10056304931640625, 0.11098098754882812, 0.12139892578125, 0.13181686401367188, 0.14223480224609375, 0.15265274047851562, 0.1630706787109375, 0.17348861694335938, 0.18390655517578125, 0.19432449340820312, 0.204742431640625, 0.21516036987304688, 0.22557830810546875, 0.23599624633789062, 0.2464141845703125, 0.2568321228027344, 0.26725006103515625, 0.2776679992675781, 0.2880859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 11.0, 9.0, 17.0, 17.0, 22.0, 51.0, 43.0, 115.0, 168.0, 347.0, 817.0, 2266.0, 10150.0, 102561.0, 805331.0, 111860.0, 10741.0, 2434.0, 766.0, 347.0, 203.0, 74.0, 53.0, 37.0, 26.0, 23.0, 12.0, 9.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0826416015625, -0.08031463623046875, -0.0779876708984375, -0.07566070556640625, -0.073333740234375, -0.07100677490234375, -0.0686798095703125, -0.06635284423828125, -0.06402587890625, -0.06169891357421875, -0.0593719482421875, -0.05704498291015625, -0.054718017578125, -0.05239105224609375, -0.0500640869140625, -0.04773712158203125, -0.04541015625, -0.04308319091796875, -0.0407562255859375, -0.03842926025390625, -0.036102294921875, -0.03377532958984375, -0.0314483642578125, -0.02912139892578125, -0.02679443359375, -0.02446746826171875, -0.0221405029296875, -0.01981353759765625, -0.017486572265625, -0.01515960693359375, -0.0128326416015625, -0.01050567626953125, -0.0081787109375, -0.00585174560546875, -0.0035247802734375, -0.00119781494140625, 0.001129150390625, 0.00345611572265625, 0.0057830810546875, 0.00811004638671875, 0.01043701171875, 0.01276397705078125, 0.0150909423828125, 0.01741790771484375, 0.019744873046875, 0.02207183837890625, 0.0243988037109375, 0.02672576904296875, 0.029052734375, 0.03137969970703125, 0.0337066650390625, 0.03603363037109375, 0.038360595703125, 0.04068756103515625, 0.0430145263671875, 0.04534149169921875, 0.04766845703125, 0.04999542236328125, 0.0523223876953125, 0.05464935302734375, 0.056976318359375, 0.05930328369140625, 0.0616302490234375, 0.06395721435546875, 0.0662841796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 9.0, 6.0, 4.0, 14.0, 17.0, 14.0, 31.0, 36.0, 46.0, 54.0, 91.0, 129.0, 125.0, 114.0, 86.0, 55.0, 40.0, 36.0, 22.0, 14.0, 12.0, 15.0, 9.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.827447891235352e-05, -8.577294647693634e-05, -8.327141404151917e-05, -8.076988160610199e-05, -7.826834917068481e-05, -7.576681673526764e-05, -7.326528429985046e-05, -7.076375186443329e-05, -6.826221942901611e-05, -6.576068699359894e-05, -6.325915455818176e-05, -6.075762212276459e-05, -5.825608968734741e-05, -5.575455725193024e-05, -5.325302481651306e-05, -5.0751492381095886e-05, -4.824995994567871e-05, -4.5748427510261536e-05, -4.324689507484436e-05, -4.0745362639427185e-05, -3.824383020401001e-05, -3.5742297768592834e-05, -3.324076533317566e-05, -3.0739232897758484e-05, -2.823770046234131e-05, -2.5736168026924133e-05, -2.3234635591506958e-05, -2.0733103156089783e-05, -1.8231570720672607e-05, -1.5730038285255432e-05, -1.3228505849838257e-05, -1.0726973414421082e-05, -8.225440979003906e-06, -5.723908543586731e-06, -3.2223761081695557e-06, -7.208436727523804e-07, 1.780688762664795e-06, 4.28222119808197e-06, 6.7837536334991455e-06, 9.28528606891632e-06, 1.1786818504333496e-05, 1.4288350939750671e-05, 1.6789883375167847e-05, 1.9291415810585022e-05, 2.1792948246002197e-05, 2.4294480681419373e-05, 2.6796013116836548e-05, 2.9297545552253723e-05, 3.17990779876709e-05, 3.4300610423088074e-05, 3.680214285850525e-05, 3.9303675293922424e-05, 4.18052077293396e-05, 4.4306740164756775e-05, 4.680827260017395e-05, 4.9309805035591125e-05, 5.18113374710083e-05, 5.4312869906425476e-05, 5.681440234184265e-05, 5.931593477725983e-05, 6.1817467212677e-05, 6.431899964809418e-05, 6.682053208351135e-05, 6.932206451892853e-05, 7.18235969543457e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 8.0, 4.0, 10.0, 12.0, 20.0, 32.0, 37.0, 54.0, 91.0, 150.0, 244.0, 506.0, 934.0, 2576.0, 10162.0, 90314.0, 762066.0, 160312.0, 15317.0, 3238.0, 1198.0, 514.0, 273.0, 141.0, 97.0, 66.0, 51.0, 41.0, 24.0, 14.0, 10.0, 7.0, 4.0, 7.0, 2.0, 6.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.07781982421875, -0.07557106018066406, -0.07332229614257812, -0.07107353210449219, -0.06882476806640625, -0.06657600402832031, -0.06432723999023438, -0.06207847595214844, -0.0598297119140625, -0.05758094787597656, -0.055332183837890625, -0.05308341979980469, -0.05083465576171875, -0.04858589172363281, -0.046337127685546875, -0.04408836364746094, -0.041839599609375, -0.03959083557128906, -0.037342071533203125, -0.03509330749511719, -0.03284454345703125, -0.030595779418945312, -0.028347015380859375, -0.026098251342773438, -0.0238494873046875, -0.021600723266601562, -0.019351959228515625, -0.017103195190429688, -0.01485443115234375, -0.012605667114257812, -0.010356903076171875, -0.008108139038085938, -0.005859375, -0.0036106109619140625, -0.001361846923828125, 0.0008869171142578125, 0.00313568115234375, 0.0053844451904296875, 0.007633209228515625, 0.009881973266601562, 0.0121307373046875, 0.014379501342773438, 0.016628265380859375, 0.018877029418945312, 0.02112579345703125, 0.023374557495117188, 0.025623321533203125, 0.027872085571289062, 0.030120849609375, 0.03236961364746094, 0.034618377685546875, 0.03686714172363281, 0.03911590576171875, 0.04136466979980469, 0.043613433837890625, 0.04586219787597656, 0.0481109619140625, 0.05035972595214844, 0.052608489990234375, 0.05485725402832031, 0.05710601806640625, 0.05935478210449219, 0.061603546142578125, 0.06385231018066406, 0.06610107421875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 10.0, 18.0, 21.0, 52.0, 70.0, 121.0, 174.0, 179.0, 139.0, 81.0, 70.0, 29.0, 20.0, 6.0, 7.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06982421875, -0.06552696228027344, -0.061229705810546875, -0.05693244934082031, -0.05263519287109375, -0.04833793640136719, -0.044040679931640625, -0.03974342346191406, -0.0354461669921875, -0.031148910522460938, -0.026851654052734375, -0.022554397583007812, -0.01825714111328125, -0.013959884643554688, -0.009662628173828125, -0.0053653717041015625, -0.001068115234375, 0.0032291412353515625, 0.007526397705078125, 0.011823654174804688, 0.01612091064453125, 0.020418167114257812, 0.024715423583984375, 0.029012680053710938, 0.0333099365234375, 0.03760719299316406, 0.041904449462890625, 0.04620170593261719, 0.05049896240234375, 0.05479621887207031, 0.059093475341796875, 0.06339073181152344, 0.06768798828125, 0.07198524475097656, 0.07628250122070312, 0.08057975769042969, 0.08487701416015625, 0.08917427062988281, 0.09347152709960938, 0.09776878356933594, 0.1020660400390625, 0.10636329650878906, 0.11066055297851562, 0.11495780944824219, 0.11925506591796875, 0.12355232238769531, 0.12784957885742188, 0.13214683532714844, 0.136444091796875, 0.14074134826660156, 0.14503860473632812, 0.1493358612060547, 0.15363311767578125, 0.1579303741455078, 0.16222763061523438, 0.16652488708496094, 0.1708221435546875, 0.17511940002441406, 0.17941665649414062, 0.1837139129638672, 0.18801116943359375, 0.1923084259033203, 0.19660568237304688, 0.20090293884277344, 0.2052001953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 2.0, 14.0, 31.0, 67.0, 152.0, 219.0, 243.0, 140.0, 69.0, 32.0, 15.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2400741577148438, -1.1777137517929077, -1.1153533458709717, -1.0529930591583252, -0.9906326532363892, -0.9282722473144531, -0.8659118413925171, -0.803551435470581, -0.7411910891532898, -0.6788306832313538, -0.6164703369140625, -0.5541099309921265, -0.4917495548725128, -0.42938917875289917, -0.36702877283096313, -0.3046683967113495, -0.24230802059173584, -0.1799476444721222, -0.11758725345134735, -0.05522686243057251, 0.007133513689041138, 0.06949388980865479, 0.13185429573059082, 0.19421467185020447, 0.2565750479698181, 0.31893542408943176, 0.3812958002090454, 0.44365620613098145, 0.5060166120529175, 0.5683769583702087, 0.6307373642921448, 0.693097710609436, 0.7554581165313721, 0.8178185224533081, 0.8801788687705994, 0.9425392746925354, 1.0048996210098267, 1.0672600269317627, 1.1296204328536987, 1.1919808387756348, 1.2543411254882812, 1.3167015314102173, 1.3790619373321533, 1.4414222240447998, 1.5037826299667358, 1.5661430358886719, 1.628503441810608, 1.690863847732544, 1.75322425365448, 1.815584659576416, 1.877945065498352, 1.940305471420288, 2.0026657581329346, 2.06502628326416, 2.1273865699768066, 2.189746856689453, 2.2521073818206787, 2.314467668533325, 2.376828193664551, 2.4391884803771973, 2.501549005508423, 2.5639092922210693, 2.626269817352295, 2.6886301040649414, 2.750990390777588]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 4.0, 6.0, 8.0, 7.0, 18.0, 12.0, 27.0, 25.0, 37.0, 44.0, 35.0, 51.0, 59.0, 55.0, 41.0, 67.0, 65.0, 54.0, 51.0, 49.0, 41.0, 39.0, 33.0, 37.0, 30.0, 21.0, 21.0, 16.0, 5.0, 8.0, 10.0, 3.0, 6.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4186487197875977, -1.3738893270492554, -1.3291298151016235, -1.2843704223632812, -1.2396109104156494, -1.1948515176773071, -1.1500921249389648, -1.105332612991333, -1.0605731010437012, -1.0158137083053589, -0.971054196357727, -0.9262948036193848, -0.8815352916717529, -0.8367758989334106, -0.7920164465904236, -0.7472569942474365, -0.7024976015090942, -0.6577381491661072, -0.6129786968231201, -0.5682193040847778, -0.523459792137146, -0.4787003695964813, -0.43394094705581665, -0.3891814947128296, -0.34442204236984253, -0.29966259002685547, -0.2549031376838684, -0.21014371514320374, -0.16538426280021667, -0.12062481045722961, -0.07586538791656494, -0.03110593557357788, 0.01365351676940918, 0.05841296166181564, 0.1031724065542221, 0.14793184399604797, 0.19269129633903503, 0.2374507486820221, 0.28221017122268677, 0.32696962356567383, 0.3717290759086609, 0.41648852825164795, 0.461247980594635, 0.5060074329376221, 0.5507668256759644, 0.5955263376235962, 0.6402857303619385, 0.6850451827049255, 0.7298046350479126, 0.7745640873908997, 0.8193235397338867, 0.864082932472229, 0.9088424444198608, 0.9536018371582031, 0.9983612895011902, 1.0431207418441772, 1.0878801345825195, 1.1326395273208618, 1.1773990392684937, 1.222158432006836, 1.2669179439544678, 1.31167733669281, 1.3564367294311523, 1.4011962413787842, 1.445955753326416]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 11.0, 14.0, 21.0, 28.0, 45.0, 66.0, 119.0, 259.0, 606.0, 1911.0, 7511.0, 53358.0, 3643198.0, 461041.0, 19760.0, 4006.0, 1240.0, 521.0, 249.0, 130.0, 61.0, 49.0, 28.0, 16.0, 11.0, 9.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1666259765625, -0.1606292724609375, -0.154632568359375, -0.1486358642578125, -0.14263916015625, -0.1366424560546875, -0.130645751953125, -0.1246490478515625, -0.11865234375, -0.1126556396484375, -0.106658935546875, -0.1006622314453125, -0.09466552734375, -0.0886688232421875, -0.082672119140625, -0.0766754150390625, -0.0706787109375, -0.0646820068359375, -0.058685302734375, -0.0526885986328125, -0.04669189453125, -0.0406951904296875, -0.034698486328125, -0.0287017822265625, -0.022705078125, -0.0167083740234375, -0.010711669921875, -0.0047149658203125, 0.00128173828125, 0.0072784423828125, 0.013275146484375, 0.0192718505859375, 0.0252685546875, 0.0312652587890625, 0.037261962890625, 0.0432586669921875, 0.04925537109375, 0.0552520751953125, 0.061248779296875, 0.0672454833984375, 0.0732421875, 0.0792388916015625, 0.085235595703125, 0.0912322998046875, 0.09722900390625, 0.1032257080078125, 0.109222412109375, 0.1152191162109375, 0.1212158203125, 0.1272125244140625, 0.133209228515625, 0.1392059326171875, 0.14520263671875, 0.1511993408203125, 0.157196044921875, 0.1631927490234375, 0.169189453125, 0.1751861572265625, 0.181182861328125, 0.1871795654296875, 0.19317626953125, 0.1991729736328125, 0.205169677734375, 0.2111663818359375, 0.2171630859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 7.0, 8.0, 16.0, 20.0, 41.0, 55.0, 82.0, 71.0, 96.0, 104.0, 99.0, 86.0, 57.0, 77.0, 57.0, 41.0, 23.0, 19.0, 15.0, 12.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08221435546875, -0.07893848419189453, -0.07566261291503906, -0.0723867416381836, -0.06911087036132812, -0.06583499908447266, -0.06255912780761719, -0.05928325653076172, -0.05600738525390625, -0.05273151397705078, -0.04945564270019531, -0.046179771423339844, -0.042903900146484375, -0.039628028869628906, -0.03635215759277344, -0.03307628631591797, -0.0298004150390625, -0.02652454376220703, -0.023248672485351562, -0.019972801208496094, -0.016696929931640625, -0.013421058654785156, -0.010145187377929688, -0.006869316101074219, -0.00359344482421875, -0.00031757354736328125, 0.0029582977294921875, 0.006234169006347656, 0.009510040283203125, 0.012785911560058594, 0.016061782836914062, 0.01933765411376953, 0.022613525390625, 0.02588939666748047, 0.029165267944335938, 0.032441139221191406, 0.035717010498046875, 0.038992881774902344, 0.04226875305175781, 0.04554462432861328, 0.04882049560546875, 0.05209636688232422, 0.05537223815917969, 0.058648109436035156, 0.061923980712890625, 0.0651998519897461, 0.06847572326660156, 0.07175159454345703, 0.0750274658203125, 0.07830333709716797, 0.08157920837402344, 0.0848550796508789, 0.08813095092773438, 0.09140682220458984, 0.09468269348144531, 0.09795856475830078, 0.10123443603515625, 0.10451030731201172, 0.10778617858886719, 0.11106204986572266, 0.11433792114257812, 0.1176137924194336, 0.12088966369628906, 0.12416553497314453, 0.12744140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 8.0, 20.0, 30.0, 54.0, 136.0, 337.0, 1003.0, 4522.0, 38920.0, 3813733.0, 319308.0, 13240.0, 2013.0, 570.0, 209.0, 92.0, 25.0, 17.0, 6.0, 11.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.2152729034423828, -0.20752334594726562, -0.19977378845214844, -0.19202423095703125, -0.18427467346191406, -0.17652511596679688, -0.1687755584716797, -0.1610260009765625, -0.1532764434814453, -0.14552688598632812, -0.13777732849121094, -0.13002777099609375, -0.12227821350097656, -0.11452865600585938, -0.10677909851074219, -0.099029541015625, -0.09127998352050781, -0.08353042602539062, -0.07578086853027344, -0.06803131103515625, -0.06028175354003906, -0.052532196044921875, -0.04478263854980469, -0.0370330810546875, -0.029283523559570312, -0.021533966064453125, -0.013784408569335938, -0.00603485107421875, 0.0017147064208984375, 0.009464263916015625, 0.017213821411132812, 0.02496337890625, 0.03271293640136719, 0.040462493896484375, 0.04821205139160156, 0.05596160888671875, 0.06371116638183594, 0.07146072387695312, 0.07921028137207031, 0.0869598388671875, 0.09470939636230469, 0.10245895385742188, 0.11020851135253906, 0.11795806884765625, 0.12570762634277344, 0.13345718383789062, 0.1412067413330078, 0.148956298828125, 0.1567058563232422, 0.16445541381835938, 0.17220497131347656, 0.17995452880859375, 0.18770408630371094, 0.19545364379882812, 0.2032032012939453, 0.2109527587890625, 0.2187023162841797, 0.22645187377929688, 0.23420143127441406, 0.24195098876953125, 0.24970054626464844, 0.2574501037597656, 0.2651996612548828, 0.27294921875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 6.0, 5.0, 9.0, 13.0, 13.0, 37.0, 50.0, 67.0, 216.0, 613.0, 1575.0, 961.0, 280.0, 97.0, 40.0, 26.0, 20.0, 21.0, 12.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.242919921875, -0.23645591735839844, -0.22999191284179688, -0.2235279083251953, -0.21706390380859375, -0.2105998992919922, -0.20413589477539062, -0.19767189025878906, -0.1912078857421875, -0.18474388122558594, -0.17827987670898438, -0.1718158721923828, -0.16535186767578125, -0.1588878631591797, -0.15242385864257812, -0.14595985412597656, -0.139495849609375, -0.13303184509277344, -0.12656784057617188, -0.12010383605957031, -0.11363983154296875, -0.10717582702636719, -0.10071182250976562, -0.09424781799316406, -0.0877838134765625, -0.08131980895996094, -0.07485580444335938, -0.06839179992675781, -0.06192779541015625, -0.05546379089355469, -0.048999786376953125, -0.04253578186035156, -0.03607177734375, -0.029607772827148438, -0.023143768310546875, -0.016679763793945312, -0.01021575927734375, -0.0037517547607421875, 0.002712249755859375, 0.009176254272460938, 0.0156402587890625, 0.022104263305664062, 0.028568267822265625, 0.03503227233886719, 0.04149627685546875, 0.04796028137207031, 0.054424285888671875, 0.06088829040527344, 0.067352294921875, 0.07381629943847656, 0.08028030395507812, 0.08674430847167969, 0.09320831298828125, 0.09967231750488281, 0.10613632202148438, 0.11260032653808594, 0.1190643310546875, 0.12552833557128906, 0.13199234008789062, 0.1384563446044922, 0.14492034912109375, 0.1513843536376953, 0.15784835815429688, 0.16431236267089844, 0.1707763671875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 11.0, 16.0, 47.0, 72.0, 135.0, 161.0, 178.0, 144.0, 83.0, 55.0, 32.0, 14.0, 11.0, 4.0, 6.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8262320160865784, -0.7948660850524902, -0.7635002136230469, -0.7321342825889587, -0.7007684111595154, -0.6694024801254272, -0.6380366086959839, -0.6066706776618958, -0.5753047466278076, -0.5439388155937195, -0.5125729441642761, -0.481207013130188, -0.44984114170074463, -0.4184752106666565, -0.38710930943489075, -0.355743408203125, -0.32437753677368164, -0.2930116355419159, -0.26164573431015015, -0.2302798181772232, -0.19891391694545746, -0.1675480157136917, -0.13618209958076477, -0.10481619834899902, -0.07345029711723328, -0.04208439216017723, -0.010718487203121185, 0.02064742147922516, 0.052013322710990906, 0.08337922394275665, 0.1147451400756836, 0.14611104130744934, 0.17747700214385986, 0.2088429033756256, 0.24020880460739136, 0.2715747356414795, 0.30294060707092285, 0.334306538105011, 0.36567243933677673, 0.3970383405685425, 0.4284042418003082, 0.459770143032074, 0.4911360442638397, 0.5225019454956055, 0.5538678765296936, 0.585233747959137, 0.6165996789932251, 0.6479655504226685, 0.6793314814567566, 0.7106974124908447, 0.7420632839202881, 0.7734292149543762, 0.8047950863838196, 0.8361610174179077, 0.8675268888473511, 0.8988928198814392, 0.9302587509155273, 0.9616246819496155, 0.9929905533790588, 1.024356484413147, 1.0557223558425903, 1.0870882272720337, 1.1184542179107666, 1.14982008934021, 1.1811859607696533]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 12.0, 12.0, 19.0, 14.0, 26.0, 17.0, 21.0, 29.0, 38.0, 38.0, 25.0, 40.0, 51.0, 43.0, 52.0, 48.0, 42.0, 47.0, 48.0, 38.0, 51.0, 41.0, 42.0, 35.0, 30.0, 28.0, 16.0, 16.0, 8.0, 12.0, 15.0, 4.0, 4.0, 9.0, 10.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6143044829368591, -0.5954985618591309, -0.5766926407814026, -0.5578866600990295, -0.5390807390213013, -0.520274817943573, -0.5014688968658447, -0.48266297578811646, -0.4638570249080658, -0.4450511038303375, -0.42624515295028687, -0.4074392318725586, -0.3886333107948303, -0.36982735991477966, -0.3510214388370514, -0.33221548795700073, -0.31340956687927246, -0.2946036458015442, -0.27579769492149353, -0.25699177384376526, -0.2381858378648758, -0.21937990188598633, -0.20057398080825806, -0.1817680448293686, -0.16296210885047913, -0.14415617287158966, -0.1253502368927002, -0.10654431581497192, -0.08773837983608246, -0.068932443857193, -0.050126515328884125, -0.031320586800575256, -0.012514591217041016, 0.006291341036558151, 0.025097273290157318, 0.043903205543756485, 0.06270913779735565, 0.08151507377624512, 0.10032100230455399, 0.11912693083286285, 0.13793286681175232, 0.15673880279064178, 0.17554473876953125, 0.19435065984725952, 0.213156595826149, 0.23196253180503845, 0.2507684528827667, 0.2695744037628174, 0.28838032484054565, 0.3071862459182739, 0.3259921967983246, 0.34479811787605286, 0.3636040687561035, 0.3824099898338318, 0.40121591091156006, 0.42002183198928833, 0.438827782869339, 0.45763370394706726, 0.4764396548271179, 0.4952455759048462, 0.5140514969825745, 0.5328574180603027, 0.5516633987426758, 0.570469319820404, 0.5892752408981323]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 15.0, 16.0, 22.0, 22.0, 63.0, 71.0, 177.0, 302.0, 635.0, 1408.0, 4061.0, 12803.0, 49849.0, 233355.0, 522391.0, 170538.0, 37297.0, 9927.0, 3210.0, 1217.0, 542.0, 266.0, 130.0, 84.0, 43.0, 31.0, 22.0, 13.0, 13.0, 10.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.1434326171875, -0.13949203491210938, -0.13555145263671875, -0.13161087036132812, -0.1276702880859375, -0.12372970581054688, -0.11978912353515625, -0.11584854125976562, -0.111907958984375, -0.10796737670898438, -0.10402679443359375, -0.10008621215820312, -0.0961456298828125, -0.09220504760742188, -0.08826446533203125, -0.08432388305664062, -0.08038330078125, -0.07644271850585938, -0.07250213623046875, -0.06856155395507812, -0.0646209716796875, -0.060680389404296875, -0.05673980712890625, -0.052799224853515625, -0.048858642578125, -0.044918060302734375, -0.04097747802734375, -0.037036895751953125, -0.0330963134765625, -0.029155731201171875, -0.02521514892578125, -0.021274566650390625, -0.017333984375, -0.013393402099609375, -0.00945281982421875, -0.005512237548828125, -0.0015716552734375, 0.002368927001953125, 0.00630950927734375, 0.010250091552734375, 0.014190673828125, 0.018131256103515625, 0.02207183837890625, 0.026012420654296875, 0.0299530029296875, 0.033893585205078125, 0.03783416748046875, 0.041774749755859375, 0.04571533203125, 0.049655914306640625, 0.05359649658203125, 0.057537078857421875, 0.0614776611328125, 0.06541824340820312, 0.06935882568359375, 0.07329940795898438, 0.077239990234375, 0.08118057250976562, 0.08512115478515625, 0.08906173706054688, 0.0930023193359375, 0.09694290161132812, 0.10088348388671875, 0.10482406616210938, 0.1087646484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 2.0, 10.0, 14.0, 20.0, 18.0, 24.0, 33.0, 40.0, 37.0, 62.0, 57.0, 50.0, 73.0, 75.0, 63.0, 61.0, 68.0, 47.0, 55.0, 34.0, 32.0, 32.0, 23.0, 20.0, 10.0, 9.0, 12.0, 7.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059814453125, -0.05759239196777344, -0.055370330810546875, -0.05314826965332031, -0.05092620849609375, -0.04870414733886719, -0.046482086181640625, -0.04426002502441406, -0.0420379638671875, -0.03981590270996094, -0.037593841552734375, -0.03537178039550781, -0.03314971923828125, -0.030927658081054688, -0.028705596923828125, -0.026483535766601562, -0.024261474609375, -0.022039413452148438, -0.019817352294921875, -0.017595291137695312, -0.01537322998046875, -0.013151168823242188, -0.010929107666015625, -0.008707046508789062, -0.0064849853515625, -0.0042629241943359375, -0.002040863037109375, 0.0001811981201171875, 0.00240325927734375, 0.0046253204345703125, 0.006847381591796875, 0.009069442749023438, 0.01129150390625, 0.013513565063476562, 0.015735626220703125, 0.017957687377929688, 0.02017974853515625, 0.022401809692382812, 0.024623870849609375, 0.026845932006835938, 0.0290679931640625, 0.03129005432128906, 0.033512115478515625, 0.03573417663574219, 0.03795623779296875, 0.04017829895019531, 0.042400360107421875, 0.04462242126464844, 0.046844482421875, 0.04906654357910156, 0.051288604736328125, 0.05351066589355469, 0.05573272705078125, 0.05795478820800781, 0.060176849365234375, 0.06239891052246094, 0.0646209716796875, 0.06684303283691406, 0.06906509399414062, 0.07128715515136719, 0.07350921630859375, 0.07573127746582031, 0.07795333862304688, 0.08017539978027344, 0.0823974609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 11.0, 9.0, 13.0, 13.0, 23.0, 26.0, 24.0, 61.0, 92.0, 123.0, 209.0, 297.0, 523.0, 1036.0, 2210.0, 7319.0, 48874.0, 677051.0, 280484.0, 22047.0, 4489.0, 1645.0, 789.0, 430.0, 265.0, 162.0, 96.0, 72.0, 50.0, 36.0, 18.0, 17.0, 7.0, 8.0, 7.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1739501953125, -0.1683063507080078, -0.16266250610351562, -0.15701866149902344, -0.15137481689453125, -0.14573097229003906, -0.14008712768554688, -0.1344432830810547, -0.1287994384765625, -0.12315559387207031, -0.11751174926757812, -0.11186790466308594, -0.10622406005859375, -0.10058021545410156, -0.09493637084960938, -0.08929252624511719, -0.083648681640625, -0.07800483703613281, -0.07236099243164062, -0.06671714782714844, -0.06107330322265625, -0.05542945861816406, -0.049785614013671875, -0.04414176940917969, -0.0384979248046875, -0.03285408020019531, -0.027210235595703125, -0.021566390991210938, -0.01592254638671875, -0.010278701782226562, -0.004634857177734375, 0.0010089874267578125, 0.00665283203125, 0.012296676635742188, 0.017940521240234375, 0.023584365844726562, 0.02922821044921875, 0.03487205505371094, 0.040515899658203125, 0.04615974426269531, 0.0518035888671875, 0.05744743347167969, 0.06309127807617188, 0.06873512268066406, 0.07437896728515625, 0.08002281188964844, 0.08566665649414062, 0.09131050109863281, 0.096954345703125, 0.10259819030761719, 0.10824203491210938, 0.11388587951660156, 0.11952972412109375, 0.12517356872558594, 0.13081741333007812, 0.1364612579345703, 0.1421051025390625, 0.1477489471435547, 0.15339279174804688, 0.15903663635253906, 0.16468048095703125, 0.17032432556152344, 0.17596817016601562, 0.1816120147705078, 0.187255859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 11.0, 7.0, 10.0, 15.0, 19.0, 25.0, 11.0, 33.0, 46.0, 44.0, 43.0, 49.0, 53.0, 52.0, 67.0, 55.0, 60.0, 53.0, 41.0, 37.0, 49.0, 30.0, 35.0, 30.0, 22.0, 23.0, 21.0, 13.0, 4.0, 13.0, 9.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.259765625, -0.25261497497558594, -0.24546432495117188, -0.2383136749267578, -0.23116302490234375, -0.2240123748779297, -0.21686172485351562, -0.20971107482910156, -0.2025604248046875, -0.19540977478027344, -0.18825912475585938, -0.1811084747314453, -0.17395782470703125, -0.1668071746826172, -0.15965652465820312, -0.15250587463378906, -0.145355224609375, -0.13820457458496094, -0.13105392456054688, -0.12390327453613281, -0.11675262451171875, -0.10960197448730469, -0.10245132446289062, -0.09530067443847656, -0.0881500244140625, -0.08099937438964844, -0.07384872436523438, -0.06669807434082031, -0.05954742431640625, -0.05239677429199219, -0.045246124267578125, -0.03809547424316406, -0.03094482421875, -0.023794174194335938, -0.016643524169921875, -0.009492874145507812, -0.00234222412109375, 0.0048084259033203125, 0.011959075927734375, 0.019109725952148438, 0.0262603759765625, 0.03341102600097656, 0.040561676025390625, 0.04771232604980469, 0.05486297607421875, 0.06201362609863281, 0.06916427612304688, 0.07631492614746094, 0.083465576171875, 0.09061622619628906, 0.09776687622070312, 0.10491752624511719, 0.11206817626953125, 0.11921882629394531, 0.12636947631835938, 0.13352012634277344, 0.1406707763671875, 0.14782142639160156, 0.15497207641601562, 0.1621227264404297, 0.16927337646484375, 0.1764240264892578, 0.18357467651367188, 0.19072532653808594, 0.1978759765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 12.0, 15.0, 18.0, 22.0, 43.0, 59.0, 160.0, 300.0, 858.0, 3586.0, 37654.0, 905036.0, 92938.0, 5876.0, 1164.0, 424.0, 147.0, 90.0, 47.0, 19.0, 19.0, 21.0, 16.0, 9.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08209228515625, -0.07875919342041016, -0.07542610168457031, -0.07209300994873047, -0.06875991821289062, -0.06542682647705078, -0.06209373474121094, -0.058760643005371094, -0.05542755126953125, -0.052094459533691406, -0.04876136779785156, -0.04542827606201172, -0.042095184326171875, -0.03876209259033203, -0.03542900085449219, -0.032095909118652344, -0.0287628173828125, -0.025429725646972656, -0.022096633911132812, -0.01876354217529297, -0.015430450439453125, -0.012097358703613281, -0.008764266967773438, -0.005431175231933594, -0.00209808349609375, 0.0012350082397460938, 0.0045680999755859375, 0.007901191711425781, 0.011234283447265625, 0.014567375183105469, 0.017900466918945312, 0.021233558654785156, 0.024566650390625, 0.027899742126464844, 0.031232833862304688, 0.03456592559814453, 0.037899017333984375, 0.04123210906982422, 0.04456520080566406, 0.047898292541503906, 0.05123138427734375, 0.054564476013183594, 0.05789756774902344, 0.06123065948486328, 0.06456375122070312, 0.06789684295654297, 0.07122993469238281, 0.07456302642822266, 0.0778961181640625, 0.08122920989990234, 0.08456230163574219, 0.08789539337158203, 0.09122848510742188, 0.09456157684326172, 0.09789466857910156, 0.1012277603149414, 0.10456085205078125, 0.1078939437866211, 0.11122703552246094, 0.11456012725830078, 0.11789321899414062, 0.12122631072998047, 0.12455940246582031, 0.12789249420166016, 0.1312255859375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 4.0, 9.0, 6.0, 8.0, 8.0, 7.0, 15.0, 14.0, 40.0, 61.0, 77.0, 145.0, 191.0, 156.0, 81.0, 56.0, 28.0, 20.0, 13.0, 11.0, 8.0, 7.0, 9.0, 2.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001308917999267578, -0.00012729410082101822, -0.00012369640171527863, -0.00012009870260953903, -0.00011650100350379944, -0.00011290330439805984, -0.00010930560529232025, -0.00010570790618658066, -0.00010211020708084106, -9.851250797510147e-05, -9.491480886936188e-05, -9.131710976362228e-05, -8.771941065788269e-05, -8.41217115521431e-05, -8.05240124464035e-05, -7.692631334066391e-05, -7.332861423492432e-05, -6.973091512918472e-05, -6.613321602344513e-05, -6.253551691770554e-05, -5.893781781196594e-05, -5.534011870622635e-05, -5.1742419600486755e-05, -4.814472049474716e-05, -4.454702138900757e-05, -4.0949322283267975e-05, -3.735162317752838e-05, -3.375392407178879e-05, -3.0156224966049194e-05, -2.65585258603096e-05, -2.2960826754570007e-05, -1.9363127648830414e-05, -1.576542854309082e-05, -1.2167729437351227e-05, -8.570030331611633e-06, -4.97233122587204e-06, -1.3746321201324463e-06, 2.2230669856071472e-06, 5.820766091346741e-06, 9.418465197086334e-06, 1.3016164302825928e-05, 1.661386340856552e-05, 2.0211562514305115e-05, 2.3809261620044708e-05, 2.7406960725784302e-05, 3.1004659831523895e-05, 3.460235893726349e-05, 3.820005804300308e-05, 4.1797757148742676e-05, 4.539545625448227e-05, 4.899315536022186e-05, 5.2590854465961456e-05, 5.618855357170105e-05, 5.978625267744064e-05, 6.338395178318024e-05, 6.698165088891983e-05, 7.057934999465942e-05, 7.417704910039902e-05, 7.777474820613861e-05, 8.13724473118782e-05, 8.49701464176178e-05, 8.856784552335739e-05, 9.216554462909698e-05, 9.576324373483658e-05, 9.936094284057617e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 9.0, 19.0, 17.0, 27.0, 37.0, 55.0, 74.0, 155.0, 266.0, 499.0, 1074.0, 2771.0, 10717.0, 88955.0, 793923.0, 129893.0, 14009.0, 3395.0, 1264.0, 592.0, 313.0, 167.0, 106.0, 61.0, 54.0, 25.0, 24.0, 10.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07208633422851562, -0.06964874267578125, -0.06721115112304688, -0.0647735595703125, -0.062335968017578125, -0.05989837646484375, -0.057460784912109375, -0.055023193359375, -0.052585601806640625, -0.05014801025390625, -0.047710418701171875, -0.0452728271484375, -0.042835235595703125, -0.04039764404296875, -0.037960052490234375, -0.0355224609375, -0.033084869384765625, -0.03064727783203125, -0.028209686279296875, -0.0257720947265625, -0.023334503173828125, -0.02089691162109375, -0.018459320068359375, -0.016021728515625, -0.013584136962890625, -0.01114654541015625, -0.008708953857421875, -0.0062713623046875, -0.003833770751953125, -0.00139617919921875, 0.001041412353515625, 0.00347900390625, 0.005916595458984375, 0.00835418701171875, 0.010791778564453125, 0.0132293701171875, 0.015666961669921875, 0.01810455322265625, 0.020542144775390625, 0.022979736328125, 0.025417327880859375, 0.02785491943359375, 0.030292510986328125, 0.0327301025390625, 0.035167694091796875, 0.03760528564453125, 0.040042877197265625, 0.04248046875, 0.044918060302734375, 0.04735565185546875, 0.049793243408203125, 0.0522308349609375, 0.054668426513671875, 0.05710601806640625, 0.059543609619140625, 0.061981201171875, 0.06441879272460938, 0.06685638427734375, 0.06929397583007812, 0.0717315673828125, 0.07416915893554688, 0.07660675048828125, 0.07904434204101562, 0.08148193359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 7.0, 6.0, 7.0, 11.0, 18.0, 20.0, 43.0, 35.0, 43.0, 53.0, 83.0, 103.0, 108.0, 101.0, 85.0, 68.0, 51.0, 34.0, 31.0, 19.0, 16.0, 12.0, 14.0, 15.0, 8.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06201171875, -0.05985450744628906, -0.057697296142578125, -0.05554008483886719, -0.05338287353515625, -0.05122566223144531, -0.049068450927734375, -0.04691123962402344, -0.0447540283203125, -0.04259681701660156, -0.040439605712890625, -0.03828239440917969, -0.03612518310546875, -0.03396797180175781, -0.031810760498046875, -0.029653549194335938, -0.027496337890625, -0.025339126586914062, -0.023181915283203125, -0.021024703979492188, -0.01886749267578125, -0.016710281372070312, -0.014553070068359375, -0.012395858764648438, -0.0102386474609375, -0.008081436157226562, -0.005924224853515625, -0.0037670135498046875, -0.00160980224609375, 0.0005474090576171875, 0.002704620361328125, 0.0048618316650390625, 0.00701904296875, 0.009176254272460938, 0.011333465576171875, 0.013490676879882812, 0.01564788818359375, 0.017805099487304688, 0.019962310791015625, 0.022119522094726562, 0.0242767333984375, 0.026433944702148438, 0.028591156005859375, 0.030748367309570312, 0.03290557861328125, 0.03506278991699219, 0.037220001220703125, 0.03937721252441406, 0.041534423828125, 0.04369163513183594, 0.045848846435546875, 0.04800605773925781, 0.05016326904296875, 0.05232048034667969, 0.054477691650390625, 0.05663490295410156, 0.0587921142578125, 0.06094932556152344, 0.06310653686523438, 0.06526374816894531, 0.06742095947265625, 0.06957817077636719, 0.07173538208007812, 0.07389259338378906, 0.0760498046875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 9.0, 12.0, 23.0, 45.0, 105.0, 221.0, 235.0, 166.0, 92.0, 41.0, 22.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4509326219558716, -1.4060605764389038, -1.3611884117126465, -1.3163163661956787, -1.271444320678711, -1.2265721559524536, -1.1817001104354858, -1.1368279457092285, -1.0919559001922607, -1.047083854675293, -1.0022116899490356, -0.9573396444320679, -0.9124675393104553, -0.8675954341888428, -0.822723388671875, -0.7778512835502625, -0.7329791784286499, -0.6881070733070374, -0.6432349681854248, -0.598362922668457, -0.5534908175468445, -0.5086187124252319, -0.4637466371059418, -0.4188745617866516, -0.37400245666503906, -0.3291303515434265, -0.28425827622413635, -0.239386186003685, -0.19451409578323364, -0.1496420055627823, -0.10476991534233093, -0.05989784002304077, -0.015025615692138672, 0.029846474528312683, 0.07471856474876404, 0.1195906549692154, 0.16446274518966675, 0.2093348354101181, 0.25420692563056946, 0.2990790009498596, 0.34395110607147217, 0.3888232111930847, 0.4336952865123749, 0.47856736183166504, 0.5234394669532776, 0.5683115720748901, 0.6131836175918579, 0.6580557227134705, 0.702927827835083, 0.7477999329566956, 0.7926720380783081, 0.8375440835952759, 0.8824161887168884, 0.927288293838501, 0.9721603393554688, 1.0170323848724365, 1.0619045495986938, 1.1067765951156616, 1.151648759841919, 1.1965208053588867, 1.2413928508758545, 1.2862650156021118, 1.3311370611190796, 1.376009225845337, 1.4208812713623047]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 14.0, 14.0, 6.0, 12.0, 10.0, 19.0, 14.0, 17.0, 21.0, 27.0, 20.0, 25.0, 34.0, 34.0, 41.0, 44.0, 50.0, 55.0, 55.0, 47.0, 56.0, 54.0, 37.0, 42.0, 38.0, 30.0, 26.0, 18.0, 21.0, 15.0, 13.0, 8.0, 15.0, 13.0, 6.0, 14.0, 8.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.8345845937728882, -0.8091962337493896, -0.7838079333305359, -0.7584195733070374, -0.7330312132835388, -0.7076429128646851, -0.6822545528411865, -0.656866192817688, -0.6314778327941895, -0.6060894727706909, -0.5807011723518372, -0.5553128123283386, -0.5299244523048401, -0.5045361518859863, -0.4791477918624878, -0.45375943183898926, -0.4283711016178131, -0.40298277139663696, -0.3775944113731384, -0.3522060811519623, -0.32681772112846375, -0.3014293909072876, -0.27604103088378906, -0.2506527006626129, -0.22526435554027557, -0.19987601041793823, -0.1744876652956009, -0.14909932017326355, -0.1237109825015068, -0.09832264482975006, -0.07293429970741272, -0.04754595458507538, -0.022157609462738037, 0.003230733796954155, 0.028619077056646347, 0.05400741845369339, 0.07939576357603073, 0.10478410124778748, 0.13017244637012482, 0.15556079149246216, 0.1809491366147995, 0.20633748173713684, 0.23172582685947418, 0.2571141719818115, 0.28250250220298767, 0.3078908324241638, 0.33327919244766235, 0.3586675524711609, 0.38405588269233704, 0.4094442129135132, 0.4348325729370117, 0.46022090315818787, 0.4856092631816864, 0.5109975934028625, 0.5363859534263611, 0.5617742538452148, 0.5871626138687134, 0.6125509738922119, 0.6379392743110657, 0.6633276343345642, 0.6887159943580627, 0.7141042947769165, 0.739492654800415, 0.7648810148239136, 0.7902693748474121]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 10.0, 6.0, 14.0, 16.0, 19.0, 36.0, 38.0, 61.0, 78.0, 112.0, 165.0, 259.0, 444.0, 1561.0, 45271.0, 4127209.0, 16697.0, 1193.0, 373.0, 211.0, 135.0, 100.0, 75.0, 41.0, 34.0, 31.0, 15.0, 14.0, 13.0, 9.0, 12.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.414306640625, -0.4035148620605469, -0.39272308349609375, -0.3819313049316406, -0.3711395263671875, -0.3603477478027344, -0.34955596923828125, -0.3387641906738281, -0.327972412109375, -0.3171806335449219, -0.30638885498046875, -0.2955970764160156, -0.2848052978515625, -0.2740135192871094, -0.26322174072265625, -0.2524299621582031, -0.24163818359375, -0.23084640502929688, -0.22005462646484375, -0.20926284790039062, -0.1984710693359375, -0.18767929077148438, -0.17688751220703125, -0.16609573364257812, -0.155303955078125, -0.14451217651367188, -0.13372039794921875, -0.12292861938476562, -0.1121368408203125, -0.10134506225585938, -0.09055328369140625, -0.07976150512695312, -0.0689697265625, -0.058177947998046875, -0.04738616943359375, -0.036594390869140625, -0.0258026123046875, -0.015010833740234375, -0.00421905517578125, 0.006572723388671875, 0.017364501953125, 0.028156280517578125, 0.03894805908203125, 0.049739837646484375, 0.0605316162109375, 0.07132339477539062, 0.08211517333984375, 0.09290695190429688, 0.10369873046875, 0.11449050903320312, 0.12528228759765625, 0.13607406616210938, 0.1468658447265625, 0.15765762329101562, 0.16844940185546875, 0.17924118041992188, 0.190032958984375, 0.20082473754882812, 0.21161651611328125, 0.22240829467773438, 0.2332000732421875, 0.24399185180664062, 0.25478363037109375, 0.2655754089355469, 0.2763671875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 3.0, 7.0, 5.0, 11.0, 16.0, 15.0, 20.0, 22.0, 38.0, 25.0, 39.0, 47.0, 52.0, 47.0, 51.0, 49.0, 43.0, 68.0, 57.0, 54.0, 39.0, 42.0, 26.0, 38.0, 31.0, 32.0, 27.0, 20.0, 24.0, 9.0, 16.0, 4.0, 6.0, 4.0, 8.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05780029296875, -0.056107521057128906, -0.05441474914550781, -0.05272197723388672, -0.051029205322265625, -0.04933643341064453, -0.04764366149902344, -0.045950889587402344, -0.04425811767578125, -0.042565345764160156, -0.04087257385253906, -0.03917980194091797, -0.037487030029296875, -0.03579425811767578, -0.03410148620605469, -0.032408714294433594, -0.0307159423828125, -0.029023170471191406, -0.027330398559570312, -0.02563762664794922, -0.023944854736328125, -0.02225208282470703, -0.020559310913085938, -0.018866539001464844, -0.01717376708984375, -0.015480995178222656, -0.013788223266601562, -0.012095451354980469, -0.010402679443359375, -0.008709907531738281, -0.0070171356201171875, -0.005324363708496094, -0.003631591796875, -0.0019388198852539062, -0.0002460479736328125, 0.0014467239379882812, 0.003139495849609375, 0.004832267761230469, 0.0065250396728515625, 0.008217811584472656, 0.00991058349609375, 0.011603355407714844, 0.013296127319335938, 0.014988899230957031, 0.016681671142578125, 0.01837444305419922, 0.020067214965820312, 0.021759986877441406, 0.0234527587890625, 0.025145530700683594, 0.026838302612304688, 0.02853107452392578, 0.030223846435546875, 0.03191661834716797, 0.03360939025878906, 0.035302162170410156, 0.03699493408203125, 0.038687705993652344, 0.04038047790527344, 0.04207324981689453, 0.043766021728515625, 0.04545879364013672, 0.04715156555175781, 0.048844337463378906, 0.050537109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 14.0, 10.0, 15.0, 27.0, 58.0, 83.0, 187.0, 322.0, 576.0, 1182.0, 2524.0, 5787.0, 14717.0, 49686.0, 350152.0, 3232218.0, 453030.0, 56420.0, 16001.0, 6000.0, 2681.0, 1231.0, 627.0, 343.0, 174.0, 70.0, 64.0, 28.0, 13.0, 12.0, 11.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08856201171875, -0.08613872528076172, -0.08371543884277344, -0.08129215240478516, -0.07886886596679688, -0.0764455795288086, -0.07402229309082031, -0.07159900665283203, -0.06917572021484375, -0.06675243377685547, -0.06432914733886719, -0.061905860900878906, -0.059482574462890625, -0.057059288024902344, -0.05463600158691406, -0.05221271514892578, -0.0497894287109375, -0.04736614227294922, -0.04494285583496094, -0.042519569396972656, -0.040096282958984375, -0.037672996520996094, -0.03524971008300781, -0.03282642364501953, -0.03040313720703125, -0.02797985076904297, -0.025556564331054688, -0.023133277893066406, -0.020709991455078125, -0.018286705017089844, -0.015863418579101562, -0.013440132141113281, -0.011016845703125, -0.008593559265136719, -0.0061702728271484375, -0.0037469863891601562, -0.001323699951171875, 0.0010995864868164062, 0.0035228729248046875, 0.005946159362792969, 0.00836944580078125, 0.010792732238769531, 0.013216018676757812, 0.015639305114746094, 0.018062591552734375, 0.020485877990722656, 0.022909164428710938, 0.02533245086669922, 0.0277557373046875, 0.03017902374267578, 0.03260231018066406, 0.035025596618652344, 0.037448883056640625, 0.039872169494628906, 0.04229545593261719, 0.04471874237060547, 0.04714202880859375, 0.04956531524658203, 0.05198860168457031, 0.054411888122558594, 0.056835174560546875, 0.059258460998535156, 0.06168174743652344, 0.06410503387451172, 0.0665283203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 7.0, 5.0, 10.0, 4.0, 11.0, 11.0, 25.0, 38.0, 49.0, 92.0, 141.0, 270.0, 513.0, 809.0, 824.0, 556.0, 267.0, 162.0, 86.0, 47.0, 36.0, 27.0, 20.0, 11.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0986328125, -0.09581851959228516, -0.09300422668457031, -0.09018993377685547, -0.08737564086914062, -0.08456134796142578, -0.08174705505371094, -0.0789327621459961, -0.07611846923828125, -0.0733041763305664, -0.07048988342285156, -0.06767559051513672, -0.06486129760742188, -0.06204700469970703, -0.05923271179199219, -0.056418418884277344, -0.0536041259765625, -0.050789833068847656, -0.04797554016113281, -0.04516124725341797, -0.042346954345703125, -0.03953266143798828, -0.03671836853027344, -0.033904075622558594, -0.03108978271484375, -0.028275489807128906, -0.025461196899414062, -0.02264690399169922, -0.019832611083984375, -0.01701831817626953, -0.014204025268554688, -0.011389732360839844, -0.008575439453125, -0.005761146545410156, -0.0029468536376953125, -0.00013256072998046875, 0.002681732177734375, 0.005496025085449219, 0.008310317993164062, 0.011124610900878906, 0.01393890380859375, 0.016753196716308594, 0.019567489624023438, 0.02238178253173828, 0.025196075439453125, 0.02801036834716797, 0.030824661254882812, 0.033638954162597656, 0.0364532470703125, 0.039267539978027344, 0.04208183288574219, 0.04489612579345703, 0.047710418701171875, 0.05052471160888672, 0.05333900451660156, 0.056153297424316406, 0.05896759033203125, 0.061781883239746094, 0.06459617614746094, 0.06741046905517578, 0.07022476196289062, 0.07303905487060547, 0.07585334777832031, 0.07866764068603516, 0.08148193359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 9.0, 16.0, 33.0, 71.0, 105.0, 182.0, 201.0, 178.0, 94.0, 57.0, 21.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7749538421630859, -0.7495549917221069, -0.7241561412811279, -0.6987572908401489, -0.6733584403991699, -0.6479595899581909, -0.6225607395172119, -0.5971618890762329, -0.5717630386352539, -0.5463641881942749, -0.5209653377532959, -0.4955664873123169, -0.4701676368713379, -0.4447687864303589, -0.4193699359893799, -0.3939710855484009, -0.36857226490974426, -0.34317341446876526, -0.31777456402778625, -0.29237571358680725, -0.26697686314582825, -0.24157802760601044, -0.21617917716503143, -0.19078032672405243, -0.16538147628307343, -0.13998262584209442, -0.11458377540111542, -0.08918493241071701, -0.063786081969738, -0.0383872389793396, -0.012988388538360596, 0.012410461902618408, 0.03780931234359741, 0.06320816278457642, 0.08860701322555542, 0.11400585621595383, 0.13940471410751343, 0.16480354964733124, 0.19020240008831024, 0.21560125052928925, 0.24100010097026825, 0.26639893651008606, 0.29179778695106506, 0.31719663739204407, 0.34259548783302307, 0.3679943382740021, 0.3933931887149811, 0.4187920391559601, 0.4441908895969391, 0.4695897400379181, 0.4949885904788971, 0.5203874111175537, 0.5457862615585327, 0.5711851119995117, 0.5965839624404907, 0.6219828128814697, 0.6473816633224487, 0.6727805137634277, 0.6981793642044067, 0.7235782146453857, 0.7489770650863647, 0.7743759155273438, 0.7997747659683228, 0.8251736164093018, 0.8505724668502808]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 7.0, 2.0, 10.0, 7.0, 11.0, 7.0, 11.0, 21.0, 25.0, 20.0, 29.0, 30.0, 28.0, 29.0, 32.0, 54.0, 44.0, 50.0, 54.0, 41.0, 51.0, 41.0, 47.0, 30.0, 37.0, 42.0, 37.0, 23.0, 25.0, 26.0, 34.0, 16.0, 22.0, 14.0, 10.0, 9.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3328278064727783, -0.3214702010154724, -0.3101125657558441, -0.2987549602985382, -0.2873973250389099, -0.276039719581604, -0.2646821141242981, -0.2533245086669922, -0.2419668734073639, -0.2306092530488968, -0.2192516326904297, -0.20789402723312378, -0.19653640687465668, -0.18517878651618958, -0.17382118105888367, -0.16246356070041656, -0.15110594034194946, -0.13974831998348236, -0.12839069962501526, -0.11703309416770935, -0.10567547380924225, -0.09431785345077515, -0.08296024054288864, -0.07160262763500214, -0.060245007276535034, -0.04888739064335823, -0.03752977401018143, -0.026172157377004623, -0.01481454074382782, -0.0034569241106510162, 0.007900692522525787, 0.019258305430412292, 0.030615925788879395, 0.0419735424220562, 0.053331159055233, 0.0646887719631195, 0.07604639232158661, 0.08740401268005371, 0.09876162558794022, 0.11011923849582672, 0.12147685885429382, 0.13283447921276093, 0.14419209957122803, 0.15554970502853394, 0.16690732538700104, 0.17826494574546814, 0.18962255120277405, 0.20098017156124115, 0.21233779191970825, 0.22369541227817535, 0.23505303263664246, 0.24641063809394836, 0.25776827335357666, 0.26912587881088257, 0.2804834842681885, 0.2918410897254944, 0.3031987249851227, 0.3145563304424286, 0.3259139657020569, 0.3372715711593628, 0.3486291766166687, 0.359986811876297, 0.3713444173336029, 0.3827020525932312, 0.3940596580505371]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 18.0, 33.0, 36.0, 72.0, 126.0, 199.0, 391.0, 789.0, 1783.0, 4530.0, 14863.0, 58231.0, 273485.0, 510653.0, 137702.0, 31440.0, 8671.0, 2974.0, 1244.0, 563.0, 307.0, 151.0, 91.0, 60.0, 33.0, 38.0, 19.0, 7.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.1485595703125, -0.14487171173095703, -0.14118385314941406, -0.1374959945678711, -0.13380813598632812, -0.13012027740478516, -0.1264324188232422, -0.12274456024169922, -0.11905670166015625, -0.11536884307861328, -0.11168098449707031, -0.10799312591552734, -0.10430526733398438, -0.1006174087524414, -0.09692955017089844, -0.09324169158935547, -0.0895538330078125, -0.08586597442626953, -0.08217811584472656, -0.0784902572631836, -0.07480239868164062, -0.07111454010009766, -0.06742668151855469, -0.06373882293701172, -0.06005096435546875, -0.05636310577392578, -0.05267524719238281, -0.048987388610839844, -0.045299530029296875, -0.041611671447753906, -0.03792381286621094, -0.03423595428466797, -0.030548095703125, -0.02686023712158203, -0.023172378540039062, -0.019484519958496094, -0.015796661376953125, -0.012108802795410156, -0.008420944213867188, -0.004733085632324219, -0.00104522705078125, 0.0026426315307617188, 0.0063304901123046875, 0.010018348693847656, 0.013706207275390625, 0.017394065856933594, 0.021081924438476562, 0.02476978302001953, 0.0284576416015625, 0.03214550018310547, 0.03583335876464844, 0.039521217346191406, 0.043209075927734375, 0.046896934509277344, 0.05058479309082031, 0.05427265167236328, 0.05796051025390625, 0.06164836883544922, 0.06533622741699219, 0.06902408599853516, 0.07271194458007812, 0.0763998031616211, 0.08008766174316406, 0.08377552032470703, 0.08746337890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 9.0, 9.0, 3.0, 17.0, 19.0, 27.0, 33.0, 42.0, 45.0, 41.0, 50.0, 47.0, 62.0, 51.0, 53.0, 57.0, 66.0, 54.0, 28.0, 46.0, 39.0, 38.0, 28.0, 32.0, 18.0, 14.0, 15.0, 15.0, 10.0, 11.0, 7.0, 6.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.057586669921875, -0.05577850341796875, -0.0539703369140625, -0.05216217041015625, -0.05035400390625, -0.04854583740234375, -0.0467376708984375, -0.04492950439453125, -0.043121337890625, -0.04131317138671875, -0.0395050048828125, -0.03769683837890625, -0.035888671875, -0.03408050537109375, -0.0322723388671875, -0.03046417236328125, -0.028656005859375, -0.02684783935546875, -0.0250396728515625, -0.02323150634765625, -0.02142333984375, -0.01961517333984375, -0.0178070068359375, -0.01599884033203125, -0.014190673828125, -0.01238250732421875, -0.0105743408203125, -0.00876617431640625, -0.0069580078125, -0.00514984130859375, -0.0033416748046875, -0.00153350830078125, 0.000274658203125, 0.00208282470703125, 0.0038909912109375, 0.00569915771484375, 0.00750732421875, 0.00931549072265625, 0.0111236572265625, 0.01293182373046875, 0.014739990234375, 0.01654815673828125, 0.0183563232421875, 0.02016448974609375, 0.02197265625, 0.02378082275390625, 0.0255889892578125, 0.02739715576171875, 0.029205322265625, 0.03101348876953125, 0.0328216552734375, 0.03462982177734375, 0.03643798828125, 0.03824615478515625, 0.0400543212890625, 0.04186248779296875, 0.043670654296875, 0.04547882080078125, 0.0472869873046875, 0.04909515380859375, 0.0509033203125, 0.05271148681640625, 0.0545196533203125, 0.05632781982421875, 0.058135986328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 13.0, 21.0, 18.0, 33.0, 40.0, 62.0, 113.0, 154.0, 277.0, 401.0, 736.0, 1496.0, 3507.0, 11718.0, 53379.0, 340368.0, 534156.0, 78406.0, 15485.0, 4475.0, 1682.0, 765.0, 468.0, 247.0, 163.0, 133.0, 72.0, 49.0, 37.0, 24.0, 10.0, 7.0, 8.0, 8.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1282958984375, -0.12430000305175781, -0.12030410766601562, -0.11630821228027344, -0.11231231689453125, -0.10831642150878906, -0.10432052612304688, -0.10032463073730469, -0.0963287353515625, -0.09233283996582031, -0.08833694458007812, -0.08434104919433594, -0.08034515380859375, -0.07634925842285156, -0.07235336303710938, -0.06835746765136719, -0.064361572265625, -0.06036567687988281, -0.056369781494140625, -0.05237388610839844, -0.04837799072265625, -0.04438209533691406, -0.040386199951171875, -0.03639030456542969, -0.0323944091796875, -0.028398513793945312, -0.024402618408203125, -0.020406723022460938, -0.01641082763671875, -0.012414932250976562, -0.008419036865234375, -0.0044231414794921875, -0.00042724609375, 0.0035686492919921875, 0.007564544677734375, 0.011560440063476562, 0.01555633544921875, 0.019552230834960938, 0.023548126220703125, 0.027544021606445312, 0.0315399169921875, 0.03553581237792969, 0.039531707763671875, 0.04352760314941406, 0.04752349853515625, 0.05151939392089844, 0.055515289306640625, 0.05951118469238281, 0.063507080078125, 0.06750297546386719, 0.07149887084960938, 0.07549476623535156, 0.07949066162109375, 0.08348655700683594, 0.08748245239257812, 0.09147834777832031, 0.0954742431640625, 0.09947013854980469, 0.10346603393554688, 0.10746192932128906, 0.11145782470703125, 0.11545372009277344, 0.11944961547851562, 0.12344551086425781, 0.12744140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 10.0, 13.0, 14.0, 18.0, 10.0, 22.0, 17.0, 33.0, 33.0, 27.0, 36.0, 38.0, 34.0, 52.0, 48.0, 49.0, 48.0, 39.0, 44.0, 47.0, 38.0, 48.0, 42.0, 31.0, 29.0, 27.0, 25.0, 21.0, 12.0, 29.0, 14.0, 13.0, 11.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.189453125, -0.1837482452392578, -0.17804336547851562, -0.17233848571777344, -0.16663360595703125, -0.16092872619628906, -0.15522384643554688, -0.1495189666748047, -0.1438140869140625, -0.1381092071533203, -0.13240432739257812, -0.12669944763183594, -0.12099456787109375, -0.11528968811035156, -0.10958480834960938, -0.10387992858886719, -0.098175048828125, -0.09247016906738281, -0.08676528930664062, -0.08106040954589844, -0.07535552978515625, -0.06965065002441406, -0.06394577026367188, -0.05824089050292969, -0.0525360107421875, -0.04683113098144531, -0.041126251220703125, -0.03542137145996094, -0.02971649169921875, -0.024011611938476562, -0.018306732177734375, -0.012601852416992188, -0.00689697265625, -0.0011920928955078125, 0.004512786865234375, 0.010217666625976562, 0.01592254638671875, 0.021627426147460938, 0.027332305908203125, 0.03303718566894531, 0.0387420654296875, 0.04444694519042969, 0.050151824951171875, 0.05585670471191406, 0.06156158447265625, 0.06726646423339844, 0.07297134399414062, 0.07867622375488281, 0.084381103515625, 0.09008598327636719, 0.09579086303710938, 0.10149574279785156, 0.10720062255859375, 0.11290550231933594, 0.11861038208007812, 0.12431526184082031, 0.1300201416015625, 0.1357250213623047, 0.14142990112304688, 0.14713478088378906, 0.15283966064453125, 0.15854454040527344, 0.16424942016601562, 0.1699542999267578, 0.1756591796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 10.0, 18.0, 20.0, 52.0, 97.0, 182.0, 660.0, 3368.0, 82264.0, 948829.0, 11123.0, 1294.0, 334.0, 128.0, 65.0, 36.0, 24.0, 16.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1495361328125, -0.14404869079589844, -0.13856124877929688, -0.1330738067626953, -0.12758636474609375, -0.12209892272949219, -0.11661148071289062, -0.11112403869628906, -0.1056365966796875, -0.10014915466308594, -0.09466171264648438, -0.08917427062988281, -0.08368682861328125, -0.07819938659667969, -0.07271194458007812, -0.06722450256347656, -0.061737060546875, -0.05624961853027344, -0.050762176513671875, -0.04527473449707031, -0.03978729248046875, -0.03429985046386719, -0.028812408447265625, -0.023324966430664062, -0.0178375244140625, -0.012350082397460938, -0.006862640380859375, -0.0013751983642578125, 0.00411224365234375, 0.009599685668945312, 0.015087127685546875, 0.020574569702148438, 0.02606201171875, 0.03154945373535156, 0.037036895751953125, 0.04252433776855469, 0.04801177978515625, 0.05349922180175781, 0.058986663818359375, 0.06447410583496094, 0.0699615478515625, 0.07544898986816406, 0.08093643188476562, 0.08642387390136719, 0.09191131591796875, 0.09739875793457031, 0.10288619995117188, 0.10837364196777344, 0.113861083984375, 0.11934852600097656, 0.12483596801757812, 0.1303234100341797, 0.13581085205078125, 0.1412982940673828, 0.14678573608398438, 0.15227317810058594, 0.1577606201171875, 0.16324806213378906, 0.16873550415039062, 0.1742229461669922, 0.17971038818359375, 0.1851978302001953, 0.19068527221679688, 0.19617271423339844, 0.20166015625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 8.0, 2.0, 5.0, 2.0, 14.0, 16.0, 13.0, 24.0, 33.0, 57.0, 47.0, 83.0, 125.0, 111.0, 110.0, 89.0, 69.0, 44.0, 32.0, 17.0, 20.0, 9.0, 7.0, 9.0, 9.0, 10.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.365776062011719e-05, -6.169266998767853e-05, -5.972757935523987e-05, -5.776248872280121e-05, -5.579739809036255e-05, -5.383230745792389e-05, -5.186721682548523e-05, -4.990212619304657e-05, -4.793703556060791e-05, -4.597194492816925e-05, -4.400685429573059e-05, -4.204176366329193e-05, -4.007667303085327e-05, -3.811158239841461e-05, -3.614649176597595e-05, -3.418140113353729e-05, -3.221631050109863e-05, -3.0251219868659973e-05, -2.8286129236221313e-05, -2.6321038603782654e-05, -2.4355947971343994e-05, -2.2390857338905334e-05, -2.0425766706466675e-05, -1.8460676074028015e-05, -1.6495585441589355e-05, -1.4530494809150696e-05, -1.2565404176712036e-05, -1.0600313544273376e-05, -8.635222911834717e-06, -6.670132279396057e-06, -4.7050416469573975e-06, -2.739951014518738e-06, -7.748603820800781e-07, 1.1902302503585815e-06, 3.155320882797241e-06, 5.120411515235901e-06, 7.0855021476745605e-06, 9.05059278011322e-06, 1.101568341255188e-05, 1.298077404499054e-05, 1.49458646774292e-05, 1.691095530986786e-05, 1.887604594230652e-05, 2.0841136574745178e-05, 2.2806227207183838e-05, 2.4771317839622498e-05, 2.6736408472061157e-05, 2.8701499104499817e-05, 3.0666589736938477e-05, 3.2631680369377136e-05, 3.4596771001815796e-05, 3.6561861634254456e-05, 3.8526952266693115e-05, 4.0492042899131775e-05, 4.2457133531570435e-05, 4.4422224164009094e-05, 4.6387314796447754e-05, 4.8352405428886414e-05, 5.031749606132507e-05, 5.228258669376373e-05, 5.424767732620239e-05, 5.621276795864105e-05, 5.817785859107971e-05, 6.014294922351837e-05, 6.210803985595703e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 9.0, 10.0, 12.0, 18.0, 29.0, 46.0, 90.0, 128.0, 190.0, 460.0, 938.0, 2644.0, 10156.0, 83169.0, 821811.0, 111573.0, 12183.0, 2928.0, 1083.0, 491.0, 210.0, 122.0, 94.0, 49.0, 31.0, 21.0, 17.0, 12.0, 5.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07403564453125, -0.07161235809326172, -0.06918907165527344, -0.06676578521728516, -0.06434249877929688, -0.061919212341308594, -0.05949592590332031, -0.05707263946533203, -0.05464935302734375, -0.05222606658935547, -0.04980278015136719, -0.047379493713378906, -0.044956207275390625, -0.042532920837402344, -0.04010963439941406, -0.03768634796142578, -0.0352630615234375, -0.03283977508544922, -0.030416488647460938, -0.027993202209472656, -0.025569915771484375, -0.023146629333496094, -0.020723342895507812, -0.01830005645751953, -0.01587677001953125, -0.013453483581542969, -0.011030197143554688, -0.008606910705566406, -0.006183624267578125, -0.0037603378295898438, -0.0013370513916015625, 0.0010862350463867188, 0.003509521484375, 0.005932807922363281, 0.008356094360351562, 0.010779380798339844, 0.013202667236328125, 0.015625953674316406, 0.018049240112304688, 0.02047252655029297, 0.02289581298828125, 0.02531909942626953, 0.027742385864257812, 0.030165672302246094, 0.032588958740234375, 0.035012245178222656, 0.03743553161621094, 0.03985881805419922, 0.0422821044921875, 0.04470539093017578, 0.04712867736816406, 0.049551963806152344, 0.051975250244140625, 0.054398536682128906, 0.05682182312011719, 0.05924510955810547, 0.06166839599609375, 0.06409168243408203, 0.06651496887207031, 0.0689382553100586, 0.07136154174804688, 0.07378482818603516, 0.07620811462402344, 0.07863140106201172, 0.0810546875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 7.0, 11.0, 9.0, 26.0, 25.0, 40.0, 47.0, 69.0, 75.0, 84.0, 113.0, 116.0, 88.0, 78.0, 63.0, 35.0, 29.0, 22.0, 15.0, 13.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07623291015625, -0.07431411743164062, -0.07239532470703125, -0.07047653198242188, -0.0685577392578125, -0.06663894653320312, -0.06472015380859375, -0.06280136108398438, -0.060882568359375, -0.058963775634765625, -0.05704498291015625, -0.055126190185546875, -0.0532073974609375, -0.051288604736328125, -0.04936981201171875, -0.047451019287109375, -0.0455322265625, -0.043613433837890625, -0.04169464111328125, -0.039775848388671875, -0.0378570556640625, -0.035938262939453125, -0.03401947021484375, -0.032100677490234375, -0.030181884765625, -0.028263092041015625, -0.02634429931640625, -0.024425506591796875, -0.0225067138671875, -0.020587921142578125, -0.01866912841796875, -0.016750335693359375, -0.01483154296875, -0.012912750244140625, -0.01099395751953125, -0.009075164794921875, -0.0071563720703125, -0.005237579345703125, -0.00331878662109375, -0.001399993896484375, 0.000518798828125, 0.002437591552734375, 0.00435638427734375, 0.006275177001953125, 0.0081939697265625, 0.010112762451171875, 0.01203155517578125, 0.013950347900390625, 0.015869140625, 0.017787933349609375, 0.01970672607421875, 0.021625518798828125, 0.0235443115234375, 0.025463104248046875, 0.02738189697265625, 0.029300689697265625, 0.031219482421875, 0.033138275146484375, 0.03505706787109375, 0.036975860595703125, 0.0388946533203125, 0.040813446044921875, 0.04273223876953125, 0.044651031494140625, 0.04656982421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 12.0, 13.0, 24.0, 70.0, 156.0, 304.0, 251.0, 94.0, 41.0, 12.0, 2.0, 6.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7678046226501465, -1.719799518585205, -1.6717944145202637, -1.6237893104553223, -1.5757842063903809, -1.5277791023254395, -1.479773998260498, -1.4317688941955566, -1.3837637901306152, -1.3357586860656738, -1.2877535820007324, -1.239748477935791, -1.1917433738708496, -1.1437382698059082, -1.0957331657409668, -1.0477280616760254, -0.999722957611084, -0.9517178535461426, -0.9037127494812012, -0.8557076454162598, -0.8077025413513184, -0.759697437286377, -0.7116923332214355, -0.6636872291564941, -0.6156821250915527, -0.5676770210266113, -0.5196719169616699, -0.4716668128967285, -0.4236617088317871, -0.3756566047668457, -0.3276515007019043, -0.2796463966369629, -0.23164129257202148, -0.18363618850708008, -0.13563108444213867, -0.08762598037719727, -0.03962087631225586, 0.008384227752685547, 0.05638933181762695, 0.10439443588256836, 0.15239953994750977, 0.20040464401245117, 0.24840974807739258, 0.296414852142334, 0.3444199562072754, 0.3924250602722168, 0.4404301643371582, 0.4884352684020996, 0.536440372467041, 0.5844454765319824, 0.6324505805969238, 0.6804556846618652, 0.7284607887268066, 0.776465892791748, 0.8244709968566895, 0.8724761009216309, 0.9204812049865723, 0.9684863090515137, 1.016491413116455, 1.0644965171813965, 1.112501621246338, 1.1605067253112793, 1.2085118293762207, 1.256516933441162, 1.3045220375061035]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 4.0, 2.0, 4.0, 3.0, 8.0, 5.0, 9.0, 11.0, 14.0, 13.0, 21.0, 23.0, 31.0, 21.0, 26.0, 33.0, 31.0, 32.0, 51.0, 46.0, 59.0, 66.0, 52.0, 58.0, 46.0, 40.0, 42.0, 26.0, 33.0, 26.0, 19.0, 15.0, 20.0, 14.0, 15.0, 15.0, 13.0, 16.0, 8.0, 17.0, 4.0, 8.0, 1.0, 1.0, 1.0, 4.0], "bins": [-0.903170108795166, -0.8807067275047302, -0.8582433462142944, -0.8357799053192139, -0.8133165240287781, -0.7908531427383423, -0.7683897018432617, -0.7459263205528259, -0.7234629392623901, -0.7009995579719543, -0.6785361766815186, -0.656072735786438, -0.6336093544960022, -0.6111459732055664, -0.5886825323104858, -0.56621915102005, -0.5437557697296143, -0.5212923884391785, -0.4988289773464203, -0.4763655662536621, -0.4539021849632263, -0.4314388036727905, -0.40897539258003235, -0.38651198148727417, -0.3640486001968384, -0.3415852189064026, -0.3191218078136444, -0.29665839672088623, -0.27419501543045044, -0.25173163414001465, -0.22926822304725647, -0.20680482685565948, -0.18434137105941772, -0.16187797486782074, -0.13941457867622375, -0.11695118248462677, -0.09448778629302979, -0.0720243901014328, -0.049560993909835815, -0.02709759771823883, -0.004634201526641846, 0.01782919466495514, 0.040292590856552124, 0.06275598704814911, 0.0852193832397461, 0.10768277943134308, 0.13014617562294006, 0.15260957181453705, 0.17507296800613403, 0.19753636419773102, 0.219999760389328, 0.242463156580925, 0.264926552772522, 0.28738993406295776, 0.30985334515571594, 0.3323167562484741, 0.3547801375389099, 0.3772435188293457, 0.3997069299221039, 0.42217034101486206, 0.44463372230529785, 0.46709710359573364, 0.4895605146884918, 0.51202392578125, 0.5344873070716858]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 12.0, 11.0, 11.0, 23.0, 32.0, 51.0, 86.0, 148.0, 251.0, 497.0, 1361.0, 4599.0, 28669.0, 907403.0, 3165293.0, 73280.0, 8867.0, 2144.0, 757.0, 365.0, 167.0, 101.0, 43.0, 40.0, 21.0, 23.0, 10.0, 10.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.12857341766357422, -0.12457847595214844, -0.12058353424072266, -0.11658859252929688, -0.1125936508178711, -0.10859870910644531, -0.10460376739501953, -0.10060882568359375, -0.09661388397216797, -0.09261894226074219, -0.0886240005493164, -0.08462905883789062, -0.08063411712646484, -0.07663917541503906, -0.07264423370361328, -0.0686492919921875, -0.06465435028076172, -0.06065940856933594, -0.056664466857910156, -0.052669525146484375, -0.048674583435058594, -0.04467964172363281, -0.04068470001220703, -0.03668975830078125, -0.03269481658935547, -0.028699874877929688, -0.024704933166503906, -0.020709991455078125, -0.016715049743652344, -0.012720108032226562, -0.008725166320800781, -0.004730224609375, -0.0007352828979492188, 0.0032596588134765625, 0.007254600524902344, 0.011249542236328125, 0.015244483947753906, 0.019239425659179688, 0.02323436737060547, 0.02722930908203125, 0.03122425079345703, 0.03521919250488281, 0.039214134216308594, 0.043209075927734375, 0.047204017639160156, 0.05119895935058594, 0.05519390106201172, 0.0591888427734375, 0.06318378448486328, 0.06717872619628906, 0.07117366790771484, 0.07516860961914062, 0.0791635513305664, 0.08315849304199219, 0.08715343475341797, 0.09114837646484375, 0.09514331817626953, 0.09913825988769531, 0.1031332015991211, 0.10712814331054688, 0.11112308502197266, 0.11511802673339844, 0.11911296844482422, 0.12310791015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 8.0, 10.0, 19.0, 21.0, 18.0, 33.0, 38.0, 41.0, 52.0, 55.0, 47.0, 64.0, 58.0, 57.0, 85.0, 62.0, 57.0, 41.0, 44.0, 38.0, 31.0, 31.0, 11.0, 21.0, 16.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063720703125, -0.06191253662109375, -0.0601043701171875, -0.05829620361328125, -0.056488037109375, -0.05467987060546875, -0.0528717041015625, -0.05106353759765625, -0.04925537109375, -0.04744720458984375, -0.0456390380859375, -0.04383087158203125, -0.042022705078125, -0.04021453857421875, -0.0384063720703125, -0.03659820556640625, -0.0347900390625, -0.03298187255859375, -0.0311737060546875, -0.02936553955078125, -0.027557373046875, -0.02574920654296875, -0.0239410400390625, -0.02213287353515625, -0.02032470703125, -0.01851654052734375, -0.0167083740234375, -0.01490020751953125, -0.013092041015625, -0.01128387451171875, -0.0094757080078125, -0.00766754150390625, -0.005859375, -0.00405120849609375, -0.0022430419921875, -0.00043487548828125, 0.001373291015625, 0.00318145751953125, 0.0049896240234375, 0.00679779052734375, 0.00860595703125, 0.01041412353515625, 0.0122222900390625, 0.01403045654296875, 0.015838623046875, 0.01764678955078125, 0.0194549560546875, 0.02126312255859375, 0.0230712890625, 0.02487945556640625, 0.0266876220703125, 0.02849578857421875, 0.030303955078125, 0.03211212158203125, 0.0339202880859375, 0.03572845458984375, 0.03753662109375, 0.03934478759765625, 0.0411529541015625, 0.04296112060546875, 0.044769287109375, 0.04657745361328125, 0.0483856201171875, 0.05019378662109375, 0.052001953125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 10.0, 13.0, 20.0, 31.0, 50.0, 89.0, 151.0, 283.0, 531.0, 1207.0, 3080.0, 9186.0, 42085.0, 415765.0, 3437137.0, 236815.0, 34017.0, 8625.0, 2743.0, 1144.0, 528.0, 282.0, 168.0, 105.0, 61.0, 45.0, 31.0, 21.0, 18.0, 16.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.12091064453125, -0.11784172058105469, -0.11477279663085938, -0.11170387268066406, -0.10863494873046875, -0.10556602478027344, -0.10249710083007812, -0.09942817687988281, -0.0963592529296875, -0.09329032897949219, -0.09022140502929688, -0.08715248107910156, -0.08408355712890625, -0.08101463317871094, -0.07794570922851562, -0.07487678527832031, -0.071807861328125, -0.06873893737792969, -0.06567001342773438, -0.06260108947753906, -0.05953216552734375, -0.05646324157714844, -0.053394317626953125, -0.05032539367675781, -0.0472564697265625, -0.04418754577636719, -0.041118621826171875, -0.03804969787597656, -0.03498077392578125, -0.03191184997558594, -0.028842926025390625, -0.025774002075195312, -0.022705078125, -0.019636154174804688, -0.016567230224609375, -0.013498306274414062, -0.01042938232421875, -0.0073604583740234375, -0.004291534423828125, -0.0012226104736328125, 0.0018463134765625, 0.0049152374267578125, 0.007984161376953125, 0.011053085327148438, 0.01412200927734375, 0.017190933227539062, 0.020259857177734375, 0.023328781127929688, 0.026397705078125, 0.029466629028320312, 0.032535552978515625, 0.03560447692871094, 0.03867340087890625, 0.04174232482910156, 0.044811248779296875, 0.04788017272949219, 0.0509490966796875, 0.05401802062988281, 0.057086944580078125, 0.06015586853027344, 0.06322479248046875, 0.06629371643066406, 0.06936264038085938, 0.07243156433105469, 0.07550048828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 8.0, 1.0, 7.0, 7.0, 10.0, 16.0, 20.0, 35.0, 75.0, 109.0, 205.0, 482.0, 831.0, 984.0, 553.0, 292.0, 166.0, 80.0, 60.0, 38.0, 25.0, 18.0, 16.0, 11.0, 9.0, 4.0, 2.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1046142578125, -0.10076904296875, -0.096923828125, -0.09307861328125, -0.0892333984375, -0.08538818359375, -0.08154296875, -0.07769775390625, -0.0738525390625, -0.07000732421875, -0.066162109375, -0.06231689453125, -0.0584716796875, -0.05462646484375, -0.05078125, -0.04693603515625, -0.0430908203125, -0.03924560546875, -0.035400390625, -0.03155517578125, -0.0277099609375, -0.02386474609375, -0.02001953125, -0.01617431640625, -0.0123291015625, -0.00848388671875, -0.004638671875, -0.00079345703125, 0.0030517578125, 0.00689697265625, 0.0107421875, 0.01458740234375, 0.0184326171875, 0.02227783203125, 0.026123046875, 0.02996826171875, 0.0338134765625, 0.03765869140625, 0.04150390625, 0.04534912109375, 0.0491943359375, 0.05303955078125, 0.056884765625, 0.06072998046875, 0.0645751953125, 0.06842041015625, 0.072265625, 0.07611083984375, 0.0799560546875, 0.08380126953125, 0.087646484375, 0.09149169921875, 0.0953369140625, 0.09918212890625, 0.10302734375, 0.10687255859375, 0.1107177734375, 0.11456298828125, 0.118408203125, 0.12225341796875, 0.1260986328125, 0.12994384765625, 0.1337890625, 0.13763427734375, 0.1414794921875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 4.0, 9.0, 14.0, 54.0, 122.0, 227.0, 218.0, 178.0, 94.0, 36.0, 12.0, 10.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1803889274597168, -1.1437506675720215, -1.1071122884750366, -1.0704739093780518, -1.0338356494903564, -0.9971973299980164, -0.9605590105056763, -0.9239206910133362, -0.8872823715209961, -0.850644052028656, -0.8140057325363159, -0.7773674130439758, -0.7407290935516357, -0.7040907740592957, -0.6674524545669556, -0.6308141350746155, -0.5941758155822754, -0.5575374960899353, -0.5208991765975952, -0.4842608571052551, -0.44762253761291504, -0.41098421812057495, -0.37434589862823486, -0.3377075791358948, -0.3010692596435547, -0.2644309401512146, -0.2277926206588745, -0.19115430116653442, -0.15451598167419434, -0.11787766218185425, -0.08123934268951416, -0.04460102319717407, -0.007962584495544434, 0.028675734996795654, 0.06531405448913574, 0.10195237398147583, 0.13859069347381592, 0.175229012966156, 0.2118673324584961, 0.24850565195083618, 0.28514397144317627, 0.32178229093551636, 0.35842061042785645, 0.39505892992019653, 0.4316972494125366, 0.4683355689048767, 0.5049738883972168, 0.5416122078895569, 0.578250527381897, 0.6148888468742371, 0.6515271663665771, 0.6881654858589172, 0.7248038053512573, 0.7614421248435974, 0.7980804443359375, 0.8347187638282776, 0.8713570833206177, 0.9079954028129578, 0.9446337223052979, 0.9812720417976379, 1.017910361289978, 1.054548740386963, 1.0911870002746582, 1.1278252601623535, 1.1644636392593384]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 10.0, 4.0, 14.0, 6.0, 7.0, 14.0, 21.0, 19.0, 30.0, 37.0, 22.0, 37.0, 47.0, 45.0, 51.0, 38.0, 51.0, 54.0, 50.0, 40.0, 39.0, 44.0, 47.0, 38.0, 41.0, 25.0, 31.0, 34.0, 21.0, 16.0, 21.0, 13.0, 5.0, 8.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43015140295028687, -0.41484224796295166, -0.39953309297561646, -0.38422393798828125, -0.36891478300094604, -0.35360562801361084, -0.33829647302627563, -0.32298731803894043, -0.3076781630516052, -0.29236900806427, -0.2770598530769348, -0.2617506980895996, -0.2464415431022644, -0.2311323881149292, -0.2158232182264328, -0.2005140632390976, -0.1852048933506012, -0.169895738363266, -0.1545865833759308, -0.13927742838859558, -0.12396826595067978, -0.10865911096334457, -0.09334994852542877, -0.07804079353809357, -0.06273163855075836, -0.04742248356342316, -0.03211332485079765, -0.01680416613817215, -0.0014950111508369446, 0.01381414383649826, 0.029123306274414062, 0.04443246126174927, 0.05974161624908447, 0.07505077123641968, 0.09035992622375488, 0.10566908866167068, 0.12097824364900589, 0.1362873911857605, 0.1515965610742569, 0.1669057160615921, 0.1822148710489273, 0.1975240260362625, 0.21283318102359772, 0.22814235091209412, 0.24345150589942932, 0.2587606608867645, 0.27406981587409973, 0.28937897086143494, 0.30468812584877014, 0.31999728083610535, 0.33530643582344055, 0.35061559081077576, 0.36592474579811096, 0.38123390078544617, 0.39654308557510376, 0.41185224056243896, 0.42716139554977417, 0.4424705505371094, 0.4577797055244446, 0.4730888605117798, 0.488398015499115, 0.5037071704864502, 0.5190163254737854, 0.5343254804611206, 0.5496346354484558]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 13.0, 12.0, 17.0, 26.0, 32.0, 56.0, 75.0, 103.0, 194.0, 311.0, 589.0, 1237.0, 2519.0, 5753.0, 14860.0, 44334.0, 136105.0, 329454.0, 319014.0, 127865.0, 41418.0, 13971.0, 5586.0, 2372.0, 1125.0, 596.0, 335.0, 213.0, 110.0, 78.0, 48.0, 36.0, 21.0, 18.0, 12.0, 12.0, 10.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0751953125, -0.0729818344116211, -0.07076835632324219, -0.06855487823486328, -0.06634140014648438, -0.06412792205810547, -0.06191444396972656, -0.059700965881347656, -0.05748748779296875, -0.055274009704589844, -0.05306053161621094, -0.05084705352783203, -0.048633575439453125, -0.04642009735107422, -0.04420661926269531, -0.041993141174316406, -0.0397796630859375, -0.037566184997558594, -0.03535270690917969, -0.03313922882080078, -0.030925750732421875, -0.02871227264404297, -0.026498794555664062, -0.024285316467285156, -0.02207183837890625, -0.019858360290527344, -0.017644882202148438, -0.015431404113769531, -0.013217926025390625, -0.011004447937011719, -0.008790969848632812, -0.006577491760253906, -0.004364013671875, -0.0021505355834960938, 6.29425048828125e-05, 0.0022764205932617188, 0.004489898681640625, 0.006703376770019531, 0.008916854858398438, 0.011130332946777344, 0.01334381103515625, 0.015557289123535156, 0.017770767211914062, 0.01998424530029297, 0.022197723388671875, 0.02441120147705078, 0.026624679565429688, 0.028838157653808594, 0.0310516357421875, 0.033265113830566406, 0.03547859191894531, 0.03769207000732422, 0.039905548095703125, 0.04211902618408203, 0.04433250427246094, 0.046545982360839844, 0.04875946044921875, 0.050972938537597656, 0.05318641662597656, 0.05539989471435547, 0.057613372802734375, 0.05982685089111328, 0.06204032897949219, 0.0642538070678711, 0.06646728515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 7.0, 7.0, 6.0, 11.0, 23.0, 27.0, 33.0, 34.0, 31.0, 47.0, 57.0, 55.0, 56.0, 58.0, 70.0, 56.0, 69.0, 47.0, 41.0, 45.0, 45.0, 38.0, 29.0, 30.0, 21.0, 17.0, 11.0, 10.0, 7.0, 10.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05609130859375, -0.05438089370727539, -0.05267047882080078, -0.05096006393432617, -0.04924964904785156, -0.04753923416137695, -0.045828819274902344, -0.044118404388427734, -0.042407989501953125, -0.040697574615478516, -0.038987159729003906, -0.0372767448425293, -0.03556632995605469, -0.03385591506958008, -0.03214550018310547, -0.03043508529663086, -0.02872467041015625, -0.02701425552368164, -0.02530384063720703, -0.023593425750732422, -0.021883010864257812, -0.020172595977783203, -0.018462181091308594, -0.016751766204833984, -0.015041351318359375, -0.013330936431884766, -0.011620521545410156, -0.009910106658935547, -0.008199691772460938, -0.006489276885986328, -0.004778861999511719, -0.0030684471130371094, -0.0013580322265625, 0.0003523826599121094, 0.0020627975463867188, 0.003773212432861328, 0.0054836273193359375, 0.007194042205810547, 0.008904457092285156, 0.010614871978759766, 0.012325286865234375, 0.014035701751708984, 0.015746116638183594, 0.017456531524658203, 0.019166946411132812, 0.020877361297607422, 0.02258777618408203, 0.02429819107055664, 0.02600860595703125, 0.02771902084350586, 0.02942943572998047, 0.031139850616455078, 0.03285026550292969, 0.0345606803894043, 0.036271095275878906, 0.037981510162353516, 0.039691925048828125, 0.041402339935302734, 0.043112754821777344, 0.04482316970825195, 0.04653358459472656, 0.04824399948120117, 0.04995441436767578, 0.05166482925415039, 0.053375244140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 13.0, 8.0, 19.0, 23.0, 31.0, 60.0, 47.0, 66.0, 103.0, 134.0, 178.0, 238.0, 327.0, 457.0, 672.0, 1206.0, 2367.0, 6929.0, 33164.0, 287837.0, 630394.0, 66140.0, 10794.0, 3241.0, 1394.0, 764.0, 533.0, 357.0, 268.0, 165.0, 138.0, 94.0, 109.0, 68.0, 48.0, 34.0, 28.0, 20.0, 23.0, 19.0, 6.0, 6.0, 6.0, 2.0, 6.0, 4.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.139892578125, -0.13579845428466797, -0.13170433044433594, -0.1276102066040039, -0.12351608276367188, -0.11942195892333984, -0.11532783508300781, -0.11123371124267578, -0.10713958740234375, -0.10304546356201172, -0.09895133972167969, -0.09485721588134766, -0.09076309204101562, -0.0866689682006836, -0.08257484436035156, -0.07848072052001953, -0.0743865966796875, -0.07029247283935547, -0.06619834899902344, -0.062104225158691406, -0.058010101318359375, -0.053915977478027344, -0.04982185363769531, -0.04572772979736328, -0.04163360595703125, -0.03753948211669922, -0.03344535827636719, -0.029351234436035156, -0.025257110595703125, -0.021162986755371094, -0.017068862915039062, -0.012974739074707031, -0.008880615234375, -0.004786491394042969, -0.0006923675537109375, 0.0034017562866210938, 0.007495880126953125, 0.011590003967285156, 0.015684127807617188, 0.01977825164794922, 0.02387237548828125, 0.02796649932861328, 0.03206062316894531, 0.036154747009277344, 0.040248870849609375, 0.044342994689941406, 0.04843711853027344, 0.05253124237060547, 0.0566253662109375, 0.06071949005126953, 0.06481361389160156, 0.0689077377319336, 0.07300186157226562, 0.07709598541259766, 0.08119010925292969, 0.08528423309326172, 0.08937835693359375, 0.09347248077392578, 0.09756660461425781, 0.10166072845458984, 0.10575485229492188, 0.1098489761352539, 0.11394309997558594, 0.11803722381591797, 0.12213134765625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 9.0, 17.0, 14.0, 20.0, 22.0, 24.0, 32.0, 25.0, 37.0, 42.0, 37.0, 55.0, 42.0, 62.0, 46.0, 59.0, 60.0, 54.0, 32.0, 33.0, 40.0, 39.0, 28.0, 25.0, 24.0, 23.0, 21.0, 14.0, 9.0, 9.0, 8.0, 7.0, 4.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2020263671875, -0.19610977172851562, -0.19019317626953125, -0.18427658081054688, -0.1783599853515625, -0.17244338989257812, -0.16652679443359375, -0.16061019897460938, -0.154693603515625, -0.14877700805664062, -0.14286041259765625, -0.13694381713867188, -0.1310272216796875, -0.12511062622070312, -0.11919403076171875, -0.11327743530273438, -0.10736083984375, -0.10144424438476562, -0.09552764892578125, -0.08961105346679688, -0.0836944580078125, -0.07777786254882812, -0.07186126708984375, -0.06594467163085938, -0.060028076171875, -0.054111480712890625, -0.04819488525390625, -0.042278289794921875, -0.0363616943359375, -0.030445098876953125, -0.02452850341796875, -0.018611907958984375, -0.0126953125, -0.006778717041015625, -0.00086212158203125, 0.005054473876953125, 0.0109710693359375, 0.016887664794921875, 0.02280426025390625, 0.028720855712890625, 0.034637451171875, 0.040554046630859375, 0.04647064208984375, 0.052387237548828125, 0.0583038330078125, 0.06422042846679688, 0.07013702392578125, 0.07605361938476562, 0.08197021484375, 0.08788681030273438, 0.09380340576171875, 0.09972000122070312, 0.1056365966796875, 0.11155319213867188, 0.11746978759765625, 0.12338638305664062, 0.129302978515625, 0.13521957397460938, 0.14113616943359375, 0.14705276489257812, 0.1529693603515625, 0.15888595581054688, 0.16480255126953125, 0.17071914672851562, 0.1766357421875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 12.0, 26.0, 24.0, 37.0, 51.0, 76.0, 106.0, 197.0, 302.0, 439.0, 791.0, 1479.0, 3067.0, 7660.0, 25500.0, 153989.0, 725289.0, 98382.0, 19181.0, 6185.0, 2598.0, 1294.0, 693.0, 397.0, 234.0, 155.0, 106.0, 81.0, 37.0, 39.0, 29.0, 23.0, 12.0, 6.0, 12.0, 6.0, 1.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.050079345703125, -0.04857969284057617, -0.047080039978027344, -0.045580387115478516, -0.04408073425292969, -0.04258108139038086, -0.04108142852783203, -0.0395817756652832, -0.038082122802734375, -0.03658246994018555, -0.03508281707763672, -0.03358316421508789, -0.03208351135253906, -0.030583858489990234, -0.029084205627441406, -0.027584552764892578, -0.02608489990234375, -0.024585247039794922, -0.023085594177246094, -0.021585941314697266, -0.020086288452148438, -0.01858663558959961, -0.01708698272705078, -0.015587329864501953, -0.014087677001953125, -0.012588024139404297, -0.011088371276855469, -0.00958871841430664, -0.008089065551757812, -0.006589412689208984, -0.005089759826660156, -0.003590106964111328, -0.0020904541015625, -0.0005908012390136719, 0.0009088516235351562, 0.0024085044860839844, 0.0039081573486328125, 0.005407810211181641, 0.006907463073730469, 0.008407115936279297, 0.009906768798828125, 0.011406421661376953, 0.012906074523925781, 0.01440572738647461, 0.015905380249023438, 0.017405033111572266, 0.018904685974121094, 0.020404338836669922, 0.02190399169921875, 0.023403644561767578, 0.024903297424316406, 0.026402950286865234, 0.027902603149414062, 0.02940225601196289, 0.03090190887451172, 0.03240156173706055, 0.033901214599609375, 0.0354008674621582, 0.03690052032470703, 0.03840017318725586, 0.03989982604980469, 0.041399478912353516, 0.042899131774902344, 0.04439878463745117, 0.0458984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 17.0, 10.0, 8.0, 21.0, 33.0, 19.0, 30.0, 53.0, 64.0, 79.0, 79.0, 95.0, 82.0, 72.0, 55.0, 46.0, 31.0, 34.0, 23.0, 30.0, 19.0, 13.0, 13.0, 17.0, 3.0, 9.0, 8.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8100948333740234e-05, -4.640314728021622e-05, -4.47053462266922e-05, -4.300754517316818e-05, -4.1309744119644165e-05, -3.961194306612015e-05, -3.791414201259613e-05, -3.621634095907211e-05, -3.4518539905548096e-05, -3.282073885202408e-05, -3.112293779850006e-05, -2.9425136744976044e-05, -2.7727335691452026e-05, -2.602953463792801e-05, -2.4331733584403992e-05, -2.2633932530879974e-05, -2.0936131477355957e-05, -1.923833042383194e-05, -1.7540529370307922e-05, -1.5842728316783905e-05, -1.4144927263259888e-05, -1.244712620973587e-05, -1.0749325156211853e-05, -9.051524102687836e-06, -7.353723049163818e-06, -5.655921995639801e-06, -3.958120942115784e-06, -2.2603198885917664e-06, -5.62518835067749e-07, 1.1352822184562683e-06, 2.8330832719802856e-06, 4.530884325504303e-06, 6.22868537902832e-06, 7.926486432552338e-06, 9.624287486076355e-06, 1.1322088539600372e-05, 1.301988959312439e-05, 1.4717690646648407e-05, 1.6415491700172424e-05, 1.811329275369644e-05, 1.981109380722046e-05, 2.1508894860744476e-05, 2.3206695914268494e-05, 2.490449696779251e-05, 2.660229802131653e-05, 2.8300099074840546e-05, 2.9997900128364563e-05, 3.169570118188858e-05, 3.33935022354126e-05, 3.5091303288936615e-05, 3.678910434246063e-05, 3.848690539598465e-05, 4.018470644950867e-05, 4.1882507503032684e-05, 4.35803085565567e-05, 4.527810961008072e-05, 4.6975910663604736e-05, 4.8673711717128754e-05, 5.037151277065277e-05, 5.206931382417679e-05, 5.3767114877700806e-05, 5.546491593122482e-05, 5.716271698474884e-05, 5.886051803827286e-05, 6.0558319091796875e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 3.0, 3.0, 6.0, 12.0, 17.0, 30.0, 28.0, 48.0, 62.0, 110.0, 159.0, 235.0, 387.0, 634.0, 1206.0, 2500.0, 5773.0, 16373.0, 70354.0, 648981.0, 245729.0, 37083.0, 10543.0, 3998.0, 1911.0, 881.0, 536.0, 317.0, 193.0, 135.0, 83.0, 60.0, 47.0, 32.0, 17.0, 19.0, 11.0, 7.0, 9.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0494384765625, -0.047976016998291016, -0.04651355743408203, -0.04505109786987305, -0.04358863830566406, -0.04212617874145508, -0.040663719177246094, -0.03920125961303711, -0.037738800048828125, -0.03627634048461914, -0.034813880920410156, -0.03335142135620117, -0.03188896179199219, -0.030426502227783203, -0.02896404266357422, -0.027501583099365234, -0.02603912353515625, -0.024576663970947266, -0.02311420440673828, -0.021651744842529297, -0.020189285278320312, -0.018726825714111328, -0.017264366149902344, -0.01580190658569336, -0.014339447021484375, -0.01287698745727539, -0.011414527893066406, -0.009952068328857422, -0.008489608764648438, -0.007027149200439453, -0.005564689636230469, -0.004102230072021484, -0.0026397705078125, -0.0011773109436035156, 0.00028514862060546875, 0.0017476081848144531, 0.0032100677490234375, 0.004672527313232422, 0.006134986877441406, 0.007597446441650391, 0.009059906005859375, 0.01052236557006836, 0.011984825134277344, 0.013447284698486328, 0.014909744262695312, 0.016372203826904297, 0.01783466339111328, 0.019297122955322266, 0.02075958251953125, 0.022222042083740234, 0.02368450164794922, 0.025146961212158203, 0.026609420776367188, 0.028071880340576172, 0.029534339904785156, 0.03099679946899414, 0.032459259033203125, 0.03392171859741211, 0.035384178161621094, 0.03684663772583008, 0.03830909729003906, 0.03977155685424805, 0.04123401641845703, 0.042696475982666016, 0.044158935546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 7.0, 7.0, 8.0, 14.0, 20.0, 16.0, 31.0, 26.0, 57.0, 47.0, 81.0, 89.0, 103.0, 104.0, 93.0, 62.0, 47.0, 47.0, 26.0, 17.0, 16.0, 11.0, 11.0, 7.0, 8.0, 7.0, 5.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0517578125, -0.050074100494384766, -0.04839038848876953, -0.0467066764831543, -0.04502296447753906, -0.04333925247192383, -0.041655540466308594, -0.03997182846069336, -0.038288116455078125, -0.03660440444946289, -0.034920692443847656, -0.03323698043823242, -0.03155326843261719, -0.029869556427001953, -0.02818584442138672, -0.026502132415771484, -0.02481842041015625, -0.023134708404541016, -0.02145099639892578, -0.019767284393310547, -0.018083572387695312, -0.016399860382080078, -0.014716148376464844, -0.01303243637084961, -0.011348724365234375, -0.00966501235961914, -0.007981300354003906, -0.006297588348388672, -0.0046138763427734375, -0.002930164337158203, -0.0012464523315429688, 0.0004372596740722656, 0.0021209716796875, 0.0038046836853027344, 0.005488395690917969, 0.007172107696533203, 0.008855819702148438, 0.010539531707763672, 0.012223243713378906, 0.01390695571899414, 0.015590667724609375, 0.01727437973022461, 0.018958091735839844, 0.020641803741455078, 0.022325515747070312, 0.024009227752685547, 0.02569293975830078, 0.027376651763916016, 0.02906036376953125, 0.030744075775146484, 0.03242778778076172, 0.03411149978637695, 0.03579521179199219, 0.03747892379760742, 0.039162635803222656, 0.04084634780883789, 0.042530059814453125, 0.04421377182006836, 0.045897483825683594, 0.04758119583129883, 0.04926490783691406, 0.0509486198425293, 0.05263233184814453, 0.054316043853759766, 0.055999755859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 13.0, 16.0, 26.0, 39.0, 76.0, 122.0, 172.0, 210.0, 131.0, 77.0, 46.0, 22.0, 17.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8503308296203613, -0.8212739825248718, -0.7922171354293823, -0.7631603479385376, -0.7341035008430481, -0.7050466537475586, -0.6759898066520691, -0.6469329595565796, -0.6178761124610901, -0.5888192653656006, -0.5597624182701111, -0.5307055711746216, -0.5016487836837769, -0.47259193658828735, -0.44353508949279785, -0.41447824239730835, -0.38542142510414124, -0.35636457800865173, -0.3273077607154846, -0.2982509136199951, -0.2691940665245056, -0.2401372343301773, -0.211080402135849, -0.1820235550403595, -0.1529667228460312, -0.12390988320112228, -0.09485304355621338, -0.06579621136188507, -0.036739371716976166, -0.007682532072067261, 0.021374300122261047, 0.05043114721775055, 0.07948797941207886, 0.10854481905698776, 0.13760165870189667, 0.16665849089622498, 0.19571533799171448, 0.22477217018604279, 0.2538290023803711, 0.2828858494758606, 0.3119426965713501, 0.3409995436668396, 0.3700563609600067, 0.3991132080554962, 0.4281700551509857, 0.45722687244415283, 0.48628371953964233, 0.5153405666351318, 0.5443973541259766, 0.5734542012214661, 0.6025110483169556, 0.6315678358078003, 0.6606246829032898, 0.6896815299987793, 0.7187383770942688, 0.7477952241897583, 0.7768520712852478, 0.8059089183807373, 0.8349657654762268, 0.8640226125717163, 0.893079400062561, 0.9221362471580505, 0.95119309425354, 0.9802499413490295, 1.009306788444519]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 5.0, 4.0, 8.0, 9.0, 6.0, 10.0, 9.0, 15.0, 17.0, 12.0, 19.0, 16.0, 22.0, 19.0, 23.0, 38.0, 30.0, 25.0, 36.0, 41.0, 45.0, 61.0, 65.0, 54.0, 45.0, 38.0, 30.0, 28.0, 29.0, 23.0, 25.0, 23.0, 26.0, 15.0, 18.0, 21.0, 13.0, 13.0, 16.0, 7.0, 10.0, 12.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.69630366563797, -0.675903856754303, -0.655504047870636, -0.6351042985916138, -0.6147044897079468, -0.5943046808242798, -0.5739048719406128, -0.5535050630569458, -0.5331052541732788, -0.5127054452896118, -0.4923056662082672, -0.4719058573246002, -0.4515060782432556, -0.4311062693595886, -0.41070646047592163, -0.39030665159225464, -0.3699069023132324, -0.34950709342956543, -0.3291073143482208, -0.30870750546455383, -0.28830772638320923, -0.26790791749954224, -0.24750810861587524, -0.22710831463336945, -0.20670852065086365, -0.18630872666835785, -0.16590893268585205, -0.14550912380218506, -0.12510932981967926, -0.10470953583717346, -0.08430973440408707, -0.06390993297100067, -0.04351013898849487, -0.023110341280698776, -0.0027105435729026794, 0.017689254134893417, 0.038089051842689514, 0.05848884582519531, 0.07888864725828171, 0.0992884486913681, 0.1196882426738739, 0.1400880366563797, 0.1604878306388855, 0.1808876395225525, 0.2012874335050583, 0.2216872274875641, 0.24208703637123108, 0.2624868154525757, 0.2828866243362427, 0.30328643321990967, 0.3236862123012543, 0.34408602118492126, 0.36448580026626587, 0.38488560914993286, 0.40528541803359985, 0.42568522691726685, 0.44608500599861145, 0.46648481488227844, 0.48688459396362305, 0.50728440284729, 0.527684211730957, 0.548084020614624, 0.5684837698936462, 0.5888835787773132, 0.6092833876609802]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 12.0, 6.0, 9.0, 16.0, 31.0, 44.0, 62.0, 118.0, 207.0, 403.0, 907.0, 2834.0, 14025.0, 155696.0, 3362285.0, 618506.0, 30987.0, 5414.0, 1548.0, 571.0, 253.0, 125.0, 85.0, 52.0, 34.0, 14.0, 12.0, 8.0, 4.0, 4.0, 7.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1251220703125, -0.12171173095703125, -0.1183013916015625, -0.11489105224609375, -0.111480712890625, -0.10807037353515625, -0.1046600341796875, -0.10124969482421875, -0.09783935546875, -0.09442901611328125, -0.0910186767578125, -0.08760833740234375, -0.084197998046875, -0.08078765869140625, -0.0773773193359375, -0.07396697998046875, -0.070556640625, -0.06714630126953125, -0.0637359619140625, -0.06032562255859375, -0.056915283203125, -0.05350494384765625, -0.0500946044921875, -0.04668426513671875, -0.04327392578125, -0.03986358642578125, -0.0364532470703125, -0.03304290771484375, -0.029632568359375, -0.02622222900390625, -0.0228118896484375, -0.01940155029296875, -0.0159912109375, -0.01258087158203125, -0.0091705322265625, -0.00576019287109375, -0.002349853515625, 0.00106048583984375, 0.0044708251953125, 0.00788116455078125, 0.01129150390625, 0.01470184326171875, 0.0181121826171875, 0.02152252197265625, 0.024932861328125, 0.02834320068359375, 0.0317535400390625, 0.03516387939453125, 0.03857421875, 0.04198455810546875, 0.0453948974609375, 0.04880523681640625, 0.052215576171875, 0.05562591552734375, 0.0590362548828125, 0.06244659423828125, 0.06585693359375, 0.06926727294921875, 0.0726776123046875, 0.07608795166015625, 0.079498291015625, 0.08290863037109375, 0.0863189697265625, 0.08972930908203125, 0.0931396484375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 10.0, 8.0, 12.0, 17.0, 30.0, 28.0, 24.0, 44.0, 47.0, 55.0, 52.0, 60.0, 62.0, 72.0, 54.0, 58.0, 61.0, 52.0, 40.0, 36.0, 53.0, 28.0, 16.0, 18.0, 14.0, 7.0, 14.0, 13.0, 8.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05767822265625, -0.05597400665283203, -0.05426979064941406, -0.052565574645996094, -0.050861358642578125, -0.049157142639160156, -0.04745292663574219, -0.04574871063232422, -0.04404449462890625, -0.04234027862548828, -0.04063606262207031, -0.038931846618652344, -0.037227630615234375, -0.035523414611816406, -0.03381919860839844, -0.03211498260498047, -0.0304107666015625, -0.02870655059814453, -0.027002334594726562, -0.025298118591308594, -0.023593902587890625, -0.021889686584472656, -0.020185470581054688, -0.01848125457763672, -0.01677703857421875, -0.015072822570800781, -0.013368606567382812, -0.011664390563964844, -0.009960174560546875, -0.008255958557128906, -0.0065517425537109375, -0.004847526550292969, -0.003143310546875, -0.0014390945434570312, 0.0002651214599609375, 0.0019693374633789062, 0.003673553466796875, 0.005377769470214844, 0.0070819854736328125, 0.008786201477050781, 0.01049041748046875, 0.012194633483886719, 0.013898849487304688, 0.015603065490722656, 0.017307281494140625, 0.019011497497558594, 0.020715713500976562, 0.02241992950439453, 0.0241241455078125, 0.02582836151123047, 0.027532577514648438, 0.029236793518066406, 0.030941009521484375, 0.032645225524902344, 0.03434944152832031, 0.03605365753173828, 0.03775787353515625, 0.03946208953857422, 0.04116630554199219, 0.042870521545410156, 0.044574737548828125, 0.046278953552246094, 0.04798316955566406, 0.04968738555908203, 0.0513916015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 6.0, 12.0, 20.0, 27.0, 48.0, 55.0, 95.0, 152.0, 254.0, 477.0, 1023.0, 3601.0, 40601.0, 3873735.0, 261684.0, 9702.0, 1706.0, 570.0, 249.0, 118.0, 54.0, 46.0, 18.0, 13.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1923828125, -0.18650054931640625, -0.1806182861328125, -0.17473602294921875, -0.168853759765625, -0.16297149658203125, -0.1570892333984375, -0.15120697021484375, -0.14532470703125, -0.13944244384765625, -0.1335601806640625, -0.12767791748046875, -0.121795654296875, -0.11591339111328125, -0.1100311279296875, -0.10414886474609375, -0.0982666015625, -0.09238433837890625, -0.0865020751953125, -0.08061981201171875, -0.074737548828125, -0.06885528564453125, -0.0629730224609375, -0.05709075927734375, -0.05120849609375, -0.04532623291015625, -0.0394439697265625, -0.03356170654296875, -0.027679443359375, -0.02179718017578125, -0.0159149169921875, -0.01003265380859375, -0.004150390625, 0.00173187255859375, 0.0076141357421875, 0.01349639892578125, 0.019378662109375, 0.02526092529296875, 0.0311431884765625, 0.03702545166015625, 0.04290771484375, 0.04878997802734375, 0.0546722412109375, 0.06055450439453125, 0.066436767578125, 0.07231903076171875, 0.0782012939453125, 0.08408355712890625, 0.0899658203125, 0.09584808349609375, 0.1017303466796875, 0.10761260986328125, 0.113494873046875, 0.11937713623046875, 0.1252593994140625, 0.13114166259765625, 0.13702392578125, 0.14290618896484375, 0.1487884521484375, 0.15467071533203125, 0.160552978515625, 0.16643524169921875, 0.1723175048828125, 0.17819976806640625, 0.18408203125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 17.0, 27.0, 75.0, 240.0, 912.0, 1735.0, 718.0, 186.0, 83.0, 35.0, 19.0, 8.0, 6.0, 1.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.305419921875, -0.2983741760253906, -0.29132843017578125, -0.2842826843261719, -0.2772369384765625, -0.2701911926269531, -0.26314544677734375, -0.2560997009277344, -0.249053955078125, -0.24200820922851562, -0.23496246337890625, -0.22791671752929688, -0.2208709716796875, -0.21382522583007812, -0.20677947998046875, -0.19973373413085938, -0.19268798828125, -0.18564224243164062, -0.17859649658203125, -0.17155075073242188, -0.1645050048828125, -0.15745925903320312, -0.15041351318359375, -0.14336776733398438, -0.136322021484375, -0.12927627563476562, -0.12223052978515625, -0.11518478393554688, -0.1081390380859375, -0.10109329223632812, -0.09404754638671875, -0.08700180053710938, -0.0799560546875, -0.07291030883789062, -0.06586456298828125, -0.058818817138671875, -0.0517730712890625, -0.044727325439453125, -0.03768157958984375, -0.030635833740234375, -0.023590087890625, -0.016544342041015625, -0.00949859619140625, -0.002452850341796875, 0.0045928955078125, 0.011638641357421875, 0.01868438720703125, 0.025730133056640625, 0.03277587890625, 0.039821624755859375, 0.04686737060546875, 0.053913116455078125, 0.0609588623046875, 0.06800460815429688, 0.07505035400390625, 0.08209609985351562, 0.089141845703125, 0.09618759155273438, 0.10323333740234375, 0.11027908325195312, 0.1173248291015625, 0.12437057495117188, 0.13141632080078125, 0.13846206665039062, 0.1455078125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 11.0, 41.0, 138.0, 333.0, 313.0, 105.0, 34.0, 12.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1615586280822754, -2.1046102046966553, -2.047661781311035, -1.9907134771347046, -1.9337650537490845, -1.876816749572754, -1.8198683261871338, -1.7629199028015137, -1.705971598625183, -1.649023175239563, -1.5920748710632324, -1.5351264476776123, -1.4781780242919922, -1.4212297201156616, -1.3642812967300415, -1.307332992553711, -1.2503845691680908, -1.1934361457824707, -1.1364878416061401, -1.07953941822052, -1.0225909948349, -0.9656426906585693, -0.9086942672729492, -0.8517459034919739, -0.794797420501709, -0.7378490567207336, -0.6809006333351135, -0.6239522695541382, -0.5670039057731628, -0.5100555419921875, -0.4531071186065674, -0.39615875482559204, -0.3392103910446167, -0.28226199746131897, -0.22531363368034363, -0.1683652400970459, -0.11141686141490936, -0.05446848273277283, 0.0024799108505249023, 0.059428274631500244, 0.11637666821479797, 0.1733250468969345, 0.23027342557907104, 0.2872218191623688, 0.3441702127456665, 0.40111857652664185, 0.4580669701099396, 0.5150153636932373, 0.5719637274742126, 0.628912091255188, 0.6858605146408081, 0.7428088784217834, 0.7997572422027588, 0.8567056655883789, 0.9136540293693542, 0.9706023931503296, 1.0275508165359497, 1.0844992399215698, 1.1414475440979004, 1.1983959674835205, 1.2553443908691406, 1.3122926950454712, 1.3692411184310913, 1.4261894226074219, 1.483137845993042]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 8.0, 8.0, 14.0, 13.0, 17.0, 23.0, 14.0, 41.0, 31.0, 38.0, 43.0, 46.0, 45.0, 51.0, 45.0, 56.0, 66.0, 47.0, 50.0, 44.0, 39.0, 38.0, 44.0, 36.0, 22.0, 22.0, 22.0, 11.0, 19.0, 17.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5158400535583496, -0.49775493144989014, -0.47966980934143066, -0.4615846872329712, -0.44349953532218933, -0.42541441321372986, -0.4073292911052704, -0.3892441391944885, -0.37115901708602905, -0.3530738949775696, -0.3349887728691101, -0.31690365076065063, -0.2988184988498688, -0.2807333767414093, -0.26264825463294983, -0.24456311762332916, -0.22647801041603088, -0.2083928883075714, -0.19030775129795074, -0.17222262918949127, -0.1541374921798706, -0.13605237007141113, -0.11796724796295166, -0.099882110953331, -0.08179698884487152, -0.06371185928583145, -0.04562673345208168, -0.02754160761833191, -0.00945647805929184, 0.00862865149974823, 0.026713773608207703, 0.04479891061782837, 0.06288403272628784, 0.08096916228532791, 0.09905429184436798, 0.11713941395282745, 0.13522455096244812, 0.1533096730709076, 0.17139479517936707, 0.18947993218898773, 0.2075650542974472, 0.22565017640590668, 0.24373531341552734, 0.2618204355239868, 0.2799055576324463, 0.29799067974090576, 0.31607580184936523, 0.3341609537601471, 0.35224607586860657, 0.37033119797706604, 0.3884163200855255, 0.4065014719963074, 0.42458659410476685, 0.4426717162132263, 0.4607568383216858, 0.47884196043014526, 0.49692708253860474, 0.5150122046470642, 0.5330973267555237, 0.5511824488639832, 0.5692675709724426, 0.5873527526855469, 0.6054378747940063, 0.6235229969024658, 0.6416081190109253]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 7.0, 4.0, 9.0, 7.0, 10.0, 7.0, 7.0, 11.0, 13.0, 21.0, 23.0, 44.0, 41.0, 67.0, 89.0, 151.0, 196.0, 310.0, 582.0, 939.0, 1682.0, 3445.0, 7237.0, 15926.0, 38825.0, 93447.0, 212771.0, 320383.0, 200166.0, 86838.0, 36091.0, 15102.0, 6790.0, 3265.0, 1660.0, 920.0, 487.0, 290.0, 204.0, 130.0, 104.0, 64.0, 59.0, 38.0, 25.0, 17.0, 14.0, 8.0, 7.0, 8.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.06671142578125, -0.06477546691894531, -0.06283950805664062, -0.06090354919433594, -0.05896759033203125, -0.05703163146972656, -0.055095672607421875, -0.05315971374511719, -0.0512237548828125, -0.04928779602050781, -0.047351837158203125, -0.04541587829589844, -0.04347991943359375, -0.04154396057128906, -0.039608001708984375, -0.03767204284667969, -0.035736083984375, -0.03380012512207031, -0.031864166259765625, -0.029928207397460938, -0.02799224853515625, -0.026056289672851562, -0.024120330810546875, -0.022184371948242188, -0.0202484130859375, -0.018312454223632812, -0.016376495361328125, -0.014440536499023438, -0.01250457763671875, -0.010568618774414062, -0.008632659912109375, -0.0066967010498046875, -0.0047607421875, -0.0028247833251953125, -0.000888824462890625, 0.0010471343994140625, 0.00298309326171875, 0.0049190521240234375, 0.006855010986328125, 0.008790969848632812, 0.0107269287109375, 0.012662887573242188, 0.014598846435546875, 0.016534805297851562, 0.01847076416015625, 0.020406723022460938, 0.022342681884765625, 0.024278640747070312, 0.026214599609375, 0.028150558471679688, 0.030086517333984375, 0.03202247619628906, 0.03395843505859375, 0.03589439392089844, 0.037830352783203125, 0.03976631164550781, 0.0417022705078125, 0.04363822937011719, 0.045574188232421875, 0.04751014709472656, 0.04944610595703125, 0.05138206481933594, 0.053318023681640625, 0.05525398254394531, 0.05718994140625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 5.0, 5.0, 23.0, 11.0, 18.0, 34.0, 38.0, 34.0, 26.0, 32.0, 46.0, 32.0, 52.0, 58.0, 48.0, 68.0, 52.0, 54.0, 59.0, 39.0, 46.0, 32.0, 38.0, 22.0, 26.0, 22.0, 14.0, 22.0, 8.0, 8.0, 10.0, 3.0, 6.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052520751953125, -0.05090045928955078, -0.04928016662597656, -0.047659873962402344, -0.046039581298828125, -0.044419288635253906, -0.04279899597167969, -0.04117870330810547, -0.03955841064453125, -0.03793811798095703, -0.03631782531738281, -0.034697532653808594, -0.033077239990234375, -0.031456947326660156, -0.029836654663085938, -0.02821636199951172, -0.0265960693359375, -0.02497577667236328, -0.023355484008789062, -0.021735191345214844, -0.020114898681640625, -0.018494606018066406, -0.016874313354492188, -0.015254020690917969, -0.01363372802734375, -0.012013435363769531, -0.010393142700195312, -0.008772850036621094, -0.007152557373046875, -0.005532264709472656, -0.0039119720458984375, -0.0022916793823242188, -0.00067138671875, 0.0009489059448242188, 0.0025691986083984375, 0.004189491271972656, 0.005809783935546875, 0.007430076599121094, 0.009050369262695312, 0.010670661926269531, 0.01229095458984375, 0.013911247253417969, 0.015531539916992188, 0.017151832580566406, 0.018772125244140625, 0.020392417907714844, 0.022012710571289062, 0.02363300323486328, 0.0252532958984375, 0.02687358856201172, 0.028493881225585938, 0.030114173889160156, 0.031734466552734375, 0.033354759216308594, 0.03497505187988281, 0.03659534454345703, 0.03821563720703125, 0.03983592987060547, 0.04145622253417969, 0.043076515197753906, 0.044696807861328125, 0.046317100524902344, 0.04793739318847656, 0.04955768585205078, 0.051177978515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 10.0, 11.0, 21.0, 13.0, 24.0, 23.0, 37.0, 59.0, 72.0, 81.0, 99.0, 142.0, 215.0, 285.0, 450.0, 641.0, 1110.0, 2448.0, 7037.0, 33503.0, 262600.0, 646482.0, 73402.0, 12250.0, 3541.0, 1458.0, 772.0, 446.0, 337.0, 275.0, 167.0, 141.0, 87.0, 83.0, 38.0, 56.0, 34.0, 20.0, 19.0, 15.0, 10.0, 9.0, 5.0, 6.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.150390625, -0.1458606719970703, -0.14133071899414062, -0.13680076599121094, -0.13227081298828125, -0.12774085998535156, -0.12321090698242188, -0.11868095397949219, -0.1141510009765625, -0.10962104797363281, -0.10509109497070312, -0.10056114196777344, -0.09603118896484375, -0.09150123596191406, -0.08697128295898438, -0.08244132995605469, -0.077911376953125, -0.07338142395019531, -0.06885147094726562, -0.06432151794433594, -0.05979156494140625, -0.05526161193847656, -0.050731658935546875, -0.04620170593261719, -0.0416717529296875, -0.03714179992675781, -0.032611846923828125, -0.028081893920898438, -0.02355194091796875, -0.019021987915039062, -0.014492034912109375, -0.009962081909179688, -0.00543212890625, -0.0009021759033203125, 0.003627777099609375, 0.008157730102539062, 0.01268768310546875, 0.017217636108398438, 0.021747589111328125, 0.026277542114257812, 0.0308074951171875, 0.03533744812011719, 0.039867401123046875, 0.04439735412597656, 0.04892730712890625, 0.05345726013183594, 0.057987213134765625, 0.06251716613769531, 0.067047119140625, 0.07157707214355469, 0.07610702514648438, 0.08063697814941406, 0.08516693115234375, 0.08969688415527344, 0.09422683715820312, 0.09875679016113281, 0.1032867431640625, 0.10781669616699219, 0.11234664916992188, 0.11687660217285156, 0.12140655517578125, 0.12593650817871094, 0.13046646118164062, 0.1349964141845703, 0.1395263671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 14.0, 11.0, 15.0, 16.0, 17.0, 15.0, 20.0, 26.0, 36.0, 38.0, 41.0, 49.0, 46.0, 53.0, 51.0, 59.0, 43.0, 51.0, 53.0, 49.0, 39.0, 36.0, 32.0, 26.0, 31.0, 24.0, 22.0, 16.0, 9.0, 15.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.211181640625, -0.20487403869628906, -0.19856643676757812, -0.1922588348388672, -0.18595123291015625, -0.1796436309814453, -0.17333602905273438, -0.16702842712402344, -0.1607208251953125, -0.15441322326660156, -0.14810562133789062, -0.1417980194091797, -0.13549041748046875, -0.1291828155517578, -0.12287521362304688, -0.11656761169433594, -0.110260009765625, -0.10395240783691406, -0.09764480590820312, -0.09133720397949219, -0.08502960205078125, -0.07872200012207031, -0.07241439819335938, -0.06610679626464844, -0.0597991943359375, -0.05349159240722656, -0.047183990478515625, -0.04087638854980469, -0.03456878662109375, -0.028261184692382812, -0.021953582763671875, -0.015645980834960938, -0.00933837890625, -0.0030307769775390625, 0.003276824951171875, 0.009584426879882812, 0.01589202880859375, 0.022199630737304688, 0.028507232666015625, 0.03481483459472656, 0.0411224365234375, 0.04743003845214844, 0.053737640380859375, 0.06004524230957031, 0.06635284423828125, 0.07266044616699219, 0.07896804809570312, 0.08527565002441406, 0.091583251953125, 0.09789085388183594, 0.10419845581054688, 0.11050605773925781, 0.11681365966796875, 0.12312126159667969, 0.12942886352539062, 0.13573646545410156, 0.1420440673828125, 0.14835166931152344, 0.15465927124023438, 0.1609668731689453, 0.16727447509765625, 0.1735820770263672, 0.17988967895507812, 0.18619728088378906, 0.1925048828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 9.0, 12.0, 9.0, 15.0, 28.0, 41.0, 44.0, 72.0, 112.0, 178.0, 389.0, 872.0, 2218.0, 7203.0, 32598.0, 257733.0, 665212.0, 64396.0, 11659.0, 3345.0, 1219.0, 498.0, 276.0, 136.0, 95.0, 49.0, 39.0, 12.0, 18.0, 11.0, 21.0, 7.0, 8.0, 0.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044921875, -0.04326915740966797, -0.04161643981933594, -0.039963722229003906, -0.038311004638671875, -0.036658287048339844, -0.03500556945800781, -0.03335285186767578, -0.03170013427734375, -0.03004741668701172, -0.028394699096679688, -0.026741981506347656, -0.025089263916015625, -0.023436546325683594, -0.021783828735351562, -0.02013111114501953, -0.0184783935546875, -0.01682567596435547, -0.015172958374023438, -0.013520240783691406, -0.011867523193359375, -0.010214805603027344, -0.008562088012695312, -0.006909370422363281, -0.00525665283203125, -0.0036039352416992188, -0.0019512176513671875, -0.00029850006103515625, 0.001354217529296875, 0.0030069351196289062, 0.0046596527099609375, 0.006312370300292969, 0.007965087890625, 0.009617805480957031, 0.011270523071289062, 0.012923240661621094, 0.014575958251953125, 0.016228675842285156, 0.017881393432617188, 0.01953411102294922, 0.02118682861328125, 0.02283954620361328, 0.024492263793945312, 0.026144981384277344, 0.027797698974609375, 0.029450416564941406, 0.031103134155273438, 0.03275585174560547, 0.0344085693359375, 0.03606128692626953, 0.03771400451660156, 0.039366722106933594, 0.041019439697265625, 0.042672157287597656, 0.04432487487792969, 0.04597759246826172, 0.04763031005859375, 0.04928302764892578, 0.05093574523925781, 0.052588462829589844, 0.054241180419921875, 0.055893898010253906, 0.05754661560058594, 0.05919933319091797, 0.06085205078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 6.0, 1.0, 10.0, 4.0, 6.0, 5.0, 16.0, 13.0, 19.0, 17.0, 21.0, 41.0, 35.0, 47.0, 68.0, 82.0, 82.0, 89.0, 85.0, 76.0, 57.0, 40.0, 32.0, 25.0, 21.0, 14.0, 11.0, 10.0, 15.0, 8.0, 8.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4955482482910156e-05, -5.327444523572922e-05, -5.159340798854828e-05, -4.991237074136734e-05, -4.82313334941864e-05, -4.655029624700546e-05, -4.4869258999824524e-05, -4.3188221752643585e-05, -4.1507184505462646e-05, -3.982614725828171e-05, -3.814511001110077e-05, -3.646407276391983e-05, -3.478303551673889e-05, -3.310199826955795e-05, -3.1420961022377014e-05, -2.9739923775196075e-05, -2.8058886528015137e-05, -2.6377849280834198e-05, -2.469681203365326e-05, -2.301577478647232e-05, -2.1334737539291382e-05, -1.9653700292110443e-05, -1.7972663044929504e-05, -1.6291625797748566e-05, -1.4610588550567627e-05, -1.2929551303386688e-05, -1.124851405620575e-05, -9.56747680902481e-06, -7.886439561843872e-06, -6.205402314662933e-06, -4.524365067481995e-06, -2.843327820301056e-06, -1.1622905731201172e-06, 5.187466740608215e-07, 2.1997839212417603e-06, 3.880821168422699e-06, 5.561858415603638e-06, 7.242895662784576e-06, 8.923932909965515e-06, 1.0604970157146454e-05, 1.2286007404327393e-05, 1.3967044651508331e-05, 1.564808189868927e-05, 1.732911914587021e-05, 1.9010156393051147e-05, 2.0691193640232086e-05, 2.2372230887413025e-05, 2.4053268134593964e-05, 2.5734305381774902e-05, 2.741534262895584e-05, 2.909637987613678e-05, 3.077741712331772e-05, 3.245845437049866e-05, 3.4139491617679596e-05, 3.5820528864860535e-05, 3.7501566112041473e-05, 3.918260335922241e-05, 4.086364060640335e-05, 4.254467785358429e-05, 4.422571510076523e-05, 4.590675234794617e-05, 4.7587789595127106e-05, 4.9268826842308044e-05, 5.094986408948898e-05, 5.263090133666992e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 7.0, 13.0, 11.0, 13.0, 21.0, 34.0, 39.0, 56.0, 102.0, 141.0, 213.0, 417.0, 658.0, 1362.0, 3076.0, 9031.0, 38111.0, 238498.0, 642100.0, 88249.0, 17172.0, 4981.0, 1986.0, 999.0, 472.0, 274.0, 171.0, 100.0, 56.0, 58.0, 45.0, 23.0, 10.0, 12.0, 12.0, 8.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04541015625, -0.04404401779174805, -0.042677879333496094, -0.04131174087524414, -0.03994560241699219, -0.038579463958740234, -0.03721332550048828, -0.03584718704223633, -0.034481048583984375, -0.03311491012573242, -0.03174877166748047, -0.030382633209228516, -0.029016494750976562, -0.02765035629272461, -0.026284217834472656, -0.024918079376220703, -0.02355194091796875, -0.022185802459716797, -0.020819664001464844, -0.01945352554321289, -0.018087387084960938, -0.016721248626708984, -0.015355110168457031, -0.013988971710205078, -0.012622833251953125, -0.011256694793701172, -0.009890556335449219, -0.008524417877197266, -0.0071582794189453125, -0.005792140960693359, -0.004426002502441406, -0.003059864044189453, -0.0016937255859375, -0.0003275871276855469, 0.0010385513305664062, 0.0024046897888183594, 0.0037708282470703125, 0.005136966705322266, 0.006503105163574219, 0.007869243621826172, 0.009235382080078125, 0.010601520538330078, 0.011967658996582031, 0.013333797454833984, 0.014699935913085938, 0.01606607437133789, 0.017432212829589844, 0.018798351287841797, 0.02016448974609375, 0.021530628204345703, 0.022896766662597656, 0.02426290512084961, 0.025629043579101562, 0.026995182037353516, 0.02836132049560547, 0.029727458953857422, 0.031093597412109375, 0.03245973587036133, 0.03382587432861328, 0.035192012786865234, 0.03655815124511719, 0.03792428970336914, 0.039290428161621094, 0.04065656661987305, 0.042022705078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 6.0, 16.0, 13.0, 21.0, 21.0, 24.0, 48.0, 63.0, 84.0, 71.0, 121.0, 117.0, 96.0, 73.0, 55.0, 57.0, 34.0, 20.0, 17.0, 8.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06011962890625, -0.05824708938598633, -0.056374549865722656, -0.054502010345458984, -0.05262947082519531, -0.05075693130493164, -0.04888439178466797, -0.0470118522644043, -0.045139312744140625, -0.04326677322387695, -0.04139423370361328, -0.03952169418334961, -0.03764915466308594, -0.035776615142822266, -0.033904075622558594, -0.03203153610229492, -0.03015899658203125, -0.028286457061767578, -0.026413917541503906, -0.024541378021240234, -0.022668838500976562, -0.02079629898071289, -0.01892375946044922, -0.017051219940185547, -0.015178680419921875, -0.013306140899658203, -0.011433601379394531, -0.00956106185913086, -0.0076885223388671875, -0.005815982818603516, -0.003943443298339844, -0.002070903778076172, -0.0001983642578125, 0.0016741752624511719, 0.0035467147827148438, 0.005419254302978516, 0.0072917938232421875, 0.00916433334350586, 0.011036872863769531, 0.012909412384033203, 0.014781951904296875, 0.016654491424560547, 0.01852703094482422, 0.02039957046508789, 0.022272109985351562, 0.024144649505615234, 0.026017189025878906, 0.027889728546142578, 0.02976226806640625, 0.03163480758666992, 0.033507347106933594, 0.035379886627197266, 0.03725242614746094, 0.03912496566772461, 0.04099750518798828, 0.04287004470825195, 0.044742584228515625, 0.0466151237487793, 0.04848766326904297, 0.05036020278930664, 0.05223274230957031, 0.054105281829833984, 0.055977821350097656, 0.05785036087036133, 0.059722900390625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 9.0, 19.0, 29.0, 52.0, 127.0, 268.0, 242.0, 121.0, 57.0, 39.0, 15.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.650573968887329, -1.612048864364624, -1.573523759841919, -1.5349985361099243, -1.4964734315872192, -1.4579483270645142, -1.4194231033325195, -1.3808979988098145, -1.3423728942871094, -1.3038477897644043, -1.2653226852416992, -1.2267974615097046, -1.1882723569869995, -1.1497472524642944, -1.1112220287322998, -1.0726969242095947, -1.0341718196868896, -0.9956467151641846, -0.9571215510368347, -0.9185963869094849, -0.8800712823867798, -0.8415461778640747, -0.8030210137367249, -0.764495849609375, -0.7259707450866699, -0.6874456405639648, -0.648920476436615, -0.6103953123092651, -0.5718702077865601, -0.533345103263855, -0.4948199391365051, -0.45629480481147766, -0.41776978969573975, -0.3792446553707123, -0.3407195210456848, -0.30219438672065735, -0.2636692523956299, -0.22514411807060242, -0.18661898374557495, -0.14809384942054749, -0.10956871509552002, -0.07104358077049255, -0.03251844644546509, 0.006006687879562378, 0.044531822204589844, 0.08305695652961731, 0.12158209085464478, 0.16010722517967224, 0.1986323595046997, 0.23715749382972717, 0.27568262815475464, 0.3142077624797821, 0.35273289680480957, 0.39125803112983704, 0.4297831654548645, 0.46830829977989197, 0.5068334341049194, 0.5453585386276245, 0.5838837027549744, 0.6224088668823242, 0.6609339714050293, 0.6994590759277344, 0.7379842400550842, 0.7765094041824341, 0.8150345087051392]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 11.0, 9.0, 11.0, 17.0, 15.0, 13.0, 15.0, 17.0, 26.0, 35.0, 34.0, 39.0, 55.0, 47.0, 63.0, 73.0, 71.0, 66.0, 40.0, 44.0, 24.0, 33.0, 38.0, 25.0, 18.0, 24.0, 21.0, 18.0, 12.0, 20.0, 8.0, 10.0, 5.0, 7.0, 6.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8334423899650574, -0.8065979480743408, -0.7797535061836243, -0.7529090642929077, -0.7260646224021912, -0.6992201805114746, -0.6723757386207581, -0.6455312967300415, -0.618686854839325, -0.5918424129486084, -0.5649979710578918, -0.5381535291671753, -0.5113090872764587, -0.4844646453857422, -0.45762020349502563, -0.4307757616043091, -0.4039313495159149, -0.37708690762519836, -0.3502424657344818, -0.32339802384376526, -0.2965535819530487, -0.26970916986465454, -0.2428647130727768, -0.21602027118206024, -0.1891758292913437, -0.16233138740062714, -0.13548694550991058, -0.10864251106977463, -0.08179806917905807, -0.05495363473892212, -0.028109192848205566, -0.0012647509574890137, 0.02557969093322754, 0.05242413282394409, 0.07926857471466064, 0.1061130091547966, 0.13295745849609375, 0.1598018854856491, 0.18664632737636566, 0.21349076926708221, 0.24033521115779877, 0.2671796381473541, 0.2940240800380707, 0.32086852192878723, 0.3477129638195038, 0.37455740571022034, 0.4014018476009369, 0.42824628949165344, 0.45509073138237, 0.48193517327308655, 0.5087795853614807, 0.5356240272521973, 0.5624684691429138, 0.5893129110336304, 0.6161573529243469, 0.6430017948150635, 0.66984623670578, 0.6966906785964966, 0.7235351204872131, 0.7503795623779297, 0.7772240042686462, 0.8040684461593628, 0.8309128880500793, 0.8577573299407959, 0.8846017718315125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 11.0, 10.0, 15.0, 16.0, 29.0, 35.0, 40.0, 63.0, 95.0, 117.0, 240.0, 326.0, 806.0, 2063.0, 7139.0, 43033.0, 857723.0, 3083012.0, 174945.0, 17554.0, 4187.0, 1424.0, 588.0, 296.0, 155.0, 128.0, 65.0, 40.0, 35.0, 24.0, 20.0, 13.0, 11.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.09661865234375, -0.09371471405029297, -0.09081077575683594, -0.0879068374633789, -0.08500289916992188, -0.08209896087646484, -0.07919502258300781, -0.07629108428955078, -0.07338714599609375, -0.07048320770263672, -0.06757926940917969, -0.06467533111572266, -0.061771392822265625, -0.058867454528808594, -0.05596351623535156, -0.05305957794189453, -0.0501556396484375, -0.04725170135498047, -0.04434776306152344, -0.041443824768066406, -0.038539886474609375, -0.035635948181152344, -0.03273200988769531, -0.02982807159423828, -0.02692413330078125, -0.02402019500732422, -0.021116256713867188, -0.018212318420410156, -0.015308380126953125, -0.012404441833496094, -0.009500503540039062, -0.006596565246582031, -0.003692626953125, -0.0007886886596679688, 0.0021152496337890625, 0.005019187927246094, 0.007923126220703125, 0.010827064514160156, 0.013731002807617188, 0.01663494110107422, 0.01953887939453125, 0.02244281768798828, 0.025346755981445312, 0.028250694274902344, 0.031154632568359375, 0.034058570861816406, 0.03696250915527344, 0.03986644744873047, 0.0427703857421875, 0.04567432403564453, 0.04857826232910156, 0.051482200622558594, 0.054386138916015625, 0.057290077209472656, 0.06019401550292969, 0.06309795379638672, 0.06600189208984375, 0.06890583038330078, 0.07180976867675781, 0.07471370697021484, 0.07761764526367188, 0.0805215835571289, 0.08342552185058594, 0.08632946014404297, 0.0892333984375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 8.0, 10.0, 24.0, 23.0, 35.0, 32.0, 28.0, 41.0, 32.0, 44.0, 48.0, 62.0, 58.0, 51.0, 59.0, 53.0, 56.0, 56.0, 39.0, 38.0, 42.0, 26.0, 26.0, 27.0, 21.0, 11.0, 6.0, 11.0, 7.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051177978515625, -0.04956626892089844, -0.047954559326171875, -0.04634284973144531, -0.04473114013671875, -0.04311943054199219, -0.041507720947265625, -0.03989601135253906, -0.0382843017578125, -0.03667259216308594, -0.035060882568359375, -0.03344917297363281, -0.03183746337890625, -0.030225753784179688, -0.028614044189453125, -0.027002334594726562, -0.025390625, -0.023778915405273438, -0.022167205810546875, -0.020555496215820312, -0.01894378662109375, -0.017332077026367188, -0.015720367431640625, -0.014108657836914062, -0.0124969482421875, -0.010885238647460938, -0.009273529052734375, -0.0076618194580078125, -0.00605010986328125, -0.0044384002685546875, -0.002826690673828125, -0.0012149810791015625, 0.000396728515625, 0.0020084381103515625, 0.003620147705078125, 0.0052318572998046875, 0.00684356689453125, 0.008455276489257812, 0.010066986083984375, 0.011678695678710938, 0.0132904052734375, 0.014902114868164062, 0.016513824462890625, 0.018125534057617188, 0.01973724365234375, 0.021348953247070312, 0.022960662841796875, 0.024572372436523438, 0.02618408203125, 0.027795791625976562, 0.029407501220703125, 0.031019210815429688, 0.03263092041015625, 0.03424263000488281, 0.035854339599609375, 0.03746604919433594, 0.0390777587890625, 0.04068946838378906, 0.042301177978515625, 0.04391288757324219, 0.04552459716796875, 0.04713630676269531, 0.048748016357421875, 0.05035972595214844, 0.051971435546875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 7.0, 3.0, 25.0, 25.0, 41.0, 72.0, 140.0, 210.0, 416.0, 883.0, 2868.0, 27296.0, 3593056.0, 554934.0, 10929.0, 1871.0, 674.0, 346.0, 198.0, 107.0, 60.0, 33.0, 24.0, 25.0, 10.0, 10.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.195068359375, -0.18912696838378906, -0.18318557739257812, -0.1772441864013672, -0.17130279541015625, -0.1653614044189453, -0.15942001342773438, -0.15347862243652344, -0.1475372314453125, -0.14159584045410156, -0.13565444946289062, -0.1297130584716797, -0.12377166748046875, -0.11783027648925781, -0.11188888549804688, -0.10594749450683594, -0.100006103515625, -0.09406471252441406, -0.08812332153320312, -0.08218193054199219, -0.07624053955078125, -0.07029914855957031, -0.06435775756835938, -0.05841636657714844, -0.0524749755859375, -0.04653358459472656, -0.040592193603515625, -0.03465080261230469, -0.02870941162109375, -0.022768020629882812, -0.016826629638671875, -0.010885238647460938, -0.00494384765625, 0.0009975433349609375, 0.006938934326171875, 0.012880325317382812, 0.01882171630859375, 0.024763107299804688, 0.030704498291015625, 0.03664588928222656, 0.0425872802734375, 0.04852867126464844, 0.054470062255859375, 0.06041145324707031, 0.06635284423828125, 0.07229423522949219, 0.07823562622070312, 0.08417701721191406, 0.090118408203125, 0.09605979919433594, 0.10200119018554688, 0.10794258117675781, 0.11388397216796875, 0.11982536315917969, 0.12576675415039062, 0.13170814514160156, 0.1376495361328125, 0.14359092712402344, 0.14953231811523438, 0.1554737091064453, 0.16141510009765625, 0.1673564910888672, 0.17329788208007812, 0.17923927307128906, 0.1851806640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 8.0, 17.0, 14.0, 40.0, 59.0, 184.0, 457.0, 1080.0, 1254.0, 563.0, 209.0, 81.0, 56.0, 16.0, 9.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1292724609375, -0.12430953979492188, -0.11934661865234375, -0.11438369750976562, -0.1094207763671875, -0.10445785522460938, -0.09949493408203125, -0.09453201293945312, -0.089569091796875, -0.08460617065429688, -0.07964324951171875, -0.07468032836914062, -0.0697174072265625, -0.06475448608398438, -0.05979156494140625, -0.054828643798828125, -0.04986572265625, -0.044902801513671875, -0.03993988037109375, -0.034976959228515625, -0.0300140380859375, -0.025051116943359375, -0.02008819580078125, -0.015125274658203125, -0.010162353515625, -0.005199432373046875, -0.00023651123046875, 0.004726409912109375, 0.0096893310546875, 0.014652252197265625, 0.01961517333984375, 0.024578094482421875, 0.029541015625, 0.034503936767578125, 0.03946685791015625, 0.044429779052734375, 0.0493927001953125, 0.054355621337890625, 0.05931854248046875, 0.06428146362304688, 0.069244384765625, 0.07420730590820312, 0.07917022705078125, 0.08413314819335938, 0.0890960693359375, 0.09405899047851562, 0.09902191162109375, 0.10398483276367188, 0.10894775390625, 0.11391067504882812, 0.11887359619140625, 0.12383651733398438, 0.1287994384765625, 0.13376235961914062, 0.13872528076171875, 0.14368820190429688, 0.148651123046875, 0.15361404418945312, 0.15857696533203125, 0.16353988647460938, 0.1685028076171875, 0.17346572875976562, 0.17842864990234375, 0.18339157104492188, 0.1883544921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 6.0, 10.0, 12.0, 24.0, 75.0, 151.0, 258.0, 269.0, 123.0, 49.0, 16.0, 10.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5752570629119873, -0.534039318561554, -0.4928215444087982, -0.45160380005836487, -0.41038602590560913, -0.3691682815551758, -0.32795053720474243, -0.2867327630519867, -0.24551501870155334, -0.2042972594499588, -0.16307950019836426, -0.12186175584793091, -0.08064399659633636, -0.03942623734474182, 0.0017915070056915283, 0.043009281158447266, 0.08422702550888062, 0.12544478476047516, 0.1666625440120697, 0.20788028836250305, 0.2490980476140976, 0.29031580686569214, 0.3315335512161255, 0.3727513253688812, 0.4139690697193146, 0.4551868140697479, 0.49640458822250366, 0.537622332572937, 0.5788400769233704, 0.6200578212738037, 0.6612756252288818, 0.7024933695793152, 0.7437111139297485, 0.7849288582801819, 0.8261466026306152, 0.8673644065856934, 0.9085821509361267, 0.9497998952865601, 0.9910176396369934, 1.0322353839874268, 1.0734531879425049, 1.114670991897583, 1.1558886766433716, 1.1971064805984497, 1.2383241653442383, 1.2795419692993164, 1.3207597732543945, 1.361977458000183, 1.4031951427459717, 1.4444129467010498, 1.4856306314468384, 1.5268484354019165, 1.568066120147705, 1.6092839241027832, 1.6505017280578613, 1.69171941280365, 1.732937216758728, 1.7741550207138062, 1.8153727054595947, 1.8565905094146729, 1.8978081941604614, 1.9390259981155396, 1.9802436828613281, 2.0214614868164062, 2.0626792907714844]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 15.0, 19.0, 27.0, 27.0, 44.0, 39.0, 52.0, 52.0, 66.0, 57.0, 75.0, 69.0, 57.0, 59.0, 51.0, 57.0, 44.0, 38.0, 26.0, 28.0, 16.0, 18.0, 16.0, 5.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38207244873046875, -0.3666575253009796, -0.35124263167381287, -0.33582770824432373, -0.3204127848148346, -0.30499786138534546, -0.2895829677581787, -0.2741680443286896, -0.25875312089920044, -0.2433382123708725, -0.22792328894138336, -0.21250838041305542, -0.19709345698356628, -0.18167854845523834, -0.1662636399269104, -0.15084871649742126, -0.13543380796909332, -0.12001889199018478, -0.10460397601127625, -0.0891890674829483, -0.07377414405345917, -0.058359235525131226, -0.04294431954622269, -0.027529403567314148, -0.012114487588405609, 0.003300427459180355, 0.01871534250676632, 0.03413025662302971, 0.04954517260193825, 0.06496008485555649, 0.08037500083446503, 0.09578991681337357, 0.1112048327922821, 0.12661974132061005, 0.14203466475009918, 0.15744957327842712, 0.17286449670791626, 0.1882794052362442, 0.20369431376457214, 0.21910923719406128, 0.23452416062355042, 0.24993906915187836, 0.2653539776802063, 0.28076890110969543, 0.29618382453918457, 0.3115987181663513, 0.32701364159584045, 0.3424285650253296, 0.35784345865249634, 0.3732583820819855, 0.3886732757091522, 0.40408819913864136, 0.4195031225681305, 0.43491804599761963, 0.4503329396247864, 0.4657478630542755, 0.48116278648376465, 0.4965777099132538, 0.5119926333427429, 0.5274075269699097, 0.5428224205970764, 0.5582373738288879, 0.5736522674560547, 0.5890672206878662, 0.604482114315033]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 3.0, 5.0, 5.0, 4.0, 0.0, 4.0, 11.0, 18.0, 9.0, 27.0, 30.0, 53.0, 62.0, 126.0, 222.0, 420.0, 838.0, 1999.0, 4716.0, 13340.0, 44066.0, 164321.0, 422907.0, 280593.0, 79425.0, 22653.0, 7422.0, 2747.0, 1177.0, 596.0, 264.0, 175.0, 107.0, 59.0, 52.0, 30.0, 22.0, 13.0, 11.0, 6.0, 10.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.0977783203125, -0.09504127502441406, -0.09230422973632812, -0.08956718444824219, -0.08683013916015625, -0.08409309387207031, -0.08135604858398438, -0.07861900329589844, -0.0758819580078125, -0.07314491271972656, -0.07040786743164062, -0.06767082214355469, -0.06493377685546875, -0.06219673156738281, -0.059459686279296875, -0.05672264099121094, -0.053985595703125, -0.05124855041503906, -0.048511505126953125, -0.04577445983886719, -0.04303741455078125, -0.04030036926269531, -0.037563323974609375, -0.03482627868652344, -0.0320892333984375, -0.029352188110351562, -0.026615142822265625, -0.023878097534179688, -0.02114105224609375, -0.018404006958007812, -0.015666961669921875, -0.012929916381835938, -0.01019287109375, -0.0074558258056640625, -0.004718780517578125, -0.0019817352294921875, 0.00075531005859375, 0.0034923553466796875, 0.006229400634765625, 0.008966445922851562, 0.0117034912109375, 0.014440536499023438, 0.017177581787109375, 0.019914627075195312, 0.02265167236328125, 0.025388717651367188, 0.028125762939453125, 0.030862808227539062, 0.033599853515625, 0.03633689880371094, 0.039073944091796875, 0.04181098937988281, 0.04454803466796875, 0.04728507995605469, 0.050022125244140625, 0.05275917053222656, 0.0554962158203125, 0.05823326110839844, 0.060970306396484375, 0.06370735168457031, 0.06644439697265625, 0.06918144226074219, 0.07191848754882812, 0.07465553283691406, 0.077392578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 7.0, 16.0, 21.0, 12.0, 21.0, 33.0, 32.0, 31.0, 31.0, 52.0, 50.0, 49.0, 47.0, 44.0, 62.0, 44.0, 54.0, 71.0, 47.0, 49.0, 40.0, 31.0, 27.0, 23.0, 19.0, 14.0, 23.0, 16.0, 14.0, 8.0, 2.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.0488896369934082, -0.047303199768066406, -0.04571676254272461, -0.04413032531738281, -0.042543888092041016, -0.04095745086669922, -0.03937101364135742, -0.037784576416015625, -0.03619813919067383, -0.03461170196533203, -0.033025264739990234, -0.03143882751464844, -0.02985239028930664, -0.028265953063964844, -0.026679515838623047, -0.02509307861328125, -0.023506641387939453, -0.021920204162597656, -0.02033376693725586, -0.018747329711914062, -0.017160892486572266, -0.015574455261230469, -0.013988018035888672, -0.012401580810546875, -0.010815143585205078, -0.009228706359863281, -0.007642269134521484, -0.0060558319091796875, -0.004469394683837891, -0.0028829574584960938, -0.0012965202331542969, 0.0002899169921875, 0.0018763542175292969, 0.0034627914428710938, 0.005049228668212891, 0.0066356658935546875, 0.008222103118896484, 0.009808540344238281, 0.011394977569580078, 0.012981414794921875, 0.014567852020263672, 0.01615428924560547, 0.017740726470947266, 0.019327163696289062, 0.02091360092163086, 0.022500038146972656, 0.024086475372314453, 0.02567291259765625, 0.027259349822998047, 0.028845787048339844, 0.03043222427368164, 0.03201866149902344, 0.033605098724365234, 0.03519153594970703, 0.03677797317504883, 0.038364410400390625, 0.03995084762573242, 0.04153728485107422, 0.043123722076416016, 0.04471015930175781, 0.04629659652709961, 0.047883033752441406, 0.0494694709777832, 0.051055908203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 8.0, 4.0, 10.0, 12.0, 12.0, 17.0, 18.0, 35.0, 45.0, 73.0, 74.0, 133.0, 208.0, 408.0, 824.0, 1987.0, 5754.0, 20559.0, 98987.0, 565077.0, 276834.0, 57526.0, 13138.0, 3881.0, 1413.0, 643.0, 337.0, 172.0, 107.0, 61.0, 63.0, 42.0, 27.0, 21.0, 15.0, 7.0, 7.0, 4.0, 5.0, 5.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.12213134765625, -0.11872291564941406, -0.11531448364257812, -0.11190605163574219, -0.10849761962890625, -0.10508918762207031, -0.10168075561523438, -0.09827232360839844, -0.0948638916015625, -0.09145545959472656, -0.08804702758789062, -0.08463859558105469, -0.08123016357421875, -0.07782173156738281, -0.07441329956054688, -0.07100486755371094, -0.067596435546875, -0.06418800354003906, -0.060779571533203125, -0.05737113952636719, -0.05396270751953125, -0.05055427551269531, -0.047145843505859375, -0.04373741149902344, -0.0403289794921875, -0.03692054748535156, -0.033512115478515625, -0.030103683471679688, -0.02669525146484375, -0.023286819458007812, -0.019878387451171875, -0.016469955444335938, -0.0130615234375, -0.009653091430664062, -0.006244659423828125, -0.0028362274169921875, 0.00057220458984375, 0.0039806365966796875, 0.007389068603515625, 0.010797500610351562, 0.0142059326171875, 0.017614364624023438, 0.021022796630859375, 0.024431228637695312, 0.02783966064453125, 0.031248092651367188, 0.034656524658203125, 0.03806495666503906, 0.041473388671875, 0.04488182067871094, 0.048290252685546875, 0.05169868469238281, 0.05510711669921875, 0.05851554870605469, 0.061923980712890625, 0.06533241271972656, 0.0687408447265625, 0.07214927673339844, 0.07555770874023438, 0.07896614074707031, 0.08237457275390625, 0.08578300476074219, 0.08919143676757812, 0.09259986877441406, 0.09600830078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 7.0, 7.0, 6.0, 11.0, 16.0, 14.0, 16.0, 21.0, 23.0, 24.0, 33.0, 30.0, 38.0, 46.0, 46.0, 40.0, 35.0, 51.0, 43.0, 41.0, 34.0, 47.0, 42.0, 37.0, 36.0, 31.0, 23.0, 32.0, 23.0, 19.0, 15.0, 12.0, 17.0, 14.0, 13.0, 5.0, 4.0, 4.0, 13.0, 4.0, 0.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1380615234375, -0.13365936279296875, -0.1292572021484375, -0.12485504150390625, -0.120452880859375, -0.11605072021484375, -0.1116485595703125, -0.10724639892578125, -0.10284423828125, -0.09844207763671875, -0.0940399169921875, -0.08963775634765625, -0.085235595703125, -0.08083343505859375, -0.0764312744140625, -0.07202911376953125, -0.067626953125, -0.06322479248046875, -0.0588226318359375, -0.05442047119140625, -0.050018310546875, -0.04561614990234375, -0.0412139892578125, -0.03681182861328125, -0.03240966796875, -0.02800750732421875, -0.0236053466796875, -0.01920318603515625, -0.014801025390625, -0.01039886474609375, -0.0059967041015625, -0.00159454345703125, 0.0028076171875, 0.00720977783203125, 0.0116119384765625, 0.01601409912109375, 0.020416259765625, 0.02481842041015625, 0.0292205810546875, 0.03362274169921875, 0.03802490234375, 0.04242706298828125, 0.0468292236328125, 0.05123138427734375, 0.055633544921875, 0.06003570556640625, 0.0644378662109375, 0.06884002685546875, 0.0732421875, 0.07764434814453125, 0.0820465087890625, 0.08644866943359375, 0.090850830078125, 0.09525299072265625, 0.0996551513671875, 0.10405731201171875, 0.10845947265625, 0.11286163330078125, 0.1172637939453125, 0.12166595458984375, 0.126068115234375, 0.13047027587890625, 0.1348724365234375, 0.13927459716796875, 0.1436767578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 22.0, 24.0, 34.0, 48.0, 81.0, 120.0, 211.0, 397.0, 734.0, 1452.0, 2936.0, 6692.0, 17957.0, 61097.0, 289540.0, 552756.0, 78156.0, 21623.0, 7645.0, 3401.0, 1633.0, 862.0, 473.0, 250.0, 167.0, 104.0, 45.0, 33.0, 20.0, 10.0, 6.0, 3.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036895751953125, -0.03562736511230469, -0.034358978271484375, -0.03309059143066406, -0.03182220458984375, -0.030553817749023438, -0.029285430908203125, -0.028017044067382812, -0.0267486572265625, -0.025480270385742188, -0.024211883544921875, -0.022943496704101562, -0.02167510986328125, -0.020406723022460938, -0.019138336181640625, -0.017869949340820312, -0.0166015625, -0.015333175659179688, -0.014064788818359375, -0.012796401977539062, -0.01152801513671875, -0.010259628295898438, -0.008991241455078125, -0.0077228546142578125, -0.0064544677734375, -0.0051860809326171875, -0.003917694091796875, -0.0026493072509765625, -0.00138092041015625, -0.0001125335693359375, 0.001155853271484375, 0.0024242401123046875, 0.003692626953125, 0.0049610137939453125, 0.006229400634765625, 0.0074977874755859375, 0.00876617431640625, 0.010034561157226562, 0.011302947998046875, 0.012571334838867188, 0.0138397216796875, 0.015108108520507812, 0.016376495361328125, 0.017644882202148438, 0.01891326904296875, 0.020181655883789062, 0.021450042724609375, 0.022718429565429688, 0.02398681640625, 0.025255203247070312, 0.026523590087890625, 0.027791976928710938, 0.02906036376953125, 0.030328750610351562, 0.031597137451171875, 0.03286552429199219, 0.0341339111328125, 0.03540229797363281, 0.036670684814453125, 0.03793907165527344, 0.03920745849609375, 0.04047584533691406, 0.041744232177734375, 0.04301261901855469, 0.044281005859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 18.0, 19.0, 20.0, 32.0, 46.0, 55.0, 90.0, 83.0, 98.0, 89.0, 94.0, 80.0, 68.0, 60.0, 39.0, 21.0, 16.0, 14.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.8743019104003906e-05, -3.7496909499168396e-05, -3.6250799894332886e-05, -3.5004690289497375e-05, -3.3758580684661865e-05, -3.2512471079826355e-05, -3.1266361474990845e-05, -3.0020251870155334e-05, -2.8774142265319824e-05, -2.7528032660484314e-05, -2.6281923055648804e-05, -2.5035813450813293e-05, -2.3789703845977783e-05, -2.2543594241142273e-05, -2.1297484636306763e-05, -2.0051375031471252e-05, -1.8805265426635742e-05, -1.7559155821800232e-05, -1.631304621696472e-05, -1.5066936612129211e-05, -1.3820827007293701e-05, -1.2574717402458191e-05, -1.132860779762268e-05, -1.008249819278717e-05, -8.83638858795166e-06, -7.59027898311615e-06, -6.34416937828064e-06, -5.098059773445129e-06, -3.851950168609619e-06, -2.605840563774109e-06, -1.3597309589385986e-06, -1.1362135410308838e-07, 1.1324882507324219e-06, 2.378597855567932e-06, 3.6247074604034424e-06, 4.870817065238953e-06, 6.116926670074463e-06, 7.363036274909973e-06, 8.609145879745483e-06, 9.855255484580994e-06, 1.1101365089416504e-05, 1.2347474694252014e-05, 1.3593584299087524e-05, 1.4839693903923035e-05, 1.6085803508758545e-05, 1.7331913113594055e-05, 1.8578022718429565e-05, 1.9824132323265076e-05, 2.1070241928100586e-05, 2.2316351532936096e-05, 2.3562461137771606e-05, 2.4808570742607117e-05, 2.6054680347442627e-05, 2.7300789952278137e-05, 2.8546899557113647e-05, 2.9793009161949158e-05, 3.103911876678467e-05, 3.228522837162018e-05, 3.353133797645569e-05, 3.47774475812912e-05, 3.602355718612671e-05, 3.726966679096222e-05, 3.851577639579773e-05, 3.976188600063324e-05, 4.100799560546875e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 12.0, 19.0, 30.0, 40.0, 82.0, 130.0, 211.0, 472.0, 1008.0, 2462.0, 6551.0, 20702.0, 80803.0, 561219.0, 289958.0, 59830.0, 15964.0, 5243.0, 2094.0, 857.0, 423.0, 179.0, 95.0, 60.0, 40.0, 20.0, 7.0, 8.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038482666015625, -0.03710317611694336, -0.03572368621826172, -0.03434419631958008, -0.03296470642089844, -0.0315852165222168, -0.030205726623535156, -0.028826236724853516, -0.027446746826171875, -0.026067256927490234, -0.024687767028808594, -0.023308277130126953, -0.021928787231445312, -0.020549297332763672, -0.01916980743408203, -0.01779031753540039, -0.01641082763671875, -0.01503133773803711, -0.013651847839355469, -0.012272357940673828, -0.010892868041992188, -0.009513378143310547, -0.008133888244628906, -0.006754398345947266, -0.005374908447265625, -0.003995418548583984, -0.0026159286499023438, -0.0012364387512207031, 0.0001430511474609375, 0.0015225410461425781, 0.0029020309448242188, 0.004281520843505859, 0.0056610107421875, 0.007040500640869141, 0.008419990539550781, 0.009799480438232422, 0.011178970336914062, 0.012558460235595703, 0.013937950134277344, 0.015317440032958984, 0.016696929931640625, 0.018076419830322266, 0.019455909729003906, 0.020835399627685547, 0.022214889526367188, 0.023594379425048828, 0.02497386932373047, 0.02635335922241211, 0.02773284912109375, 0.02911233901977539, 0.03049182891845703, 0.03187131881713867, 0.03325080871582031, 0.03463029861450195, 0.036009788513183594, 0.037389278411865234, 0.038768768310546875, 0.040148258209228516, 0.041527748107910156, 0.0429072380065918, 0.04428672790527344, 0.04566621780395508, 0.04704570770263672, 0.04842519760131836, 0.0498046875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 1.0, 7.0, 5.0, 9.0, 18.0, 11.0, 14.0, 20.0, 35.0, 35.0, 45.0, 62.0, 87.0, 105.0, 113.0, 101.0, 92.0, 65.0, 51.0, 36.0, 35.0, 8.0, 9.0, 12.0, 6.0, 7.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03912353515625, -0.037520408630371094, -0.03591728210449219, -0.03431415557861328, -0.032711029052734375, -0.03110790252685547, -0.029504776000976562, -0.027901649475097656, -0.02629852294921875, -0.024695396423339844, -0.023092269897460938, -0.02148914337158203, -0.019886016845703125, -0.01828289031982422, -0.016679763793945312, -0.015076637268066406, -0.0134735107421875, -0.011870384216308594, -0.010267257690429688, -0.008664131164550781, -0.007061004638671875, -0.005457878112792969, -0.0038547515869140625, -0.0022516250610351562, -0.00064849853515625, 0.0009546279907226562, 0.0025577545166015625, 0.004160881042480469, 0.005764007568359375, 0.007367134094238281, 0.008970260620117188, 0.010573387145996094, 0.012176513671875, 0.013779640197753906, 0.015382766723632812, 0.01698589324951172, 0.018589019775390625, 0.02019214630126953, 0.021795272827148438, 0.023398399353027344, 0.02500152587890625, 0.026604652404785156, 0.028207778930664062, 0.02981090545654297, 0.031414031982421875, 0.03301715850830078, 0.03462028503417969, 0.036223411560058594, 0.0378265380859375, 0.039429664611816406, 0.04103279113769531, 0.04263591766357422, 0.044239044189453125, 0.04584217071533203, 0.04744529724121094, 0.049048423767089844, 0.05065155029296875, 0.052254676818847656, 0.05385780334472656, 0.05546092987060547, 0.057064056396484375, 0.05866718292236328, 0.06027030944824219, 0.061873435974121094, 0.0634765625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 13.0, 3.0, 20.0, 52.0, 113.0, 224.0, 350.0, 133.0, 48.0, 26.0, 11.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7186263799667358, -1.6697492599487305, -1.620872139930725, -1.5719950199127197, -1.5231178998947144, -1.474240779876709, -1.4253636598587036, -1.3764865398406982, -1.3276094198226929, -1.2787322998046875, -1.2298551797866821, -1.1809780597686768, -1.1321009397506714, -1.083223819732666, -1.0343466997146606, -0.9854695796966553, -0.9365924596786499, -0.8877153396606445, -0.8388382196426392, -0.7899610996246338, -0.7410839796066284, -0.692206859588623, -0.6433297395706177, -0.5944526195526123, -0.5455754995346069, -0.49669837951660156, -0.4478212594985962, -0.3989441394805908, -0.35006701946258545, -0.3011898994445801, -0.2523127794265747, -0.20343565940856934, -0.15455865859985352, -0.10568153858184814, -0.05680441856384277, -0.007927298545837402, 0.04094982147216797, 0.08982694149017334, 0.1387040615081787, 0.18758118152618408, 0.23645830154418945, 0.2853354215621948, 0.3342125415802002, 0.38308966159820557, 0.43196678161621094, 0.4808439016342163, 0.5297210216522217, 0.578598141670227, 0.6274752616882324, 0.6763523817062378, 0.7252295017242432, 0.7741066217422485, 0.8229837417602539, 0.8718608617782593, 0.9207379817962646, 0.96961510181427, 1.0184922218322754, 1.0673693418502808, 1.1162464618682861, 1.1651235818862915, 1.2140007019042969, 1.2628778219223022, 1.3117549419403076, 1.360632061958313, 1.4095091819763184]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 10.0, 12.0, 8.0, 7.0, 16.0, 13.0, 17.0, 22.0, 24.0, 24.0, 40.0, 28.0, 29.0, 26.0, 28.0, 46.0, 78.0, 73.0, 65.0, 57.0, 46.0, 35.0, 27.0, 18.0, 29.0, 17.0, 22.0, 28.0, 24.0, 19.0, 22.0, 15.0, 6.0, 12.0, 10.0, 2.0, 5.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.5998488664627075, -0.5819374322891235, -0.5640259981155396, -0.5461145639419556, -0.5282031297683716, -0.5102917551994324, -0.4923803210258484, -0.4744688868522644, -0.4565574526786804, -0.43864601850509644, -0.42073458433151245, -0.40282317996025085, -0.38491174578666687, -0.3670003116130829, -0.3490889072418213, -0.3311774730682373, -0.3132660388946533, -0.29535460472106934, -0.27744317054748535, -0.25953176617622375, -0.24162033200263977, -0.2237088978290558, -0.205797478556633, -0.1878860592842102, -0.16997462511062622, -0.15206319093704224, -0.13415177166461945, -0.11624034494161606, -0.09832891821861267, -0.08041749149560928, -0.0625060647726059, -0.044594645500183105, -0.026683270931243896, -0.008771844208240509, 0.009139582514762878, 0.027051009237766266, 0.04496243596076965, 0.06287386268377304, 0.08078528940677643, 0.09869670867919922, 0.1166081428527832, 0.1345195770263672, 0.15243099629878998, 0.17034241557121277, 0.18825384974479675, 0.20616528391838074, 0.22407670319080353, 0.24198812246322632, 0.2598995566368103, 0.2778109908103943, 0.29572242498397827, 0.31363382935523987, 0.33154526352882385, 0.34945669770240784, 0.36736810207366943, 0.3852795362472534, 0.4031909704208374, 0.4211024045944214, 0.43901383876800537, 0.45692524313926697, 0.47483667731285095, 0.49274811148643494, 0.5106595158576965, 0.5285709500312805, 0.5464823842048645]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 4.0, 6.0, 19.0, 24.0, 42.0, 66.0, 95.0, 223.0, 498.0, 1121.0, 3226.0, 13867.0, 125560.0, 2506617.0, 1464524.0, 64487.0, 9391.0, 2622.0, 966.0, 424.0, 207.0, 108.0, 65.0, 47.0, 19.0, 17.0, 11.0, 8.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09197998046875, -0.0890951156616211, -0.08621025085449219, -0.08332538604736328, -0.08044052124023438, -0.07755565643310547, -0.07467079162597656, -0.07178592681884766, -0.06890106201171875, -0.06601619720458984, -0.06313133239746094, -0.06024646759033203, -0.057361602783203125, -0.05447673797607422, -0.05159187316894531, -0.048707008361816406, -0.0458221435546875, -0.042937278747558594, -0.04005241394042969, -0.03716754913330078, -0.034282684326171875, -0.03139781951904297, -0.028512954711914062, -0.025628089904785156, -0.02274322509765625, -0.019858360290527344, -0.016973495483398438, -0.014088630676269531, -0.011203765869140625, -0.008318901062011719, -0.0054340362548828125, -0.0025491714477539062, 0.000335693359375, 0.0032205581665039062, 0.0061054229736328125, 0.008990287780761719, 0.011875152587890625, 0.014760017395019531, 0.017644882202148438, 0.020529747009277344, 0.02341461181640625, 0.026299476623535156, 0.029184341430664062, 0.03206920623779297, 0.034954071044921875, 0.03783893585205078, 0.04072380065917969, 0.043608665466308594, 0.0464935302734375, 0.049378395080566406, 0.05226325988769531, 0.05514812469482422, 0.058032989501953125, 0.06091785430908203, 0.06380271911621094, 0.06668758392333984, 0.06957244873046875, 0.07245731353759766, 0.07534217834472656, 0.07822704315185547, 0.08111190795898438, 0.08399677276611328, 0.08688163757324219, 0.0897665023803711, 0.0926513671875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 6.0, 6.0, 13.0, 13.0, 23.0, 25.0, 27.0, 28.0, 27.0, 33.0, 36.0, 54.0, 52.0, 64.0, 51.0, 55.0, 53.0, 52.0, 56.0, 48.0, 43.0, 39.0, 42.0, 29.0, 28.0, 26.0, 18.0, 9.0, 13.0, 11.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044677734375, -0.04317760467529297, -0.04167747497558594, -0.040177345275878906, -0.038677215576171875, -0.037177085876464844, -0.03567695617675781, -0.03417682647705078, -0.03267669677734375, -0.03117656707763672, -0.029676437377929688, -0.028176307678222656, -0.026676177978515625, -0.025176048278808594, -0.023675918579101562, -0.02217578887939453, -0.0206756591796875, -0.01917552947998047, -0.017675399780273438, -0.016175270080566406, -0.014675140380859375, -0.013175010681152344, -0.011674880981445312, -0.010174751281738281, -0.00867462158203125, -0.007174491882324219, -0.0056743621826171875, -0.004174232482910156, -0.002674102783203125, -0.0011739730834960938, 0.0003261566162109375, 0.0018262863159179688, 0.003326416015625, 0.004826545715332031, 0.0063266754150390625, 0.007826805114746094, 0.009326934814453125, 0.010827064514160156, 0.012327194213867188, 0.013827323913574219, 0.01532745361328125, 0.01682758331298828, 0.018327713012695312, 0.019827842712402344, 0.021327972412109375, 0.022828102111816406, 0.024328231811523438, 0.02582836151123047, 0.0273284912109375, 0.02882862091064453, 0.030328750610351562, 0.031828880310058594, 0.033329010009765625, 0.034829139709472656, 0.03632926940917969, 0.03782939910888672, 0.03932952880859375, 0.04082965850830078, 0.04232978820800781, 0.043829917907714844, 0.045330047607421875, 0.046830177307128906, 0.04833030700683594, 0.04983043670654297, 0.05133056640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 0.0, 3.0, 4.0, 9.0, 27.0, 32.0, 70.0, 134.0, 314.0, 703.0, 1898.0, 15951.0, 3817136.0, 351130.0, 4927.0, 1129.0, 447.0, 186.0, 94.0, 36.0, 23.0, 18.0, 9.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2486572265625, -0.2410755157470703, -0.23349380493164062, -0.22591209411621094, -0.21833038330078125, -0.21074867248535156, -0.20316696166992188, -0.1955852508544922, -0.1880035400390625, -0.1804218292236328, -0.17284011840820312, -0.16525840759277344, -0.15767669677734375, -0.15009498596191406, -0.14251327514648438, -0.1349315643310547, -0.127349853515625, -0.11976814270019531, -0.11218643188476562, -0.10460472106933594, -0.09702301025390625, -0.08944129943847656, -0.08185958862304688, -0.07427787780761719, -0.0666961669921875, -0.05911445617675781, -0.051532745361328125, -0.04395103454589844, -0.03636932373046875, -0.028787612915039062, -0.021205902099609375, -0.013624191284179688, -0.00604248046875, 0.0015392303466796875, 0.009120941162109375, 0.016702651977539062, 0.02428436279296875, 0.03186607360839844, 0.039447784423828125, 0.04702949523925781, 0.0546112060546875, 0.06219291687011719, 0.06977462768554688, 0.07735633850097656, 0.08493804931640625, 0.09251976013183594, 0.10010147094726562, 0.10768318176269531, 0.115264892578125, 0.12284660339355469, 0.13042831420898438, 0.13801002502441406, 0.14559173583984375, 0.15317344665527344, 0.16075515747070312, 0.1683368682861328, 0.1759185791015625, 0.1835002899169922, 0.19108200073242188, 0.19866371154785156, 0.20624542236328125, 0.21382713317871094, 0.22140884399414062, 0.2289905548095703, 0.236572265625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 15.0, 32.0, 63.0, 86.0, 173.0, 309.0, 609.0, 968.0, 805.0, 460.0, 240.0, 126.0, 65.0, 44.0, 25.0, 19.0, 8.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1318359375, -0.1279287338256836, -0.12402153015136719, -0.12011432647705078, -0.11620712280273438, -0.11229991912841797, -0.10839271545410156, -0.10448551177978516, -0.10057830810546875, -0.09667110443115234, -0.09276390075683594, -0.08885669708251953, -0.08494949340820312, -0.08104228973388672, -0.07713508605957031, -0.0732278823852539, -0.0693206787109375, -0.0654134750366211, -0.06150627136230469, -0.05759906768798828, -0.053691864013671875, -0.04978466033935547, -0.04587745666503906, -0.041970252990722656, -0.03806304931640625, -0.034155845642089844, -0.030248641967773438, -0.02634143829345703, -0.022434234619140625, -0.01852703094482422, -0.014619827270507812, -0.010712623596191406, -0.006805419921875, -0.0028982162475585938, 0.0010089874267578125, 0.004916191101074219, 0.008823394775390625, 0.012730598449707031, 0.016637802124023438, 0.020545005798339844, 0.02445220947265625, 0.028359413146972656, 0.03226661682128906, 0.03617382049560547, 0.040081024169921875, 0.04398822784423828, 0.04789543151855469, 0.051802635192871094, 0.0557098388671875, 0.059617042541503906, 0.06352424621582031, 0.06743144989013672, 0.07133865356445312, 0.07524585723876953, 0.07915306091308594, 0.08306026458740234, 0.08696746826171875, 0.09087467193603516, 0.09478187561035156, 0.09868907928466797, 0.10259628295898438, 0.10650348663330078, 0.11041069030761719, 0.1143178939819336, 0.11822509765625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 10.0, 7.0, 9.0, 19.0, 29.0, 65.0, 98.0, 141.0, 196.0, 167.0, 131.0, 47.0, 33.0, 17.0, 11.0, 9.0, 4.0, 5.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.092214822769165, -1.0596553087234497, -1.0270956754684448, -0.9945361614227295, -0.9619766473770142, -0.929417073726654, -0.896857500076294, -0.8642979860305786, -0.8317384123802185, -0.7991788387298584, -0.7666193246841431, -0.734059751033783, -0.7015001773834229, -0.6689406633377075, -0.6363810896873474, -0.6038215160369873, -0.571262001991272, -0.5387024283409119, -0.5061429142951965, -0.4735833406448364, -0.4410237967967987, -0.408464252948761, -0.3759046792984009, -0.34334513545036316, -0.31078559160232544, -0.2782260477542877, -0.2456664890050888, -0.2131069302558899, -0.18054738640785217, -0.14798784255981445, -0.11542828381061554, -0.08286872506141663, -0.050309062004089355, -0.01774951070547104, 0.014810040593147278, 0.047369591891765594, 0.07992914319038391, 0.11248868703842163, 0.14504824578762054, 0.17760780453681946, 0.21016734838485718, 0.2427268922328949, 0.2752864360809326, 0.3078460097312927, 0.34040555357933044, 0.37296509742736816, 0.40552467107772827, 0.438084214925766, 0.4706437587738037, 0.5032033324241638, 0.5357628464698792, 0.5683224201202393, 0.6008819341659546, 0.6334415078163147, 0.6660010814666748, 0.6985605955123901, 0.7311201691627502, 0.7636797428131104, 0.7962392568588257, 0.8287988305091858, 0.8613584041595459, 0.8939179182052612, 0.9264774918556213, 0.9590370655059814, 0.9915965795516968]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 5.0, 4.0, 8.0, 15.0, 5.0, 17.0, 16.0, 14.0, 17.0, 27.0, 27.0, 34.0, 35.0, 42.0, 39.0, 35.0, 44.0, 53.0, 39.0, 48.0, 47.0, 49.0, 45.0, 45.0, 32.0, 36.0, 26.0, 30.0, 22.0, 21.0, 19.0, 19.0, 13.0, 11.0, 10.0, 5.0, 3.0, 8.0, 5.0, 5.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.37760603427886963, -0.36441338062286377, -0.3512207567691803, -0.33802810311317444, -0.3248354494571686, -0.3116428256034851, -0.29845017194747925, -0.2852575182914734, -0.27206486463546753, -0.25887221097946167, -0.245679572224617, -0.23248693346977234, -0.21929427981376648, -0.20610164105892181, -0.19290900230407715, -0.1797163486480713, -0.16652370989322662, -0.15333107113838196, -0.1401384174823761, -0.12694577872753143, -0.11375312507152557, -0.10056048631668091, -0.08736784011125565, -0.07417519390583038, -0.06098254770040512, -0.04778990149497986, -0.034597255289554596, -0.021404612809419632, -0.00821196660399437, 0.0049806758761405945, 0.018173322081565857, 0.03136596828699112, 0.04455861449241638, 0.057751260697841644, 0.0709439069032669, 0.08413654565811157, 0.09732919931411743, 0.1105218380689621, 0.12371448427438736, 0.13690713047981262, 0.15009978413581848, 0.16329242289066315, 0.176485076546669, 0.18967771530151367, 0.20287036895751953, 0.2160630077123642, 0.22925564646720886, 0.24244830012321472, 0.2556409239768982, 0.26883357763290405, 0.2820262014865875, 0.2952188551425934, 0.30841150879859924, 0.3216041326522827, 0.3347967863082886, 0.34798943996429443, 0.3611820936203003, 0.37437474727630615, 0.3875673711299896, 0.4007600247859955, 0.41395267844200134, 0.4271453022956848, 0.4403379559516907, 0.45353060960769653, 0.4667232632637024]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 11.0, 6.0, 11.0, 11.0, 20.0, 22.0, 39.0, 65.0, 93.0, 123.0, 186.0, 315.0, 599.0, 941.0, 1823.0, 3343.0, 7058.0, 14832.0, 33312.0, 79099.0, 190156.0, 328042.0, 221901.0, 93550.0, 39031.0, 17255.0, 7972.0, 4018.0, 2048.0, 1067.0, 604.0, 356.0, 213.0, 135.0, 93.0, 63.0, 48.0, 25.0, 23.0, 9.0, 7.0, 7.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.06707763671875, -0.06524467468261719, -0.06341171264648438, -0.06157875061035156, -0.05974578857421875, -0.05791282653808594, -0.056079864501953125, -0.05424690246582031, -0.0524139404296875, -0.05058097839355469, -0.048748016357421875, -0.04691505432128906, -0.04508209228515625, -0.04324913024902344, -0.041416168212890625, -0.03958320617675781, -0.037750244140625, -0.03591728210449219, -0.034084320068359375, -0.03225135803222656, -0.03041839599609375, -0.028585433959960938, -0.026752471923828125, -0.024919509887695312, -0.0230865478515625, -0.021253585815429688, -0.019420623779296875, -0.017587661743164062, -0.01575469970703125, -0.013921737670898438, -0.012088775634765625, -0.010255813598632812, -0.0084228515625, -0.0065898895263671875, -0.004756927490234375, -0.0029239654541015625, -0.00109100341796875, 0.0007419586181640625, 0.002574920654296875, 0.0044078826904296875, 0.0062408447265625, 0.008073806762695312, 0.009906768798828125, 0.011739730834960938, 0.01357269287109375, 0.015405654907226562, 0.017238616943359375, 0.019071578979492188, 0.020904541015625, 0.022737503051757812, 0.024570465087890625, 0.026403427124023438, 0.02823638916015625, 0.030069351196289062, 0.031902313232421875, 0.03373527526855469, 0.0355682373046875, 0.03740119934082031, 0.039234161376953125, 0.04106712341308594, 0.04290008544921875, 0.04473304748535156, 0.046566009521484375, 0.04839897155761719, 0.05023193359375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 3.0, 7.0, 4.0, 11.0, 14.0, 23.0, 28.0, 26.0, 29.0, 37.0, 28.0, 35.0, 29.0, 37.0, 49.0, 39.0, 42.0, 59.0, 55.0, 55.0, 55.0, 48.0, 27.0, 31.0, 35.0, 39.0, 31.0, 27.0, 17.0, 13.0, 16.0, 10.0, 9.0, 4.0, 5.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.041778564453125, -0.0403141975402832, -0.038849830627441406, -0.03738546371459961, -0.03592109680175781, -0.034456729888916016, -0.03299236297607422, -0.03152799606323242, -0.030063629150390625, -0.028599262237548828, -0.02713489532470703, -0.025670528411865234, -0.024206161499023438, -0.02274179458618164, -0.021277427673339844, -0.019813060760498047, -0.01834869384765625, -0.016884326934814453, -0.015419960021972656, -0.01395559310913086, -0.012491226196289062, -0.011026859283447266, -0.009562492370605469, -0.008098125457763672, -0.006633758544921875, -0.005169391632080078, -0.0037050247192382812, -0.0022406578063964844, -0.0007762908935546875, 0.0006880760192871094, 0.0021524429321289062, 0.003616809844970703, 0.0050811767578125, 0.006545543670654297, 0.008009910583496094, 0.00947427749633789, 0.010938644409179688, 0.012403011322021484, 0.013867378234863281, 0.015331745147705078, 0.016796112060546875, 0.018260478973388672, 0.01972484588623047, 0.021189212799072266, 0.022653579711914062, 0.02411794662475586, 0.025582313537597656, 0.027046680450439453, 0.02851104736328125, 0.029975414276123047, 0.031439781188964844, 0.03290414810180664, 0.03436851501464844, 0.035832881927490234, 0.03729724884033203, 0.03876161575317383, 0.040225982666015625, 0.04169034957885742, 0.04315471649169922, 0.044619083404541016, 0.04608345031738281, 0.04754781723022461, 0.049012184143066406, 0.0504765510559082, 0.05194091796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 10.0, 11.0, 27.0, 21.0, 43.0, 55.0, 74.0, 113.0, 107.0, 178.0, 242.0, 335.0, 529.0, 980.0, 1935.0, 5151.0, 16805.0, 74130.0, 572834.0, 297244.0, 55812.0, 13431.0, 4122.0, 1779.0, 902.0, 526.0, 322.0, 222.0, 167.0, 115.0, 75.0, 64.0, 44.0, 34.0, 19.0, 23.0, 16.0, 15.0, 11.0, 4.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1058349609375, -0.10229682922363281, -0.09875869750976562, -0.09522056579589844, -0.09168243408203125, -0.08814430236816406, -0.08460617065429688, -0.08106803894042969, -0.0775299072265625, -0.07399177551269531, -0.07045364379882812, -0.06691551208496094, -0.06337738037109375, -0.05983924865722656, -0.056301116943359375, -0.05276298522949219, -0.049224853515625, -0.04568672180175781, -0.042148590087890625, -0.03861045837402344, -0.03507232666015625, -0.03153419494628906, -0.027996063232421875, -0.024457931518554688, -0.0209197998046875, -0.017381668090820312, -0.013843536376953125, -0.010305404663085938, -0.00676727294921875, -0.0032291412353515625, 0.000308990478515625, 0.0038471221923828125, 0.00738525390625, 0.010923385620117188, 0.014461517333984375, 0.017999649047851562, 0.02153778076171875, 0.025075912475585938, 0.028614044189453125, 0.03215217590332031, 0.0356903076171875, 0.03922843933105469, 0.042766571044921875, 0.04630470275878906, 0.04984283447265625, 0.05338096618652344, 0.056919097900390625, 0.06045722961425781, 0.063995361328125, 0.06753349304199219, 0.07107162475585938, 0.07460975646972656, 0.07814788818359375, 0.08168601989746094, 0.08522415161132812, 0.08876228332519531, 0.0923004150390625, 0.09583854675292969, 0.09937667846679688, 0.10291481018066406, 0.10645294189453125, 0.10999107360839844, 0.11352920532226562, 0.11706733703613281, 0.12060546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 7.0, 6.0, 11.0, 14.0, 13.0, 12.0, 16.0, 24.0, 23.0, 25.0, 26.0, 41.0, 41.0, 38.0, 50.0, 61.0, 56.0, 38.0, 47.0, 43.0, 48.0, 45.0, 42.0, 44.0, 29.0, 32.0, 29.0, 24.0, 26.0, 11.0, 11.0, 14.0, 9.0, 4.0, 8.0, 8.0, 3.0, 3.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.19482421875, -0.1891345977783203, -0.18344497680664062, -0.17775535583496094, -0.17206573486328125, -0.16637611389160156, -0.16068649291992188, -0.1549968719482422, -0.1493072509765625, -0.1436176300048828, -0.13792800903320312, -0.13223838806152344, -0.12654876708984375, -0.12085914611816406, -0.11516952514648438, -0.10947990417480469, -0.103790283203125, -0.09810066223144531, -0.09241104125976562, -0.08672142028808594, -0.08103179931640625, -0.07534217834472656, -0.06965255737304688, -0.06396293640136719, -0.0582733154296875, -0.05258369445800781, -0.046894073486328125, -0.04120445251464844, -0.03551483154296875, -0.029825210571289062, -0.024135589599609375, -0.018445968627929688, -0.01275634765625, -0.0070667266845703125, -0.001377105712890625, 0.0043125152587890625, 0.01000213623046875, 0.015691757202148438, 0.021381378173828125, 0.027070999145507812, 0.0327606201171875, 0.03845024108886719, 0.044139862060546875, 0.04982948303222656, 0.05551910400390625, 0.06120872497558594, 0.06689834594726562, 0.07258796691894531, 0.078277587890625, 0.08396720886230469, 0.08965682983398438, 0.09534645080566406, 0.10103607177734375, 0.10672569274902344, 0.11241531372070312, 0.11810493469238281, 0.1237945556640625, 0.1294841766357422, 0.13517379760742188, 0.14086341857910156, 0.14655303955078125, 0.15224266052246094, 0.15793228149414062, 0.1636219024658203, 0.1693115234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 4.0, 7.0, 3.0, 5.0, 8.0, 17.0, 18.0, 40.0, 49.0, 88.0, 171.0, 333.0, 784.0, 1830.0, 4851.0, 14607.0, 53260.0, 303775.0, 582331.0, 60735.0, 16571.0, 5459.0, 1966.0, 827.0, 381.0, 194.0, 93.0, 58.0, 25.0, 21.0, 10.0, 3.0, 6.0, 7.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0260009765625, -0.0247039794921875, -0.023406982421875, -0.0221099853515625, -0.02081298828125, -0.0195159912109375, -0.018218994140625, -0.0169219970703125, -0.015625, -0.0143280029296875, -0.013031005859375, -0.0117340087890625, -0.01043701171875, -0.0091400146484375, -0.007843017578125, -0.0065460205078125, -0.0052490234375, -0.0039520263671875, -0.002655029296875, -0.0013580322265625, -6.103515625e-05, 0.0012359619140625, 0.002532958984375, 0.0038299560546875, 0.005126953125, 0.0064239501953125, 0.007720947265625, 0.0090179443359375, 0.01031494140625, 0.0116119384765625, 0.012908935546875, 0.0142059326171875, 0.0155029296875, 0.0167999267578125, 0.018096923828125, 0.0193939208984375, 0.02069091796875, 0.0219879150390625, 0.023284912109375, 0.0245819091796875, 0.02587890625, 0.0271759033203125, 0.028472900390625, 0.0297698974609375, 0.03106689453125, 0.0323638916015625, 0.033660888671875, 0.0349578857421875, 0.0362548828125, 0.0375518798828125, 0.038848876953125, 0.0401458740234375, 0.04144287109375, 0.0427398681640625, 0.044036865234375, 0.0453338623046875, 0.046630859375, 0.0479278564453125, 0.049224853515625, 0.0505218505859375, 0.05181884765625, 0.0531158447265625, 0.054412841796875, 0.0557098388671875, 0.0570068359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 5.0, 7.0, 9.0, 5.0, 17.0, 22.0, 23.0, 21.0, 34.0, 66.0, 79.0, 91.0, 109.0, 99.0, 95.0, 76.0, 58.0, 42.0, 23.0, 23.0, 17.0, 19.0, 10.0, 10.0, 9.0, 5.0, 2.0, 4.0, 5.0, 5.0, 2.0, 1.0, 0.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.4226646423339844e-05, -4.284083843231201e-05, -4.145503044128418e-05, -4.006922245025635e-05, -3.8683414459228516e-05, -3.7297606468200684e-05, -3.591179847717285e-05, -3.452599048614502e-05, -3.314018249511719e-05, -3.1754374504089355e-05, -3.0368566513061523e-05, -2.898275852203369e-05, -2.759695053100586e-05, -2.6211142539978027e-05, -2.4825334548950195e-05, -2.3439526557922363e-05, -2.205371856689453e-05, -2.06679105758667e-05, -1.9282102584838867e-05, -1.7896294593811035e-05, -1.6510486602783203e-05, -1.5124678611755371e-05, -1.3738870620727539e-05, -1.2353062629699707e-05, -1.0967254638671875e-05, -9.581446647644043e-06, -8.195638656616211e-06, -6.809830665588379e-06, -5.424022674560547e-06, -4.038214683532715e-06, -2.652406692504883e-06, -1.2665987014770508e-06, 1.1920928955078125e-07, 1.5050172805786133e-06, 2.8908252716064453e-06, 4.276633262634277e-06, 5.662441253662109e-06, 7.048249244689941e-06, 8.434057235717773e-06, 9.819865226745605e-06, 1.1205673217773438e-05, 1.259148120880127e-05, 1.3977289199829102e-05, 1.5363097190856934e-05, 1.6748905181884766e-05, 1.8134713172912598e-05, 1.952052116394043e-05, 2.0906329154968262e-05, 2.2292137145996094e-05, 2.3677945137023926e-05, 2.5063753128051758e-05, 2.644956111907959e-05, 2.7835369110107422e-05, 2.9221177101135254e-05, 3.0606985092163086e-05, 3.199279308319092e-05, 3.337860107421875e-05, 3.476440906524658e-05, 3.6150217056274414e-05, 3.7536025047302246e-05, 3.892183303833008e-05, 4.030764102935791e-05, 4.169344902038574e-05, 4.3079257011413574e-05, 4.4465065002441406e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 9.0, 4.0, 20.0, 24.0, 40.0, 52.0, 90.0, 155.0, 354.0, 750.0, 1829.0, 5526.0, 23544.0, 134526.0, 756456.0, 99186.0, 18498.0, 4691.0, 1511.0, 641.0, 268.0, 148.0, 77.0, 46.0, 42.0, 19.0, 15.0, 7.0, 8.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04083251953125, -0.03928709030151367, -0.037741661071777344, -0.036196231842041016, -0.03465080261230469, -0.03310537338256836, -0.03155994415283203, -0.030014514923095703, -0.028469085693359375, -0.026923656463623047, -0.02537822723388672, -0.02383279800415039, -0.022287368774414062, -0.020741939544677734, -0.019196510314941406, -0.017651081085205078, -0.01610565185546875, -0.014560222625732422, -0.013014793395996094, -0.011469364166259766, -0.009923934936523438, -0.00837850570678711, -0.006833076477050781, -0.005287647247314453, -0.003742218017578125, -0.002196788787841797, -0.0006513595581054688, 0.0008940696716308594, 0.0024394989013671875, 0.003984928131103516, 0.005530357360839844, 0.007075786590576172, 0.0086212158203125, 0.010166645050048828, 0.011712074279785156, 0.013257503509521484, 0.014802932739257812, 0.01634836196899414, 0.01789379119873047, 0.019439220428466797, 0.020984649658203125, 0.022530078887939453, 0.02407550811767578, 0.02562093734741211, 0.027166366577148438, 0.028711795806884766, 0.030257225036621094, 0.03180265426635742, 0.03334808349609375, 0.03489351272583008, 0.036438941955566406, 0.037984371185302734, 0.03952980041503906, 0.04107522964477539, 0.04262065887451172, 0.04416608810424805, 0.045711517333984375, 0.0472569465637207, 0.04880237579345703, 0.05034780502319336, 0.05189323425292969, 0.053438663482666016, 0.054984092712402344, 0.05652952194213867, 0.058074951171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 12.0, 13.0, 20.0, 21.0, 22.0, 27.0, 49.0, 59.0, 75.0, 109.0, 128.0, 114.0, 87.0, 60.0, 45.0, 25.0, 27.0, 21.0, 18.0, 15.0, 16.0, 7.0, 5.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044891357421875, -0.043514251708984375, -0.04213714599609375, -0.040760040283203125, -0.0393829345703125, -0.038005828857421875, -0.03662872314453125, -0.035251617431640625, -0.03387451171875, -0.032497406005859375, -0.03112030029296875, -0.029743194580078125, -0.0283660888671875, -0.026988983154296875, -0.02561187744140625, -0.024234771728515625, -0.022857666015625, -0.021480560302734375, -0.02010345458984375, -0.018726348876953125, -0.0173492431640625, -0.015972137451171875, -0.01459503173828125, -0.013217926025390625, -0.0118408203125, -0.010463714599609375, -0.00908660888671875, -0.007709503173828125, -0.0063323974609375, -0.004955291748046875, -0.00357818603515625, -0.002201080322265625, -0.000823974609375, 0.000553131103515625, 0.00193023681640625, 0.003307342529296875, 0.0046844482421875, 0.006061553955078125, 0.00743865966796875, 0.008815765380859375, 0.01019287109375, 0.011569976806640625, 0.01294708251953125, 0.014324188232421875, 0.0157012939453125, 0.017078399658203125, 0.01845550537109375, 0.019832611083984375, 0.021209716796875, 0.022586822509765625, 0.02396392822265625, 0.025341033935546875, 0.0267181396484375, 0.028095245361328125, 0.02947235107421875, 0.030849456787109375, 0.0322265625, 0.033603668212890625, 0.03498077392578125, 0.036357879638671875, 0.0377349853515625, 0.039112091064453125, 0.04048919677734375, 0.041866302490234375, 0.043243408203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 16.0, 20.0, 85.0, 184.0, 446.0, 146.0, 68.0, 17.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.528320074081421, -1.4725862741470337, -1.4168524742126465, -1.3611187934875488, -1.3053849935531616, -1.2496511936187744, -1.1939173936843872, -1.13818359375, -1.0824497938156128, -1.0267159938812256, -0.9709822535514832, -0.915248453617096, -0.8595146536827087, -0.8037809133529663, -0.7480471134185791, -0.6923133134841919, -0.6365795731544495, -0.5808457732200623, -0.5251120328903198, -0.4693782329559326, -0.4136444330215454, -0.3579106628894806, -0.30217689275741577, -0.24644309282302856, -0.19070932269096375, -0.13497553765773773, -0.07924176007509232, -0.0235079824924469, 0.032225802540779114, 0.08795958757400513, 0.14369335770606995, 0.19942715764045715, 0.255160927772522, 0.3108946979045868, 0.366628497838974, 0.4223622679710388, 0.478096067905426, 0.5338298082351685, 0.5895636081695557, 0.6452974081039429, 0.7010312080383301, 0.7567650079727173, 0.8124987483024597, 0.8682325482368469, 0.9239663481712341, 0.9797000885009766, 1.0354338884353638, 1.091167688369751, 1.1469013690948486, 1.2026351690292358, 1.258368968963623, 1.3141026496887207, 1.369836449623108, 1.4255702495574951, 1.4813040494918823, 1.5370378494262695, 1.5927716493606567, 1.648505449295044, 1.7042392492294312, 1.7599730491638184, 1.815706729888916, 1.8714405298233032, 1.9271743297576904, 1.9829081296920776, 2.038641929626465]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 10.0, 5.0, 6.0, 7.0, 5.0, 17.0, 7.0, 10.0, 16.0, 27.0, 20.0, 16.0, 40.0, 37.0, 43.0, 53.0, 71.0, 119.0, 100.0, 63.0, 40.0, 42.0, 43.0, 22.0, 20.0, 19.0, 23.0, 20.0, 20.0, 13.0, 17.0, 9.0, 14.0, 5.0, 5.0, 7.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9326940774917603, -0.9044406414031982, -0.8761872053146362, -0.8479337692260742, -0.8196802735328674, -0.7914268374443054, -0.7631734013557434, -0.7349199652671814, -0.7066665291786194, -0.6784130930900574, -0.6501596570014954, -0.6219061613082886, -0.5936527252197266, -0.5653992891311646, -0.5371458530426025, -0.5088924169540405, -0.48063895106315613, -0.4523855149745941, -0.4241320490837097, -0.3958786129951477, -0.3676251769065857, -0.3393717408180237, -0.3111182749271393, -0.28286483883857727, -0.25461137294769287, -0.22635792195796967, -0.19810448586940765, -0.16985103487968445, -0.14159759879112244, -0.11334414780139923, -0.08509069681167603, -0.056837260723114014, -0.028583824634552002, -0.0003303792327642441, 0.027923066169023514, 0.05617651343345642, 0.08442995697259903, 0.11268340051174164, 0.14093685150146484, 0.16919028759002686, 0.19744373857975006, 0.22569718956947327, 0.2539506256580353, 0.2822040915489197, 0.3104575276374817, 0.3387109637260437, 0.3669643998146057, 0.3952178359031677, 0.4234713017940521, 0.45172473788261414, 0.47997820377349854, 0.5082316398620605, 0.5364850759506226, 0.5647385120391846, 0.5929919481277466, 0.6212453842163086, 0.6494988799095154, 0.6777523159980774, 0.7060057520866394, 0.7342592477798462, 0.7625126838684082, 0.7907661199569702, 0.8190195560455322, 0.8472729921340942, 0.8755264282226562]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 10.0, 13.0, 14.0, 14.0, 28.0, 34.0, 50.0, 68.0, 108.0, 194.0, 291.0, 571.0, 1057.0, 2139.0, 4953.0, 13477.0, 43347.0, 197218.0, 1138897.0, 2133035.0, 526102.0, 93131.0, 24135.0, 8394.0, 3365.0, 1571.0, 801.0, 485.0, 275.0, 157.0, 111.0, 63.0, 44.0, 26.0, 34.0, 16.0, 10.0, 10.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0], "bins": [-0.059051513671875, -0.05722188949584961, -0.05539226531982422, -0.05356264114379883, -0.05173301696777344, -0.04990339279174805, -0.048073768615722656, -0.046244144439697266, -0.044414520263671875, -0.042584896087646484, -0.040755271911621094, -0.0389256477355957, -0.03709602355957031, -0.03526639938354492, -0.03343677520751953, -0.03160715103149414, -0.02977752685546875, -0.02794790267944336, -0.02611827850341797, -0.024288654327392578, -0.022459030151367188, -0.020629405975341797, -0.018799781799316406, -0.016970157623291016, -0.015140533447265625, -0.013310909271240234, -0.011481285095214844, -0.009651660919189453, -0.007822036743164062, -0.005992412567138672, -0.004162788391113281, -0.0023331642150878906, -0.0005035400390625, 0.0013260841369628906, 0.0031557083129882812, 0.004985332489013672, 0.0068149566650390625, 0.008644580841064453, 0.010474205017089844, 0.012303829193115234, 0.014133453369140625, 0.015963077545166016, 0.017792701721191406, 0.019622325897216797, 0.021451950073242188, 0.023281574249267578, 0.02511119842529297, 0.02694082260131836, 0.02877044677734375, 0.03060007095336914, 0.03242969512939453, 0.03425931930541992, 0.03608894348144531, 0.0379185676574707, 0.039748191833496094, 0.041577816009521484, 0.043407440185546875, 0.045237064361572266, 0.047066688537597656, 0.04889631271362305, 0.05072593688964844, 0.05255556106567383, 0.05438518524169922, 0.05621480941772461, 0.05804443359375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 6.0, 5.0, 11.0, 2.0, 13.0, 13.0, 21.0, 28.0, 32.0, 34.0, 35.0, 35.0, 26.0, 44.0, 42.0, 53.0, 56.0, 60.0, 43.0, 41.0, 50.0, 47.0, 33.0, 39.0, 26.0, 34.0, 25.0, 22.0, 27.0, 26.0, 17.0, 15.0, 8.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.043212890625, -0.04171466827392578, -0.04021644592285156, -0.038718223571777344, -0.037220001220703125, -0.035721778869628906, -0.03422355651855469, -0.03272533416748047, -0.03122711181640625, -0.02972888946533203, -0.028230667114257812, -0.026732444763183594, -0.025234222412109375, -0.023736000061035156, -0.022237777709960938, -0.02073955535888672, -0.0192413330078125, -0.01774311065673828, -0.016244888305664062, -0.014746665954589844, -0.013248443603515625, -0.011750221252441406, -0.010251998901367188, -0.008753776550292969, -0.00725555419921875, -0.005757331848144531, -0.0042591094970703125, -0.0027608871459960938, -0.001262664794921875, 0.00023555755615234375, 0.0017337799072265625, 0.0032320022583007812, 0.004730224609375, 0.006228446960449219, 0.0077266693115234375, 0.009224891662597656, 0.010723114013671875, 0.012221336364746094, 0.013719558715820312, 0.015217781066894531, 0.01671600341796875, 0.01821422576904297, 0.019712448120117188, 0.021210670471191406, 0.022708892822265625, 0.024207115173339844, 0.025705337524414062, 0.02720355987548828, 0.0287017822265625, 0.03020000457763672, 0.03169822692871094, 0.033196449279785156, 0.034694671630859375, 0.036192893981933594, 0.03769111633300781, 0.03918933868408203, 0.04068756103515625, 0.04218578338623047, 0.04368400573730469, 0.045182228088378906, 0.046680450439453125, 0.048178672790527344, 0.04967689514160156, 0.05117511749267578, 0.05267333984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 11.0, 8.0, 20.0, 31.0, 88.0, 175.0, 389.0, 1176.0, 7004.0, 400832.0, 3754992.0, 26325.0, 2200.0, 543.0, 265.0, 111.0, 47.0, 31.0, 16.0, 10.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2474365234375, -0.23975563049316406, -0.23207473754882812, -0.2243938446044922, -0.21671295166015625, -0.2090320587158203, -0.20135116577148438, -0.19367027282714844, -0.1859893798828125, -0.17830848693847656, -0.17062759399414062, -0.1629467010498047, -0.15526580810546875, -0.1475849151611328, -0.13990402221679688, -0.13222312927246094, -0.124542236328125, -0.11686134338378906, -0.10918045043945312, -0.10149955749511719, -0.09381866455078125, -0.08613777160644531, -0.07845687866210938, -0.07077598571777344, -0.0630950927734375, -0.05541419982910156, -0.047733306884765625, -0.04005241394042969, -0.03237152099609375, -0.024690628051757812, -0.017009735107421875, -0.009328842163085938, -0.00164794921875, 0.0060329437255859375, 0.013713836669921875, 0.021394729614257812, 0.02907562255859375, 0.03675651550292969, 0.044437408447265625, 0.05211830139160156, 0.0597991943359375, 0.06748008728027344, 0.07516098022460938, 0.08284187316894531, 0.09052276611328125, 0.09820365905761719, 0.10588455200195312, 0.11356544494628906, 0.121246337890625, 0.12892723083496094, 0.13660812377929688, 0.1442890167236328, 0.15196990966796875, 0.1596508026123047, 0.16733169555664062, 0.17501258850097656, 0.1826934814453125, 0.19037437438964844, 0.19805526733398438, 0.2057361602783203, 0.21341705322265625, 0.2210979461669922, 0.22877883911132812, 0.23645973205566406, 0.244140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 5.0, 15.0, 27.0, 41.0, 68.0, 168.0, 414.0, 790.0, 1146.0, 714.0, 322.0, 178.0, 84.0, 43.0, 27.0, 16.0, 6.0, 8.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.217529296875, -0.21187591552734375, -0.2062225341796875, -0.20056915283203125, -0.194915771484375, -0.18926239013671875, -0.1836090087890625, -0.17795562744140625, -0.17230224609375, -0.16664886474609375, -0.1609954833984375, -0.15534210205078125, -0.149688720703125, -0.14403533935546875, -0.1383819580078125, -0.13272857666015625, -0.1270751953125, -0.12142181396484375, -0.1157684326171875, -0.11011505126953125, -0.104461669921875, -0.09880828857421875, -0.0931549072265625, -0.08750152587890625, -0.08184814453125, -0.07619476318359375, -0.0705413818359375, -0.06488800048828125, -0.059234619140625, -0.05358123779296875, -0.0479278564453125, -0.04227447509765625, -0.03662109375, -0.03096771240234375, -0.0253143310546875, -0.01966094970703125, -0.014007568359375, -0.00835418701171875, -0.0027008056640625, 0.00295257568359375, 0.00860595703125, 0.01425933837890625, 0.0199127197265625, 0.02556610107421875, 0.031219482421875, 0.03687286376953125, 0.0425262451171875, 0.04817962646484375, 0.0538330078125, 0.05948638916015625, 0.0651397705078125, 0.07079315185546875, 0.076446533203125, 0.08209991455078125, 0.0877532958984375, 0.09340667724609375, 0.09906005859375, 0.10471343994140625, 0.1103668212890625, 0.11602020263671875, 0.121673583984375, 0.12732696533203125, 0.1329803466796875, 0.13863372802734375, 0.144287109375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 9.0, 25.0, 32.0, 68.0, 104.0, 151.0, 177.0, 165.0, 119.0, 55.0, 35.0, 17.0, 12.0, 11.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3354883193969727, -1.3025181293487549, -1.2695478200912476, -1.2365776300430298, -1.2036073207855225, -1.1706371307373047, -1.137666940689087, -1.1046966314315796, -1.0717264413833618, -1.038756251335144, -1.0057859420776367, -0.972815752029419, -0.9398455023765564, -0.9068752527236938, -0.8739050626754761, -0.8409348130226135, -0.807964563369751, -0.7749943137168884, -0.7420240640640259, -0.7090538740158081, -0.6760836243629456, -0.643113374710083, -0.6101431846618652, -0.5771729350090027, -0.5442026853561401, -0.5112324357032776, -0.4782622158527374, -0.44529199600219727, -0.4123217463493347, -0.37935149669647217, -0.346381276845932, -0.31341105699539185, -0.28044092655181885, -0.2474706918001175, -0.21450045704841614, -0.18153022229671478, -0.14855998754501343, -0.11558975279331207, -0.08261951804161072, -0.04964928328990936, -0.016679048538208008, 0.016291186213493347, 0.0492614209651947, 0.08223165571689606, 0.11520189046859741, 0.14817212522029877, 0.18114235997200012, 0.21411259472370148, 0.24708282947540283, 0.2800530791282654, 0.31302329897880554, 0.3459935188293457, 0.37896376848220825, 0.4119340181350708, 0.44490423798561096, 0.4778744578361511, 0.5108447074890137, 0.5438149571418762, 0.5767852067947388, 0.6097553968429565, 0.6427256464958191, 0.6756958961486816, 0.7086660861968994, 0.741636335849762, 0.7746065855026245]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 10.0, 6.0, 12.0, 14.0, 14.0, 21.0, 26.0, 25.0, 24.0, 36.0, 41.0, 42.0, 43.0, 49.0, 41.0, 63.0, 64.0, 69.0, 52.0, 41.0, 34.0, 38.0, 25.0, 37.0, 26.0, 27.0, 18.0, 20.0, 13.0, 10.0, 11.0, 6.0, 6.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.5460447669029236, -0.5301352739334106, -0.5142258405685425, -0.49831634759902954, -0.482406884431839, -0.46649742126464844, -0.4505879282951355, -0.43467846512794495, -0.4187690019607544, -0.40285953879356384, -0.3869500756263733, -0.37104058265686035, -0.3551311194896698, -0.33922165632247925, -0.3233121633529663, -0.30740270018577576, -0.2914932370185852, -0.27558377385139465, -0.2596743106842041, -0.24376481771469116, -0.2278553545475006, -0.21194589138031006, -0.1960364133119583, -0.18012693524360657, -0.16421747207641602, -0.14830800890922546, -0.13239853084087372, -0.11648906022310257, -0.10057958960533142, -0.08467011898756027, -0.06876064836978912, -0.052851177752017975, -0.0369417667388916, -0.021032296121120453, -0.005122825503349304, 0.010786645114421844, 0.026696115732192993, 0.04260558634996414, 0.05851505696773529, 0.07442452758550644, 0.09033399820327759, 0.10624346882104874, 0.12215293943881989, 0.13806241750717163, 0.15397188067436218, 0.16988134384155273, 0.18579082190990448, 0.20170029997825623, 0.21760976314544678, 0.23351922631263733, 0.24942870438098907, 0.2653381824493408, 0.28124764561653137, 0.2971571087837219, 0.31306660175323486, 0.3289760649204254, 0.34488552808761597, 0.3607949912548065, 0.37670445442199707, 0.39261394739151, 0.40852341055870056, 0.4244328737258911, 0.44034236669540405, 0.4562518298625946, 0.47216129302978516]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 4.0, 2.0, 8.0, 6.0, 18.0, 30.0, 42.0, 46.0, 63.0, 108.0, 187.0, 270.0, 491.0, 880.0, 1574.0, 2736.0, 5424.0, 11164.0, 25279.0, 67304.0, 213227.0, 427156.0, 188179.0, 59669.0, 22984.0, 10492.0, 5013.0, 2602.0, 1436.0, 882.0, 452.0, 298.0, 183.0, 116.0, 70.0, 45.0, 33.0, 26.0, 19.0, 13.0, 8.0, 2.0, 5.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0], "bins": [-0.10028076171875, -0.09752941131591797, -0.09477806091308594, -0.0920267105102539, -0.08927536010742188, -0.08652400970458984, -0.08377265930175781, -0.08102130889892578, -0.07826995849609375, -0.07551860809326172, -0.07276725769042969, -0.07001590728759766, -0.06726455688476562, -0.0645132064819336, -0.06176185607910156, -0.05901050567626953, -0.0562591552734375, -0.05350780487060547, -0.05075645446777344, -0.048005104064941406, -0.045253753662109375, -0.042502403259277344, -0.03975105285644531, -0.03699970245361328, -0.03424835205078125, -0.03149700164794922, -0.028745651245117188, -0.025994300842285156, -0.023242950439453125, -0.020491600036621094, -0.017740249633789062, -0.014988899230957031, -0.012237548828125, -0.009486198425292969, -0.0067348480224609375, -0.003983497619628906, -0.001232147216796875, 0.0015192031860351562, 0.0042705535888671875, 0.007021903991699219, 0.00977325439453125, 0.012524604797363281, 0.015275955200195312, 0.018027305603027344, 0.020778656005859375, 0.023530006408691406, 0.026281356811523438, 0.02903270721435547, 0.0317840576171875, 0.03453540802001953, 0.03728675842285156, 0.040038108825683594, 0.042789459228515625, 0.045540809631347656, 0.04829216003417969, 0.05104351043701172, 0.05379486083984375, 0.05654621124267578, 0.05929756164550781, 0.062048912048339844, 0.06480026245117188, 0.0675516128540039, 0.07030296325683594, 0.07305431365966797, 0.0758056640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 7.0, 7.0, 9.0, 7.0, 6.0, 6.0, 13.0, 23.0, 14.0, 15.0, 25.0, 20.0, 23.0, 31.0, 30.0, 29.0, 53.0, 35.0, 49.0, 53.0, 48.0, 42.0, 52.0, 45.0, 41.0, 56.0, 32.0, 38.0, 28.0, 24.0, 20.0, 24.0, 21.0, 18.0, 21.0, 8.0, 10.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.045562744140625, -0.04403972625732422, -0.04251670837402344, -0.040993690490722656, -0.039470672607421875, -0.037947654724121094, -0.03642463684082031, -0.03490161895751953, -0.03337860107421875, -0.03185558319091797, -0.030332565307617188, -0.028809547424316406, -0.027286529541015625, -0.025763511657714844, -0.024240493774414062, -0.02271747589111328, -0.0211944580078125, -0.01967144012451172, -0.018148422241210938, -0.016625404357910156, -0.015102386474609375, -0.013579368591308594, -0.012056350708007812, -0.010533332824707031, -0.00901031494140625, -0.007487297058105469, -0.0059642791748046875, -0.004441261291503906, -0.002918243408203125, -0.0013952255249023438, 0.0001277923583984375, 0.0016508102416992188, 0.003173828125, 0.004696846008300781, 0.0062198638916015625, 0.007742881774902344, 0.009265899658203125, 0.010788917541503906, 0.012311935424804688, 0.013834953308105469, 0.01535797119140625, 0.01688098907470703, 0.018404006958007812, 0.019927024841308594, 0.021450042724609375, 0.022973060607910156, 0.024496078491210938, 0.02601909637451172, 0.0275421142578125, 0.02906513214111328, 0.030588150024414062, 0.032111167907714844, 0.033634185791015625, 0.035157203674316406, 0.03668022155761719, 0.03820323944091797, 0.03972625732421875, 0.04124927520751953, 0.04277229309082031, 0.044295310974121094, 0.045818328857421875, 0.047341346740722656, 0.04886436462402344, 0.05038738250732422, 0.051910400390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 7.0, 4.0, 7.0, 6.0, 9.0, 9.0, 10.0, 17.0, 23.0, 40.0, 52.0, 75.0, 112.0, 153.0, 233.0, 328.0, 609.0, 1166.0, 2584.0, 10416.0, 109754.0, 847878.0, 62746.0, 7525.0, 2172.0, 1031.0, 509.0, 366.0, 233.0, 165.0, 86.0, 68.0, 48.0, 28.0, 26.0, 21.0, 12.0, 9.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.209716796875, -0.20343780517578125, -0.1971588134765625, -0.19087982177734375, -0.184600830078125, -0.17832183837890625, -0.1720428466796875, -0.16576385498046875, -0.15948486328125, -0.15320587158203125, -0.1469268798828125, -0.14064788818359375, -0.134368896484375, -0.12808990478515625, -0.1218109130859375, -0.11553192138671875, -0.1092529296875, -0.10297393798828125, -0.0966949462890625, -0.09041595458984375, -0.084136962890625, -0.07785797119140625, -0.0715789794921875, -0.06529998779296875, -0.05902099609375, -0.05274200439453125, -0.0464630126953125, -0.04018402099609375, -0.033905029296875, -0.02762603759765625, -0.0213470458984375, -0.01506805419921875, -0.0087890625, -0.00251007080078125, 0.0037689208984375, 0.01004791259765625, 0.016326904296875, 0.02260589599609375, 0.0288848876953125, 0.03516387939453125, 0.04144287109375, 0.04772186279296875, 0.0540008544921875, 0.06027984619140625, 0.066558837890625, 0.07283782958984375, 0.0791168212890625, 0.08539581298828125, 0.0916748046875, 0.09795379638671875, 0.1042327880859375, 0.11051177978515625, 0.116790771484375, 0.12306976318359375, 0.1293487548828125, 0.13562774658203125, 0.14190673828125, 0.14818572998046875, 0.1544647216796875, 0.16074371337890625, 0.167022705078125, 0.17330169677734375, 0.1795806884765625, 0.18585968017578125, 0.192138671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 21.0, 18.0, 27.0, 38.0, 27.0, 37.0, 50.0, 68.0, 61.0, 57.0, 72.0, 64.0, 60.0, 77.0, 63.0, 43.0, 36.0, 29.0, 28.0, 19.0, 19.0, 15.0, 12.0, 11.0, 6.0, 3.0, 1.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.245361328125, -0.2376270294189453, -0.22989273071289062, -0.22215843200683594, -0.21442413330078125, -0.20668983459472656, -0.19895553588867188, -0.1912212371826172, -0.1834869384765625, -0.1757526397705078, -0.16801834106445312, -0.16028404235839844, -0.15254974365234375, -0.14481544494628906, -0.13708114624023438, -0.1293468475341797, -0.121612548828125, -0.11387825012207031, -0.10614395141601562, -0.09840965270996094, -0.09067535400390625, -0.08294105529785156, -0.07520675659179688, -0.06747245788574219, -0.0597381591796875, -0.05200386047363281, -0.044269561767578125, -0.03653526306152344, -0.02880096435546875, -0.021066665649414062, -0.013332366943359375, -0.0055980682373046875, 0.00213623046875, 0.009870529174804688, 0.017604827880859375, 0.025339126586914062, 0.03307342529296875, 0.04080772399902344, 0.048542022705078125, 0.05627632141113281, 0.0640106201171875, 0.07174491882324219, 0.07947921752929688, 0.08721351623535156, 0.09494781494140625, 0.10268211364746094, 0.11041641235351562, 0.11815071105957031, 0.125885009765625, 0.1336193084716797, 0.14135360717773438, 0.14908790588378906, 0.15682220458984375, 0.16455650329589844, 0.17229080200195312, 0.1800251007080078, 0.1877593994140625, 0.1954936981201172, 0.20322799682617188, 0.21096229553222656, 0.21869659423828125, 0.22643089294433594, 0.23416519165039062, 0.2418994903564453, 0.2496337890625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 16.0, 17.0, 17.0, 24.0, 19.0, 40.0, 42.0, 80.0, 130.0, 281.0, 663.0, 1934.0, 7682.0, 64371.0, 892606.0, 69170.0, 8126.0, 1955.0, 658.0, 291.0, 123.0, 55.0, 67.0, 40.0, 34.0, 25.0, 19.0, 17.0, 13.0, 8.0, 7.0, 3.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061004638671875, -0.05886507034301758, -0.056725502014160156, -0.054585933685302734, -0.05244636535644531, -0.05030679702758789, -0.04816722869873047, -0.04602766036987305, -0.043888092041015625, -0.0417485237121582, -0.03960895538330078, -0.03746938705444336, -0.03532981872558594, -0.033190250396728516, -0.031050682067871094, -0.028911113739013672, -0.02677154541015625, -0.024631977081298828, -0.022492408752441406, -0.020352840423583984, -0.018213272094726562, -0.01607370376586914, -0.013934135437011719, -0.011794567108154297, -0.009654998779296875, -0.007515430450439453, -0.005375862121582031, -0.0032362937927246094, -0.0010967254638671875, 0.0010428428649902344, 0.0031824111938476562, 0.005321979522705078, 0.0074615478515625, 0.009601116180419922, 0.011740684509277344, 0.013880252838134766, 0.016019821166992188, 0.01815938949584961, 0.02029895782470703, 0.022438526153564453, 0.024578094482421875, 0.026717662811279297, 0.02885723114013672, 0.03099679946899414, 0.03313636779785156, 0.035275936126708984, 0.037415504455566406, 0.03955507278442383, 0.04169464111328125, 0.04383420944213867, 0.045973777770996094, 0.048113346099853516, 0.05025291442871094, 0.05239248275756836, 0.05453205108642578, 0.0566716194152832, 0.058811187744140625, 0.06095075607299805, 0.06309032440185547, 0.06522989273071289, 0.06736946105957031, 0.06950902938842773, 0.07164859771728516, 0.07378816604614258, 0.075927734375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 7.0, 5.0, 4.0, 5.0, 7.0, 6.0, 14.0, 18.0, 29.0, 61.0, 82.0, 115.0, 138.0, 122.0, 112.0, 78.0, 53.0, 31.0, 25.0, 17.0, 11.0, 15.0, 9.0, 4.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.490945816040039e-05, -6.30086287856102e-05, -6.110779941082001e-05, -5.9206970036029816e-05, -5.7306140661239624e-05, -5.540531128644943e-05, -5.350448191165924e-05, -5.160365253686905e-05, -4.970282316207886e-05, -4.7801993787288666e-05, -4.5901164412498474e-05, -4.400033503770828e-05, -4.209950566291809e-05, -4.01986762881279e-05, -3.829784691333771e-05, -3.6397017538547516e-05, -3.4496188163757324e-05, -3.259535878896713e-05, -3.069452941417694e-05, -2.879370003938675e-05, -2.6892870664596558e-05, -2.4992041289806366e-05, -2.3091211915016174e-05, -2.1190382540225983e-05, -1.928955316543579e-05, -1.73887237906456e-05, -1.5487894415855408e-05, -1.3587065041065216e-05, -1.1686235666275024e-05, -9.785406291484833e-06, -7.884576916694641e-06, -5.9837475419044495e-06, -4.082918167114258e-06, -2.182088792324066e-06, -2.812594175338745e-07, 1.6195699572563171e-06, 3.520399332046509e-06, 5.4212287068367004e-06, 7.322058081626892e-06, 9.222887456417084e-06, 1.1123716831207275e-05, 1.3024546205997467e-05, 1.4925375580787659e-05, 1.682620495557785e-05, 1.8727034330368042e-05, 2.0627863705158234e-05, 2.2528693079948425e-05, 2.4429522454738617e-05, 2.633035182952881e-05, 2.8231181204319e-05, 3.0132010579109192e-05, 3.2032839953899384e-05, 3.3933669328689575e-05, 3.583449870347977e-05, 3.773532807826996e-05, 3.963615745306015e-05, 4.153698682785034e-05, 4.3437816202640533e-05, 4.5338645577430725e-05, 4.723947495222092e-05, 4.914030432701111e-05, 5.10411337018013e-05, 5.294196307659149e-05, 5.484279245138168e-05, 5.6743621826171875e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 8.0, 11.0, 27.0, 28.0, 22.0, 56.0, 81.0, 131.0, 193.0, 276.0, 562.0, 1174.0, 2679.0, 8011.0, 35320.0, 237535.0, 685586.0, 57975.0, 12196.0, 3592.0, 1355.0, 744.0, 340.0, 194.0, 146.0, 91.0, 75.0, 39.0, 35.0, 15.0, 17.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.043701171875, -0.04238271713256836, -0.04106426239013672, -0.03974580764770508, -0.03842735290527344, -0.0371088981628418, -0.035790443420410156, -0.034471988677978516, -0.033153533935546875, -0.031835079193115234, -0.030516624450683594, -0.029198169708251953, -0.027879714965820312, -0.026561260223388672, -0.02524280548095703, -0.02392435073852539, -0.02260589599609375, -0.02128744125366211, -0.01996898651123047, -0.018650531768798828, -0.017332077026367188, -0.016013622283935547, -0.014695167541503906, -0.013376712799072266, -0.012058258056640625, -0.010739803314208984, -0.009421348571777344, -0.008102893829345703, -0.0067844390869140625, -0.005465984344482422, -0.004147529602050781, -0.0028290748596191406, -0.0015106201171875, -0.00019216537475585938, 0.0011262893676757812, 0.002444744110107422, 0.0037631988525390625, 0.005081653594970703, 0.006400108337402344, 0.007718563079833984, 0.009037017822265625, 0.010355472564697266, 0.011673927307128906, 0.012992382049560547, 0.014310836791992188, 0.015629291534423828, 0.01694774627685547, 0.01826620101928711, 0.01958465576171875, 0.02090311050415039, 0.02222156524658203, 0.023540019989013672, 0.024858474731445312, 0.026176929473876953, 0.027495384216308594, 0.028813838958740234, 0.030132293701171875, 0.031450748443603516, 0.032769203186035156, 0.0340876579284668, 0.03540611267089844, 0.03672456741333008, 0.03804302215576172, 0.03936147689819336, 0.040679931640625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 6.0, 6.0, 9.0, 11.0, 9.0, 13.0, 28.0, 29.0, 37.0, 46.0, 57.0, 48.0, 68.0, 105.0, 112.0, 92.0, 78.0, 45.0, 46.0, 41.0, 20.0, 22.0, 20.0, 20.0, 15.0, 6.0, 5.0, 8.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0396728515625, -0.038512229919433594, -0.03735160827636719, -0.03619098663330078, -0.035030364990234375, -0.03386974334716797, -0.03270912170410156, -0.031548500061035156, -0.03038787841796875, -0.029227256774902344, -0.028066635131835938, -0.02690601348876953, -0.025745391845703125, -0.02458477020263672, -0.023424148559570312, -0.022263526916503906, -0.0211029052734375, -0.019942283630371094, -0.018781661987304688, -0.01762104034423828, -0.016460418701171875, -0.015299797058105469, -0.014139175415039062, -0.012978553771972656, -0.01181793212890625, -0.010657310485839844, -0.009496688842773438, -0.008336067199707031, -0.007175445556640625, -0.006014823913574219, -0.0048542022705078125, -0.0036935806274414062, -0.002532958984375, -0.0013723373413085938, -0.0002117156982421875, 0.0009489059448242188, 0.002109527587890625, 0.0032701492309570312, 0.0044307708740234375, 0.005591392517089844, 0.00675201416015625, 0.007912635803222656, 0.009073257446289062, 0.010233879089355469, 0.011394500732421875, 0.012555122375488281, 0.013715744018554688, 0.014876365661621094, 0.0160369873046875, 0.017197608947753906, 0.018358230590820312, 0.01951885223388672, 0.020679473876953125, 0.02184009552001953, 0.023000717163085938, 0.024161338806152344, 0.02532196044921875, 0.026482582092285156, 0.027643203735351562, 0.02880382537841797, 0.029964447021484375, 0.03112506866455078, 0.03228569030761719, 0.033446311950683594, 0.03460693359375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 21.0, 47.0, 116.0, 283.0, 374.0, 95.0, 27.0, 8.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8900411128997803, -1.8346621990203857, -1.7792831659317017, -1.7239042520523071, -1.668525218963623, -1.6131463050842285, -1.557767391204834, -1.50238835811615, -1.4470093250274658, -1.3916304111480713, -1.3362513780593872, -1.2808724641799927, -1.2254934310913086, -1.170114517211914, -1.1147356033325195, -1.0593565702438354, -1.003977656364441, -0.9485986828804016, -0.8932197093963623, -0.8378407955169678, -0.7824617624282837, -0.7270828485488892, -0.6717038750648499, -0.6163249015808105, -0.5609459280967712, -0.5055669546127319, -0.4501879811286926, -0.3948090374469757, -0.3394300639629364, -0.2840510904788971, -0.22867214679718018, -0.17329317331314087, -0.11791419982910156, -0.06253523379564285, -0.007156267762184143, 0.04822269082069397, 0.10360166430473328, 0.15898063778877258, 0.2143595814704895, 0.2697385549545288, 0.3251175284385681, 0.3804965019226074, 0.43587547540664673, 0.49125441908836365, 0.5466333627700806, 0.6020123958587646, 0.6573913097381592, 0.7127702832221985, 0.7681492567062378, 0.8235282301902771, 0.8789072036743164, 0.9342861175537109, 0.989665150642395, 1.0450440645217896, 1.1004230976104736, 1.1558020114898682, 1.2111809253692627, 1.2665598392486572, 1.3219388723373413, 1.3773177862167358, 1.43269681930542, 1.4880757331848145, 1.543454647064209, 1.598833680152893, 1.6542127132415771]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 10.0, 8.0, 11.0, 6.0, 15.0, 12.0, 18.0, 20.0, 21.0, 28.0, 33.0, 27.0, 30.0, 46.0, 103.0, 168.0, 93.0, 47.0, 40.0, 30.0, 30.0, 26.0, 22.0, 19.0, 14.0, 19.0, 13.0, 21.0, 14.0, 8.0, 11.0, 5.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7498286962509155, -0.7225329279899597, -0.6952372193336487, -0.6679414510726929, -0.6406457424163818, -0.613349974155426, -0.5860542058944702, -0.5587584972381592, -0.5314627289772034, -0.5041669607162476, -0.4768712520599365, -0.4495754837989807, -0.4222797453403473, -0.39498400688171387, -0.36768823862075806, -0.34039250016212463, -0.3130967617034912, -0.2858010232448578, -0.25850528478622437, -0.23120951652526855, -0.20391377806663513, -0.1766180396080017, -0.1493222862482071, -0.12202653288841248, -0.09473079442977905, -0.06743504852056503, -0.04013930261135101, -0.012843556702136993, 0.014452189207077026, 0.04174792766571045, 0.06904368102550507, 0.09633943438529968, 0.1236351728439331, 0.15093091130256653, 0.17822666466236115, 0.20552241802215576, 0.23281815648078918, 0.2601138949394226, 0.2874096632003784, 0.31470540165901184, 0.34200114011764526, 0.3692968785762787, 0.3965926170349121, 0.4238883852958679, 0.45118412375450134, 0.47847986221313477, 0.5057756304740906, 0.5330713987350464, 0.5603671073913574, 0.5876628756523132, 0.6149585843086243, 0.6422543525695801, 0.6695500612258911, 0.6968458294868469, 0.7241415977478027, 0.7514373064041138, 0.7787330746650696, 0.8060288429260254, 0.8333245515823364, 0.8606203198432922, 0.887916088104248, 0.9152117967605591, 0.9425075650215149, 0.9698033332824707, 0.9970990419387817]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 7.0, 12.0, 10.0, 22.0, 42.0, 54.0, 116.0, 198.0, 481.0, 999.0, 2355.0, 7104.0, 29282.0, 205371.0, 1602057.0, 2003277.0, 292658.0, 36544.0, 8459.0, 2897.0, 1184.0, 537.0, 280.0, 147.0, 75.0, 34.0, 29.0, 17.0, 17.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.1086578369140625, -0.105560302734375, -0.1024627685546875, -0.099365234375, -0.0962677001953125, -0.093170166015625, -0.0900726318359375, -0.08697509765625, -0.0838775634765625, -0.080780029296875, -0.0776824951171875, -0.0745849609375, -0.0714874267578125, -0.068389892578125, -0.0652923583984375, -0.06219482421875, -0.0590972900390625, -0.055999755859375, -0.0529022216796875, -0.0498046875, -0.0467071533203125, -0.043609619140625, -0.0405120849609375, -0.03741455078125, -0.0343170166015625, -0.031219482421875, -0.0281219482421875, -0.0250244140625, -0.0219268798828125, -0.018829345703125, -0.0157318115234375, -0.01263427734375, -0.0095367431640625, -0.006439208984375, -0.0033416748046875, -0.000244140625, 0.0028533935546875, 0.005950927734375, 0.0090484619140625, 0.01214599609375, 0.0152435302734375, 0.018341064453125, 0.0214385986328125, 0.0245361328125, 0.0276336669921875, 0.030731201171875, 0.0338287353515625, 0.03692626953125, 0.0400238037109375, 0.043121337890625, 0.0462188720703125, 0.04931640625, 0.0524139404296875, 0.055511474609375, 0.0586090087890625, 0.06170654296875, 0.0648040771484375, 0.067901611328125, 0.0709991455078125, 0.0740966796875, 0.0771942138671875, 0.080291748046875, 0.0833892822265625, 0.08648681640625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 5.0, 4.0, 5.0, 10.0, 10.0, 13.0, 13.0, 18.0, 23.0, 23.0, 23.0, 25.0, 30.0, 25.0, 41.0, 36.0, 43.0, 38.0, 44.0, 50.0, 38.0, 39.0, 40.0, 42.0, 47.0, 37.0, 42.0, 34.0, 37.0, 27.0, 18.0, 20.0, 18.0, 20.0, 15.0, 12.0, 10.0, 5.0, 5.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.037872314453125, -0.0364985466003418, -0.035124778747558594, -0.03375101089477539, -0.03237724304199219, -0.031003475189208984, -0.02962970733642578, -0.028255939483642578, -0.026882171630859375, -0.025508403778076172, -0.02413463592529297, -0.022760868072509766, -0.021387100219726562, -0.02001333236694336, -0.018639564514160156, -0.017265796661376953, -0.01589202880859375, -0.014518260955810547, -0.013144493103027344, -0.01177072525024414, -0.010396957397460938, -0.009023189544677734, -0.007649421691894531, -0.006275653839111328, -0.004901885986328125, -0.003528118133544922, -0.0021543502807617188, -0.0007805824279785156, 0.0005931854248046875, 0.0019669532775878906, 0.0033407211303710938, 0.004714488983154297, 0.0060882568359375, 0.007462024688720703, 0.008835792541503906, 0.01020956039428711, 0.011583328247070312, 0.012957096099853516, 0.014330863952636719, 0.015704631805419922, 0.017078399658203125, 0.018452167510986328, 0.01982593536376953, 0.021199703216552734, 0.022573471069335938, 0.02394723892211914, 0.025321006774902344, 0.026694774627685547, 0.02806854248046875, 0.029442310333251953, 0.030816078186035156, 0.03218984603881836, 0.03356361389160156, 0.034937381744384766, 0.03631114959716797, 0.03768491744995117, 0.039058685302734375, 0.04043245315551758, 0.04180622100830078, 0.043179988861083984, 0.04455375671386719, 0.04592752456665039, 0.047301292419433594, 0.0486750602722168, 0.050048828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 2.0, 1.0, 7.0, 11.0, 8.0, 39.0, 64.0, 93.0, 149.0, 341.0, 759.0, 2249.0, 15399.0, 4028352.0, 140823.0, 4121.0, 1017.0, 409.0, 208.0, 100.0, 47.0, 28.0, 19.0, 13.0, 12.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.428466796875, -0.4124412536621094, -0.39641571044921875, -0.3803901672363281, -0.3643646240234375, -0.3483390808105469, -0.33231353759765625, -0.3162879943847656, -0.300262451171875, -0.2842369079589844, -0.26821136474609375, -0.2521858215332031, -0.2361602783203125, -0.22013473510742188, -0.20410919189453125, -0.18808364868164062, -0.17205810546875, -0.15603256225585938, -0.14000701904296875, -0.12398147583007812, -0.1079559326171875, -0.09193038940429688, -0.07590484619140625, -0.059879302978515625, -0.043853759765625, -0.027828216552734375, -0.01180267333984375, 0.004222869873046875, 0.0202484130859375, 0.036273956298828125, 0.05229949951171875, 0.06832504272460938, 0.0843505859375, 0.10037612915039062, 0.11640167236328125, 0.13242721557617188, 0.1484527587890625, 0.16447830200195312, 0.18050384521484375, 0.19652938842773438, 0.212554931640625, 0.22858047485351562, 0.24460601806640625, 0.2606315612792969, 0.2766571044921875, 0.2926826477050781, 0.30870819091796875, 0.3247337341308594, 0.34075927734375, 0.3567848205566406, 0.37281036376953125, 0.3888359069824219, 0.4048614501953125, 0.4208869934082031, 0.43691253662109375, 0.4529380798339844, 0.468963623046875, 0.4849891662597656, 0.5010147094726562, 0.5170402526855469, 0.5330657958984375, 0.5490913391113281, 0.5651168823242188, 0.5811424255371094, 0.59716796875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 13.0, 24.0, 31.0, 44.0, 82.0, 176.0, 279.0, 540.0, 987.0, 906.0, 440.0, 275.0, 137.0, 55.0, 37.0, 14.0, 15.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.474853515625, -0.4653205871582031, -0.45578765869140625, -0.4462547302246094, -0.4367218017578125, -0.4271888732910156, -0.41765594482421875, -0.4081230163574219, -0.398590087890625, -0.3890571594238281, -0.37952423095703125, -0.3699913024902344, -0.3604583740234375, -0.3509254455566406, -0.34139251708984375, -0.3318595886230469, -0.32232666015625, -0.3127937316894531, -0.30326080322265625, -0.2937278747558594, -0.2841949462890625, -0.2746620178222656, -0.26512908935546875, -0.2555961608886719, -0.246063232421875, -0.23653030395507812, -0.22699737548828125, -0.21746444702148438, -0.2079315185546875, -0.19839859008789062, -0.18886566162109375, -0.17933273315429688, -0.1697998046875, -0.16026687622070312, -0.15073394775390625, -0.14120101928710938, -0.1316680908203125, -0.12213516235351562, -0.11260223388671875, -0.10306930541992188, -0.093536376953125, -0.08400344848632812, -0.07447052001953125, -0.06493759155273438, -0.0554046630859375, -0.045871734619140625, -0.03633880615234375, -0.026805877685546875, -0.01727294921875, -0.007740020751953125, 0.00179290771484375, 0.011325836181640625, 0.0208587646484375, 0.030391693115234375, 0.03992462158203125, 0.049457550048828125, 0.058990478515625, 0.06852340698242188, 0.07805633544921875, 0.08758926391601562, 0.0971221923828125, 0.10665512084960938, 0.11618804931640625, 0.12572097778320312, 0.13525390625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 9.0, 11.0, 42.0, 78.0, 210.0, 327.0, 184.0, 79.0, 24.0, 13.0, 6.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.810626029968262, -5.695389747619629, -5.580153465270996, -5.464917182922363, -5.349680423736572, -5.2344441413879395, -5.119207859039307, -5.003971576690674, -4.888735294342041, -4.773499011993408, -4.658262729644775, -4.543025970458984, -4.427789688110352, -4.312553405761719, -4.197317123413086, -4.082080841064453, -3.966844320297241, -3.8516080379486084, -3.7363715171813965, -3.6211352348327637, -3.505898952484131, -3.390662670135498, -3.275426149368286, -3.1601898670196533, -3.0449533462524414, -2.9297170639038086, -2.8144805431365967, -2.699244260787964, -2.584007978439331, -2.468771457672119, -2.3535351753234863, -2.2382988929748535, -2.1230626106262207, -2.007826328277588, -1.8925899267196655, -1.7773535251617432, -1.6621172428131104, -1.546880841255188, -1.4316444396972656, -1.3164081573486328, -1.201171636581421, -1.0859352350234985, -0.9706989526748657, -0.8554625511169434, -0.7402262091636658, -0.6249898672103882, -0.5097534656524658, -0.39451712369918823, -0.27928078174591064, -0.16404442489147186, -0.04880806803703308, 0.0664283037185669, 0.18166464567184448, 0.29690098762512207, 0.41213738918304443, 0.527373731136322, 0.6426100730895996, 0.7578464150428772, 0.8730827569961548, 0.9883191585540771, 1.10355544090271, 1.2187918424606323, 1.3340282440185547, 1.4492645263671875, 1.5645009279251099]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 5.0, 3.0, 12.0, 12.0, 7.0, 12.0, 26.0, 25.0, 29.0, 21.0, 38.0, 47.0, 46.0, 56.0, 64.0, 59.0, 82.0, 68.0, 52.0, 36.0, 55.0, 31.0, 29.0, 38.0, 29.0, 20.0, 21.0, 12.0, 13.0, 8.0, 12.0, 10.0, 3.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2085697650909424, -1.1696727275848389, -1.1307755708694458, -1.0918785333633423, -1.0529813766479492, -1.0140843391418457, -0.9751872420310974, -0.9362901449203491, -0.8973930478096008, -0.8584959506988525, -0.8195988535881042, -0.780701756477356, -0.7418047189712524, -0.7029075622558594, -0.6640105247497559, -0.6251134276390076, -0.5862163305282593, -0.547319233417511, -0.5084221363067627, -0.4695250689983368, -0.4306279718875885, -0.3917308747768402, -0.3528338074684143, -0.313936710357666, -0.2750396132469177, -0.23614251613616943, -0.19724543392658234, -0.15834835171699524, -0.11945125460624695, -0.08055415749549866, -0.04165707528591156, -0.002759993076324463, 0.03613710403442383, 0.07503419369459152, 0.11393128335475922, 0.1528283655643463, 0.1917254626750946, 0.2306225597858429, 0.2695196270942688, 0.3084167242050171, 0.3473138213157654, 0.38621091842651367, 0.42510801553726196, 0.46400508284568787, 0.5029021501541138, 0.5417993068695068, 0.5806963443756104, 0.6195934414863586, 0.6584905385971069, 0.6973876357078552, 0.7362847328186035, 0.7751818299293518, 0.8140789270401001, 0.8529759645462036, 0.8918730616569519, 0.9307701587677002, 0.9696672558784485, 1.0085643529891968, 1.0474613904953003, 1.0863585472106934, 1.1252555847167969, 1.16415274143219, 1.2030497789382935, 1.2419469356536865, 1.28084397315979]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 1.0, 6.0, 10.0, 8.0, 16.0, 22.0, 31.0, 37.0, 69.0, 95.0, 156.0, 294.0, 582.0, 1188.0, 2709.0, 7626.0, 29243.0, 195405.0, 711382.0, 75862.0, 15469.0, 4760.0, 1769.0, 775.0, 393.0, 226.0, 140.0, 91.0, 54.0, 36.0, 37.0, 16.0, 10.0, 11.0, 5.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1556396484375, -0.1506633758544922, -0.14568710327148438, -0.14071083068847656, -0.13573455810546875, -0.13075828552246094, -0.12578201293945312, -0.12080574035644531, -0.1158294677734375, -0.11085319519042969, -0.10587692260742188, -0.10090065002441406, -0.09592437744140625, -0.09094810485839844, -0.08597183227539062, -0.08099555969238281, -0.076019287109375, -0.07104301452636719, -0.06606674194335938, -0.06109046936035156, -0.05611419677734375, -0.05113792419433594, -0.046161651611328125, -0.04118537902832031, -0.0362091064453125, -0.031232833862304688, -0.026256561279296875, -0.021280288696289062, -0.01630401611328125, -0.011327743530273438, -0.006351470947265625, -0.0013751983642578125, 0.00360107421875, 0.008577346801757812, 0.013553619384765625, 0.018529891967773438, 0.02350616455078125, 0.028482437133789062, 0.033458709716796875, 0.03843498229980469, 0.0434112548828125, 0.04838752746582031, 0.053363800048828125, 0.05834007263183594, 0.06331634521484375, 0.06829261779785156, 0.07326889038085938, 0.07824516296386719, 0.083221435546875, 0.08819770812988281, 0.09317398071289062, 0.09815025329589844, 0.10312652587890625, 0.10810279846191406, 0.11307907104492188, 0.11805534362792969, 0.1230316162109375, 0.1280078887939453, 0.13298416137695312, 0.13796043395996094, 0.14293670654296875, 0.14791297912597656, 0.15288925170898438, 0.1578655242919922, 0.162841796875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 9.0, 19.0, 11.0, 17.0, 28.0, 33.0, 38.0, 54.0, 61.0, 54.0, 55.0, 64.0, 78.0, 62.0, 68.0, 57.0, 67.0, 47.0, 35.0, 33.0, 34.0, 18.0, 14.0, 13.0, 8.0, 8.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08624267578125, -0.08343219757080078, -0.08062171936035156, -0.07781124114990234, -0.07500076293945312, -0.0721902847290039, -0.06937980651855469, -0.06656932830810547, -0.06375885009765625, -0.06094837188720703, -0.05813789367675781, -0.055327415466308594, -0.052516937255859375, -0.049706459045410156, -0.04689598083496094, -0.04408550262451172, -0.0412750244140625, -0.03846454620361328, -0.03565406799316406, -0.032843589782714844, -0.030033111572265625, -0.027222633361816406, -0.024412155151367188, -0.02160167694091797, -0.01879119873046875, -0.01598072052001953, -0.013170242309570312, -0.010359764099121094, -0.007549285888671875, -0.004738807678222656, -0.0019283294677734375, 0.0008821487426757812, 0.003692626953125, 0.006503105163574219, 0.009313583374023438, 0.012124061584472656, 0.014934539794921875, 0.017745018005371094, 0.020555496215820312, 0.02336597442626953, 0.02617645263671875, 0.02898693084716797, 0.03179740905761719, 0.034607887268066406, 0.037418365478515625, 0.040228843688964844, 0.04303932189941406, 0.04584980010986328, 0.0486602783203125, 0.05147075653076172, 0.05428123474121094, 0.057091712951660156, 0.059902191162109375, 0.0627126693725586, 0.06552314758300781, 0.06833362579345703, 0.07114410400390625, 0.07395458221435547, 0.07676506042480469, 0.0795755386352539, 0.08238601684570312, 0.08519649505615234, 0.08800697326660156, 0.09081745147705078, 0.0936279296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 16.0, 19.0, 20.0, 35.0, 32.0, 60.0, 83.0, 137.0, 188.0, 328.0, 579.0, 1177.0, 3680.0, 18563.0, 304601.0, 691998.0, 20512.0, 3850.0, 1197.0, 585.0, 296.0, 205.0, 123.0, 79.0, 63.0, 34.0, 27.0, 17.0, 21.0, 9.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1348876953125, -0.13023948669433594, -0.12559127807617188, -0.12094306945800781, -0.11629486083984375, -0.11164665222167969, -0.10699844360351562, -0.10235023498535156, -0.0977020263671875, -0.09305381774902344, -0.08840560913085938, -0.08375740051269531, -0.07910919189453125, -0.07446098327636719, -0.06981277465820312, -0.06516456604003906, -0.060516357421875, -0.05586814880371094, -0.051219940185546875, -0.04657173156738281, -0.04192352294921875, -0.03727531433105469, -0.032627105712890625, -0.027978897094726562, -0.0233306884765625, -0.018682479858398438, -0.014034271240234375, -0.009386062622070312, -0.00473785400390625, -8.96453857421875e-05, 0.004558563232421875, 0.009206771850585938, 0.01385498046875, 0.018503189086914062, 0.023151397705078125, 0.027799606323242188, 0.03244781494140625, 0.03709602355957031, 0.041744232177734375, 0.04639244079589844, 0.0510406494140625, 0.05568885803222656, 0.060337066650390625, 0.06498527526855469, 0.06963348388671875, 0.07428169250488281, 0.07892990112304688, 0.08357810974121094, 0.088226318359375, 0.09287452697753906, 0.09752273559570312, 0.10217094421386719, 0.10681915283203125, 0.11146736145019531, 0.11611557006835938, 0.12076377868652344, 0.1254119873046875, 0.13006019592285156, 0.13470840454101562, 0.1393566131591797, 0.14400482177734375, 0.1486530303955078, 0.15330123901367188, 0.15794944763183594, 0.16259765625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 4.0, 8.0, 11.0, 11.0, 10.0, 11.0, 12.0, 25.0, 24.0, 22.0, 30.0, 29.0, 39.0, 45.0, 61.0, 64.0, 67.0, 73.0, 63.0, 67.0, 48.0, 45.0, 49.0, 30.0, 25.0, 13.0, 21.0, 14.0, 12.0, 13.0, 6.0, 5.0, 6.0, 7.0, 6.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2313232421875, -0.2239246368408203, -0.21652603149414062, -0.20912742614746094, -0.20172882080078125, -0.19433021545410156, -0.18693161010742188, -0.1795330047607422, -0.1721343994140625, -0.1647357940673828, -0.15733718872070312, -0.14993858337402344, -0.14253997802734375, -0.13514137268066406, -0.12774276733398438, -0.12034416198730469, -0.112945556640625, -0.10554695129394531, -0.09814834594726562, -0.09074974060058594, -0.08335113525390625, -0.07595252990722656, -0.06855392456054688, -0.06115531921386719, -0.0537567138671875, -0.04635810852050781, -0.038959503173828125, -0.03156089782714844, -0.02416229248046875, -0.016763687133789062, -0.009365081787109375, -0.0019664764404296875, 0.00543212890625, 0.012830734252929688, 0.020229339599609375, 0.027627944946289062, 0.03502655029296875, 0.04242515563964844, 0.049823760986328125, 0.05722236633300781, 0.0646209716796875, 0.07201957702636719, 0.07941818237304688, 0.08681678771972656, 0.09421539306640625, 0.10161399841308594, 0.10901260375976562, 0.11641120910644531, 0.123809814453125, 0.1312084197998047, 0.13860702514648438, 0.14600563049316406, 0.15340423583984375, 0.16080284118652344, 0.16820144653320312, 0.1756000518798828, 0.1829986572265625, 0.1903972625732422, 0.19779586791992188, 0.20519447326660156, 0.21259307861328125, 0.21999168395996094, 0.22739028930664062, 0.2347888946533203, 0.2421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 6.0, 10.0, 10.0, 14.0, 19.0, 27.0, 33.0, 42.0, 46.0, 73.0, 106.0, 228.0, 400.0, 857.0, 2425.0, 8219.0, 51227.0, 918195.0, 53657.0, 8624.0, 2376.0, 917.0, 444.0, 182.0, 121.0, 71.0, 52.0, 40.0, 27.0, 15.0, 14.0, 16.0, 12.0, 6.0, 8.0, 4.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0264129638671875, -0.025600433349609375, -0.02478790283203125, -0.023975372314453125, -0.023162841796875, -0.022350311279296875, -0.02153778076171875, -0.020725250244140625, -0.0199127197265625, -0.019100189208984375, -0.01828765869140625, -0.017475128173828125, -0.01666259765625, -0.015850067138671875, -0.01503753662109375, -0.014225006103515625, -0.0134124755859375, -0.012599945068359375, -0.01178741455078125, -0.010974884033203125, -0.010162353515625, -0.009349822998046875, -0.00853729248046875, -0.007724761962890625, -0.0069122314453125, -0.006099700927734375, -0.00528717041015625, -0.004474639892578125, -0.003662109375, -0.002849578857421875, -0.00203704833984375, -0.001224517822265625, -0.0004119873046875, 0.000400543212890625, 0.00121307373046875, 0.002025604248046875, 0.002838134765625, 0.003650665283203125, 0.00446319580078125, 0.005275726318359375, 0.0060882568359375, 0.006900787353515625, 0.00771331787109375, 0.008525848388671875, 0.00933837890625, 0.010150909423828125, 0.01096343994140625, 0.011775970458984375, 0.0125885009765625, 0.013401031494140625, 0.01421356201171875, 0.015026092529296875, 0.015838623046875, 0.016651153564453125, 0.01746368408203125, 0.018276214599609375, 0.0190887451171875, 0.019901275634765625, 0.02071380615234375, 0.021526336669921875, 0.0223388671875, 0.023151397705078125, 0.02396392822265625, 0.024776458740234375, 0.0255889892578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 3.0, 3.0, 6.0, 0.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 8.0, 6.0, 17.0, 11.0, 19.0, 26.0, 26.0, 43.0, 39.0, 38.0, 41.0, 69.0, 87.0, 79.0, 66.0, 55.0, 41.0, 58.0, 31.0, 35.0, 22.0, 27.0, 13.0, 10.0, 12.0, 8.0, 11.0, 9.0, 5.0, 0.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0], "bins": [-3.7610530853271484e-05, -3.6442652344703674e-05, -3.5274773836135864e-05, -3.4106895327568054e-05, -3.2939016819000244e-05, -3.1771138310432434e-05, -3.0603259801864624e-05, -2.9435381293296814e-05, -2.8267502784729004e-05, -2.7099624276161194e-05, -2.5931745767593384e-05, -2.4763867259025574e-05, -2.3595988750457764e-05, -2.2428110241889954e-05, -2.1260231733322144e-05, -2.0092353224754333e-05, -1.8924474716186523e-05, -1.7756596207618713e-05, -1.6588717699050903e-05, -1.5420839190483093e-05, -1.4252960681915283e-05, -1.3085082173347473e-05, -1.1917203664779663e-05, -1.0749325156211853e-05, -9.581446647644043e-06, -8.413568139076233e-06, -7.245689630508423e-06, -6.077811121940613e-06, -4.909932613372803e-06, -3.7420541048049927e-06, -2.5741755962371826e-06, -1.4062970876693726e-06, -2.384185791015625e-07, 9.294599294662476e-07, 2.0973384380340576e-06, 3.2652169466018677e-06, 4.433095455169678e-06, 5.600973963737488e-06, 6.768852472305298e-06, 7.936730980873108e-06, 9.104609489440918e-06, 1.0272487998008728e-05, 1.1440366506576538e-05, 1.2608245015144348e-05, 1.3776123523712158e-05, 1.4944002032279968e-05, 1.611188054084778e-05, 1.727975904941559e-05, 1.84476375579834e-05, 1.961551606655121e-05, 2.078339457511902e-05, 2.195127308368683e-05, 2.311915159225464e-05, 2.428703010082245e-05, 2.545490860939026e-05, 2.662278711795807e-05, 2.779066562652588e-05, 2.895854413509369e-05, 3.01264226436615e-05, 3.129430115222931e-05, 3.246217966079712e-05, 3.363005816936493e-05, 3.479793667793274e-05, 3.596581518650055e-05, 3.713369369506836e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 6.0, 6.0, 12.0, 9.0, 16.0, 21.0, 38.0, 42.0, 79.0, 107.0, 211.0, 405.0, 707.0, 1407.0, 3405.0, 8854.0, 30781.0, 696517.0, 262790.0, 28444.0, 8511.0, 3217.0, 1436.0, 637.0, 342.0, 203.0, 119.0, 71.0, 50.0, 29.0, 27.0, 15.0, 10.0, 11.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0204315185546875, -0.019792556762695312, -0.019153594970703125, -0.018514633178710938, -0.01787567138671875, -0.017236709594726562, -0.016597747802734375, -0.015958786010742188, -0.01531982421875, -0.014680862426757812, -0.014041900634765625, -0.013402938842773438, -0.01276397705078125, -0.012125015258789062, -0.011486053466796875, -0.010847091674804688, -0.0102081298828125, -0.009569168090820312, -0.008930206298828125, -0.008291244506835938, -0.00765228271484375, -0.0070133209228515625, -0.006374359130859375, -0.0057353973388671875, -0.005096435546875, -0.0044574737548828125, -0.003818511962890625, -0.0031795501708984375, -0.00254058837890625, -0.0019016265869140625, -0.001262664794921875, -0.0006237030029296875, 1.52587890625e-05, 0.0006542205810546875, 0.001293182373046875, 0.0019321441650390625, 0.00257110595703125, 0.0032100677490234375, 0.003849029541015625, 0.0044879913330078125, 0.005126953125, 0.0057659149169921875, 0.006404876708984375, 0.0070438385009765625, 0.00768280029296875, 0.008321762084960938, 0.008960723876953125, 0.009599685668945312, 0.0102386474609375, 0.010877609252929688, 0.011516571044921875, 0.012155532836914062, 0.01279449462890625, 0.013433456420898438, 0.014072418212890625, 0.014711380004882812, 0.015350341796875, 0.015989303588867188, 0.016628265380859375, 0.017267227172851562, 0.01790618896484375, 0.018545150756835938, 0.019184112548828125, 0.019823074340820312, 0.0204620361328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 5.0, 1.0, 9.0, 9.0, 5.0, 7.0, 11.0, 18.0, 21.0, 22.0, 33.0, 51.0, 68.0, 109.0, 154.0, 133.0, 97.0, 66.0, 43.0, 21.0, 21.0, 27.0, 8.0, 9.0, 3.0, 14.0, 6.0, 5.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022308349609375, -0.021587133407592773, -0.020865917205810547, -0.02014470100402832, -0.019423484802246094, -0.018702268600463867, -0.01798105239868164, -0.017259836196899414, -0.016538619995117188, -0.01581740379333496, -0.015096187591552734, -0.014374971389770508, -0.013653755187988281, -0.012932538986206055, -0.012211322784423828, -0.011490106582641602, -0.010768890380859375, -0.010047674179077148, -0.009326457977294922, -0.008605241775512695, -0.007884025573730469, -0.007162809371948242, -0.006441593170166016, -0.005720376968383789, -0.0049991607666015625, -0.004277944564819336, -0.0035567283630371094, -0.002835512161254883, -0.0021142959594726562, -0.0013930797576904297, -0.0006718635559082031, 4.935264587402344e-05, 0.00077056884765625, 0.0014917850494384766, 0.002213001251220703, 0.0029342174530029297, 0.0036554336547851562, 0.004376649856567383, 0.005097866058349609, 0.005819082260131836, 0.0065402984619140625, 0.007261514663696289, 0.007982730865478516, 0.008703947067260742, 0.009425163269042969, 0.010146379470825195, 0.010867595672607422, 0.011588811874389648, 0.012310028076171875, 0.013031244277954102, 0.013752460479736328, 0.014473676681518555, 0.015194892883300781, 0.015916109085083008, 0.016637325286865234, 0.01735854148864746, 0.018079757690429688, 0.018800973892211914, 0.01952219009399414, 0.020243406295776367, 0.020964622497558594, 0.02168583869934082, 0.022407054901123047, 0.023128271102905273, 0.0238494873046875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 76.0, 685.0, 168.0, 44.0, 11.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9502366781234741, -0.8617105484008789, -0.7731843590736389, -0.6846582293510437, -0.5961320400238037, -0.5076059103012085, -0.4190797805786133, -0.3305535912513733, -0.24202746152877808, -0.15350130200386047, -0.06497515738010406, 0.023550987243652344, 0.11207714676856995, 0.20060330629348755, 0.28912943601608276, 0.37765562534332275, 0.46618175506591797, 0.5547078847885132, 0.6432340741157532, 0.7317602038383484, 0.8202863931655884, 0.9088125228881836, 0.9973386526107788, 1.085864782333374, 1.1743910312652588, 1.262917160987854, 1.3514432907104492, 1.439969539642334, 1.5284956693649292, 1.6170217990875244, 1.7055479288101196, 1.7940740585327148, 1.8826000690460205, 1.9711261987686157, 2.059652328491211, 2.1481785774230957, 2.2367045879364014, 2.325230836868286, 2.413756847381592, 2.5022830963134766, 2.5908093452453613, 2.679335594177246, 2.7678616046905518, 2.8563878536224365, 2.944913864135742, 3.033440113067627, 3.1219663619995117, 3.2104923725128174, 3.299018383026123, 3.387544631958008, 3.4760706424713135, 3.5645968914031982, 3.653122901916504, 3.7416491508483887, 3.8301753997802734, 3.918701410293579, 4.007227897644043, 4.095754146575928, 4.1842803955078125, 4.272806167602539, 4.361332416534424, 4.449858665466309, 4.538384914398193, 4.626911163330078, 4.715436935424805]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 10.0, 8.0, 5.0, 17.0, 7.0, 14.0, 20.0, 22.0, 26.0, 31.0, 32.0, 206.0, 295.0, 44.0, 42.0, 35.0, 15.0, 33.0, 18.0, 24.0, 20.0, 12.0, 8.0, 11.0, 8.0, 8.0, 9.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9682649970054626, -0.9399008750915527, -0.911536693572998, -0.8831725716590881, -0.8548084497451782, -0.8264442682266235, -0.7980801463127136, -0.7697160243988037, -0.7413519024848938, -0.7129877805709839, -0.6846235990524292, -0.6562594771385193, -0.6278953552246094, -0.5995311737060547, -0.5711670517921448, -0.5428029298782349, -0.5144387483596802, -0.4860745966434479, -0.45771047472953796, -0.42934632301330566, -0.40098220109939575, -0.37261804938316345, -0.34425389766693115, -0.31588977575302124, -0.28752565383911133, -0.25916150212287903, -0.23079738020896912, -0.20243322849273682, -0.1740691065788269, -0.1457049548625946, -0.1173408180475235, -0.08897668123245239, -0.06061255931854248, -0.032248422503471375, -0.00388428196310997, 0.024479858577251434, 0.05284399539232254, 0.08120813965797424, 0.10957227647304535, 0.13793641328811646, 0.16630055010318756, 0.19466468691825867, 0.22302882373332977, 0.2513929605484009, 0.2797571122646332, 0.3081212639808655, 0.3364853858947754, 0.3648495078086853, 0.3932136595249176, 0.4215778112411499, 0.4499419331550598, 0.4783060848712921, 0.5066702365875244, 0.5350343585014343, 0.5633984804153442, 0.5917626619338989, 0.6201267838478088, 0.6484909057617188, 0.6768550872802734, 0.7052192091941833, 0.7335833311080933, 0.761947512626648, 0.7903116345405579, 0.8186757564544678, 0.8470398783683777]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 4.0, 7.0, 8.0, 6.0, 8.0, 11.0, 13.0, 15.0, 17.0, 20.0, 27.0, 21.0, 19.0, 17.0, 40.0, 52.0, 209.0, 167.0, 53.0, 38.0, 34.0, 26.0, 21.0, 25.0, 13.0, 18.0, 14.0, 14.0, 11.0, 15.0, 12.0, 13.0, 4.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0540771484375, -0.052381038665771484, -0.05068492889404297, -0.04898881912231445, -0.04729270935058594, -0.04559659957885742, -0.043900489807128906, -0.04220438003540039, -0.040508270263671875, -0.03881216049194336, -0.037116050720214844, -0.03541994094848633, -0.03372383117675781, -0.0320277214050293, -0.03033161163330078, -0.028635501861572266, -0.02693939208984375, -0.025243282318115234, -0.02354717254638672, -0.021851062774658203, -0.020154953002929688, -0.018458843231201172, -0.016762733459472656, -0.01506662368774414, -0.013370513916015625, -0.01167440414428711, -0.009978294372558594, -0.008282184600830078, -0.0065860748291015625, -0.004889965057373047, -0.0031938552856445312, -0.0014977455139160156, 0.0001983642578125, 0.0018944740295410156, 0.0035905838012695312, 0.005286693572998047, 0.0069828033447265625, 0.008678913116455078, 0.010375022888183594, 0.01207113265991211, 0.013767242431640625, 0.01546335220336914, 0.017159461975097656, 0.018855571746826172, 0.020551681518554688, 0.022247791290283203, 0.02394390106201172, 0.025640010833740234, 0.02733612060546875, 0.029032230377197266, 0.03072834014892578, 0.0324244499206543, 0.03412055969238281, 0.03581666946411133, 0.037512779235839844, 0.03920888900756836, 0.040904998779296875, 0.04260110855102539, 0.044297218322753906, 0.04599332809448242, 0.04768943786621094, 0.04938554763793945, 0.05108165740966797, 0.052777767181396484, 0.054473876953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 3.0, 5.0, 6.0, 0.0, 1.0, 8.0, 15.0, 14.0, 22.0, 37.0, 81.0, 134.0, 196.0, 578.0, 2126.0, 13873.0, 8353823.0, 14436.0, 2158.0, 553.0, 219.0, 98.0, 55.0, 39.0, 32.0, 21.0, 4.0, 10.0, 12.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.7835512161254883, -0.7594476938247681, -0.7353441119194031, -0.7112405896186829, -0.6871370673179626, -0.6630334854125977, -0.6389299631118774, -0.6148264408111572, -0.590722918510437, -0.5666193962097168, -0.5425158143043518, -0.5184122920036316, -0.4943087697029114, -0.4702052175998688, -0.44610166549682617, -0.42199814319610596, -0.39789456129074097, -0.37379100918769836, -0.34968748688697815, -0.32558393478393555, -0.30148041248321533, -0.27737686038017273, -0.2532733082771301, -0.22916977107524872, -0.2050662338733673, -0.1809626966714859, -0.1568591594696045, -0.1327556073665619, -0.10865207016468048, -0.08454853296279907, -0.06044498085975647, -0.03634144365787506, -0.012237906455993652, 0.011865634471178055, 0.03596917539834976, 0.06007272005081177, 0.08417625725269318, 0.10827979445457458, 0.1323833465576172, 0.1564868837594986, 0.18059042096138, 0.2046939581632614, 0.22879749536514282, 0.2529010474681854, 0.277004599571228, 0.30110812187194824, 0.32521167397499084, 0.34931522607803345, 0.37341874837875366, 0.39752230048179626, 0.4216258227825165, 0.4457293748855591, 0.4698328971862793, 0.4939364492893219, 0.5180400013923645, 0.5421435236930847, 0.5662471055984497, 0.5903506278991699, 0.6144542098045349, 0.6385577321052551, 0.6626612544059753, 0.6867648363113403, 0.7108683586120605, 0.7349718809127808, 0.759075403213501]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 5.0, 2.0, 8.0, 7.0, 9.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.9152419567108154, -0.885687530040741, -0.8561331033706665, -0.8265787363052368, -0.7970243096351624, -0.7674698829650879, -0.7379155158996582, -0.7083610892295837, -0.6788066625595093, -0.6492522358894348, -0.6196978092193604, -0.5901434421539307, -0.5605890154838562, -0.5310345888137817, -0.501480221748352, -0.4719257950782776, -0.4423713684082031, -0.41281694173812866, -0.3832625448703766, -0.3537081480026245, -0.32415372133255005, -0.2945992946624756, -0.2650448977947235, -0.23549048602581024, -0.20593607425689697, -0.1763816624879837, -0.14682725071907043, -0.11727283895015717, -0.0877184271812439, -0.05816401541233063, -0.02860960364341736, 0.0009448081254959106, 0.03049921989440918, 0.06005363166332245, 0.08960804343223572, 0.11916245520114899, 0.14871686697006226, 0.17827127873897552, 0.2078256905078888, 0.23738010227680206, 0.26693451404571533, 0.2964889407157898, 0.32604333758354187, 0.35559773445129395, 0.3851521611213684, 0.41470658779144287, 0.44426098465919495, 0.473815381526947, 0.5033698081970215, 0.532924234867096, 0.5624786615371704, 0.5920330286026001, 0.6215874552726746, 0.651141881942749, 0.6806962490081787, 0.7102506756782532, 0.7398051023483276, 0.7693595290184021, 0.7989139556884766, 0.8284683227539062, 0.8580227494239807, 0.8875771760940552, 0.9171315431594849, 0.9466859698295593, 0.9762403964996338]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 3.0, 11.0, 16.0, 25.0, 48.0, 85.0, 130.0, 236.0, 521.0, 1316.0, 5480.0, 34929.0, 286742.0, 170095.0, 19244.0, 3504.0, 1005.0, 377.0, 173.0, 104.0, 79.0, 40.0, 24.0, 24.0, 17.0, 7.0, 6.0, 14.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73876953125, -0.7064437866210938, -0.6741180419921875, -0.6417922973632812, -0.609466552734375, -0.5771408081054688, -0.5448150634765625, -0.5124893188476562, -0.48016357421875, -0.44783782958984375, -0.4155120849609375, -0.38318634033203125, -0.350860595703125, -0.31853485107421875, -0.2862091064453125, -0.25388336181640625, -0.2215576171875, -0.18923187255859375, -0.1569061279296875, -0.12458038330078125, -0.092254638671875, -0.05992889404296875, -0.0276031494140625, 0.00472259521484375, 0.03704833984375, 0.06937408447265625, 0.1016998291015625, 0.13402557373046875, 0.166351318359375, 0.19867706298828125, 0.2310028076171875, 0.26332855224609375, 0.295654296875, 0.32798004150390625, 0.3603057861328125, 0.39263153076171875, 0.424957275390625, 0.45728302001953125, 0.4896087646484375, 0.5219345092773438, 0.55426025390625, 0.5865859985351562, 0.6189117431640625, 0.6512374877929688, 0.683563232421875, 0.7158889770507812, 0.7482147216796875, 0.7805404663085938, 0.8128662109375, 0.8451919555664062, 0.8775177001953125, 0.9098434448242188, 0.942169189453125, 0.9744949340820312, 1.0068206787109375, 1.0391464233398438, 1.07147216796875, 1.1037979125976562, 1.1361236572265625, 1.1684494018554688, 1.200775146484375, 1.2331008911132812, 1.2654266357421875, 1.2977523803710938, 1.330078125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 3.0, 9.0, 25.0, 17.0, 28.0, 39.0, 52.0, 74.0, 88.0, 85.0, 100.0, 110.0, 90.0, 76.0, 45.0, 40.0, 26.0, 24.0, 19.0, 14.0, 11.0, 3.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0869140625, -0.08378314971923828, -0.08065223693847656, -0.07752132415771484, -0.07439041137695312, -0.0712594985961914, -0.06812858581542969, -0.06499767303466797, -0.06186676025390625, -0.05873584747314453, -0.05560493469238281, -0.052474021911621094, -0.049343109130859375, -0.046212196350097656, -0.04308128356933594, -0.03995037078857422, -0.0368194580078125, -0.03368854522705078, -0.030557632446289062, -0.027426719665527344, -0.024295806884765625, -0.021164894104003906, -0.018033981323242188, -0.014903068542480469, -0.01177215576171875, -0.008641242980957031, -0.0055103302001953125, -0.0023794174194335938, 0.000751495361328125, 0.0038824081420898438, 0.0070133209228515625, 0.010144233703613281, 0.013275146484375, 0.01640605926513672, 0.019536972045898438, 0.022667884826660156, 0.025798797607421875, 0.028929710388183594, 0.03206062316894531, 0.03519153594970703, 0.03832244873046875, 0.04145336151123047, 0.04458427429199219, 0.047715187072753906, 0.050846099853515625, 0.053977012634277344, 0.05710792541503906, 0.06023883819580078, 0.0633697509765625, 0.06650066375732422, 0.06963157653808594, 0.07276248931884766, 0.07589340209960938, 0.0790243148803711, 0.08215522766113281, 0.08528614044189453, 0.08841705322265625, 0.09154796600341797, 0.09467887878417969, 0.0978097915649414, 0.10094070434570312, 0.10407161712646484, 0.10720252990722656, 0.11033344268798828, 0.11346435546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 13.0, 25.0, 29.0, 39.0, 55.0, 76.0, 75.0, 43.0, 39.0, 15.0, 17.0, 10.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6741411089897156, -0.653797447681427, -0.6334538459777832, -0.6131101846694946, -0.592766523361206, -0.5724228620529175, -0.5520792603492737, -0.5317355990409851, -0.5113919973373413, -0.4910483658313751, -0.47070470452308655, -0.45036107301712036, -0.4300174117088318, -0.4096737802028656, -0.3893301486968994, -0.36898648738861084, -0.34864282608032227, -0.3282991945743561, -0.3079555332660675, -0.2876119017601013, -0.26726824045181274, -0.24692460894584656, -0.22658097743988037, -0.206237331032753, -0.1858936846256256, -0.16555003821849823, -0.14520639181137085, -0.12486276030540466, -0.10451911389827728, -0.0841754674911499, -0.06383182853460312, -0.043488189578056335, -0.02314460277557373, -0.0028009600937366486, 0.017542682588100433, 0.037886325269937515, 0.0582299679517746, 0.07857361435890198, 0.09891725331544876, 0.11926089227199554, 0.13960453867912292, 0.1599481850862503, 0.18029183149337769, 0.20063546299934387, 0.22097910940647125, 0.24132275581359863, 0.2616663873195648, 0.282010018825531, 0.3023536801338196, 0.32269731163978577, 0.34304097294807434, 0.3633846044540405, 0.3837282657623291, 0.4040718972682953, 0.4244155287742615, 0.44475919008255005, 0.46510282158851624, 0.4854464530944824, 0.505790114402771, 0.5261337757110596, 0.5464773774147034, 0.5668210387229919, 0.5871647000312805, 0.6075083017349243, 0.6278519630432129]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 7.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 13.0, 27.0, 39.0, 63.0, 86.0, 66.0, 57.0, 32.0, 22.0, 20.0, 6.0, 8.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.273157000541687, -0.26075565814971924, -0.24835430085659027, -0.2359529584646225, -0.22355160117149353, -0.21115025877952576, -0.19874891638755798, -0.1863475739955902, -0.17394621670246124, -0.16154487431049347, -0.1491435170173645, -0.13674217462539673, -0.12434082478284836, -0.11193947494029999, -0.09953813254833221, -0.08713678270578384, -0.07473543286323547, -0.0623340830206871, -0.04993273690342903, -0.03753139078617096, -0.02513004094362259, -0.012728691101074219, -0.0003273487091064453, 0.012074001133441925, 0.024475350975990295, 0.036876700818538666, 0.04927804693579674, 0.06167939305305481, 0.07408074289560318, 0.08648209273815155, 0.09888343513011932, 0.1112847849726677, 0.12368613481521606, 0.13608747720718384, 0.1484888345003128, 0.16089017689228058, 0.17329153418540955, 0.18569287657737732, 0.1980942189693451, 0.21049556136131287, 0.22289691865444183, 0.2352982610464096, 0.24769961833953857, 0.26010096073150635, 0.2725023031234741, 0.2849036455154419, 0.29730498790740967, 0.30970636010169983, 0.3221077024936676, 0.3345090448856354, 0.34691038727760315, 0.3593117594718933, 0.3717131018638611, 0.38411444425582886, 0.39651578664779663, 0.4089171290397644, 0.4213184714317322, 0.43371981382369995, 0.4461211562156677, 0.4585224986076355, 0.47092387080192566, 0.48332521319389343, 0.4957265555858612, 0.5081279277801514, 0.5205292701721191]}, "eval/loss": 4.601601600646973, "eval/wer": 1.6165807219357398, "eval/runtime": 1317.7455, "eval/samples_per_second": 2.005, "eval/steps_per_second": 0.251} \ No newline at end of file